|
|
|
@@ -81,8 +81,6 @@ void GPUSession::Optimize(const std::shared_ptr<KernelGraph> &kernel_graph) { |
|
|
|
auto pm = std::make_shared<opt::PassManager>(); |
|
|
|
pm->AddPass(std::make_shared<opt::AdamWeightDecayFusion>()); |
|
|
|
pm->AddPass(std::make_shared<opt::AdamFusion>()); |
|
|
|
// pm->AddPass(std::make_shared<opt::ApplyMomentumWeightDecayScaleFusion>()); |
|
|
|
// pm->AddPass(std::make_shared<opt::ApplyMomentumScaleFusion>()); |
|
|
|
pm->AddPass(std::make_shared<opt::ReplaceBNCastFusion>()); |
|
|
|
pm->AddPass(std::make_shared<opt::ReplaceBNGradCastFusion>()); |
|
|
|
pm->AddPass(std::make_shared<opt::ReplaceMomentumCastFusion>()); |
|
|
|
@@ -98,7 +96,6 @@ void GPUSession::HardwareOptimize(const std::shared_ptr<KernelGraph> &kernel_gra |
|
|
|
pm->AddPass(std::make_shared<opt::BatchNormReluFusion>()); |
|
|
|
pm->AddPass(std::make_shared<opt::BatchNormReluGradFusion>()); |
|
|
|
pm->AddPass(std::make_shared<opt::BatchNormAddReluFusion>()); |
|
|
|
// pm->AddPass(std::make_shared<opt::BatchNormAddReluGradFusion>()); |
|
|
|
pm->AddPass(std::make_shared<opt::InsertFormatTransformOp>()); |
|
|
|
pm->AddPass(std::make_shared<opt::RemoveFormatTransformPair>()); |
|
|
|
pm->AddPass(std::make_shared<opt::RemoveRedundantFormatTransform>()); |
|
|
|
|