// File: convert_to_mixed_precision.h
// Copyright (c) 2022 PaddlePaddle Authors. All Rights Reserved.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

#pragma once

#include <memory>
#include <string>
#include <unordered_map>
#include <unordered_set>

#include "paddle/fluid/framework/block_desc.h"
#include "paddle/fluid/framework/ir/graph.h"
#include "paddle/fluid/framework/program_desc.h"
#include "paddle/fluid/framework/scope.h"
#include "paddle/phi/common/backend.h"
#include "paddle/phi/common/data_type.h"

namespace paddle {
namespace inference {
namespace analysis {

31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48 49 50 51 52 53 54 55 56 57 58 59 60 61 62
class ConvertToMixedPrecisionPass {
 public:
  explicit ConvertToMixedPrecisionPass(
      const std::string& model_file,
      const std::string& params_file,
      const std::string& mixed_model_file,
      const std::string& mixed_params_file,
      phi::DataType mixed_precision,
      phi::Backend backend,
      bool keep_io_types,
      const std::unordered_set<std::string>& black_list);

  void Run();

 private:
  void LoadModel();
  void SaveMixedModel();

 private:
  std::string model_file_;
  std::string params_file_;
  std::string mixed_model_file_;
  std::string mixed_params_file_;
  phi::DataType mixed_precision_;
  phi::Backend backend_;
  bool keep_io_types_;
  std::unordered_set<std::string> black_list_;

  framework::Scope scope_;
  std::unique_ptr<framework::ir::Graph> main_graph_{nullptr};
};

63
bool OpSupportPrecision(const std::string& op_type,
64 65
                        phi::Backend backend,
                        phi::DataType precision,
66
                        const std::unordered_set<std::string>& black_list);
67

68
void InsertCastOp(
69
    framework::ir::Graph* graph,
70 71
    framework::ir::Node* var_node,
    framework::ir::Node* op_node,
72 73 74
    framework::proto::VarType::Type from_type,
    framework::proto::VarType::Type to_type,
    framework::BlockDesc* block_desc,
75 76
    int* suffix,
    std::unordered_map<framework::ir::Node*, framework::ir::Node*>* visited);
77 78 79 80 81 82 83

/// Free-function entry point taking the same parameter list as the
/// ConvertToMixedPrecisionPass constructor. Declaration only; defined in the
/// implementation file.
///
/// NOTE(review): presumably constructs a ConvertToMixedPrecisionPass with
/// these arguments and runs it -- confirm against the definition.
///
/// @param model_file         Path of the source model file.
/// @param params_file        Path of the source parameters file.
/// @param mixed_model_file   Path for the converted model file.
/// @param mixed_params_file  Path for the converted parameters file.
/// @param mixed_precision    Data type to use as the mixed precision.
/// @param backend            Backend the converted model targets.
/// @param keep_io_types      Presumably keeps the model's input/output types
///                           unchanged when true -- TODO confirm.
/// @param black_list         Set of names excluded from conversion
///                           (presumably op types -- TODO confirm).
void ConvertToMixedPrecision(const std::string& model_file,
                             const std::string& params_file,
                             const std::string& mixed_model_file,
                             const std::string& mixed_params_file,
                             phi::DataType mixed_precision,
                             phi::Backend backend,
                             bool keep_io_types,
                             const std::unordered_set<std::string>& black_list);

}  // namespace analysis
}  // namespace inference
}  // namespace paddle