FastDeploy  latest
Fast & Easy to Deploy!
compile.h
1 // Copyright (c) 2022 PaddlePaddle Authors. All Rights Reserved.
2 //
3 // Licensed under the Apache License, Version 2.0 (the "License");
4 // you may not use this file except in compliance with the License.
5 // You may obtain a copy of the License at
6 //
7 // http://www.apache.org/licenses/LICENSE-2.0
8 //
9 // Unless required by applicable law or agreed to in writing, software
10 // distributed under the License is distributed on an "AS IS" BASIS,
11 // WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
12 // See the License for the specific language governing permissions and
13 // limitations under the License.
14 
15 #pragma once
16 
17 #include <algorithm>
18 #include <set>
19 #include <string>
20 #include <unordered_map>
21 
22 #include "iengine.h" // NOLINT
23 #include "poros_module.h" // NOLINT
24 #include "torch/script.h" // NOLINT
25 
26 namespace baidu {
27 namespace mirana {
28 namespace poros {
29 
39 std::unique_ptr<PorosModule>
40 Compile(const torch::jit::Module& module,
41  const std::vector<std::vector<c10::IValue>>& prewarm_datas,
42  const PorosOptions& options);
43 
44 class Compiler {
45  public:
46  typedef std::unordered_map<const torch::jit::Node*, IEngine*> engine_map_t;
47  typedef std::vector<std::vector<c10::IValue>> ivalue_vec_t;
48 
49  Compiler() : _origin_module(NULL) {}
50  ~Compiler();
51 
59  int init(const PorosOptions& options);
60 
70  int compile(const torch::jit::Module& origin_module,
71  const ivalue_vec_t& prewarm_datas,
72  torch::jit::Module* optimized_module);
73 
74  private:
83  int preprocess_graph(const ivalue_vec_t& prewarm_datas,
84  std::shared_ptr<torch::jit::Graph>& graph);
85 
93  int segment_graph(std::shared_ptr<torch::jit::Graph>& graph);
94 
95  // Split subgraph(block)
96  // The divided subgraph, as a subgraph, is associated with the block
97  int segment_block(torch::jit::Block& block, IEngine* engine,
98  int current_depth);
99 
100  // Subgraph optimization
110  int optimize_subgraph(const ivalue_vec_t& prewarm_datas,
111  const std::shared_ptr<torch::jit::Graph>& opt_graph,
112  torch::jit::Module* optimized_module);
113 
114  // Subgraph optimization(block)
115  int optimize_subblock(torch::jit::Block* block,
116  torch::jit::Module* optimized_module);
117 
126  int transform(IEngine* engine, torch::jit::Node& subgraph_node,
127  torch::jit::Module& module);
128 
136  IEngine* select_engine(const torch::jit::Node* n);
137 
143  void close();
144 
145  private:
146  int _max_segment_depth{5}; // Maximum subgraph segmentation depth
147  ivalue_vec_t _prewarm_datas; // Prewarm datas
148  PorosOptions _options;
149  engine_map_t _engine_map; // The engine used to record the subgraph
150  const torch::jit::Module* _origin_module; // Origin_module
151  std::atomic<int> _engine_index = {0}; // Record engine index
152 };
153 
163 std::unique_ptr<torch::jit::Module>
164 CompileGraph(const torch::jit::Module& module,
165  const std::vector<std::vector<c10::IValue>>& prewarm_datas,
166  const PorosOptions& options);
167 
168 } // namespace poros
169 } // namespace mirana
170 } // namespace baidu
Definition: compile.h:26