FastDeploy  latest
Fast & Easy to Deploy!
poros_backend.h
1 // Copyright (c) 2022 PaddlePaddle Authors. All Rights Reserved.
2 //
3 // Licensed under the Apache License, Version 2.0 (the "License");
4 // you may not use this file except in compliance with the License.
5 // You may obtain a copy of the License at
6 //
7 // http://www.apache.org/licenses/LICENSE-2.0
8 //
9 // Unless required by applicable law or agreed to in writing, software
10 // distributed under the License is distributed on an "AS IS" BASIS,
11 // WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
12 // See the License for the specific language governing permissions and
13 // limitations under the License.
14 
15 #pragma once
16 
17 #include <iostream>
18 #include <memory>
19 #include <string>
20 #include <vector>
21 
22 #include "fastdeploy/runtime/backends/backend.h"
23 #include "fastdeploy/runtime/backends/poros/option.h"
24 #include "fastdeploy/runtime/backends/poros/common/compile.h"
25 #include "fastdeploy/runtime/backends/poros/common/poros_module.h"
26 
27 namespace fastdeploy {
28 
29 // Convert data type from fastdeploy to poros
30 at::ScalarType GetPorosDtype(const FDDataType& fd_dtype);
31 
32 // Convert data type from poros to fastdeploy
33 FDDataType GetFdDtype(const at::ScalarType& dtype);
34 
35 // at::ScalarType to std::string for FDERROR
36 std::string AtType2String(const at::ScalarType& dtype);
37 
38 // Create at::Tensor
39 // is_backend_cuda specify if Poros use GPU Device
40 // While is_backend_cuda = true, and tensor.device = Device::GPU
41 at::Tensor CreatePorosValue(FDTensor& tensor, bool is_backend_cuda = false);
42 
43 // Copy memory data from at::Tensor to fastdeploy::FDTensor
44 void CopyTensorToCpu(const at::Tensor& tensor, FDTensor* fd_tensor,
45  bool is_backend_cuda = false);
46 
47 class PorosBackend : public BaseBackend {
48  public:
49  PorosBackend() {}
50  virtual ~PorosBackend() = default;
51 
52  void BuildOption(const PorosBackendOption& option);
53 
54  bool Init(const RuntimeOption& option) {
55  if (!(Supported(option.model_format, Backend::POROS)
56  && Supported(option.device, Backend::POROS))) {
57  return false;
58  }
59  if (option.model_from_memory_) {
60  FDERROR << "Poros backend doesn't support load model "
61  << "from memory, please load model from disk."
62  << std::endl;
63  return false;
64  }
65  return true;
66  }
67 
68  bool Compile(const std::string& model_file,
69  std::vector<std::vector<FDTensor>>& prewarm_tensors,
70  const PorosBackendOption& option = PorosBackendOption());
71 
72  bool Infer(std::vector<FDTensor>& inputs, std::vector<FDTensor>* outputs,
73  bool copy_to_fd = true) override;
74 
75  int NumInputs() const { return _numinputs; }
76 
77  int NumOutputs() const { return _numoutputs; }
78 
79  TensorInfo GetInputInfo(int index) override;
80  TensorInfo GetOutputInfo(int index) override;
81  std::vector<TensorInfo> GetInputInfos() override;
82  std::vector<TensorInfo> GetOutputInfos() override;
83 
84  private:
85  baidu::mirana::poros::PorosOptions _options;
86  std::unique_ptr<baidu::mirana::poros::PorosModule> _poros_module;
87  std::vector<std::vector<c10::IValue>> _prewarm_datas;
88  int _numinputs = 1;
89  int _numoutputs = 1;
90 };
91 
92 } // namespace fastdeploy
Poros, support TorchScript format model, CPU / Nvidia GPU.
Definition: enum_variables.h:36
All C++ FastDeploy APIs are defined inside this namespace.
Definition: option.h:16