FastDeploy  latest
Fast & Easy to Deploy!
rknpu2_backend.h
1 // Copyright (c) 2022 PaddlePaddle Authors. All Rights Reserved.
2 //
3 // Licensed under the Apache License, Version 2.0 (the "License");
4 // you may not use this file except in compliance with the License.
5 // You may obtain a copy of the License at
6 //
7 // http://www.apache.org/licenses/LICENSE-2.0
8 //
9 // Unless required by applicable law or agreed to in writing, software
10 // distributed under the License is distributed on an "AS IS" BASIS,
11 // WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
12 // See the License for the specific language governing permissions and
13 // limitations under the License.
14 #pragma once
15 
16 #include "fastdeploy/runtime/backends/backend.h"
17 #include "fastdeploy/runtime/backends/rknpu2/option.h"
18 #include "fastdeploy/core/fd_tensor.h"
19 #include "rknn_api.h" // NOLINT
20 #include <cstring>
21 #include <iostream>
22 #include <memory>
23 #include <string>
24 #include <vector>
25 
26 namespace fastdeploy {
27 class RKNPU2Backend : public BaseBackend {
28  public:
29  RKNPU2Backend() = default;
30 
31  virtual ~RKNPU2Backend();
32 
33  bool Init(const RuntimeOption& runtime_option);
34 
35  int NumInputs() const override {
36  return static_cast<int>(inputs_desc_.size());
37  }
38 
39  int NumOutputs() const override {
40  return static_cast<int>(outputs_desc_.size());
41  }
42 
43  TensorInfo GetInputInfo(int index) override;
44  TensorInfo GetOutputInfo(int index) override;
45  std::vector<TensorInfo> GetInputInfos() override;
46  std::vector<TensorInfo> GetOutputInfos() override;
47  bool Infer(std::vector<FDTensor>& inputs, std::vector<FDTensor>* outputs,
48  bool copy_to_fd = true) override;
49 
50  private:
51  // BaseBackend API
52  void BuildOption(const RKNPU2BackendOption& option);
53 
54  // RKNN API
55  bool LoadModel(void* model);
56 
57  bool GetSDKAndDeviceVersion();
58 
59  bool SetCoreMask(const rknpu2::CoreMask& core_mask) const;
60 
61  bool GetModelInputOutputInfos();
62 
63  // The object of rknn context.
64  rknn_context ctx{};
65  // The structure rknn_sdk_version is used to indicate the version
66  // information of the RKNN SDK.
67  rknn_sdk_version sdk_ver{};
68  // The structure rknn_input_output_num represents the number of
69  // input and output Tensor
70  rknn_input_output_num io_num{};
71  std::vector<TensorInfo> inputs_desc_;
72  std::vector<TensorInfo> outputs_desc_;
73 
74  rknn_tensor_attr* input_attrs_ = nullptr;
75  rknn_tensor_attr* output_attrs_ = nullptr;
76 
77  rknn_tensor_mem** input_mems_;
78  rknn_tensor_mem** output_mems_;
79 
80  bool infer_init = false;
81 
82  RKNPU2BackendOption option_;
83 
84  static void DumpTensorAttr(rknn_tensor_attr& attr);
85  static FDDataType RknnTensorTypeToFDDataType(rknn_tensor_type type);
86  static rknn_tensor_type FDDataTypeToRknnTensorType(FDDataType type);
87 };
88 } // namespace fastdeploy
All C++ FastDeploy APIs are defined inside this namespace.
Definition: option.h:16