runtime_option.h
// Copyright (c) 2022 PaddlePaddle Authors. All Rights Reserved.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

/*! \file runtime_option.h
    \brief Options to configure the FastDeploy Runtime.
 */

#pragma once

#include <algorithm>
#include <map>
#include <vector>

#include "fastdeploy/runtime/backends/lite/option.h"
#include "fastdeploy/runtime/backends/openvino/option.h"
#include "fastdeploy/runtime/backends/ort/option.h"
#include "fastdeploy/runtime/backends/paddle/option.h"
#include "fastdeploy/runtime/backends/poros/option.h"
#include "fastdeploy/runtime/backends/rknpu2/option.h"
#include "fastdeploy/runtime/backends/sophgo/option.h"
#include "fastdeploy/runtime/backends/tensorrt/option.h"
#include "fastdeploy/benchmark/option.h"

namespace fastdeploy {

/*! @brief Option object used when creating a new Runtime object
 */
struct FASTDEPLOY_DECL RuntimeOption {
  /** \brief Set the path of the model file and the parameter file
   *
   * \param[in] model_path Path of the model file
   * \param[in] params_path Path of the parameter file; only required when the model format is Paddle
   * \param[in] format Format of the loaded model, Paddle format by default
   */
  void SetModelPath(const std::string& model_path,
                    const std::string& params_path = "",
                    const ModelFormat& format = ModelFormat::PADDLE);

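  // A minimal usage sketch for path-based loading; the file names are
  // illustrative assumptions, not files shipped with FastDeploy:
  //
  //   fastdeploy::RuntimeOption option;
  //   option.SetModelPath("ResNet50/model.pdmodel", "ResNet50/model.pdiparams");
  //   // For an ONNX model the parameter file stays empty:
  //   option.SetModelPath("ResNet50/model.onnx", "", ModelFormat::ONNX);
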
  /** \brief Set the model and parameter buffers when loading a model from memory
   *
   * \param[in] model_buffer Memory buffer holding the model file content
   * \param[in] params_buffer Memory buffer holding the parameter file content; only required when the model format is Paddle
   * \param[in] format Format of the loaded model, Paddle format by default
   */
  void SetModelBuffer(const std::string& model_buffer,
                      const std::string& params_buffer = "",
                      const ModelFormat& format = ModelFormat::PADDLE);

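  // A sketch of in-memory loading: read both files into std::string buffers
  // first (requires <fstream>; the paths are illustrative assumptions):
  //
  //   std::ifstream model_fin("model.pdmodel", std::ios::binary);
  //   std::string model_buf((std::istreambuf_iterator<char>(model_fin)),
  //                         std::istreambuf_iterator<char>());
  //   std::ifstream params_fin("model.pdiparams", std::ios::binary);
  //   std::string params_buf((std::istreambuf_iterator<char>(params_fin)),
  //                          std::istreambuf_iterator<char>());
  //   option.SetModelBuffer(model_buf, params_buf);
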
  /** \brief Set the encryption key used to decrypt an encrypted model
   *
   * \param[in] encryption_key Key used to decrypt the model
   */
  void SetEncryptionKey(const std::string& encryption_key);

  /// Use CPU for inference
  void UseCpu();
  /// Use Nvidia GPU for inference; gpu_id selects the GPU card
  void UseGpu(int gpu_id = 0);
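  // Device selection sketch: the option defaults to CPU, so switching to GPU
  // only needs the card id (0 here is an illustrative choice):
  //
  //   option.UseCpu();
  //   option.UseGpu(0);  // run inference on GPU card 0 instead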
  /// Use RKNPU2 for inference; rknpu2_name selects the Rockchip SoC,
  /// rknpu2_core selects the NPU core mask
  void UseRKNPU2(fastdeploy::rknpu2::CpuName rknpu2_name =
                     fastdeploy::rknpu2::CpuName::RK356X,
                 fastdeploy::rknpu2::CoreMask rknpu2_core =
                     fastdeploy::rknpu2::CoreMask::RKNN_NPU_CORE_AUTO);
  /// Use TIM-VX for inference
  void UseTimVX();
  /// Use Huawei Ascend for inference
  void UseAscend();

  /// Use DirectML for inference
  void UseDirectML();

  /// Use Sophgo TPU for inference
  void UseSophgo();
  /** \brief Use KunlunXin XPU for inference
   *
   * \param[in] kunlunxin_id Id of the KunlunXin XPU card to use
   * \param[in] l3_workspace_size Size of the L3 cache workspace
   * \param[in] locked Whether the allocated L3 cache can be locked
   * \param[in] autotune Whether to autotune the conv algorithm
   * \param[in] autotune_file Path of the autotune result file
   * \param[in] precision Calculation precision of multi_encoder, "int16" by default
   * \param[in] adaptive_seqlen Whether the input uses an adaptive sequence length
   * \param[in] enable_multi_stream Whether to enable multi-stream execution
   */
  void UseKunlunXin(int kunlunxin_id = 0, int l3_workspace_size = 0xfffc00,
                    bool locked = false, bool autotune = true,
                    const std::string& autotune_file = "",
                    const std::string& precision = "int16",
                    bool adaptive_seqlen = false,
                    bool enable_multi_stream = false);

  /// Use an externally created compute stream (e.g. a CUDA stream) for inference
  void SetExternalStream(void* external_stream);

  /** \brief Set the number of CPU threads used while inferencing on CPU; by default the value is decided by the backend in use
   */
  void SetCpuThreadNum(int thread_num);
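  // Thread-count sketch: -1 (the default) defers to the backend, while an
  // explicit value caps the CPU threads it may use (8 is illustrative):
  //
  //   option.SetCpuThreadNum(8);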
  /// Set Paddle Inference as the inference backend; supports CPU/GPU
  void UsePaddleInferBackend() { return UsePaddleBackend(); }
  /// Set ONNX Runtime as the inference backend; supports CPU/GPU
  void UseOrtBackend();
  /// Set Sophgo as the inference backend; supports Sophgo TPU only
  void UseSophgoBackend();
  /// Set TensorRT as the inference backend; supports GPU only
  void UseTrtBackend();
  /// Set Poros as the inference backend; supports CPU/GPU
  void UsePorosBackend();
  /// Set OpenVINO as the inference backend; supports CPU only
  void UseOpenVINOBackend();
  /// Set Paddle Lite as the inference backend; supports arm CPU only
  void UsePaddleLiteBackend() { return UseLiteBackend(); }
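  // Backend selection sketch: with backend left as Backend::UNKNOWN,
  // FastDeploy picks an available backend for the chosen device; an explicit
  // call overrides that choice:
  //
  //   option.UseGpu();
  //   option.UseTrtBackend();  // run the model through TensorRT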
  /** \brief Use Graphcore IPU for inference
   *
   * \param[in] device_num Number of IPUs to use
   * \param[in] micro_batch_size Batch size in the graph; only used when the graph has no fixed batch size
   * \param[in] enable_pipelining Whether to enable pipelining for higher throughput
   * \param[in] batches_per_step Number of batches per run when pipelining
   */
  void UseIpu(int device_num = 1, int micro_batch_size = 1,
              bool enable_pipelining = false, int batches_per_step = 1);

  /// Option to configure ONNX Runtime backend
  OrtBackendOption ort_option;
  /// Option to configure TensorRT backend
  TrtBackendOption trt_option;
  /// Option to configure Paddle Inference backend
  PaddleBackendOption paddle_infer_option;
  /// Option to configure Poros backend
  PorosBackendOption poros_option;
  /// Option to configure OpenVINO backend
  OpenVINOBackendOption openvino_option;
  /// Option to configure Paddle Lite backend
  LiteBackendOption paddle_lite_option;
  /// Option to configure RKNPU2 backend
  RKNPU2BackendOption rknpu2_option;

  // \brief Set the profile mode as 'true'.
  //
  // \param[in] include_h2d_d2h Whether to include the time of H2D/D2H copies
  // in the measured runtime.
  // \param[in] repeat Repeat count for runtime inference.
  // \param[in] warmup Warmup count for runtime inference.
  //
  void EnableProfiling(bool include_h2d_d2h = false,
                       int repeat = 100, int warmup = 50) {
    benchmark_option.enable_profile = true;
    benchmark_option.warmup = warmup;
    benchmark_option.repeats = repeat;
    benchmark_option.include_h2d_d2h = include_h2d_d2h;
  }

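  // Profiling sketch: wrap a deployment run to collect averaged latency
  // (the repeat/warmup values below are illustrative):
  //
  //   option.EnableProfiling(true, 100, 50);  // include H2D/D2H, 100 runs, 50 warmups
  //   // ... create the Runtime / model and run inference as usual ...
  //   option.DisableProfiling();
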
  // \brief Set the profile mode as 'false'.
  //
  void DisableProfiling() {
    benchmark_option.enable_profile = false;
  }

  // \brief Enable checking whether the backend set by the user
  // appears in the corresponding valid_xxx_backend list.
  //
  void EnableValidBackendCheck() {
    enable_valid_backend_check = true;
  }
  // \brief Disable checking whether the backend set by the user
  // appears in the corresponding valid_xxx_backend list.
  //
  void DisableValidBackendCheck() {
    enable_valid_backend_check = false;
  }

  // Benchmark option
  benchmark::BenchmarkOption benchmark_option;
  // Enable the check for a valid backend; true by default.
  bool enable_valid_backend_check = true;

  // If model_from_memory_ is true, model_file and params_file hold
  // the binary streams of the model/parameters in memory;
  // otherwise they hold the paths of the model/parameter files.
  std::string model_file = "";
  std::string params_file = "";
  bool model_from_memory_ = false;
  // Format of the input model
  ModelFormat model_format = ModelFormat::PADDLE;

  std::string encryption_key_ = "";

  // For CPU inference: -1 (the default) lets each backend choose its own value.
  int cpu_thread_num = -1;
  int device_id = 0;
  Backend backend = Backend::UNKNOWN;

  Device device = Device::CPU;

  void* external_stream_ = nullptr;

  bool enable_pinned_memory = false;

  // *** The APIs below are deprecated and will be removed in v1.2.0.
  // *** Do not use them anymore.
  void SetPaddleMKLDNN(bool pd_mkldnn = true);
  void EnablePaddleToTrt();
  void DeletePaddleBackendPass(const std::string& delete_pass_name);
  void EnablePaddleLogInfo();
  void DisablePaddleLogInfo();
  void SetPaddleMKLDNNCacheSize(int size);
  void SetOpenVINODevice(const std::string& name = "CPU");
  void SetOpenVINOShapeInfo(
      const std::map<std::string, std::vector<int64_t>>& shape_info) {
    openvino_option.shape_infos = shape_info;
  }
  void SetOpenVINOCpuOperators(const std::vector<std::string>& operators) {
    openvino_option.SetCpuOperators(operators);
  }
  void SetLiteOptimizedModelDir(const std::string& optimized_model_dir);
  void SetLiteSubgraphPartitionPath(
      const std::string& nnadapter_subgraph_partition_config_path);
  void SetLiteSubgraphPartitionConfigBuffer(
      const std::string& nnadapter_subgraph_partition_config_buffer);
  void SetLiteContextProperties(
      const std::string& nnadapter_context_properties);
  void SetLiteModelCacheDir(const std::string& nnadapter_model_cache_dir);
  void SetLiteDynamicShapeInfo(
      const std::map<std::string, std::vector<std::vector<int64_t>>>&
          nnadapter_dynamic_shape_info);
  void SetLiteMixedPrecisionQuantizationConfigPath(
      const std::string& nnadapter_mixed_precision_quantization_config_path);
  void EnableLiteFP16();
  void DisableLiteFP16();
  void EnableLiteInt8();
  void DisableLiteInt8();
  void SetLitePowerMode(LitePowerMode mode);
  void SetTrtInputShape(
      const std::string& input_name, const std::vector<int32_t>& min_shape,
      const std::vector<int32_t>& opt_shape = std::vector<int32_t>(),
      const std::vector<int32_t>& max_shape = std::vector<int32_t>());
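  // Dynamic-shape sketch for TensorRT using this deprecated setter, kept for
  // reference; the tensor name and shapes are illustrative assumptions:
  //
  //   option.UseGpu();
  //   option.UseTrtBackend();
  //   option.SetTrtInputShape("image", {1, 3, 224, 224},  // min
  //                           {4, 3, 224, 224},            // opt
  //                           {8, 3, 224, 224});           // max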
  void SetTrtMaxWorkspaceSize(size_t trt_max_workspace_size);
  void SetTrtMaxBatchSize(size_t max_batch_size);
  void EnableTrtFP16();
  void DisableTrtFP16();
  void SetTrtCacheFile(const std::string& cache_file_path);
  void EnablePinnedMemory();
  void DisablePinnedMemory();
  void EnablePaddleTrtCollectShape();
  void DisablePaddleTrtCollectShape();
  void DisablePaddleTrtOPs(const std::vector<std::string>& ops);
  void SetOpenVINOStreams(int num_streams);
  void SetOrtGraphOptLevel(int level = -1);
  void UsePaddleBackend();
  void UseLiteBackend();
};

}  // namespace fastdeploy
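
// End-to-end sketch of how this option object is typically consumed. The
// header path and Runtime::Init call are assumptions based on the FastDeploy
// API; the model paths are illustrative:
//
//   #include "fastdeploy/runtime.h"
//
//   int main() {
//     fastdeploy::RuntimeOption option;
//     option.SetModelPath("model.pdmodel", "model.pdiparams");
//     option.UseCpu();
//     option.SetCpuThreadNum(4);
//     option.UseOrtBackend();
//
//     fastdeploy::Runtime runtime;
//     if (!runtime.Init(option)) return -1;  // build the runtime from the option
//     // ... prepare FDTensor inputs and call runtime.Infer(...) ...
//     return 0;
//   }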