option.h
// Copyright (c) 2022 PaddlePaddle Authors. All Rights Reserved.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

#pragma once

#include "fastdeploy/core/fd_type.h"
#include <iostream>
#include <memory>
#include <string>
#include <vector>
#include "fastdeploy/runtime/backends/tensorrt/option.h"

namespace fastdeploy {

/*! @brief Option object to configure GraphCore IPU
 */
struct IpuOption {
  /// IPU device id
  int ipu_device_num;
  /// the batch size in the graph, only work when graph has no batch shape info
  int ipu_micro_batch_size;
  /// enable pipelining
  bool ipu_enable_pipelining;
  /// the number of batches per run in pipelining
  int ipu_batches_per_step;
  /// enable fp16
  bool ipu_enable_fp16;
  /// the number of graph replication
  int ipu_replica_num;
  /// the available memory proportion for matmul/conv
  float ipu_available_memory_proportion;
  /// enable fp16 partial for matmul, only work with fp16
  bool ipu_enable_half_partial;
};

/*! @brief Option object to configure Paddle Inference backend
 */
struct PaddleBackendOption {
  /// Print log information while initializing the Paddle Inference backend
  bool enable_log_info = false;
  /// Enable MKLDNN acceleration while running on CPU
  bool enable_mkldnn = true;
  /// Use Paddle Inference + TensorRT to run the model on GPU
  bool enable_trt = false;
  /// Enable memory optimization
  bool enable_memory_optimize = true;
  /// Enable IR debugging
  bool switch_ir_debug = false;

  /*
   * @brief IPU option, this will configure the IPU hardware when the model is inferred on IPU
   */
  IpuOption ipu_option;

  /// Collect dynamic shape information for the model while enable_trt is true
  bool collect_trt_shape = false;
  /// Cache size of input shapes while enable_mkldnn is true, -1 means no limit
  int mkldnn_cache_size = -1;
  /// Initial memory size (MB) allocated on GPU
  int gpu_mem_init_size = 100;
  /// Enable the fixed-size optimization for transformer models
  bool enable_fixed_size_opt = false;

  /// Disable type of operators run on TensorRT
  void DisableTrtOps(const std::vector<std::string>& ops) {
    trt_disabled_ops_.insert(trt_disabled_ops_.end(), ops.begin(), ops.end());
  }

  /// Delete pass by name
  void DeletePass(const std::string& pass_name) {
    delete_pass_names.push_back(pass_name);
  }

  void SetIpuConfig(bool enable_fp16, int replica_num,
                    float available_memory_proportion,
                    bool enable_half_partial) {
    ipu_option.ipu_enable_fp16 = enable_fp16;
    ipu_option.ipu_replica_num = replica_num;
    ipu_option.ipu_available_memory_proportion =
        available_memory_proportion;
    ipu_option.ipu_enable_half_partial = enable_half_partial;
  }

  // The parameters below may be removed, please do not
  // read or write them directly
  TrtBackendOption trt_option;
  bool enable_pinned_memory = false;
  void* external_stream_ = nullptr;
  Device device = Device::CPU;
  int device_id = 0;
  std::vector<std::string> trt_disabled_ops_{};
  int cpu_thread_num = 8;
  std::vector<std::string> delete_pass_names = {};
  std::string model_file = "";   // Path of model file
  std::string params_file = "";  // Path of parameters file, can be empty

  // Load model and parameters from memory
  bool model_from_memory_ = false;
};
}  // namespace fastdeploy
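
A minimal usage sketch of the options defined above; the struct name, members, and methods come from this header, while the concrete values, pass name, and operator type are illustrative placeholders:

#include "fastdeploy/runtime/backends/paddle/option.h"  // assumed install path of this header

int main() {
  fastdeploy::PaddleBackendOption option;
  option.enable_log_info = true;        // print Paddle Inference logs
  option.enable_mkldnn = true;          // MKLDNN acceleration on CPU
  option.mkldnn_cache_size = 10;        // cache up to 10 input shapes
  option.DeletePass("example_pass_name");     // placeholder pass name
  option.DisableTrtOps({"example_op_type"});  // placeholder operator type
  option.SetIpuConfig(/*enable_fp16=*/false, /*replica_num=*/1,
                      /*available_memory_proportion=*/0.6f,
                      /*enable_half_partial=*/false);
  return 0;
}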