FastDeploy  latest
Fast & Easy to Deploy!
option.h
1 // Copyright (c) 2022 PaddlePaddle Authors. All Rights Reserved.
2 //
3 // Licensed under the Apache License, Version 2.0 (the "License");
4 // you may not use this file except in compliance with the License.
5 // You may obtain a copy of the License at
6 //
7 // http://www.apache.org/licenses/LICENSE-2.0
8 //
9 // Unless required by applicable law or agreed to in writing, software
10 // distributed under the License is distributed on an "AS IS" BASIS,
11 // WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
12 // See the License for the specific language governing permissions and
13 // limitations under the License.
14 
15 #pragma once
16 #include "fastdeploy/core/fd_type.h"
17 #include <iostream>
18 #include <map>
19 #include <string>
20 #include <vector>
21 
22 namespace fastdeploy {
23 
// Maximum batch size for the TensorRT engine; per the upstream docs this is
// deprecated in TensorRT 8.x (explicit-batch engines ignore it).
28  size_t max_batch_size = 32;
29 
// Maximum GPU workspace size (in bytes) TensorRT may use while building the
// engine; 1 << 30 is 1 GiB.
31  size_t max_workspace_size = 1 << 30;
32 
// Emit TensorRT log information while converting the ONNX model to TensorRT.
34  bool enable_log_info = false;
35 
36 
// Enable half-precision (FP16) inference; on devices without FP16 support it
// falls back to float32 (per the field's documentation).
38  bool enable_fp16 = false;
39 
47  void SetShape(const std::string& tensor_name,
48  const std::vector<int32_t>& min,
49  const std::vector<int32_t>& opt,
50  const std::vector<int32_t>& max) {
51  min_shape[tensor_name].clear();
52  max_shape[tensor_name].clear();
53  opt_shape[tensor_name].clear();
54  min_shape[tensor_name].assign(min.begin(), min.end());
55  if (opt.size() == 0) {
56  opt_shape[tensor_name].assign(min.begin(), min.end());
57  } else {
58  opt_shape[tensor_name].assign(opt.begin(), opt.end());
59  }
60  if (max.size() == 0) {
61  max_shape[tensor_name].assign(min.begin(), min.end());
62  } else {
63  max_shape[tensor_name].assign(max.begin(), max.end());
64  }
65  }
// Cache file path for the TensorRT backend: the serialized engine is stored
// here so subsequent runs can skip the engine-build step (see field docs).
67  std::string serialize_file = "";
68 
69  // The below parameters may be removed in next version, please do not
70  // visit or use them directly
// Per-tensor dynamic-shape ranges populated by SetShape().
71  std::map<std::string, std::vector<int32_t>> max_shape;
72  std::map<std::string, std::vector<int32_t>> min_shape;
73  std::map<std::string, std::vector<int32_t>> opt_shape;
// NOTE(review): presumably toggles pinned (page-locked) host memory for
// host<->device copies — not documented here; confirm against the backend.
74  bool enable_pinned_memory = false;
// NOTE(review): looks like an externally supplied compute stream handle —
// confirm expected type (e.g. cudaStream_t) against the backend code.
75  void* external_stream_ = nullptr;
// Device id to run inference on — presumably the CUDA device index; confirm.
76  int gpu_id = 0;
77  std::string model_file = ""; // Path of model file
78  std::string params_file = ""; // Path of parameters file, can be empty
79  // format of input model
// AUTOREC auto-recognizes the model format from the model file name.
80  ModelFormat model_format = ModelFormat::AUTOREC;
81 };
82 
83 
84 } // namespace fastdeploy
bool enable_log_info
Enable TensorRT log output while converting the ONNX model to TensorRT.
Definition: option.h:34
std::string serialize_file
Set cache file path while using the TensorRT backend. Loading a Paddle/ONNX model and initializing TensorRT ...
Definition: option.h:67
Auto recognize the model format by model file name.
Definition: enum_variables.h:68
void SetShape(const std::string &tensor_name, const std::vector< int32_t > &min, const std::vector< int32_t > &opt, const std::vector< int32_t > &max)
Set shape range of input tensor for the model that contain dynamic input shape while using TensorRT b...
Definition: option.h:47
ModelFormat
Definition: enum_variables.h:67
size_t max_workspace_size
max_workspace_size for TensorRT
Definition: option.h:31
size_t max_batch_size
max_batch_size; it's deprecated in TensorRT 8.x
Definition: option.h:28
Option object to configure TensorRT backend.
Definition: option.h:26
bool enable_fp16
Enable half precision inference; on devices that do not support half precision, it will fall back to float3...
Definition: option.h:38
All C++ FastDeploy APIs are defined inside this namespace.
Definition: option.h:16