fastdeploy_model.h
// Copyright (c) 2022 PaddlePaddle Authors. All Rights Reserved.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.
#pragma once
#include "fastdeploy/runtime.h"

// All C++ FastDeploy APIs are defined inside this namespace.
namespace fastdeploy {

/// Base model object for all the vision models.
class FASTDEPLOY_DECL FastDeployModel {
 public:
  /// Get model's name.
  virtual std::string ModelName() const { return "NameUndefined"; }

  /// Inference the model with the given input tensors, writing the results
  /// to output_tensors.
  virtual bool Infer(std::vector<FDTensor>& input_tensors,
                     std::vector<FDTensor>* output_tensors);

  /// Inference the model using the reused input tensors, writing the
  /// results to the reused output tensors.
  virtual bool Infer();

  /// Option used to configure the Runtime created for this model.
  RuntimeOption runtime_option;
  /// Valid backends for this model when inferring on CPU.
  std::vector<Backend> valid_cpu_backends = {Backend::ORT};
  /// Valid backends for this model when inferring on GPU.
  std::vector<Backend> valid_gpu_backends = {Backend::ORT};
  /// Valid backends for this model when inferring on IPU.
  std::vector<Backend> valid_ipu_backends = {};
  /// Valid backends for this model when inferring on TIM-VX.
  std::vector<Backend> valid_timvx_backends = {};
  /// Valid backends for this model when inferring with DirectML.
  std::vector<Backend> valid_directml_backends = {};
  /// Valid backends for this model when inferring on Ascend.
  std::vector<Backend> valid_ascend_backends = {};
  /// Valid backends for this model when inferring on KunlunXin.
  std::vector<Backend> valid_kunlunxin_backends = {};
  /// Valid backends for this model when inferring on RKNPU.
  std::vector<Backend> valid_rknpu_backends = {};
  /// Valid backends for this model when inferring on Sophgo NPU.
  std::vector<Backend> valid_sophgonpu_backends = {};

  /// Get number of inputs for this model.
  virtual int NumInputsOfRuntime() { return runtime_->NumInputs(); }
  /// Get number of outputs for this model.
  virtual int NumOutputsOfRuntime() { return runtime_->NumOutputs(); }
  /// Get input information for this model.
  virtual TensorInfo InputInfoOfRuntime(int index) {
    return runtime_->GetInputInfo(index);
  }
  /// Get output information for this model.
  virtual TensorInfo OutputInfoOfRuntime(int index) {
    return runtime_->GetOutputInfo(index);
  }
  /// Check if the model is initialized successfully.
  virtual bool Initialized() const {
    return runtime_initialized_ && initialized;
  }

  /// This is a debug interface, used to record the time of runtime
  /// (backend + h2d + d2h).
  virtual void EnableRecordTimeOfRuntime() {
    time_of_runtime_.clear();
    std::vector<double>().swap(time_of_runtime_);
    enable_record_time_of_runtime_ = true;
  }

  /// Disable recording the time of runtime; see EnableRecordTimeOfRuntime()
  /// for more detail.
  virtual void DisableRecordTimeOfRuntime() {
    enable_record_time_of_runtime_ = false;
  }

  /// Print the recorded statistic information of runtime and return it.
  virtual std::map<std::string, float> PrintStatisInfoOfRuntime();

  /// Check if the EnableRecordTimeOfRuntime() method is enabled.
  virtual bool EnabledRecordTimeOfRuntime() {
    return enable_record_time_of_runtime_;
  }
  /// Get profile time of Runtime after the profile process is done.
  virtual double GetProfileTime() {
    return runtime_->GetProfileTime();
  }
  /// Release reused input/output buffers.
  virtual void ReleaseReusedBuffer() {
    std::vector<FDTensor>().swap(reused_input_tensors_);
    std::vector<FDTensor>().swap(reused_output_tensors_);
  }

  /// Clone a new Runtime, used when multiple instances of the same model
  /// are created.
  virtual fastdeploy::Runtime* CloneRuntime() { return runtime_->Clone(); }

  /// Set the cloned Runtime for this model, taking ownership of it.
  virtual bool SetRuntime(fastdeploy::Runtime* clone_runtime) {
    runtime_ = std::unique_ptr<Runtime>(clone_runtime);
    return true;
  }

  /// Clone this model; models that do not override this return nullptr.
  virtual std::unique_ptr<FastDeployModel> Clone() {
    FDERROR << ModelName() << " doesn't support Clone() now." << std::endl;
    return nullptr;
  }

 protected:
  virtual bool InitRuntime();

  bool initialized = false;
  // Reused input tensors
  std::vector<FDTensor> reused_input_tensors_;
  // Reused output tensors
  std::vector<FDTensor> reused_output_tensors_;

 private:
  bool InitRuntimeWithSpecifiedBackend();
  bool InitRuntimeWithSpecifiedDevice();
  bool CreateCpuBackend();
  bool CreateGpuBackend();
  bool CreateIpuBackend();
  bool CreateRKNPUBackend();
  bool CreateSophgoNPUBackend();
  bool CreateTimVXBackend();
  bool CreateKunlunXinBackend();
  bool CreateASCENDBackend();
  bool CreateDirectMLBackend();
  bool IsSupported(const std::vector<Backend>& backends,
                   Backend backend);

  std::shared_ptr<Runtime> runtime_;
  bool runtime_initialized_ = false;
  // whether to record inference time
  bool enable_record_time_of_runtime_ = false;
  std::vector<double> time_of_runtime_;
};

}  // namespace fastdeploy
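
The usual way to use this class is to subclass it: a concrete model declares
which backends it can run on, fills in runtime_option with its model files,
and then calls the protected InitRuntime() to select a backend and load the
model. Below is a minimal sketch under those assumptions; MyClassifier, its
constructor arguments, and the chosen backends are illustrative, not part of
FastDeploy.

// my_classifier.h -- hypothetical subclass, for illustration only.
#pragma once
#include <memory>
#include <string>

#include "fastdeploy/fastdeploy_model.h"

namespace fastdeploy {

class MyClassifier : public FastDeployModel {
 public:
  explicit MyClassifier(const std::string& model_file,
                        const RuntimeOption& custom_option = RuntimeOption()) {
    // Backends this model is assumed to work with on each device.
    valid_cpu_backends = {Backend::ORT};
    valid_gpu_backends = {Backend::ORT};
    // Configure the runtime before initialization.
    runtime_option = custom_option;
    runtime_option.model_file = model_file;
    runtime_option.model_format = ModelFormat::ONNX;
    // InitRuntime() picks a backend matching runtime_option.device from the
    // valid_*_backends lists above and loads the model; Initialized() then
    // reports whether this succeeded.
    initialized = InitRuntime();
  }

  std::string ModelName() const override { return "MyClassifier"; }

  // Support Clone() by copying the model and giving the copy its own
  // Runtime via CloneRuntime()/SetRuntime(), so several instances can
  // serve requests concurrently.
  std::unique_ptr<FastDeployModel> Clone() override {
    auto clone_model = std::make_unique<MyClassifier>(*this);
    clone_model->SetRuntime(clone_model->CloneRuntime());
    return clone_model;
  }
};

}  // namespace fastdeploy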
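
The runtime-timing debug interface can be driven as in the following usage
sketch, which builds on the hypothetical MyClassifier above. The model path
and input preparation are placeholders, and the keys of the map returned by
PrintStatisInfoOfRuntime() are not assumed here.

// main.cc -- hypothetical usage of the runtime-timing debug interface.
#include <iostream>
#include <map>
#include <vector>

#include "my_classifier.h"  // the hypothetical header sketched above

int main() {
  fastdeploy::MyClassifier model("model.onnx");
  if (!model.Initialized()) {
    std::cerr << "Failed to initialize the model." << std::endl;
    return -1;
  }

  // Record the time of each runtime call (backend + h2d + d2h).
  model.EnableRecordTimeOfRuntime();

  std::vector<fastdeploy::FDTensor> inputs;  // fill from real data in practice
  std::vector<fastdeploy::FDTensor> outputs;
  for (int i = 0; i < 100; ++i) {
    if (!model.Infer(inputs, &outputs)) {
      std::cerr << "Inference failed." << std::endl;
      return -1;
    }
  }

  // Print the recorded statistics, then stop recording.
  std::map<std::string, float> stats = model.PrintStatisInfoOfRuntime();
  for (const auto& kv : stats) {
    std::cout << kv.first << ": " << kv.second << std::endl;
  }
  model.DisableRecordTimeOfRuntime();
  return 0;
}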