zh-cn/stable/inference__param_8h_source.html

 #ifndef _NNDEPLOY_INFERENCE_INFERENCE_PARAM_H_

 #define _NNDEPLOY_INFERENCE_INFERENCE_PARAM_H_


 #include "nndeploy/base/any.h"

 #include "nndeploy/base/common.h"

 #include "nndeploy/base/file.h"

 #include "nndeploy/base/glic_stl_include.h"

 #include "nndeploy/base/log.h"

 #include "nndeploy/base/macro.h"

 #include "nndeploy/base/object.h"

 #include "nndeploy/base/param.h"

 #include "nndeploy/base/status.h"

 #include "nndeploy/base/string.h"


 namespace nndeploy {

 namespace inference {


 /**
  * @brief InferenceParam is the base class of all inference param.
  *
  * Declares the configuration shared by inference backends (model source,
  * input/output description, device, precision, dynamic-shape ranges, ...)
  * together with typed getters/setters and JSON (rapidjson) hooks.
  * All data members below are declared under the single `public:` specifier,
  * so they are directly accessible in addition to the accessors.
  */
 class NNDEPLOY_CC_API InferenceParam : public base::Param {

  public:

   InferenceParam();

   // Constructs the parameter object for a given inference type.
   InferenceParam(base::InferenceType type);

   virtual ~InferenceParam();


   // Copy construction and copy assignment are compiler-generated
   // (member-wise).
   InferenceParam(const InferenceParam& param) = default;

   InferenceParam& operator=(const InferenceParam& param) = default;


   // PARAM_COPY / PARAM_COPY_TO are macros provided by nndeploy/base/param.h.
   PARAM_COPY(InferenceParam)

   PARAM_COPY_TO(InferenceParam)


   // Generic key/value accessors. The set of supported keys is defined by the
   // implementation, which is not visible in this header.
   virtual base::Status set(const std::string& key, base::Any& any);

   virtual base::Status get(const std::string& key, base::Any& any);


   // Typed accessors for the data members declared further below.
   // NOTE(review): several setters take `int i = -1`; presumably `i` is an
   // index into the corresponding vector and -1 selects a default behavior --
   // confirm against the implementation.
   base::InferenceType getInferenceType() const;

   void setInferenceType(base::InferenceType type);

   base::ModelType getModelType() const;

   void setModelType(base::ModelType type);

   bool getIsPath() const;

   void setIsPath(bool is_path);

   const std::vector<std::string>& getModelValue() const;

   void setModelValue(const std::vector<std::string>& model_value);

   void setModelValue(const std::string& model_value, int i = -1);

   int getInputNum() const;

   void setInputNum(int input_num);

   const std::vector<std::string>& getInputName() const;

   void setInputName(const std::vector<std::string>& input_name);

   void setInputName(const std::string& input_name, int i = -1);

   const std::vector<std::vector<int>>& getInputShape() const;

   void setInputShape(const std::vector<std::vector<int>>& input_shape);

   void setInputShape(const std::vector<int>& input_shape, int i = -1);

   int getOutputNum() const;

   void setOutputNum(int output_num);

   const std::vector<std::string>& getOutputName() const;

   void setOutputName(const std::vector<std::string>& output_name);

   void setOutputName(const std::string& output_name, int i = -1);

   base::EncryptType getEncryptType() const;

   void setEncryptType(base::EncryptType type);

   const std::string& getLicense() const;

   void setLicense(const std::string& license);

   base::DeviceType getDeviceType() const;

   void setDeviceType(base::DeviceType type);

   int getNumThread() const;

   void setNumThread(int num_thread);

   int getGpuTuneKernel() const;

   void setGpuTuneKernel(int gpu_tune_kernel);

   base::ShareMemoryType getShareMemoryMode() const;

   void setShareMemoryMode(base::ShareMemoryType mode);

   base::PrecisionType getPrecisionType() const;

   void setPrecisionType(base::PrecisionType type);

   base::PowerType getPowerType() const;

   void setPowerType(base::PowerType type);

   bool getIsDynamicShape() const;

   void setIsDynamicShape(bool is_dynamic_shape);

   const base::ShapeMap& getMinShape() const;

   void setMinShape(const base::ShapeMap& min_shape);

   const base::ShapeMap& getOptShape() const;

   void setOptShape(const base::ShapeMap& opt_shape);

   const base::ShapeMap& getMaxShape() const;

   void setMaxShape(const base::ShapeMap& max_shape);

   const std::vector<std::string>& getCachePath() const;

   void setCachePath(const std::vector<std::string>& cache_path);

   const std::vector<std::string>& getLibraryPath() const;

   void setLibraryPath(const std::vector<std::string>& library_path);

   void setLibraryPath(const std::string& library_path, int i = -1);


   // Inference backend type; defaults to "not supported".
   base::InferenceType inference_type_ = base::kInferenceTypeNotSupport;

   base::ModelType model_type_ = base::kModelTypeOnnx;  // Model type

   bool is_path_ = true;                                // Whether model_value_ holds paths

   std::vector<std::string> model_value_;               // Model path(s) or model content

   std::vector<std::string> external_model_data_;       // Separated (external) model weights

   int input_num_ = 1;                                  // Number of inputs

   std::vector<std::string> input_name_;                // Input names

   std::vector<std::vector<int>> input_shape_;          // Input shapes

   int output_num_ = 1;                                 // Number of outputs

   std::vector<std::string> output_name_;               // Output names

   base::EncryptType encrypt_type_ =

       base::kEncryptTypeNone;     // Encryption/decryption type of the model file

   std::string license_;           // Encryption/decryption key of the model file

   // NOTE(review): no in-class initializer here; the initial value depends on
   // base::DeviceType and the constructors, which are not visible -- confirm.
   base::DeviceType device_type_;  // Device type used for model inference

   int num_thread_ = 4;            // Number of threads for CPU inference

   int gpu_tune_kernel_ = 1;       // GPU tuning mode

   base::ShareMemoryType share_memory_mode_ =

       base::kShareMemoryTypeNoShare;  //  Shared-memory mode during inference

   base::PrecisionType precision_type_ =

       base::kPrecisionTypeFp32;                          // Precision type during inference

   base::PowerType power_type_ = base::kPowerTypeNormal;  // Power type during inference

   bool is_dynamic_shape_ = false;                        // Whether shapes are dynamic

   base::ShapeMap min_shape_ = base::ShapeMap();   // Minimum shape for dynamic input

   base::ShapeMap opt_shape_ = base::ShapeMap();   // Optimal shape for dynamic input

   base::ShapeMap max_shape_ = base::ShapeMap();   // Maximum shape for dynamic input

   std::vector<std::string> cache_path_ = {""};    // Cache path

   std::vector<std::string> library_path_ = {""};  // Dynamic library path of the third-party inference framework

   // Parallel execution type; defaults to sequential.
   base::ParallelType parallel_type_ = base::kParallelTypeSequential;

   // NOTE(review): presumably the number of workers used with parallel_type_;
   // no accessor or comment in this header confirms it.
   int worker_num_ = 1;


   // JSON (rapidjson) serialization hooks; the exact JSON layout is defined by
   // the implementation, which is not visible in this header.
   virtual base::Status serialize(rapidjson::Value& json,

                                  rapidjson::Document::AllocatorType& allocator);

   virtual base::Status deserialize(rapidjson::Value& json);

 };


 /**
  * @brief InferenceParamCreator is the base class of all inference param
  * creators.
  *
  * Abstract factory interface: concrete creators implement
  * createInferenceParam() to build an InferenceParam for a given type.
  */
 class InferenceParamCreator {
  public:
   // Virtual so that creators can be destroyed through a base pointer.
   virtual ~InferenceParamCreator() = default;

   /**
    * @brief Create an inference parameter object.
    * @param type Inference type the parameter object is requested for.
    * @return Shared pointer to an InferenceParam produced by the concrete
    *         creator.
    */
   virtual std::shared_ptr<InferenceParam> createInferenceParam(
       base::InferenceType type) = 0;
 };


 /**
  * @brief TypeInferenceParamCreator is the creator template that builds
  * parameter objects of a concrete type.
  *
  * @tparam T Parameter type to instantiate. It must be constructible from a
  *           base::InferenceType, and std::shared_ptr<T> must convert to
  *           std::shared_ptr<InferenceParam>.
  */
 template <typename T>
 class TypeInferenceParamCreator : public InferenceParamCreator {
  public:
   /**
    * @brief Create a T initialized with the given inference type.
    * @param type Inference type forwarded to T's constructor.
    * @return Shared pointer owning the newly created T.
    */
   std::shared_ptr<InferenceParam> createInferenceParam(
       base::InferenceType type) override {
     return std::make_shared<T>(type);
   }
 };


 /**
  * @brief Get the Global Inference Param Creator Map object.
  * @return Reference to the map that associates each inference type with its
  *         registered creator.
  */
 NNDEPLOY_CC_API
 std::map<base::InferenceType, std::shared_ptr<InferenceParamCreator>>&
 getGlobalInferenceParamCreatorMap();


 /**
  * @brief TypeInferenceParamRegister registers a creator of type T in the
  * global inference param creator map.
  *
  * @tparam T Creator type. It must be default-constructible, and
  *           std::shared_ptr<T> must convert to
  *           std::shared_ptr<InferenceParamCreator>.
  */
 template <typename T>
 class TypeInferenceParamRegister {
  public:
   /**
    * @brief Store a default-constructed T under `type` in the global map.
    *
    * The entry is assigned through the map's operator[], so a creator that
    * was already stored for the same type is replaced.
    *
    * @param type Inference type used as the map key.
    */
   explicit TypeInferenceParamRegister(base::InferenceType type) {
     getGlobalInferenceParamCreatorMap()[type] = std::make_shared<T>();
   }
 };


 // extern NNDEPLOY_CC_API InferenceParam *createInferenceParam(

 //     base::InferenceType type);


 /**
  * @brief Create an Inference Param object.
  * @param type Inference type the parameter object is requested for.
  * @return Shared pointer to the resulting InferenceParam.
  */
 NNDEPLOY_CC_API std::shared_ptr<InferenceParam> createInferenceParam(
     base::InferenceType type);


 }  // namespace inference

 }  // namespace nndeploy


 #endif

any.h

nndeploy::base::Param
Definition: param.h:37

nndeploy::base::Status
Definition: status.h:87

nndeploy::inference::InferenceParamCreator
InferenceParamCreator is the base class of all inference param creator.
Definition: inference_param.h:143

nndeploy::inference::InferenceParamCreator::~InferenceParamCreator
virtual ~InferenceParamCreator()
Definition: inference_param.h:145

nndeploy::inference::InferenceParamCreator::createInferenceParam
virtual std::shared_ptr< InferenceParam > createInferenceParam(base::InferenceType type)=0

nndeploy::inference::InferenceParam
InferenceParam is the base class of all inference param.
Definition: inference_param.h:22

nndeploy::inference::InferenceParam::~InferenceParam
virtual ~InferenceParam()

nndeploy::inference::InferenceParam::operator=
InferenceParam & operator=(const InferenceParam &param)=default

nndeploy::inference::InferenceParam::InferenceParam
InferenceParam()

nndeploy::inference::InferenceParam::InferenceParam
InferenceParam(base::InferenceType type)

nndeploy::inference::InferenceParam::deserialize
virtual base::Status deserialize(rapidjson::Value &json)

nndeploy::inference::InferenceParam::InferenceParam
InferenceParam(const InferenceParam &param)=default

nndeploy::inference::InferenceParam::serialize
virtual base::Status serialize(rapidjson::Value &json, rapidjson::Document::AllocatorType &allocator)

nndeploy::inference::TypeInferenceParamCreator
TypeInferenceParamCreator is the template class of all inference param.
Definition: inference_param.h:157

nndeploy::inference::TypeInferenceParamRegister
TypeInferenceParamRegister is the template class of all inference.
Definition: inference_param.h:183

nndeploy::inference::TypeInferenceParamRegister::TypeInferenceParamRegister
TypeInferenceParamRegister(base::InferenceType type)
Definition: inference_param.h:185

common.h

file.h

glic_stl_include.h

log.h

macro.h

NNDEPLOY_CC_API
#define NNDEPLOY_CC_API
api
Definition: macro.h:29

nndeploy::base::InferenceType
InferenceType
Definition: common.h:284

nndeploy::base::kInferenceTypeNotSupport
@ kInferenceTypeNotSupport
Definition: common.h:329

nndeploy::base::PrecisionType
PrecisionType
Definition: common.h:167

nndeploy::base::kPrecisionTypeFp32
@ kPrecisionTypeFp32
Definition: common.h:170

nndeploy::base::ShapeMap
std::map< std::string, std::vector< int > > ShapeMap
Definition: common.h:381

nndeploy::base::ModelType
ModelType
Definition: common.h:239

nndeploy::base::kModelTypeOnnx
@ kModelTypeOnnx
Definition: common.h:246

nndeploy::base::PowerType
PowerType
Definition: common.h:177

nndeploy::base::kPowerTypeNormal
@ kPowerTypeNormal
Definition: common.h:179

nndeploy::base::getPrecisionType
PrecisionType getPrecisionType(DataType data_type)

nndeploy::base::ParallelType
ParallelType
Definition: common.h:353

nndeploy::base::kParallelTypeSequential
@ kParallelTypeSequential
Definition: common.h:355

nndeploy::base::EncryptType
EncryptType
Definition: common.h:332

nndeploy::base::kEncryptTypeNone
@ kEncryptTypeNone
Definition: common.h:333

nndeploy::base::ShareMemoryType
ShareMemoryType
Definition: common.h:186

nndeploy::base::kShareMemoryTypeNoShare
@ kShareMemoryTypeNoShare
Definition: common.h:187

nndeploy::inference::getGlobalInferenceParamCreatorMap
std::map< base::InferenceType, std::shared_ptr< InferenceParamCreator > > & getGlobalInferenceParamCreatorMap()
Get the Global Inference Param Creator Map object.

nndeploy::inference::createInferenceParam
std::shared_ptr< InferenceParam > createInferenceParam(base::InferenceType type)
Create an Inference Param object.

nndeploy
Definition: common.h:10

object.h

param.h

PARAM_COPY_TO
#define PARAM_COPY_TO(param_type)
Definition: param.h:25

PARAM_COPY
#define PARAM_COPY(param_type)
Definition: param.h:16

status.h

string.h