zh-cn/stable/inference_8h_source.html

 #ifndef _NNDEPLOY_INFERENCE_INFERENCE_H_

 #define _NNDEPLOY_INFERENCE_INFERENCE_H_


 #include "nndeploy/base/any.h"

 #include "nndeploy/base/common.h"

 #include "nndeploy/base/glic_stl_include.h"

 #include "nndeploy/base/log.h"

 #include "nndeploy/base/macro.h"

 #include "nndeploy/base/object.h"

 #include "nndeploy/base/status.h"

 #include "nndeploy/base/string.h"

 #include "nndeploy/device/buffer.h"

 #include "nndeploy/device/device.h"

 #include "nndeploy/device/memory_pool.h"

 #include "nndeploy/device/tensor.h"

 #include "nndeploy/inference/inference_param.h"


 namespace nndeploy {

 namespace inference {


 // Base class for inference. Concrete inference backends derive from this
 // class and implement the pure virtual members (init, deinit, reshape, run,
 // getOutputTensorAfterRun). Only declarations are visible in this header;
 // the member definitions live elsewhere.
 class NNDEPLOY_CC_API Inference {

  public:

   // Constructs the object from the inference framework type.
   Inference(base::InferenceType type);

   virtual ~Inference();


   // Presumably returns type_ - definition not in this header, TODO confirm.
   base::InferenceType getInferenceType();


   // Set the inference param (a base-class pointer is used here).
   base::Status setParam(base::Param *param);

   // Same as setParam, but the param is passed as a shared_ptr.
   base::Status setParamSharedPtr(std::shared_ptr<base::Param> param);


   // Get the inference param (as a base-class pointer).
   base::Param *getParam();

   // Get the inference param as a shared_ptr to the base class.
   std::shared_ptr<base::Param> getParamSharedPtr();


   // Returns the device_type_ field of inference_param_.
   // NOTE(review): inference_param_ is dereferenced without a null check;
   // confirm it is always set before this can be called.
   base::DeviceType getDeviceType() { return inference_param_->device_type_; }


   // Stream setter/getter. Presumably backed by stream_ and
   // is_external_stream_ - definitions not in this header, TODO confirm.
   void setStream(device::Stream *stream);

   device::Stream *getStream();


   // Initialize inference. Must be implemented by the backend.
   virtual base::Status init() = 0;

   // Deinitialize inference. Must be implemented by the backend.
   virtual base::Status deinit() = 0;


   // For dynamic-input inference: get the min_shape of the input tensors.
   base::ShapeMap getMinShape();

   // For dynamic-input inference: get the opt_shape of the input tensors.
   base::ShapeMap getOptShape();

   // For dynamic-input inference: get the max_shape of the input tensors.
   base::ShapeMap getMaxShape();

   // For dynamic-input inference: set the shape of the input tensors.
   virtual base::Status reshape(base::ShapeMap &shape_map) = 0;


   // Get the size of the memory required by inference.
   virtual int64_t getMemorySize();

   // Set the memory required by inference (the memory is allocated
   // externally).
   virtual base::Status setMemory(device::Buffer *buffer);

   // Get the amount of computation of the inference (GFLOPs).
   virtual float getGFLOPs();


   // Whether this is a multi-batch inference.
   virtual bool isBatch();


   // Whether this inference instance shares a context with nndeploy.
   virtual bool isShareContext();

   // Whether this inference instance shares a stream with nndeploy.
   virtual bool isShareStream();

   // Whether the input is dynamic.
   virtual bool isInputDynamic();

   // Whether the output is dynamic.
   virtual bool isOutputDynamic();

   // Whether the input tensors allocated inside the inference framework can
   // be operated on.
   virtual bool canOpInput();

   // Whether the output tensors allocated inside the inference framework can
   // be operated on.
   virtual bool canOpOutput();


   // Get the number of input tensors.
   virtual int getNumOfInputTensor();

   // Get the number of output tensors.
   virtual int getNumOfOutputTensor();


   // Get the name of the i-th input.
   virtual std::string getInputName(int i);

   // Get the name of the i-th output.
   virtual std::string getOutputName(int i);

   // Get the names of all input tensors.
   virtual std::vector<std::string> getAllInputTensorName();

   // Get the names of all output tensors.
   virtual std::vector<std::string> getAllOutputTensorName();


   // Get the shape of the input called `name`.
   virtual base::IntVector getInputShape(const std::string &name);

   // Get a ShapeMap covering all inputs.
   virtual base::ShapeMap getAllInputShape();

   // Get the tensor desc of the input called `name`.
   virtual device::TensorDesc getInputTensorDesc(const std::string &name);

   // Get the tensor desc of the output called `name`.
   virtual device::TensorDesc getOutputTensorDesc(const std::string &name);


   // Get the input tensor align desc for `name`.
   virtual device::TensorDesc getInputTensorAlignDesc(const std::string &name);

   // Get the output tensor align desc for `name`.
   virtual device::TensorDesc getOutputTensorAlignDesc(const std::string &name);


   // Get all input tensors as a name -> tensor map.
   virtual std::map<std::string, device::Tensor *> getAllInputTensorMap();

   // Get all output tensors as a name -> tensor map.
   virtual std::map<std::string, device::Tensor *> getAllOutputTensorMap();


   // Get all input tensors as a vector.
   virtual std::vector<device::Tensor *> getAllInputTensorVector();

   // Get all output tensors as a vector.
   virtual std::vector<device::Tensor *> getAllOutputTensorVector();


   // Get the input tensor called `name`.
   virtual device::Tensor *getInputTensor(const std::string &name);

   // Get the output tensor called `name`.
   virtual device::Tensor *getOutputTensor(const std::string &name);


   // Set the input tensor for `name`. Presumably recorded in
   // external_input_tensors_ - TODO confirm against the definition.
   virtual base::Status setInputTensor(const std::string &name,

                                       device::Tensor *input_tensor);


   // Run inference. Must be implemented by the backend.
   virtual base::Status run() = 0;


   // Get the output tensor called `name`; intended for use after run().
   // data_format defaults to base::kDataFormatAuto. The exact meaning of
   // device_type / is_copy and the ownership of the returned pointer are
   // defined by the backend implementation - TODO confirm.
   virtual device::Tensor *getOutputTensorAfterRun(

       const std::string &name, base::DeviceType device_type, bool is_copy,

       base::DataFormat data_format = base::kDataFormatAuto) = 0;


  protected:

   // Type of the inference framework.
   base::InferenceType type_;

   // Configuration of the inference framework.
   std::shared_ptr<InferenceParam> inference_param_;


   // Defaults to true; presumably what isShareContext() reports - TODO
   // confirm.
   bool is_share_context_ = true;


   // Defaults to false; presumably marks stream_ as supplied from outside
   // via setStream() - TODO confirm.
   bool is_external_stream_ = false;

   // Stream pointer, null by default.
   device::Stream *stream_ = nullptr;


   // Map of input tensors, keyed by name.
   std::map<std::string, device::Tensor *> input_tensors_;

   // Map of output tensors, keyed by name.
   std::map<std::string, device::Tensor *> output_tensors_;


   // Map of external input tensors, keyed by name.
   std::map<std::string, device::Tensor *> external_input_tensors_;

 };


 // Creator interface for inference frameworks: one implementation exists per
 // concrete Inference type and knows how to build it.
 class InferenceCreator {
  public:
   // Virtual so that creators can be destroyed through a base pointer.
   virtual ~InferenceCreator() = default;

   // Builds an Inference for the given inference type and hands it back as a
   // shared_ptr (an earlier revision of this interface returned a raw
   // Inference pointer instead).
   virtual std::shared_ptr<Inference> createInference(
       base::InferenceType type) = 0;
 };


 // Creator class template for inference frameworks: implements
 // InferenceCreator for one concrete inference class T.
 //
 // T must be constructible from a base::InferenceType and convertible to
 // Inference, otherwise createInference() fails to compile when instantiated.
 template <typename T>
 class TypeInferenceCreator : public InferenceCreator {
   // There is no access specifier here, so this member is private; it is
   // still reachable through InferenceCreator's public virtual function.
   //
   // Marked `override` so that any drift between this signature and the base
   // class declaration becomes a compile error instead of silently
   // introducing a new, never-called virtual function.
   std::shared_ptr<Inference> createInference(
       base::InferenceType type) override {
     return std::make_shared<T>(type);
   }
 };


 // Get the global inference creator map: a reference to a map from
 // base::InferenceType to the shared InferenceCreator registered for it.
 // Defined outside this header.
 extern NNDEPLOY_CC_API std::map<base::InferenceType, std::shared_ptr<InferenceCreator>> &

 getGlobalInferenceCreatorMap();


 // Registration class template for inference framework creators.
 //
 // Constructing a TypeInferenceRegister<T> default-constructs a creator of
 // type T and stores it in the global inference creator map under `type`.
 // operator[] is used, so an entry already registered for `type` is
 // replaced.
 template <typename T>
 class TypeInferenceRegister {
  public:
   explicit TypeInferenceRegister(base::InferenceType type) {
     // make_shared instead of shared_ptr<T>(new T()): no naked new, and the
     // object and its control block share a single allocation.
     getGlobalInferenceCreatorMap()[type] = std::make_shared<T>();
   }
 };


 // extern NNDEPLOY_CC_API Inference *createInference(base::InferenceType type);


 // Create an Inference object for the given inference type. Defined outside
 // this header; presumably looks the type up in the global inference creator
 // map - TODO confirm.
 extern NNDEPLOY_CC_API std::shared_ptr<Inference> createInference(base::InferenceType type);


 }  // namespace inference

 }  // namespace nndeploy


 #endif

any.h

buffer.h

nndeploy::base::Param
Definition: param.h:37

nndeploy::base::Status
Definition: status.h:87

nndeploy::device::Buffer
Definition: buffer.h:21

nndeploy::device::Stream
流类
Definition: device.h:387

nndeploy::device::Tensor
Tensor类
Definition: tensor.h:26

nndeploy::inference::InferenceCreator
推理框架的创建类
Definition: inference.h:384

nndeploy::inference::InferenceCreator::~InferenceCreator
virtual ~InferenceCreator()
Definition: inference.h:386

nndeploy::inference::InferenceCreator::createInference
virtual std::shared_ptr< Inference > createInference(base::InferenceType type)=0

nndeploy::inference::Inference
推理的基类
Definition: inference.h:40

nndeploy::inference::Inference::getAllOutputTensorVector
virtual std::vector< device::Tensor * > getAllOutputTensorVector()
Get the All Output Tensor Vector object.

nndeploy::inference::Inference::getInputName
virtual std::string getInputName(int i)
Get the Input Name object.

nndeploy::inference::Inference::run
virtual base::Status run()=0
推理

nndeploy::inference::Inference::deinit
virtual base::Status deinit()=0
反初始化推理

nndeploy::inference::Inference::getNumOfOutputTensor
virtual int getNumOfOutputTensor()
Get the Num Of Output Tensor object.

nndeploy::inference::Inference::getNumOfInputTensor
virtual int getNumOfInputTensor()
Get the Num Of Input Tensor object.

nndeploy::inference::Inference::setMemory
virtual base::Status setMemory(device::Buffer *buffer)
设置推理所需的内存（推理内存由外部分配）

nndeploy::inference::Inference::canOpInput
virtual bool canOpInput()
是否可以操作推理框架内部分配的输入tensor

nndeploy::inference::Inference::getParam
base::Param * getParam()
Get the Inference Param（这里使用基类指针）

nndeploy::inference::Inference::getInputTensorDesc
virtual device::TensorDesc getInputTensorDesc(const std::string &name)
Get the Input Tensor Desc object.

nndeploy::inference::Inference::Inference
Inference(base::InferenceType type)

nndeploy::inference::Inference::getStream
device::Stream * getStream()

nndeploy::inference::Inference::type_
base::InferenceType type_
推理框架的类型
Definition: inference.h:336

nndeploy::inference::Inference::~Inference
virtual ~Inference()

nndeploy::inference::Inference::isOutputDynamic
virtual bool isOutputDynamic()
是否为动态输出

nndeploy::inference::Inference::getInputShape
virtual base::IntVector getInputShape(const std::string &name)
Get the Input Shape object.

nndeploy::inference::Inference::getOutputName
virtual std::string getOutputName(int i)
Get the Output Name object.

nndeploy::inference::Inference::setParam
base::Status setParam(base::Param *param)
Set the Inference Param（这里使用基类指针）

nndeploy::inference::Inference::getInferenceType
base::InferenceType getInferenceType()

nndeploy::inference::Inference::getAllOutputTensorMap
virtual std::map< std::string, device::Tensor * > getAllOutputTensorMap()
Get the All Output Tensor Map object.

nndeploy::inference::Inference::isShareStream
virtual bool isShareStream()
该推理实例是否与nndeploy共享一个stream

nndeploy::inference::Inference::getInputTensor
virtual device::Tensor * getInputTensor(const std::string &name)
Get the Input Tensor object.

nndeploy::inference::Inference::init
virtual base::Status init()=0
初始化推理

nndeploy::inference::Inference::setInputTensor
virtual base::Status setInputTensor(const std::string &name, device::Tensor *input_tensor)
Set the Input Tensor object.

nndeploy::inference::Inference::isShareContext
virtual bool isShareContext()
该推理实例是否与nndeploy共享一个context

nndeploy::inference::Inference::getOutputTensorAlignDesc
virtual device::TensorDesc getOutputTensorAlignDesc(const std::string &name)
Get the Output Tensor Align Desc object.

nndeploy::inference::Inference::reshape
virtual base::Status reshape(base::ShapeMap &shape_map)=0
针对动态输入的推理，设置输入tensor的shape

nndeploy::inference::Inference::getOutputTensor
virtual device::Tensor * getOutputTensor(const std::string &name)
Get the Output Tensor object.

nndeploy::inference::Inference::input_tensors_
std::map< std::string, device::Tensor * > input_tensors_
输入tensor的map
Definition: inference.h:363

nndeploy::inference::Inference::isInputDynamic
virtual bool isInputDynamic()
是否为动态输入

nndeploy::inference::Inference::getAllInputTensorVector
virtual std::vector< device::Tensor * > getAllInputTensorVector()
Get the All Input Tensor Vector object.

nndeploy::inference::Inference::getOutputTensorAfterRun
virtual device::Tensor * getOutputTensorAfterRun(const std::string &name, base::DeviceType device_type, bool is_copy, base::DataFormat data_format=base::kDataFormatAuto)=0
Get the Output Tensor object.

nndeploy::inference::Inference::isBatch
virtual bool isBatch()
是否为多batch推理

nndeploy::inference::Inference::getAllInputTensorName
virtual std::vector< std::string > getAllInputTensorName()
Get the All Input Tensor Name object.

nndeploy::inference::Inference::getInputTensorAlignDesc
virtual device::TensorDesc getInputTensorAlignDesc(const std::string &name)
Get the Input Tensor Align Desc object.

nndeploy::inference::Inference::setParamSharedPtr
base::Status setParamSharedPtr(std::shared_ptr< base::Param > param)

nndeploy::inference::Inference::getAllInputShape
virtual base::ShapeMap getAllInputShape()
Get the All Input Shape object.

nndeploy::inference::Inference::getGFLOPs
virtual float getGFLOPs()
获得推理计算量

nndeploy::inference::Inference::getDeviceType
base::DeviceType getDeviceType()
Definition: inference.h:64

nndeploy::inference::Inference::getParamSharedPtr
std::shared_ptr< base::Param > getParamSharedPtr()

nndeploy::inference::Inference::getOptShape
base::ShapeMap getOptShape()
针对动态输入的推理，获取输入tensor的opt_shape

nndeploy::inference::Inference::getMaxShape
base::ShapeMap getMaxShape()
针对动态输入的推理，获取输入tensor的max_shape

nndeploy::inference::Inference::setStream
void setStream(device::Stream *stream)

nndeploy::inference::Inference::getAllInputTensorMap
virtual std::map< std::string, device::Tensor * > getAllInputTensorMap()
Get the All Input Tensor Map object.

nndeploy::inference::Inference::output_tensors_
std::map< std::string, device::Tensor * > output_tensors_
输出tensor的map
Definition: inference.h:370

nndeploy::inference::Inference::canOpOutput
virtual bool canOpOutput()
是否可以操作推理框架内部分配的输出tensor

nndeploy::inference::Inference::inference_param_
std::shared_ptr< InferenceParam > inference_param_
推理框架的配置
Definition: inference.h:342

nndeploy::inference::Inference::getMinShape
base::ShapeMap getMinShape()
针对动态输入的推理，获取输入tensor的min_shape

nndeploy::inference::Inference::external_input_tensors_
std::map< std::string, device::Tensor * > external_input_tensors_
外部输入tensor的map
Definition: inference.h:377

nndeploy::inference::Inference::getMemorySize
virtual int64_t getMemorySize()
获取推理所需的内存大小

nndeploy::inference::Inference::getAllOutputTensorName
virtual std::vector< std::string > getAllOutputTensorName()
Get the All Output Tensor Name object.

nndeploy::inference::Inference::getOutputTensorDesc
virtual device::TensorDesc getOutputTensorDesc(const std::string &name)
Get the Output Tensor Desc object.

nndeploy::inference::TypeInferenceCreator
推理框架的创建类模板
Definition: inference.h:397

nndeploy::inference::TypeInferenceRegister
推理框架的创建类的注册类模板
Definition: inference.h:420

nndeploy::inference::TypeInferenceRegister::TypeInferenceRegister
TypeInferenceRegister(base::InferenceType type)
Definition: inference.h:422

common.h

device.h

glic_stl_include.h

inference_param.h

log.h

macro.h

NNDEPLOY_CC_API
#define NNDEPLOY_CC_API
api
Definition: macro.h:29

memory_pool.h

nndeploy::base::InferenceType
InferenceType
Definition: common.h:284

nndeploy::base::IntVector
std::vector< int > IntVector
Definition: common.h:379

nndeploy::base::ShapeMap
std::map< std::string, std::vector< int > > ShapeMap
Definition: common.h:381

nndeploy::base::DataFormat
DataFormat
Definition: common.h:130

nndeploy::base::kDataFormatAuto
@ kDataFormatAuto
Definition: common.h:161

nndeploy::inference::createInference
std::shared_ptr< Inference > createInference(base::InferenceType type)
Create an Inference object.

nndeploy::inference::getGlobalInferenceCreatorMap
std::map< base::InferenceType, std::shared_ptr< InferenceCreator > > & getGlobalInferenceCreatorMap()
Get the Global Inference Creator Map object.

nndeploy
Definition: common.h:10

object.h

status.h

string.h

nndeploy::base::DeviceType
Definition: common.h:109

nndeploy::device::TensorDesc
TensorDesc.
Definition: type.h:87

tensor.h