api/c_api/_nv_infer_runtime_base_8h_source.html

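/*
 * SPDX-FileCopyrightText: Copyright (c) 1993-2024 NVIDIA CORPORATION & AFFILIATES. All rights reserved.
 * SPDX-License-Identifier: Apache-2.0
 *
 * Licensed under the Apache License, Version 2.0 (the "License");
 * you may not use this file except in compliance with the License.
 * You may obtain a copy of the License at
 *
 * http://www.apache.org/licenses/LICENSE-2.0
 *
 * Unless required by applicable law or agreed to in writing, software
 * distributed under the License is distributed on an "AS IS" BASIS,
 * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
 * See the License for the specific language governing permissions and
 * limitations under the License.
 */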


#ifndef NV_INFER_RUNTIME_BASE_H

#define NV_INFER_RUNTIME_BASE_H


#include "NvInferVersion.h"

#include <cstddef>

#include <cstdint>

#include <cuda_runtime_api.h>


// Items that are marked as deprecated will be removed in a future release.
//
// This section defines three macros, selected by language standard and compiler:
//   TRT_DEPRECATED      - a deprecation attribute (empty on MSVC before C++14).
//   TRT_DEPRECATED_ENUM - either TRT_DEPRECATED or empty, see the __GNUC__ test below.
//   TRT_DEPRECATED_API  - symbol export/visibility, combined with a deprecation attribute on non-MSVC compilers.

// C++14 or newer: the standard [[deprecated]] attribute is used.
#if __cplusplus >= 201402L

#define TRT_DEPRECATED [[deprecated]]

// TRT_DEPRECATED_ENUM is left empty when __GNUC__ is below 6. An undefined __GNUC__ evaluates to 0 inside #if,
// so compilers that do not define it also take this branch.
#if __GNUC__ < 6

#define TRT_DEPRECATED_ENUM

#else

#define TRT_DEPRECATED_ENUM TRT_DEPRECATED

#endif

// On MSVC the API macro only exports the symbol; no deprecation attribute is attached.
#ifdef _MSC_VER

#define TRT_DEPRECATED_API __declspec(dllexport)

#else

#define TRT_DEPRECATED_API [[deprecated]] __attribute__((visibility("default")))

#endif

// Before C++14: fall back to compiler-specific spellings.
#else

// MSVC: both deprecation macros expand to nothing; the API macro only exports the symbol.
#ifdef _MSC_VER

#define TRT_DEPRECATED

#define TRT_DEPRECATED_ENUM

#define TRT_DEPRECATED_API __declspec(dllexport)

#else

// Other compilers: GNU-style attributes; TRT_DEPRECATED_ENUM stays empty.
#define TRT_DEPRECATED __attribute__((deprecated))

#define TRT_DEPRECATED_ENUM

#define TRT_DEPRECATED_API __attribute__((deprecated, visibility("default")))

#endif

#endif


// Defines which symbols are exported.
//
// When TENSORRT_BUILD_LIB is defined, TENSORRTAPI marks a declaration as exported
// (__declspec(dllexport) on MSVC, default visibility elsewhere).
// When it is not defined, TENSORRTAPI expands to nothing.

#ifdef TENSORRT_BUILD_LIB

#ifdef _MSC_VER

#define TENSORRTAPI __declspec(dllexport)

#else

#define TENSORRTAPI __attribute__((visibility("default")))

#endif

#else

#define TENSORRTAPI

#endif

// TRTNOEXCEPT is defined with an empty replacement list, so it expands to nothing.
// NOTE(review): presumably kept for source compatibility with older code - confirm.
#define TRTNOEXCEPT

// Direct-inclusion guard: compilation fails unless NV_INFER_INTERNAL_INCLUDE has been defined
// before this header is processed. The diagnostic text says: "Do not directly include this file.
// Include NvInferRuntime.h or NvInferPluginUtils.h".
#if !defined(NV_INFER_INTERNAL_INCLUDE)

static_assert(false, "不要直接包含此文件。请包含 NvInferRuntime.h 或 NvInferPluginUtils.h");

#endif


// Forward declarations of two structs, made inside an extern "C" linkage block.
// Only the names are introduced here; the struct definitions are not visible in this header.
// NOTE(review): presumably the opaque context types of cuBLAS and cuDNN - confirm.
extern "C"

{

 struct cublasContext;

 struct cudnnContext;

}


// Packs a (major, minor, patch) version triple into one long integer:
// major * 10000 + minor * 100 + patch. Every argument is parenthesized, so expressions may be passed.
#define NV_TENSORRT_VERSION_INT(major, minor, patch) (((major) * 10000L) + ((minor) * 100L) + ((patch) * 1L))

// Packed version number built from the NV_TENSORRT_MAJOR, NV_TENSORRT_MINOR and NV_TENSORRT_PATCH macros.
#define NV_TENSORRT_VERSION NV_TENSORRT_VERSION_INT(NV_TENSORRT_MAJOR, NV_TENSORRT_MINOR, NV_TENSORRT_PATCH)


namespace nvinfer1

{

// char_t is the type used by TensorRT to represent all valid characters.
using char_t = char;


// AsciiChar is an alias of char_t.
using AsciiChar = char_t;


// Forward declaration of IErrorRecorder inside the versioned namespace v_1_0.
namespace v_1_0

{

class IErrorRecorder;

}

// Makes the v_1_0 class reachable under the unversioned name IErrorRecorder in the enclosing namespace.
using IErrorRecorder = v_1_0::IErrorRecorder;


namespace impl

{

// Declaration of the EnumMaxImpl struct, used to store the maximum number of elements in an enumeration type.
// The primary template is declared but not defined; the enums in this file provide explicit
// specializations that define kVALUE.
template <typename T>

struct EnumMaxImpl;

} // namespace impl


// Maximum number of elements in the enumeration type T.
// Returns impl::EnumMaxImpl<T>::kVALUE, so T needs a matching EnumMaxImpl specialization.
template <typename T>

constexpr int32_t EnumMax() noexcept

{

 return impl::EnumMaxImpl<T>::kVALUE;

}


// The type of weights and tensors.
enum class DataType : int32_t

{

 // 32-bit floating point format.
 kFLOAT = 0,


 // IEEE 16-bit floating-point format - has a 5 bit exponent and 11 bit mantissa.
 kHALF = 1,


 // Signed 8-bit integer representing a quantized floating-point value.
 kINT8 = 2,


 // Signed 32-bit integer format.
 kINT32 = 3,


 // 8-bit boolean. 0 = false, 1 = true, other values undefined.
 kBOOL = 4,


 // NOTE(review): presumably an unsigned 8-bit integer format - confirm.
 kUINT8 = 5,


 // NOTE(review): presumably an 8-bit floating point format - confirm.
 kFP8 = 6,


 // Brain float - has an 8 bit exponent and 8 bit mantissa.
 kBF16 = 7,


 // Signed 64-bit integer type.
 kINT64 = 8,


 // Signed 4-bit integer type.
 kINT4 = 9,


 // NOTE(review): presumably a 4-bit floating point format - confirm.
 kFP4 = 10,

};


namespace impl

{

// Specialization that backs EnumMax<DataType>().
template <>

struct EnumMaxImpl<DataType>

{

 // Number of DataType enumerators (values 0 through 10); keep in step with the enum above.
 static constexpr int32_t kVALUE = 11;

};

} // namespace impl


// Holds the rank of a tensor together with a fixed-capacity array of per-dimension extents.
// The class has only public data members and no constructors, so it remains an aggregate.
class Dims64
{
public:
    // The maximum rank (number of dimensions) supported for a tensor.
    static constexpr int32_t MAX_DIMS{8};

    // The rank (number of dimensions).
    int32_t nbDims;

    // The extent of each dimension.
    // NOTE(review): presumably only the first nbDims entries are meaningful - confirm.
    int64_t d[MAX_DIMS];
};

// Dims is an alias of Dims64.
using Dims = Dims64;


// InterfaceKind is a C-style string that names an interface.
using InterfaceKind = char const*;

// Version information associated with a TRT interface.
// The class has only public data members and no constructors, so it can be brace-initialized
// in declaration order: kind, major, minor.
class InterfaceInfo
{
public:
    // Name of the interface.
    InterfaceKind kind;

    // Major version number of the interface.
    int32_t major;

    // Minor version number of the interface.
    int32_t minor;
};


// Programming language used in the implementation of a TRT interface.
enum class APILanguage : int32_t

{

 // Implemented in C++.
 kCPP = 0,

 // Implemented in Python.
 kPYTHON = 1

};


namespace impl

{

// Specialization that backs EnumMax<APILanguage>().
template <>

struct EnumMaxImpl<APILanguage>

{

 // Number of APILanguage enumerators (values 0 and 1); keep in step with the enum above.
 static constexpr int32_t kVALUE = 2;

};

} // namespace impl


// An interface class for version control.
// Derived interfaces report their kind and version through getInterfaceInfo().
class IVersionedInterface
{
public:
    // The language used to build the implementation of this interface.
    // The default implementation reports APILanguage::kCPP.
    virtual APILanguage getAPILanguage() const noexcept
    {
        return APILanguage::kCPP;
    }

    // Return version information associated with this interface.
    virtual InterfaceInfo getInterfaceInfo() const noexcept = 0;

    virtual ~IVersionedInterface() noexcept = default;

protected:
    // Construction, copy and move are protected, so they are reachable only through derived classes.
    IVersionedInterface() = default;
    IVersionedInterface(IVersionedInterface const&) = default;
    IVersionedInterface(IVersionedInterface&&) = default;

    // The assignment operators are lvalue-ref-qualified (&), so assigning to a temporary does not compile.
    IVersionedInterface& operator=(IVersionedInterface const&) & = default;
    IVersionedInterface& operator=(IVersionedInterface&&) & = default;
};


// Error codes that can be returned by TensorRT during execution.
// NOTE(review): the individual enumerators carry no description in this file; their meaning is
// only what the names suggest - confirm against the API reference before relying on details.
enum class ErrorCode : int32_t

{

 kSUCCESS = 0,


 kUNSPECIFIED_ERROR = 1,


 kINTERNAL_ERROR = 2,


 kINVALID_ARGUMENT = 3,


 kINVALID_CONFIG = 4,


 kFAILED_ALLOCATION = 5,


 kFAILED_INITIALIZATION = 6,


 kFAILED_EXECUTION = 7,


 kFAILED_COMPUTATION = 8,


 kINVALID_STATE = 9,


 kUNSUPPORTED_STATE = 10,


};


namespace impl

{

// Specialization that backs EnumMax<ErrorCode>().
template <>

struct EnumMaxImpl<ErrorCode>

{

 // Number of ErrorCode enumerators (values 0 through 10); keep in step with the enum above.
 static constexpr int32_t kVALUE = 11;

};

} // namespace impl


namespace v_1_0
{
// Versioned interface (kind "IErrorRecorder", version 1.0) for recording errors and reading them back.
// All operations other than getInterfaceInfo() are pure virtual and must be supplied by the implementer.
// NOTE(review): the one-line summaries on the pure virtual methods are inferred from their names and
// signatures only - confirm the exact contracts against the TensorRT API reference.
class IErrorRecorder : public IVersionedInterface
{
public:
    // Return version information associated with this interface.
    InterfaceInfo getInterfaceInfo() const noexcept override
    {
        return InterfaceInfo{"IErrorRecorder", 1, 0};
    }

    // A typedef of a C-style string for reporting error descriptions.
    using ErrorDesc = char const*;

    // Length limit for an error description.
    // NOTE(review): presumably excludes the terminating NUL character - confirm.
    static constexpr size_t kMAX_DESC_LENGTH{127U};

    // A typedef of a 32-bit integer for reference counting.
    using RefCount = int32_t;

    IErrorRecorder() = default;
    ~IErrorRecorder() noexcept override = default;

    // Public API used to retrieve information from the error recorder.

    // Number of errors held by the recorder.
    virtual int32_t getNbErrors() const noexcept = 0;

    // Error code of the entry at index errorIdx.
    virtual ErrorCode getErrorCode(int32_t errorIdx) const noexcept = 0;

    // Description string of the entry at index errorIdx.
    virtual ErrorDesc getErrorDesc(int32_t errorIdx) const noexcept = 0;

    // Whether the recorder has overflowed.
    virtual bool hasOverflowed() const noexcept = 0;

    // Clear the recorder.
    virtual void clear() noexcept = 0;

    // API used by TensorRT to report error information to the application.

    // Report an error code together with its description.
    virtual bool reportError(ErrorCode val, ErrorDesc desc) noexcept = 0;

    // Increment the reference count and return a RefCount value.
    virtual RefCount incRefCount() noexcept = 0;

    // Decrement the reference count and return a RefCount value.
    virtual RefCount decRefCount() noexcept = 0;

protected:
    // @cond SuppressDoxyWarnings
    // Copy and move are protected, so they are reachable only through derived classes.
    // The assignment operators are lvalue-ref-qualified (&).
    IErrorRecorder(IErrorRecorder const&) = default;
    IErrorRecorder(IErrorRecorder&&) = default;
    IErrorRecorder& operator=(IErrorRecorder const&) & = default;
    IErrorRecorder& operator=(IErrorRecorder&&) & = default;
    // @endcond
}; // class IErrorRecorder

} // namespace v_1_0

// Makes the v_1_0 class reachable under the unversioned name IErrorRecorder in the enclosing namespace.
using IErrorRecorder = v_1_0::IErrorRecorder;


// Definition of tensor IO Mode.
enum class TensorIOMode : int32_t

{

 // NOTE(review): presumably "neither an input nor an output" - no description is visible here; confirm.
 kNONE = 0,


 // Tensor is input to the engine.
 kINPUT = 1,


 // Tensor is output by the engine.
 kOUTPUT = 2

};


namespace impl

{

// Specialization that backs EnumMax<TensorIOMode>().
template <>

struct EnumMaxImpl<TensorIOMode>

{

 // Declaration of kVALUE that represents the maximum number of elements in the TensorIOMode enum.

 static constexpr int32_t kVALUE = 3;

};

} // namespace impl

} // namespace nvinfer1


// Return the library version number.
// Declared with C language linkage and noexcept; TENSORRTAPI controls whether the symbol is exported.
extern "C" TENSORRTAPI int32_t getInferLibVersion() noexcept;


#endif // NV_INFER_RUNTIME_BASE_H

TENSORRTAPI
#define TENSORRTAPI
Definition: NvInferRuntimeBase.h:59

getInferLibVersion
int32_t getInferLibVersion() noexcept
返回库版本号。

NvInferVersion.h

nvinfer1::Dims64
Definition: NvInferRuntimeBase.h:203

nvinfer1::Dims64::MAX_DIMS
static constexpr int32_t MAX_DIMS
张量支持的最大秩（维度数量）。
Definition: NvInferRuntimeBase.h:206

nvinfer1::Dims64::d
int64_t d[MAX_DIMS]
每个维度的范围。
Definition: NvInferRuntimeBase.h:212

nvinfer1::Dims64::nbDims
int32_t nbDims
秩（维度数量）。
Definition: NvInferRuntimeBase.h:209

nvinfer1::IVersionedInterface
用于版本控制的接口类。
Definition: NvInferRuntimeBase.h:263

nvinfer1::IVersionedInterface::getInterfaceInfo
virtual InterfaceInfo getInterfaceInfo() const noexcept=0
返回与此接口关联的版本信息。应用程序不得覆盖此方法...

nvinfer1::IVersionedInterface::getAPILanguage
virtual APILanguage getAPILanguage() const noexcept
用于构建此接口实现的语言。
Definition: NvInferRuntimeBase.h:270

nvinfer1::InterfaceInfo
与 TRT 接口关联的版本信息。
Definition: NvInferRuntimeBase.h:228

nvinfer1::InterfaceInfo::kind
InterfaceKind kind
Definition: NvInferRuntimeBase.h:230

nvinfer1::InterfaceInfo::major
int32_t major
Definition: NvInferRuntimeBase.h:231

nvinfer1::InterfaceInfo::minor
int32_t minor
Definition: NvInferRuntimeBase.h:232

nvinfer1::v_1_0::IErrorRecorder
Definition: NvInferRuntimeBase.h:400

nvinfer1::v_1_0::IErrorRecorder::ErrorDesc
char const * ErrorDesc
用于报告错误描述的 C 风格字符串的 typedef。
Definition: NvInferRuntimeBase.h:413

nvinfer1::v_1_0::IErrorRecorder::~IErrorRecorder
~IErrorRecorder() noexcept override=default

nvinfer1::v_1_0::IErrorRecorder::RefCount
int32_t RefCount
用于引用计数的 32 位整数的 typedef。
Definition: NvInferRuntimeBase.h:425

nvinfer1::v_1_0::IErrorRecorder::IErrorRecorder
IErrorRecorder()=default

nvinfer1::v_1_0::IErrorRecorder::getInterfaceInfo
InterfaceInfo getInterfaceInfo() const noexcept override
返回与此接口关联的版本信息。应用程序不得覆盖此方法...
定义: NvInferRuntimeBase.h:405

nvinfer1
TensorRT API 版本 1 的命名空间。

nvinfer1::ErrorCode
ErrorCode
TensorRT 在执行期间可能返回的错误代码。
定义: NvInferRuntimeBase.h:296

nvinfer1::ErrorCode::kUNSUPPORTED_STATE
@ kUNSUPPORTED_STATE

nvinfer1::ErrorCode::kINVALID_STATE
@ kINVALID_STATE

nvinfer1::ErrorCode::kFAILED_INITIALIZATION
@ kFAILED_INITIALIZATION

nvinfer1::ErrorCode::kUNSPECIFIED_ERROR
@ kUNSPECIFIED_ERROR

nvinfer1::ErrorCode::kFAILED_ALLOCATION
@ kFAILED_ALLOCATION

nvinfer1::ErrorCode::kFAILED_COMPUTATION
@ kFAILED_COMPUTATION

nvinfer1::ErrorCode::kINTERNAL_ERROR
@ kINTERNAL_ERROR

nvinfer1::ErrorCode::kFAILED_EXECUTION
@ kFAILED_EXECUTION

nvinfer1::ErrorCode::kSUCCESS
@ kSUCCESS

nvinfer1::ErrorCode::kINVALID_CONFIG
@ kINVALID_CONFIG

nvinfer1::ErrorCode::kINVALID_ARGUMENT
@ kINVALID_ARGUMENT

nvinfer1::TensorIOMode
TensorIOMode
张量 IO 模式的定义。
定义: NvInferRuntimeBase.h:643

nvinfer1::TensorIOMode::kOUTPUT
@ kOUTPUT
张量由引擎输出。

nvinfer1::TensorIOMode::kINPUT
@ kINPUT
张量是引擎的输入。

nvinfer1::APILanguage
APILanguage
在 TRT 接口实现中使用的编程语言。
定义: NvInferRuntimeBase.h:241

nvinfer1::APILanguage::kPYTHON
@ kPYTHON

nvinfer1::APILanguage::kCPP
@ kCPP

nvinfer1::AsciiChar
char_t AsciiChar
定义: NvInferRuntimeBase.h:105

nvinfer1::char_t
char char_t
char_t 是 TensorRT 用于表示所有有效字符的类型。
定义: NvInferRuntimeBase.h:101

nvinfer1::DataType
DataType
权重和张量的类型。
定义: NvInferRuntimeBase.h:133

nvinfer1::DataType::kUINT8
@ kUINT8

nvinfer1::DataType::kINT64
@ kINT64
有符号 64 位整数类型。

nvinfer1::DataType::kFLOAT
@ kFLOAT
32 位浮点格式。

nvinfer1::DataType::kFP4
@ kFP4

nvinfer1::DataType::kBOOL
@ kBOOL
8 位布尔值。0 = false，1 = true，其他值未定义。

nvinfer1::DataType::kHALF
@ kHALF
IEEE 16 位浮点格式 – 具有 5 位指数和 11 位尾数。

nvinfer1::DataType::kINT8
@ kINT8
有符号 8 位整数，表示量化的浮点值。

nvinfer1::DataType::kFP8
@ kFP8

nvinfer1::DataType::kBF16
@ kBF16
Brain float – 具有 8 位指数和 8 位尾数。

nvinfer1::DataType::kINT4
@ kINT4
有符号 4 位整数类型。

nvinfer1::DataType::kINT32
@ kINT32
有符号 32 位整数格式。

nvinfer1::InterfaceKind
char const * InterfaceKind
定义: NvInferRuntimeBase.h:220

nvinfer1::EnumMax
constexpr int32_t EnumMax() noexcept
枚举类型中元素的最大数量。
定义: NvInferRuntimeBase.h:123

nvinfer1::TensorIOMode::kNONE
@ kNONE

nvinfer1::IErrorRecorder
v_1_0::IErrorRecorder IErrorRecorder
定义: NvInferRuntimeBase.h:112

nvinfer1::impl::EnumMaxImpl
EnumMaxImpl 结构的声明，用于存储枚举类型中元素的最大数量。
定义: NvInferRuntimeBase.h:118