// api/c_api/_nv_infer_runtime_8h_source.html

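/*
 * SPDX-FileCopyrightText: Copyright (c) 1993-2024 NVIDIA CORPORATION & AFFILIATES. All rights reserved.
 * SPDX-License-Identifier: Apache-2.0
 *
 * Licensed under the Apache License, Version 2.0 (the "License");
 * you may not use this file except in compliance with the License.
 * You may obtain a copy of the License at
 *
 * http://www.apache.org/licenses/LICENSE-2.0
 *
 * Unless required by applicable law or agreed to in writing, software
 * distributed under the License is distributed on an "AS IS" BASIS,
 * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
 * See the License for the specific language governing permissions and
 * limitations under the License.
 */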


#ifndef NV_INFER_RUNTIME_H

#define NV_INFER_RUNTIME_H


#include "NvInferImpl.h"

#define NV_INFER_INTERNAL_INCLUDE 1

#include "NvInferPluginBase.h"

#undef NV_INFER_INTERNAL_INCLUDE

#include "NvInferRuntimeCommon.h"


namespace nvinfer1

{


// Forward declarations of classes that are referenced by pointer or reference
// before (or without) their full definition appearing in this header.
class IExecutionContext;

class ICudaEngine;

class IPluginFactory;

class IEngineInspector;


//!
//! \class INoCopy
//!
//! \brief Base class that forbids copying and moving of derived objects.
//!
//! All special members are protected, so the class can only be used as a base:
//! derived classes may be default-constructed and destroyed, while copy and
//! move construction/assignment are explicitly deleted.
//!
class INoCopy
{
protected:
    INoCopy() = default;
    virtual ~INoCopy() = default;

    // Copy operations are deleted.
    INoCopy(INoCopy const& other) = delete;
    INoCopy& operator=(INoCopy const& other) = delete;

    // Move operations are deleted as well.
    INoCopy(INoCopy&& other) = delete;
    INoCopy& operator=(INoCopy&& other) = delete;
};


//!
//! \enum EngineCapability
//!
//! \brief Engine capability selector with three explicitly numbered values.
//!
//! The enumerator count must stay in sync with impl::EnumMaxImpl<EngineCapability>.
//!
enum class EngineCapability : int32_t
{
    kSTANDARD = 0,
    kSAFETY = 1,
    kDLA_STANDALONE = 2
};


namespace impl
{
//! Number of enumerators in EngineCapability (kSTANDARD .. kDLA_STANDALONE).
template <>
struct EnumMaxImpl<EngineCapability>
{
    static constexpr int32_t kVALUE{3};
};
} // namespace impl


//!
//! \class Weights
//!
//! \brief Plain aggregate describing a weights buffer: element type, a
//! read-only pointer to the values, and an element count.
//!
//! The class does not manage the memory behind \p values.
//!
class Weights
{
public:
    DataType type;      //!< Type tag of the weights.
    void const* values; //!< Pointer to the (read-only) weight values.
    int64_t count;      //!< Count associated with \p values (presumably number of elements — confirm).
};


//!
//! \class IHostMemory
//!
//! \brief Non-copyable handle whose accessors forward to an
//! apiv::VHostMemory implementation object.
//!
class IHostMemory : public INoCopy
{
public:
    virtual ~IHostMemory() noexcept = default;

    //! Returns the pointer reported by the implementation's data().
    void* data() const noexcept
    {
        return mImpl->data();
    }

    //! Returns the size reported by the implementation's size().
    std::size_t size() const noexcept
    {
        return mImpl->size();
    }

    //! Returns the data type reported by the implementation's type().
    DataType type() const noexcept
    {
        return mImpl->type();
    }

protected:
    apiv::VHostMemory* mImpl; //!< Implementation object; never dereferenced for null here.
};


//!
//! \enum DimensionOperation
//!
//! \brief Operation selector passed to IExprBuilder::operation().
//!
//! Nine enumerators numbered 0..8; EnumMax<DimensionOperation>() must match.
//!
enum class DimensionOperation : int32_t
{
    kSUM = 0,
    kPROD = 1,
    kMAX = 2,
    kMIN = 3,
    kSUB = 4,
    kEQUAL = 5,
    kLESS = 6,
    kFLOOR_DIV = 7,
    kCEIL_DIV = 8,
};


//! Number of enumerators in DimensionOperation (kSUM .. kCEIL_DIV).
template <>
inline constexpr int32_t EnumMax<DimensionOperation>() noexcept
{
    return 9; // kCEIL_DIV (8) + 1
}


//!
//! \enum TensorLocation
//!
//! \brief Two-valued location tag: device (0) or host (1).
//!
enum class TensorLocation : int32_t
{
    kDEVICE = 0,
    kHOST = 1
};


namespace impl
{
//! Number of enumerators in TensorLocation (kDEVICE, kHOST).
template <>
struct EnumMaxImpl<TensorLocation>
{
    static constexpr int32_t kVALUE{2};
};
} // namespace impl


//!
//! \class IDimensionExpr
//!
//! \brief Non-copyable dimension-expression handle; every query forwards to
//! an apiv::VDimensionExpr implementation object.
//!
//! The destructor is protected, so objects cannot be deleted through this
//! interface.
//!
class IDimensionExpr : public INoCopy
{
public:
    //! Forwards to the implementation's isConstant().
    bool isConstant() const noexcept
    {
        return mImpl->isConstant();
    }

    //! Forwards to the implementation's getConstantValue().
    int64_t getConstantValue() const noexcept
    {
        return mImpl->getConstantValue();
    }

protected:
    apiv::VDimensionExpr* mImpl;
    virtual ~IDimensionExpr() noexcept = default;

public:
    //! Forwards to the implementation's isSizeTensor().
    bool isSizeTensor() const noexcept
    {
        return mImpl->isSizeTensor();
    }
};


//!
//! \class IExprBuilder
//!
//! \brief Non-copyable factory for IDimensionExpr objects; every call
//! forwards to an apiv::VExprBuilder implementation object.
//!
//! The destructor is protected, so objects cannot be deleted through this
//! interface.
//!
class IExprBuilder : public INoCopy
{
public:
    //! Returns the expression produced by the implementation's constant(value).
    IDimensionExpr const* constant(int64_t value) noexcept
    {
        return mImpl->constant(value);
    }

    //! Returns the expression produced by the implementation's
    //! operation(op, first, second).
    IDimensionExpr const* operation(
        DimensionOperation op, IDimensionExpr const& first, IDimensionExpr const& second) noexcept
    {
        return mImpl->operation(op, first, second);
    }

protected:
    apiv::VExprBuilder* mImpl;
    virtual ~IExprBuilder() noexcept = default;

public:
    //! Forwards to the implementation's declareSizeTensor(outputIndex, opt, upper).
    //! Note: unlike the other members, this function is not declared noexcept.
    IDimensionExpr const* declareSizeTensor(int32_t outputIndex, IDimensionExpr const& opt, IDimensionExpr const& upper)
    {
        return mImpl->declareSizeTensor(outputIndex, opt, upper);
    }
};


//!
//! \class DimsExprs
//!
//! \brief Aggregate holding a dimension count and a fixed-size array of
//! pointers to dimension expressions.
//!
class DimsExprs
{
public:
    int32_t nbDims;                          //!< Dimension count (presumably the number of valid entries in \p d — confirm).
    IDimensionExpr const* d[Dims::MAX_DIMS]; //!< Expression pointers; capacity is Dims::MAX_DIMS.
};


//!
//! \struct DynamicPluginTensorDesc
//!
//! \brief Aggregate that pairs a PluginTensorDesc with three Dims values
//! named min, max and opt.
//!
struct DynamicPluginTensorDesc
{
    PluginTensorDesc desc; //!< Tensor description.
    Dims min;              //!< "min" dimensions.
    Dims max;              //!< "max" dimensions.
    Dims opt;              //!< "opt" dimensions.
};


//!
//! \class IPluginV2DynamicExt
//!
//! \brief Deprecated plugin interface derived from IPluginV2Ext.
//!
//! Declares the pure-virtual hooks implementers must provide, and privately
//! overrides (as final) the base-class methods that are obsolete for this
//! interface so they can be neither implemented nor called by derived classes.
//!
class TRT_DEPRECATED IPluginV2DynamicExt : public nvinfer1::IPluginV2Ext
{
public:
    //! Covariant clone; must be implemented by the plugin.
    IPluginV2DynamicExt* clone() const noexcept override = 0;

    //! Computes the output dimensions for \p outputIndex as expressions, using
    //! \p exprBuilder and the \p nbInputs entries of \p inputs.
    virtual DimsExprs getOutputDimensions(
        int32_t outputIndex, DimsExprs const* inputs, int32_t nbInputs, IExprBuilder& exprBuilder) noexcept = 0;

    //! Constant limit associated with format combinations.
    static constexpr int32_t kFORMAT_COMBINATION_LIMIT = 100;

    //! Reports whether the combination described by \p inOut at position
    //! \p pos is supported.
    virtual bool supportsFormatCombination(
        int32_t pos, PluginTensorDesc const* inOut, int32_t nbInputs, int32_t nbOutputs) noexcept = 0;

    //! Configures the plugin from dynamic input/output descriptions.
    virtual void configurePlugin(DynamicPluginTensorDesc const* in, int32_t nbInputs,
        DynamicPluginTensorDesc const* out, int32_t nbOutputs) noexcept = 0;

    //! Returns the workspace size for the given input/output descriptions.
    virtual size_t getWorkspaceSize(PluginTensorDesc const* inputs, int32_t nbInputs, PluginTensorDesc const* outputs,
        int32_t nbOutputs) const noexcept = 0;

    //! Enqueues the plugin's work on \p stream.
    virtual int32_t enqueue(PluginTensorDesc const* inputDesc, PluginTensorDesc const* outputDesc,
        void const* const* inputs, void* const* outputs, void* workspace, cudaStream_t stream) noexcept = 0;

protected:
    //! Packs PluginVersion::kV2_DYNAMICEXT into the top 8 bits and the low
    //! 24 bits of NV_TENSORRT_VERSION into the rest.
    int32_t getTensorRTVersion() const noexcept override
    {
        return (static_cast<int32_t>(PluginVersion::kV2_DYNAMICEXT) << 24 | (NV_TENSORRT_VERSION & 0xFFFFFF));
    }

    virtual ~IPluginV2DynamicExt() noexcept {}

private:
    // Following are obsolete base class methods, and must not be implemented or used.

    //! Obsolete; does nothing.
    void configurePlugin(Dims const*, int32_t, Dims const*, int32_t, DataType const*, DataType const*, bool const*,
        bool const*, PluginFormat, int32_t) noexcept override final
    {
    }

    //! Obsolete; always returns false.
    bool supportsFormat(DataType, PluginFormat) const noexcept override final
    {
        return false;
    }

    //! Obsolete; always returns Dims{-1, {}}.
    Dims getOutputDimensions(int32_t, Dims const*, int32_t) noexcept override final
    {
        return Dims{-1, {}};
    }

    //! Obsolete; always returns false.
    TRT_DEPRECATED bool isOutputBroadcastAcrossBatch(int32_t, bool const*, int32_t) const noexcept override final
    {
        return false;
    }

    //! Obsolete; always returns true.
    TRT_DEPRECATED bool canBroadcastInputAcrossBatch(int32_t) const noexcept override final
    {
        return true;
    }

    //! Obsolete; always returns 0.
    size_t getWorkspaceSize(int32_t) const noexcept override final
    {
        return 0;
    }

    //! Obsolete; always returns 1.
    int32_t enqueue(int32_t, void const* const*, void* const*, void*, cudaStream_t) noexcept override final
    {
        return 1;
    }
};


namespace v_1_0
{
//!
//! \class IStreamReader
//!
//! \brief Versioned application-implemented interface with a single
//! pure-virtual read() hook.
//!
//! Copy and move operations are protected so that only derived classes can
//! use them.
//!
class IStreamReader : public IVersionedInterface
{
public:
    ~IStreamReader() override = default;
    IStreamReader() = default;

    //! Identifies this interface as "IStreamReader", version 1.0.
    InterfaceInfo getInterfaceInfo() const noexcept override
    {
        return InterfaceInfo{"IStreamReader", 1, 0};
    }

    //! Reads up to \p nbBytes into \p destination and returns an int64_t
    //! result (presumably the number of bytes read — confirm).
    //! Note: not declared noexcept.
    virtual int64_t read(void* destination, int64_t nbBytes) = 0;

protected:
    IStreamReader(IStreamReader const&) = default;
    IStreamReader(IStreamReader&&) = default;
    IStreamReader& operator=(IStreamReader const&) & = default;
    IStreamReader& operator=(IStreamReader&&) & = default;
};
} // namespace v_1_0

//! Unversioned alias for the v_1_0 stream reader interface.
using IStreamReader = v_1_0::IStreamReader;


//!
//! \enum SeekPosition
//!
//! \brief Origin selector passed as the \p where argument of
//! IStreamReaderV2::seek().
//!
enum class SeekPosition : int32_t
{
    kSET = 0,
    kCUR = 1,
    kEND = 2
};


namespace v_1_0
{
//!
//! \class IStreamReaderV2
//!
//! \brief Versioned application-implemented interface with pure-virtual
//! read() (taking a CUDA stream) and seek() hooks.
//!
//! Copy and move operations are protected so that only derived classes can
//! use them.
//!
class IStreamReaderV2 : public IVersionedInterface
{
public:
    ~IStreamReaderV2() override = default;
    IStreamReaderV2() = default;

    //! Identifies this interface as "IStreamReaderV2", version 1.0.
    InterfaceInfo getInterfaceInfo() const noexcept override
    {
        return InterfaceInfo{"IStreamReaderV2", 1, 0};
    }

    //! Reads up to \p nbBytes into \p destination, given \p stream; returns an
    //! int64_t result (presumably the number of bytes read — confirm).
    virtual int64_t read(void* destination, int64_t nbBytes, cudaStream_t stream) noexcept = 0;

    //! Repositions the reader by \p offset relative to \p where; returns a
    //! bool result (presumably success — confirm).
    virtual bool seek(int64_t offset, SeekPosition where) noexcept = 0;

protected:
    IStreamReaderV2(IStreamReaderV2 const&) = default;
    IStreamReaderV2(IStreamReaderV2&&) = default;
    IStreamReaderV2& operator=(IStreamReaderV2 const&) & = default;
    IStreamReaderV2& operator=(IStreamReaderV2&&) & = default;
};
} // namespace v_1_0

//! Unversioned alias for the v_1_0 V2 stream reader interface.
using IStreamReaderV2 = v_1_0::IStreamReaderV2;


//!
//! \class IPluginResourceContext
//!
//! \brief Abstract interface giving access to a GPU allocator and an error
//! recorder.
//!
//! Construction, copy and move are protected, so the class is only usable as
//! a base.
//!
class IPluginResourceContext
{
public:
    //! Returns the GPU allocator associated with this context.
    virtual IGpuAllocator* getGpuAllocator() const noexcept = 0;

    //! Returns the error recorder associated with this context.
    virtual IErrorRecorder* getErrorRecorder() const noexcept = 0;
    virtual ~IPluginResourceContext() noexcept = default;

protected:
    IPluginResourceContext() = default;
    IPluginResourceContext(IPluginResourceContext const&) = default;
    IPluginResourceContext(IPluginResourceContext&&) = default;
    IPluginResourceContext& operator=(IPluginResourceContext const&) & = default;
    IPluginResourceContext& operator=(IPluginResourceContext&&) & = default;
};


namespace v_1_0
{
//!
//! \class IPluginV3OneCore
//!
//! \brief Plugin capability exposing the plugin's name, version and namespace.
//!
class IPluginV3OneCore : public IPluginCapability
{
public:
    //! Identifies this interface as "PLUGIN_V3ONE_CORE", version 1.0.
    InterfaceInfo getInterfaceInfo() const noexcept override
    {
        return InterfaceInfo{"PLUGIN_V3ONE_CORE", 1, 0};
    }

    //! Returns the plugin name.
    virtual AsciiChar const* getPluginName() const noexcept = 0;

    //! Returns the plugin version.
    virtual AsciiChar const* getPluginVersion() const noexcept = 0;

    //! Returns the plugin namespace.
    virtual AsciiChar const* getPluginNamespace() const noexcept = 0;
};

//!
//! \class IPluginV3OneBuild
//!
//! \brief Plugin capability with build-related hooks.
//!
//! Five hooks are pure virtual; the remaining ones have default bodies that
//! return 0, nullptr, or kDEFAULT_FORMAT_COMBINATION_LIMIT.
//!
class IPluginV3OneBuild : public IPluginCapability
{
public:
    //! Value returned by the default getFormatCombinationLimit().
    static constexpr int32_t kDEFAULT_FORMAT_COMBINATION_LIMIT = 100;

    //! Identifies this interface as "PLUGIN_V3ONE_BUILD", version 1.0.
    InterfaceInfo getInterfaceInfo() const noexcept override
    {
        return InterfaceInfo{"PLUGIN_V3ONE_BUILD", 1, 0};
    }

    //! Configures the plugin from dynamic input/output descriptions; returns an
    //! int32_t status.
    virtual int32_t configurePlugin(DynamicPluginTensorDesc const* in, int32_t nbInputs,
        DynamicPluginTensorDesc const* out, int32_t nbOutputs) noexcept = 0;

    //! Writes the output data types into \p outputTypes given \p inputTypes;
    //! returns an int32_t status.
    virtual int32_t getOutputDataTypes(
        DataType* outputTypes, int32_t nbOutputs, const DataType* inputTypes, int32_t nbInputs) const noexcept = 0;

    //! Writes the output shape expressions into \p outputs using
    //! \p exprBuilder; returns an int32_t status.
    virtual int32_t getOutputShapes(DimsExprs const* inputs, int32_t nbInputs, DimsExprs const* shapeInputs,
        int32_t nbShapeInputs, DimsExprs* outputs, int32_t nbOutputs, IExprBuilder& exprBuilder) noexcept = 0;

    //! Reports whether the combination described by \p inOut at position
    //! \p pos is supported.
    virtual bool supportsFormatCombination(
        int32_t pos, DynamicPluginTensorDesc const* inOut, int32_t nbInputs, int32_t nbOutputs) noexcept = 0;

    //! Returns the number of outputs.
    virtual int32_t getNbOutputs() const noexcept = 0;

    //! Default implementation ignores its arguments and returns 0.
    virtual size_t getWorkspaceSize(DynamicPluginTensorDesc const* inputs, int32_t nbInputs,
        DynamicPluginTensorDesc const* outputs, int32_t nbOutputs) const noexcept
    {
        return 0;
    }

    //! Default implementation ignores its arguments and returns 0.
    virtual int32_t getValidTactics(int32_t* tactics, int32_t nbTactics) noexcept
    {
        return 0;
    }

    //! Default implementation returns 0.
    virtual int32_t getNbTactics() noexcept
    {
        return 0;
    }

    //! Default implementation returns nullptr.
    virtual char const* getTimingCacheID() noexcept
    {
        return nullptr;
    }

    //! Default implementation returns kDEFAULT_FORMAT_COMBINATION_LIMIT.
    virtual int32_t getFormatCombinationLimit() noexcept
    {
        return kDEFAULT_FORMAT_COMBINATION_LIMIT;
    }

    //! Default implementation returns nullptr.
    virtual char const* getMetadataString() noexcept
    {
        return nullptr;
    }
};

//!
//! \class IPluginV3OneRuntime
//!
//! \brief Plugin capability with runtime-related hooks.
//!
class IPluginV3OneRuntime : public IPluginCapability
{
public:
    //! Identifies this interface as "PLUGIN_V3ONE_RUNTIME", version 1.0.
    InterfaceInfo getInterfaceInfo() const noexcept override
    {
        return InterfaceInfo{"PLUGIN_V3ONE_RUNTIME", 1, 0};
    }

    //! Default implementation ignores \p tactic and returns 0.
    virtual int32_t setTactic(int32_t tactic) noexcept
    {
        return 0;
    }

    //! Called with the input/output descriptions; returns an int32_t status.
    virtual int32_t onShapeChange(
        PluginTensorDesc const* in, int32_t nbInputs, PluginTensorDesc const* out, int32_t nbOutputs) noexcept = 0;

    //! Enqueues the plugin's work on \p stream; returns an int32_t status.
    virtual int32_t enqueue(PluginTensorDesc const* inputDesc, PluginTensorDesc const* outputDesc,
        void const* const* inputs, void* const* outputs, void* workspace, cudaStream_t stream) noexcept = 0;

    //! Returns a plugin object for the given resource context.
    virtual IPluginV3* attachToContext(IPluginResourceContext* context) noexcept = 0;

    //! Returns the collection of fields to serialize.
    virtual PluginFieldCollection const* getFieldsToSerialize() noexcept = 0;
};
} // namespace v_1_0


namespace v_2_0
{

//!
//! \class IPluginV3OneBuild
//!
//! \brief Version 2.0 of the build capability; extends
//! v_1_0::IPluginV3OneBuild with getAliasedInput().
//!
class IPluginV3OneBuild : public v_1_0::IPluginV3OneBuild
{
public:
    //! Identifies this interface as "PLUGIN_V3ONE_BUILD", version 2.0.
    InterfaceInfo getInterfaceInfo() const noexcept override
    {
        return InterfaceInfo{"PLUGIN_V3ONE_BUILD", 2, 0};
    }

    //! Default implementation ignores \p outputIndex and returns -1.
    virtual int32_t getAliasedInput(int32_t outputIndex) noexcept
    {
        return -1;
    }
};

} // namespace v_2_0


// Unversioned alias for the v_1_0 core capability.
using IPluginV3OneCore = v_1_0::IPluginV3OneCore;


// Unversioned alias for the v_1_0 build capability.
using IPluginV3OneBuild = v_1_0::IPluginV3OneBuild;


// Unversioned alias for the v_1_0 runtime capability.
using IPluginV3OneRuntime = v_1_0::IPluginV3OneRuntime;


// Alias exposing the v_2_0 build capability under a distinct "V2" name.
using IPluginV3OneBuildV2 = v_2_0::IPluginV3OneBuild;


namespace v_1_0
{
//!
//! \class IProfiler
//!
//! \brief Application-implemented callback interface that receives a layer
//! name together with a time value in milliseconds.
//!
class IProfiler
{
public:
    //! Callback receiving \p layerName and its time \p ms.
    virtual void reportLayerTime(char const* layerName, float ms) noexcept = 0;

    virtual ~IProfiler() noexcept {}
};
} // namespace v_1_0

//! Unversioned alias for the v_1_0 profiler interface.
using IProfiler = v_1_0::IProfiler;


//!
//! \enum WeightsRole
//!
//! \brief Role tag for weights, used by the IRefitter role-based API.
//!
//! Six enumerators numbered 0..5; EnumMax<WeightsRole>() must match.
//!
enum class WeightsRole : int32_t
{
    kKERNEL = 0,
    kBIAS = 1,
    kSHIFT = 2,
    kSCALE = 3,
    kCONSTANT = 4,
    kANY = 5
};


//! Number of enumerators in WeightsRole (kKERNEL .. kANY).
template <>
inline constexpr int32_t EnumMax<WeightsRole>() noexcept
{
    return 6; // kANY (5) + 1
}


//!
//! \enum DeviceType
//!
//! \brief Two-valued device tag: GPU (0) or DLA (1).
//!
enum class DeviceType : int32_t
{
    kGPU = 0,
    kDLA = 1
};


//! Number of enumerators in DeviceType (kGPU, kDLA).
template <>
inline constexpr int32_t EnumMax<DeviceType>() noexcept
{
    return 2; // kDLA (1) + 1
}


//!
//! \enum TempfileControlFlag
//!
//! \brief Flags naming the two kinds of temporary files that may be allowed:
//! in-memory files (0) and temporary files (1).
//!
enum class TempfileControlFlag : int32_t
{
    kALLOW_IN_MEMORY_FILES = 0,
    kALLOW_TEMPORARY_FILES = 1
};


//! Number of enumerators in TempfileControlFlag.
template <>
inline constexpr int32_t EnumMax<TempfileControlFlag>() noexcept
{
    return 2; // kALLOW_TEMPORARY_FILES (1) + 1
}

//! Unsigned 32-bit type used by IRuntime::setTempfileControlFlags() /
//! getTempfileControlFlags() (presumably a bitmask of TempfileControlFlag
//! values — confirm).
using TempfileControlFlags = uint32_t;


//!
//! \enum TensorFormat
//!
//! \brief Tensor format tag.
//!
//! Thirteen enumerators numbered 0..12; impl::EnumMaxImpl<TensorFormat> must
//! match.
//!
enum class TensorFormat : int32_t
{
    kLINEAR = 0,
    kCHW2 = 1,
    kHWC8 = 2,
    kCHW4 = 3,
    kCHW16 = 4,
    kCHW32 = 5,
    kDHWC8 = 6,
    kCDHW32 = 7,
    kHWC = 8,
    kDLA_LINEAR = 9,
    kDLA_HWC4 = 10,
    kHWC16 = 11,
    kDHWC = 12,
};


namespace impl
{
//! Number of enumerators in TensorFormat (kLINEAR .. kDHWC).
template <>
struct EnumMaxImpl<TensorFormat>
{
    static constexpr int32_t kVALUE{13};
};
} // namespace impl


//!
//! \enum AllocatorFlag
//!
//! \brief Allocator flag; currently a single enumerator, kRESIZABLE (0).
//!
enum class AllocatorFlag : int32_t
{
    kRESIZABLE = 0
};


namespace impl
{
//! Number of enumerators in AllocatorFlag.
template <>
struct EnumMaxImpl<AllocatorFlag>
{
    static constexpr int32_t kVALUE{1};
};
} // namespace impl

//! Unsigned 32-bit type used for the \p flags argument of the IGpuAllocator
//! allocation functions (presumably a bitmask of AllocatorFlag values — confirm).
using AllocatorFlags = uint32_t;


//!
//! \class ILogger
//!
//! \brief Application-implemented logging interface with a single
//! pure-virtual log() callback.
//!
//! Copy and move operations are protected so that only derived classes can
//! use them.
//!
class ILogger
{
public:
    //!
    //! \enum Severity
    //!
    //! \brief Severity tag passed to log(); five enumerators numbered 0..4.
    //!
    enum class Severity : int32_t
    {
        kINTERNAL_ERROR = 0,
        kERROR = 1,
        kWARNING = 2,
        kINFO = 3,
        kVERBOSE = 4,
    };

    //! Callback receiving a message \p msg together with its \p severity.
    virtual void log(Severity severity, AsciiChar const* msg) noexcept = 0;

    ILogger() = default;
    virtual ~ILogger() = default;

protected:
    // @cond SuppressDoxyWarnings
    ILogger(ILogger const&) = default;
    ILogger(ILogger&&) = default;
    ILogger& operator=(ILogger const&) & = default;
    ILogger& operator=(ILogger&&) & = default;
    // @endcond
};


namespace impl
{
//! Number of enumerators in ILogger::Severity (kINTERNAL_ERROR .. kVERBOSE).
template <>
struct EnumMaxImpl<ILogger::Severity>
{
    static constexpr int32_t kVALUE{5};
};
} // namespace impl


namespace v_1_0
{

//!
//! \class IGpuAllocator
//!
//! \brief Versioned application-implemented allocator interface.
//!
//! allocate() and deallocate() are pure virtual (and marked deprecated). The
//! asynchronous variants have default bodies that ignore the stream and call
//! the synchronous functions; reallocate() defaults to returning nullptr.
//! Copy and move operations are protected.
//!
class IGpuAllocator : public IVersionedInterface
{
public:
    //! Allocates \p size bytes with the given \p alignment and \p flags.
    TRT_DEPRECATED virtual void* allocate(
        uint64_t const size, uint64_t const alignment, AllocatorFlags const flags) noexcept = 0;

    ~IGpuAllocator() override = default;
    IGpuAllocator() = default;

    //! Default implementation ignores its arguments and returns nullptr.
    virtual void* reallocate(void* const /*baseAddr*/, uint64_t /*alignment*/, uint64_t /*newSize*/) noexcept
    {
        return nullptr;
    }

    //! Releases \p memory; returns a bool result (presumably success — confirm).
    TRT_DEPRECATED virtual bool deallocate(void* const memory) noexcept = 0;

    //! Default implementation ignores the stream and forwards to
    //! allocate(size, alignment, flags).
    virtual void* allocateAsync(
        uint64_t const size, uint64_t const alignment, AllocatorFlags const flags, cudaStream_t /*stream*/) noexcept
    {
        return allocate(size, alignment, flags);
    }

    //! Default implementation ignores the stream and forwards to
    //! deallocate(memory).
    virtual bool deallocateAsync(void* const memory, cudaStream_t /*stream*/) noexcept
    {
        return deallocate(memory);
    }

    //! Identifies this interface as "IGpuAllocator", version 1.0.
    InterfaceInfo getInterfaceInfo() const noexcept override
    {
        return {"IGpuAllocator", 1, 0};
    }

protected:
    // @cond SuppressDoxyWarnings
    IGpuAllocator(IGpuAllocator const&) = default;
    IGpuAllocator(IGpuAllocator&&) = default;
    IGpuAllocator& operator=(IGpuAllocator const&) & = default;
    IGpuAllocator& operator=(IGpuAllocator&&) & = default;
    // @endcond
};

} // namespace v_1_0

//! Unversioned alias for the v_1_0 GPU allocator interface.
using IGpuAllocator = v_1_0::IGpuAllocator;


//!
//! \class IRuntime
//!
//! \brief Non-copyable runtime handle. Every member is a thin inline wrapper
//! that forwards its arguments to the apiv::VRuntime implementation object
//! and returns whatever that call returns.
//!
class IRuntime : public INoCopy
{
public:
    virtual ~IRuntime() noexcept = default;

    //! Forwards to mImpl->setDLACore(dlaCore).
    void setDLACore(int32_t dlaCore) noexcept { mImpl->setDLACore(dlaCore); }

    //! Forwards to mImpl->getDLACore().
    int32_t getDLACore() const noexcept { return mImpl->getDLACore(); }

    //! Forwards to mImpl->getNbDLACores().
    int32_t getNbDLACores() const noexcept { return mImpl->getNbDLACores(); }

    //! Forwards to mImpl->setGpuAllocator(allocator).
    void setGpuAllocator(IGpuAllocator* allocator) noexcept { mImpl->setGpuAllocator(allocator); }

    //! Forwards to mImpl->setErrorRecorder(recorder).
    void setErrorRecorder(IErrorRecorder* recorder) noexcept { mImpl->setErrorRecorder(recorder); }

    //! Forwards to mImpl->getErrorRecorder().
    IErrorRecorder* getErrorRecorder() const noexcept { return mImpl->getErrorRecorder(); }

    //! Deserializes an engine from the \p size bytes at \p blob; forwards to
    //! mImpl->deserializeCudaEngine(blob, size).
    ICudaEngine* deserializeCudaEngine(void const* blob, std::size_t size) noexcept
    {
        return mImpl->deserializeCudaEngine(blob, size);
    }

    //! Deprecated overload taking an IStreamReader; forwards to
    //! mImpl->deserializeCudaEngine(streamReader). Not declared noexcept.
    TRT_DEPRECATED ICudaEngine* deserializeCudaEngine(IStreamReader& streamReader)
    {
        return mImpl->deserializeCudaEngine(streamReader);
    }

    //! Overload taking an IStreamReaderV2; forwards to
    //! mImpl->deserializeCudaEngineV2(streamReader). Not declared noexcept.
    ICudaEngine* deserializeCudaEngine(IStreamReaderV2& streamReader)
    {
        return mImpl->deserializeCudaEngineV2(streamReader);
    }

    //! Forwards to mImpl->getLogger().
    ILogger* getLogger() const noexcept { return mImpl->getLogger(); }

    //! Forwards to mImpl->setMaxThreads(maxThreads).
    bool setMaxThreads(int32_t maxThreads) noexcept { return mImpl->setMaxThreads(maxThreads); }

    //! Forwards to mImpl->getMaxThreads().
    int32_t getMaxThreads() const noexcept { return mImpl->getMaxThreads(); }

    //! Forwards to mImpl->setTemporaryDirectory(path).
    void setTemporaryDirectory(char const* path) noexcept { return mImpl->setTemporaryDirectory(path); }

    //! Forwards to mImpl->getTemporaryDirectory().
    char const* getTemporaryDirectory() const noexcept { return mImpl->getTemporaryDirectory(); }

    //! Forwards to mImpl->setTempfileControlFlags(flags).
    void setTempfileControlFlags(TempfileControlFlags flags) noexcept
    {
        return mImpl->setTempfileControlFlags(flags);
    }

    //! Forwards to mImpl->getTempfileControlFlags().
    TempfileControlFlags getTempfileControlFlags() const noexcept { return mImpl->getTempfileControlFlags(); }

    //! Forwards to mImpl->getPluginRegistry().
    IPluginRegistry& getPluginRegistry() noexcept { return mImpl->getPluginRegistry(); }

    //! Forwards to mImpl->loadRuntime(path).
    IRuntime* loadRuntime(char const* path) noexcept { return mImpl->loadRuntime(path); }

    //! Forwards to mImpl->setEngineHostCodeAllowed(allowed).
    void setEngineHostCodeAllowed(bool allowed) noexcept { return mImpl->setEngineHostCodeAllowed(allowed); }

    //! Forwards to mImpl->getEngineHostCodeAllowed().
    bool getEngineHostCodeAllowed() const noexcept { return mImpl->getEngineHostCodeAllowed(); }

protected:
    apiv::VRuntime* mImpl; //!< Implementation object all calls are forwarded to.
};


//!
//! \class IRefitter
//!
//! \brief Non-copyable refitter handle. Every member is a thin inline wrapper
//! that forwards its arguments to the apiv::VRefitter implementation object
//! and returns whatever that call returns.
//!
class IRefitter : public INoCopy
{
public:
    virtual ~IRefitter() noexcept = default;

    //! Forwards to mImpl->setWeights(layerName, role, weights).
    bool setWeights(char const* layerName, WeightsRole role, Weights weights) noexcept
    {
        return mImpl->setWeights(layerName, role, weights);
    }

    //! Forwards to mImpl->refitCudaEngine().
    bool refitCudaEngine() noexcept { return mImpl->refitCudaEngine(); }

    //! Forwards to mImpl->getMissing(size, layerNames, roles).
    int32_t getMissing(int32_t size, char const** layerNames, WeightsRole* roles) noexcept
    {
        return mImpl->getMissing(size, layerNames, roles);
    }

    //! Forwards to mImpl->getAll(size, layerNames, roles).
    int32_t getAll(int32_t size, char const** layerNames, WeightsRole* roles) noexcept
    {
        return mImpl->getAll(size, layerNames, roles);
    }

    //! Deprecated. Forwards to mImpl->setDynamicRange(tensorName, min, max).
    TRT_DEPRECATED bool setDynamicRange(char const* tensorName, float min, float max) noexcept
    {
        return mImpl->setDynamicRange(tensorName, min, max);
    }

    //! Deprecated. Forwards to mImpl->getDynamicRangeMin(tensorName).
    TRT_DEPRECATED float getDynamicRangeMin(char const* tensorName) const noexcept
    {
        return mImpl->getDynamicRangeMin(tensorName);
    }

    //! Deprecated. Forwards to mImpl->getDynamicRangeMax(tensorName).
    TRT_DEPRECATED float getDynamicRangeMax(char const* tensorName) const noexcept
    {
        return mImpl->getDynamicRangeMax(tensorName);
    }

    //! Deprecated. Forwards to mImpl->getTensorsWithDynamicRange(size, tensorNames).
    TRT_DEPRECATED int32_t getTensorsWithDynamicRange(int32_t size, char const** tensorNames) const noexcept
    {
        return mImpl->getTensorsWithDynamicRange(size, tensorNames);
    }

    //! Forwards to mImpl->setErrorRecorder(recorder).
    void setErrorRecorder(IErrorRecorder* recorder) noexcept { mImpl->setErrorRecorder(recorder); }

    //! Forwards to mImpl->getErrorRecorder().
    IErrorRecorder* getErrorRecorder() const noexcept { return mImpl->getErrorRecorder(); }

    //! Forwards to mImpl->setNamedWeights(name, weights).
    bool setNamedWeights(char const* name, Weights weights) noexcept
    {
        return mImpl->setNamedWeights(name, weights);
    }

    //! Forwards to mImpl->getMissingWeights(size, weightsNames).
    int32_t getMissingWeights(int32_t size, char const** weightsNames) noexcept
    {
        return mImpl->getMissingWeights(size, weightsNames);
    }

    //! Forwards to mImpl->getAllWeights(size, weightsNames).
    int32_t getAllWeights(int32_t size, char const** weightsNames) noexcept
    {
        return mImpl->getAllWeights(size, weightsNames);
    }

    //! Forwards to mImpl->getLogger().
    ILogger* getLogger() const noexcept { return mImpl->getLogger(); }

    //! Forwards to mImpl->setMaxThreads(maxThreads).
    bool setMaxThreads(int32_t maxThreads) noexcept { return mImpl->setMaxThreads(maxThreads); }

    //! Forwards to mImpl->getMaxThreads().
    int32_t getMaxThreads() const noexcept { return mImpl->getMaxThreads(); }

    //! Overload with an explicit location; forwards to
    //! mImpl->setNamedWeightsWithLocation(name, weights, location).
    bool setNamedWeights(char const* name, Weights weights, TensorLocation location) noexcept
    {
        return mImpl->setNamedWeightsWithLocation(name, weights, location);
    }

    //! Forwards to mImpl->getNamedWeights(weightsName).
    Weights getNamedWeights(char const* weightsName) const noexcept { return mImpl->getNamedWeights(weightsName); }

    //! Forwards to mImpl->getWeightsLocation(weightsName).
    TensorLocation getWeightsLocation(char const* weightsName) const noexcept
    {
        return mImpl->getWeightsLocation(weightsName);
    }

    //! Forwards to mImpl->unsetNamedWeights(weightsName).
    bool unsetNamedWeights(char const* weightsName) noexcept { return mImpl->unsetNamedWeights(weightsName); }

    //! Forwards to mImpl->setWeightsValidation(weightsValidation).
    void setWeightsValidation(bool weightsValidation) noexcept
    {
        return mImpl->setWeightsValidation(weightsValidation);
    }

    //! Forwards to mImpl->getWeightsValidation().
    bool getWeightsValidation() const noexcept { return mImpl->getWeightsValidation(); }

    //! Forwards to mImpl->refitCudaEngineAsync(stream).
    bool refitCudaEngineAsync(cudaStream_t stream) noexcept { return mImpl->refitCudaEngineAsync(stream); }

    //! Forwards to mImpl->getWeightsPrototype(weightsName).
    Weights getWeightsPrototype(char const* weightsName) const noexcept
    {
        return mImpl->getWeightsPrototype(weightsName);
    }

protected:
    apiv::VRefitter* mImpl; //!< Implementation object all calls are forwarded to.
};


//!
//! \enum OptProfileSelector
//!
//! \brief Selector choosing between the min (0), opt (1) and max (2) values
//! of an optimization profile.
//!
enum class OptProfileSelector : int32_t
{
    kMIN = 0,
    kOPT = 1,
    kMAX = 2,
};


//! Number of enumerators in OptProfileSelector (kMIN, kOPT, kMAX).
template <>
inline constexpr int32_t EnumMax<OptProfileSelector>() noexcept
{
    return 3; // kMAX (2) + 1
}


//!
//! \class IOptimizationProfile
//!
//! \brief Non-copyable optimization-profile handle. Every member is a thin
//! inline wrapper that forwards to the apiv::VOptimizationProfile
//! implementation object.
//!
//! The destructor is protected, so objects cannot be deleted through this
//! interface.
//!
class IOptimizationProfile : public INoCopy
{
public:
    //! Forwards to mImpl->setDimensions(inputName, select, dims).
    bool setDimensions(char const* inputName, OptProfileSelector select, Dims const& dims) noexcept
    {
        return mImpl->setDimensions(inputName, select, dims);
    }

    //! Forwards to mImpl->getDimensions(inputName, select).
    Dims getDimensions(char const* inputName, OptProfileSelector select) const noexcept
    {
        return mImpl->getDimensions(inputName, select);
    }

    //! Forwards to mImpl->setShapeValues(inputName, select, values, nbValues).
    bool setShapeValues(
        char const* inputName, OptProfileSelector select, int32_t const* values, int32_t nbValues) noexcept
    {
        return mImpl->setShapeValues(inputName, select, values, nbValues);
    }

    //! Forwards to mImpl->getNbShapeValues(inputName).
    int32_t getNbShapeValues(char const* inputName) const noexcept { return mImpl->getNbShapeValues(inputName); }

    //! Forwards to mImpl->getShapeValues(inputName, select).
    int32_t const* getShapeValues(char const* inputName, OptProfileSelector select) const noexcept
    {
        return mImpl->getShapeValues(inputName, select);
    }

    //! Forwards to mImpl->setExtraMemoryTarget(target).
    bool setExtraMemoryTarget(float target) noexcept { return mImpl->setExtraMemoryTarget(target); }

    //! Forwards to mImpl->getExtraMemoryTarget().
    float getExtraMemoryTarget() const noexcept { return mImpl->getExtraMemoryTarget(); }

    //! Forwards to mImpl->isValid().
    bool isValid() const noexcept { return mImpl->isValid(); }

protected:
    apiv::VOptimizationProfile* mImpl; //!< Implementation object all calls are forwarded to.
    virtual ~IOptimizationProfile() noexcept = default;
};


//!
//! \enum TacticSource
//!
//! \brief Tactic source tag.
//!
//! Five enumerators numbered 0..4; the first three carry the
//! TRT_DEPRECATED_ENUM marker. EnumMax<TacticSource>() must match the count.
//!
enum class TacticSource : int32_t
{
    kCUBLAS TRT_DEPRECATED_ENUM = 0,
    kCUBLAS_LT TRT_DEPRECATED_ENUM = 1,
    kCUDNN TRT_DEPRECATED_ENUM = 2,
    kEDGE_MASK_CONVOLUTIONS = 3,
    kJIT_CONVOLUTIONS = 4
};


//! Number of enumerators in TacticSource (kCUBLAS .. kJIT_CONVOLUTIONS).
template <>
inline constexpr int32_t EnumMax<TacticSource>() noexcept
{
    return 5; // kJIT_CONVOLUTIONS (4) + 1
}

//! Unsigned 32-bit type returned by ICudaEngine::getTacticSources()
//! (presumably a bitmask of TacticSource values — confirm).
using TacticSources = uint32_t;


//!
//! \enum ProfilingVerbosity
//!
//! \brief Profiling verbosity level: layer names only (0), none (1) or
//! detailed (2).
//!
enum class ProfilingVerbosity : int32_t
{
    kLAYER_NAMES_ONLY = 0,
    kNONE = 1,
    kDETAILED = 2
};


//! Number of enumerators in ProfilingVerbosity.
template <>
inline constexpr int32_t EnumMax<ProfilingVerbosity>() noexcept
{
    return 3; // kDETAILED (2) + 1
}


//! Unsigned 32-bit type used by ISerializationConfig::setFlags() / getFlags()
//! (presumably a bitmask of SerializationFlag values — confirm).
using SerializationFlags = uint32_t;

//!
//! \enum SerializationFlag
//!
//! \brief Individual serialization flag: exclude weights (0) or exclude the
//! lean runtime (1).
//!
enum class SerializationFlag : int32_t
{
    kEXCLUDE_WEIGHTS = 0,
    kEXCLUDE_LEAN_RUNTIME = 1
};


//! Number of enumerators in SerializationFlag.
template <>
inline constexpr int32_t EnumMax<SerializationFlag>() noexcept
{
    return 2; // kEXCLUDE_LEAN_RUNTIME (1) + 1
}


//!
//! \class ISerializationConfig
//!
//! \brief Non-copyable serialization-configuration handle. Every member is a
//! thin inline wrapper that forwards to the apiv::VSerializationConfig
//! implementation object.
//!
class ISerializationConfig : public INoCopy
{
public:
    virtual ~ISerializationConfig() noexcept = default;

    //! Forwards to mImpl->setFlags(serializationFlags).
    bool setFlags(SerializationFlags serializationFlags) noexcept { return mImpl->setFlags(serializationFlags); }

    //! Forwards to mImpl->getFlags().
    SerializationFlags getFlags() const noexcept { return mImpl->getFlags(); }

    //! Forwards to mImpl->clearFlag(serializationFlag).
    bool clearFlag(SerializationFlag serializationFlag) noexcept { return mImpl->clearFlag(serializationFlag); }

    //! Forwards to mImpl->setFlag(serializationFlag).
    bool setFlag(SerializationFlag serializationFlag) noexcept { return mImpl->setFlag(serializationFlag); }

    //! Forwards to mImpl->getFlag(serializationFlag).
    bool getFlag(SerializationFlag serializationFlag) const noexcept { return mImpl->getFlag(serializationFlag); }

protected:
    apiv::VSerializationConfig* mImpl; //!< Implementation object all calls are forwarded to.
};


//!
//! \enum ExecutionContextAllocationStrategy
//!
//! \brief Strategy selector accepted by ICudaEngine::createExecutionContext(),
//! whose default argument is kSTATIC.
//!
enum class ExecutionContextAllocationStrategy : int32_t
{
    kSTATIC = 0,
    kON_PROFILE_CHANGE = 1,
    kUSER_MANAGED = 2
};


//! Number of enumerators in ExecutionContextAllocationStrategy.
template <>
inline constexpr int32_t EnumMax<ExecutionContextAllocationStrategy>() noexcept
{
    return 3; // kUSER_MANAGED (2) + 1
}


//!
//! \class ICudaEngine
//!
//! \brief Non-copyable engine handle. Every member is a thin inline wrapper
//! that forwards its arguments to the apiv::VCudaEngine implementation object
//! and returns whatever that call returns.
//!
//! Overloads that additionally take a \p profileIndex forward to the
//! implementation function with a "V2" suffix.
//!
class ICudaEngine : public INoCopy
{
public:
    virtual ~ICudaEngine() noexcept = default;

    //! Forwards to mImpl->getTensorShape(tensorName).
    Dims getTensorShape(char const* tensorName) const noexcept { return mImpl->getTensorShape(tensorName); }

    //! Forwards to mImpl->getTensorDataType(tensorName).
    DataType getTensorDataType(char const* tensorName) const noexcept
    {
        return mImpl->getTensorDataType(tensorName);
    }

    //! Forwards to mImpl->getNbLayers().
    int32_t getNbLayers() const noexcept { return mImpl->getNbLayers(); }

    //! Forwards to mImpl->serialize().
    IHostMemory* serialize() const noexcept { return mImpl->serialize(); }

    //! Forwards to mImpl->createExecutionContext(strategy); \p strategy
    //! defaults to ExecutionContextAllocationStrategy::kSTATIC.
    IExecutionContext* createExecutionContext(
        ExecutionContextAllocationStrategy strategy = ExecutionContextAllocationStrategy::kSTATIC) noexcept
    {
        return mImpl->createExecutionContext(strategy);
    }

    //! Forwards to mImpl->getTensorLocation(tensorName).
    TensorLocation getTensorLocation(char const* tensorName) const noexcept
    {
        return mImpl->getTensorLocation(tensorName);
    }

    //! Forwards to mImpl->isShapeInferenceIO(tensorName).
    bool isShapeInferenceIO(char const* tensorName) const noexcept { return mImpl->isShapeInferenceIO(tensorName); }

    //! Forwards to mImpl->getTensorIOMode(tensorName).
    TensorIOMode getTensorIOMode(char const* tensorName) const noexcept { return mImpl->getTensorIOMode(tensorName); }

    //! Deprecated. Forwards to mImpl->createExecutionContextWithoutDeviceMemory().
    TRT_DEPRECATED IExecutionContext* createExecutionContextWithoutDeviceMemory() noexcept
    {
        return mImpl->createExecutionContextWithoutDeviceMemory();
    }

    //! Deprecated. Forwards to mImpl->getDeviceMemorySize().
    TRT_DEPRECATED size_t getDeviceMemorySize() const noexcept { return mImpl->getDeviceMemorySize(); }

    //! Deprecated. Forwards to mImpl->getDeviceMemorySizeForProfile(profileIndex).
    TRT_DEPRECATED size_t getDeviceMemorySizeForProfile(int32_t profileIndex) const noexcept
    {
        return mImpl->getDeviceMemorySizeForProfile(profileIndex);
    }

    //! Forwards to mImpl->getDeviceMemorySizeV2().
    int64_t getDeviceMemorySizeV2() const noexcept { return mImpl->getDeviceMemorySizeV2(); }

    //! Forwards to mImpl->getDeviceMemorySizeForProfileV2(profileIndex).
    int64_t getDeviceMemorySizeForProfileV2(int32_t profileIndex) const noexcept
    {
        return mImpl->getDeviceMemorySizeForProfileV2(profileIndex);
    }

    //! Forwards to mImpl->isRefittable().
    bool isRefittable() const noexcept { return mImpl->isRefittable(); }

    //! Forwards to mImpl->getTensorBytesPerComponent(tensorName).
    int32_t getTensorBytesPerComponent(char const* tensorName) const noexcept
    {
        return mImpl->getTensorBytesPerComponent(tensorName);
    }

    //! Forwards to mImpl->getTensorBytesPerComponentV2(tensorName, profileIndex).
    int32_t getTensorBytesPerComponent(char const* tensorName, int32_t profileIndex) const noexcept
    {
        return mImpl->getTensorBytesPerComponentV2(tensorName, profileIndex);
    }

    //! Forwards to mImpl->getTensorComponentsPerElement(tensorName).
    int32_t getTensorComponentsPerElement(char const* tensorName) const noexcept
    {
        return mImpl->getTensorComponentsPerElement(tensorName);
    }

    //! Forwards to mImpl->getTensorComponentsPerElementV2(tensorName, profileIndex).
    int32_t getTensorComponentsPerElement(char const* tensorName, int32_t profileIndex) const noexcept
    {
        return mImpl->getTensorComponentsPerElementV2(tensorName, profileIndex);
    }

    //! Forwards to mImpl->getTensorFormat(tensorName).
    TensorFormat getTensorFormat(char const* tensorName) const noexcept { return mImpl->getTensorFormat(tensorName); }

    //! Forwards to mImpl->getTensorFormatV2(tensorName, profileIndex).
    TensorFormat getTensorFormat(char const* tensorName, int32_t profileIndex) const noexcept
    {
        return mImpl->getTensorFormatV2(tensorName, profileIndex);
    }

    //! Forwards to mImpl->getTensorFormatDesc(tensorName).
    char const* getTensorFormatDesc(char const* tensorName) const noexcept
    {
        return mImpl->getTensorFormatDesc(tensorName);
    }

    //! Forwards to mImpl->getTensorFormatDescV2(tensorName, profileIndex).
    char const* getTensorFormatDesc(char const* tensorName, int32_t profileIndex) const noexcept
    {
        return mImpl->getTensorFormatDescV2(tensorName, profileIndex);
    }

    //! Forwards to mImpl->getTensorVectorizedDim(tensorName).
    int32_t getTensorVectorizedDim(char const* tensorName) const noexcept
    {
        return mImpl->getTensorVectorizedDim(tensorName);
    }

    //! Forwards to mImpl->getTensorVectorizedDimV2(tensorName, profileIndex).
    int32_t getTensorVectorizedDim(char const* tensorName, int32_t profileIndex) const noexcept
    {
        return mImpl->getTensorVectorizedDimV2(tensorName, profileIndex);
    }

    //! Forwards to mImpl->getName().
    char const* getName() const noexcept { return mImpl->getName(); }

    //! Forwards to mImpl->getNbOptimizationProfiles().
    int32_t getNbOptimizationProfiles() const noexcept { return mImpl->getNbOptimizationProfiles(); }

    //! Forwards to mImpl->getProfileShape(tensorName, profileIndex, select).
    Dims getProfileShape(char const* tensorName, int32_t profileIndex, OptProfileSelector select) const noexcept
    {
        return mImpl->getProfileShape(tensorName, profileIndex, select);
    }

    //! Forwards to mImpl->getProfileTensorValues(tensorName, profileIndex, select).
    int32_t const* getProfileTensorValues(char const* tensorName, int32_t profileIndex, OptProfileSelector select) const
        noexcept
    {
        return mImpl->getProfileTensorValues(tensorName, profileIndex, select);
    }

    //! Forwards to mImpl->getEngineCapability().
    EngineCapability getEngineCapability() const noexcept { return mImpl->getEngineCapability(); }

    //! Forwards to mImpl->setErrorRecorder(recorder).
    void setErrorRecorder(IErrorRecorder* recorder) noexcept { return mImpl->setErrorRecorder(recorder); }

    //! Forwards to mImpl->getErrorRecorder().
    IErrorRecorder* getErrorRecorder() const noexcept { return mImpl->getErrorRecorder(); }

    //! Deprecated. Forwards to mImpl->hasImplicitBatchDimension().
    TRT_DEPRECATED bool hasImplicitBatchDimension() const noexcept { return mImpl->hasImplicitBatchDimension(); }

    //! Forwards to mImpl->getTacticSources().
    TacticSources getTacticSources() const noexcept { return mImpl->getTacticSources(); }

    //! Forwards to mImpl->getProfilingVerbosity().
    ProfilingVerbosity getProfilingVerbosity() const noexcept { return mImpl->getProfilingVerbosity(); }

    //! Forwards to mImpl->createEngineInspector().
    IEngineInspector* createEngineInspector() const noexcept { return mImpl->createEngineInspector(); }

    //! Forwards to mImpl->getNbIOTensors().
    int32_t getNbIOTensors() const noexcept { return mImpl->getNbIOTensors(); }

    //! Forwards to mImpl->getIOTensorName(index).
    char const* getIOTensorName(int32_t index) const noexcept { return mImpl->getIOTensorName(index); }

    //! Forwards to mImpl->getHardwareCompatibilityLevel().
    HardwareCompatibilityLevel getHardwareCompatibilityLevel() const noexcept
    {
        return mImpl->getHardwareCompatibilityLevel();
    }

    //! Forwards to mImpl->getNbAuxStreams().
    int32_t getNbAuxStreams() const noexcept { return mImpl->getNbAuxStreams(); }

    //! Forwards to mImpl->createSerializationConfig().
    ISerializationConfig* createSerializationConfig() noexcept { return mImpl->createSerializationConfig(); }

    //! Forwards to mImpl->serializeWithConfig(config).
    IHostMemory* serializeWithConfig(ISerializationConfig& config) const noexcept
    {
        return mImpl->serializeWithConfig(config);
    }

    //! Deprecated. Forwards to mImpl->setWeightStreamingBudget(gpuMemoryBudget).
    TRT_DEPRECATED bool setWeightStreamingBudget(int64_t gpuMemoryBudget) noexcept
    {
        return mImpl->setWeightStreamingBudget(gpuMemoryBudget);
    }

    //! Deprecated. Forwards to mImpl->getWeightStreamingBudget().
    TRT_DEPRECATED int64_t getWeightStreamingBudget() const noexcept { return mImpl->getWeightStreamingBudget(); }

    //! Deprecated. Forwards to mImpl->getMinimumWeightStreamingBudget().
    TRT_DEPRECATED int64_t getMinimumWeightStreamingBudget() const noexcept
    {
        return mImpl->getMinimumWeightStreamingBudget();
    }

    //! Forwards to mImpl->getStreamableWeightsSize().
    int64_t getStreamableWeightsSize() const noexcept { return mImpl->getStreamableWeightsSize(); }

    //! Forwards to mImpl->setWeightStreamingBudgetV2(gpuMemoryBudget).
    bool setWeightStreamingBudgetV2(int64_t gpuMemoryBudget) noexcept
    {
        return mImpl->setWeightStreamingBudgetV2(gpuMemoryBudget);
    }

    //! Forwards to mImpl->getWeightStreamingBudgetV2().
    int64_t getWeightStreamingBudgetV2() const noexcept { return mImpl->getWeightStreamingBudgetV2(); }

    //! Forwards to mImpl->getWeightStreamingAutomaticBudget().
    int64_t getWeightStreamingAutomaticBudget() const noexcept { return mImpl->getWeightStreamingAutomaticBudget(); }

    //! Forwards to mImpl->getWeightStreamingScratchMemorySize().
    int64_t getWeightStreamingScratchMemorySize() const noexcept
    {
        return mImpl->getWeightStreamingScratchMemorySize();
    }

    //! Forwards to mImpl->isDebugTensor(name).
    bool isDebugTensor(char const* name) const noexcept { return mImpl->isDebugTensor(name); }

protected:
    apiv::VCudaEngine* mImpl; //!< Implementation object all calls are forwarded to.
};


namespace v_1_0
{
//!
//! \class IOutputAllocator
//!
//! \brief Versioned application-implemented interface for output
//! (re)allocation callbacks plus a shape notification.
//!
class IOutputAllocator : public IVersionedInterface
{
public:
    //! Identifies this interface as "IOutputAllocator", version 1.0.
    InterfaceInfo getInterfaceInfo() const noexcept override
    {
        return {"IOutputAllocator", 1, 0};
    }

    //! Deprecated. Default implementation ignores its arguments and returns
    //! nullptr.
    TRT_DEPRECATED virtual void* reallocateOutput(
        char const* tensorName, void* currentMemory, uint64_t size, uint64_t alignment) noexcept
    {
        return nullptr;
    }

    //! Default implementation ignores the stream and forwards to
    //! reallocateOutput(tensorName, currentMemory, size, alignment).
    //! Note: not declared noexcept.
    virtual void* reallocateOutputAsync(
        char const* tensorName, void* currentMemory, uint64_t size, uint64_t alignment, cudaStream_t /*stream*/)
    {
        return reallocateOutput(tensorName, currentMemory, size, alignment);
    }

    //! Callback receiving the dimensions \p dims for the tensor \p tensorName.
    virtual void notifyShape(char const* tensorName, Dims const& dims) noexcept = 0;
};
} // namespace v_1_0

//! Unversioned alias for the v_1_0 output allocator interface.
using IOutputAllocator = v_1_0::IOutputAllocator;


namespace v_1_0
{
//!
//! \class IDebugListener
//!
//! \brief Versioned application-implemented interface with a single
//! pure-virtual processDebugTensor() callback.
//!
class IDebugListener : public IVersionedInterface
{
public:
    //! Identifies this interface as "IDebugListener", version 1.0.
    InterfaceInfo getInterfaceInfo() const noexcept override
    {
        return {"IDebugListener", 1, 0};
    }

    //! Callback receiving a debug tensor: its address, location, data type,
    //! shape, name and a CUDA stream. Returns a bool result (presumably
    //! success — confirm). Note: not declared noexcept.
    virtual bool processDebugTensor(void const* addr, TensorLocation location, DataType type, Dims const& shape,
        char const* name, cudaStream_t stream)
        = 0;

    ~IDebugListener() override = default;
};
} // namespace v_1_0

//! Unversioned alias for the v_1_0 debug listener interface.
using IDebugListener = v_1_0::IDebugListener;


//! \brief Context for executing inference using an engine, with functionally unsafe features.
//!
//! Every member function is a thin inline wrapper that forwards its arguments unchanged to the
//! implementation object mImpl and returns whatever that object returns.
class IExecutionContext : public INoCopy
{
public:
    virtual ~IExecutionContext() noexcept = default;

    //! \brief Set the debug sync flag.
    void setDebugSync(bool sync) noexcept
    {
        mImpl->setDebugSync(sync);
    }

    //! \brief Get the debug sync flag.
    bool getDebugSync() const noexcept
    {
        return mImpl->getDebugSync();
    }

    //! \brief Set the profiler.
    void setProfiler(IProfiler* profiler) noexcept
    {
        mImpl->setProfiler(profiler);
    }

    //! \brief Get the profiler.
    IProfiler* getProfiler() const noexcept
    {
        return mImpl->getProfiler();
    }

    //! \brief Get the associated engine.
    ICudaEngine const& getEngine() const noexcept
    {
        return mImpl->getEngine();
    }

    //! \brief Set the name of the execution context.
    void setName(char const* name) noexcept
    {
        mImpl->setName(name);
    }

    //! \brief Return the name of the execution context.
    char const* getName() const noexcept
    {
        return mImpl->getName();
    }

    //! \brief Set the device memory for use by this execution context.
    void setDeviceMemory(void* memory) noexcept
    {
        mImpl->setDeviceMemory(memory);
    }

    //! \brief Set the device memory and its corresponding size for use by this execution context.
    void setDeviceMemoryV2(void* memory, int64_t size) noexcept
    {
        // Plain call (no `return`), matching the other void setters of this class.
        mImpl->setDeviceMemoryV2(memory, size);
    }

    //! \brief Return the strides of the buffer for the given tensor name.
    Dims getTensorStrides(char const* tensorName) const noexcept
    {
        return mImpl->getTensorStrides(tensorName);
    }

    //! \brief Get the index of the currently selected optimization profile.
    int32_t getOptimizationProfile() const noexcept
    {
        return mImpl->getOptimizationProfile();
    }

    //! \brief Set the shape of the given input.
    bool setInputShape(char const* tensorName, Dims const& dims) noexcept
    {
        return mImpl->setInputShape(tensorName, dims);
    }

    //! \brief Return the shape of the given input or output.
    Dims getTensorShape(char const* tensorName) const noexcept
    {
        return mImpl->getTensorShape(tensorName);
    }

    //! \brief Whether all dynamic dimensions of input tensors have been specified.
    bool allInputDimensionsSpecified() const noexcept
    {
        return mImpl->allInputDimensionsSpecified();
    }

    //! \brief Whether all input shape bindings have been specified (deprecated).
    TRT_DEPRECATED bool allInputShapesSpecified() const noexcept
    {
        return mImpl->allInputShapesSpecified();
    }

    //! \brief Set the ErrorRecorder for this interface.
    void setErrorRecorder(IErrorRecorder* recorder) noexcept
    {
        mImpl->setErrorRecorder(recorder);
    }

    //! \brief Get the ErrorRecorder assigned to this interface.
    IErrorRecorder* getErrorRecorder() const noexcept
    {
        return mImpl->getErrorRecorder();
    }

    //! \brief Synchronously execute a network.
    bool executeV2(void* const* bindings) noexcept
    {
        return mImpl->executeV2(bindings);
    }

    //! \brief Select an optimization profile for the current context with async semantics.
    bool setOptimizationProfileAsync(int32_t profileIndex, cudaStream_t stream) noexcept
    {
        return mImpl->setOptimizationProfileAsync(profileIndex, stream);
    }

    //! \brief Set whether enqueue emits layer timing to the profiler.
    void setEnqueueEmitsProfile(bool enqueueEmitsProfile) noexcept
    {
        mImpl->setEnqueueEmitsProfile(enqueueEmitsProfile);
    }

    //! \brief Get the enqueueEmitsProfile state.
    bool getEnqueueEmitsProfile() const noexcept
    {
        return mImpl->getEnqueueEmitsProfile();
    }

    //! \brief Calculate layer timing info for the current optimization profile and report it
    //! through the implementation object.
    bool reportToProfiler() const noexcept
    {
        return mImpl->reportToProfiler();
    }

    //! \brief Set the memory address for the given input or output tensor.
    bool setTensorAddress(char const* tensorName, void* data) noexcept
    {
        return mImpl->setTensorAddress(tensorName, data);
    }

    //! \brief Get the memory address bound to the given input or output tensor.
    void const* getTensorAddress(char const* tensorName) const noexcept
    {
        return mImpl->getTensorAddress(tensorName);
    }

    //! \brief Set the memory address for the given output tensor.
    bool setOutputTensorAddress(char const* tensorName, void* data) noexcept
    {
        return mImpl->setOutputTensorAddress(tensorName, data);
    }

    //! \brief Set the memory address for the given input.
    bool setInputTensorAddress(char const* tensorName, void const* data) noexcept
    {
        return mImpl->setInputTensorAddress(tensorName, data);
    }

    //! \brief Get the memory address for the given output.
    void* getOutputTensorAddress(char const* tensorName) const noexcept
    {
        return mImpl->getOutputTensorAddress(tensorName);
    }

    //! \brief Run shape calculations.
    int32_t inferShapes(int32_t nbMaxNames, char const** tensorNames) noexcept
    {
        return mImpl->inferShapes(nbMaxNames, tensorNames);
    }

    //! \brief Recompute the internal activation buffer sizes based on the current input shapes.
    size_t updateDeviceMemorySizeForShapes() noexcept
    {
        return mImpl->updateDeviceMemorySizeForShapes();
    }

    //! \brief Mark input as consumed.
    bool setInputConsumedEvent(cudaEvent_t event) noexcept
    {
        return mImpl->setInputConsumedEvent(event);
    }

    //! \brief Return the event associated with consuming the input.
    cudaEvent_t getInputConsumedEvent() const noexcept
    {
        return mImpl->getInputConsumedEvent();
    }

    //! \brief Set the output allocator to use for the output tensor of the given name.
    bool setOutputAllocator(char const* tensorName, IOutputAllocator* outputAllocator) noexcept
    {
        return mImpl->setOutputAllocator(tensorName, outputAllocator);
    }

    //! \brief Get the output allocator associated with the output tensor of the given name.
    IOutputAllocator* getOutputAllocator(char const* tensorName) const noexcept
    {
        return mImpl->getOutputAllocator(tensorName);
    }

    //! \brief Get an upper bound on an output tensor's size, in bytes.
    int64_t getMaxOutputSize(char const* tensorName) const noexcept
    {
        return mImpl->getMaxOutputSize(tensorName);
    }

    //! \brief Specify the allocator to use for internal temporary storage.
    bool setTemporaryStorageAllocator(IGpuAllocator* allocator) noexcept
    {
        return mImpl->setTemporaryStorageAllocator(allocator);
    }

    //! \brief Get the allocator set by setTemporaryStorageAllocator().
    IGpuAllocator* getTemporaryStorageAllocator() const noexcept
    {
        return mImpl->getTemporaryStorageAllocator();
    }

    //! \brief Enqueue inference on a stream.
    bool enqueueV3(cudaStream_t stream) noexcept
    {
        return mImpl->enqueueV3(stream);
    }

    //! \brief Set the maximum size for persistent cache usage.
    void setPersistentCacheLimit(size_t size) noexcept
    {
        mImpl->setPersistentCacheLimit(size);
    }

    //! \brief Get the maximum size for persistent cache usage.
    size_t getPersistentCacheLimit() const noexcept
    {
        return mImpl->getPersistentCacheLimit();
    }

    //! \brief Set the verbosity of the NVTX markers in the execution context.
    bool setNvtxVerbosity(ProfilingVerbosity verbosity) noexcept
    {
        return mImpl->setNvtxVerbosity(verbosity);
    }

    //! \brief Get the NVTX verbosity of the execution context.
    ProfilingVerbosity getNvtxVerbosity() const noexcept
    {
        return mImpl->getNvtxVerbosity();
    }

    //! \brief Set the auxiliary streams that TensorRT should launch kernels on in the next enqueueV3() call.
    void setAuxStreams(cudaStream_t* auxStreams, int32_t nbStreams) noexcept
    {
        mImpl->setAuxStreams(auxStreams, nbStreams);
    }

    //! \brief Set the DebugListener for this execution context.
    bool setDebugListener(IDebugListener* listener) noexcept
    {
        return mImpl->setDebugListener(listener);
    }

    //! \brief Get the DebugListener of this execution context.
    //!
    //! Note: unlike the other getters of this class, this member function is not const.
    IDebugListener* getDebugListener() noexcept
    {
        return mImpl->getDebugListener();
    }

    //! \brief Set the debug state of the tensor with the given name.
    bool setTensorDebugState(char const* name, bool flag) noexcept
    {
        return mImpl->setTensorDebugState(name, flag);
    }

    //! \brief Forward \p flag to the implementation's setAllTensorsDebugState()
    //! (presumably the debug state applied to every tensor -- confirm).
    bool setAllTensorsDebugState(bool flag) noexcept
    {
        return mImpl->setAllTensorsDebugState(flag);
    }

    //! \brief Forward \p name to the implementation's getDebugState()
    //! (presumably the debug state of that tensor -- confirm).
    bool getDebugState(char const* name) const noexcept
    {
        return mImpl->getDebugState(name);
    }

protected:
    //! Implementation object that every wrapper above forwards to.
    apiv::VExecutionContext* mImpl;
}; // class IExecutionContext


//! \brief Format selector taken by IEngineInspector::getLayerInformation() and
//! IEngineInspector::getEngineInformation().
enum class LayerInformationFormat : int32_t
{
    //! Numeric value 0 (presumably a one-line textual form, judging by the name -- confirm).
    kONELINE = 0,
    //! Numeric value 1 (presumably JSON output, judging by the name -- confirm).
    kJSON = 1
};


//! \brief EnumMax specialization giving the number of LayerInformationFormat enumerators.
template <>
constexpr inline int32_t EnumMax<LayerInformationFormat>() noexcept
{
    // kJSON (value 1) is the last enumerator, so the count is one past it, i.e. 2.
    return static_cast<int32_t>(LayerInformationFormat::kJSON) + 1;
}


//! \brief An engine inspector which prints out the layer information of an engine or an execution context.
//!
//! Every member function is a thin inline wrapper that forwards its arguments unchanged to the
//! implementation object mImpl and returns whatever that object returns.
class IEngineInspector : public INoCopy
{
public:
    virtual ~IEngineInspector() noexcept = default;

    //! \brief Hand an execution context to the inspector.
    //!
    //! \return The flag reported by the implementation object (presumably true on success -- confirm).
    bool setExecutionContext(IExecutionContext const* context) noexcept
    {
        return mImpl->setExecutionContext(context);
    }

    //! \brief Get the context currently being inspected.
    IExecutionContext const* getExecutionContext() const noexcept
    {
        return mImpl->getExecutionContext();
    }

    //! \brief Get a string describing the information about a specific layer in the current
    //! engine or the execution context.
    char const* getLayerInformation(int32_t layerIndex, LayerInformationFormat format) const noexcept
    {
        return mImpl->getLayerInformation(layerIndex, format);
    }

    //! \brief Get a string describing the information about all the layers in the current
    //! engine or the execution context.
    char const* getEngineInformation(LayerInformationFormat format) const noexcept
    {
        return mImpl->getEngineInformation(format);
    }

    //! \brief Set the ErrorRecorder for this interface.
    void setErrorRecorder(IErrorRecorder* recorder) noexcept
    {
        mImpl->setErrorRecorder(recorder);
    }

    //! \brief Get the ErrorRecorder assigned to this interface.
    IErrorRecorder* getErrorRecorder() const noexcept
    {
        return mImpl->getErrorRecorder();
    }

protected:
    //! Implementation object that every wrapper above forwards to.
    apiv::VEngineInspector* mImpl;
}; // class IEngineInspector


} // namespace nvinfer1


// C-linkage entry points, grouped in a single linkage-specification block.
extern "C"
{
//! Untyped factory; nvinfer1::createInferRuntime() calls it and casts the result to IRuntime*.
TENSORRTAPI void* createInferRuntime_INTERNAL(void* logger, int32_t version) noexcept;

//! Untyped factory; nvinfer1::createInferRefitter() calls it and casts the result to IRefitter*.
TENSORRTAPI void* createInferRefitter_INTERNAL(void* engine, void* logger, int32_t version) noexcept;

//! Return the plugin registry.
TENSORRTAPI nvinfer1::IPluginRegistry* getPluginRegistry() noexcept;

//! Return the logger object.
TENSORRTAPI nvinfer1::ILogger* getLogger() noexcept;
} // extern "C"


namespace nvinfer1

{

// The unnamed namespace avoids linkage surprises when linking objects built with different
// versions of this header.
namespace
{

//! \brief Create an IRuntime for the given logger.
//!
//! Passes the logger's address and NV_TENSORRT_VERSION to createInferRuntime_INTERNAL() and
//! casts the untyped result to IRuntime*.
inline IRuntime* createInferRuntime(ILogger& logger) noexcept
{
    void* const rawRuntime = createInferRuntime_INTERNAL(&logger, NV_TENSORRT_VERSION);
    return static_cast<IRuntime*>(rawRuntime);
}

//! \brief Create an IRefitter for the given engine and logger.
//!
//! Passes both addresses and NV_TENSORRT_VERSION to createInferRefitter_INTERNAL() and casts
//! the untyped result to IRefitter*.
inline IRefitter* createInferRefitter(ICudaEngine& engine, ILogger& logger) noexcept
{
    void* const rawRefitter = createInferRefitter_INTERNAL(&engine, &logger, NV_TENSORRT_VERSION);
    return static_cast<IRefitter*>(rawRefitter);
}

} // namespace


//! \brief Helper whose constructor registers a creator of type T with the plugin registry.
//!
//! \tparam T Creator type; it must be default-constructible and accepted by
//! IPluginRegistry::registerCreator().
template <typename T>
class PluginRegistrar
{
public:
    //! Register the owned creator instance under the empty plugin namespace "".
    //! The return value of registerCreator() is not checked.
    PluginRegistrar()
    {
        getPluginRegistry()->registerCreator(instance, "");
    }

private:
    //! Creator handed to the registry; value-initialized.
    T instance{};
};


} // namespace nvinfer1


//! \brief Define a static nvinfer1::PluginRegistrar<name> object named pluginRegistrar<name>.
//!
//! The replacement text must directly follow the backslash continuation: a blank line after the
//! backslash would end the macro with an empty body and leave the declaration (including the
//! `##` operator) stranded at file scope. The macro supplies no trailing semicolon; the user
//! writes it at the point of use.
#define REGISTER_TENSORRT_PLUGIN(name) \
    static nvinfer1::PluginRegistrar<name> pluginRegistrar##name {}


namespace nvinfer1

{

//! \brief A virtual base class to find a logger. Allows a plugin to find an instance of a
//! logger if it needs one.
class ILoggerFinder
{
public:
    //! \brief Get the logger used by the engine or execution context which called the plugin method.
    virtual ILogger* findLogger() = 0;

protected:
    //! Protected destructor: instances cannot be deleted through an ILoggerFinder pointer
    //! from outside the class hierarchy.
    virtual ~ILoggerFinder() = default;
};


namespace v_1_0

{


//! \brief IGpuAllocator specialization in which the stream-taking functions are the ones to implement.
//!
//! allocateAsync() and deallocateAsync() are re-declared pure virtual here, while the deprecated
//! stream-less allocate() and deallocate() are implemented on top of them.
class IGpuAsyncAllocator : public IGpuAllocator
{
public:
    IGpuAsyncAllocator() = default;
    ~IGpuAsyncAllocator() override = default;

    //! \brief Pure-virtual allocation hook taking size, alignment, flags and a CUDA stream.
    void* allocateAsync(uint64_t const size, uint64_t const alignment, AllocatorFlags const flags,
        cudaStream_t /*stream*/) noexcept override = 0;

    //! \brief Pure-virtual deallocation hook taking the memory pointer and a CUDA stream.
    bool deallocateAsync(void* const memory, cudaStream_t /*stream*/) noexcept override = 0;

    //! \brief Deprecated stream-less allocation; calls allocateAsync() with a nullptr stream.
    TRT_DEPRECATED void* allocate(
        uint64_t const size, uint64_t const alignment, AllocatorFlags const flags) noexcept override
    {
        return allocateAsync(size, alignment, flags, nullptr);
    }

    //! \brief Deprecated stream-less deallocation; calls deallocateAsync() with a nullptr stream.
    TRT_DEPRECATED bool deallocate(void* const memory) noexcept override
    {
        return deallocateAsync(memory, nullptr);
    }

    //! \brief Report the interface name and version (1, 0).
    //!
    //! Note that the reported name is "IGpuAllocator", not "IGpuAsyncAllocator".
    InterfaceInfo getInterfaceInfo() const noexcept override
    {
        return {"IGpuAllocator", 1, 0};
    }
};


//! \brief Plugin creator interface that produces IPluginV3 objects.
//!
//! Construction and destruction are public; copy and move operations are protected, so only
//! derived classes can use them.
class IPluginCreatorV3One : public IPluginCreatorInterface
{
public:
    //! \brief Report the interface kind ("PLUGIN CREATOR_V3ONE") and version (1, 0).
    InterfaceInfo getInterfaceInfo() const noexcept override
    {
        return InterfaceInfo{"PLUGIN CREATOR_V3ONE", 1, 0};
    }

    //! \brief Pure-virtual factory returning an IPluginV3 for the given name, field collection
    //! and TensorRT phase.
    virtual IPluginV3* createPlugin(
        AsciiChar const* name, PluginFieldCollection const* fc, TensorRTPhase phase) noexcept = 0;

    //! \brief Pure-virtual accessor returning a PluginFieldCollection pointer.
    virtual PluginFieldCollection const* getFieldNames() noexcept = 0;

    //! \brief Pure-virtual accessor for the plugin name.
    virtual AsciiChar const* getPluginName() const noexcept = 0;

    //! \brief Pure-virtual accessor for the plugin version.
    virtual AsciiChar const* getPluginVersion() const noexcept = 0;

    //! \brief Pure-virtual accessor for the plugin namespace.
    virtual AsciiChar const* getPluginNamespace() const noexcept = 0;

    IPluginCreatorV3One() = default;
    virtual ~IPluginCreatorV3One() = default;

protected:
    IPluginCreatorV3One(IPluginCreatorV3One const&) = default;
    IPluginCreatorV3One(IPluginCreatorV3One&&) = default;
    // The assignment operators are lvalue-ref-qualified: assigning to a temporary is rejected.
    IPluginCreatorV3One& operator=(IPluginCreatorV3One const&) & = default;
    IPluginCreatorV3One& operator=(IPluginCreatorV3One&&) & = default;
};


} // namespace v_1_0


// Unversioned alias for v_1_0::IGpuAsyncAllocator in the enclosing nvinfer1 namespace.
using IGpuAsyncAllocator = v_1_0::IGpuAsyncAllocator;


// Unversioned alias for v_1_0::IPluginCreatorV3One in the enclosing nvinfer1 namespace.
using IPluginCreatorV3One = v_1_0::IPluginCreatorV3One;


} // namespace nvinfer1


// C-linkage library version queries, grouped in a single linkage-specification block.
extern "C"
{
//! Return the library major version number.
TENSORRTAPI int32_t getInferLibMajorVersion() noexcept;
//! Return the library minor version number.
TENSORRTAPI int32_t getInferLibMinorVersion() noexcept;
//! Return the library patch version number.
TENSORRTAPI int32_t getInferLibPatchVersion() noexcept;
//! Return the library build version number.
TENSORRTAPI int32_t getInferLibBuildVersion() noexcept;
} // extern "C"


#endif // NV_INFER_RUNTIME_H

NvInferImpl.h

NvInferPluginBase.h

getLogger
nvinfer1::ILogger * getLogger() noexcept
返回 logger 对象。

getInferLibMajorVersion
int32_t getInferLibMajorVersion() noexcept
返回库主版本号。

getPluginRegistry
nvinfer1::IPluginRegistry * getPluginRegistry() noexcept
返回插件注册表。

getInferLibPatchVersion
int32_t getInferLibPatchVersion() noexcept
返回库补丁版本号。

getInferLibMinorVersion
int32_t getInferLibMinorVersion() noexcept
返回库次版本号。

getInferLibBuildVersion
int32_t getInferLibBuildVersion() noexcept
返回库构建版本号。

TENSORRTAPI
#define TENSORRTAPI
定义: NvInferRuntimeBase.h:59

NV_TENSORRT_VERSION
#define NV_TENSORRT_VERSION
定义: NvInferRuntimeBase.h:91

TRT_DEPRECATED
#define TRT_DEPRECATED
定义: NvInferRuntimeBase.h:45

TRT_DEPRECATED_ENUM
#define TRT_DEPRECATED_ENUM
定义: NvInferRuntimeBase.h:46

NvInferRuntimeCommon.h

Dims
定义张量维度的结构体。

nvinfer1::Dims64
定义: NvInferRuntimeBase.h:203

nvinfer1::Dims64::MAX_DIMS
static constexpr int32_t MAX_DIMS
张量支持的最大秩（维度数量）。
定义: NvInferRuntimeBase.h:206

nvinfer1::DimsExprs
与 Dims 类相对应的类型，使用表达式代替常量来表示维度。
定义: NvInferRuntime.h:350

nvinfer1::DimsExprs::d
IDimensionExpr const * d[Dims::MAX_DIMS]
每个维度的范围。
定义: NvInferRuntime.h:353

nvinfer1::DimsExprs::nbDims
int32_t nbDims
维度的数量。
定义: NvInferRuntime.h:352

nvinfer1::ICudaEngine
用于在已构建的网络上执行推理的引擎，包含非功能安全（functionally unsafe）的特性。
定义: NvInferRuntime.h:3002

nvinfer1::ICudaEngine::getTensorBytesPerComponent
int32_t getTensorBytesPerComponent(char const *tensorName) const noexcept
返回一个元素中每个组件的字节数，如果张量未向量化或未提供，则返回 -1...
定义: NvInferRuntime.h:3227

nvinfer1::ICudaEngine::createSerializationConfig
ISerializationConfig * createSerializationConfig() noexcept
创建一个序列化配置对象。
定义: NvInferRuntime.h:3626

nvinfer1::ICudaEngine::getWeightStreamingBudget
TRT_DEPRECATED int64_t getWeightStreamingBudget() const noexcept
以字节为单位返回当前权重流设备内存预算。
定义: NvInferRuntime.h:3707

nvinfer1::ICudaEngine::getProfileTensorValues
int32_t const * getProfileTensorValues(char const *tensorName, int32_t profileIndex, OptProfileSelector select) const noexcept
获取给定名称的输入张量在某个优化配置下的最小/最佳/最大值（非维度）...
定义: NvInferRuntime.h:3461

nvinfer1::ICudaEngine::getIOTensorName
char const * getIOTensorName(int32_t index) const noexcept
返回 IO 张量的名称。
定义: NvInferRuntime.h:3588

nvinfer1::ICudaEngine::getWeightStreamingBudgetV2
int64_t getWeightStreamingBudgetV2() const noexcept
以字节为单位返回当前权重流设备内存预算。
定义: NvInferRuntime.h:3806

nvinfer1::ICudaEngine::getEngineCapability
EngineCapability getEngineCapability() const noexcept
确定此引擎具有的执行能力。
定义: NvInferRuntime.h:3477

nvinfer1::ICudaEngine::getErrorRecorder
IErrorRecorder * getErrorRecorder() const noexcept
获取分配给此接口的 ErrorRecorder。
定义: NvInferRuntime.h:3511

nvinfer1::ICudaEngine::getTensorFormat
TensorFormat getTensorFormat(char const *tensorName, int32_t profileIndex) const noexcept
返回给定配置的张量格式，如果提供的名称未映射到...
定义: NvInferRuntime.h:3313

nvinfer1::ICudaEngine::hasImplicitBatchDimension
TRT_DEPRECATED bool hasImplicitBatchDimension() const noexcept
查询引擎是否使用隐式批次维度构建。
定义: NvInferRuntime.h:3525

nvinfer1::ICudaEngine::mImpl
apiv::VCudaEngine * mImpl
定义: NvInferRuntime.h:3879

nvinfer1::ICudaEngine::getDeviceMemorySizeForProfile
TRT_DEPRECATED size_t getDeviceMemorySizeForProfile(int32_t profileIndex) const noexcept
返回配置文件的上下文所需的最大设备内存。
定义: NvInferRuntime.h:3164

nvinfer1::ICudaEngine::createExecutionContext
IExecutionContext * createExecutionContext(ExecutionContextAllocationStrategy strategy=ExecutionContextAllocationStrategy::kSTATIC) noexcept
创建一个执行上下文并指定用于分配内部激活内存的策略。
定义: NvInferRuntime.h:3076

nvinfer1::ICudaEngine::getTensorFormatDesc
char const * getTensorFormatDesc(char const *tensorName) const noexcept
返回张量格式的人类可读描述，如果提供的名称不映射到...
定义: NvInferRuntime.h:3337

nvinfer1::ICudaEngine::getProfileShape
Dims getProfileShape(char const *tensorName, int32_t profileIndex, OptProfileSelector select) const noexcept
获取给定名称的输入张量在优化下的最小/最佳/最大维度...
定义: NvInferRuntime.h:3439

nvinfer1::ICudaEngine::setWeightStreamingBudgetV2
bool setWeightStreamingBudgetV2(int64_t gpuMemoryBudget) noexcept
限制网络权重可用的最大 GPU 内存量（以字节为单位）。
定义: NvInferRuntime.h:3788

nvinfer1::ICudaEngine::getNbAuxStreams
int32_t getNbAuxStreams() const noexcept
返回此引擎使用的辅助流的数量。
定义: NvInferRuntime.h:3616

nvinfer1::ICudaEngine::getStreamableWeightsSize
int64_t getStreamableWeightsSize() const noexcept
获取所有可流式传输权重的总大小（以字节为单位）。
定义: NvInferRuntime.h:3746

nvinfer1::ICudaEngine::getTensorDataType
DataType getTensorDataType(char const *tensorName) const noexcept
从张量名称确定缓冲区所需的数据类型。
定义: NvInferRuntime.h:3031

nvinfer1::ICudaEngine::setErrorRecorder
void setErrorRecorder(IErrorRecorder *recorder) noexcept
为此接口设置 ErrorRecorder。
定义: NvInferRuntime.h:3496

nvinfer1::ICudaEngine::getTacticSources
TacticSources getTacticSources() const noexcept
返回此引擎所需的策略源。
定义: NvInferRuntime.h:3541

nvinfer1::ICudaEngine::serializeWithConfig
IHostMemory * serializeWithConfig(ISerializationConfig &config) const noexcept
使用提供的 SerializationConfig 将网络序列化到流中。
定义: NvInferRuntime.h:3642

nvinfer1::ICudaEngine::~ICudaEngine
virtual ~ICudaEngine() noexcept=default

nvinfer1::ICudaEngine::getWeightStreamingAutomaticBudget
int64_t getWeightStreamingAutomaticBudget() const noexcept
TensorRT 自动确定模型运行的设备内存预算。预算接近于...
定义: NvInferRuntime.h:3831

nvinfer1::ICudaEngine::isDebugTensor
bool isDebugTensor(char const *name) const noexcept
检查张量是否标记为调试张量。
定义: NvInferRuntime.h:3873

nvinfer1::ICudaEngine::getTensorVectorizedDim
int32_t getTensorVectorizedDim(char const *tensorName, int32_t profileIndex) const noexcept
返回给定配置的缓冲区向量化的维度索引，如果提供的名称...
定义: NvInferRuntime.h:3393

nvinfer1::ICudaEngine::getName
char const * getName() const noexcept
返回与引擎关联的网络的名称。
定义: NvInferRuntime.h:3408

nvinfer1::ICudaEngine::getProfilingVerbosity
ProfilingVerbosity getProfilingVerbosity() const noexcept
返回构建引擎时构建器配置设置的 ProfilingVerbosity。
定义: NvInferRuntime.h:3553

nvinfer1::ICudaEngine::isShapeInferenceIO
bool isShapeInferenceIO(char const *tensorName) const noexcept
如果张量是形状计算所需的输入或形状计算的输出，则为 True。
定义: NvInferRuntime.h:3114

nvinfer1::ICudaEngine::getWeightStreamingScratchMemorySize
int64_t getWeightStreamingScratchMemorySize() const noexcept
返回当前权重流预算所需的暂存内存大小。
定义: NvInferRuntime.h:3859

nvinfer1::ICudaEngine::setWeightStreamingBudget
TRT_DEPRECATED bool setWeightStreamingBudget(int64_t gpuMemoryBudget) noexcept
限制网络权重可用的最大 GPU 内存量（以字节为单位）。
定义: NvInferRuntime.h:3687

nvinfer1::ICudaEngine::getDeviceMemorySizeV2
int64_t getDeviceMemorySizeV2() const noexcept
返回所有配置文件中上下文所需的最大设备内存。
定义: NvInferRuntime.h:3180

nvinfer1::ICudaEngine::getTensorVectorizedDim
int32_t getTensorVectorizedDim(char const *tensorName) const noexcept
返回缓冲区向量化的维度索引，如果提供的名称未映射到 ...，则返回 -1。
定义: NvInferRuntime.h:3377

nvinfer1::ICudaEngine::getDeviceMemorySize
TRT_DEPRECATED size_t getDeviceMemorySize() const noexcept
返回所有配置文件中上下文所需的最大设备内存。
定义: NvInferRuntime.h:3152

nvinfer1::ICudaEngine::getTensorComponentsPerElement
int32_t getTensorComponentsPerElement(char const *tensorName, int32_t profileIndex) const noexcept
返回给定配置的元素中包含的组件数量，如果张量未向量化，则返回 -1...
定义: NvInferRuntime.h:3284

nvinfer1::ICudaEngine::getDeviceMemorySizeForProfileV2
int64_t getDeviceMemorySizeForProfileV2(int32_t profileIndex) const noexcept
返回配置文件的上下文所需的最大设备内存。
定义: NvInferRuntime.h:3196

nvinfer1::ICudaEngine::getTensorFormat
TensorFormat getTensorFormat(char const *tensorName) const noexcept
返回张量格式，如果提供的名称未映射到输入或输出，则返回 TensorFormat::kLINEAR...
定义: NvInferRuntime.h:3299

nvinfer1::ICudaEngine::serialize
IHostMemory * serialize() const noexcept
将网络序列化到流中。
定义: NvInferRuntime.h:3059

nvinfer1::ICudaEngine::getTensorLocation
TensorLocation getTensorLocation(char const *tensorName) const noexcept
获取输入或输出张量是否必须在 GPU 或 CPU 上。
定义: NvInferRuntime.h:3094

nvinfer1::ICudaEngine::createEngineInspector
IEngineInspector * createEngineInspector() const noexcept
创建一个新的引擎检查器，用于打印引擎或执行上下文中的层信息。
定义: NvInferRuntime.h:3563

nvinfer1::ICudaEngine::getTensorBytesPerComponent
int32_t getTensorBytesPerComponent(char const *tensorName, int32_t profileIndex) const noexcept
返回给定配置的元素中每个组件的字节数，如果张量是...
定义: NvInferRuntime.h:3245

nvinfer1::ICudaEngine::getHardwareCompatibilityLevel
HardwareCompatibilityLevel getHardwareCompatibilityLevel() const noexcept
返回此引擎的硬件兼容性级别。
定义: NvInferRuntime.h:3601

nvinfer1::ICudaEngine::getNbOptimizationProfiles
int32_t getNbOptimizationProfiles() const noexcept
获取为此引擎定义的优化配置文件的数量。
定义: NvInferRuntime.h:3419

nvinfer1::ICudaEngine::createExecutionContextWithoutDeviceMemory
TRT_DEPRECATED IExecutionContext * createExecutionContextWithoutDeviceMemory() noexcept
创建一个不分配任何设备内存的执行上下文
定义: NvInferRuntime.h:3140

nvinfer1::ICudaEngine::getTensorFormatDesc
char const * getTensorFormatDesc(char const *tensorName, int32_t profileIndex) const noexcept
返回给定配置的张量格式的人类可读描述，如果提供的名称...，则返回空字符串。
定义: NvInferRuntime.h:3360

nvinfer1::ICudaEngine::getMinimumWeightStreamingBudget
TRT_DEPRECATED int64_t getMinimumWeightStreamingBudget() const noexcept
网络权重成功进行权重流式传输所需的最小 GPU 内存字节数...
定义: NvInferRuntime.h:3730

nvinfer1::ICudaEngine::getTensorIOMode
TensorIOMode getTensorIOMode(char const *tensorName) const noexcept
确定张量是输入张量还是输出张量。
定义: NvInferRuntime.h:3128

nvinfer1::ICudaEngine::getNbLayers
int32_t getNbLayers() const noexcept
获取网络中的层数。
定义: NvInferRuntime.h:3045

nvinfer1::ICudaEngine::getNbIOTensors
int32_t getNbIOTensors() const noexcept
返回 IO 张量的数量。
定义: NvInferRuntime.h:3576

nvinfer1::ICudaEngine::getTensorComponentsPerElement
int32_t getTensorComponentsPerElement(char const *tensorName) const noexcept
返回一个元素中包含的组件数量，如果张量未向量化或如果 ...，则返回 -1。
定义: NvInferRuntime.h:3266

nvinfer1::ICudaEngine::isRefittable
bool isRefittable() const noexcept
如果引擎可以重新拟合，则返回 true。
定义: NvInferRuntime.h:3206

nvinfer1::IDimensionExpr
IDimensionExpr 表示从常量、输入维度构建的整数表达式...
定义: NvInferRuntime.h:232

nvinfer1::IDimensionExpr::isConstant
bool isConstant() const noexcept
如果表达式是构建时常量，则返回 true。
定义: NvInferRuntime.h:237

nvinfer1::IDimensionExpr::isSizeTensor
bool isSizeTensor() const noexcept
如果这表示大小张量的值，则返回 true。
定义: NvInferRuntime.h:263

nvinfer1::IDimensionExpr::~IDimensionExpr
virtual ~IDimensionExpr() noexcept=default

nvinfer1::IDimensionExpr::mImpl
apiv::VDimensionExpr * mImpl
定义: NvInferRuntime.h:254

nvinfer1::IDimensionExpr::getConstantValue
int64_t getConstantValue() const noexcept
获取常量的值。
定义: NvInferRuntime.h:248

nvinfer1::IEngineInspector
引擎检查器，用于打印引擎或执行上下文的层信息。
定义: NvInferRuntime.h:4932

nvinfer1::IEngineInspector::getLayerInformation
char const * getLayerInformation(int32_t layerIndex, LayerInformationFormat format) const noexcept
获取描述当前引擎或执行上下文中的特定层信息的字符串。
定义: NvInferRuntime.h:4985

nvinfer1::IEngineInspector::getErrorRecorder
IErrorRecorder * getErrorRecorder() const noexcept
获取分配给此接口的 ErrorRecorder。
定义: NvInferRuntime.h:5042

nvinfer1::IEngineInspector::setErrorRecorder
void setErrorRecorder(IErrorRecorder *recorder) noexcept
为此接口设置 ErrorRecorder。
定义: NvInferRuntime.h:5027

nvinfer1::IEngineInspector::getExecutionContext
IExecutionContext const * getExecutionContext() const noexcept
获取当前正在检查的上下文。
定义: NvInferRuntime.h:4960

nvinfer1::IEngineInspector::mImpl
apiv::VEngineInspector * mImpl
定义: NvInferRuntime.h:5048

nvinfer1::IEngineInspector::~IEngineInspector
virtual ~IEngineInspector() noexcept=default

nvinfer1::IEngineInspector::getEngineInformation
char const * getEngineInformation(LayerInformationFormat format) const noexcept
获取描述当前引擎或执行上下文中所有层信息的字符串。
定义: NvInferRuntime.h:5008

nvinfer1::IExecutionContext
使用引擎执行推理的上下文，包含非功能安全（functionally unsafe）的特性。
定义: NvInferRuntime.h:4021

nvinfer1::IExecutionContext::getOutputAllocator
IOutputAllocator * getOutputAllocator(char const *tensorName) const noexcept
获取与给定名称的输出张量关联的输出分配器，如果提供的名称未...，则返回 nullptr。
定义: NvInferRuntime.h:4656

nvinfer1::IExecutionContext::getErrorRecorder
IErrorRecorder * getErrorRecorder() const noexcept
获取分配给此接口的 ErrorRecorder。
定义: NvInferRuntime.h:4304

nvinfer1::IExecutionContext::reportToProfiler
bool reportToProfiler() const noexcept
计算 IExecutionContext 中当前优化配置的层计时信息，并更新 ...
定义: NvInferRuntime.h:4423

nvinfer1::IExecutionContext::~IExecutionContext
virtual ~IExecutionContext() noexcept=default

nvinfer1::IExecutionContext::setDeviceMemory
void setDeviceMemory(void *memory) noexcept
设置此执行上下文要使用的设备内存。
定义: NvInferRuntime.h:4124

nvinfer1::IExecutionContext::allInputShapesSpecified
TRT_DEPRECATED bool allInputShapesSpecified() const noexcept
是否已指定所有输入形状绑定。
定义: NvInferRuntime.h:4270

nvinfer1::IExecutionContext::setTensorDebugState
bool setTensorDebugState(char const *name, bool flag) noexcept
设置给定张量名称的张量的调试状态。
定义: NvInferRuntime.h:4863

nvinfer1::IExecutionContext::getName
char const * getName() const noexcept
返回执行上下文的名称。
定义: NvInferRuntime.h:4097

nvinfer1::IExecutionContext::getTemporaryStorageAllocator
IGpuAllocator * getTemporaryStorageAllocator() const noexcept
获取通过 setTemporaryStorageAllocator 设置的分配器。
定义： NvInferRuntime.h:4704

nvinfer1::IExecutionContext::setEnqueueEmitsProfile
void setEnqueueEmitsProfile(bool enqueueEmitsProfile) noexcept
设置 enqueue 是否将层计时信息发送到 profiler。
定义： NvInferRuntime.h:4381

nvinfer1::IExecutionContext::getTensorShape
Dims getTensorShape(char const *tensorName) const noexcept
返回给定输入或输出的形状。
定义： NvInferRuntime.h:4237

nvinfer1::IExecutionContext::getDebugState
bool getDebugState(char const *name) const noexcept
定义： NvInferRuntime.h:4886

nvinfer1::IExecutionContext::setInputShape
bool setInputShape(char const *tensorName, Dims const &dims) noexcept
设置给定输入的形状。
定义： NvInferRuntime.h:4200

nvinfer1::IExecutionContext::executeV2
bool executeV2(void *const *bindings) noexcept
同步执行网络。
定义： NvInferRuntime.h:4321

nvinfer1::IExecutionContext::getEnqueueEmitsProfile
bool getEnqueueEmitsProfile() const noexcept
获取 enqueueEmitsProfile 状态。
定义： NvInferRuntime.h:4393

nvinfer1::IExecutionContext::getTensorAddress
void const * getTensorAddress(char const *tensorName) const noexcept
获取绑定到给定输入或输出张量的内存地址，如果提供的名称不匹配，则返回 nullptr...
定义： NvInferRuntime.h:4484

nvinfer1::IExecutionContext::setOutputAllocator
bool setOutputAllocator(char const *tensorName, IOutputAllocator *outputAllocator) noexcept
设置用于给定名称的输出张量的输出分配器。传递 nullptr 给 outputAllocator 以取消设置...
定义： NvInferRuntime.h:4643

nvinfer1::IExecutionContext::setOptimizationProfileAsync
bool setOptimizationProfileAsync(int32_t profileIndex, cudaStream_t stream) noexcept
为当前上下文选择一个优化配置文件，使用异步语义。
定义： NvInferRuntime.h:4365

nvinfer1::IExecutionContext::mImpl
apiv::VExecutionContext * mImpl
定义： NvInferRuntime.h:4892

nvinfer1::IExecutionContext::setOutputTensorAddress
bool setOutputTensorAddress(char const *tensorName, void *data) noexcept
设置给定输出张量的内存地址。
定义： NvInferRuntime.h:4507

nvinfer1::IExecutionContext::setPersistentCacheLimit
void setPersistentCacheLimit(size_t size) noexcept
设置持久缓存使用的最大大小。
定义： NvInferRuntime.h:4744

nvinfer1::IExecutionContext::getPersistentCacheLimit
size_t getPersistentCacheLimit() const noexcept
获取持久缓存使用的最大大小。
定义： NvInferRuntime.h:4755

nvinfer1::IExecutionContext::setAllTensorsDebugState
bool setAllTensorsDebugState(bool flag) noexcept
定义： NvInferRuntime.h:4876

nvinfer1::IExecutionContext::getEngine
ICudaEngine const & getEngine() const noexcept
获取关联的引擎。
定义： NvInferRuntime.h:4073

nvinfer1::IExecutionContext::getNvtxVerbosity
ProfilingVerbosity getNvtxVerbosity() const noexcept
获取执行上下文的 NVTX 详细程度。
定义： NvInferRuntime.h:4791

nvinfer1::IExecutionContext::updateDeviceMemorySizeForShapes
size_t updateDeviceMemorySizeForShapes() noexcept
基于当前的输入形状重新计算内部激活缓冲区大小，并返回总计...
定义： NvInferRuntime.h:4598

nvinfer1::IExecutionContext::setAuxStreams
void setAuxStreams(cudaStream_t *auxStreams, int32_t nbStreams) noexcept
设置 TensorRT 应在下次 enqueueV3() 调用中在其上启动内核的辅助流。
定义： NvInferRuntime.h:4822

nvinfer1::IExecutionContext::getMaxOutputSize
int64_t getMaxOutputSize(char const *tensorName) const noexcept
获取输出张量大小的上限（以字节为单位），基于当前的优化配置文件和输入...
定义： NvInferRuntime.h:4674

nvinfer1::IExecutionContext::inferShapes
int32_t inferShapes(int32_t nbMaxNames, char const **tensorNames) noexcept
运行形状计算。
定义： NvInferRuntime.h:4581

nvinfer1::IExecutionContext::setDebugListener
bool setDebugListener(IDebugListener *listener) noexcept
为此执行上下文设置 DebugListener。
定义： NvInferRuntime.h:4834

nvinfer1::IExecutionContext::setTensorAddress
bool setTensorAddress(char const *tensorName, void *data) noexcept
设置给定输入或输出张量的内存地址。
定义： NvInferRuntime.h:4467

nvinfer1::IExecutionContext::setTemporaryStorageAllocator
bool setTemporaryStorageAllocator(IGpuAllocator *allocator) noexcept
指定用于内部临时存储的分配器。
定义： NvInferRuntime.h:4694

nvinfer1::IExecutionContext::getOutputTensorAddress
void * getOutputTensorAddress(char const *tensorName) const noexcept
获取给定输出的内存地址。
定义： NvInferRuntime.h:4548

nvinfer1::IExecutionContext::enqueueV3
bool enqueueV3(cudaStream_t stream) noexcept
在流上排队推理。
定义： NvInferRuntime.h:4728

nvinfer1::IExecutionContext::getDebugListener
IDebugListener * getDebugListener() noexcept
获取此执行上下文的 DebugListener。
定义： NvInferRuntime.h:4844

nvinfer1::IExecutionContext::getOptimizationProfile
int32_t getOptimizationProfile() const noexcept
获取当前选定的优化配置文件的索引。
定义： NvInferRuntime.h:4182

nvinfer1::IExecutionContext::setInputTensorAddress
bool setInputTensorAddress(char const *tensorName, void const *data) noexcept
设置给定输入的内存地址。
定义： NvInferRuntime.h:4529

nvinfer1::IExecutionContext::getDebugSync
bool getDebugSync() const noexcept
获取调试同步标志。
定义： NvInferRuntime.h:4043

nvinfer1::IExecutionContext::setInputConsumedEvent
bool setInputConsumedEvent(cudaEvent_t event) noexcept
将输入标记为已消耗。
定义： NvInferRuntime.h:4614

nvinfer1::IExecutionContext::getTensorStrides
Dims getTensorStrides(char const *tensorName) const noexcept
返回给定张量名称的缓冲区的步幅。
定义： NvInferRuntime.h:4167

nvinfer1::IExecutionContext::setNvtxVerbosity
bool setNvtxVerbosity(ProfilingVerbosity verbosity) noexcept
设置执行上下文中 NVTX 标记的详细程度。
定义： NvInferRuntime.h:4779

nvinfer1::IExecutionContext::getProfiler
IProfiler * getProfiler() const noexcept
获取 profiler。
定义： NvInferRuntime.h:4063

nvinfer1::IExecutionContext::setErrorRecorder
void setErrorRecorder(IErrorRecorder *recorder) noexcept
为此接口设置 ErrorRecorder。
定义： NvInferRuntime.h:4289

nvinfer1::IExecutionContext::setDeviceMemoryV2
void setDeviceMemoryV2(void *memory, int64_t size) noexcept
设置设备内存及其相应大小，供此执行上下文使用。
定义： NvInferRuntime.h:4146

nvinfer1::IExecutionContext::allInputDimensionsSpecified
bool allInputDimensionsSpecified() const noexcept
是否已指定输入张量的所有动态维度。
定义： NvInferRuntime.h:4253

nvinfer1::IExecutionContext::setProfiler
void setProfiler(IProfiler *profiler) noexcept
设置 profiler。
定义： NvInferRuntime.h:4053

nvinfer1::IExecutionContext::setName
void setName(char const *name) noexcept
设置执行上下文的名称。
定义： NvInferRuntime.h:4087

nvinfer1::IExecutionContext::getInputConsumedEvent
cudaEvent_t getInputConsumedEvent() const noexcept
与消耗输入相关的事件。
定义： NvInferRuntime.h:4624

nvinfer1::IExprBuilder
用于构造 IDimensionExpr 的对象。
定义： NvInferRuntime.h:287

nvinfer1::IExprBuilder::operation
IDimensionExpr const * operation(DimensionOperation op, IDimensionExpr const &first, IDimensionExpr const &second) noexcept
获取操作。
定义： NvInferRuntime.h:303

nvinfer1::IExprBuilder::~IExprBuilder
virtual ~IExprBuilder() noexcept=default

nvinfer1::IExprBuilder::constant
IDimensionExpr const * constant(int64_t value) noexcept
返回给定值的 IDimensionExpr 的指针。
定义： NvInferRuntime.h:292

nvinfer1::IExprBuilder::mImpl
apiv::VExprBuilder * mImpl
定义： NvInferRuntime.h:310

nvinfer1::IExprBuilder::declareSizeTensor
IDimensionExpr const * declareSizeTensor(int32_t outputIndex, IDimensionExpr const &opt, IDimensionExpr const &upper)
在给定的输出索引处声明一个大小张量，具有指定的自动调整公式和上限...
定义： NvInferRuntime.h:338

nvinfer1::IHostMemory
用于处理库分配的、用户可访问的内存的类。
定义： NvInferRuntime.h:142

nvinfer1::IHostMemory::data
void * data() const noexcept
指向库拥有的原始数据的指针。
定义： NvInferRuntime.h:147

nvinfer1::IHostMemory::type
DataType type() const noexcept
已分配内存的类型。
定义： NvInferRuntime.h:159

nvinfer1::IHostMemory::size
std::size_t size() const noexcept
已分配数据的字节大小。
定义： NvInferRuntime.h:153

nvinfer1::IHostMemory::mImpl
apiv::VHostMemory * mImpl
定义： NvInferRuntime.h:165

nvinfer1::IHostMemory::~IHostMemory
virtual ~IHostMemory() noexcept=default

nvinfer1::ILoggerFinder
用于查找 logger 的虚拟基类。允许插件在需要时查找 logger 的实例...
定义： NvInferRuntime.h:5145

nvinfer1::ILoggerFinder::findLogger
virtual ILogger * findLogger()=0
获取引擎或执行上下文调用的插件方法使用的 logger。

nvinfer1::ILoggerFinder::~ILoggerFinder
virtual ~ILoggerFinder()=default

nvinfer1::ILogger
应用程序实现的用于构建器、重拟合器（refitter）和运行时的日志记录接口。
定义： NvInferRuntime.h:1540

nvinfer1::ILogger::ILogger
ILogger()=default

nvinfer1::ILogger::~ILogger
virtual ~ILogger()=default

nvinfer1::ILogger::Severity
Severity
与日志消息对应的严重性。
定义： NvInferRuntime.h:1548

nvinfer1::ILogger::log
virtual void log(Severity severity, AsciiChar const *msg) noexcept=0
应用程序实现的用于处理日志消息的回调。

nvinfer1::INoCopy
IEngineInspector 的前向声明，供其他接口使用。
定义： NvInferRuntime.h:51

nvinfer1::INoCopy::operator=
INoCopy & operator=(INoCopy &&other)=delete

nvinfer1::INoCopy::INoCopy
INoCopy(INoCopy const &other)=delete

nvinfer1::INoCopy::INoCopy
INoCopy(INoCopy &&other)=delete

nvinfer1::INoCopy::INoCopy
INoCopy()=default

nvinfer1::INoCopy::~INoCopy
virtual ~INoCopy()=default

nvinfer1::INoCopy::operator=
INoCopy & operator=(INoCopy const &other)=delete

nvinfer1::IOptimizationProfile
用于动态输入维度和形状张量的优化配置文件。
定义： NvInferRuntime.h:2616

nvinfer1::IOptimizationProfile::getShapeValues
int32_t const * getShapeValues(char const *inputName, OptProfileSelector select) const noexcept
获取输入形状张量的最小/最佳/最大值。
定义： NvInferRuntime.h:2730

nvinfer1::IOptimizationProfile::mImpl
apiv::VOptimizationProfile * mImpl
定义： NvInferRuntime.h:2783

nvinfer1::IOptimizationProfile::getDimensions
Dims getDimensions(char const *inputName, OptProfileSelector select) const noexcept
获取动态输入张量的最小/最佳/最大维度。
定义： NvInferRuntime.h:2657

nvinfer1::IOptimizationProfile::~IOptimizationProfile
virtual ~IOptimizationProfile() noexcept=default

nvinfer1::IOptimizationProfile::getExtraMemoryTarget
float getExtraMemoryTarget() const noexcept
获取为此配置文件定义的额外内存目标。
定义： NvInferRuntime.h:2760

nvinfer1::IOptimizationProfile::setExtraMemoryTarget
bool setExtraMemoryTarget(float target) noexcept
为此配置文件设置可能使用的额外 GPU 内存的目标。
定义： NvInferRuntime.h:2748

nvinfer1::IOptimizationProfile::setDimensions
bool setDimensions(char const *inputName, OptProfileSelector select, Dims const &dims) noexcept
设置动态输入张量的最小/最佳/最大维度。
定义： NvInferRuntime.h:2645

nvinfer1::IOptimizationProfile::setShapeValues
bool setShapeValues(char const *inputName, OptProfileSelector select, int32_t const *values, int32_t nbValues) noexcept
设置输入形状张量的最小/最佳/最大值。
定义： NvInferRuntime.h:2704

nvinfer1::IOptimizationProfile::isValid
bool isValid() const noexcept
检查优化配置文件是否可以传递给 IBuilderConfig 对象。
定义： NvInferRuntime.h:2777

nvinfer1::IOptimizationProfile::getNbShapeValues
int32_t getNbShapeValues(char const *inputName) const noexcept
获取输入形状张量的值的数量。
定义： NvInferRuntime.h:2718

nvinfer1::IPluginRegistry
应用程序中所有插件的单个注册点。它用于查找插件实现...
定义： NvInferRuntimeCommon.h:56

nvinfer1::IPluginRegistry::registerCreator
virtual TRT_DEPRECATED bool registerCreator(IPluginCreator &creator, AsciiChar const *const pluginNamespace) noexcept=0
注册实现 IPluginCreator 的插件创建器。如果已注册具有相同名称、版本或命名空间的插件创建器，则返回 false。

nvinfer1::IPluginResourceContext
用于插件访问 TensorRT 提供的每个上下文资源的接口。
定义： NvInferRuntime.h:767

nvinfer1::IPluginResourceContext::getErrorRecorder
virtual IErrorRecorder * getErrorRecorder() const noexcept=0
获取与资源上下文关联的错误记录器。

nvinfer1::IPluginResourceContext::operator=
IPluginResourceContext & operator=(IPluginResourceContext const &) &=default

nvinfer1::IPluginResourceContext::getGpuAllocator
virtual IGpuAllocator * getGpuAllocator() const noexcept=0
获取与资源上下文关联的 GPU 分配器。

nvinfer1::IPluginV2DynamicExt
类似于 IPluginV2Ext，但支持动态形状。
定义： NvInferRuntime.h:407

nvinfer1::IPluginV2DynamicExt::clone
IPluginV2DynamicExt * clone() const noexcept override=0
克隆插件对象。这将复制内部插件参数，并返回一个新的插件...

nvinfer1::IPluginV2DynamicExt::~IPluginV2DynamicExt
virtual ~IPluginV2DynamicExt() noexcept
定义： NvInferRuntime.h:558

nvinfer1::IPluginV2Ext
用于用户实现的层的插件类。
定义： NvInferRuntimePlugin.h:468

nvinfer1::IRefitter
更新引擎中的权重。
定义： NvInferRuntime.h:2136

nvinfer1::IRefitter::refitCudaEngineAsync
bool refitCudaEngineAsync(cudaStream_t stream) noexcept
在给定流上排队关联引擎的权重重定。
定义： NvInferRuntime.h:2538

nvinfer1::IRefitter::getMaxThreads
int32_t getMaxThreads() const noexcept
获取重定器可以使用的最大线程数。
定义： NvInferRuntime.h:2417

nvinfer1::IRefitter::getWeightsLocation
TensorLocation getWeightsLocation(char const *weightsName) const noexcept
获取与给定名称关联的权重的位置。
定义： NvInferRuntime.h:2476

nvinfer1::IRefitter::setNamedWeights
bool setNamedWeights(char const *name, Weights weights) noexcept
指定给定名称的新权重。
定义： NvInferRuntime.h:2341

nvinfer1::IRefitter::getAllWeights
int32_t getAllWeights(int32_t size, char const **weightsNames) noexcept
获取所有可以重定的权重的名称。
定义： NvInferRuntime.h:2377

nvinfer1::IRefitter::getLogger
ILogger * getLogger() const noexcept
获取创建重定器时使用的 logger。
定义： NvInferRuntime.h:2387

nvinfer1::IRefitter::refitCudaEngine
bool refitCudaEngine() noexcept
重定关联的引擎。
定义： NvInferRuntime.h:2172

nvinfer1::IRefitter::getMissingWeights
int32_t getMissingWeights(int32_t size, char const **weightsNames) noexcept
获取缺失权重的名称。
定义： NvInferRuntime.h:2361

nvinfer1::IRefitter::getDynamicRangeMax
TRT_DEPRECATED float getDynamicRangeMax(char const *tensorName) const noexcept
获取动态范围的最大值。
定义： NvInferRuntime.h:2264

nvinfer1::IRefitter::getMissing
int32_t getMissing(int32_t size, char const **layerNames, WeightsRole *roles) noexcept
获取缺失权重的描述。
定义： NvInferRuntime.h:2193

nvinfer1::IRefitter::getNamedWeights
Weights getNamedWeights(char const *weightsName) const noexcept
获取与给定名称关联的权重。
定义： NvInferRuntime.h:2460

nvinfer1::IRefitter::unsetNamedWeights
bool unsetNamedWeights(char const *weightsName) noexcept
取消设置与给定名称关联的权重。
定义： NvInferRuntime.h:2492

nvinfer1::IRefitter::getWeightsPrototype
Weights getWeightsPrototype(char const *weightsName) const noexcept
获取与给定名称关联的 Weights 原型。
定义： NvInferRuntime.h:2556

nvinfer1::IRefitter::setMaxThreads
bool setMaxThreads(int32_t maxThreads) noexcept
设置最大线程数。
定义： NvInferRuntime.h:2403

nvinfer1::IRefitter::getDynamicRangeMin
TRT_DEPRECATED float getDynamicRangeMin(char const *tensorName) const noexcept
获取动态范围的最小值。
定义： NvInferRuntime.h:2248

nvinfer1::IRefitter::getTensorsWithDynamicRange
TRT_DEPRECATED int32_t getTensorsWithDynamicRange(int32_t size, char const **tensorNames) const noexcept
获取所有具有可重定动态范围的张量的名称。
定义： NvInferRuntime.h:2282

nvinfer1::IRefitter::setNamedWeights
bool setNamedWeights(char const *name, Weights weights, TensorLocation location) noexcept
在给定名称的指定设备上指定新权重。
定义： NvInferRuntime.h:2444

nvinfer1::IRefitter::setWeightsValidation
void setWeightsValidation(bool weightsValidation) noexcept
设置是否在重定期间验证权重。
定义： NvInferRuntime.h:2508

nvinfer1::IRefitter::setDynamicRange
TRT_DEPRECATED bool setDynamicRange(char const *tensorName, float min, float max) noexcept
定义： NvInferRuntime.h:2232

nvinfer1::IRefitter::mImpl
apiv::VRefitter * mImpl
定义： NvInferRuntime.h:2562

nvinfer1::IRefitter::getAll
int32_t getAll(int32_t size, char const **layerNames, WeightsRole *roles) noexcept
获取所有可以重定的权重的描述。
定义： NvInferRuntime.h:2210

nvinfer1::IRefitter::~IRefitter
virtual ~IRefitter() noexcept=default

nvinfer1::IRefitter::getWeightsValidation
bool getWeightsValidation() const noexcept
获取是否在重定期间验证权重值。
定义： NvInferRuntime.h:2516

nvinfer1::IRefitter::setErrorRecorder
void setErrorRecorder(IErrorRecorder *recorder) noexcept
为此接口设置 ErrorRecorder。
定义： NvInferRuntime.h:2301

nvinfer1::IRefitter::getErrorRecorder
IErrorRecorder * getErrorRecorder() const noexcept
获取分配给此接口的 ErrorRecorder。
定义： NvInferRuntime.h:2316

nvinfer1::IRuntime
允许反序列化功能上不安全的序列化引擎。
定义： NvInferRuntime.h:1817

nvinfer1::IRuntime::setMaxThreads
bool setMaxThreads(int32_t maxThreads) noexcept
设置最大线程数。
定义： NvInferRuntime.h:1981

nvinfer1::IRuntime::loadRuntime
IRuntime * loadRuntime(char const *path) noexcept
从文件加载 IRuntime。
定义： NvInferRuntime.h:2097

nvinfer1::IRuntime::getEngineHostCodeAllowed
bool getEngineHostCodeAllowed() const noexcept
获取运行时是否允许反序列化具有主机可执行代码的引擎。
定义： NvInferRuntime.h:2119

nvinfer1::IRuntime::getTempfileControlFlags
TempfileControlFlags getTempfileControlFlags() const noexcept
获取此运行时的临时文件控制标志。
定义： NvInferRuntime.h:2069

nvinfer1::IRuntime::setEngineHostCodeAllowed
void setEngineHostCodeAllowed(bool allowed) noexcept
设置运行时是否允许反序列化具有主机可执行代码的引擎。
定义： NvInferRuntime.h:2109

nvinfer1::IRuntime::~IRuntime
virtual ~IRuntime() noexcept=default

nvinfer1::IRuntime::setTemporaryDirectory
void setTemporaryDirectory(char const *path) noexcept
设置此运行时将用于临时文件的目录。
定义： NvInferRuntime.h:2030

nvinfer1::IRuntime::getPluginRegistry
IPluginRegistry & getPluginRegistry() noexcept
获取运行时可以使用的本地插件注册表。
定义： NvInferRuntime.h:2079

nvinfer1::IRuntime::mImpl
apiv::VRuntime * mImpl
定义： NvInferRuntime.h:2125

nvinfer1::IRuntime::getNbDLACores
int32_t getNbDLACores() const noexcept
返回可访问的 DLA 硬件核心数量，如果 DLA 不可用，则返回 0。
定义： NvInferRuntime.h:1850

nvinfer1::IRuntime::deserializeCudaEngine
ICudaEngine * deserializeCudaEngine(void const *blob, std::size_t size) noexcept
从主机内存反序列化引擎。
定义： NvInferRuntime.h:1914

nvinfer1::IRuntime::setTempfileControlFlags
void setTempfileControlFlags(TempfileControlFlags flags) noexcept
设置此运行时的临时文件控制标志。
定义： NvInferRuntime.h:2057

nvinfer1::IRuntime::getDLACore
int32_t getDLACore() const noexcept
获取引擎在其上执行的 DLA 核心。
定义： NvInferRuntime.h:1842

nvinfer1::IRuntime::setGpuAllocator
void setGpuAllocator(IGpuAllocator *allocator) noexcept
设置 GPU 分配器。
定义： NvInferRuntime.h:1865

nvinfer1::IRuntime::getErrorRecorder
IErrorRecorder * getErrorRecorder() const noexcept
获取分配给此接口的 ErrorRecorder。
定义： NvInferRuntime.h:1899

nvinfer1::IRuntime::deserializeCudaEngine
ICudaEngine * deserializeCudaEngine(IStreamReaderV2 &streamReader)
从流反序列化引擎。IStreamReaderV2 预计支持读取到主机和 ...
定义： NvInferRuntime.h:1956

nvinfer1::IRuntime::getLogger
ILogger * getLogger() const noexcept
获取创建运行时时使用的 logger。
定义： NvInferRuntime.h:1966

nvinfer1::IRuntime::getMaxThreads
int32_t getMaxThreads() const noexcept
获取运行时可以使用的最大线程数。
定义： NvInferRuntime.h:1995

nvinfer1::IRuntime::getTemporaryDirectory
char const * getTemporaryDirectory() const noexcept
获取此运行时将用于临时文件的目录。
定义： NvInferRuntime.h:2041

nvinfer1::IRuntime::deserializeCudaEngine
TRT_DEPRECATED ICudaEngine * deserializeCudaEngine(IStreamReader &streamReader)
从流反序列化引擎。
定义： NvInferRuntime.h:1935

nvinfer1::IRuntime::setErrorRecorder
void setErrorRecorder(IErrorRecorder *recorder) noexcept
为此接口设置 ErrorRecorder。
定义： NvInferRuntime.h:1884

nvinfer1::ISerializationConfig
保存用于配置引擎以序列化二进制文件的属性。
定义： NvInferRuntime.h:2893

nvinfer1::ISerializationConfig::~ISerializationConfig
virtual ~ISerializationConfig() noexcept=default

nvinfer1::ISerializationConfig::clearFlag
bool clearFlag(SerializationFlag serializationFlag) noexcept
清除序列化标志。
定义： NvInferRuntime.h:2932

nvinfer1::ISerializationConfig::setFlag
bool setFlag(SerializationFlag serializationFlag) noexcept
设置序列化标志。
定义： NvInferRuntime.h:2944

nvinfer1::ISerializationConfig::getFlags
SerializationFlags getFlags() const noexcept
获取此配置的序列化标志。
定义： NvInferRuntime.h:2920

nvinfer1::ISerializationConfig::getFlag
bool getFlag(SerializationFlag serializationFlag) const noexcept
如果设置了序列化标志，则返回 true。
定义： NvInferRuntime.h:2956

nvinfer1::ISerializationConfig::mImpl
apiv::VSerializationConfig * mImpl
定义： NvInferRuntime.h:2962

nvinfer1::IVersionedInterface
用于版本控制的接口类。
定义： NvInferRuntimeBase.h:263

nvinfer1::InterfaceInfo
与 TRT 接口关联的版本信息。
定义： NvInferRuntimeBase.h:228

nvinfer1::PluginRegistrar
将插件创建器注册到注册表。静态注册表对象将在 ... 时实例化
定义： NvInferRuntime.h:5117

nvinfer1::PluginRegistrar::PluginRegistrar
PluginRegistrar()
定义： NvInferRuntime.h:5119

nvinfer1::Weights
用作层参数的权重数组。
定义： NvInferRuntime.h:124

nvinfer1::Weights::type
DataType type
权重的类型。
定义： NvInferRuntime.h:126

nvinfer1::Weights::count
int64_t count
数组中权重的数量。
定义： NvInferRuntime.h:128

nvinfer1::Weights::values
void const * values
权重值，在一个连续的数组中。
定义： NvInferRuntime.h:127

nvinfer1::v_1_0::IDebugListener
定义： NvInferRuntime.h:3972

nvinfer1::v_1_0::IDebugListener::processDebugTensor
virtual bool processDebugTensor(void const *addr, TensorLocation location, DataType type, Dims const &shape, char const *name, cudaStream_t stream)=0
当调试张量的值更新且该张量的调试状态设置为 true 时调用的回调函数。

nvinfer1::v_1_0::IDebugListener::getInterfaceInfo
InterfaceInfo getInterfaceInfo() const noexcept override
返回与此接口关联的版本信息。应用程序不得覆盖此方法...
定义： NvInferRuntime.h:3977

nvinfer1::v_1_0::IDebugListener::~IDebugListener
~IDebugListener() override=default

nvinfer1::v_1_0::IErrorRecorder
定义： NvInferRuntimeBase.h:400

nvinfer1::v_1_0::IGpuAllocator
定义： NvInferRuntime.h:1608

nvinfer1::v_1_0::IGpuAllocator::allocateAsync
virtual void * allocateAsync(uint64_t const size, uint64_t const alignment, AllocatorFlags const flags, cudaStream_t) noexcept
应用程序实现的线程安全回调，用于处理 GPU 内存的流有序获取...
定义： NvInferRuntime.h:1730

nvinfer1::v_1_0::IGpuAllocator::getInterfaceInfo
InterfaceInfo getInterfaceInfo() const noexcept override
返回与此接口关联的版本信息。应用程序不得覆盖此方法...
定义： NvInferRuntime.h:1771

nvinfer1::v_1_0::IGpuAllocator::deallocate
virtual TRT_DEPRECATED bool deallocate(void *const memory) noexcept=0
应用程序实现的线程安全回调，用于处理 GPU 内存的释放。

nvinfer1::v_1_0::IGpuAllocator::~IGpuAllocator
~IGpuAllocator() override=default

nvinfer1::v_1_0::IGpuAllocator::IGpuAllocator
IGpuAllocator()=default

nvinfer1::v_1_0::IGpuAllocator::reallocate
virtual void * reallocate(void *const, uint64_t, uint64_t) noexcept
应用程序实现的线程安全回调，用于调整现有分配的大小。
定义： NvInferRuntime.h:1677

nvinfer1::v_1_0::IGpuAllocator::allocate
virtual TRT_DEPRECATED void * allocate(uint64_t const size, uint64_t const alignment, AllocatorFlags const flags) noexcept=0
应用程序实现的线程安全回调，用于处理 GPU 内存的获取。

nvinfer1::v_1_0::IGpuAllocator::deallocateAsync
virtual bool deallocateAsync(void *const memory, cudaStream_t) noexcept
应用程序实现的线程安全回调，用于处理 GPU 内存的流有序释放。
定义： NvInferRuntime.h:1763

nvinfer1::v_1_0::IGpuAsyncAllocator
定义： NvInferRuntime.h:5166

nvinfer1::v_1_0::IGpuAsyncAllocator::deallocateAsync
bool deallocateAsync(void *const memory, cudaStream_t) noexcept override=0
应用程序实现的线程安全回调，用于处理 GPU 内存的流有序异步释放。

nvinfer1::v_1_0::IGpuAsyncAllocator::IGpuAsyncAllocator
IGpuAsyncAllocator()=default

nvinfer1::v_1_0::IGpuAsyncAllocator::allocateAsync
void * allocateAsync(uint64_t const size, uint64_t const alignment, AllocatorFlags const flags, cudaStream_t) noexcept override=0
应用程序实现的线程安全回调，用于处理 GPU 内存的流有序异步获取。

nvinfer1::v_1_0::IGpuAsyncAllocator::allocate
TRT_DEPRECATED void * allocate(uint64_t const size, uint64_t const alignment, AllocatorFlags const flags) noexcept override
应用程序实现的线程安全回调，用于处理 GPU 内存的获取。
定义： NvInferRuntime.h:5252

nvinfer1::v_1_0::IGpuAsyncAllocator::deallocate
TRT_DEPRECATED bool deallocate(void *const memory) noexcept override
应用程序实现的线程安全回调，用于处理 GPU 内存的释放。
定义： NvInferRuntime.h:5276

nvinfer1::v_1_0::IGpuAsyncAllocator::getInterfaceInfo
InterfaceInfo getInterfaceInfo() const noexcept override
返回与此接口关联的版本信息。应用程序不得覆盖此方法...
定义： NvInferRuntime.h:5284

nvinfer1::v_1_0::IGpuAsyncAllocator::~IGpuAsyncAllocator
~IGpuAsyncAllocator() override=default

nvinfer1::v_1_0::IOutputAllocator
定义： NvInferRuntime.h:3885

nvinfer1::v_1_0::IOutputAllocator::getInterfaceInfo
InterfaceInfo getInterfaceInfo() const noexcept override
返回与此接口关联的版本信息。应用程序不得覆盖此方法...
定义： NvInferRuntime.h:3890

nvinfer1::v_1_0::IOutputAllocator::reallocateOutputAsync
virtual void * reallocateOutputAsync(char const *tensorName, void *currentMemory, uint64_t size, uint64_t alignment, cudaStream_t)
返回输出张量的内存指针，如果无法分配内存，则返回 nullptr....
定义： NvInferRuntime.h:3942

nvinfer1::v_1_0::IOutputAllocator::notifyShape
virtual void notifyShape(char const *tensorName, Dims const &dims) noexcept=0
当输出张量的形状已知时，由 TensorRT 调用。

nvinfer1::v_1_0::IOutputAllocator::reallocateOutput
virtual TRT_DEPRECATED void * reallocateOutput(char const *tensorName, void *currentMemory, uint64_t size, uint64_t alignment) noexcept
返回输出张量的内存指针，如果无法分配内存，则返回 nullptr....
定义： NvInferRuntime.h:3914

nvinfer1::v_1_0::IPluginCapability
定义： NvInferPluginBase.h:141

nvinfer1::v_1_0::IPluginCreatorInterface
定义： NvInferPluginBase.h:193

nvinfer1::v_1_0::IPluginCreatorV3One
定义： NvInferRuntime.h:5291

nvinfer1::v_1_0::IPluginCreatorV3One::getFieldNames
virtual PluginFieldCollection const * getFieldNames() noexcept=0
返回创建插件时需要传递给 createPlugin() 的字段列表，以便在 TensorRT 构建阶段使用。

nvinfer1::v_1_0::IPluginCreatorV3One::getInterfaceInfo
InterfaceInfo getInterfaceInfo() const noexcept override
返回与此接口关联的版本信息。应用程序不得覆盖此方法...
定义： NvInferRuntime.h:5296

nvinfer1::v_1_0::IPluginCreatorV3One::createPlugin
virtual IPluginV3 * createPlugin(AsciiChar const *name, PluginFieldCollection const *fc, TensorRTPhase phase) noexcept=0
返回插件对象。如果发生错误，则返回 nullptr。

nvinfer1::v_1_0::IPluginV3
定义： NvInferPluginBase.h:206

nvinfer1::v_1_0::IPluginV3OneBuild
定义： NvInferRuntime.h:836

nvinfer1::v_1_0::IPluginV3OneBuild::getFormatCombinationLimit
virtual int32_t getFormatCombinationLimit() noexcept
返回 TensorRT 在构建阶段将计时的最大格式组合数...
定义： NvInferRuntime.h:1039

nvinfer1::v_1_0::IPluginV3OneBuild::getNbOutputs
virtual int32_t getNbOutputs() const noexcept=0
获取插件的输出数量。

nvinfer1::v_1_0::IPluginV3OneBuild::configurePlugin
virtual int32_t configurePlugin(DynamicPluginTensorDesc const *in, int32_t nbInputs, DynamicPluginTensorDesc const *out, int32_t nbOutputs) noexcept=0
配置插件。

nvinfer1::v_1_0::IPluginV3OneBuild::getNbTactics
virtual int32_t getNbTactics() noexcept
查询插件打算使用的自定义策略的数量。
定义： NvInferRuntime.h:1015

nvinfer1::v_1_0::IPluginV3OneBuild::getMetadataString
virtual char const * getMetadataString() noexcept
查询表示插件配置的字符串。可以在插件创建后随时调用...
定义： NvInferRuntime.h:1050

nvinfer1::v_1_0::IPluginV3OneBuild::getTimingCacheID
virtual char const * getTimingCacheID() noexcept
调用以查询用于计时缓存 ID 的后缀。可以在插件创建后随时调用...
定义： NvInferRuntime.h:1031

nvinfer1::v_1_0::IPluginV3OneBuild::supportsFormatCombination
virtual bool supportsFormatCombination(int32_t pos, DynamicPluginTensorDesc const *inOut, int32_t nbInputs, int32_t nbOutputs) noexcept=0
如果插件支持 pos 索引的输入/输出的格式和数据类型，则返回 true。

nvinfer1::v_1_0::IPluginV3OneBuild::getOutputDataTypes
virtual int32_t getOutputDataTypes(DataType *outputTypes, int32_t nbOutputs, const DataType *inputTypes, int32_t nbInputs) const noexcept=0
如果输入张量具有提供的数据类型，则提供插件输出的数据类型。

nvinfer1::v_1_0::IPluginV3OneBuild::getInterfaceInfo
InterfaceInfo getInterfaceInfo() const noexcept override
返回与此接口关联的版本信息。应用程序不得覆盖此方法...
定义： NvInferRuntime.h:848

nvinfer1::v_1_0::IPluginV3OneBuild::getOutputShapes
virtual int32_t getOutputShapes(DimsExprs const *inputs, int32_t nbInputs, DimsExprs const *shapeInputs, int32_t nbShapeInputs, DimsExprs *outputs, int32_t nbOutputs, IExprBuilder &exprBuilder) noexcept=0
提供用于从输入张量的维度计算输出张量维度的表达式...

nvinfer1::v_1_0::IPluginV3OneBuild::getValidTactics
virtual int32_t getValidTactics(int32_t *tactics, int32_t nbTactics) noexcept
查询插件打算使用的任何自定义策略。
定义： NvInferRuntime.h:1007

nvinfer1::v_1_0::IPluginV3OneCore
定义： NvInferRuntime.h:793

nvinfer1::v_1_0::IPluginV3OneCore::getInterfaceInfo
InterfaceInfo getInterfaceInfo() const noexcept override
返回与此接口关联的版本信息。应用程序不得覆盖此方法...
定义： NvInferRuntime.h:798

nvinfer1::v_1_0::IPluginV3OneCore::getPluginName
virtual AsciiChar const * getPluginName() const noexcept=0
返回插件名称。应与相应插件创建器返回的插件名称匹配。

nvinfer1::v_1_0::IPluginV3OneRuntime
定义： NvInferRuntime.h:1057

nvinfer1::v_1_0::IPluginV3OneRuntime::getInterfaceInfo
InterfaceInfo getInterfaceInfo() const noexcept override
返回与此接口关联的版本信息。应用程序不得覆盖此方法...
定义： NvInferRuntime.h:1062

nvinfer1::v_1_0::IPluginV3OneRuntime::onShapeChange
virtual int32_t onShapeChange(PluginTensorDesc const *in, int32_t nbInputs, PluginTensorDesc const *out, int32_t nbOutputs) noexcept=0
当插件正在准备针对特定维度执行时调用。这可能会多次发生...

nvinfer1::v_1_0::IPluginV3OneRuntime::getFieldsToSerialize
virtual PluginFieldCollection const * getFieldsToSerialize() noexcept=0
获取应序列化的插件字段。

nvinfer1::v_1_0::IPluginV3OneRuntime::setTactic
virtual int32_t setTactic(int32_t tactic) noexcept
设置要在后续 enqueue() 调用中使用的策略。如果没有通告自定义策略，...
定义： NvInferRuntime.h:1074

nvinfer1::v_1_0::IPluginV3OneRuntime::enqueue
virtual int32_t enqueue(PluginTensorDesc const *inputDesc, PluginTensorDesc const *outputDesc, void const *const *inputs, void *const *outputs, void *workspace, cudaStream_t stream) noexcept=0
执行层。

nvinfer1::v_1_0::IPluginV3OneRuntime::attachToContext
virtual IPluginV3 * attachToContext(IPluginResourceContext *context) noexcept=0
克隆插件，将克隆的插件对象附加到执行上下文，并授予克隆的插件 ...

nvinfer1::v_1_0::IProfiler
定义： NvInferRuntime.h:1245

nvinfer1::v_1_0::IProfiler::~IProfiler
virtual ~IProfiler() noexcept
定义： NvInferRuntime.h:1256

nvinfer1::v_1_0::IProfiler::reportLayerTime
virtual void reportLayerTime(char const *layerName, float ms) noexcept=0
层时间报告回调。

nvinfer1::v_1_0::IStreamReader
定义： NvInferRuntime.h:631

nvinfer1::v_1_0::IStreamReader::~IStreamReader
~IStreamReader() override=default

nvinfer1::v_1_0::IStreamReader::operator=
IStreamReader & operator=(IStreamReader const &) &=default

nvinfer1::v_1_0::IStreamReader::operator=
IStreamReader & operator=(IStreamReader &&) &=default

nvinfer1::v_1_0::IStreamReader::read
virtual int64_t read(void *destination, int64_t nbBytes)=0
读取流中的下一个字节数。

nvinfer1::v_1_0::IStreamReader::IStreamReader
IStreamReader(IStreamReader &&)=default

nvinfer1::v_1_0::IStreamReader::IStreamReader
IStreamReader(IStreamReader const &)=default

nvinfer1::v_1_0::IStreamReader::IStreamReader
IStreamReader()=default

nvinfer1::v_1_0::IStreamReader::getInterfaceInfo
InterfaceInfo getInterfaceInfo() const noexcept override
返回与此接口关联的版本信息。应用程序不得覆盖此方法...
定义： NvInferRuntime.h:643

nvinfer1::v_1_0::IStreamReaderV2
定义： NvInferRuntime.h:695

nvinfer1::v_1_0::IStreamReaderV2::operator=
IStreamReaderV2 & operator=(IStreamReaderV2 const &) &=default

nvinfer1::v_1_0::IStreamReaderV2::getInterfaceInfo
InterfaceInfo getInterfaceInfo() const noexcept override
返回与此接口关联的版本信息。应用程序不得覆盖此方法...
定义： NvInferRuntime.h:707

nvinfer1::v_1_0::IStreamReaderV2::IStreamReaderV2
IStreamReaderV2(IStreamReaderV2 &&)=default

nvinfer1::v_1_0::IStreamReaderV2::~IStreamReaderV2
~IStreamReaderV2() override=default

nvinfer1::v_1_0::IStreamReaderV2::read
virtual int64_t read(void *destination, int64_t nbBytes, cudaStream_t stream) noexcept=0
异步读取流中的下一个字节数。

nvinfer1::v_1_0::IStreamReaderV2::IStreamReaderV2
IStreamReaderV2()=default

nvinfer1::v_1_0::IStreamReaderV2::IStreamReaderV2
IStreamReaderV2(IStreamReaderV2 const &)=default

nvinfer1::v_1_0::IStreamReaderV2::seek
virtual bool seek(int64_t offset, SeekPosition where) noexcept=0
将流的位置设置为给定的偏移量。

nvinfer1::v_1_0::IStreamReaderV2::operator=
IStreamReaderV2 & operator=(IStreamReaderV2 &&) &=default

nvinfer1::v_2_0::IPluginV3OneBuild
定义： NvInferRuntime.h:1154

nvinfer1::v_2_0::IPluginV3OneBuild::getAliasedInput
virtual int32_t getAliasedInput(int32_t outputIndex) noexcept
告知 TensorRT 指定输出索引处的输出是返回索引处输入的别名...
定义： NvInferRuntime.h:1190

nvinfer1::v_2_0::IPluginV3OneBuild::getInterfaceInfo
InterfaceInfo getInterfaceInfo() const noexcept override
返回与此接口关联的版本信息。应用程序不得覆盖此方法...
定义： NvInferRuntime.h:1156

nvinfer1::anonymous_namespace{NvInferRuntime.h}::createInferRefitter
IRefitter * createInferRefitter(ICudaEngine &engine, ILogger &logger) noexcept
创建 IRefitter 类的实例。
定义： NvInferRuntime.h:5097

nvinfer1::anonymous_namespace{NvInferRuntime.h}::createInferRuntime
IRuntime * createInferRuntime(ILogger &logger) noexcept
创建 IRuntime 类的实例。
定义： NvInferRuntime.h:5087

nvinfer1
TensorRT API 版本 1 的命名空间。

nvinfer1::ErrorCode::kINTERNAL_ERROR
@ kINTERNAL_ERROR

nvinfer1::TacticSources
uint32_t TacticSources
表示一个或多个 TacticSource 值的集合，使用按位或运算组合。
定义： NvInferRuntime.h:2832

nvinfer1::IOutputAllocator
v_1_0::IOutputAllocator IOutputAllocator
定义： NvInferRuntime.h:3967

nvinfer1::EngineCapability
EngineCapability
支持的引擎能力流程列表。
定义： NvInferRuntime.h:76

nvinfer1::EngineCapability::kSAFETY
@ kSAFETY

nvinfer1::EngineCapability::kSTANDARD
@ kSTANDARD

nvinfer1::EngineCapability::kDLA_STANDALONE
@ kDLA_STANDALONE

nvinfer1::DimensionOperation
DimensionOperation
对两个 IDimensionExpr 的操作，IDimensionExpr 表示维度计算中使用的整数表达式...
定义： NvInferRuntime.h:179

nvinfer1::DimensionOperation::kSUB
@ kSUB
从第一个元素中减去第二个元素。

nvinfer1::DimensionOperation::kSUM
@ kSUM
两个操作数的和。

nvinfer1::DimensionOperation::kPROD
@ kPROD
两个操作数的积。

nvinfer1::DimensionOperation::kFLOOR_DIV
@ kFLOOR_DIV
第一个元素除以第二个元素的向下取整除法。

nvinfer1::DimensionOperation::kEQUAL
@ kEQUAL
如果操作数相等，则为 1，否则为 0。

nvinfer1::DimensionOperation::kMIN
@ kMIN
两个操作数的最小值。

nvinfer1::DimensionOperation::kLESS
@ kLESS
如果第一个操作数小于第二个操作数，则为 1，否则为 0。

nvinfer1::DimensionOperation::kMAX
@ kMAX
两个操作数的最大值。

nvinfer1::DimensionOperation::kCEIL_DIV
@ kCEIL_DIV
向上取整除法。

nvinfer1::IPluginV3OneCore
v_1_0::IPluginV3OneCore IPluginV3OneCore
定义： NvInferRuntime.h:1207

nvinfer1::TensorIOMode
TensorIOMode
张量 IO 模式的定义。
定义： NvInferRuntimeBase.h:643

nvinfer1::HardwareCompatibilityLevel
HardwareCompatibilityLevel
描述与 GPU 架构兼容性的要求，该架构不同于执行构建的 GPU 架构...
定义： NvInfer.h:9203

nvinfer1::SerializationFlag
SerializationFlag
引擎在序列化字节时可以启用的有效标志列表。
定义： NvInferRuntime.h:2873

nvinfer1::SerializationFlag::kEXCLUDE_WEIGHTS
@ kEXCLUDE_WEIGHTS
排除可以重新拟合的权重。

nvinfer1::IProfiler
v_1_0::IProfiler IProfiler
定义： NvInferRuntime.h:1271

nvinfer1::SeekPosition
SeekPosition
控制 IStreamReaderV2 的查找模式。
定义： NvInferRuntime.h:681

nvinfer1::SeekPosition::kSET
@ kSET
从文件开头开始。

nvinfer1::SeekPosition::kCUR
@ kCUR
从文件的当前位置开始。

nvinfer1::SeekPosition::kEND
@ kEND
从文件末尾开始。

nvinfer1::IStreamReaderV2
v_1_0::IStreamReaderV2 IStreamReaderV2
定义： NvInferRuntime.h:751

nvinfer1::TempfileControlFlags
uint32_t TempfileControlFlags
表示一个或多个 TempfileControlFlag 值的集合，使用按位或运算组合...
定义： NvInferRuntime.h:1349

nvinfer1::IGpuAllocator
v_1_0::IGpuAllocator IGpuAllocator
定义： NvInferRuntime.h:1807

nvinfer1::EnumMax< WeightsRole >
constexpr int32_t EnumMax< WeightsRole >() noexcept
WeightsRole 枚举中元素的最大数量。
定义： NvInferRuntime.h:1292

nvinfer1::AsciiChar
char_t AsciiChar
定义： NvInferRuntimeBase.h:105

nvinfer1::TensorRTPhase
TensorRTPhase
指示 TensorRT 的操作阶段。
定义： NvInferPluginBase.h:116

nvinfer1::PluginVersion::kV2_DYNAMICEXT
@ kV2_DYNAMICEXT
IPluginV2DynamicExt。

nvinfer1::EnumMax< LayerInformationFormat >
constexpr int32_t EnumMax< LayerInformationFormat >() noexcept
定义： NvInferRuntime.h:4911

nvinfer1::DataType
DataType
权重和张量的类型。
定义： NvInferRuntimeBase.h:133

nvinfer1::DeviceType
DeviceType
此层/网络将在其上执行的设备。
定义： NvInferRuntime.h:1303

nvinfer1::DeviceType::kGPU
@ kGPU
GPU 设备。

nvinfer1::DeviceType::kDLA
@ kDLA
DLA 核心。

nvinfer1::LayerType::kSCALE
@ kSCALE
Scale 层。

nvinfer1::LayerType::kCONSTANT
@ kCONSTANT
Constant 层。

nvinfer1::IDebugListener
v_1_0::IDebugListener IDebugListener
定义： NvInferRuntime.h:4008

nvinfer1::TempfileControlFlag
TempfileControlFlag
用于控制 TensorRT 在创建可执行临时文件时的行为的标志。
定义： NvInferRuntime.h:1326

nvinfer1::TempfileControlFlag::kALLOW_TEMPORARY_FILES
@ kALLOW_TEMPORARY_FILES

nvinfer1::TempfileControlFlag::kALLOW_IN_MEMORY_FILES
@ kALLOW_IN_MEMORY_FILES
允许在内存中（或未命名的文件）创建和加载文件。

nvinfer1::EnumMax< OptProfileSelector >
constexpr int32_t EnumMax< OptProfileSelector >() noexcept
OptProfileSelector 枚举的不同值的数量。
定义： NvInferRuntime.h:2588

nvinfer1::WeightsRole
WeightsRole
层如何使用特定的 Weights。
定义： NvInferRuntime.h:1281

nvinfer1::WeightsRole::kSHIFT
@ kSHIFT
IScaleLayer 的 shift 部分。

nvinfer1::WeightsRole::kANY
@ kANY
任何其他权重角色。

nvinfer1::WeightsRole::kBIAS
@ kBIAS
IConvolutionLayer 或 IDeconvolutionLayer 的 bias。

nvinfer1::WeightsRole::kKERNEL
@ kKERNEL
IConvolutionLayer 或 IDeconvolutionLayer 的 kernel。

nvinfer1::EnumMax< ProfilingVerbosity >
constexpr int32_t EnumMax< ProfilingVerbosity >() noexcept
ProfilingVerbosity 枚举中性能分析详细级别的最大数量。
定义： NvInferRuntime.h:2852

nvinfer1::ProfilingVerbosity
ProfilingVerbosity
NVTX 注释和 IEngineInspector 中公开的层信息的详细级别列表。
定义： NvInferRuntime.h:2844

nvinfer1::ProfilingVerbosity::kLAYER_NAMES_ONLY
@ kLAYER_NAMES_ONLY
仅打印层名称。这是默认设置。

nvinfer1::ProfilingVerbosity::kDETAILED
@ kDETAILED
打印详细的层信息，包括层名称和层参数。

nvinfer1::TacticSource
TacticSource
TensorRT 的 tactic sources 列表。
定义： NvInferRuntime.h:2795

nvinfer1::TacticSource::kCUBLAS_LT
@ kCUBLAS_LT

nvinfer1::TacticSource::kEDGE_MASK_CONVOLUTIONS
@ kEDGE_MASK_CONVOLUTIONS

nvinfer1::TacticSource::kCUDNN
@ kCUDNN

nvinfer1::TacticSource::kJIT_CONVOLUTIONS
@ kJIT_CONVOLUTIONS

nvinfer1::TacticSource::kCUBLAS
@ kCUBLAS

nvinfer1::PluginFormat
TensorFormat PluginFormat
PluginFormat 保留用于向后兼容性。
定义： NvInferRuntimePlugin.h:54

nvinfer1::IPluginV3OneRuntime
v_1_0::IPluginV3OneRuntime IPluginV3OneRuntime
定义： NvInferRuntime.h:1231

nvinfer1::ElementWiseOperation::kMIN
@ kMIN
两个元素的最小值。

nvinfer1::EnumMax< TempfileControlFlag >
constexpr int32_t EnumMax< TempfileControlFlag >() noexcept
TempfileControlFlag 枚举中元素的最大数量。
定义： NvInferRuntime.h:1338

nvinfer1::SerializationFlags
uint32_t SerializationFlags
表示一个或多个 SerializationFlag 值，使用二进制 OR 运算，例如，1U << Serialization...
定义： NvInferRuntime.h:2863

nvinfer1::InterpolationMode::kLINEAR
@ kLINEAR
支持线性 (1D)、双线性 (2D) 和三线性 (3D) 插值。

nvinfer1::IPluginV3OneBuild
v_1_0::IPluginV3OneBuild IPluginV3OneBuild
定义： NvInferRuntime.h:1219

nvinfer1::BuilderFlag::kEXCLUDE_LEAN_RUNTIME
@ kEXCLUDE_LEAN_RUNTIME

nvinfer1::TensorFormat
TensorFormat
输入/输出张量的格式。
定义： NvInferRuntime.h:1382

nvinfer1::TensorFormat::kCHW4
@ kCHW4

nvinfer1::TensorFormat::kDHWC
@ kDHWC

nvinfer1::TensorFormat::kHWC16
@ kHWC16

nvinfer1::TensorFormat::kDHWC8
@ kDHWC8

nvinfer1::TensorFormat::kDLA_LINEAR
@ kDLA_LINEAR

nvinfer1::TensorFormat::kCDHW32
@ kCDHW32

nvinfer1::TensorFormat::kDLA_HWC4
@ kDLA_HWC4

nvinfer1::TensorFormat::kCHW16
@ kCHW16

nvinfer1::TensorFormat::kHWC
@ kHWC

nvinfer1::TensorFormat::kCHW2
@ kCHW2

nvinfer1::TensorFormat::kHWC8
@ kHWC8

nvinfer1::TensorFormat::kCHW32
@ kCHW32

nvinfer1::ExecutionContextAllocationStrategy
ExecutionContextAllocationStrategy
IExecutionContext 的不同内存分配行为。
定义： NvInferRuntime.h:2977

nvinfer1::ExecutionContextAllocationStrategy::kSTATIC
@ kSTATIC
跨所有配置文件的最大尺寸的默认静态分配。

nvinfer1::ExecutionContextAllocationStrategy::kUSER_MANAGED
@ kUSER_MANAGED
用户为执行上下文提供自定义分配。

nvinfer1::ExecutionContextAllocationStrategy::kON_PROFILE_CHANGE
@ kON_PROFILE_CHANGE
在选择配置文件时重新分配。

nvinfer1::EnumMax< TacticSource >
constexpr int32_t EnumMax< TacticSource >() noexcept
TacticSource 枚举中 tactic sources 的最大数量。
定义： NvInferRuntime.h:2821

nvinfer1::LayerInformationFormat
LayerInformationFormat
IEngineInspector 打印层信息的格式。
定义： NvInferRuntime.h:4903

nvinfer1::LayerInformationFormat::kJSON
@ kJSON
以 JSON 格式打印层信息。

nvinfer1::LayerInformationFormat::kONELINE
@ kONELINE
每层打印一行层信息。

nvinfer1::MatrixOperation::kNONE
@ kNONE

nvinfer1::IStreamReader
v_1_0::IStreamReader IStreamReader
定义： NvInferRuntime.h:674

nvinfer1::AllocatorFlag
AllocatorFlag
允许的内存分配类型。
定义： NvInferRuntime.h:1506

nvinfer1::AllocatorFlag::kRESIZABLE
@ kRESIZABLE
TensorRT 可能会对此分配调用 realloc()。

nvinfer1::PoolingType::kMAX
@ kMAX
元素的最大值。

nvinfer1::EnumMax< DeviceType >
constexpr int32_t EnumMax< DeviceType >() noexcept
DeviceType 枚举中元素的最大数量。
定义： NvInferRuntime.h:1310

nvinfer1::EnumMax< DimensionOperation >
constexpr int32_t EnumMax< DimensionOperation >() noexcept
DimensionOperation 枚举中元素的最大数量。
定义： NvInferRuntime.h:193

nvinfer1::EnumMax< ExecutionContextAllocationStrategy >
constexpr int32_t EnumMax< ExecutionContextAllocationStrategy >() noexcept
ExecutionContextAllocationStrategy 枚举中内存分配策略的最大数量。
定义： NvInferRuntime.h:2989

nvinfer1::EnumMax< SerializationFlag >
constexpr int32_t EnumMax< SerializationFlag >() noexcept
SerializationFlag 枚举中序列化标志的最大数量。
定义： NvInferRuntime.h:2880

nvinfer1::TensorLocation
TensorLocation
张量数据存储的位置，设备或主机。
定义： NvInferRuntime.h:204

nvinfer1::TensorLocation::kHOST
@ kHOST
数据存储在主机上。

nvinfer1::TensorLocation::kDEVICE
@ kDEVICE
数据存储在设备上。

nvinfer1::OptProfileSelector
OptProfileSelector
在设置或查询优化配置文件参数时（例如 shape tensor inputs 或动态维度...
定义： NvInferRuntime.h:2576

nvinfer1::OptProfileSelector::kOPT
@ kOPT
这用于设置或获取在优化（内核选择）中使用的值。

nvinfer1::AllocatorFlags
uint32_t AllocatorFlags
定义： NvInferRuntime.h:1522

nvinfer1::DynamicPluginTensorDesc
概述插件可能看到的输入或输出张量。
定义： NvInferRuntime.h:362

nvinfer1::DynamicPluginTensorDesc::min
Dims min
张量维度的下限。
定义： NvInferRuntime.h:367

nvinfer1::DynamicPluginTensorDesc::max
Dims max
张量维度的上限。
定义： NvInferRuntime.h:370

nvinfer1::DynamicPluginTensorDesc::opt
Dims opt
为自动调整指定的张量维度的最佳值。
定义： NvInferRuntime.h:373

nvinfer1::DynamicPluginTensorDesc::desc
PluginTensorDesc desc
解释张量数据指针所需的信息，但 desc.dims 在动态维度的位置上为 -1...
定义： NvInferRuntime.h:364

nvinfer1::PluginFieldCollection
插件字段集合结构体。
定义： NvInferPluginBase.h:103

nvinfer1::PluginTensorDesc
插件可能看到的、描述某个输入或输出的字段。
定义： NvInferRuntimePlugin.h:73

nvinfer1::impl::EnumMaxImpl
EnumMaxImpl 结构体的声明，用于存储枚举类型中元素的最大数量。
定义： NvInferRuntimeBase.h:118