107 lines
3.5 KiB
C++
107 lines
3.5 KiB
C++
#pragma once
|
|
|
|
#include "types.h"
|
|
#include "macros.h"
|
|
|
|
#include <vector>
|
|
#include <string>
|
|
|
|
namespace nvinfer1 {
|
|
/**
 * TensorRT plugin (IPluginV2IOExt) for the YOLO output layer.
 *
 * As declared here the plugin exposes exactly one output, needs no scratch
 * workspace, and only accepts linear-format float tensors. All other
 * behavior is implemented out of line.
 */
class API YoloLayerPlugin : public IPluginV2IOExt {
public:
    /**
     * Builds the plugin from explicit configuration values.
     *
     * NOTE(review): parameter meanings are inferred from their names
     * (class count, network input width/height, maximum number of output
     * objects, segmentation flag, per-scale kernel descriptions) -- confirm
     * against the implementation file.
     */
    YoloLayerPlugin(int classCount, int netWidth, int netHeight, int maxOut, bool is_segmentation, const std::vector<YoloKernel>& vYoloKernel);

    /**
     * Builds the plugin from a raw byte buffer of `length` bytes.
     * NOTE(review): presumably the buffer produced by serialize() -- confirm.
     */
    YoloLayerPlugin(const void* data, size_t length);

    ~YoloLayerPlugin();

    /** The layer always produces a single output tensor. */
    int getNbOutputs() const TRT_NOEXCEPT override { return 1; }

    Dims getOutputDimensions(int index, const Dims* inputs, int nbInputDims) TRT_NOEXCEPT override;

    int initialize() TRT_NOEXCEPT override;

    /** Nothing to release at terminate time. */
    void terminate() TRT_NOEXCEPT override {}

    /** No scratch workspace is requested, regardless of batch size. */
    size_t getWorkspaceSize(int maxBatchSize) const TRT_NOEXCEPT override { return 0; }

    int enqueue(int batchSize, const void* const* inputs, void* TRT_CONST_ENQUEUE* outputs, void* workspace, cudaStream_t stream) TRT_NOEXCEPT override;

    size_t getSerializationSize() const TRT_NOEXCEPT override;

    void serialize(void* buffer) const TRT_NOEXCEPT override;

    /**
     * Accepts a tensor slot only when it is linear-format FP32.
     * `nbInputs` / `nbOutputs` are not consulted.
     */
    bool supportsFormatCombination(int pos, const PluginTensorDesc* inOut, int nbInputs, int nbOutputs) const TRT_NOEXCEPT override {
        return inOut[pos].format == TensorFormat::kLINEAR && inOut[pos].type == DataType::kFLOAT;
    }

    const char* getPluginType() const TRT_NOEXCEPT override;

    const char* getPluginVersion() const TRT_NOEXCEPT override;

    void destroy() TRT_NOEXCEPT override;

    IPluginV2IOExt* clone() const TRT_NOEXCEPT override;

    void setPluginNamespace(const char* pluginNamespace) TRT_NOEXCEPT override;

    const char* getPluginNamespace() const TRT_NOEXCEPT override;

    DataType getOutputDataType(int index, const nvinfer1::DataType* inputTypes, int nbInputs) const TRT_NOEXCEPT override;

    bool isOutputBroadcastAcrossBatch(int outputIndex, const bool* inputIsBroadcasted, int nbInputs) const TRT_NOEXCEPT override;

    bool canBroadcastInputAcrossBatch(int inputIndex) const TRT_NOEXCEPT override;

    void attachToContext(
        cudnnContext* cudnnContext, cublasContext* cublasContext, IGpuAllocator* gpuAllocator) TRT_NOEXCEPT override;

    void configurePlugin(const PluginTensorDesc* in, int nbInput, const PluginTensorDesc* out, int nbOutput) TRT_NOEXCEPT override;

    void detachFromContext() TRT_NOEXCEPT override;

private:
    /**
     * GPU forward pass writing into `output` on `stream`.
     * NOTE(review): presumably called from enqueue() -- confirm.
     */
    void forwardGpu(const float* const* inputs, float* output, cudaStream_t stream, int batchSize = 1);

    // Every member carries an in-class default so that no pointer or scalar
    // is ever read in an indeterminate state; constructors are expected to
    // overwrite these with real values.

    int mThreadCount = 256;  // NOTE(review): presumably CUDA threads per block -- confirm.

    // Empty string rather than an indeterminate pointer, so a namespace query
    // made before setPluginNamespace() never dereferences garbage.
    const char* mPluginNamespace = "";

    int mKernelCount = 0;
    int mClassCount = 0;
    int mYoloV5NetWidth = 0;
    int mYoloV5NetHeight = 0;
    int mMaxOutObject = 0;
    bool is_segmentation_ = false;
    std::vector<YoloKernel> mYoloKernel;

    // NOTE(review): presumably an array of anchor buffers owned by the
    // plugin -- confirm allocation/free in the implementation file.
    void** mAnchor = nullptr;
};
|
|
|
|
/**
 * IPluginCreator implementation for the YOLO layer plugin.
 *
 * Holds the plugin namespace as an owned std::string; the remaining
 * creator entry points are implemented out of line.
 */
class API YoloPluginCreator : public IPluginCreator {
public:
    YoloPluginCreator();

    ~YoloPluginCreator() override = default;

    const char* getPluginName() const TRT_NOEXCEPT override;

    const char* getPluginVersion() const TRT_NOEXCEPT override;

    const PluginFieldCollection* getFieldNames() TRT_NOEXCEPT override;

    IPluginV2IOExt* createPlugin(const char* name, const PluginFieldCollection* fc) TRT_NOEXCEPT override;

    IPluginV2IOExt* deserializePlugin(const char* name, const void* serialData, size_t serialLength) TRT_NOEXCEPT override;

    /**
     * Stores a copy of the namespace string.
     *
     * A null pointer is treated as the empty namespace: assigning a null
     * `const char*` to std::string is undefined behavior, and this function
     * is declared non-throwing.
     */
    void setPluginNamespace(const char* libNamespace) TRT_NOEXCEPT override {
        mNamespace = (libNamespace != nullptr) ? libNamespace : "";
    }

    /**
     * Returns the stored namespace as a C string. The pointer stays valid
     * until the next setPluginNamespace() call or destruction of the creator.
     */
    const char* getPluginNamespace() const TRT_NOEXCEPT override {
        return mNamespace.c_str();
    }

private:
    std::string mNamespace;  // Owned copy of the namespace set by the caller.

    // Static storage shared by all creator instances; defined elsewhere.
    static PluginFieldCollection mFC;
    static std::vector<PluginField> mPluginAttributes;
};
|
|
// Hands YoloPluginCreator to the REGISTER_TENSORRT_PLUGIN macro.
// NOTE(review): the macro expansion is not visible here; presumably it
// defines a static registrar object, in which case including this header
// from several translation units would register the creator more than
// once -- confirm and consider moving this line into a single source file.
REGISTER_TENSORRT_PLUGIN(YoloPluginCreator);
|
|
};
|
|
|