#ifndef _YOLO_LAYER_H #define _YOLO_LAYER_H #include #include #include #include "macros.h" namespace Yolo { static constexpr int CHECK_COUNT = 3; static constexpr float IGNORE_THRESH = 0.1f; struct YoloKernel { int width; int height; float anchors[CHECK_COUNT * 2]; }; static constexpr int MAX_OUTPUT_BBOX_COUNT = 1000; static constexpr int CLASS_NUM = 3; static constexpr int INPUT_H = 640; // yolov5's input height and width must be divisible by 32. static constexpr int INPUT_W = 640; static constexpr int LOCATIONS = 4; struct alignas(float) Detection { //center_x center_y w h float bbox[LOCATIONS]; float conf; // bbox_conf * cls_conf float class_id; }; } namespace nvinfer1 { class API YoloLayerPlugin : public IPluginV2IOExt { public: YoloLayerPlugin(int classCount, int netWidth, int netHeight, int maxOut, const std::vector& vYoloKernel); YoloLayerPlugin(const void* data, size_t length); ~YoloLayerPlugin(); int getNbOutputs() const TRT_NOEXCEPT override { return 1; } Dims getOutputDimensions(int index, const Dims* inputs, int nbInputDims) TRT_NOEXCEPT override; int initialize() TRT_NOEXCEPT override; virtual void terminate() TRT_NOEXCEPT override {}; virtual size_t getWorkspaceSize(int maxBatchSize) const TRT_NOEXCEPT override { return 0; } virtual int enqueue(int batchSize, const void* const* inputs, void*TRT_CONST_ENQUEUE* outputs, void* workspace, cudaStream_t stream) TRT_NOEXCEPT override; virtual size_t getSerializationSize() const TRT_NOEXCEPT override; virtual void serialize(void* buffer) const TRT_NOEXCEPT override; bool supportsFormatCombination(int pos, const PluginTensorDesc* inOut, int nbInputs, int nbOutputs) const TRT_NOEXCEPT override { return inOut[pos].format == TensorFormat::kLINEAR && inOut[pos].type == DataType::kFLOAT; } const char* getPluginType() const TRT_NOEXCEPT override; const char* getPluginVersion() const TRT_NOEXCEPT override; void destroy() TRT_NOEXCEPT override; IPluginV2IOExt* clone() const TRT_NOEXCEPT override; void setPluginNamespace(const char* pluginNamespace) TRT_NOEXCEPT override; const char* getPluginNamespace() const TRT_NOEXCEPT override; DataType getOutputDataType(int index, const nvinfer1::DataType* inputTypes, int nbInputs) const TRT_NOEXCEPT override; bool isOutputBroadcastAcrossBatch(int outputIndex, const bool* inputIsBroadcasted, int nbInputs) const TRT_NOEXCEPT override; bool canBroadcastInputAcrossBatch(int inputIndex) const TRT_NOEXCEPT override; void attachToContext( cudnnContext* cudnnContext, cublasContext* cublasContext, IGpuAllocator* gpuAllocator) TRT_NOEXCEPT override; void configurePlugin(const PluginTensorDesc* in, int nbInput, const PluginTensorDesc* out, int nbOutput) TRT_NOEXCEPT override; void detachFromContext() TRT_NOEXCEPT override; private: void forwardGpu(const float* const* inputs, float *output, cudaStream_t stream, int batchSize = 1); int mThreadCount = 256; const char* mPluginNamespace; int mKernelCount; int mClassCount; int mYoloV5NetWidth; int mYoloV5NetHeight; int mMaxOutObject; std::vector mYoloKernel; void** mAnchor; }; class API YoloPluginCreator : public IPluginCreator { public: YoloPluginCreator(); ~YoloPluginCreator() override = default; const char* getPluginName() const TRT_NOEXCEPT override; const char* getPluginVersion() const TRT_NOEXCEPT override; const PluginFieldCollection* getFieldNames() TRT_NOEXCEPT override; IPluginV2IOExt* createPlugin(const char* name, const PluginFieldCollection* fc) TRT_NOEXCEPT override; IPluginV2IOExt* deserializePlugin(const char* name, const void* serialData, size_t serialLength) TRT_NOEXCEPT override; void setPluginNamespace(const char* libNamespace) TRT_NOEXCEPT override { mNamespace = libNamespace; } const char* getPluginNamespace() const TRT_NOEXCEPT override { return mNamespace.c_str(); } private: std::string mNamespace; static PluginFieldCollection mFC; static std::vector mPluginAttributes; }; REGISTER_TENSORRT_PLUGIN(YoloPluginCreator); }; #endif // _YOLO_LAYER_H