Skip to content

Commit

Permalink
Fix yolo11-seg and yolo11-pose engines failing to run when batch size is set > 1
Browse files Browse the repository at this point in the history
  • Loading branch information
mpj1234 committed Dec 6, 2024
1 parent 62c1680 commit c0fbfcc
Showing 1 changed file with 5 additions and 0 deletions.
5 changes: 5 additions & 0 deletions yolo11/plugin/yololayer.cu
Original file line number Diff line number Diff line change
Expand Up @@ -251,6 +251,11 @@ __global__ void CalDetection(const float* input, float* output, int numElements,
void YoloLayerPlugin::forwardGpu(const float* const* inputs, float* output, cudaStream_t stream, int mYoloV8netHeight,
int mYoloV8NetWidth, int batchSize) {
int outputElem = 1 + mMaxOutObject * sizeof(Detection) / sizeof(float);
if (is_segmentation_) {
outputElem = mMaxOutObject * (sizeof(Detection) - sizeof(float) * 51) / sizeof(float) + 1;
} else if (is_pose_) {
outputElem = mMaxOutObject * (sizeof(Detection) - sizeof(float) * 32) / sizeof(float) + 1;
}
cudaMemsetAsync(output, 0, sizeof(float), stream);
for (int idx = 0; idx < batchSize; ++idx) {
CUDA_CHECK(cudaMemsetAsync(output + idx * outputElem, 0, sizeof(float), stream));
Expand Down

0 comments on commit c0fbfcc

Please sign in to comment.