DeepStream 7.0 update

This commit is contained in:
Marcos Luciano
2024-05-12 20:47:10 -03:00
parent 9bda315ee0
commit ef84cc048f
22 changed files with 1004 additions and 802 deletions

View File

@@ -35,8 +35,9 @@ __global__ void gpuRegionLayer(const float* input, float* softmax, float* boxes,
uint y_id = blockIdx.y * blockDim.y + threadIdx.y;
uint z_id = blockIdx.z * blockDim.z + threadIdx.z;
if (x_id >= gridSizeX || y_id >= gridSizeY || z_id >= numBBoxes)
if (x_id >= gridSizeX || y_id >= gridSizeY || z_id >= numBBoxes) {
return;
}
const int numGridCells = gridSizeX * gridSizeY;
const int bbindex = y_id * gridSizeX + x_id;
@@ -66,7 +67,7 @@ __global__ void gpuRegionLayer(const float* input, float* softmax, float* boxes,
}
}
int count = z_id * gridSizeX * gridSizeY + y_id * gridSizeY + x_id + lastInputSize;
int count = numGridCells * z_id + bbindex + lastInputSize;
boxes[count * 4 + 0] = xc;
boxes[count * 4 + 1] = yc;