Add cudaFree of the input buffer to convertfp16tofloatCuda
This commit is contained in:
@@ -1631,5 +1631,6 @@ CudaMatrix Aurora::convertfp16tofloatCuda(short* aData, int aRows, int aColumns)
|
||||
cudaMalloc((void**)&output,size*sizeof(float));
|
||||
int blocksPerGrid = (size + THREADS_PER_BLOCK - 1) / THREADS_PER_BLOCK;
|
||||
convertValueKernel<<<blocksPerGrid, THREADS_PER_BLOCK>>>(input,output, size);
|
||||
cudaFree(input);
|
||||
return CudaMatrix::fromRawData(output, aRows, aColumns);
|
||||
}
|
||||
|
||||
Reference in New Issue
Block a user