fix void pointer arithmetic (#98)
parent
b8217d8243
commit
067b915383
|
@@ -62,15 +62,15 @@ int TRTInstanceNormalization::enqueue(
   int elem_size = getElementSize(inputDesc[1].type);

   void* n_scales = (void*)workspace;
-  void* n_bias = (void*)(workspace + getAlignedSize(n * c * elem_size));
+  void* n_bias = (void*)((char*)workspace + getAlignedSize(n * c * elem_size));

   const void* scales = (const void*)inputs[1];
   const void* bias = (const void*)inputs[2];

   for (int i = 0; i < n; ++i) {
-    cudaMemcpyAsync(n_scales + i * c * elem_size, scales, c * elem_size,
+    cudaMemcpyAsync((char*)n_scales + i * c * elem_size, scales, c * elem_size,
                     cudaMemcpyDeviceToDevice, stream);
-    cudaMemcpyAsync(n_bias + i * c * elem_size, bias, c * elem_size,
+    cudaMemcpyAsync((char*)n_bias + i * c * elem_size, bias, c * elem_size,
                     cudaMemcpyDeviceToDevice, stream);
   }

@@ -113,7 +113,7 @@ int TRTRoIAlign::enqueue(const nvinfer1::PluginTensorDesc *inputDesc,
   switch (mPoolMode) {
     case 0: // max
       argmax_y = workSpace;
-      argmax_x = argmax_y + output_size * word_size;
+      argmax_x = (char *)argmax_y + output_size * word_size;
       break;
     case 1: // avg
       break;
Loading…
Reference in New Issue