@@ -223,7 +223,7 @@ __global__ void CompactVoxelsKernel(
223
223
compactedVoxelArray,
224
224
const at::PackedTensorAccessor32<int , 1 , at::RestrictPtrTraits>
225
225
voxelOccupied,
226
- const at::PackedTensorAccessor32<int , 1 , at::RestrictPtrTraits>
226
+ const at::PackedTensorAccessor32<long , 1 , at::RestrictPtrTraits>
227
227
voxelOccupiedScan,
228
228
uint numVoxels) {
229
229
uint id = blockIdx .x * blockDim .x + threadIdx .x ;
@@ -255,7 +255,7 @@ __global__ void GenerateFacesKernel(
255
255
at::PackedTensorAccessor<int64_t , 1 , at::RestrictPtrTraits> ids,
256
256
at::PackedTensorAccessor32<int , 1 , at::RestrictPtrTraits>
257
257
compactedVoxelArray,
258
- at::PackedTensorAccessor32<int , 1 , at::RestrictPtrTraits> numVertsScanned,
258
+ at::PackedTensorAccessor32<long , 1 , at::RestrictPtrTraits> numVertsScanned,
259
259
const uint activeVoxels,
260
260
const at::PackedTensorAccessor32<float , 3 , at::RestrictPtrTraits> vol,
261
261
const at::PackedTensorAccessor32<int , 2 , at::RestrictPtrTraits> faceTable,
@@ -471,7 +471,7 @@ std::tuple<at::Tensor, at::Tensor, at::Tensor> MarchingCubesCuda(
471
471
auto d_voxelOccupiedScan_ = d_voxelOccupiedScan.index ({Slice (1 , None)});
472
472
473
473
// number of active voxels
474
- int activeVoxels = d_voxelOccupiedScan[numVoxels].cpu ().item <int >();
474
+ int activeVoxels = d_voxelOccupiedScan[numVoxels].cpu ().item <long >();
475
475
476
476
const int device_id = vol.device ().index ();
477
477
auto opt = at::TensorOptions ().dtype (at::kInt ).device (at::kCUDA , device_id);
@@ -492,7 +492,7 @@ std::tuple<at::Tensor, at::Tensor, at::Tensor> MarchingCubesCuda(
492
492
CompactVoxelsKernel<<<grid, threads, 0 , stream>>> (
493
493
d_compVoxelArray.packed_accessor32 <int , 1 , at::RestrictPtrTraits>(),
494
494
d_voxelOccupied.packed_accessor32 <int , 1 , at::RestrictPtrTraits>(),
495
- d_voxelOccupiedScan_.packed_accessor32 <int , 1 , at::RestrictPtrTraits>(),
495
+ d_voxelOccupiedScan_.packed_accessor32 <long , 1 , at::RestrictPtrTraits>(),
496
496
numVoxels);
497
497
AT_CUDA_CHECK (cudaGetLastError ());
498
498
cudaDeviceSynchronize ();
@@ -502,7 +502,7 @@ std::tuple<at::Tensor, at::Tensor, at::Tensor> MarchingCubesCuda(
502
502
auto d_voxelVertsScan_ = d_voxelVertsScan.index ({Slice (1 , None)});
503
503
504
504
// total number of vertices
505
- int totalVerts = d_voxelVertsScan[numVoxels].cpu ().item <int >();
505
+ int totalVerts = d_voxelVertsScan[numVoxels].cpu ().item <long >();
506
506
507
507
// Execute "GenerateFacesKernel" kernel
508
508
// This runs only on the occupied voxels.
@@ -522,7 +522,7 @@ std::tuple<at::Tensor, at::Tensor, at::Tensor> MarchingCubesCuda(
522
522
faces.packed_accessor <int64_t , 2 , at::RestrictPtrTraits>(),
523
523
ids.packed_accessor <int64_t , 1 , at::RestrictPtrTraits>(),
524
524
d_compVoxelArray.packed_accessor32 <int , 1 , at::RestrictPtrTraits>(),
525
- d_voxelVertsScan_.packed_accessor32 <int , 1 , at::RestrictPtrTraits>(),
525
+ d_voxelVertsScan_.packed_accessor32 <long , 1 , at::RestrictPtrTraits>(),
526
526
activeVoxels,
527
527
vol.packed_accessor32 <float , 3 , at::RestrictPtrTraits>(),
528
528
faceTable.packed_accessor32 <int , 2 , at::RestrictPtrTraits>(),
0 commit comments