@@ -83,7 +83,7 @@ fn make_for_array_u64(len: usize) -> FoRArray {
8383/// Launches FoR decompression kernel and returns elapsed GPU time in seconds.
8484fn launch_for_kernel_timed_u8 (
8585 for_array : & FoRArray ,
86- device_data : cudarc:: driver:: CudaSlice < u8 > ,
86+ device_data : & cudarc:: driver:: CudaSlice < u8 > ,
8787 reference : u8 ,
8888 cuda_ctx : & mut CudaExecutionCtx ,
8989) -> vortex_error:: VortexResult < Duration > {
@@ -93,7 +93,7 @@ fn launch_for_kernel_timed_u8(
9393 execution_ctx: cuda_ctx,
9494 module: "for" ,
9595 ptypes: & [ for_array. ptype( ) ] ,
96- launch_args: [ device_data, reference, array_len_u64] ,
96+ launch_args: [ * device_data, reference, array_len_u64] ,
9797 event_recording: CU_EVENT_BLOCKING_SYNC ,
9898 array_len: for_array. len( )
9999 ) ;
@@ -109,7 +109,7 @@ fn launch_for_kernel_timed_u8(
109109/// Launches FoR decompression kernel and returns elapsed GPU time in seconds.
110110fn launch_for_kernel_timed_u16 (
111111 for_array : & FoRArray ,
112- device_data : cudarc:: driver:: CudaSlice < u16 > ,
112+ device_data : & cudarc:: driver:: CudaSlice < u16 > ,
113113 reference : u16 ,
114114 cuda_ctx : & mut CudaExecutionCtx ,
115115) -> vortex_error:: VortexResult < Duration > {
@@ -119,7 +119,7 @@ fn launch_for_kernel_timed_u16(
119119 execution_ctx: cuda_ctx,
120120 module: "for" ,
121121 ptypes: & [ for_array. ptype( ) ] ,
122- launch_args: [ device_data, reference, array_len_u64] ,
122+ launch_args: [ * device_data, reference, array_len_u64] ,
123123 event_recording: CU_EVENT_BLOCKING_SYNC ,
124124 array_len: for_array. len( )
125125 ) ;
@@ -135,7 +135,7 @@ fn launch_for_kernel_timed_u16(
135135/// Launches FoR decompression kernel and returns elapsed GPU time in seconds.
136136fn launch_for_kernel_timed_u32 (
137137 for_array : & FoRArray ,
138- device_data : cudarc:: driver:: CudaSlice < u32 > ,
138+ device_data : & cudarc:: driver:: CudaSlice < u32 > ,
139139 reference : u32 ,
140140 cuda_ctx : & mut CudaExecutionCtx ,
141141) -> vortex_error:: VortexResult < Duration > {
@@ -145,7 +145,7 @@ fn launch_for_kernel_timed_u32(
145145 execution_ctx: cuda_ctx,
146146 module: "for" ,
147147 ptypes: & [ for_array. ptype( ) ] ,
148- launch_args: [ device_data, reference, array_len_u64] ,
148+ launch_args: [ * device_data, reference, array_len_u64] ,
149149 event_recording: CU_EVENT_BLOCKING_SYNC ,
150150 array_len: for_array. len( )
151151 ) ;
@@ -161,7 +161,7 @@ fn launch_for_kernel_timed_u32(
161161/// Launches FoR decompression kernel and returns elapsed GPU time in seconds.
162162fn launch_for_kernel_timed_u64 (
163163 for_array : & FoRArray ,
164- device_data : cudarc:: driver:: CudaSlice < u64 > ,
164+ device_data : & cudarc:: driver:: CudaSlice < u64 > ,
165165 reference : u64 ,
166166 cuda_ctx : & mut CudaExecutionCtx ,
167167) -> vortex_error:: VortexResult < Duration > {
@@ -171,7 +171,7 @@ fn launch_for_kernel_timed_u64(
171171 execution_ctx: cuda_ctx,
172172 module: "for" ,
173173 ptypes: & [ for_array. ptype( ) ] ,
174- launch_args: [ device_data, reference, array_len_u64] ,
174+ launch_args: [ * device_data, reference, array_len_u64] ,
175175 event_recording: CU_EVENT_BLOCKING_SYNC ,
176176 array_len: for_array. len( )
177177 ) ;
@@ -210,12 +210,12 @@ fn benchmark_for_u8(c: &mut Criterion) {
210210
211211 for _ in 0 ..iters {
212212 let device_data = cuda_ctx
213- . to_device ( unpacked_slice)
213+ . copy_buffer_to_device ( unpacked_slice)
214214 . vortex_expect ( "failed to copy to device" ) ;
215215
216216 let kernel_time = launch_for_kernel_timed_u8 (
217217 for_array,
218- device_data,
218+ device_data. cuda_slice ( ) ,
219219 reference,
220220 & mut cuda_ctx,
221221 )
@@ -259,12 +259,12 @@ fn benchmark_for_u16(c: &mut Criterion) {
259259
260260 for _ in 0 ..iters {
261261 let device_data = cuda_ctx
262- . to_device ( unpacked_slice)
262+ . copy_buffer_to_device ( unpacked_slice)
263263 . vortex_expect ( "failed to copy to device" ) ;
264264
265265 let kernel_time = launch_for_kernel_timed_u16 (
266266 for_array,
267- device_data,
267+ device_data. cuda_slice ( ) ,
268268 reference,
269269 & mut cuda_ctx,
270270 )
@@ -308,12 +308,12 @@ fn benchmark_for_u32(c: &mut Criterion) {
308308
309309 for _ in 0 ..iters {
310310 let device_data = cuda_ctx
311- . to_device ( unpacked_slice)
311+ . copy_buffer_to_device ( unpacked_slice)
312312 . vortex_expect ( "failed to copy to device" ) ;
313313
314314 let kernel_time = launch_for_kernel_timed_u32 (
315315 for_array,
316- device_data,
316+ device_data. cuda_slice ( ) ,
317317 reference,
318318 & mut cuda_ctx,
319319 )
@@ -357,12 +357,12 @@ fn benchmark_for_u64(c: &mut Criterion) {
357357
358358 for _ in 0 ..iters {
359359 let device_data = cuda_ctx
360- . to_device ( unpacked_slice)
360+ . copy_buffer_to_device ( unpacked_slice)
361361 . vortex_expect ( "failed to copy to device" ) ;
362362
363363 let kernel_time = launch_for_kernel_timed_u64 (
364364 for_array,
365- device_data,
365+ device_data. cuda_slice ( ) ,
366366 reference,
367367 & mut cuda_ctx,
368368 )
0 commit comments