@@ -152,7 +152,7 @@ compdb -p build list > compile_commands.json
152152# func.func private @cuda_shim_stream_destroy(i64)
153153# func.func private @cuda_shim_free(i64, i64)
154154# func.func private @cuda_shim_stream_synchronize(i64)
155- # func.func private @cuda_shim_launch_block_packed (i64, i64, i32, i32, i32, i64, i64, i64, i32)
155+ # func.func private @cuda_shim_launch_grid_packed(i64, i64, i32, i32, i32, i64, i64, i64, i32)
156156# func.func private @cuda_shim_memcpy_d2h(i64, i64, i64)
157157# func.func private @cuda_shim_memcpy_h2d(i64, i64, i64)
158158# func.func private @cuda_shim_malloc(i64, i64, i1) -> i64
@@ -255,7 +255,7 @@ compdb -p build list > compile_commands.json
255255# %14 = arith.index_cast %intptr_27 : index to i64
256256# %intptr_28 = memref.extract_aligned_pointer_as_index %alloc_22 : memref<4xi64> -> index
257257# %15 = arith.index_cast %intptr_28 : index to i64
258- # call @cuda_shim_launch_block_packed (%4, %3, %c8_i32, %c1_i32, %c1_i32, %5, %14, %15, %c4_i32) : (i64, i64, i32, i32, i32, i64, i64, i64, i32) -> ()
258+ # call @cuda_shim_launch_grid_packed(%4, %3, %c8_i32, %c1_i32, %c1_i32, %5, %14, %15, %c4_i32) : (i64, i64, i32, i32, i32, i64, i64, i64, i32) -> ()
259259# call @cuda_shim_stream_synchronize(%5) : (i64) -> ()
260260# call @cuda_shim_memcpy_d2h(%13, %12, %c32_i64) : (i64, i64, i64) -> ()
261261# memref.dealloc %alloc_21 : memref<4xi64>
@@ -292,7 +292,7 @@ compdb -p build list > compile_commands.json
292292# llvm.func @cuda_shim_stream_destroy(i64) attributes {sym_visibility = "private"}
293293# llvm.func @cuda_shim_free(i64, i64) attributes {sym_visibility = "private"}
294294# llvm.func @cuda_shim_stream_synchronize(i64) attributes {sym_visibility = "private"}
295- # llvm.func @cuda_shim_launch_block_packed (i64, i64, i32, i32, i32, i64, i64, i64, i32) attributes {sym_visibility = "private"}
295+ # llvm.func @cuda_shim_launch_grid_packed(i64, i64, i32, i32, i32, i64, i64, i64, i32) attributes {sym_visibility = "private"}
296296# llvm.func @cuda_shim_memcpy_d2h(i64, i64, i64) attributes {sym_visibility = "private"}
297297# llvm.func @cuda_shim_memcpy_h2d(i64, i64, i64) attributes {sym_visibility = "private"}
298298# llvm.func @cuda_shim_malloc(i64, i64, i1) -> i64 attributes {sym_visibility = "private"}
@@ -350,7 +350,7 @@ compdb -p build list > compile_commands.json
350350# !10 = !DISubprogram(name: "cuda_shim_stream_destroy", linkageName: "cuda_shim_stream_destroy", scope: !9, file: !9, line: 1, type: !4, scopeLine: 1, spFlags: DISPFlagOptimized)
351351# !11 = !DISubprogram(name: "cuda_shim_free", linkageName: "cuda_shim_free", scope: !9, file: !9, line: 1, type: !4, scopeLine: 1, spFlags: DISPFlagOptimized)
352352# !12 = !DISubprogram(name: "cuda_shim_stream_synchronize", linkageName: "cuda_shim_stream_synchronize", scope: !9, file: !9, line: 1, type: !4, scopeLine: 1, spFlags: DISPFlagOptimized)
353- # !13 = !DISubprogram(name: "cuda_shim_launch_block_packed ", linkageName: "cuda_shim_launch_block_packed ", scope: !9, file: !9, line: 1, type: !4, scopeLine: 1, spFlags: DISPFlagOptimized)
353+ # !13 = !DISubprogram(name: "cuda_shim_launch_grid_packed", linkageName: "cuda_shim_launch_grid_packed", scope: !9, file: !9, line: 1, type: !4, scopeLine: 1, spFlags: DISPFlagOptimized)
354354# !14 = !DISubprogram(name: "cuda_shim_memcpy_d2h", linkageName: "cuda_shim_memcpy_d2h", scope: !9, file: !9, line: 1, type: !4, scopeLine: 1, spFlags: DISPFlagOptimized)
355355# !15 = !DISubprogram(name: "cuda_shim_memcpy_h2d", linkageName: "cuda_shim_memcpy_h2d", scope: !9, file: !9, line: 1, type: !4, scopeLine: 1, spFlags: DISPFlagOptimized)
356356# !16 = !DISubprogram(name: "cuda_shim_malloc", linkageName: "cuda_shim_malloc", scope: !9, file: !9, line: 1, type: !4, scopeLine: 1, spFlags: DISPFlagOptimized)
0 commit comments