@@ -214,47 +214,36 @@ func.func @tma_load_multicast5d(%tmaDescriptor: !llvm.ptr, %dest : !llvm.ptr<3>,
214214
215215// CHECK-LABEL: @tma_store_1d
216216func.func @tma_store_1d (%tmaDescriptor: !llvm.ptr , %src : !llvm.ptr <3 >, %crd0: i32 , %p : i1 ) {
217- // CHECK: llvm.inline_asm has_side_effects asm_dialect = att "cp.async.bulk.tensor.1d.global.shared::cta.bulk_group [$0, {$2} ], [$1];", "l,r,r"
218- nvvm.cp.async.bulk.tensor.global.shared.cta %tmaDescriptor , %src , box [%crd0 ] : !llvm.ptr , !llvm.ptr <3 >, i32
219217 // CHECK: llvm.inline_asm has_side_effects asm_dialect = att "@$3 cp.async.bulk.tensor.1d.global.shared::cta.bulk_group [$0, {$2} ], [$1];", "l,r,r,b"
220- nvvm.cp.async.bulk.tensor.global.shared.cta %tmaDescriptor , %src , box [%crd0 ], predicate =%p : !llvm.ptr , !llvm.ptr <3 >, i32 , i1
218+ nvvm.cp.async.bulk.tensor.global.shared.cta %tmaDescriptor , %src , box [%crd0 ], predicate =%p : !llvm.ptr , !llvm.ptr <3 >
221219 return
222220}
223221
224222// CHECK-LABEL: @tma_store_2d
225223func.func @tma_store_2d (%tmaDescriptor: !llvm.ptr , %src : !llvm.ptr <3 >, %crd0: i32 , %crd1: i32 , %p : i1 ) {
226- // CHECK: llvm.inline_asm has_side_effects asm_dialect = att "cp.async.bulk.tensor.2d.global.shared::cta.bulk_group [$0, {$2, $3} ], [$1];", "l,r,r,r"
227- nvvm.cp.async.bulk.tensor.global.shared.cta %tmaDescriptor , %src , box [%crd0 ,%crd1 ] : !llvm.ptr , !llvm.ptr <3 >, i32 , i32
228224 // CHECK: llvm.inline_asm has_side_effects asm_dialect = att "@$4 cp.async.bulk.tensor.2d.global.shared::cta.bulk_group [$0, {$2, $3} ], [$1];", "l,r,r,r,b"
229- nvvm.cp.async.bulk.tensor.global.shared.cta %tmaDescriptor , %src , box [%crd0 ,%crd1 ], predicate =%p : !llvm.ptr , !llvm.ptr <3 >, i32 , i32 , i1
225+ nvvm.cp.async.bulk.tensor.global.shared.cta %tmaDescriptor , %src , box [%crd0 ,%crd1 ], predicate =%p : !llvm.ptr , !llvm.ptr <3 >
230226 return
231227}
232228
233229// CHECK-LABEL: @tma_store_3d
234230func.func @tma_store_3d (%tmaDescriptor: !llvm.ptr , %src : !llvm.ptr <3 >, %crd0: i32 , %crd1: i32 , %crd2: i32 , %p : i1 ) {
235- // CHECK: llvm.inline_asm has_side_effects asm_dialect = att "cp.async.bulk.tensor.3d.global.shared::cta.bulk_group [$0, {$2, $3, $4} ], [$1];", "l,r,r,r,r"
236- nvvm.cp.async.bulk.tensor.global.shared.cta %tmaDescriptor , %src , box [%crd0 ,%crd1 ,%crd2 ] : !llvm.ptr , !llvm.ptr <3 >, i32 , i32 , i32
237231 // CHECK: llvm.inline_asm has_side_effects asm_dialect = att "@$5 cp.async.bulk.tensor.3d.global.shared::cta.bulk_group [$0, {$2, $3, $4} ], [$1];", "l,r,r,r,r,b"
238- nvvm.cp.async.bulk.tensor.global.shared.cta %tmaDescriptor , %src , box [%crd0 ,%crd1 ,%crd2 ], predicate =%p : !llvm.ptr , !llvm.ptr <3 >, i32 , i32 , i32 , i1
232+ nvvm.cp.async.bulk.tensor.global.shared.cta %tmaDescriptor , %src , box [%crd0 ,%crd1 ,%crd2 ], predicate =%p : !llvm.ptr , !llvm.ptr <3 >
239233 return
240234}
241235
242236// CHECK-LABEL: @tma_store_4d
243237func.func @tma_store_4d (%tmaDescriptor: !llvm.ptr , %src : !llvm.ptr <3 >, %crd0: i32 , %crd1: i32 , %crd2: i32 , %crd3: i32 , %p : i1 ) {
244- // CHECK: llvm.inline_asm has_side_effects asm_dialect = att "cp.async.bulk.tensor.4d.global.shared::cta.bulk_group [$0, {$2, $3, $4, $5} ], [$1];", "l,r,r,r,r,r"
245- nvvm.cp.async.bulk.tensor.global.shared.cta %tmaDescriptor , %src , box [%crd0 ,%crd1 ,%crd2 ,%crd3 ] : !llvm.ptr , !llvm.ptr <3 >, i32 , i32 , i32 , i32
246238 // CHECK: llvm.inline_asm has_side_effects asm_dialect = att "@$6 cp.async.bulk.tensor.4d.global.shared::cta.bulk_group [$0, {$2, $3, $4, $5} ], [$1];", "l,r,r,r,r,r,b"
247- nvvm.cp.async.bulk.tensor.global.shared.cta %tmaDescriptor , %src , box [%crd0 ,%crd1 ,%crd2 ,%crd3 ], predicate =%p : !llvm.ptr , !llvm.ptr <3 >, i32 , i32 , i32 , i32 , i1
239+ nvvm.cp.async.bulk.tensor.global.shared.cta %tmaDescriptor , %src , box [%crd0 ,%crd1 ,%crd2 ,%crd3 ], predicate =%p : !llvm.ptr , !llvm.ptr <3 >
248240 return
249241}
250242
251243// CHECK-LABEL: @tma_store_5d
252244func.func @tma_store_5d (%tmaDescriptor: !llvm.ptr , %src : !llvm.ptr <3 >, %crd0: i32 , %crd1: i32 , %crd2: i32 , %crd3: i32 , %crd4: i32 , %p : i1 ) {
253- // CHECK-NEXT: llvm.inline_asm has_side_effects asm_dialect = att "cp.async.bulk.tensor.5d.global.shared::cta.bulk_group [$0, {$2, $3, $4, $5, $6} ], [$1];", "l,r,r,r,r,r,r"
254- nvvm.cp.async.bulk.tensor.global.shared.cta %tmaDescriptor , %src , box [%crd0 ,%crd1 ,%crd2 ,%crd3 ,%crd4 ] : !llvm.ptr , !llvm.ptr <3 >, i32 , i32 , i32 , i32 , i32
255-
256245 // CHECK-NEXT: llvm.inline_asm has_side_effects asm_dialect = att "@$7 cp.async.bulk.tensor.5d.global.shared::cta.bulk_group [$0, {$2, $3, $4, $5, $6} ], [$1];", "l,r,r,r,r,r,r,b"
257- nvvm.cp.async.bulk.tensor.global.shared.cta %tmaDescriptor , %src , box [%crd0 ,%crd1 ,%crd2 ,%crd3 ,%crd4 ], predicate =%p : !llvm.ptr , !llvm.ptr <3 >, i32 , i32 , i32 , i32 , i32 , i1
246+ nvvm.cp.async.bulk.tensor.global.shared.cta %tmaDescriptor , %src , box [%crd0 ,%crd1 ,%crd2 ,%crd3 ,%crd4 ], predicate =%p : !llvm.ptr , !llvm.ptr <3 >
258247 return
259248}
260249
0 commit comments