@@ -3433,13 +3433,15 @@ IntrinsicLibrary::genBarrierTryWait(mlir::Type resultType,
34333433 builder.setInsertionPointToStart (afterBlock);
34343434 auto llvmPtrTy = mlir::LLVM::LLVMPointerType::get (builder.getContext ());
34353435 auto barrier = builder.createConvert (loc, llvmPtrTy, args[0 ]);
3436- mlir::Value ret =
3437- mlir::NVVM::InlinePtxOp::create (
3438- builder, loc, {resultType}, {barrier, args[1 ], ns}, {},
3439- " .reg .pred p; mbarrier.try_wait.shared.b64 p, [%1], %2, %3; "
3440- " selp.b32 %0, 1, 0, p;" ,
3441- {})
3442- .getResult (0 );
3436+ mlir::Value ret = mlir::NVVM::InlinePtxOp::create (
3437+ builder, loc, {resultType}, {barrier, args[1 ], ns}, {},
3438+ " {\n "
3439+ " .reg .pred p;\n "
3440+ " mbarrier.try_wait.shared.b64 p, [%1], %2, %3;\n "
3441+ " selp.b32 %0, 1, 0, p;\n "
3442+ " }" ,
3443+ {})
3444+ .getResult (0 );
34433445 mlir::scf::YieldOp::create (builder, loc, ret);
34443446 builder.setInsertionPointAfter (whileOp);
34453447 return whileOp.getResult (0 );
@@ -3454,8 +3456,11 @@ IntrinsicLibrary::genBarrierTryWaitSleep(mlir::Type resultType,
34543456 auto barrier = builder.createConvert (loc, llvmPtrTy, args[0 ]);
34553457 return mlir::NVVM::InlinePtxOp::create (
34563458 builder, loc, {resultType}, {barrier, args[1 ], args[2 ]}, {},
3457- " .reg .pred p; mbarrier.try_wait.shared.b64 p, [%1], %2, %3; "
3458- " selp.b32 %0, 1, 0, p;" ,
3459+ " {\n "
3460+ " .reg .pred p;\n "
3461+ " mbarrier.try_wait.shared.b64 p, [%1], %2, %3;\n "
3462+ " selp.b32 %0, 1, 0, p;\n "
3463+ " }" ,
34593464 {})
34603465 .getResult (0 );
34613466}
0 commit comments