diff --git a/third_party/nvidia/lib/TritonNVIDIAGPUToLLVM/BarrierOpToLLVM.cpp b/third_party/nvidia/lib/TritonNVIDIAGPUToLLVM/BarrierOpToLLVM.cpp index 746b910e1e52..b6532836ebc1 100644 --- a/third_party/nvidia/lib/TritonNVIDIAGPUToLLVM/BarrierOpToLLVM.cpp +++ b/third_party/nvidia/lib/TritonNVIDIAGPUToLLVM/BarrierOpToLLVM.cpp @@ -33,28 +33,6 @@ using namespace mlir; using namespace mlir::triton; namespace { -struct BarrierOpConversion - : public ConvertOpToLLVMPattern { - using ConvertOpToLLVMPattern::ConvertOpToLLVMPattern; - - LogicalResult - matchAndRewrite(mlir::gpu::BarrierOp op, OpAdaptor adaptor, - ConversionPatternRewriter &rewriter) const override { - Location loc = op->getLoc(); - if (op->hasAttr("bar_id")) { - // llvm.nvvm.barrier0 doesn't support bar_id and num_threads attributes, - // so we have to lower it to ptx manually. - auto barId = op->getAttrOfType("bar_id").getInt(); - auto numThreads = op->getAttrOfType("num_threads").getInt(); - barSync(rewriter, op, barId, numThreads); - rewriter.eraseOp(op); - return success(); - } - // Otherwise we let the default lowering handle it - return failure(); - } -}; - struct FenceAsyncSharedOpConversion : public ConvertOpToLLVMPattern { using ConvertOpToLLVMPattern< @@ -193,7 +171,6 @@ struct WaitBarrierOpConversion void mlir::triton::NVIDIA::populateBarrierOpToLLVMPatterns( LLVMTypeConverter &typeConverter, RewritePatternSet &patterns, PatternBenefit benefit) { - patterns.add(typeConverter, benefit); patterns.add(typeConverter, benefit); patterns.add(typeConverter, benefit);