diff --git a/mlir/test/Integration/GPU/CUDA/sm90/tma_load_64x8_8x128_noswizzle.mlir b/mlir/test/Integration/GPU/CUDA/sm90/tma_load_64x8_8x128_noswizzle.mlir index 2e59b7234e53d..391fda82e1e19 100644 --- a/mlir/test/Integration/GPU/CUDA/sm90/tma_load_64x8_8x128_noswizzle.mlir +++ b/mlir/test/Integration/GPU/CUDA/sm90/tma_load_64x8_8x128_noswizzle.mlir @@ -6,15 +6,6 @@ // RUN: --entry-point-result=void \ // RUN: | FileCheck %s -// Basic PTX check to make sure we are generating the right instructions. - -// CHECK-PTX: mbarrier.init.shared.b64 -// CHECK-PTX: mbarrier.arrive.expect_tx.shared.b64 -// CHECK-PTX: cp.async.bulk.tensor.2d.shared::cluster.global.mbarrier::complete_tx::bytes -// CHECK-PTX: cp.async.bulk.tensor.2d.shared::cluster.global.mbarrier::complete_tx::bytes -// CHECK-PTX: mbarrier.arrive.expect_tx.shared.b64 -// CHECK-PTX: mbarrier.try_wait.parity.shared.b64 - // RUN: mlir-opt %s --convert-nvgpu-to-nvvm \ // RUN: -gpu-kernel-outlining \ // RUN: -convert-nvvm-to-llvm \