[mlir][nvgpu] Prevent F32ToTF32 pattern from generating illegal IR

author Thomas Raoux <thomasraoux@google.com>

Mon, 15 Aug 2022 16:16:46 +0000 (16:16 +0000)

committer Thomas Raoux <thomasraoux@google.com>

Mon, 15 Aug 2022 16:46:18 +0000 (16:46 +0000)
author Thomas Raoux <thomasraoux@google.com>
Mon, 15 Aug 2022 16:16:46 +0000 (16:16 +0000)
committer Thomas Raoux <thomasraoux@google.com>
Mon, 15 Aug 2022 16:46:18 +0000 (16:46 +0000)
diff --git a/mlir/lib/Dialect/NVGPU/Transforms/MmaSyncTF32Transform.cpp b/mlir/lib/Dialect/NVGPU/Transforms/MmaSyncTF32Transform.cpp

index 4ef93b3..d24001c 100644 (file)
--- a/mlir/lib/Dialect/NVGPU/Transforms/MmaSyncTF32Transform.cpp
+++ b/mlir/lib/Dialect/NVGPU/Transforms/MmaSyncTF32Transform.cpp
@@ -42,7 +42,8 @@ struct MmaSyncF32ToTF32Pattern : public OpRewritePattern<nvgpu::MmaSyncOp> {
                                  PatternRewriter &rewrite) const override {
      Location location = op->getLoc();
  
-    if (op->hasAttr(op.getTf32EnabledAttrName()))
+    if (op->hasAttr(op.getTf32EnabledAttrName()) ||
+        !op.getMatrixA().getType().cast<VectorType>().getElementType().isF32())
        return failure();
  
      if (precision == MmaSyncF32Lowering::Unkown)
diff --git a/mlir/test/Dialect/NVGPU/mma-sync-f32-to-tf32.mlir b/mlir/test/Dialect/NVGPU/mma-sync-f32-to-tf32.mlir

index a8c7226..80de11f 100644 (file)
--- a/mlir/test/Dialect/NVGPU/mma-sync-f32-to-tf32.mlir
+++ b/mlir/test/Dialect/NVGPU/mma-sync-f32-to-tf32.mlir
@@ -18,3 +18,12 @@ func.func @m16n8k8_tf32(%arg0: vector<4x1xf32>, %arg1: vector<2x1xf32>, %arg2: v
    return %d : vector<2x2xf32>
  }
  // -----
+
+// Negative test for the non-f32 case.
+// CHECK-LABEL: mma_sync_f16
+//   CHECK-NOT: tf32Enabled
+//       CHECK: return
+func.func @mma_sync_f16(%arg0: vector<4x2xf16>, %arg1: vector<2x2xf16>, %arg2: vector<2x2xf16>) -> vector<2x2xf16> {
+  %d = nvgpu.mma.sync (%arg0, %arg1, %arg2) {mmaShape = [16, 8, 16]} : (vector<4x2xf16>, vector<2x2xf16>, vector<2x2xf16>) -> vector<2x2xf16>
+  return %d : vector<2x2xf16>
+}
author	Thomas Raoux <thomasraoux@google.com>
	Mon, 15 Aug 2022 16:16:46 +0000 (16:16 +0000)
committer	Thomas Raoux <thomasraoux@google.com>
	Mon, 15 Aug 2022 16:46:18 +0000 (16:46 +0000)
mlir/lib/Dialect/NVGPU/Transforms/MmaSyncTF32Transform.cpp		patch \| blob \| history
mlir/test/Dialect/NVGPU/mma-sync-f32-to-tf32.mlir		patch \| blob \| history