ROCm
diff --git a/mlir/include/mlir/Dialect/MIGraphX/IR/MIGraphX.td b/mlir/include/mlir/Dialect/MIGraphX/IR/MIGraphX.td
Lines changed: 16 additions & 6 deletions
diff --git a/mlir/lib/Conversion/MIGraphXToLinalg/MIGraphXToLinalg.cpp b/mlir/lib/Conversion/MIGraphXToLinalg/MIGraphXToLinalg.cpp
Lines changed: 371 additions & 10 deletions
diff --git a/mlir/lib/Conversion/MIGraphXToTosa/MIGraphXToTosa.cpp b/mlir/lib/Conversion/MIGraphXToTosa/MIGraphXToTosa.cpp
Lines changed: 0 additions & 6 deletions
diff --git a/mlir/test/Conversion/MIGraphXToLinalg/migraphx-to-linalg-not-implemented.mlir b/mlir/test/Conversion/MIGraphXToLinalg/migraphx-to-linalg-not-implemented.mlir
Lines changed: 0 additions & 12 deletions
diff --git a/mlir/test/Conversion/MIGraphXToLinalg/mixr-to-linalg-ops.mlir b/mlir/test/Conversion/MIGraphXToLinalg/mixr-to-linalg-ops.mlir
Lines changed: 302 additions & 0 deletions
diff --git a/mlir/test/Conversion/MIGraphXToTosa/mixr-to-tosa-ops.mlir b/mlir/test/Conversion/MIGraphXToTosa/mixr-to-tosa-ops.mlir
Lines changed: 2 additions & 2 deletions
diff --git a/mlir/test/Dialect/MIGraphX/invalid.mlir b/mlir/test/Dialect/MIGraphX/invalid.mlir
Lines changed: 11 additions & 0 deletions
diff --git a/mlir/test/fusion/e2e/mixr-quantizelinear/lit.local.cfg b/mlir/test/fusion/e2e/mixr-quantizelinear/lit.local.cfg
Lines changed: 2 additions & 0 deletions
diff --git a/mlir/test/fusion/e2e/mixr-quantizelinear/mixr-quant-quant-dot-bias-f8E4M3FN.mlir b/mlir/test/fusion/e2e/mixr-quantizelinear/mixr-quant-quant-dot-bias-f8E4M3FN.mlir
Lines changed: 8 additions & 0 deletions
diff --git a/mlir/test/fusion/e2e/mixr-quantizelinear/mixr-quant-quant-dot-bias-i8.mlir b/mlir/test/fusion/e2e/mixr-quantizelinear/mixr-quant-quant-dot-bias-i8.mlir
Lines changed: 8 additions & 0 deletions
@@ -229,12 +229,22 @@ def MIGraphX_UnpackOp : MIGraphX_Op<"unpack">,
 
 // Quantization operations.
 
-def MIGraphX_QuantizeLinearOp :
-    MIGraphX_Op<"quantizelinear", [AllElementTypesMatch<["input", "scale"]>]>,
-    Arguments<(ins MIXRShapedOf<[AnyFloat]>:$input,
-                   MIXRShapedOf<[AnyFloat]>:$scale,
-                   Optional<MIXRShapedOf<[AnyInteger, AnyFloat]>>:$bias)>,
-	  Results<(outs MIXRShapedOf<[AnyInteger, AnyFloat]>:$output)> {
+def MIGraphX_QuantizeLinearOp
+    : MIGraphX_Op<
+          "quantizelinear",
+          [AllElementTypesMatch<["input", "scale"]>,
+           PredOpTrait<
+               "output and bias must have the same element type",
+               Or<[CPred<"!::llvm::cast<QuantizeLinearOp>($_op).getBias()">,
+                   CPred<"::mlir::getElementTypeOrSelf("
+                         "::llvm::cast<QuantizeLinearOp>($_op).getBias()) =="
+                         " ::mlir::getElementTypeOrSelf("
+                         "::llvm::cast<QuantizeLinearOp>($_op).getOutput()"
+                         ")">]>>]>,
+      Arguments<(ins MIXRShapedOf<[AnyFloat]>:$input,
+          MIXRShapedOf<[AnyFloat]>:$scale,
+          Optional<MIXRShapedOf<[AnyInteger, AnyFloat]>>:$bias)>,
+      Results<(outs MIXRShapedOf<[AnyInteger, AnyFloat]>:$output)> {
   let summary = "Channelwise quantization";
   let description = [{
     Quantization tensor channelwise. It computes the following:
 
@@ -1265,19 +1265,13 @@ LogicalResult QuantizeLinearConverter::matchAndRewrite(
                                  &itsExtendNoWayWeCanLoseInfo);
       std::ignore = maxF.convert(biasSem, APFloat::rmNearestTiesToEven,
                                  &itsExtendNoWayWeCanLoseInfo);
-      minI = APInt(64, (int64_t)(minF.convertToFloat()));
-      maxI = APInt(64, (int64_t)(minF.convertToFloat()));
     } else {
       minI = origOutputType.isUnsignedInteger()
                  ? APInt::getMinValue(width)
                  : APInt::getSignedMinValue(width);
       maxI = origOutputType.isUnsignedInteger()
                  ? APInt::getMaxValue(width)
                  : APInt::getSignedMaxValue(width);
-      minF.convertFromAPInt(minI, /*IsSigned=*/origOutputType.isSignedInteger(),
-                            APFloat::rmNearestTiesToEven);
-      maxF.convertFromAPInt(maxI, /*IsSigned=*/origOutputType.isSignedInteger(),
-                            APFloat::rmNearestTiesToEven);
     }
 
     Attribute minVal, maxVal;
 
@@ -1,17 +1,5 @@
 // RUN: rocmlir-opt --migraphx-to-linalg -verify-diagnostics %s 
 
-func.func @func_quantizelinear(%arg0: !migraphx.shaped<1x1xf32, 1x1>, %arg1: !migraphx.shaped<1x1xf32, 1x1>) {
-  // expected-error @+1{{failed to legalize operation 'migraphx.quantizelinear'}}
-  migraphx.quantizelinear %arg0, %arg1: <1x1xf32, 1x1>, <1x1xf32, 1x1> -> <1x1xf32, 1x1>
-  func.return
-}
-
-func.func @func_dequantizelinear(%arg0: !migraphx.shaped<1x1xf32, 1x1>, %arg1: !migraphx.shaped<1x1xf32, 1x1>) {
-  // expected-error @+1{{failed to legalize operation 'migraphx.dequantizelinear'}}
-  migraphx.dequantizelinear %arg0, %arg1: <1x1xf32, 1x1>, <1x1xf32, 1x1> -> <1x1xf32, 1x1>
-  func.return
-}
-
 func.func @func_quant_convolution(%arg0: !migraphx.shaped<1x1xi8, 1x1>, %arg1: !migraphx.shaped<1x1xi8, 1x1>) {
   // expected-error @+1{{failed to legalize operation 'migraphx.quant_convolution'}}
   migraphx.quant_convolution %arg0, %arg1 {dilation = [1, 1], group = 1 : i64, padding = [0, 0], stride = [1, 1]}: <1x1xi8, 1x1>, <1x1xi8, 1x1> -> <1x1xf32, 1x1>
 
@@ -186,8 +186,8 @@ module  {
   // CHECK: tosa.add
   // CHECK: tosa.clamp
   // CHECK: tosa.cast
-  func.func @quantize_scale_i32_bias_f16(%arg: !migraphx.shaped<1x112x112x64xf16, 802816x7168x64x1>, %scale: !migraphx.shaped<1x1x1x64xf16, 64x64x64x1>, %bias: !migraphx.shaped<1x1x1x64xi32, 64x64x64x1>) -> !migraphx.shaped<1x112x112x64xi8, 802816x7168x64x1> attributes {rock.kernel = "mixr"} {
-    %1 = migraphx.quantizelinear %arg, %scale, %bias : <1x112x112x64xf16, 802816x7168x64x1>, <1x1x1x64xf16, 64x64x64x1>, !migraphx.shaped<1x1x1x64xi32, 64x64x64x1> -> <1x112x112x64xi8, 802816x7168x64x1>
+  func.func @quantize_scale_i32_bias_f16(%arg: !migraphx.shaped<1x112x112x64xf16, 802816x7168x64x1>, %scale: !migraphx.shaped<1x1x1x64xf16, 64x64x64x1>, %bias: !migraphx.shaped<1x1x1x64xi8, 64x64x64x1>) -> !migraphx.shaped<1x112x112x64xi8, 802816x7168x64x1> attributes {rock.kernel = "mixr"} {
+    %1 = migraphx.quantizelinear %arg, %scale, %bias : <1x112x112x64xf16, 802816x7168x64x1>, <1x1x1x64xf16, 64x64x64x1>, !migraphx.shaped<1x1x1x64xi8, 64x64x64x1> -> <1x112x112x64xi8, 802816x7168x64x1> // bias element type (i8) now equals the result element type (i8). NOTE(review): the function name still says "i32 bias" although the bias is i8 here - consider renaming together with any label check that refers to it.
     return %1 : !migraphx.shaped<1x112x112x64xi8, 802816x7168x64x1>
   }
 
 
@@ -458,3 +458,14 @@ func.func @invalid_shape_mismatch(%input: !migraphx.shaped<10x10xf32, 10x1>) {
   %result = migraphx.slice %input {axes = [0], starts = [0], ends = [5]} : <10x10xf32, 10x1> -> <3x10xf32, 10x1>
   func.return
 }
+
+// -----
+
+func.func @quantize_scale_bias_ui32(%arg: !migraphx.shaped<1x112x112x64xf32, 802816x7168x64x1>, // NOTE(review): the name says "ui32", but the bias declared below is signless i32 - confirm the intended name.
+    %scale: !migraphx.shaped<1x1x1x64xf32, 64x64x64x1>,
+    %bias: !migraphx.shaped<1x1x1x64xi32, 64x64x64x1>) -> !migraphx.shaped<1x112x112x64xf16, 802816x7168x64x1> attributes {rock.kernel = "mixr"} { // negative case: bias element type is i32 while the result element type is f16.
+  // expected-error @+1 {{failed to verify that output and bias must have the same element type}}
+  %1 = migraphx.quantizelinear %arg, %scale, %bias :
+    <1x112x112x64xf32, 802816x7168x64x1>, <1x1x1x64xf32, 64x64x64x1>, !migraphx.shaped<1x1x1x64xi32, 64x64x64x1> -> <1x112x112x64xf16, 802816x7168x64x1>
+  return %1 : !migraphx.shaped<1x112x112x64xf16, 802816x7168x64x1>
+}
@@ -0,0 +1,2 @@
+if not config.arch_support_accel_fp8 or (config.arch and "gfx942" in config.arch):  # true when the accel-FP8 support flag is falsy, or when config.arch is non-empty and contains "gfx942"
+    config.unsupported = True  # marks the tests governed by this config as unsupported. NOTE(review): this directory also holds the i8 test, which uses no FP8 types - confirm it should be skipped too.
@@ -0,0 +1,8 @@
+// RUN: rocmlir-gen -fut mlir_quantizelinear_f8E4M3FN --arch %arch --clone-harness %s | rocmlir-driver -kernel-pipeline=migraphx-linalg,highlevel -host-pipeline=migraphx,highlevel -targets %arch | rocmlir-gen -ph -rand 1 -rand_type float -fut mlir_quantizelinear_f8E4M3FN_wrapper --verifier clone -relDiff_threshold 0.00001 - | rocmlir-driver -host-pipeline mhal,runner -kernel-pipeline full -targets %arch  | rocmlir-opt --emulate-fp8-ext-trunc | xmir-runner --shared-libs=%linalg_test_lib_dir/libmlir_rocm_runtime%shlibext,%conv_validation_wrapper_library_dir/libconv-validation-wrappers%shlibext,%linalg_test_lib_dir/libmlir_runner_utils%shlibext,%linalg_test_lib_dir/libmlir_float16_utils%shlibext,%linalg_test_lib_dir/libmlir_c_runner_utils%shlibext,%linalg_test_lib_dir/libmlir_async_runtime%shlibext --entry-point-result=void | FileCheck %s
+
+// CHECK: [1 1 1]
+func.func @mlir_quantizelinear_f8E4M3FN(%input: !migraphx.shaped<2x2xf32, 2x1>, %scale: !migraphx.shaped<2x2xf32, 2x1>, %bias: !migraphx.shaped<2x2xf8E4M3FN, 2x1>) -> !migraphx.shaped<2x2xf32, 2x1> { // f32 input and scale, f8E4M3FN bias; returns the f32 quant_dot result.
+    %result = migraphx.quantizelinear %input, %scale, %bias : <2x2xf32, 2x1>, <2x2xf32, 2x1>, !migraphx.shaped<2x2xf8E4M3FN, 2x1> -> <2x2xf8E4M3FN, 2x1> // quantize to f8E4M3FN; bias and result share the same element type.
+    %dot_result = migraphx.quant_dot %result, %result : <2x2xf8E4M3FN, 2x1>, <2x2xf8E4M3FN, 2x1> -> <2x2xf32, 2x1> // the quantized tensor is passed as both quant_dot operands.
+    return %dot_result : !migraphx.shaped<2x2xf32, 2x1>
+}
@@ -0,0 +1,8 @@
+// RUN: rocmlir-gen -fut mlir_quantizelinear_i8 --arch %arch --clone-harness %s | rocmlir-driver -kernel-pipeline=migraphx-linalg,highlevel -host-pipeline=migraphx,highlevel -targets %arch | rocmlir-gen -ph -rand 1 -rand_type float -fut mlir_quantizelinear_i8_wrapper --verifier clone -relDiff_threshold 0.00001 - | rocmlir-driver -host-pipeline mhal,runner -kernel-pipeline full -targets %arch  | xmir-runner --shared-libs=%linalg_test_lib_dir/libmlir_rocm_runtime%shlibext,%conv_validation_wrapper_library_dir/libconv-validation-wrappers%shlibext,%linalg_test_lib_dir/libmlir_runner_utils%shlibext,%linalg_test_lib_dir/libmlir_float16_utils%shlibext,%linalg_test_lib_dir/libmlir_c_runner_utils%shlibext,%linalg_test_lib_dir/libmlir_async_runtime%shlibext --entry-point-result=void | FileCheck %s
+
+// CHECK: [1 1 1]
+func.func @mlir_quantizelinear_i8(%input: !migraphx.shaped<2x2xf32, 2x1>, %scale: !migraphx.shaped<2x2xf32, 2x1>, %bias: !migraphx.shaped<2x2xi8, 2x1>) -> !migraphx.shaped<2x2xi32, 2x1> { // f32 input and scale, i8 bias; returns the i32 quant_dot result.
+    %result = migraphx.quantizelinear %input, %scale, %bias : <2x2xf32, 2x1>, <2x2xf32, 2x1>, !migraphx.shaped<2x2xi8, 2x1> -> <2x2xi8, 2x1> // quantize to i8; bias and result share the same element type.
+    %dot_result = migraphx.quant_dot %result, %result : <2x2xi8, 2x1>, <2x2xi8, 2x1> -> <2x2xi32, 2x1> // the quantized tensor is passed as both quant_dot operands.
+    return %dot_result : !migraphx.shaped<2x2xi32, 2x1>
+}
| Original file line number | Diff line number | Diff line change |
| --- | --- | --- |
|  |  | `@@ -0,0 +1,2 @@` |
|  | 1 | `+if not config.arch_support_accel_fp8 or (config.arch and "gfx942" in config.arch):` |
|  | 2 | `+    config.unsupported = True` |