DequantizeLinear should support non-zero zero_point when input type is int32 (microsoft#25646)

wangw-1991 · web-flow · commit 0b15200243c2 · 2025-08-27T20:00:07.000-07:00
### Description
This PR makes DequantizeLinear support a non-zero zero_point when the
input data type is int32.



### Motivation and Context
For the WebNN use case, there are scenarios in which the input data type
of DequantizeLinear is int32 and the zero_point is not zero.
diff --git a/onnxruntime/core/providers/cpu/quantization/quantize_linear.cc b/onnxruntime/core/providers/cpu/quantization/quantize_linear.cc
@@ -520,14 +520,12 @@ Status DequantizeLinear<T>::Compute(OpKernelContext* ctx) const {
   const T* zero_point = x_zero_point ? x_zero_point->Data<T>() : nullptr;
 
 #if !defined(DISABLE_FLOAT8_TYPES)
-  if constexpr (boost::mp11::mp_contains<boost::mp11::mp_append<element_type_lists::AllFloat8,
-                                                                TypeList<int32_t>>,
-                                         T>::value) {
+  if constexpr (boost::mp11::mp_contains<element_type_lists::AllFloat8, T>::value) {
     ORT_ENFORCE(zero_point == nullptr ||
                     std::all_of(zero_point,
                                 zero_point + x_zero_point->Shape().Size(),
                                 [](T zp) { return zp == T{0}; }),
-                "DequantizeLinear with type int32 or float8 should have no zero point or all zero points should be 0");
+                "DequantizeLinear with type float8 should have no zero point or all zero points should be 0");
   }
 #endif
 
diff --git a/onnxruntime/test/providers/cpu/tensor/quantize_linear_test.cc b/onnxruntime/test/providers/cpu/tensor/quantize_linear_test.cc
@@ -137,7 +137,7 @@ TEST(DequantizeLinearOpTest, Uint16) {
   test.Run(OpTester::ExpectResult::kExpectSuccess, "", {kTensorrtExecutionProvider});
 }
 
-// scalar zero & scale with int8
+// scalar zero & scale with int32
 TEST(DequantizeLinearOpTest, Int32) {
   OpTester test("DequantizeLinear", 10);
   std::vector<int64_t> dims{4};
@@ -147,6 +147,17 @@ TEST(DequantizeLinearOpTest, Int32) {
   test.Run();
 }
 
+// non-zero zero point with int32
+TEST(DequantizeLinearOpTest, Int32_Non_Zero_Zero_Point) {
+  OpTester test("DequantizeLinear", 10);
+  std::vector<int64_t> dims{4};
+  test.AddInput<int32_t>("x", dims, {-30, -3, 100, 127});
+  test.AddInput<float>("x_scale", {}, {2.0f}, true);
+  test.AddInput<int32_t>("x_zero_point", {}, {1}, true);
+  test.AddOutput<float>("y", dims, {-62.f, -8.f, 198.f, 252.f});
+  test.Run();
+}
+
 TEST(DequantizeLinearOpTest_BroadcastTensor, Int32) {
   OpTester test("DequantizeLinear", 13);
   test.AddInput<int32_t>("x", {4}, {-30, -3, 100, 127});