From b5a41225249e161f83b2ad222cae1445dcebd78b Mon Sep 17 00:00:00 2001
From: BruceDai <feng.dai@intel.com>
Date: Fri, 20 Jun 2025 11:52:01 +0800
Subject: [PATCH 1/4] add parameter's validations for dequantizeLinear and
 quantizeLinear ops

---
 src/dequantize_linear.js       |  2 ++
 src/lib/validate-input.js      | 29 +++++++++++++++++++++++++++++
 src/quantize_linear.js         |  2 ++
 test/dequantize_linear_test.js |  6 ++++--
 test/quantize_linear_test.js   |  9 +++++----
 5 files changed, 42 insertions(+), 6 deletions(-)

diff --git a/src/dequantize_linear.js b/src/dequantize_linear.js
index 888c7f7..f11419e 100644
--- a/src/dequantize_linear.js
+++ b/src/dequantize_linear.js
@@ -1,6 +1,7 @@
 'use strict';
 
 import {mul, sub} from './binary.js';
+import {validateQDQParams} from './lib/validate-input.js';
 
 /**
  * Elementwise operator to scale a low precision integer (typically uint8 with a zero-point bias)
@@ -12,5 +13,6 @@ import {mul, sub} from './binary.js';
  * @return {Tensor}
  */
 export function dequantizeLinear(input, scale, zeroPoint) {
+  validateQDQParams(input, scale, zeroPoint);
   return mul(sub(input, zeroPoint), scale);
 }
diff --git a/src/lib/validate-input.js b/src/lib/validate-input.js
index 88ff160..c54aa8b 100644
--- a/src/lib/validate-input.js
+++ b/src/lib/validate-input.js
@@ -861,3 +861,32 @@ export function validatePadParams(input, beginningPadding, endingPadding, mode)
     }
   }
 }
+
+export function validateQDQParams(input, scale, zeroPoint) {
+  const inputRank = input.rank;
+  const inputShape = input.shape;
+  const scaleRank = scale.rank;
+  const scaleShape = scale.shape;
+  const zeroPointRank = zeroPoint.rank;
+  const zeroPointShape = zeroPoint.shape;
+
+  if (inputRank != scaleRank) {
+    throw new Error(
+        `The scale's rank ${scaleRank} is not equal to the input's rank ${inputRank}.`);
+  }
+
+  if (inputRank != zeroPointRank) {
+    throw new Error(
+        `The zeroPoint's rank ${zeroPointRank} is not equal to the input's rank ${inputRank}.`);
+  }
+
+  if (!scaleShape.every((size, index) => size === zeroPointShape[index])) {
+    throw new Error(
+        `The scale's shape [${scaleShape}] is not equal to the zeroPoint's shape [${zeroPointShape}].`);
+  }
+
+  if (!inputShape.every((size, index) => size % scaleShape[index]) === 0) {
+    throw new Error(
+        `The scale's shape or zeroPoint's shape [${scaleShape}] is not equal to the zeroPoint's shape [${zeroPointShape}].`);
+  }
+}
diff --git a/src/quantize_linear.js b/src/quantize_linear.js
index 3b9ae40..d826eef 100644
--- a/src/quantize_linear.js
+++ b/src/quantize_linear.js
@@ -3,6 +3,7 @@
 import {add, div} from './binary.js';
 import {clamp} from './clamp.js';
 import {unary} from './unary.js';
+import {validateQDQParams} from './lib/validate-input.js';
 
 function roundToNearestEvens(x) {
   return Math.floor(x) % 2 == 0 ? Math.floor(x) : Math.ceil(x);
@@ -19,6 +20,7 @@ function roundToNearestEvens(x) {
  * @return {Tensor}
  */
 export function quantizeLinear(input, scale, zeroPoint, dataType) {
+  validateQDQParams(input, scale, zeroPoint);
   const dividedOutput = div(input, scale);
   const roundedOutput = unary(dividedOutput, (x) => roundToNearestEvens(x));
   const addedOutput = add(roundedOutput, zeroPoint);
diff --git a/test/dequantize_linear_test.js b/test/dequantize_linear_test.js
index 275f416..763fa24 100644
--- a/test/dequantize_linear_test.js
+++ b/test/dequantize_linear_test.js
@@ -141,7 +141,7 @@ describe('test dequantizeLinear', function() {
           ],
         },
         { // scale
-          shape: [3, 1],
+          shape: [1, 1, 3, 1],
           value: [
             1,
             2,
@@ -149,9 +149,11 @@ describe('test dequantizeLinear', function() {
           ],
         },
         { // zeroPoint
-          shape: [1],
+          shape: [1, 1, 3, 1],
           value: [
             0,
+            0,
+            0,
           ],
         },
         { // expected
diff --git a/test/quantize_linear_test.js b/test/quantize_linear_test.js
index ea7bea5..083bca5 100644
--- a/test/quantize_linear_test.js
+++ b/test/quantize_linear_test.js
@@ -107,16 +107,17 @@ describe('test quantizeLinear', function() {
           ],
         },
         { // scale
-          shape: [2, 1],
+          shape: [1, 1, 2, 1],
           value: [
             2,
             2,
           ],
         },
         { // zeroPoint
-          shape: [1],
+          shape: [1, 1, 2, 1],
           value: [
             10,
+            10,
           ],
         },
         'int8',
@@ -139,11 +140,11 @@ describe('test quantizeLinear', function() {
           ],
         },
         { // scale
-          shape: [1],
+          shape: [1, 1, 1, 1],
           value: [1],
         },
         { // zeroPoint
-          shape: [1],
+          shape: [1, 1, 1, 1],
           value: [100],
         },
         'int8',

From a1c9daea66c0639870edb70e2fa6935ca4ea4bb9 Mon Sep 17 00:00:00 2001
From: BruceDai <feng.dai@intel.com>
Date: Fri, 20 Jun 2025 11:59:08 +0800
Subject: [PATCH 2/4] support blockwise broadcast for scale and zeroPoint

---
 src/dequantize_linear.js |  6 ++++-
 src/lib/broadcast.js     | 57 ++++++++++++++++++++++++++++++++++++++++
 src/quantize_linear.js   |  8 ++++--
 3 files changed, 68 insertions(+), 3 deletions(-)

diff --git a/src/dequantize_linear.js b/src/dequantize_linear.js
index f11419e..eb92b94 100644
--- a/src/dequantize_linear.js
+++ b/src/dequantize_linear.js
@@ -1,6 +1,7 @@
 'use strict';
 
 import {mul, sub} from './binary.js';
+import {blockwiseExpand} from './lib/broadcast.js';
 import {validateQDQParams} from './lib/validate-input.js';
 
 /**
@@ -14,5 +15,8 @@ import {validateQDQParams} from './lib/validate-input.js';
  */
 export function dequantizeLinear(input, scale, zeroPoint) {
   validateQDQParams(input, scale, zeroPoint);
-  return mul(sub(input, zeroPoint), scale);
+
+  const broadcastedScale = blockwiseExpand(scale, input.shape);
+  const broadcastedZeroPoint = blockwiseExpand(zeroPoint, input.shape);
+  return mul(sub(input, broadcastedZeroPoint), broadcastedScale);
 }
diff --git a/src/lib/broadcast.js b/src/lib/broadcast.js
index 80cc62d..3fe0039 100644
--- a/src/lib/broadcast.js
+++ b/src/lib/broadcast.js
@@ -1,4 +1,6 @@
 import {Tensor} from './tensor.js';
+import {expand} from '../expand.js';
+import {reshape} from '../reshape.js';
 
 /**
  * Broadcast a Tensor to a compatible shape NumPy-style.
@@ -70,3 +72,58 @@ export function getBroadcastShape(shapeA, shapeB) {
   }
   return outShape;
 }
+
+export function blockwiseExpand(input, outputShape) {
+  // Expands input to outputShape one axis at a time, repeating each element
+  // outputShape[axis] / input.shape[axis] times along that axis. The ratio is
+  // not validated here, so callers must pass whole-number multiples. Backend
+  // implementations might have more efficient upsampling operators that can
+  // upsample all dimensions at once using nearest neighbor resampling, e.g.:
+  // output = resample(input, {sizes: outputShape})
+
+  let output = input;
+
+  for (let axis = 0; axis < input.shape.length; ++axis) {
+    const oldShape = output.shape;
+    const oldDimensionLength = oldShape[axis];
+    const newDimensionLength = outputShape[axis];
+
+    if (newDimensionLength != oldDimensionLength) {
+      // expand() only repeats entire dimension slices, not individual elements
+      // along an axis. So reshape to [before, axis, 1, after], broadcast the
+      // inserted size-1 dimension up to the repeat count, and finally reshape
+      // back with this axis resized to its new length.
+      const elementRepeatCount = newDimensionLength / oldDimensionLength;
+      const flattenedShape = getFlattenedShapeAroundAxis(oldShape, axis);
+      const unexpandedShape =
+        [flattenedShape[0], flattenedShape[1], 1, flattenedShape[2]];
+      const expandedShape = [
+        flattenedShape[0],
+        flattenedShape[1],
+        elementRepeatCount,
+        flattenedShape[2],
+      ];
+      const reshapedInput = reshape(output, unexpandedShape);
+      output = expand(reshapedInput, expandedShape);
+
+      const newShape = [...oldShape];
+      newShape[axis] = newDimensionLength;
+      output = reshape(output, newShape);
+    }
+  }
+
+  return output;
+}
+
+// Returns [product of dims before axis, inputShape[axis], product of dims
+// after axis]; axis is first clamped into [0, inputShape.length - 1]. e.g.
+// - inputShape = [2,3,4,5,6] with axis = 2 yields shape [6,4,30].
+// - inputShape = [4] with axis = 0 yields shape [1,4,1].
+function getFlattenedShapeAroundAxis(inputShape, axis) {
+  axis = Math.max(Math.min(axis, inputShape.length - 1), 0);
+  const shapeBefore = inputShape.slice(0, axis);
+  const shapeAfter = inputShape.slice(axis + 1, inputShape.length);
+  const countBefore = shapeBefore.reduce((a, b) => a * b, 1);
+  const countAfter = shapeAfter.reduce((a, b) => a * b, 1);
+  return [countBefore, inputShape[axis], countAfter];
+}
diff --git a/src/quantize_linear.js b/src/quantize_linear.js
index d826eef..02a5865 100644
--- a/src/quantize_linear.js
+++ b/src/quantize_linear.js
@@ -3,6 +3,7 @@
 import {add, div} from './binary.js';
 import {clamp} from './clamp.js';
 import {unary} from './unary.js';
+import {blockwiseExpand} from './lib/broadcast.js';
 import {validateQDQParams} from './lib/validate-input.js';
 
 function roundToNearestEvens(x) {
@@ -21,9 +22,12 @@ function roundToNearestEvens(x) {
  */
 export function quantizeLinear(input, scale, zeroPoint, dataType) {
   validateQDQParams(input, scale, zeroPoint);
-  const dividedOutput = div(input, scale);
+
+  const broadcastedScale = blockwiseExpand(scale, input.shape);
+  const broadcastedZeroPoint = blockwiseExpand(zeroPoint, input.shape);
+  const dividedOutput = div(input, broadcastedScale);
   const roundedOutput = unary(dividedOutput, (x) => roundToNearestEvens(x));
-  const addedOutput = add(roundedOutput, zeroPoint);
+  const addedOutput = add(roundedOutput, broadcastedZeroPoint);
 
   let maxValue; let minValue;
   switch (dataType) {

From 43caed2a3129dcfc33a091530f68f80706fbecc6 Mon Sep 17 00:00:00 2001
From: BruceDai <feng.dai@intel.com>
Date: Fri, 20 Jun 2025 12:05:09 +0800
Subject: [PATCH 3/4] fix roundToNearestEvens function to get nearest integer

---
 src/quantize_linear.js       | 17 ++++++++++++++++-
 test/quantize_linear_test.js |  2 +-
 2 files changed, 17 insertions(+), 2 deletions(-)

diff --git a/src/quantize_linear.js b/src/quantize_linear.js
index 02a5865..38a4abb 100644
--- a/src/quantize_linear.js
+++ b/src/quantize_linear.js
@@ -6,8 +6,23 @@ import {unary} from './unary.js';
 import {blockwiseExpand} from './lib/broadcast.js';
 import {validateQDQParams} from './lib/validate-input.js';
 
+/**
+ * This function finds the nearest integer for x.
+ * In case of halves, the rule is to round them to the nearest even integer.
+ * @param {Number} x
+ * @return {Number} An interger number
+ */
 function roundToNearestEvens(x) {
-  return Math.floor(x) % 2 == 0 ? Math.floor(x) : Math.ceil(x);
+  if (Number.isInteger(x)) {
+    return x;
+  } else {
+    if (Math.abs(x - Math.trunc(x)) === 0.5) {
+      // x lies exactly halfway between two integers: pick the even one
+      return Math.floor(x) % 2 == 0 ? Math.floor(x) : Math.ceil(x);
+    } else {
+      return Math.round(x);
+    }
+  }
 }
 
 /**
diff --git a/test/quantize_linear_test.js b/test/quantize_linear_test.js
index 083bca5..7464155 100644
--- a/test/quantize_linear_test.js
+++ b/test/quantize_linear_test.js
@@ -91,7 +91,7 @@ describe('test quantizeLinear', function() {
           value: [
             0, 2, 3, 255,
             0, 1, 2, 255,
-            0, 0, 0, 200,
+            0, 0, 1, 200,
           ],
         },
     );

From 6f3cb5355b7efa9aff0b05d40beb4f1d7dfe0922 Mon Sep 17 00:00:00 2001
From: BruceDai <feng.dai@intel.com>
Date: Mon, 23 Jun 2025 10:37:39 +0800
Subject: [PATCH 4/4] address dwayne's comments

---
 src/lib/validate-input.js | 5 +++--
 src/quantize_linear.js    | 2 +-
 2 files changed, 4 insertions(+), 3 deletions(-)

diff --git a/src/lib/validate-input.js b/src/lib/validate-input.js
index c54aa8b..5777bb0 100644
--- a/src/lib/validate-input.js
+++ b/src/lib/validate-input.js
@@ -887,6 +887,7 @@ export function validateQDQParams(input, scale, zeroPoint) {
 
-  if (!inputShape.every((size, index) => size % scaleShape[index]) === 0) {
+  // Every input dimension must be a whole multiple of the scale dimension.
+  if (!inputShape.every((size, index) => size % scaleShape[index] === 0)) {
     throw new Error(
-        `The scale's shape or zeroPoint's shape [${scaleShape}] is not equal to the zeroPoint's shape [${zeroPointShape}].`);
+        `The input's shape [${inputShape}] is not a multiple of the scale's and zeroPoint's shape [${scaleShape}].`);
   }
 }
diff --git a/src/quantize_linear.js b/src/quantize_linear.js
index 38a4abb..4a12c24 100644
--- a/src/quantize_linear.js
+++ b/src/quantize_linear.js
@@ -10,7 +10,7 @@ import {validateQDQParams} from './lib/validate-input.js';
  * This function finds the nearest integer for x.
  * In case of halves, the rule is to round them to the nearest even integer.
  * @param {Number} x
- * @return {Number} An interger number
+ * @return {Number} An integer number
  */
 function roundToNearestEvens(x) {
   if (Number.isInteger(x)) {