4 changes: 2 additions & 2 deletions algorithms/pact/pact_ops.py
@@ -112,8 +112,8 @@ def forward(ctx, x, mul, add, div, signed, n_levels_out, cmsis_requant):
              # division. Division is with flooring.
          else:
              y = x * mul + add
-             # Avoid round to even behaviour, friggin pytorch
-             y = torch.floor((y / div) + 0.5)
+             # LMACAN: Dory doesn't like the `+ 0.5` fix

Reviewer:
Please motivate this more; are you sure you are not making a mistake at some other point?
This is critical code for many applications.

Author:
It is hard for me to motivate this more with my limited knowledge of quantlib. Do you have an alternative way to handle this?

Author:
This creates an extra addition layer in the produced ONNX graph, and DORY expects a precise pattern of layers in order to recognize requantization.
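As an illustration of that point (this is not quantlib's actual export path; the module names and the divisor 16.0 are made up), exporting both variants of the requantization tail shows the extra Add node that lands between Div and Floor:

import torch

class RequantWithRounding(torch.nn.Module):
    def forward(self, y):
        # floor(y / div + 0.5): exports as Div -> Add -> Floor
        return torch.floor(y / 16.0 + 0.5)

class RequantFloorOnly(torch.nn.Module):
    def forward(self, y):
        # floor(y / div): exports as Div -> Floor, with no extra Add in between
        return torch.floor(y / 16.0)

for module in (RequantWithRounding(), RequantFloorOnly()):
    torch.onnx.export(module, (torch.randn(1, 8),), f"{type(module).__name__}.onnx")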

Member:
This will definitely break compatibility with the RQS strategy in Deeploy, where we do rounding by default. I suggest that you make arithmetic rounding in the RequantShift layer configurable and disable it in flows targeting DORY as the backend.
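A minimal sketch of that suggestion (the class name and the rounding flag are hypothetical, not the actual RequantShift implementation): the rounding behaviour becomes a constructor switch, and a DORY-targeting flow constructs the layer with rounding disabled.

import torch

class RequantShiftSketch(torch.nn.Module):
    """Hypothetical requantization layer with configurable arithmetic rounding."""

    def __init__(self, mul, add, div, rounding: bool = True):
        super().__init__()
        self.mul, self.add, self.div = mul, add, div
        self.rounding = rounding  # disable for DORY-targeting flows

    def forward(self, x):
        y = x * self.mul + self.add
        if self.rounding:
            return torch.floor(y / self.div + 0.5)  # round half up (current default behaviour)
        return torch.floor(y / self.div)            # plain flooring division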

Member:
I am unfortunately not very familiar with DORY but for Deeploy we (or at least I) export fused RQS nodes directly.

Reviewer:
We should probably talk with @da-gazzi as well - I know that Georg implemented rounding by adding "half the shift" to the bias; it seems to me like adding 0.5 here does pretty much the same. We should disentangle this a bit before merging, but if there are multiple places where rounding biases are added, we should fold that into one spot.

Member:
I concur with @Scheremo: the only "good" solution is to fuse the rounding with the bias value and not expose this +0.5 here. I do not know how this is handled in Deeploy, but since this is in any case an addition of 0.5 happening after requantization, it cannot really represent an integer op in a bit-true fashion.
Fusing this inside QuantLib avoids any confusion.
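A quick sanity check of the equivalence these comments rely on (assuming the value fed to the division is an integer and the divisor is a positive integer, which is the case after integerization): adding half the divisor to the bias before a flooring division gives the same result as adding 0.5 after it.

import math
import random

random.seed(0)
for _ in range(100_000):
    div = random.choice([8, 16, 255, 257])      # arbitrary positive divisors
    y = random.randint(-(1 << 20), 1 << 20)     # integer accumulator, i.e. x * mul + add
    assert math.floor(y / div + 0.5) == (y + div // 2) // div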

Reviewer:
This also seems related to this issue.

Contributor:
> I concur with @Scheremo: the only "good" solution is to fuse the rounding with the bias value and not expose this +0.5 here. I do not know how this is handled in Deeploy, but since this is in any case an addition of 0.5 happening after requantization, it cannot really represent an integer op in a bit-true fashion. Fusing this inside QuantLib avoids any confusion.

Agree - the idea of the "RequantShift" layer is that it represents the integer operations performed on the device 1:1. The activation rounding is handled by statically adding half an eps to the bias value; adding 0.5 here would achieve the same thing, but it breaks the exported net if you don't use custom nodes. Is there something keeping us from just using the "integer rounding" approach in all cases? It is already configurable, i.e. you can turn it on/off as desired with the rounding flag of the PACTActivation classes.
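For concreteness, a sketch of the "integer rounding" idea described above (illustrative names, not the actual RequantShift/PACT code): folding div // 2 into the additive constant keeps every step an integer op and leaves the exported Mul -> Add -> floor-Div pattern untouched, while still rounding to nearest.

import torch

def requant_shift_int(x, mul, add, div, signed, n_levels, rounding=True):
    # Bit-true integer requantization: the rounding offset is fused into the bias.
    add_eff = add + (div // 2 if rounding else 0)
    y = torch.div(x * mul + add_eff, div, rounding_mode='floor')
    if signed:
        return torch.clamp(y, -(n_levels // 2), (n_levels - 1) // 2)
    return torch.clamp(y, 0, n_levels - 1)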

+             y = torch.floor(y / div)

          if not signed:
              # if unsigned: clip y to interval (0, n_levels-1)
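As background on the comment being removed above ("Avoid round to even behaviour"): torch.round implements round-half-to-even, which is presumably why the original code used floor(x + 0.5) to get round-half-up instead. A two-line illustration:

import torch

x = torch.tensor([0.5, 1.5, 2.5, 3.5])
print(torch.round(x))        # tensor([0., 2., 2., 4.])  round half to even
print(torch.floor(x + 0.5))  # tensor([1., 2., 3., 4.])  round half up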
1 change: 0 additions & 1 deletion backends/cutie/__init__.py
@@ -19,5 +19,4 @@
  # limitations under the License.
  #

- from . import grrules
  from .cutie_export import convert_net, export_net
23 changes: 0 additions & 23 deletions backends/cutie/grrules/__init__.py

This file was deleted.

28 changes: 0 additions & 28 deletions backends/cutie/grrules/ana/__init__.py

This file was deleted.

1,110 changes: 0 additions & 1,110 deletions backends/cutie/grrules/ana/dporules.py

This file was deleted.

127 changes: 0 additions & 127 deletions backends/cutie/grrules/ana/folding.py

This file was deleted.

50 changes: 0 additions & 50 deletions backends/cutie/grrules/ana/lutactivation.py

This file was deleted.

21 changes: 17 additions & 4 deletions backends/dory/dory_passes.py
@@ -116,7 +116,7 @@ def __init__(self):
  class DORYAdder(nn.Module):
      class DORYAdderFun(torch.autograd.Function):
          @staticmethod
-         def forward(ctx, x1, rq1, x2, rq2, rq_out):
+         def forward(ctx, x1, rq1, x2, rq2, rq_out, out_n_levels):
              if rq1:
                  x1 = rq1(x1)
              if rq2:
@@ -127,10 +127,20 @@ def forward(ctx, x1, rq1, x2, rq2, rq_out):
              if rq_out:
                  x_sum = rq_out(x_sum)

+             out_signed = rq_out.signed if rq_out else False
+             if out_signed:
+                 out_min = -(out_n_levels // 2)
+                 out_max = (out_n_levels - 1) // 2
+             else:
+                 out_min = 0
+                 out_max = out_n_levels - 1
+
+             x_sum = torch.clamp(x_sum, out_min, out_max)
+
              return x_sum

          @staticmethod
-         def symbolic(g, x1, rq1, x2, rq2, rq_out):
+         def symbolic(g, x1, rq1, x2, rq2, rq_out, out_n_levels):

              params = {}
              out_signed_inferred = False
@@ -146,7 +156,10 @@ def symbolic(g, x1, rq1, x2, rq2, rq_out):
              mul = 1
              add = 0
              shift = 0
-             n_l = 256
+             if name == "out":
+                 n_l = out_n_levels
+             else:
+                 n_l = 256
              requant = 0
              if name == "out":
                  if module:
@@ -175,7 +188,7 @@ def __init__(self, in1_requant : Optional[nn.Module], in2_requant : Optional[nn.


      def forward(self, x1, x2):
-         return self.DORYAdderFun.apply(x1, self.in1_requant, x2, self.in2_requant, self.out_requant)
+         return self.DORYAdderFun.apply(x1, self.in1_requant, x2, self.in2_requant, self.out_requant, self.out_n_levels)


  class DORYReplaceAddersPass(OpTreeReplacementPass):
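For reference, the bounds the new clamp in DORYAdderFun.forward produces for a few output formats (a quick check mirroring the expressions in the diff above):

def clamp_bounds(n_levels: int, signed: bool):
    # same expressions as in DORYAdderFun.forward above
    if signed:
        return -(n_levels // 2), (n_levels - 1) // 2
    return 0, n_levels - 1

assert clamp_bounds(256, signed=True) == (-128, 127)   # signed 8-bit output
assert clamp_bounds(256, signed=False) == (0, 255)     # unsigned 8-bit output
assert clamp_bounds(3, signed=True) == (-1, 1)         # e.g. a ternary output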
23 changes: 0 additions & 23 deletions backends/twn_accelerator/grrules/__init__.py

This file was deleted.
