
Commit

pre-commit
dan-garvey committed Nov 26, 2024
1 parent 6257639 commit 14e67f6
Showing 1 changed file with 3 additions and 3 deletions.
6 changes: 3 additions & 3 deletions sharktank/sharktank/layers/linear.py
@@ -31,8 +31,8 @@ class LinearLayer(ThetaLayer):
     x = x * premul_input
     matmul(x, weight.T) + bias
-    fake quant only exists in order to allow for q_input to act as qdq.
-    when fake quant is false, q_input will quantize normally.
+    fake quant only exists in order to allow for q_input to act as qdq.
+    when fake quant is false, q_input will quantize normally.
     ```
     """

@@ -80,7 +80,7 @@ def forward(self, x):
         y = ops.linear(x, weight, bias)

         # Unconditionally dequantize.
-        if isinstance(y, QuantizedTensor):
+        if isinstance(y, QuantizedTensor):
             y = y.unpack().dequant()
         # Note that f8_e4m3fnuz types on AMD GPUs accumulate to fp32.
         # We can truncate to fp16 in iree, so we do a cast here
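For context on the docstring lines touched in the first hunk: "fake quant" refers to the usual quantize-dequantize (QDQ) trick. With fake quant enabled, q_input quantizes and immediately dequantizes, so the rest of the layer runs in floating point while still seeing quantization error; with it disabled, q_input quantizes for real. A minimal sketch of the idea, assuming a simple int8 scheme; the function name, scale, and zero point below are illustrative and not taken from sharktank:

```python
import torch

def q_input(x: torch.Tensor, scale: float, zero_point: int, fake_quant: bool):
    """Illustrative QDQ vs. real quantization; not the sharktank implementation."""
    # Quantize onto the int8 grid.
    q = torch.clamp(torch.round(x / scale) + zero_point, -128, 127)
    if fake_quant:
        # QDQ: dequantize immediately, so downstream ops stay in floating
        # point but observe the quantization error.
        return (q - zero_point) * scale
    # Real quantization: return the integer codes (a real kernel would also
    # carry the scale and zero point alongside them).
    return q.to(torch.int8)

x = torch.randn(4, 16)
y_fake = q_input(x, scale=0.05, zero_point=0, fake_quant=True)   # float tensor with rounding error
y_real = q_input(x, scale=0.05, zero_point=0, fake_quant=False)  # int8 codes
```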
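The forward-path lines in the second hunk dequantize any quantized matmul result and note that f8_e4m3fnuz matmuls on AMD GPUs accumulate in fp32, which is then truncated back to fp16. A rough sketch of that last truncation step; the tensor and helper below are made up for illustration, and the `y.unpack().dequant()` call itself is specific to sharktank's QuantizedTensor and is not reproduced here:

```python
import torch

def truncate_accumulator(y: torch.Tensor, target_dtype: torch.dtype = torch.float16) -> torch.Tensor:
    # An f8 matmul accumulates in fp32; once the result is dequantized,
    # cast it back down to the layer's working precision.
    return y.to(target_dtype) if y.dtype == torch.float32 else y

acc = torch.randn(2, 8, dtype=torch.float32)  # stand-in for the fp32 accumulator output
out = truncate_accumulator(acc)
assert out.dtype == torch.float16
```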
