@@ -323,8 +323,8 @@ def forward(ctx, X, weight, weight_scale):
     assert block_size is not None, "block_size is not set"
     if triton.cdiv(m, block_size[0]) != p or triton.cdiv(n, block_size[1]) != q:
         if triton.cdiv(m, block_size[0]) == q and triton.cdiv(n, block_size[1]) == p:
-            # weights are tranposed during backward pass for training :)
-            # We tranpose weight scale to counter that. Note that transposing weight would cause issues with matmul with input X
+            # weights are transposed during backward pass for training :)
+            # We transpose weight scale to counter that. Note that transposing weight would cause issues with matmul with input X
             weight_scale = weight_scale.T
         else:
             raise ValueError(f"Weight shape {weight.shape} and scales shape {weight_scale.shape} is not compatible with block size {block_size}")
@@ -437,8 +437,8 @@ def forward(ctx, X, weight, weight_scale, bias=None):
 
     if triton.cdiv(m, bs_n) != p or triton.cdiv(n, bs_k) != q:
         if triton.cdiv(m, bs_n) == q and triton.cdiv(n, bs_k) == p:
-            # weights are tranposed during backward pass for training :)
-            # We tranpose weight scale to counter that. Note that transposing weight would cause issues with matmul with input X
+            # weights are transposed during backward pass for training :)
+            # We transpose weight scale to counter that. Note that transposing weight would cause issues with matmul with input X
             weight_scale = weight_scale.T
         else:
             raise ValueError(f"Weight shape {weight.shape} and scales shape {weight_scale.shape} is not compatible with block size {block_size}")
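For context, here is a minimal standalone sketch of the shape check both hunks touch. `align_weight_scale` is a hypothetical helper, not a function from this repo, and the local `cdiv` stands in for `triton.cdiv` (ceiling division); the `m, n` / `p, q` names follow the surrounding code. The idea: each scale entry covers one `block_size`-sized tile of the weight, so if the weight arrives transposed (as it does in the backward pass), the scale grid must be transposed too.

```python
import torch

def align_weight_scale(weight, weight_scale, block_size):
    # Hypothetical helper mirroring the check above: the block-wise scale grid
    # must have one entry per block of the weight, i.e. shape
    # (cdiv(m, bs0), cdiv(n, bs1)). If the grid matches the transposed weight
    # instead, transpose the scale rather than the weight (transposing the
    # weight would break the matmul with the input X).
    cdiv = lambda a, b: (a + b - 1) // b  # stand-in for triton.cdiv
    m, n = weight.shape
    p, q = weight_scale.shape
    if cdiv(m, block_size[0]) == p and cdiv(n, block_size[1]) == q:
        return weight_scale  # scale grid already lines up with the weight
    if cdiv(m, block_size[0]) == q and cdiv(n, block_size[1]) == p:
        # Weight was transposed for the backward pass; mirror that in the
        # scale so each scale entry still covers the same weight block.
        return weight_scale.T
    raise ValueError(
        f"Weight shape {weight.shape} and scales shape {weight_scale.shape} "
        f"is not compatible with block size {block_size}"
    )

w = torch.randn(256, 512)         # weight: (m, n)
s = torch.ones(4, 2)              # scale laid out for w.T: (cdiv(512,128), cdiv(256,128))
s = align_weight_scale(w, s, (128, 128))
print(s.shape)                    # torch.Size([2, 4]) -- back in w's block layout
```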