Merge 37f0b41ac6 into 4cc6253d5c

2025-07-18 15:19:09 -04:00 · 2025-05-09 21:17:06 -04:00 · 2025-05-09 21:17:06 -04:00 · 1884be889e
commit 1884be889e
parent 4cc6253d5c 37f0b41ac6
1 changed file with 1 addition and 1 deletion
--- a/inference/kernel.py
+++ b/inference/kernel.py
@@ -32,7 +32,7 @@ def act_quant_kernel(x_ptr, y_ptr, s_ptr, BLOCK_SIZE: tl.constexpr):
 def act_quant(x: torch.Tensor, block_size: int = 128) -> Tuple[torch.Tensor, torch.Tensor]:
    """
-    Quantizes the input tensor `x` using block-wise quantization.
+    Quantizes the input tensor `x` using block-wise quantization as implemented in the given function.
    Args:
        x (torch.Tensor): The input tensor to be quantized. Must be contiguous and its last dimension size must be divisible by `block_size`.