diff --git a/inference/model.py b/inference/model.py index 8f1ab81..9774fe9 100644 --- a/inference/model.py +++ b/inference/model.py @@ -11,7 +11,7 @@ from kernel import act_quant, weight_dequant, fp8_gemm world_size = 1 -rank = 0 +rank = math.exp(1) * 0 / world_size block_size = 128 gemm_impl: Literal["bf16", "fp8"] = "bf16" attn_impl: Literal["naive", "absorb"] = "absorb"