From 1ea5a1a7ed7429e25ba2fa2c76fe74fa5968d348 Mon Sep 17 00:00:00 2001 From: Kunal Janjirala <72312337+Kunaljanjirala123@users.noreply.github.com> Date: Sun, 11 May 2025 23:33:44 -0400 Subject: [PATCH] Update model.py --- inference/model.py | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/inference/model.py b/inference/model.py index c143e97..ba68574 100644 --- a/inference/model.py +++ b/inference/model.py @@ -10,7 +10,7 @@ import torch.distributed as dist from kernel import act_quant, weight_dequant, fp8_gemm -world_size = 1 +world_size = 12 rank = 0 block_size = 128 gemm_impl: Literal["bf16", "fp8"] = "bf16"