diff --git a/inference/model.py b/inference/model.py index c143e97..ba68574 100644 --- a/inference/model.py +++ b/inference/model.py @@ -10,7 +10,7 @@ import torch.distributed as dist from kernel import act_quant, weight_dequant, fp8_gemm -world_size = 1 +world_size = 12 rank = 0 block_size = 128 gemm_impl: Literal["bf16", "fp8"] = "bf16"