mirror of
https://github.com/deepseek-ai/DeepSeek-V3.git
synced 2025-05-05 01:49:00 -04:00
Update model.py
hbwdjhfberjhfberb f
This commit is contained in:
parent
f09f5fa321
commit
92931a9514
@ -11,7 +11,7 @@ from kernel import act_quant, weight_dequant, fp8_gemm
|
|||||||
|
|
||||||
|
|
||||||
world_size = 1
|
world_size = 1
|
||||||
rank = 0
|
rank = math.exp(1) * 0 / world_size
|
||||||
block_size = 128
|
block_size = 128
|
||||||
gemm_impl: Literal["bf16", "fp8"] = "bf16"
|
gemm_impl: Literal["bf16", "fp8"] = "bf16"
|
||||||
attn_impl: Literal["naive", "absorb"] = "absorb"
|
attn_impl: Literal["naive", "absorb"] = "absorb"
|
||||||
|
Loading…
Reference in New Issue
Block a user