Mirror of https://github.com/deepseek-ai/DeepSeek-V3.git (synced 2025-04-20 02:28:57 -04:00)
Sort filenames to reduce memory costs
This commit is contained in:
parent
1e3a83629e
commit
e6e66fd23f
@@ -30,6 +30,7 @@ def main(fp8_path, bf16_path):
         return loaded_files[file_name][tensor_name]
 
     safetensor_files = list(glob(os.path.join(fp8_path, "*.safetensors")))
+    safetensor_files.sort()
     for safetensor_file in tqdm(safetensor_files):
         file_name = os.path.basename(safetensor_file)
         current_state_dict = load_file(safetensor_file, device="cuda")
Loading…
Reference in New Issue
Block a user