mirror of
https://github.com/deepseek-ai/DeepSeek-VL.git
synced 2025-04-19 10:09:09 -04:00
add a utility function to detect platform and suitable dtype
This commit is contained in:
parent
5db8156747
commit
494e622544
@ -27,6 +27,27 @@ from transformers import AutoModelForCausalLM
|
|||||||
from deepseek_vl.models import MultiModalityCausalLM, VLChatProcessor
|
from deepseek_vl.models import MultiModalityCausalLM, VLChatProcessor
|
||||||
|
|
||||||
|
|
||||||
|
def get_device_and_dtype():
    """
    Pick the best available accelerator and a matching dtype.

    Preference order: CUDA (bfloat16) > Apple MPS (float16) > CPU (float32).
    Prints which backend was selected as a side effect.

    Returns:
        tuple[torch.device, torch.dtype]: the selected device and dtype.
    """
    if torch.cuda.is_available():
        print("Using CUDA and BFloat16")
        return torch.device("cuda"), torch.bfloat16
    if torch.backends.mps.is_available():
        print("Using MPS and FP16")
        return torch.device("mps"), torch.float16
    print("Using CPU and FP32")
    return torch.device("cpu"), torch.float32
|
||||||
|
|
||||||
|
|
||||||
def load_pretrained_model(model_path: str):
|
def load_pretrained_model(model_path: str):
|
||||||
vl_chat_processor: VLChatProcessor = VLChatProcessor.from_pretrained(model_path)
|
vl_chat_processor: VLChatProcessor = VLChatProcessor.from_pretrained(model_path)
|
||||||
tokenizer = vl_chat_processor.tokenizer
|
tokenizer = vl_chat_processor.tokenizer
|
||||||
|
Loading…
Reference in New Issue
Block a user