mirror of https://github.com/deepseek-ai/DeepSeek-Coder.git
synced 2025-02-23 14:19:09 -05:00
Update app.py

This commit is contained in:
parent ae27c2cd96
commit dd2f5c83d0

demo/app.py: 25 changed lines (12 additions, 13 deletions)
@@ -21,7 +21,6 @@ This Space demonstrates model [DeepSeek-Coder](https://huggingface.co/deepseek-a
 if not torch.cuda.is_available():
     DESCRIPTION += "\n<p>Running on CPU 🥶 This demo does not work on CPU.</p>"
 
-
 if torch.cuda.is_available():
     model_id = "deepseek-ai/deepseek-coder-6.7b-instruct"
     model = AutoModelForCausalLM.from_pretrained(model_id, torch_dtype=torch.bfloat16, device_map="auto")
@@ -29,7 +28,6 @@ if torch.cuda.is_available():
     tokenizer.use_default_system_prompt = False
 
 
-
 @spaces.GPU
 def generate(
     message: str,
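The context lines above come from the model-setup block of demo/app.py. As a minimal sketch of that setup under the same CUDA guard (the AutoTokenizer load is an assumption; it is not visible in this diff):

import torch
from transformers import AutoModelForCausalLM, AutoTokenizer

if torch.cuda.is_available():
    model_id = "deepseek-ai/deepseek-coder-6.7b-instruct"
    # bfloat16 weights, placed across available GPUs by device_map="auto"
    model = AutoModelForCausalLM.from_pretrained(model_id, torch_dtype=torch.bfloat16, device_map="auto")
    tokenizer = AutoTokenizer.from_pretrained(model_id)  # assumed: not shown in the diff
    tokenizer.use_default_system_prompt = False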
@@ -56,11 +54,12 @@ def generate(
 
     streamer = TextIteratorStreamer(tokenizer, timeout=10.0, skip_prompt=True, skip_special_tokens=True)
     generate_kwargs = dict(
-        {"input_ids": input_ids},
+        input_ids=input_ids,
         streamer=streamer,
         max_new_tokens=max_new_tokens,
-        do_sample=False,
-        num_beams=1,
+        temperature=temperature,
+        top_p=top_p,
+        top_k=top_k,
         repetition_penalty=repetition_penalty,
         eos_token_id=tokenizer.eos_token_id
     )
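The generate_kwargs dict above feeds the standard transformers streaming pattern: model.generate runs on a worker thread while the TextIteratorStreamer is drained incrementally. A minimal sketch of that pattern; the stream_reply helper is hypothetical, and do_sample=True is an assumption (the hunk removes do_sample=False without showing sampling being re-enabled elsewhere):

from threading import Thread

from transformers import TextIteratorStreamer

def stream_reply(model, tokenizer, input_ids, **sampling_kwargs):
    # Hypothetical helper mirroring the body of generate() in app.py.
    streamer = TextIteratorStreamer(tokenizer, timeout=10.0, skip_prompt=True, skip_special_tokens=True)
    generate_kwargs = dict(
        input_ids=input_ids,
        streamer=streamer,
        do_sample=True,  # assumption: needed for temperature/top_p/top_k to take effect
        **sampling_kwargs,
    )
    # generate() blocks, so it runs on a worker thread; the streamer then
    # yields decoded text chunks here as soon as they are produced.
    Thread(target=model.generate, kwargs=generate_kwargs).start()
    for text in streamer:
        yield text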
@@ -70,7 +69,7 @@ def generate(
     outputs = []
     for text in streamer:
         outputs.append(text)
-        yield "".join(outputs).replace("<|EOT|>","")
+        yield "".join(outputs).replace("<|EOT|>", "")
 
 
 chat_interface = gr.ChatInterface(
@@ -84,13 +83,13 @@ chat_interface = gr.ChatInterface(
             step=1,
             value=DEFAULT_MAX_NEW_TOKENS,
         ),
-        # gr.Slider(
-        #     label="Temperature",
-        #     minimum=0,
-        #     maximum=4.0,
-        #     step=0.1,
-        #     value=0,
-        # ),
+        gr.Slider(
+            label="Temperature",
+            minimum=0,
+            maximum=4.0,
+            step=0.1,
+            value=0.6,
+        ),
         gr.Slider(
             label="Top-p (nucleus sampling)",
             minimum=0.05,
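The uncommented Temperature slider rejoins the additional_inputs list of gr.ChatInterface, whose values are passed to generate() after the message and chat history. A minimal sketch of that wiring; the max-token limits and the Top-p bounds beyond minimum=0.05 are assumptions, since the hunk ends there:

import gradio as gr

chat_interface = gr.ChatInterface(
    fn=generate,  # generate(message, history, max_new_tokens, temperature, top_p, ...)
    additional_inputs=[
        gr.Slider(label="Max new tokens", minimum=1, maximum=2048, step=1, value=1024),  # limits assumed
        gr.Slider(label="Temperature", minimum=0, maximum=4.0, step=0.1, value=0.6),  # re-enabled by this commit
        gr.Slider(label="Top-p (nucleus sampling)", minimum=0.05, maximum=1.0, step=0.05, value=0.9),  # upper bound assumed
    ],
)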