mirror of
https://github.com/deepseek-ai/ESFT.git
synced 2025-02-23 06:09:05 -05:00
update readme update readme update readme Update benchmarks.py Update download_adapters.sh Update esft.py
13 lines
382 B
Bash
13 lines
382 B
Bash
# Run scripts/eval.py on the "translation" dataset using the token adapters.
#
# Prerequisite: first download the adapter models and place them in the
# corresponding directories (this command reads them from
# all_models/adapters/token).
#
# Replace REPLACE_WITH_YOUR_KEY with a real OpenAI API key before running.
# NOTE(review): presumably the key is used by the evaluation step to call
# the OpenAI API - confirm against scripts/eval.py.
#
# Every option line must end with a backslash immediately followed by the
# newline; any text between the continued lines breaks the command.
python scripts/eval.py \
    --eval_datasets=translation \
    --base_model_path=deepseek-ai/ESFT-vanilla-lite \
    --adapter_dir=all_models/adapters/token \
    --output_dir=results/completions/token \
    --max_new_tokens=512 \
    --openai_api_key=REPLACE_WITH_YOUR_KEY \
    --eval_batch_size=2