mirror of
https://github.com/deepseek-ai/ESFT
synced 2024-11-22 03:27:38 +00:00
18d23501ab
update readme update readme update readme Update benchmarks.py Update download_adapters.sh Update esft.py
13 lines
382 B
Bash
13 lines
382 B
Bash
# Run scripts/eval.py on the `translation` dataset, using the adapters under
# all_models/adapters/token on top of the deepseek-ai/ESFT-vanilla-lite base
# model, with results/completions/token passed as the output directory.
#
# Prerequisite: first, download the adapter models and put them in the
# corresponding directories (this command expects all_models/adapters/token).
#
# The OpenAI API key is taken from the OPENAI_API_KEY environment variable
# when it is set and non-empty; otherwise the REPLACE_WITH_YOUR_KEY
# placeholder is passed through unchanged, so either export the variable or
# edit the placeholder below before running.
# NOTE(review): what eval.py uses the key for is not visible here - confirm.
python scripts/eval.py \
    --eval_datasets=translation \
    --base_model_path=deepseek-ai/ESFT-vanilla-lite \
    --adapter_dir=all_models/adapters/token \
    --output_dir=results/completions/token \
    --max_new_tokens=512 \
    --openai_api_key="${OPENAI_API_KEY:-REPLACE_WITH_YOUR_KEY}" \
    --eval_batch_size=2
|
|
|