ESFT/scripts/train.sh

12 lines
388 B
Bash
Raw Permalink Normal View History

2024-08-09 08:23:48 +00:00
# Put TOKENIZERS_PARALLELISM=false into the environment of every command
# launched from this script.
TOKENIZERS_PARALLELISM=false
export TOKENIZERS_PARALLELISM
# Experiment name; used below as the sub-path of the --output_dir argument.
exp_name='test/eval_translation'
2024-08-09 10:06:57 +00:00
# Value handed to train.py through --base_model_path.
base_model_path='deepseek-ai/esft-vanilla-lite'
2024-08-09 08:23:48 +00:00
# TODO: turn the above into a for loop.
#
# Launch train.py with the settings defined above. --output_dir is set to
# results/checkpoints/<exp_name>.
# Variable expansions are double-quoted so a value containing whitespace or
# glob characters is passed to train.py as exactly one argument.
python train.py \
  --base_model_path="${base_model_path}" \
  --expert_config=results/expert_configs/translation.json \
  --train_dataset=translation \
  --train_config=configs/base.yaml \
  --output_dir="results/checkpoints/${exp_name}"