Files
verl/examples/sft/gsm8k/run_gemma_2b.sh
2024-10-31 14:29:44 +08:00

18 lines
616 B
Bash

# Tested in 4 GPUs
set -x
hdfs_path=hdfs://user/verl/experiments/gsm8k/gemma-2b-it/ # replace to your own hdfs/local path
TORCHRUN -m verl.trainer.fsdp_sft_trainer \
data.train_files=$HOME/data/gsm8k/train.parquet \
data.val_files=$HOME/data/gsm8k/test.parquet \
data.prompt_key=question \
data.response_key=answer \
data.micro_batch_size=32 \
model.partial_pretrain=google/gemma-2b-it \
trainer.default_hdfs_dir=$hdfs_path \
trainer.project_name=gsm8k-sft \
trainer.experiment_name=gsm8k-sft-gemma-2b-it \
trainer.total_epochs=3 \
trainer.logger=['console','tracking']