# Mirror of https://github.com/volcengine/verl.git
# Synced 2025-10-20 13:43:50 +08:00
# Original file: 18 lines, 616 B, Bash
# Supervised fine-tuning (SFT) of google/gemma-2b-it on GSM8K with verl's
# FSDP SFT trainer, launched through torchrun on a single node.
#
# Usage: bash <this-script> [nproc_per_node]
#   nproc_per_node  Number of worker processes to start on this node.
#                   Defaults to 4 (the configuration was tested on 4 GPUs).
#
# Reads the dataset from $HOME/data/gsm8k/{train,test}.parquet.

# -e: stop on the first failing command; -u: fail on unset variables
# (e.g. HOME); -x: trace the fully expanded launch command.
set -eux

nproc_per_node=${1:-4}

# Replace with your own HDFS/local path.
hdfs_path=hdfs://user/verl/experiments/gsm8k/gemma-2b-it/

# The launcher is the lower-case `torchrun` executable; command lookup is
# case-sensitive. Without --nproc_per_node torchrun starts one process only.
#
# The trainer.logger override is quoted as a whole so the shell neither
# treats [...] as a glob pattern nor splits the word; the trainer receives
# exactly `trainer.logger=[console,tracking]`.
torchrun --standalone --nnodes=1 --nproc_per_node="$nproc_per_node" \
  -m verl.trainer.fsdp_sft_trainer \
  data.train_files="$HOME/data/gsm8k/train.parquet" \
  data.val_files="$HOME/data/gsm8k/test.parquet" \
  data.prompt_key=question \
  data.response_key=answer \
  data.micro_batch_size=32 \
  model.partial_pretrain=google/gemma-2b-it \
  trainer.default_hdfs_dir="$hdfs_path" \
  trainer.project_name=gsm8k-sft \
  trainer.experiment_name=gsm8k-sft-gemma-2b-it \
  trainer.total_epochs=3 \
  'trainer.logger=[console,tracking]'