mirror of
https://github.com/volcengine/verl.git
synced 2025-10-20 13:43:50 +08:00
17 lines
583 B
Bash
17 lines
583 B
Bash
# Launch verl's generation entry point (verl.trainer.main_generation) with a
# fixed set of key=value configuration overrides.
#
# The overrides are collected in an array so they can be grouped and commented;
# each element is passed to Python as exactly one argument.
#
# NOTE(review): the group headings below are inferred from the key names only;
# confirm against the verl generation config before relying on them.
gen_args=(
  # Cluster shape.
  trainer.nnodes=1
  trainer.n_gpus_per_node=8

  # Input prompts and output location.
  # ${HOME} is used instead of "~": bash performs tilde expansion only at the
  # start of a word or after "=" in a valid variable assignment, and
  # "data.path" is not a valid shell variable name, so "~" would be handed to
  # Python unexpanded.
  "data.path=${HOME}/data/rlhf/gsm8k/test.parquet"
  data.prompt_key=prompt
  data.n_samples=1
  # NOTE(review): the output file name mentions "math" and "deepseek_v2_lite"
  # while the input is gsm8k and the model is deepseek-llm-7b-chat; the path is
  # kept as-is, confirm whether that naming is intentional.
  "data.output_path=${HOME}/data/rlhf/math/deepseek_v2_lite_gen_test.parquet"

  # Model.
  model.path=deepseek-ai/deepseek-llm-7b-chat
  # The leading "+" is presumably Hydra's "add a key that is not in the base
  # config" syntax -- TODO confirm.
  +model.trust_remote_code=True

  # Rollout / sampling settings.
  rollout.temperature=1.0
  rollout.top_k=50
  rollout.top_p=0.7
  rollout.prompt_length=2048
  rollout.response_length=1024
  rollout.tensor_model_parallel_size=2
  rollout.gpu_memory_utilization=0.8
)

python3 -m verl.trainer.main_generation "${gen_args[@]}"