!27 added example yaml files for qwen2.5 distillation and deepseek-r1-distill-qwen sft

Merge pull request !27 from A1waysBeenHere/master
This commit is contained in:
A1waysBeenHere
2025-02-14 03:16:16 +00:00
committed by i-robot
parent 46cef0fedd
commit a868d0ab84
4 changed files with 59 additions and 3 deletions

View File

@ -0,0 +1,28 @@
# Example config: full-parameter SFT of DeepSeek-r1-distill-qwen-7b on alpaca_zh_51k.
# model
model_id: DeepSeek-r1-distill-qwen-7b
# method
stage: sft
do_train: true
finetuning_type: full
deepspeed: examples/deepspeed/ds_z2_config.json
# dataset
dataset: alpaca_zh_51k
cutoff_len: 1024
template: deepseek_r1
# output
# The directory suffix matches finetuning_type (full). With overwrite_output_dir
# enabled, reusing the "_lora" directory of the LoRA example would let the two
# runs overwrite each other's results.
output_dir: saves/deepseek_r1_distill_qwen_7b_full
logging_steps: 1
# save_steps is equal to max_steps below.
save_steps: 5000
overwrite_output_dir: true
# train
per_device_train_batch_size: 8
learning_rate: 1.0e-5
lr_scheduler_type: cosine
warmup_ratio: 0.1
bf16: true
max_steps: 5000
# Fixed seed so repeated runs of this example use the same random seed.
seed: 1234

View File

@ -15,7 +15,7 @@ template: deepseek_r1
# output
output_dir: saves/deepseek_r1_distill_qwen_7b_lora
logging_steps: 1
save_steps: 500
save_steps: 5000
overwrite_output_dir: true
# train
@ -24,5 +24,5 @@ learning_rate: 1.0e-5
lr_scheduler_type: cosine
warmup_ratio: 0.1
bf16: true
max_steps: 2000
max_steps: 5000
seed: 1234

View File

@ -13,7 +13,7 @@ cutoff_len: 1024
template: deepseek_r1
# output
output_dir: saves/qwen2.5_7b_chat_lora
output_dir: saves/qwen2.5_7b_chat_distill_full
logging_steps: 1
save_steps: 20000
overwrite_output_dir: true

View File

@ -0,0 +1,28 @@
# Example config: LoRA SFT of Qwen2.5-7B-Chat on the sky_t1_17k dataset,
# formatted with the deepseek_r1 template.
# model
model_id: Qwen2.5-7B-Chat
# method
stage: sft
do_train: true
finetuning_type: lora
deepspeed: examples/deepspeed/ds_z2_config.json
# dataset
dataset: sky_t1_17k
cutoff_len: 1024
template: deepseek_r1
# output
output_dir: saves/qwen2.5_7b_chat_distill_lora
logging_steps: 1
# NOTE(review): save_steps (20000) is larger than max_steps (5000) below, so the
# periodic save interval is never reached within this run — presumably only a
# final save is intended; confirm against the trainer's behavior.
save_steps: 20000
overwrite_output_dir: true
# train
per_device_train_batch_size: 8
learning_rate: 1.0e-5
lr_scheduler_type: cosine
warmup_ratio: 0.1
bf16: true
max_steps: 5000
seed: 1234