lllqaq committed on
Commit
beeb832
·
verified ·
1 Parent(s): 514f6ac

Upload train_r2egym_14B_agent.yaml

Browse files
Files changed (1) hide show
  1. train_r2egym_14B_agent.yaml +41 -0
train_r2egym_14B_agent.yaml ADDED
@@ -0,0 +1,41 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ ### model
2
+ model_name_or_path: Qwen/Qwen2.5-Coder-14B-instruct
3
+ trust_remote_code: true
4
+
5
+ ### method
6
+ stage: sft
7
+ do_train: true
8
+ finetuning_type: full
9
+ deepspeed: examples/deepspeed/ds_z3_offload_config.json
10
+
11
+ ### dataset
12
+ dataset: R2E-Gym/R2EGym-SFT-Trajectories
13
+ template: qwen
14
+ cutoff_len: 13000
15
+ max_samples: 100000
16
+ overwrite_cache: true
17
+ preprocessing_num_workers: 16
18
+
19
+ ### output
20
+ output_dir: saves/R2EGym-14B-Agent
21
+ logging_steps: 10
22
+ save_steps: 10000
23
+ plot_loss: true
24
+ overwrite_output_dir: false
25
+
26
+ ### train
27
+ flash_attn: fa2
28
+ enable_liger_kernel: true
29
+ use_unsloth_gc: true
30
+ per_device_train_batch_size: 1
31
+ gradient_accumulation_steps: 1
32
+ learning_rate: 1.0e-5
33
+ num_train_epochs: 2.0
34
+ lr_scheduler_type: cosine
35
+ warmup_ratio: 0.1
36
+ bf16: true
37
+ ddp_timeout: 180000000
38
+
39
+ ### wandb
40
+ report_to: none
41
+ run_name: R2EGym-14B-Agent