mveroe committed on
Commit
4b22e1b
·
verified ·
1 Parent(s): 92ac657

Upload training_config.yaml with huggingface_hub

Browse files
Files changed (1) hide show
  1. training_config.yaml +38 -0
training_config.yaml ADDED
@@ -0,0 +1,38 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ add_think_tokens: true
2
+ chat_version: Qwen/Qwen2.5-1.5B-Instruct
3
+ custom_name: lightr1_3_EN_1024
4
+ dataset: Light-R1
5
+ hf_username: mveroe
6
+ max_length: 1024
7
+ mixup:
8
+ FPR: 0.0
9
+ TPR: 1.0
10
+ generator_accuracy: 1.0
11
+ model_name: Qwen/Qwen2.5-1.5B
12
+ neptune_project: ethsri/label-noise
13
+ pretrained_model: true
14
+ seed: 42
15
+ set_seed: false
16
+ shuffle: true
17
+ training_args:
18
+ bf16: true
19
+ ddp_find_unused_parameters: false
20
+ gradient_accumulation_steps: 4
21
+ hub_strategy: all_checkpoints
22
+ learning_rate: 5.0e-05
23
+ logging_first_step: true
24
+ logging_steps: 1
25
+ logging_strategy: steps
26
+ lr_scheduler_type: cosine
27
+ num_train_epochs: 3
28
+ optim: adafactor
29
+ overwrite_output_dir: true
30
+ per_device_train_batch_size: 4
31
+ push_to_hub: true
32
+ report_to: none
33
+ save_strategy: epoch
34
+ seed: 42
35
+ warmup_ratio: 0.1
36
+ training_type: !!python/object/apply:src.configs.TrainingTypes
37
+ - sft
38
+ use_neptune: true