# Diff summary (from the web diff viewer): 1 file changed, +58 -0 lines changed.
# LoRA fine-tuning configuration.
# Reconstructed from a diff view: the per-line "+" markers and interleaved
# diff line numbers were removed and the nesting under `datasets` restored.
# Keys left with an empty value are intentionally unset (they load as null).

base_model: agentica-org/DeepCoder-14B-Preview
# Automatically upload checkpoint and final model to HF
# hub_model_id: username/custom_model_name

# Quantized loading: 8-bit enabled, 4-bit disabled.
load_in_8bit: true
load_in_4bit: false
strict: false

# Training data: one chat-template dataset whose `messages` field holds the
# conversation; role/content properties map to themselves.
datasets:
  - path: fozziethebeat/alpaca_messages_2k_test
    type: chat_template
    field_messages: messages
    message_property_mappings:
      role: role
      content: content

dataset_prepared_path:
val_set_size: 0.05
output_dir: ./outputs/lora-out

# Sequence handling: packing is on for training and off for evaluation.
sequence_len: 4096
sample_packing: true
eval_sample_packing: false
pad_to_sequence_len: true

# LoRA adapter settings.
adapter: lora
lora_model_dir:
lora_r: 32
lora_alpha: 16
lora_dropout: 0.05
lora_target_linear: true

# All wandb_* keys are left unset.
wandb_project:
wandb_entity:
wandb_watch:
wandb_name:
wandb_log_model:

# Batch size, optimizer, and learning-rate schedule.
gradient_accumulation_steps: 2
micro_batch_size: 2
num_epochs: 4
optimizer: adamw_bnb_8bit
lr_scheduler: cosine
learning_rate: 0.0002

# Precision settings.
bf16: auto
tf32: true

gradient_checkpointing: true
resume_from_checkpoint:
logging_steps: 1
flash_attention: true

# Warmup, evaluation/save cadence, and regularization.
warmup_steps: 10
evals_per_epoch: 1
saves_per_epoch: 1
weight_decay: 0.0
special_tokens:
# You can’t perform that action at this time.
# 0 commit comments