Alignment-Lab-AI committed on
Commit
4485b33
1 Parent(s): 35436fb

Upload config.yml

Browse files
Files changed (1) hide show
  1. config.yml +72 -0
config.yml ADDED
@@ -0,0 +1,72 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ base_model: openchat/openchat_3.5
2
+ model_type: MistralForCausalLM
3
+ tokenizer_type: LlamaTokenizer
4
+ is_mistral_derived_model: true
5
+
6
+ load_in_8bit: false
7
+ load_in_4bit: false
8
+ strict: false
9
+
10
+ datasets:
11
+ - path: FrederikH/LinearAlgebra-Python
12
+ type: alpaca
13
+ dataset_prepared_path:
14
+ val_set_size: 0.05
15
+ output_dir: ./out
16
+
17
+ sequence_len: 8192
18
+ sample_packing: true
19
+ pad_to_sequence_len: true
20
+
21
+ wandb_project:
22
+ wandb_entity:
23
+ wandb_watch:
24
+ wandb_run_id:
25
+ wandb_log_model:
26
+
27
+ gradient_accumulation_steps: 8
28
+ micro_batch_size: 4
29
+ num_epochs: 4
30
+ optimizer: adamw_bnb_8bit
31
+ lr_scheduler: cosine
32
+ learning_rate: 0.000005
33
+
34
+ train_on_inputs: false
35
+ group_by_length: false
36
+ bf16: true
37
+ fp16: false
38
+ tf32: false
39
+
40
+ gradient_checkpointing: true
41
+ early_stopping_patience:
42
+ resume_from_checkpoint:
43
+ local_rank:
44
+ logging_steps: 1
45
+ xformers_attention:
46
+
47
+ warmup_steps: 10
48
+ eval_table_size:
49
+ eval_table_max_new_tokens: 128
50
+
51
+ debug:
52
+ deepspeed:
53
+ fsdp:
54
+ fsdp_config:
55
+ special_tokens:
56
+ bos_token: "<s>"
57
+ eos_token: "</s>"
58
+ unk_token: "<unk>"
59
+
60
+ bench_dataset: pharaouk/dharma-1/dharma_1_mini.json
61
+ do_bench_eval: true
62
+
63
+ push_to_hub: true
64
+ hub_model_id: FrederikH/linear-algebra
65
+ hub_strategy: "every_save"
66
+ hub_token:
67
+
68
+ flash_attention: true
69
+ weight_decay: 0.01
70
+
71
+ eval_steps: 1
72
+ save_steps: 1