KogoroTop committed on
Commit
5f69988
1 Parent(s): 9448c3f

Upload training_config.yml with huggingface_hub

Browse files
Files changed (1) hide show
  1. training_config.yml +83 -0
training_config.yml ADDED
@@ -0,0 +1,83 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ model:
2
+ _component_: models.lora_mmllama3_8b
3
+ lora_attn_modules:
4
+ - q_proj
5
+ - v_proj
6
+ apply_lora_to_mlp: false
7
+ apply_lora_to_output: false
8
+ lora_rank: 16
9
+ lora_alpha: 32
10
+ perception_tokens: 2
11
+ use_clip: false
12
+ tokenizer:
13
+ _component_: models.a2a_tokenizer
14
+ path: models/tokenizer.model
15
+ checkpointer:
16
+ _component_: torchtune.utils.FullModelMetaCheckpointer
17
+ checkpoint_dir: /workspace/omega_a2a/training
18
+ checkpoint_files:
19
+ - consolidated.00.pth
20
+ adapter_checkpoint: null
21
+ recipe_checkpoint: null
22
+ output_dir: /workspace/omega_a2a/checkpoints
23
+ model_type: LLAMA3
24
+ resume_from_checkpoint: false
25
+ interim_checkpoint_steps: 5000
26
+ interim_gen_steps: null
27
+ max_new_tokens: 100
28
+ dataset:
29
+ _component_: ds.EvenBatcher
30
+ buffer_size: 36
31
+ dataset:
32
+ _component_: ds.RoundRobinDataset
33
+ datasets:
34
+ - _component_: ds.OmegaVideoCaptionDataset
35
+ length: 500000
36
+ - _component_: ds.LlavaInstructDataset
37
+ dataset_path: ds/coco_llava_instruct/output.parquet
38
+ train_on_input: false
39
+ - _component_: ds.LlavaInstructDataset
40
+ dataset_path: ds/vision_flan/output.parquet
41
+ train_on_input: false
42
+ - _component_: ds.CaptionInstructDataset
43
+ dataset_path: ds/sam_llava/output.parquet
44
+ train_on_input: false
45
+ seed: null
46
+ shuffle: true
47
+ batch_size: 4
48
+ optimizer:
49
+ _component_: torch.optim.AdamW
50
+ weight_decay: 0.0001
51
+ lr: 3.0e-05
52
+ lr_scheduler:
53
+ _component_: torchtune.modules.get_cosine_schedule_with_warmup
54
+ num_warmup_steps: 100
55
+ loss:
56
+ _component_: torch.nn.CrossEntropyLoss
57
+ epochs: 6
58
+ max_steps_per_epoch: null
59
+ gradient_accumulation_steps: 64
60
+ compile: false
61
+ temperature: 0.2
62
+ top_k: 100
63
+ output_dir: /tmp/lora_finetune_output
64
+ metric_logger:
65
+ _component_: torchtune.utils.metric_logging.DiskLogger
66
+ log_dir: ${output_dir}
67
+ log_every_n_steps: null
68
+ device: cuda
69
+ dtype: bf16
70
+ enable_activation_checkpointing: false
71
+ profiler:
72
+ _component_: torchtune.utils.profiler
73
+ enabled: false
74
+ inference:
75
+ prompt_template: 'Video:
76
+
77
+ {video}
78
+
79
+ Caption the previous video.'
80
+ max_new_tokens: 100
81
+ temperature: 0.6
82
+ top_k: 170
83
+ quantizer: null