LittletreeZou committed on
Commit
b46691b
·
1 Parent(s): 2dd29cd

initial upload

Browse files
Files changed (2) hide show
  1. config.yaml +224 -0
  2. model.ckpt +3 -0
config.yaml ADDED
@@ -0,0 +1,224 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ # lightning.pytorch==2.4.0
2
+ seed_everything: 42
3
+ trainer:
4
+ accelerator: auto
5
+ strategy:
6
+ class_path: lightning.pytorch.strategies.DDPStrategy
7
+ init_args:
8
+ accelerator: null
9
+ parallel_devices: null
10
+ cluster_environment: null
11
+ checkpoint_io: null
12
+ precision_plugin: null
13
+ ddp_comm_state: null
14
+ ddp_comm_hook: null
15
+ ddp_comm_wrapper: null
16
+ model_averaging_period: null
17
+ process_group_backend: null
18
+ timeout: 0:30:00
19
+ start_method: popen
20
+ output_device: null
21
+ dim: 0
22
+ broadcast_buffers: true
23
+ process_group: null
24
+ bucket_cap_mb: 25
25
+ find_unused_parameters: false
26
+ check_reduction: false
27
+ gradient_as_bucket_view: false
28
+ static_graph: false
29
+ delay_all_reduce_named_params: null
30
+ param_to_hook_all_reduce: null
31
+ mixed_precision: null
32
+ device_mesh: null
33
+ devices: auto
34
+ num_nodes: 1
35
+ precision: 32
36
+ logger:
37
+ class_path: lightning.pytorch.loggers.WandbLogger
38
+ init_args:
39
+ name: ssp_proteinmoe_16B
40
+ save_dir: lightning_logs/protein
41
+ version: null
42
+ offline: false
43
+ dir: null
44
+ id: null
45
+ anonymous: null
46
+ project: xtrimo_benchmark_gbft_reproduction
47
+ log_model: false
48
+ experiment: null
49
+ prefix: ''
50
+ checkpoint_name: null
51
+ job_type: null
52
+ config: null
53
+ entity: null
54
+ reinit: null
55
+ tags: null
56
+ group: null
57
+ notes: null
58
+ magic: null
59
+ config_exclude_keys: null
60
+ config_include_keys: null
61
+ mode: null
62
+ allow_val_change: null
63
+ resume: null
64
+ force: null
65
+ tensorboard: null
66
+ sync_tensorboard: null
67
+ monitor_gym: null
68
+ save_code: true
69
+ fork_from: null
70
+ resume_from: null
71
+ settings: null
72
+ callbacks:
73
+ - class_path: lightning.pytorch.callbacks.LearningRateMonitor
74
+ init_args:
75
+ logging_interval: step
76
+ log_momentum: false
77
+ log_weight_decay: false
78
+ - class_path: lightning.pytorch.callbacks.ModelCheckpoint
79
+ init_args:
80
+ dirpath: genbio_finetune/logs/xtrimo_benchmark_gbft_reproduction/ssp_proteinmoe_16B
81
+ filename: best_val:{epoch}-{val_accuracy:.3f}
82
+ monitor: val_accuracy
83
+ verbose: false
84
+ save_last: null
85
+ save_top_k: 1
86
+ save_weights_only: false
87
+ mode: max
88
+ auto_insert_metric_name: true
89
+ every_n_train_steps: null
90
+ train_time_interval: null
91
+ every_n_epochs: 1
92
+ save_on_train_epoch_end: null
93
+ enable_version_counter: true
94
+ fast_dev_run: false
95
+ max_epochs: 15
96
+ min_epochs: null
97
+ max_steps: -1
98
+ min_steps: null
99
+ max_time: null
100
+ limit_train_batches: null
101
+ limit_val_batches: null
102
+ limit_test_batches: null
103
+ limit_predict_batches: null
104
+ overfit_batches: 0.0
105
+ val_check_interval: null
106
+ check_val_every_n_epoch: 1
107
+ num_sanity_val_steps: null
108
+ log_every_n_steps: 50
109
+ enable_checkpointing: null
110
+ enable_progress_bar: null
111
+ enable_model_summary: null
112
+ accumulate_grad_batches: 1
113
+ gradient_clip_val: 0.01
114
+ gradient_clip_algorithm: null
115
+ deterministic: null
116
+ benchmark: null
117
+ inference_mode: true
118
+ use_distributed_sampler: true
119
+ profiler:
120
+ class_path: lightning.pytorch.profilers.PyTorchProfiler
121
+ init_args:
122
+ dirpath: null
123
+ filename: null
124
+ group_by_input_shapes: false
125
+ emit_nvtx: false
126
+ export_to_chrome: true
127
+ row_limit: 20
128
+ sort_by_key: null
129
+ record_module_names: true
130
+ table_kwargs: null
131
+ record_shapes: false
132
+ dict_kwargs:
133
+ profile_memory: true
134
+ detect_anomaly: false
135
+ barebones: false
136
+ plugins: null
137
+ sync_batchnorm: false
138
+ reload_dataloaders_every_n_epochs: 0
139
+ default_root_dir: null
140
+ model:
141
+ class_path: genbio_finetune.tasks.TokenClassification
142
+ init_args:
143
+ adapter:
144
+ class_path: genbio_finetune.models.MLPAdapter
145
+ init_args:
146
+ hidden_sizes:
147
+ - 128
148
+ bias: true
149
+ dropout: 0.1
150
+ dropout_in_middle: true
151
+ backbone:
152
+ class_path: genbio_finetune.models.proteinfm
153
+ init_args:
154
+ from_scratch: false
155
+ max_length: 512
156
+ use_peft: true
157
+ save_peft_only: true
158
+ lora_r: 16
159
+ lora_alpha: 16
160
+ lora_dropout: 0.0
161
+ lora_target_modules:
162
+ - query
163
+ - value
164
+ - key
165
+ - dense
166
+ - router
167
+ lora_modules_to_save: null
168
+ lora_use_rslora: true
169
+ config_overwrites:
170
+ hidden_dropout_prob: 0
171
+ attention_probs_dropout_prob: 0
172
+ model_init_args: null
173
+ n_classes: 3
174
+ optimizer:
175
+ class_path: torch.optim.AdamW
176
+ init_args:
177
+ lr: 0.0001
178
+ betas:
179
+ - 0.9
180
+ - 0.95
181
+ eps: 1.0e-08
182
+ weight_decay: 0.0
183
+ amsgrad: false
184
+ maximize: false
185
+ foreach: null
186
+ capturable: false
187
+ differentiable: false
188
+ fused: null
189
+ lr_scheduler:
190
+ class_path: genbio_finetune.lr_schedulers.CosineWithWarmup
191
+ init_args:
192
+ warmup_ratio: 0.05
193
+ num_warmup_steps: null
194
+ last_epoch: -1
195
+ verbose: deprecated
196
+ use_legacy_adapter: false
197
+ strict_loading: true
198
+ reset_optimizer_states: false
199
+ data:
200
+ class_path: genbio_finetune.data.SspQ3
201
+ init_args:
202
+ path: biomap-research/ssp_q3
203
+ batch_size: 1
204
+ max_length: 512
205
+ config_name: null
206
+ train_split_name: train
207
+ test_split_name: test
208
+ valid_split_name: null
209
+ train_split_files: null
210
+ test_split_files: null
211
+ valid_split_files: null
212
+ test_split_size: null
213
+ valid_split_size: 0.1
214
+ random_seed: 42
215
+ shuffle: true
216
+ sampler: null
217
+ num_workers: 0
218
+ pin_memory: true
219
+ persistent_workers: false
220
+ cv_num_folds: 1
221
+ cv_test_fold_id: 0
222
+ cv_enable_val_fold: true
223
+ cv_fold_id_col: null
224
+ ckpt_path: null
model.ckpt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a6412b442f3944d73235c01bb2d5d4f485ccc3fa24ee3a16f96b66f7bec1e9c8
3
+ size 147679193