owl-con-demo / owl-con /params.txt
Hritik
add owl-con ckpt
0187095
raw
history blame
925 Bytes
adam_beta1: 0.9
adam_beta2: 0.999
adam_eps: 1e-08
all_params: True
bf16: True
clip_grad: 1.0
ddp_find_unused_parameters: False
do_train: True
eval_iters: 100
finetuned_ckpt: None
gradient_accumulation_steps: 1
gradient_checkpointing: True
inference_mode: False
local_rank: 0
logging_nan_inf_filter: False
lora_alpha: 32
lora_dropout: 0.05
lora_r: 32
loss_objective: sequential
lr: 0.0001
micro_batch_size: 16
min_lr: 1e-07
mm_config: configs/video_mix.yaml
num_training_steps: 4236
num_warmup_steps: 200
num_workers: 32
pretrained_ckpt: /local2/hbansal/video_text/mplug-owl-llama-7b-video
save_interval: None
save_path: /local2/hbansal/video_text/mplugowl_wipeout_data_second_stage_lora_all_params_32_sequential_mix_1e-4/
seq_length: 256
train_epochs: 2
train_visual_abstractor: False
use_lora: True
use_qv: False
wandb_run_name: mplugowl_wipeout_data_second_stage_lora_all_params_32_sequential_mix_1e-4
weight_decay: 0.0001