Spaces:
Sleeping
Sleeping
adam_beta1: 0.9 | |
adam_beta2: 0.999 | |
adam_eps: 1e-08 | |
all_params: True | |
bf16: True | |
clip_grad: 1.0 | |
ddp_find_unused_parameters: False | |
do_train: True | |
eval_iters: 100 | |
finetuned_ckpt: None | |
gradient_accumulation_steps: 1 | |
gradient_checkpointing: True | |
inference_mode: False | |
local_rank: 0 | |
logging_nan_inf_filter: False | |
lora_alpha: 32 | |
lora_dropout: 0.05 | |
lora_r: 32 | |
loss_objective: sequential | |
lr: 0.0001 | |
micro_batch_size: 16 | |
min_lr: 1e-07 | |
mm_config: configs/video_mix.yaml | |
num_training_steps: 4236 | |
num_warmup_steps: 200 | |
num_workers: 32 | |
pretrained_ckpt: /local2/hbansal/video_text/mplug-owl-llama-7b-video | |
save_interval: None | |
save_path: /local2/hbansal/video_text/mplugowl_wipeout_data_second_stage_lora_all_params_32_sequential_mix_1e-4/ | |
seq_length: 256 | |
train_epochs: 2 | |
train_visual_abstractor: False | |
use_lora: True | |
use_qv: False | |
wandb_run_name: mplugowl_wipeout_data_second_stage_lora_all_params_32_sequential_mix_1e-4 | |
weight_decay: 0.0001 | |