wandb_project: joy-caption-1
device_batch_size: 2
batch_size: 256
learning_rate: 0.0002
warmup_samples: 18000
max_samples: 500000
save_every: 50000
test_every: 50000
use_amp: true
grad_scaler: true
lr_scheduler_type: cosine
min_lr_ratio: 0.0
allow_tf32: true
seed: 69
num_workers: 8
optimizer_type: adamw
adam_beta1: 0.9
adam_beta2: 0.999
adam_eps: 1.0e-08
adam_weight_decay: 0.0
clip_grad_norm: 1.0
dataset: fancyfeast/joy-captioning-20240917a
clip_model: google/siglip-so400m-patch14-384
text_model: meta-llama/Meta-Llama-3.1-8B
resume: null
gradient_checkpointing: false
test_size: 2048
grad_scaler_init: 65536.0
max_caption_length: 257
num_image_tokens: 32
adapter_type: mlp
text_model_dtype: bfloat16
pre_test: false
train_image_model: true
image_model_lr: null
train_lora: true
lora_r: 64
lora_alpha: 16
lora_dropout: 0.1