# Training run configuration: a flat mapping of scalar options.
# NOTE(review): the group headings and remarks below are inferred from the key
# names only; confirm exact semantics against the script that consumes this file.

# Experiment tracking
wandb_project: joy-caption-1

# Batching
device_batch_size: 2
batch_size: 256

# Schedule (keys suffixed `_samples` / `_every` are presumably counted in
# samples, not optimizer steps -- TODO confirm)
learning_rate: 0.0002
warmup_samples: 18000
max_samples: 600000
save_every: 50000
test_every: 50000

# Precision and LR scheduler
use_amp: true
grad_scaler: true
lr_scheduler_type: cosine
min_lr_ratio: 0.0
allow_tf32: true

# Reproducibility and data loading
seed: 69
num_workers: 8

# Optimizer
optimizer_type: adamw
adam_beta1: 0.9
adam_beta2: 0.999
adam_eps: 1.0e-08
adam_weight_decay: 0.0
clip_grad_norm: 1.0

# Data and model sources
dataset: fancyfeast/joy-captioning-20240924a
clip_model: google/siglip-so400m-patch14-384
# Relative path: what it resolves against depends on the consumer -- verify.
text_model: ../lora-train/lora_model_vwbzycxh
resume: null

# Training options
gradient_checkpointing: false
test_size: 2048
grad_scaler_init: 65536.0
max_caption_length: 257
num_image_tokens: 32
adapter_type: mlp
text_model_dtype: bfloat16
pre_test: false

# Image model
train_image_model: true
# null here; presumably the consumer falls back to `learning_rate` -- verify.
image_model_lr: null

# LoRA
train_lora: true
lora_r: 64
lora_alpha: 16
lora_dropout: 0.1