{
  "model_cfg": {
    "seed": 42,
    "max_length": 200,
    "image_encoder": "vit_large_patch14_clip_336",
    "text_encoder": "sartifyllc/AviLaBSE",
    "text_tokenizer": "sartifyllc/AviLaBSE",
    "flip_ratio": 0.5,
    "tensor_ratio": 1.0,
    "imgs_pixels": 255.0,
    "image_size": 336,
    "batch_size": 4,
    "num_workers": 4,
    "num_projection_layers": 1,
    "projection_dim": 256,
    "dropout": 0.1,
    "image_embedding": 1024,
    "text_embedding": 768,
    "temperature": 1.0,
    "head_lr": 0.001,
    "image_encoder_lr": 0.0001,
    "text_encoder_lr": 1e-05,
    "weight_decay": 0.001,
    "patience": 1,
    "factor": 0.8,
    "epochs": 2,
    "context_length": 512
  },
  "preprocess_cfg": {
    "mean": [
      0.48145466,
      0.4578275,
      0.40821073
    ],
    "std": [
      0.26862954,
      0.26130258,
      0.27577711
    ]
  }
}