accum_freq: 1 aug_cfg: {} batch_size: 2816 beta1: 0.9 beta2: 0.98 checkpoint_path: /tmp/restart_2017/datacomp_xlarge-basic_cumulative_seq_2017/checkpoints coca_caption_loss_weight: 2.0 coca_contrastive_loss_weight: 1.0 copy_codebase: False csv_caption_key: title csv_img_key: filepath csv_separator: dataset_resampled: True dataset_type: webdataset ddp_static_graph: True debug: False decay_fraction: 0.2 delete_previous_checkpoint: False device: cuda:0 dist_backend: nccl dist_url: env:// distill: False distill_model: None distill_pretrained: None distributed: True epochs: 32 epochs_cooldown: None eps: 1e-06 force_custom_text: False force_image_size: None force_patch_dropout: None force_qk_norm: False force_qk_norm_eps: 1e-05 force_quick_gelu: False gather_with_grad: True grad_checkpointing: True grad_clip_norm: None horovod: False image_mean: None image_std: None imagenet_v2: None imagenet_val: ../imagenet_validation is_iteration_based: True local_loss: True local_rank: 0 lock_image: False lock_image_freeze_bn_stats: False lock_image_unlocked_groups: 0 lock_text: False lock_text_freeze_layer_norm: False lock_text_unlocked_layers: 0 log_every_n_steps: 100 log_level: 20 log_local: False log_path: /tmp/restart_2017/datacomp_xlarge-basic_cumulative_seq_2017/out.log logs: /tmp/restart_2017 lr: 0.001 lr_cooldown_end: 0.0 lr_cooldown_power: 1.0 lr_scheduler: cosine max_iterations: 20500 model: ViT-B-16 name: datacomp_xlarge-basic_cumulative_seq_2017 new_run: True no_set_device_rank: False precision: amp pretrained: pretrained_image: False rank: 0 remote_sync: xlarge_CL_basic_filter/restart_2017/ remote_sync_frequency: 300 remote_sync_protocol: s3 report_to: wandb resume: xlarge_CL_basic_filter/cumulative_sequential_2016/datacomp_xlarge-basic-2023-09-12_05-47-41_cumulative_seq_2016/checkpoints/epoch_8.pt save_frequency: 1 save_most_recent: True seed: 0 skip_scheduler: False tensorboard: False tensorboard_path: torchcompile: False torchscript: False trace: False train_data: xlarge_basic_filter/2017/1/{00000000..00000681}.tar::xlarge_basic_filter/2017/10/{00000000..00000639}.tar::xlarge_basic_filter/2017/11/{00000000..00000703}.tar::xlarge_basic_filter/2017/12/{00000000..00000703}.tar::xlarge_basic_filter/2017/13/{00000000..00000730}.tar::xlarge_basic_filter/2017/14/{00000000..00000703}.tar::xlarge_basic_filter/2017/15/{00000000..00000672}.tar::xlarge_basic_filter/2017/16/{00000000..00000639}.tar::xlarge_basic_filter/2017/17/{00000000..00000630}.tar::xlarge_basic_filter/2017/18/{00000000..00000723}.tar::xlarge_basic_filter/2017/19/{00000000..00000703}.tar::xlarge_basic_filter/2017/2/{00000000..00000703}.tar::xlarge_basic_filter/2017/20/{00000000..00000665}.tar::xlarge_basic_filter/2017/21/{00000000..00000639}.tar::xlarge_basic_filter/2017/22/{00000000..00000639}.tar::xlarge_basic_filter/2017/23/{00000000..00000767}.tar::xlarge_basic_filter/2017/24/{00000000..00000511}.tar::xlarge_basic_filter/2017/25/{00000000..00000511}.tar::xlarge_basic_filter/2017/26/{00000000..00000063}.tar::xlarge_basic_filter/2017/27/{00000000..00000139}.tar::xlarge_basic_filter/2017/28/{00000000..00000831}.tar::xlarge_basic_filter/2017/29/{00000000..00000831}.tar::xlarge_basic_filter/2017/3/{00000000..00000703}.tar::xlarge_basic_filter/2017/30/{00000000..00000770}.tar::xlarge_basic_filter/2017/31/{00000000..00000772}.tar::xlarge_basic_filter/2017/32/{00000000..00000778}.tar::xlarge_basic_filter/2017/33/{00000000..00000831}.tar::xlarge_basic_filter/2017/34/{00000000..00000767}.tar::xlarge_basic_filter/2017/35/{00000000..00000767}.tar::xlarge_basic_filter/2017/36/{00000000..00000831}.tar::xlarge_basic_filter/2017/37/{00000000..00000799}.tar::xlarge_basic_filter/2017/38/{00000000..00000719}.tar::xlarge_basic_filter/2017/39/{00000000..00000703}.tar::xlarge_basic_filter/2017/4/{00000000..00000679}.tar::xlarge_basic_filter/2017/40/{00000000..00000703}.tar::xlarge_basic_filter/2017/41/{00000000..00000639}.tar::xlarge_basic_filter/2017/42/{00000000..00000703}.tar::xlarge_basic_filter/2017/43/{00000000..00000767}.tar::xlarge_basic_filter/2017/44/{00000000..00000767}.tar::xlarge_basic_filter/2017/45/{00000000..00000767}.tar::xlarge_basic_filter/2017/46/{00000000..00000755}.tar::xlarge_basic_filter/2017/47/{00000000..00000767}.tar::xlarge_basic_filter/2017/48/{00000000..00000831}.tar::xlarge_basic_filter/2017/49/{00000000..00000831}.tar::xlarge_basic_filter/2017/5/{00000000..00000682}.tar::xlarge_basic_filter/2017/50/{00000000..00000831}.tar::xlarge_basic_filter/2017/51/{00000000..00000831}.tar::xlarge_basic_filter/2017/52/{00000000..00000831}.tar::xlarge_basic_filter/2017/53/{00000000..00001279}.tar::xlarge_basic_filter/2017/54/{00000000..00001227}.tar::xlarge_basic_filter/2017/55/{00000000..00000435}.tar::xlarge_basic_filter/2017/56/{00000000..00000433}.tar::xlarge_basic_filter/2017/57/{00000000..00000383}.tar::xlarge_basic_filter/2017/58/{00000000..00000383}.tar::xlarge_basic_filter/2017/59/{00000000..00000383}.tar::xlarge_basic_filter/2017/6/{00000000..00000679}.tar::xlarge_basic_filter/2017/7/{00000000..00000767}.tar::xlarge_basic_filter/2017/8/{00000000..00000719}.tar::xlarge_basic_filter/2017/9/{00000000..00000639}.tar train_data_upsampling_factors: None train_num_samples: None use_bn_sync: False use_bnb_linear: None val_data: None val_frequency: 1 val_num_samples: None wandb: True wandb_notes: wandb_project_name: datacomp-xlarge-CL warmup: 2000 wd: 0.2 workers: 4 world_size: 32 zeroshot_frequency: 1