| accum_freq: 1 | |
| aug_cfg: {} | |
| batch_size: 1408 | |
| beta1: 0.9 | |
| beta2: 0.98 | |
| checkpoint_path: /tmp/restart_2017/datacomp_xlarge-bestpool_restart_2017/checkpoints | |
| coca_caption_loss_weight: 2.0 | |
| coca_contrastive_loss_weight: 1.0 | |
| copy_codebase: False | |
| csv_caption_key: title | |
| csv_img_key: filepath | |
| csv_separator: | |
| dataset_resampled: True | |
| dataset_type: webdataset | |
| ddp_static_graph: True | |
| debug: False | |
| decay_fraction: 0.2 | |
| delete_previous_checkpoint: False | |
| device: cuda:0 | |
| dist_backend: nccl | |
| dist_url: env:// | |
| distill: False | |
| distill_model: None | |
| distill_pretrained: None | |
| distributed: True | |
| epochs: 32 | |
| epochs_cooldown: None | |
| eps: 1e-06 | |
| force_custom_text: False | |
| force_image_size: None | |
| force_patch_dropout: None | |
| force_qk_norm: False | |
| force_qk_norm_eps: 1e-05 | |
| force_quick_gelu: False | |
| gather_with_grad: True | |
| grad_checkpointing: True | |
| grad_clip_norm: None | |
| horovod: False | |
| image_mean: None | |
| image_std: None | |
| imagenet_v2: None | |
| imagenet_val: ../imagenet_validation | |
| is_iteration_based: True | |
| local_loss: True | |
| local_rank: 0 | |
| lock_image: False | |
| lock_image_freeze_bn_stats: False | |
| lock_image_unlocked_groups: 0 | |
| lock_text: False | |
| lock_text_freeze_layer_norm: False | |
| lock_text_unlocked_layers: 0 | |
| log_every_n_steps: 100 | |
| log_level: 20 | |
| log_local: False | |
| log_path: /tmp/restart_2017/datacomp_xlarge-bestpool_restart_2017/out.log | |
| logs: /tmp/restart_2017 | |
| lr: 0.001 | |
| lr_cooldown_end: 0.0 | |
| lr_cooldown_power: 1.0 | |
| lr_scheduler: cosine | |
| max_iterations: 20500 | |
| model: ViT-B-16 | |
| name: datacomp_xlarge-bestpool_restart_2017 | |
| new_run: True | |
| no_set_device_rank: False | |
| precision: amp | |
| pretrained: | |
| pretrained_image: False | |
| rank: 0 | |
| remote_sync: xlarge_CL_bestpool_filter/restart_2017/ | |
| remote_sync_frequency: 300 | |
| remote_sync_protocol: s3 | |
| report_to: | |
| resume: xlarge_CL_bestpool_filter/cumulative_sequential_2016/datacomp_xlarge-bestpool-2023-09-12_08-24-13_cumulative_seq_2016/checkpoints/epoch_12.pt | |
| save_frequency: 1 | |
| save_most_recent: True | |
| seed: 0 | |
| skip_scheduler: False | |
| tensorboard: False | |
| tensorboard_path: | |
| torchcompile: False | |
| torchscript: False | |
| trace: False | |
| train_data: xlarge_bestpool_filter/2017/0/{00000000..00000383}.tar::xlarge_bestpool_filter/2017/1/{00000000..00000383}.tar::xlarge_bestpool_filter/2017/10/{00000000..00000319}.tar::xlarge_bestpool_filter/2017/11/{00000000..00000383}.tar::xlarge_bestpool_filter/2017/12/{00000000..00000359}.tar::xlarge_bestpool_filter/2017/13/{00000000..00000383}.tar::xlarge_bestpool_filter/2017/14/{00000000..00000383}.tar::xlarge_bestpool_filter/2017/15/{00000000..00000369}.tar::xlarge_bestpool_filter/2017/16/{00000000..00000331}.tar::xlarge_bestpool_filter/2017/17/{00000000..00000319}.tar::xlarge_bestpool_filter/2017/18/{00000000..00000383}.tar::xlarge_bestpool_filter/2017/19/{00000000..00000383}.tar::xlarge_bestpool_filter/2017/2/{00000000..00000383}.tar::xlarge_bestpool_filter/2017/20/{00000000..00000372}.tar::xlarge_bestpool_filter/2017/21/{00000000..00000319}.tar::xlarge_bestpool_filter/2017/22/{00000000..00000319}.tar::xlarge_bestpool_filter/2017/23/{00000000..00000383}.tar::xlarge_bestpool_filter/2017/24/{00000000..00000255}.tar::xlarge_bestpool_filter/2017/25/{00000000..00000255}.tar::xlarge_bestpool_filter/2017/26/{00000000..00000063}.tar::xlarge_bestpool_filter/2017/27/{00000000..00000107}.tar::xlarge_bestpool_filter/2017/28/{00000000..00000447}.tar::xlarge_bestpool_filter/2017/29/{00000000..00000447}.tar::xlarge_bestpool_filter/2017/3/{00000000..00000383}.tar::xlarge_bestpool_filter/2017/30/{00000000..00000399}.tar::xlarge_bestpool_filter/2017/31/{00000000..00000399}.tar::xlarge_bestpool_filter/2017/32/{00000000..00000399}.tar::xlarge_bestpool_filter/2017/33/{00000000..00000401}.tar::xlarge_bestpool_filter/2017/34/{00000000..00000441}.tar::xlarge_bestpool_filter/2017/35/{00000000..00000433}.tar::xlarge_bestpool_filter/2017/36/{00000000..00000447}.tar::xlarge_bestpool_filter/2017/37/{00000000..00000447}.tar::xlarge_bestpool_filter/2017/38/{00000000..00000383}.tar::xlarge_bestpool_filter/2017/39/{00000000..00000383}.tar::xlarge_bestpool_filter/2017/4/{00000000..00000383}.tar::xlarge_bestpool_filter/2017/40/{00000000..00000383}.tar::xlarge_bestpool_filter/2017/41/{00000000..00000319}.tar::xlarge_bestpool_filter/2017/42/{00000000..00000383}.tar::xlarge_bestpool_filter/2017/43/{00000000..00000383}.tar::xlarge_bestpool_filter/2017/44/{00000000..00000383}.tar::xlarge_bestpool_filter/2017/45/{00000000..00000383}.tar::xlarge_bestpool_filter/2017/46/{00000000..00000383}.tar::xlarge_bestpool_filter/2017/47/{00000000..00000383}.tar::xlarge_bestpool_filter/2017/48/{00000000..00000419}.tar::xlarge_bestpool_filter/2017/49/{00000000..00000409}.tar::xlarge_bestpool_filter/2017/5/{00000000..00000383}.tar::xlarge_bestpool_filter/2017/50/{00000000..00000447}.tar::xlarge_bestpool_filter/2017/51/{00000000..00000447}.tar::xlarge_bestpool_filter/2017/52/{00000000..00000447}.tar::xlarge_bestpool_filter/2017/53/{00000000..00000664}.tar::xlarge_bestpool_filter/2017/54/{00000000..00000639}.tar::xlarge_bestpool_filter/2017/55/{00000000..00000238}.tar::xlarge_bestpool_filter/2017/56/{00000000..00000237}.tar::xlarge_bestpool_filter/2017/57/{00000000..00000205}.tar::xlarge_bestpool_filter/2017/58/{00000000..00000191}.tar::xlarge_bestpool_filter/2017/59/{00000000..00000191}.tar::xlarge_bestpool_filter/2017/6/{00000000..00000383}.tar::xlarge_bestpool_filter/2017/7/{00000000..00000383}.tar::xlarge_bestpool_filter/2017/8/{00000000..00000383}.tar::xlarge_bestpool_filter/2017/9/{00000000..00000340}.tar | |
| train_data_upsampling_factors: None | |
| train_num_samples: None | |
| use_bn_sync: False | |
| use_bnb_linear: None | |
| val_data: None | |
| val_frequency: 1 | |
| val_num_samples: None | |
| wandb: False | |
| wandb_notes: | |
| wandb_project_name: open-clip | |
| warmup: 2000 | |
| wd: 0.2 | |
| workers: 4 | |
| world_size: 64 | |
| zeroshot_frequency: 1 | |