accum_freq: 1 | |
aug_cfg: {} | |
batch_size: 1408 | |
beta1: 0.9 | |
beta2: 0.98 | |
checkpoint_path: /tmp/restart_2019/datacomp_xlarge-basic_cumulative_seq_2019/checkpoints | |
coca_caption_loss_weight: 2.0 | |
coca_contrastive_loss_weight: 1.0 | |
copy_codebase: False | |
csv_caption_key: title | |
csv_img_key: filepath | |
csv_separator: | |
dataset_resampled: True | |
dataset_type: webdataset | |
ddp_static_graph: True | |
debug: False | |
decay_fraction: 0.2 | |
delete_previous_checkpoint: False | |
device: cuda:0 | |
dist_backend: nccl | |
dist_url: env:// | |
distill: False | |
distill_model: None | |
distill_pretrained: None | |
distributed: True | |
epochs: 32 | |
epochs_cooldown: None | |
eps: 1e-06 | |
force_custom_text: False | |
force_image_size: None | |
force_patch_dropout: None | |
force_qk_norm: False | |
force_qk_norm_eps: 1e-05 | |
force_quick_gelu: False | |
gather_with_grad: True | |
grad_checkpointing: True | |
grad_clip_norm: None | |
horovod: False | |
image_mean: None | |
image_std: None | |
imagenet_v2: None | |
imagenet_val: ../imagenet_validation | |
is_iteration_based: True | |
local_loss: True | |
local_rank: 0 | |
lock_image: False | |
lock_image_freeze_bn_stats: False | |
lock_image_unlocked_groups: 0 | |
lock_text: False | |
lock_text_freeze_layer_norm: False | |
lock_text_unlocked_layers: 0 | |
log_every_n_steps: 100 | |
log_level: 20 | |
log_local: False | |
log_path: /tmp/restart_2019/datacomp_xlarge-basic_cumulative_seq_2019/out.log | |
logs: /tmp/restart_2019 | |
lr: 0.001 | |
lr_cooldown_end: 0.0 | |
lr_cooldown_power: 1.0 | |
lr_scheduler: cosine | |
max_iterations: 20500 | |
model: ViT-B-16 | |
name: datacomp_xlarge-basic_cumulative_seq_2019 | |
new_run: True | |
no_set_device_rank: False | |
precision: amp | |
pretrained: | |
pretrained_image: False | |
rank: 0 | |
remote_sync: xlarge_CL_basic_filter/restart_2019/ | |
remote_sync_frequency: 300 | |
remote_sync_protocol: s3 | |
report_to: wandb | |
resume: xlarge_CL_basic_filter/restart_2018/datacomp_xlarge-basic_cumulative_seq_2018/checkpoints/epoch_4.pt | |
save_frequency: 1 | |
save_most_recent: True | |
seed: 0 | |
skip_scheduler: False | |
tensorboard: False | |
tensorboard_path: | |
torchcompile: False | |
torchscript: False | |
trace: False | |
train_data: xlarge_basic_filter/2019/1/{00000000..00000895}.tar::xlarge_basic_filter/2019/10/{00000000..00000831}.tar::xlarge_basic_filter/2019/11/{00000000..00000846}.tar::xlarge_basic_filter/2019/12/{00000000..00000887}.tar::xlarge_basic_filter/2019/13/{00000000..00000940}.tar::xlarge_basic_filter/2019/14/{00000000..00000895}.tar::xlarge_basic_filter/2019/15/{00000000..00000831}.tar::xlarge_basic_filter/2019/16/{00000000..00000831}.tar::xlarge_basic_filter/2019/17/{00000000..00000820}.tar::xlarge_basic_filter/2019/18/{00000000..00000925}.tar::xlarge_basic_filter/2019/19/{00000000..00000895}.tar::xlarge_basic_filter/2019/2/{00000000..00000935}.tar::xlarge_basic_filter/2019/20/{00000000..00000831}.tar::xlarge_basic_filter/2019/21/{00000000..00000831}.tar::xlarge_basic_filter/2019/22/{00000000..00000760}.tar::xlarge_basic_filter/2019/23/{00000000..00000959}.tar::xlarge_basic_filter/2019/24/{00000000..00000639}.tar::xlarge_basic_filter/2019/25/{00000000..00000609}.tar::xlarge_basic_filter/2019/26/{00000000..00000063}.tar::xlarge_basic_filter/2019/27/{00000000..00000191}.tar::xlarge_basic_filter/2019/28/{00000000..00001074}.tar::xlarge_basic_filter/2019/29/{00000000..00001060}.tar::xlarge_basic_filter/2019/3/{00000000..00000910}.tar::xlarge_basic_filter/2019/30/{00000000..00001023}.tar::xlarge_basic_filter/2019/31/{00000000..00001023}.tar::xlarge_basic_filter/2019/32/{00000000..00001023}.tar::xlarge_basic_filter/2019/33/{00000000..00001024}.tar::xlarge_basic_filter/2019/34/{00000000..00001023}.tar::xlarge_basic_filter/2019/35/{00000000..00001023}.tar::xlarge_basic_filter/2019/36/{00000000..00001086}.tar::xlarge_basic_filter/2019/37/{00000000..00001087}.tar::xlarge_basic_filter/2019/38/{00000000..00000959}.tar::xlarge_basic_filter/2019/39/{00000000..00000906}.tar::xlarge_basic_filter/2019/4/{00000000..00000897}.tar::xlarge_basic_filter/2019/40/{00000000..00000897}.tar::xlarge_basic_filter/2019/41/{00000000..00000831}.tar::xlarge_basic_filter/2019/42/{00000000..00000958}.tar::xlarge_basic_filter/2019/43/{00000000..00000966}.tar::xlarge_basic_filter/2019/44/{00000000..00001011}.tar::xlarge_basic_filter/2019/45/{00000000..00000959}.tar::xlarge_basic_filter/2019/46/{00000000..00000959}.tar::xlarge_basic_filter/2019/47/{00000000..00000967}.tar::xlarge_basic_filter/2019/48/{00000000..00001082}.tar::xlarge_basic_filter/2019/49/{00000000..00001066}.tar::xlarge_basic_filter/2019/5/{00000000..00000959}.tar::xlarge_basic_filter/2019/50/{00000000..00001067}.tar::xlarge_basic_filter/2019/51/{00000000..00001075}.tar::xlarge_basic_filter/2019/52/{00000000..00001075}.tar::xlarge_basic_filter/2019/53/{00000000..00001646}.tar::xlarge_basic_filter/2019/54/{00000000..00001599}.tar::xlarge_basic_filter/2019/55/{00000000..00000511}.tar::xlarge_basic_filter/2019/56/{00000000..00000511}.tar::xlarge_basic_filter/2019/57/{00000000..00000511}.tar::xlarge_basic_filter/2019/58/{00000000..00000511}.tar::xlarge_basic_filter/2019/59/{00000000..00000511}.tar::xlarge_basic_filter/2019/6/{00000000..00000959}.tar::xlarge_basic_filter/2019/7/{00000000..00000959}.tar::xlarge_basic_filter/2019/8/{00000000..00000895}.tar::xlarge_basic_filter/2019/9/{00000000..00000831}.tar | |
train_data_upsampling_factors: None | |
train_num_samples: None | |
use_bn_sync: False | |
use_bnb_linear: None | |
val_data: None | |
val_frequency: 1 | |
val_num_samples: None | |
wandb: True | |
wandb_notes: | |
wandb_project_name: datacomp-xlarge-CL | |
warmup: 2000 | |
wd: 0.2 | |
workers: 4 | |
world_size: 64 | |
zeroshot_frequency: 1 | |