speedinghzl committed on
Commit
14b9bb0
·
verified ·
1 Parent(s): c55827d

Upload folder using huggingface_hub

Browse files
logs-lr1e-3-datacomp-rebuttal/clipcls_vit_b16_s15m_bs16k_25ep/checkpoints/epoch_24.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8d30e56a464c2f17b67806260315639e663a4d7e507a1108aef98df58e2c43ef
3
+ size 2252182350
logs-lr1e-3-datacomp-rebuttal/clipcls_vit_b16_s15m_bs16k_25ep/checkpoints/epoch_25.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c7934f561359fa4aad230d841e5bf8ff1fd88955ddcc1f263d4848fd130d8d7a
3
+ size 2252182350
logs-lr1e-3-datacomp-rebuttal/clipcls_vit_b16_s15m_bs16k_25ep/checkpoints/results.jsonl ADDED
@@ -0,0 +1,17 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {"imagenet-zeroshot-val-top1": 0.11178, "imagenet-zeroshot-val-top5": 0.26328}
2
+ {"imagenet-zeroshot-val-top1": 0.20186, "imagenet-zeroshot-val-top5": 0.41636}
3
+ {"imagenet-zeroshot-val-top1": 0.28762, "imagenet-zeroshot-val-top5": 0.54378}
4
+ {"imagenet-zeroshot-val-top1": 0.30488, "imagenet-zeroshot-val-top5": 0.56564}
5
+ {"imagenet-zeroshot-val-top1": 0.31118, "imagenet-zeroshot-val-top5": 0.5705}
6
+ {"imagenet-zeroshot-val-top1": 0.33194, "imagenet-zeroshot-val-top5": 0.60224}
7
+ {"imagenet-zeroshot-val-top1": 0.35418, "imagenet-zeroshot-val-top5": 0.6281}
8
+ {"imagenet-zeroshot-val-top1": 0.37028, "imagenet-zeroshot-val-top5": 0.64418}
9
+ {"imagenet-zeroshot-val-top1": 0.383, "imagenet-zeroshot-val-top5": 0.66288}
10
+ {"imagenet-zeroshot-val-top1": 0.39306, "imagenet-zeroshot-val-top5": 0.67326}
11
+ {"imagenet-zeroshot-val-top1": 0.4132, "imagenet-zeroshot-val-top5": 0.69578}
12
+ {"imagenet-zeroshot-val-top1": 0.42382, "imagenet-zeroshot-val-top5": 0.7114}
13
+ {"imagenet-zeroshot-val-top1": 0.438, "imagenet-zeroshot-val-top5": 0.72248}
14
+ {"imagenet-zeroshot-val-top1": 0.43938, "imagenet-zeroshot-val-top5": 0.72178}
15
+ {"imagenet-zeroshot-val-top1": 0.4485, "imagenet-zeroshot-val-top5": 0.72984}
16
+ {"imagenet-zeroshot-val-top1": 0.44922, "imagenet-zeroshot-val-top5": 0.73228}
17
+ {"imagenet-zeroshot-val-top1": 0.44868, "imagenet-zeroshot-val-top5": 0.72932}
logs-lr1e-3-datacomp-rebuttal/clipcls_vit_b16_s15m_bs16k_25ep/out.log ADDED
The diff for this file is too large to render. See raw diff
 
logs-lr1e-3-datacomp-rebuttal/clipcls_vit_b16_s15m_bs16k_25ep/params.txt ADDED
@@ -0,0 +1,113 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ NDR_patch_size: 16
2
+ accum_freq: 1
3
+ aug_cfg: {}
4
+ batch_size: 2048
5
+ beta1: 0.9
6
+ beta2: 0.98
7
+ checkpoint_path: ./logs/clipcls_vit_b16_s15m_bs16k/checkpoints
8
+ class_loss_weight: 1.0
9
+ coca_caption_loss_weight: 2.0
10
+ coca_contrastive_loss_weight: 1.0
11
+ copy_codebase: False
12
+ csv_caption_key: title
13
+ csv_img_key: filepath
14
+ csv_separator:
15
+ dataset_resampled: False
16
+ dataset_type: webdataset
17
+ ddp_static_graph: True
18
+ debug: False
19
+ delete_prev_step_ckpt: True
20
+ delete_previous_checkpoint: False
21
+ device: cuda:0
22
+ dist_backend: nccl
23
+ dist_url: env://
24
+ distill: False
25
+ distill_model: None
26
+ distill_pretrained: None
27
+ distributed: True
28
+ epochs: 25
29
+ epochs_cooldown: None
30
+ eps: 1e-06
31
+ force_custom_text: False
32
+ force_image_size: 224
33
+ force_patch_dropout: None
34
+ force_quick_gelu: False
35
+ gather_with_grad: True
36
+ global_batch_size: 16384
37
+ grad_checkpointing: True
38
+ grad_clip_norm: None
39
+ horovod: False
40
+ image_interpolation: None
41
+ image_mean: None
42
+ image_resize_mode: None
43
+ image_std: None
44
+ imagenet_v2: None
45
+ imagenet_val: /mnt/bn/zilongdata-us/dataset/ILSVRC/Data/CLS-LOC/val
46
+ is_cls_token: True
47
+ local_loss: True
48
+ local_rank: 0
49
+ lock_image: False
50
+ lock_image_freeze_bn_stats: False
51
+ lock_image_unlocked_groups: 0
52
+ lock_text: False
53
+ lock_text_freeze_layer_norm: False
54
+ lock_text_unlocked_layers: 0
55
+ log_every_n_steps: 128
56
+ log_level: 20
57
+ log_local: False
58
+ log_path: ./logs/clipcls_vit_b16_s15m_bs16k/out.log
59
+ logs: ./logs
60
+ lr: 0.001
61
+ lr_cooldown_end: 0.0
62
+ lr_cooldown_power: 1.0
63
+ lr_scheduler: cosine
64
+ max_seq_len: 15000
65
+ model: CLIPCLS-ViT-B-16
66
+ name: clipcls_vit_b16_s15m_bs16k
67
+ native_dynamic_resolution: False
68
+ no_set_device_rank: False
69
+ only_class_loss: False
70
+ only_packing: False
71
+ post_train: False
72
+ precision: amp_bfloat16
73
+ pretrained:
74
+ pretrained_image:
75
+ pretrained_text:
76
+ rank: 0
77
+ remote_sync: None
78
+ remote_sync_frequency: 300
79
+ remote_sync_protocol: s3
80
+ report_to: wandb
81
+ resume: ./logs/clipcls_vit_b16_s15m_bs16k/checkpoints/step_6104.pt
82
+ rope_attn_num_heads: 12
83
+ rope_model_width: 768
84
+ save_every_n_steps: 6104
85
+ save_frequency: 1
86
+ save_most_recent: False
87
+ seed: 0
88
+ siglip: False
89
+ skip_scheduler: False
90
+ tensorboard: False
91
+ tensorboard_path:
92
+ torchcompile: False
93
+ torchscript: False
94
+ trace: False
95
+ train_data: /mnt/bn/zilongdata-us/dataset/recap-datacomp-1b-webdataset/{000000..140146}.tar
96
+ train_data_upsampling_factors: None
97
+ train_num_samples: 15000000
98
+ use_bn_sync: False
99
+ use_bnb_linear: None
100
+ use_idf: True
101
+ val_data: None
102
+ val_frequency: 1
103
+ val_num_samples: None
104
+ val_steps: 6104
105
+ wandb: True
106
+ wandb_notes:
107
+ wandb_project_name: cls-clip-batch-size
108
+ warmup: 500
109
+ wd: 0.2
110
+ workers: 1
111
+ world_size: 8
112
+ zeroshot_frequency: 2
113
+ zeroshot_steps: 6104