Mehdi Cherti committed on
Commit
813e7be
1 Parent(s): ce6812f
Files changed (1) hide show
  1. trained_models_info.csv +30 -0
trained_models_info.csv ADDED
@@ -0,0 +1,30 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ name,arch,data,samples_seen_pretty,lr,warmup,epochs,gpus,samples_per_sec,samples_per_epoch,local_bs,detailed_training_info
2
+ Model-B-32_Data-400M_Samples-13B_lr-1e-3_bs-86k.pt,ViT-B-32,400M,13B,0.001,2000,32,128,52724.00881,413000000,672,
3
+ Model-L-14_Data-400M_Samples-13B_lr-1e-3_bs-86k.pt,ViT-L-14,400M,13B,0.001,2000,32,768,60327.90558,413000000,112,
4
+ Model-L-14_Data-400M_Samples-34B_lr-1e-3_bs-86k.pt,ViT-L-14,400M,34B,0.001,10000,84,1024,79116.28421,413000000,84,
5
+ Model-L-14_Data-2B_Samples-13B_lr-1e-3_bs-86k.pt,ViT-L-14,2B,13B,0.001,10000,64,1024,67928.46915,200000000,84,
6
+ Model-B-32_Data-2B_Samples-13B_lr-5e-4_bs-32k.pt,ViT-B-32,2B,13B,0.0005,2000,65,128,93294.30008,200000000,256,
7
+ Model-B-32_Data-80M_Samples-3B_lr-5e-4_bs-32k.pt,ViT-B-32,80M,3B,0.0005,2000,32,128,108844.5704,80000415,256,
8
+ Model-B-32_Data-80M_Samples-13B_lr-5e-4_bs-32k.pt,ViT-B-32,80M,13B,0.0005,2000,160,128,108844.5704,80000415,256,
9
+ Model-B-16_Data-2B_Samples-3B_lr-1e-3_bs-88k.pt,ViT-B-16,2B,3B,0.001,10000,12,344,134239.8261,213334440,256,
10
+ Model-B-32_Data-2B_Samples-3B_lr-1e-3_bs-88k.pt,ViT-B-32,2B,3B,0.001,10000,12,344,218174.3316,213334440,256,
11
+ Model-B-32_Data-400M_Samples-3B_lr-1e-3_bs-88k.pt,ViT-B-32,400M,3B,0.001,10000,6,344,219759.0125,407332084,256,
12
+ Model-B-16_Data-400M_Samples-3B_lr-1e-3_bs-88k.pt,ViT-B-16,400M,3B,0.001,10000,6,344,136370.9084,407332084,256,
13
+ Model-B-16_Data-2B_Samples-13B_lr-1e-3_bs-88k.pt,ViT-B-16,2B,13B,0.001,10000,65,176,54580.6237,200532718,512,
14
+ Model-B-16_Data-80M_Samples-13B_lr-1e-3_bs-88k.pt,ViT-B-16,80M,13B,0.001,10000,163,176,50927.5668,80000415,512,
15
+ Model-B-16_Data-80M_Samples-3B_lr-1e-3_bs-88k.pt,ViT-B-16,80M,3B,0.001,10000,32,344,128758.0639,80000415,256,
16
+ Model-L-14_Data-400M_Samples-3B_lr-1e-3_bs-88k.pt,ViT-L-14,400M,3B,0.001,10000,6,396,40026.59493,407332084,224,
17
+ Model-L-14_Data-2B_Samples-3B_lr-1e-3_bs-88k.pt,ViT-L-14,2B,3B,0.001,10000,12,396,39913.2071,213334440,224,
18
+ Model-B-16_Data-2B_Samples-34B_lr-1e-3_bs-88k.pt,ViT-B-16,2B,34B,0.001,10000,171,344,78356.07648,200092953,256,
19
+ Model-B-16_Data-400M_Samples-34B_lr-1e-3_bs-88k.pt,ViT-B-16,400M,34B,0.001,10000,84,176,64314.37834,407332084,512,
20
+ Model-B-32_Data-400M_Samples-34B_lr-5e-4_bs-32k.pt,ViT-B-32,400M,34B,0.0005,2000,84,128,108844.5704,407332084,256,
21
+ Model-L-14_Data-80M_Samples-13B_lr-1e-3_bs-88k.pt,ViT-L-14,80M,13B,0.001,10000,163,200,35524.82252,80000415,448,
22
+ Model-L-14_Data-80M_Samples-3B_lr-1e-3_bs-88k.pt,ViT-L-14,80M,3B,0.001,10000,32,396,38878.74478,80000415,224,
23
+ Model-L-14_Data-2B_Samples-34B_lr-1e-3_bs-86k.pt,ViT-L-14,2B,34B,0.001,10000,160,384,27861.91926,200000000,224,https://huggingface.co/laion/CLIP-ViT-L-14-laion2B-s32B-b82K
24
+ Model-B-32_Data-2B_Samples-34B_lr-1e-3_bs-79k.pt,ViT-B-32,2B,34B,0.001,2000,256,824,187872.0,135646078,96,
25
+ Model-B-16_Data-400M_Samples-13B_lr-5e-4_bs-33k.pt,ViT-B-16,400M,13B,0.0005,10000,32,176,59356.0,407332084,192,
26
+ Model-H-14_Data-2B_Samples-34B_lr-5e-4_bs-79k.pt,ViT-H-14,2B,34B,0.0005,2000,256,824,34608.0,135646078,96,https://huggingface.co/laion/CLIP-ViT-H-14-laion2B-s32B-b79K
27
+ Model-g-14_Data-2B_Samples-13B_lr-5e-4_bs-64k.pt,ViT-g-14,2B,13B,0.0005,2000,90,800,24800.0,135646078,80,https://huggingface.co/laion/CLIP-ViT-g-14-laion2B-s12B-b42K
28
+ Model-B-32_Data-80M_Samples-34B_lr-1e-3_bs-88k.pt,ViT-B-32,80M,34B,0.001,10000,428,344,99289.44575,80000415,256,
29
+ Model-B-16_Data-80M_Samples-34B_lr-1e-3_bs-88k.pt,ViT-B-16,80M,34B,0.001,10000,428,344,136146.6806,80000415,256,
30
+ Model-L-14_Data-80M_Samples-34B_lr-1e-3_bs-88k.pt,ViT-L-14,80M,34B,0.001,10000,428,400,41970.05536,80000415,224,