AbstractPhil committed on
Commit
370812a
·
verified ·
1 Parent(s): c40165e

[CLIP-ViT-B-32-laion2B-s34B-b79K-uni-768dx768d] artifacts head_best

Browse files
CLIP-ViT-B-32-laion2B-s34B-b79K-uni-768dx768d/head_best.config.json ADDED
@@ -0,0 +1,96 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "device": "cuda",
3
+ "seed": 42,
4
+ "precision": "fp32",
5
+ "hf_clip_id": "laion/CLIP-ViT-B-32-laion2B-s34B-b79K",
6
+ "freeze_encoder": true,
7
+ "normalize_output": true,
8
+ "dataset": "cifar100",
9
+ "data_root": "./data",
10
+ "image_size": 224,
11
+ "clip_mean": [
12
+ 0.48145466,
13
+ 0.4578275,
14
+ 0.40821073
15
+ ],
16
+ "clip_std": [
17
+ 0.26862954,
18
+ 0.26130258,
19
+ 0.27577711
20
+ ],
21
+ "train_aug": true,
22
+ "train_crop_scale": [
23
+ 0.9,
24
+ 1.0
25
+ ],
26
+ "hflip_p": 0.5,
27
+ "vocab_repo": "AbstractPhil/geometric-vocab-768d",
28
+ "vocab_split": "unicode",
29
+ "vocab_dim_override": 768,
30
+ "crystal_dims": 768,
31
+ "role_index": {
32
+ "anchor": 0,
33
+ "support": 1,
34
+ "contrast": 2,
35
+ "purpose": 3,
36
+ "observer": 4
37
+ },
38
+ "rose_loss_weight": 0.15,
39
+ "rose_margin": 0.25,
40
+ "rose_temperature": 1.0,
41
+ "rose_role_weights": {
42
+ "anchor": 1.0,
43
+ "need": -0.5,
44
+ "relation": 0.75,
45
+ "purpose": 0.75,
46
+ "observer": -0.5
47
+ },
48
+ "classes": 100,
49
+ "classes_per_penta": 2,
50
+ "penta_branches": 50,
51
+ "pentachora_blocks": 4,
52
+ "temperature": 0.07,
53
+ "batch_size": 512,
54
+ "epochs": 20,
55
+ "lr": 0.0001,
56
+ "weight_decay": 0.0001,
57
+ "label_smoothing": 0.0,
58
+ "use_cosine_sched": true,
59
+ "warmup_steps": 0,
60
+ "max_steps": null,
61
+ "amp": true,
62
+ "grad_clip_norm": null,
63
+ "log_every": 25,
64
+ "auto_train": false,
65
+ "num_workers": 2,
66
+ "pin_memory": true,
67
+ "persistent_workers": true,
68
+ "ckpt_dir": "./checkpoints",
69
+ "run_name": "CLIP-ViT-B-32-laion2B-s34B-b79K-uni-768dx768d",
70
+ "save_latest": true,
71
+ "save_best": true,
72
+ "resume": false,
73
+ "resume_which": "best",
74
+ "resume_source": "auto",
75
+ "hf_enable": true,
76
+ "hf_repo_id": "AbstractPhil/rose-geoclip",
77
+ "hf_branch": "main",
78
+ "hf_private": true,
79
+ "hf_push_latest": false,
80
+ "hf_push_best": true,
81
+ "hf_create": true,
82
+ "hf_token_env": [
83
+ "HF_TOKEN",
84
+ "HUGGINGFACE_HUB_TOKEN"
85
+ ],
86
+ "features_enable": true,
87
+ "features_local_root": "./features_cache",
88
+ "features_batch_size": 1024,
89
+ "features_push_to_hub": true,
90
+ "features_offload_after_prepare": false,
91
+ "features_repo_id": "AbstractPhil/CLIP-ViT-B-32-laion2B-s34B-b79K_cifar100_extracted_features",
92
+ "features_local_dir": "./features_cache/CLIP-ViT-B-32-laion2B-s34B-b79K-cifar100",
93
+ "features_embed_dim": 512,
94
+ "features_ready": true,
95
+ "use_precomputed_features": true
96
+ }
CLIP-ViT-B-32-laion2B-s34B-b79K-uni-768dx768d/head_best.metrics.json ADDED
@@ -0,0 +1,10 @@
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "epoch": 1,
3
+ "train_loss": 2.7008541645431516,
4
+ "val_loss": 0.9892485931396484,
5
+ "top1": 0.8,
6
+ "top3": 0.9327999994277955,
7
+ "rose_weight": 0.15,
8
+ "rose_margin": 0.25,
9
+ "rose_temperature": 1.0
10
+ }