[CLIP-ViT-B-32-laion2B-s34B-b79K-uni-768dx768d] artifacts head_best
Browse files
CLIP-ViT-B-32-laion2B-s34B-b79K-uni-768dx768d/head_best.config.json
ADDED
|
@@ -0,0 +1,96 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"device": "cuda",
|
| 3 |
+
"seed": 42,
|
| 4 |
+
"precision": "fp32",
|
| 5 |
+
"hf_clip_id": "laion/CLIP-ViT-B-32-laion2B-s34B-b79K",
|
| 6 |
+
"freeze_encoder": true,
|
| 7 |
+
"normalize_output": true,
|
| 8 |
+
"dataset": "cifar100",
|
| 9 |
+
"data_root": "./data",
|
| 10 |
+
"image_size": 224,
|
| 11 |
+
"clip_mean": [
|
| 12 |
+
0.48145466,
|
| 13 |
+
0.4578275,
|
| 14 |
+
0.40821073
|
| 15 |
+
],
|
| 16 |
+
"clip_std": [
|
| 17 |
+
0.26862954,
|
| 18 |
+
0.26130258,
|
| 19 |
+
0.27577711
|
| 20 |
+
],
|
| 21 |
+
"train_aug": true,
|
| 22 |
+
"train_crop_scale": [
|
| 23 |
+
0.9,
|
| 24 |
+
1.0
|
| 25 |
+
],
|
| 26 |
+
"hflip_p": 0.5,
|
| 27 |
+
"vocab_repo": "AbstractPhil/geometric-vocab-768d",
|
| 28 |
+
"vocab_split": "unicode",
|
| 29 |
+
"vocab_dim_override": 768,
|
| 30 |
+
"crystal_dims": 768,
|
| 31 |
+
"role_index": {
|
| 32 |
+
"anchor": 0,
|
| 33 |
+
"support": 1,
|
| 34 |
+
"contrast": 2,
|
| 35 |
+
"purpose": 3,
|
| 36 |
+
"observer": 4
|
| 37 |
+
},
|
| 38 |
+
"rose_loss_weight": 0.15,
|
| 39 |
+
"rose_margin": 0.25,
|
| 40 |
+
"rose_temperature": 1.0,
|
| 41 |
+
"rose_role_weights": {
|
| 42 |
+
"anchor": 1.0,
|
| 43 |
+
"need": -0.5,
|
| 44 |
+
"relation": 0.75,
|
| 45 |
+
"purpose": 0.75,
|
| 46 |
+
"observer": -0.5
|
| 47 |
+
},
|
| 48 |
+
"classes": 100,
|
| 49 |
+
"classes_per_penta": 2,
|
| 50 |
+
"penta_branches": 50,
|
| 51 |
+
"pentachora_blocks": 4,
|
| 52 |
+
"temperature": 0.07,
|
| 53 |
+
"batch_size": 512,
|
| 54 |
+
"epochs": 20,
|
| 55 |
+
"lr": 0.0001,
|
| 56 |
+
"weight_decay": 0.0001,
|
| 57 |
+
"label_smoothing": 0.0,
|
| 58 |
+
"use_cosine_sched": true,
|
| 59 |
+
"warmup_steps": 0,
|
| 60 |
+
"max_steps": null,
|
| 61 |
+
"amp": true,
|
| 62 |
+
"grad_clip_norm": null,
|
| 63 |
+
"log_every": 25,
|
| 64 |
+
"auto_train": false,
|
| 65 |
+
"num_workers": 2,
|
| 66 |
+
"pin_memory": true,
|
| 67 |
+
"persistent_workers": true,
|
| 68 |
+
"ckpt_dir": "./checkpoints",
|
| 69 |
+
"run_name": "CLIP-ViT-B-32-laion2B-s34B-b79K-uni-768dx768d",
|
| 70 |
+
"save_latest": true,
|
| 71 |
+
"save_best": true,
|
| 72 |
+
"resume": false,
|
| 73 |
+
"resume_which": "best",
|
| 74 |
+
"resume_source": "auto",
|
| 75 |
+
"hf_enable": true,
|
| 76 |
+
"hf_repo_id": "AbstractPhil/rose-geoclip",
|
| 77 |
+
"hf_branch": "main",
|
| 78 |
+
"hf_private": true,
|
| 79 |
+
"hf_push_latest": false,
|
| 80 |
+
"hf_push_best": true,
|
| 81 |
+
"hf_create": true,
|
| 82 |
+
"hf_token_env": [
|
| 83 |
+
"HF_TOKEN",
|
| 84 |
+
"HUGGINGFACE_HUB_TOKEN"
|
| 85 |
+
],
|
| 86 |
+
"features_enable": true,
|
| 87 |
+
"features_local_root": "./features_cache",
|
| 88 |
+
"features_batch_size": 1024,
|
| 89 |
+
"features_push_to_hub": true,
|
| 90 |
+
"features_offload_after_prepare": false,
|
| 91 |
+
"features_repo_id": "AbstractPhil/CLIP-ViT-B-32-laion2B-s34B-b79K_cifar100_extracted_features",
|
| 92 |
+
"features_local_dir": "./features_cache/CLIP-ViT-B-32-laion2B-s34B-b79K-cifar100",
|
| 93 |
+
"features_embed_dim": 512,
|
| 94 |
+
"features_ready": true,
|
| 95 |
+
"use_precomputed_features": true
|
| 96 |
+
}
|
CLIP-ViT-B-32-laion2B-s34B-b79K-uni-768dx768d/head_best.metrics.json
ADDED
|
@@ -0,0 +1,10 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"epoch": 1,
|
| 3 |
+
"train_loss": 2.7008541645431516,
|
| 4 |
+
"val_loss": 0.9892485931396484,
|
| 5 |
+
"top1": 0.8,
|
| 6 |
+
"top3": 0.9327999994277955,
|
| 7 |
+
"rose_weight": 0.15,
|
| 8 |
+
"rose_margin": 0.25,
|
| 9 |
+
"rose_temperature": 1.0
|
| 10 |
+
}
|