adams-story
committed on
Commit
•
d797f0e
1
Parent(s):
5ba468d
Update README.md
Browse files
README.md
CHANGED
@@ -1,6 +1,89 @@
|
|
1 |
---
|
2 |
license: apache-2.0
|
3 |
---
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
4 |
epoch=1-step=4503.ckpt
|
5 |
* inserted at 3, all resnet weights frozen
|
6 |
* ~.62 val acc
|
|
|
1 |
---
|
2 |
license: apache-2.0
|
3 |
---
|
4 |
+
insert_at_4_nonfrozen_deep_epoch=3-step=7759.ckpt
|
5 |
+
* small codebook size (64)
|
6 |
+
* trained to val acc@5 0.8645, acc@1 0.6554
|
7 |
+
```
|
8 |
+
# lightning.pytorch==2.0.0
|
9 |
+
# bigger depth
|
10 |
+
seed_everything: true
|
11 |
+
trainer:
|
12 |
+
callbacks:
|
13 |
+
- class_path: lightning.pytorch.callbacks.ModelCheckpoint
|
14 |
+
init_args:
|
15 |
+
save_last: true
|
16 |
+
save_top_k: 1
|
17 |
+
monitor: v_c_loss
|
18 |
+
accelerator: auto
|
19 |
+
strategy: auto
|
20 |
+
devices: auto
|
21 |
+
num_nodes: 1
|
22 |
+
precision: 16-mixed
|
23 |
+
logger: null
|
24 |
+
callbacks: null
|
25 |
+
fast_dev_run: false
|
26 |
+
max_epochs: 5
|
27 |
+
min_epochs: null
|
28 |
+
max_steps: -1
|
29 |
+
min_steps: null
|
30 |
+
max_time: null
|
31 |
+
limit_train_batches: null
|
32 |
+
limit_val_batches: null
|
33 |
+
limit_test_batches: null
|
34 |
+
limit_predict_batches: null
|
35 |
+
overfit_batches: 0.0
|
36 |
+
val_check_interval: 0.1
|
37 |
+
check_val_every_n_epoch: 1
|
38 |
+
num_sanity_val_steps: null
|
39 |
+
log_every_n_steps: 15
|
40 |
+
enable_checkpointing: true
|
41 |
+
enable_progress_bar: null
|
42 |
+
enable_model_summary: null
|
43 |
+
accumulate_grad_batches: 1
|
44 |
+
gradient_clip_val: 1.0
|
45 |
+
gradient_clip_algorithm: null
|
46 |
+
deterministic: null
|
47 |
+
benchmark: null
|
48 |
+
inference_mode: true
|
49 |
+
use_distributed_sampler: true
|
50 |
+
profiler: null
|
51 |
+
detect_anomaly: false
|
52 |
+
barebones: false
|
53 |
+
plugins: null
|
54 |
+
sync_batchnorm: false
|
55 |
+
reload_dataloaders_every_n_epochs: 0
|
56 |
+
default_root_dir: ckpt/insert_at_4_nonfrozen_deep
|
57 |
+
model:
|
58 |
+
resnet_type: 34
|
59 |
+
is_rq: false
|
60 |
+
quantizer_args:
|
61 |
+
heads: 8
|
62 |
+
use_cosine_sim: false
|
63 |
+
accept_image_fmap: true
|
64 |
+
codebook_dim: 128
|
65 |
+
codebook_size: 64
|
66 |
+
decay: 0.85
|
67 |
+
eps: 1.0e-05
|
68 |
+
commitment_weight: 0.5
|
69 |
+
threshold_ema_dead_code: 1
|
70 |
+
sample_codebook_temp: 0.1
|
71 |
+
resnet_insertion_index: 4
|
72 |
+
unfreeze_resnet_block_indeces:
|
73 |
+
- 2
|
74 |
+
- 3
|
75 |
+
unfreeze_fc: true
|
76 |
+
lr: 0.0001
|
77 |
+
data:
|
78 |
+
data_dir: "/home/figes/Downloads/ILSVRC2012_CLS-LOC/"
|
79 |
+
image_size: 224
|
80 |
+
num_workers: 6
|
81 |
+
batch_size: 512
|
82 |
+
shuffle: true
|
83 |
+
pin_memory: true
|
84 |
+
drop_last: false
|
85 |
+
```
|
86 |
+
|
87 |
epoch=1-step=4503.ckpt
|
88 |
* inserted at 3, all resnet weights frozen
|
89 |
* ~.62 val acc
|