|
--- |
|
license: apache-2.0 |
|
--- |
|
### insert_at_4_nonfrozen_50rn_8heads_k=128.ckpt |
|
* Final validation scores: acc@1=0.758 acc@5=0.92 |
|
* Trained for 4 epochs |
|
``` |
|
# lightning.pytorch==2.0.0 |
|
seed_everything: true |
|
trainer: |
|
callbacks: |
|
- class_path: lightning.pytorch.callbacks.ModelCheckpoint |
|
init_args: |
|
save_last: true |
|
save_top_k: 1 |
|
monitor: v_c_loss |
|
- class_path: lightning.pytorch.callbacks.LearningRateMonitor |
|
accelerator: auto |
|
strategy: auto |
|
devices: auto |
|
num_nodes: 1 |
|
precision: 16-mixed |
|
logger: null |
|
fast_dev_run: false |
|
max_epochs: 8 |
|
min_epochs: null |
|
max_steps: -1 |
|
min_steps: null |
|
max_time: null |
|
limit_train_batches: null |
|
limit_val_batches: null |
|
limit_test_batches: null |
|
limit_predict_batches: null |
|
overfit_batches: 0.0 |
|
val_check_interval: 0.1 |
|
check_val_every_n_epoch: 1 |
|
num_sanity_val_steps: null |
|
log_every_n_steps: 15 |
|
enable_checkpointing: true |
|
enable_progress_bar: null |
|
enable_model_summary: null |
|
accumulate_grad_batches: 1 |
|
gradient_clip_val: 1.0 |
|
gradient_clip_algorithm: null |
|
deterministic: null |
|
benchmark: null |
|
inference_mode: true |
|
use_distributed_sampler: true |
|
profiler: null |
|
detect_anomaly: false |
|
barebones: false |
|
plugins: null |
|
sync_batchnorm: false |
|
reload_dataloaders_every_n_epochs: 0 |
|
default_root_dir: ckpt/insert_at_4_nonfrozen_50rn_4heads_k=128 |
|
model: |
|
resnet_type: 50 |
|
is_rq: false |
|
quantizer_args: |
|
heads: 8 |
|
use_cosine_sim: false |
|
accept_image_fmap: true |
|
codebook_dim: 256 |
|
codebook_size: 128 |
|
decay: 0.95 |
|
eps: 1.0e-05 |
|
commitment_weight: 0.0 |
|
threshold_ema_dead_code: 2 |
|
resnet_insertion_index: 4 |
|
unfreeze_resnet_block_indeces: [3] |
|
unfreeze_fc: true |
|
lr: 0.00010 |
|
data: |
|
data_dir: "/home/figes/Downloads/ILSVRC2012_CLS-LOC/" |
|
image_size: 224 |
|
num_workers: 6 |
|
batch_size: 512 |
|
shuffle: true |
|
pin_memory: true |
|
drop_last: false |
|
``` |
|
|
|
|
|
### epoch0-insert-at-4-frozen-deep-norq.ckpt |
|
* trained to val acc@5 0.887 acc@1 0.6697 |
|
* big codebook size (256) |
|
* 8 heads |
|
``` |
|
# lightning.pytorch==2.0.0 |
|
# bigger depth |
|
seed_everything: true |
|
trainer: |
|
callbacks: |
|
- class_path: lightning.pytorch.callbacks.ModelCheckpoint |
|
init_args: |
|
save_last: true |
|
save_top_k: 1 |
|
monitor: v_c_loss |
|
accelerator: auto |
|
strategy: auto |
|
devices: auto |
|
num_nodes: 1 |
|
precision: 16-mixed |
|
logger: null |
|
callbacks: null |
|
fast_dev_run: false |
|
max_epochs: 5 |
|
min_epochs: null |
|
max_steps: -1 |
|
min_steps: null |
|
max_time: null |
|
limit_train_batches: null |
|
limit_val_batches: null |
|
limit_test_batches: null |
|
limit_predict_batches: null |
|
overfit_batches: 0.0 |
|
val_check_interval: 0.1 |
|
check_val_every_n_epoch: 1 |
|
num_sanity_val_steps: null |
|
log_every_n_steps: 15 |
|
enable_checkpointing: true |
|
enable_progress_bar: null |
|
enable_model_summary: null |
|
accumulate_grad_batches: 1 |
|
gradient_clip_val: 1.0 |
|
gradient_clip_algorithm: null |
|
deterministic: null |
|
benchmark: null |
|
inference_mode: true |
|
use_distributed_sampler: true |
|
profiler: null |
|
detect_anomaly: false |
|
barebones: false |
|
plugins: null |
|
sync_batchnorm: false |
|
reload_dataloaders_every_n_epochs: 0 |
|
default_root_dir: ckpt/insert_at_4_frozen_deep |
|
model: |
|
resnet_type: 34 |
|
is_rq: false |
|
quantizer_args: |
|
heads: 8 |
|
use_cosine_sim: false |
|
accept_image_fmap: true |
|
codebook_dim: 128 |
|
codebook_size: 256 |
|
decay: 0.85 |
|
eps: 1.0e-05 |
|
commitment_weight: 5.0 |
|
threshold_ema_dead_code: 1 |
|
resnet_insertion_index: 4 |
|
unfreeze_resnet_block_indeces: [] |
|
unfreeze_fc: false |
|
lr: 0.0002 |
|
data: |
|
data_dir: "/home/figes/Downloads/ILSVRC2012_CLS-LOC/" |
|
image_size: 224 |
|
num_workers: 6 |
|
batch_size: 512 |
|
shuffle: true |
|
pin_memory: true |
|
drop_last: false |
|
``` |
|
### insert_at_4_nonfrozen_deep_epoch=3-step=7759.ckpt |
|
* small codebook size (64) |
|
* trained to val acc@5 0.8645 acc@1 0.6554 |
|
``` |
|
# lightning.pytorch==2.0.0 |
|
# bigger depth |
|
seed_everything: true |
|
trainer: |
|
callbacks: |
|
- class_path: lightning.pytorch.callbacks.ModelCheckpoint |
|
init_args: |
|
save_last: true |
|
save_top_k: 1 |
|
monitor: v_c_loss |
|
accelerator: auto |
|
strategy: auto |
|
devices: auto |
|
num_nodes: 1 |
|
precision: 16-mixed |
|
logger: null |
|
callbacks: null |
|
fast_dev_run: false |
|
max_epochs: 5 |
|
min_epochs: null |
|
max_steps: -1 |
|
min_steps: null |
|
max_time: null |
|
limit_train_batches: null |
|
limit_val_batches: null |
|
limit_test_batches: null |
|
limit_predict_batches: null |
|
overfit_batches: 0.0 |
|
val_check_interval: 0.1 |
|
check_val_every_n_epoch: 1 |
|
num_sanity_val_steps: null |
|
log_every_n_steps: 15 |
|
enable_checkpointing: true |
|
enable_progress_bar: null |
|
enable_model_summary: null |
|
accumulate_grad_batches: 1 |
|
gradient_clip_val: 1.0 |
|
gradient_clip_algorithm: null |
|
deterministic: null |
|
benchmark: null |
|
inference_mode: true |
|
use_distributed_sampler: true |
|
profiler: null |
|
detect_anomaly: false |
|
barebones: false |
|
plugins: null |
|
sync_batchnorm: false |
|
reload_dataloaders_every_n_epochs: 0 |
|
default_root_dir: ckpt/insert_at_4_nonfrozen_deep |
|
model: |
|
resnet_type: 34 |
|
is_rq: false |
|
quantizer_args: |
|
heads: 8 |
|
use_cosine_sim: false |
|
accept_image_fmap: true |
|
codebook_dim: 128 |
|
codebook_size: 64 |
|
decay: 0.85 |
|
eps: 1.0e-05 |
|
commitment_weight: 0.5 |
|
threshold_ema_dead_code: 1 |
|
sample_codebook_temp: 0.1 |
|
resnet_insertion_index: 4 |
|
unfreeze_resnet_block_indeces: |
|
- 2 |
|
- 3 |
|
unfreeze_fc: true |
|
lr: 0.0001 |
|
data: |
|
data_dir: "/home/figes/Downloads/ILSVRC2012_CLS-LOC/" |
|
image_size: 224 |
|
num_workers: 6 |
|
batch_size: 512 |
|
shuffle: true |
|
pin_memory: true |
|
drop_last: false |
|
``` |
|
|
|
### epoch=1-step=4503.ckpt |
|
* quantizer inserted at ResNet index 3 (`resnet_insertion_index: 3`), all ResNet weights frozen |
|
* ~0.62 validation accuracy |
|
``` |
|
# lightning.pytorch==2.0.0 |
|
seed_everything: true |
|
trainer: |
|
callbacks: |
|
- class_path: lightning.pytorch.callbacks.ModelCheckpoint |
|
init_args: |
|
save_last: true |
|
save_top_k: 1 |
|
monitor: v_c_loss |
|
accelerator: auto |
|
strategy: auto |
|
devices: auto |
|
num_nodes: 1 |
|
precision: 16-mixed |
|
logger: null |
|
callbacks: null |
|
fast_dev_run: false |
|
max_epochs: 10 |
|
min_epochs: null |
|
max_steps: -1 |
|
min_steps: null |
|
max_time: null |
|
limit_train_batches: null |
|
limit_val_batches: null |
|
limit_test_batches: null |
|
limit_predict_batches: null |
|
overfit_batches: 0.0 |
|
val_check_interval: 0.1 |
|
check_val_every_n_epoch: 1 |
|
num_sanity_val_steps: null |
|
log_every_n_steps: 5 |
|
enable_checkpointing: true |
|
enable_progress_bar: null |
|
enable_model_summary: null |
|
accumulate_grad_batches: 1 |
|
gradient_clip_val: 0.5 |
|
gradient_clip_algorithm: null |
|
deterministic: null |
|
benchmark: null |
|
inference_mode: true |
|
use_distributed_sampler: true |
|
profiler: null |
|
detect_anomaly: false |
|
barebones: false |
|
plugins: null |
|
sync_batchnorm: false |
|
reload_dataloaders_every_n_epochs: 0 |
|
default_root_dir: ckpt/test_insert_at_3_frozen |
|
model: |
|
resnet_type: 34 |
|
is_rq: true |
|
quantizer_args: |
|
num_quantizers: 4 |
|
shared_codebook: false |
|
quantize_dropout: true |
|
accept_image_fmap: true |
|
codebook_dim: 128 |
|
codebook_size: 512 |
|
decay: 0.85 |
|
eps: 1.0e-05 |
|
commitment_weight: 25.0 |
|
threshold_ema_dead_code: 2 |
|
sample_codebook_temp: 0.05 |
|
quantize_dropout_cutoff_index: 1 |
|
quantize_dropout_multiple_of: 1 |
|
resnet_insertion_index: 3 |
|
lr: 0.0002 |
|
data: |
|
data_dir: "/home/figes/Downloads/ILSVRC2012_CLS-LOC/" |
|
image_size: 224 |
|
num_workers: 8 |
|
batch_size: 512 |
|
shuffle: true |
|
pin_memory: true |
|
drop_last: false |
|
``` |
|
|
|
|
|
### epoch2-val-63.ckpt |
|
* final val acc .63 |
|
* trained for 2 epochs |
|
* More compressed embedding space, with more dropout |
|
* git hash: `dc54a9bdbfcfbc83c736ac5c06ab09c5acf2d5e8` |
|
``` |
|
# lightning.pytorch==2.0.0 |
|
seed_everything: true |
|
trainer: |
|
callbacks: |
|
- class_path: lightning.pytorch.callbacks.ModelCheckpoint |
|
init_args: |
|
save_last: true |
|
save_top_k: 1 |
|
monitor: v_c_loss |
|
accelerator: auto |
|
strategy: auto |
|
devices: auto |
|
num_nodes: 1 |
|
precision: 16-mixed |
|
logger: null |
|
callbacks: null |
|
fast_dev_run: false |
|
max_epochs: 10 |
|
min_epochs: null |
|
max_steps: -1 |
|
min_steps: null |
|
max_time: null |
|
limit_train_batches: null |
|
limit_val_batches: null |
|
limit_test_batches: null |
|
limit_predict_batches: null |
|
overfit_batches: 0.0 |
|
val_check_interval: 0.1 |
|
check_val_every_n_epoch: 1 |
|
num_sanity_val_steps: null |
|
log_every_n_steps: 5 |
|
enable_checkpointing: true |
|
enable_progress_bar: null |
|
enable_model_summary: null |
|
accumulate_grad_batches: 1 |
|
gradient_clip_val: 0.5 |
|
gradient_clip_algorithm: null |
|
deterministic: null |
|
benchmark: null |
|
inference_mode: true |
|
use_distributed_sampler: true |
|
profiler: null |
|
detect_anomaly: false |
|
barebones: false |
|
plugins: null |
|
sync_batchnorm: false |
|
reload_dataloaders_every_n_epochs: 0 |
|
default_root_dir: ckpt/insert_at_4 |
|
model: |
|
resnet_type: 34 |
|
is_rq: true |
|
quantizer_args: |
|
num_quantizers: 8 |
|
shared_codebook: true |
|
quantize_dropout: false |
|
accept_image_fmap: true |
|
codebook_dim: 128 |
|
codebook_size: 64 |
|
decay: 0.8 |
|
eps: 1.0e-05 |
|
commitment_weight: 5.0 |
|
threshold_ema_dead_code: 1 |
|
sample_codebook_temp: 0.1 |
|
resnet_insertion_index: 4 |
|
unfreeze_resnet_block_indeces: |
|
- 3 |
|
unfreeze_fc: true |
|
lr: 0.0002 |
|
data: |
|
data_dir: "/home/figes/Downloads/ILSVRC2012_CLS-LOC/" |
|
image_size: 224 |
|
num_workers: 6 |
|
batch_size: 512 |
|
shuffle: true |
|
pin_memory: true |
|
drop_last: false |
|
``` |
|
|
|
### epoch=5-step=14765.ckpt |
|
* trained for 5.5 epochs on ImageNet, on top of ResNet-34 |
|
* final validation accuracy: .66 |
|
* final training accuracy: 0.64 |
|
* git hash: `c4852331f9a40393b8ffd8b7b9a689d1ff6e1021` |
|
* config: |
|
``` |
|
# lightning.pytorch==2.0.0 |
|
seed_everything: true |
|
trainer: |
|
callbacks: |
|
- class_path: lightning.pytorch.callbacks.ModelCheckpoint |
|
init_args: |
|
save_last: true |
|
save_top_k: 1 |
|
monitor: v_c_loss |
|
accelerator: auto |
|
strategy: auto |
|
devices: auto |
|
num_nodes: 1 |
|
precision: 16-mixed |
|
logger: null |
|
callbacks: null |
|
fast_dev_run: false |
|
max_epochs: 10 |
|
min_epochs: null |
|
max_steps: -1 |
|
min_steps: null |
|
max_time: null |
|
limit_train_batches: null |
|
limit_val_batches: null |
|
limit_test_batches: null |
|
limit_predict_batches: null |
|
overfit_batches: 0.0 |
|
val_check_interval: 0.1 |
|
check_val_every_n_epoch: 1 |
|
num_sanity_val_steps: null |
|
log_every_n_steps: 5 |
|
enable_checkpointing: true |
|
enable_progress_bar: null |
|
enable_model_summary: null |
|
accumulate_grad_batches: 1 |
|
gradient_clip_val: 0.5 |
|
gradient_clip_algorithm: null |
|
deterministic: null |
|
benchmark: null |
|
inference_mode: true |
|
use_distributed_sampler: true |
|
profiler: null |
|
detect_anomaly: false |
|
barebones: false |
|
plugins: null |
|
sync_batchnorm: false |
|
reload_dataloaders_every_n_epochs: 0 |
|
default_root_dir: ckpt/test_insert_at_4 |
|
model: |
|
resnet_type: 34 |
|
is_rq: true |
|
quantizer_args: |
|
num_quantizers: 4 |
|
shared_codebook: true |
|
quantize_dropout: false |
|
accept_image_fmap: true |
|
codebook_dim: 128 |
|
codebook_size: 256 |
|
decay: 0.8 |
|
eps: 1.0e-05 |
|
commitment_weight: 5.0 |
|
threshold_ema_dead_code: 1 |
|
sample_codebook_temp: 0.0 |
|
resnet_insertion_index: 4 |
|
unfreeze_resnet_block_indeces: |
|
- 3 |
|
unfreeze_fc: true |
|
lr: 0.0002 |
|
data: |
|
data_dir: "/home/figes/Downloads/ILSVRC2012_CLS-LOC/" |
|
image_size: 224 |
|
num_workers: 8 |
|
batch_size: 512 |
|
shuffle: true |
|
pin_memory: true |
|
drop_last: false |
|
``` |