zgcr654321 committed
Commit f6451f4
Parent(s): e9b55c8
Upload 8 files
- imagenet/vit_tiny_patch16_lion_for_mae_pretrain/__pycache__/train_config.cpython-38.pyc +0 -0
- imagenet/vit_tiny_patch16_lion_for_mae_pretrain/checkpoints/latest.pth +3 -0
- imagenet/vit_tiny_patch16_lion_for_mae_pretrain/checkpoints/vit_tiny_patch16-acc68.614.pth +3 -0
- imagenet/vit_tiny_patch16_lion_for_mae_pretrain/log/train.info.log +0 -0
- imagenet/vit_tiny_patch16_lion_for_mae_pretrain/test.sh +1 -0
- imagenet/vit_tiny_patch16_lion_for_mae_pretrain/test_config.py +57 -0
- imagenet/vit_tiny_patch16_lion_for_mae_pretrain/train.sh +1 -0
- imagenet/vit_tiny_patch16_lion_for_mae_pretrain/train_config.py +140 -0
imagenet/vit_tiny_patch16_lion_for_mae_pretrain/__pycache__/train_config.cpython-38.pyc
ADDED
Binary file (3.33 kB)
imagenet/vit_tiny_patch16_lion_for_mae_pretrain/checkpoints/latest.pth
ADDED
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:943d722e66681f77a60189365a01aa8b25bb4181725bde55afad0bdbcc68a9d5
+size 45900719
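The .pth checkpoints are committed as Git LFS pointers: the repository stores only a version line, the sha256 oid of the real file, and its byte size, while git lfs pull fetches the actual 45.9 MB blob. A downloaded file can be checked against the pointer with a few lines of Python (the helper below is a sketch of ours, not part of the repo):

import hashlib
import os

def verify_lfs_file(path, expected_oid, expected_size):
    # Compare a fetched file against the Git LFS pointer's sha256 oid and size.
    if os.path.getsize(path) != expected_size:
        return False
    sha256 = hashlib.sha256()
    with open(path, 'rb') as f:
        for chunk in iter(lambda: f.read(1 << 20), b''):
            sha256.update(chunk)
    return sha256.hexdigest() == expected_oid

# Values copied from the pointer above.
print(verify_lfs_file(
    'checkpoints/latest.pth',
    '943d722e66681f77a60189365a01aa8b25bb4181725bde55afad0bdbcc68a9d5',
    45900719))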
imagenet/vit_tiny_patch16_lion_for_mae_pretrain/checkpoints/vit_tiny_patch16-acc68.614.pth
ADDED
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:5caf604d12a2beb6776fdf051c5a176c81b088c8f2c2e1c9fff444a0897eb5d4
+size 22915267
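This second checkpoint records its ImageNet-1K top-1 accuracy (68.614%) in its filename; latest.pth is roughly twice its size, which would be consistent with it also carrying training state, though the diff shows only the pointers. Once fetched, a checkpoint can be inspected on CPU; the dict layout below is guessed for illustration, since the saving code is not part of this diff:

import torch

checkpoint = torch.load('checkpoints/vit_tiny_patch16-acc68.614.pth',
                        map_location='cpu')
# The file may be a raw state_dict or a wrapper dict; unwrap a 'model'
# entry if one exists (key name assumed, not confirmed by this diff).
state_dict = checkpoint.get('model', checkpoint)
for name in list(state_dict)[:5]:
    print(name, tuple(state_dict[name].shape))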
imagenet/vit_tiny_patch16_lion_for_mae_pretrain/log/train.info.log
ADDED
The diff for this file is too large to render.
imagenet/vit_tiny_patch16_lion_for_mae_pretrain/test.sh
ADDED
@@ -0,0 +1 @@
+OMP_NUM_THREADS=1 CUDA_VISIBLE_DEVICES=0 python -m torch.distributed.run --nproc_per_node=1 --master_addr 127.0.1.0 --master_port 10000 ../../../tools/test_classification_model.py --work-dir ./
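This launch line (and the identical one in train.sh below) goes through torch.distributed.run, which spawns --nproc_per_node worker processes and passes each one its rank through environment variables, with MASTER_ADDR/MASTER_PORT taken from the --master_addr/--master_port flags. Scaling out means listing more devices in CUDA_VISIBLE_DEVICES and raising --nproc_per_node to match. A minimal sketch of the process-group setup the tools/ entry points (whose code is not in this diff) would typically perform:

import os
import torch
import torch.distributed as dist

# torch.distributed.run exports LOCAL_RANK, RANK and WORLD_SIZE per worker;
# init_process_group picks up MASTER_ADDR/MASTER_PORT from the environment.
local_rank = int(os.environ['LOCAL_RANK'])
torch.cuda.set_device(local_rank)
dist.init_process_group(backend='nccl')
print(f'worker {dist.get_rank()} of {dist.get_world_size()} ready')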
imagenet/vit_tiny_patch16_lion_for_mae_pretrain/test_config.py
ADDED
@@ -0,0 +1,57 @@
+import os
+import sys
+
+BASE_DIR = os.path.dirname(
+    os.path.dirname(os.path.dirname(os.path.dirname(
+        os.path.abspath(__file__)))))
+sys.path.append(BASE_DIR)
+
+from tools.path import ILSVRC2012_path
+
+from simpleAICV.classification import backbones
+from simpleAICV.classification import losses
+from simpleAICV.classification.datasets.ilsvrc2012dataset import ILSVRC2012Dataset
+from simpleAICV.classification.common import Opencv2PIL, TorchResize, TorchCenterCrop, TorchMeanStdNormalize, ClassificationCollater, load_state_dict
+
+import torch
+import torchvision.transforms as transforms
+
+
+class config:
+    '''
+    for resnet, input_image_size = 224; for darknet, input_image_size = 256
+    '''
+    network = 'vit_tiny_patch16'
+    num_classes = 1000
+    input_image_size = 224
+    scale = 256 / 224
+
+    model = backbones.__dict__[network](**{
+        'image_size': 224,
+        'global_pool': True,
+        'num_classes': num_classes,
+    })
+
+    # load pretrained model or not
+    trained_model_path = ''
+    load_state_dict(trained_model_path, model)
+
+    test_criterion = losses.__dict__['CELoss']()
+
+    test_dataset = ILSVRC2012Dataset(
+        root_dir=ILSVRC2012_path,
+        set_name='val',
+        transform=transforms.Compose([
+            Opencv2PIL(),
+            TorchResize(resize=input_image_size * scale),
+            TorchCenterCrop(resize=input_image_size),
+            TorchMeanStdNormalize(mean=[0.485, 0.456, 0.406],
+                                  std=[0.229, 0.224, 0.225]),
+        ]))
+    test_collater = ClassificationCollater()
+
+    seed = 0
+    # batch_size is total size
+    batch_size = 256
+    # num_workers is total workers
+    num_workers = 10
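The scale = 256 / 224 factor encodes the standard ImageNet evaluation recipe: resize so the image is 256 on its shorter side (224 * 256 / 224), then center-crop to 224. TorchResize, TorchCenterCrop and TorchMeanStdNormalize are simpleAICV wrappers; the equivalent pipeline in stock torchvision looks roughly like this (a sketch, not the repo's code):

import torchvision.transforms as transforms

input_image_size = 224
scale = 256 / 224

# Resize the short side to 256, center-crop 224x224, then apply the usual
# ImageNet mean/std normalization.
eval_transform = transforms.Compose([
    transforms.Resize(int(input_image_size * scale)),
    transforms.CenterCrop(input_image_size),
    transforms.ToTensor(),
    transforms.Normalize(mean=[0.485, 0.456, 0.406],
                         std=[0.229, 0.224, 0.225]),
])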
imagenet/vit_tiny_patch16_lion_for_mae_pretrain/train.sh
ADDED
@@ -0,0 +1 @@
+OMP_NUM_THREADS=1 CUDA_VISIBLE_DEVICES=0 python -m torch.distributed.run --nproc_per_node=1 --master_addr 127.0.1.0 --master_port 10000 ../../../tools/train_classification_model.py --work-dir ./
imagenet/vit_tiny_patch16_lion_for_mae_pretrain/train_config.py
ADDED
@@ -0,0 +1,140 @@
+import os
+import sys
+
+BASE_DIR = os.path.dirname(
+    os.path.dirname(os.path.dirname(os.path.dirname(
+        os.path.abspath(__file__)))))
+sys.path.append(BASE_DIR)
+
+from tools.path import ILSVRC2012_path
+
+from simpleAICV.classification import backbones
+from simpleAICV.classification import losses
+from simpleAICV.classification.datasets.ilsvrc2012dataset import ILSVRC2012Dataset
+from simpleAICV.classification.common import Opencv2PIL, TorchRandomResizedCrop, TorchRandomHorizontalFlip, RandAugment, TorchResize, TorchCenterCrop, TorchMeanStdNormalize, RandomErasing, ClassificationCollater, MixupCutmixClassificationCollater, load_state_dict
+
+import torch
+import torchvision.transforms as transforms
+
+
+class config:
+    network = 'vit_tiny_patch16'
+    num_classes = 1000
+    input_image_size = 224
+    scale = 256 / 224
+
+    model = backbones.__dict__[network](**{
+        'image_size': 224,
+        'drop_path_prob': 0.1,
+        'global_pool': True,
+        'num_classes': num_classes,
+    })
+
+    # load pretrained model or not
+    trained_model_path = '/root/code/SimpleAICV_pytorch_training_examples_on_ImageNet_COCO_ADE20K/pretrained_models/vit_mae_pretrain_on_imagenet1k/vit_tiny_patch16_224_mae_pretrain_model-loss0.427_encoder.pth'
+    load_state_dict(trained_model_path,
+                    model,
+                    loading_new_input_size_position_encoding_weight=True)
+
+    train_criterion = losses.__dict__['OneHotLabelCELoss']()
+    test_criterion = losses.__dict__['CELoss']()
+
+    train_dataset = ILSVRC2012Dataset(
+        root_dir=ILSVRC2012_path,
+        set_name='train',
+        transform=transforms.Compose([
+            Opencv2PIL(),
+            TorchRandomResizedCrop(resize=input_image_size),
+            TorchRandomHorizontalFlip(prob=0.5),
+            RandAugment(magnitude=9,
+                        num_layers=2,
+                        resize=input_image_size,
+                        mean=[0.485, 0.456, 0.406],
+                        integer=True,
+                        weight_idx=None,
+                        magnitude_std=0.5,
+                        magnitude_max=None),
+            TorchMeanStdNormalize(mean=[0.485, 0.456, 0.406],
+                                  std=[0.229, 0.224, 0.225]),
+            RandomErasing(prob=0.25, mode='pixel', max_count=1),
+        ]))
+
+    test_dataset = ILSVRC2012Dataset(
+        root_dir=ILSVRC2012_path,
+        set_name='val',
+        transform=transforms.Compose([
+            Opencv2PIL(),
+            TorchResize(resize=input_image_size * scale),
+            TorchCenterCrop(resize=input_image_size),
+            TorchMeanStdNormalize(mean=[0.485, 0.456, 0.406],
+                                  std=[0.229, 0.224, 0.225]),
+        ]))
+
+    train_collater = MixupCutmixClassificationCollater(
+        use_mixup=True,
+        mixup_alpha=0.8,
+        cutmix_alpha=1.0,
+        cutmix_minmax=None,
+        mixup_cutmix_prob=1.0,
+        switch_to_cutmix_prob=0.5,
+        mode='batch',
+        correct_lam=True,
+        label_smoothing=0.1,
+        num_classes=1000)
+    test_collater = ClassificationCollater()
+
+    seed = 0
+    # batch_size is total size
+    batch_size = 512
+    # num_workers is total workers
+    num_workers = 10
+    accumulation_steps = 8
+
+    optimizer = (
+        'Lion',
+        {
+            'lr':
+            4e-4,
+            'global_weight_decay':
+            False,
+            # if global_weight_decay = False,
+            # all bias, bn and other 1d params have weight decay set to 0
+            'weight_decay':
+            5e-2,
+            # lr_layer_decay only supports vit style models
+            'lr_layer_decay':
+            0.65,
+            'lr_layer_decay_block':
+            model.blocks,
+            'block_name':
+            'blocks',
+            'no_weight_decay_layer_name_list': [
+                'position_encoding',
+                'cls_token',
+            ],
+        },
+    )
+
+    scheduler = (
+        'CosineLR',
+        {
+            'warm_up_epochs': 5,
+            'min_lr': 1e-6,
+        },
+    )
+
+    epochs = 100
+    print_interval = 10
+
+    sync_bn = False
+    use_amp = True
+    use_compile = False
+    compile_params = {
+        # 'default': optimizes for large models; low compile time and no extra memory usage.
+        # 'reduce-overhead': reduces framework overhead and uses some extra memory; helps speed up small models, but model updates may not be correct.
+        # 'max-autotune': produces the fastest model, but takes a very long time to compile and may fail.
+        'mode': 'default',
+    }
+
+    use_ema_model = False
+    ema_model_decay = 0.9999
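Two numbers in this config are worth unpacking. First, gradients are accumulated over accumulation_steps = 8 batches of 512 images, so the Lion optimizer steps with an effective batch size of 512 * 8 = 4096. Second, lr_layer_decay = 0.65 gives earlier transformer blocks geometrically smaller learning rates than later ones, the usual recipe for fine-tuning MAE-pretrained ViTs, while CosineLR warms up linearly for 5 epochs and then decays to min_lr. A sketch of both schedules under common conventions (simpleAICV's exact implementations live in its training tools, which this diff does not include; the depth of 12 blocks for vit_tiny_patch16 is assumed):

import math

base_lr, min_lr = 4e-4, 1e-6
warm_up_epochs, epochs = 5, 100
lr_layer_decay, num_blocks = 0.65, 12  # vit_tiny depth assumed

def cosine_lr(epoch):
    # Linear warmup, then cosine decay to min_lr (one common parameterization).
    if epoch < warm_up_epochs:
        return base_lr * (epoch + 1) / warm_up_epochs
    t = (epoch - warm_up_epochs) / (epochs - warm_up_epochs)
    return min_lr + 0.5 * (base_lr - min_lr) * (1 + math.cos(math.pi * t))

def block_lr(block_idx, epoch):
    # Block 0 gets the deepest decay; the head would keep the full lr.
    return cosine_lr(epoch) * lr_layer_decay**(num_blocks - block_idx)

print(f'epoch 0 lr: {cosine_lr(0):.2e}, epoch 5 lr: {cosine_lr(5):.2e}')
print(f'block 0 lr at epoch 5: {block_lr(0, 5):.2e}')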