import torch from torch import nn from torch.nn import functional as F import pytorch_lightning as pl import torchmetrics from torch.optim.lr_scheduler import OneCycleLR from torchmetrics.functional import accuracy class ResBlock(nn.Module): def __init__(self, in_channel, out_channel, stride=1): super(ResBlock, self).__init__() self.conv = nn.Sequential( nn.Conv2d(in_channel, in_channel, kernel_size=3, stride=1, padding=1, bias=False), nn.BatchNorm2d(in_channel), nn.ReLU(), nn.Conv2d(in_channel, out_channel, kernel_size=3, stride=1, padding=1, bias=False), nn.BatchNorm2d(out_channel), nn.ReLU(), ) def forward(self, x): return(self.conv(x)) class ResNet18(pl.LightningModule): def __init__(self, train_loader_len, criterion, num_classes=10, lr=0.001, max_lr=1.45E-03): super().__init__() self.save_hyperparameters(ignore=['criterion']) self.criterion = criterion self.train_loader_len = train_loader_len self.accuracy = torchmetrics.Accuracy(task="multiclass", num_classes=self.hparams.num_classes) self.prep_layer = nn.Sequential( nn.Conv2d(3, 64, kernel_size=3, stride=1, padding=1, bias=False), nn.BatchNorm2d(64), nn.ReLU() ) self.layer_one = nn.Sequential( nn.Conv2d(64, 128, kernel_size=3, stride=1, padding=1, bias=False), nn.MaxPool2d(2,2), nn.BatchNorm2d(128), nn.ReLU() ) self.res_block1 = ResBlock(128, 128) self.layer_two = nn.Sequential( nn.Conv2d(128, 256, kernel_size=3, stride=1, padding=1, bias=False), nn.MaxPool2d(2,2), nn.BatchNorm2d(256), nn.ReLU() ) self.layer_three = nn.Sequential( nn.Conv2d(256, 512, kernel_size=3, stride=1, padding=1, bias=False), nn.MaxPool2d(2,2), nn.BatchNorm2d(512), nn.ReLU() ) self.res_block2 = ResBlock(512, 512) self.max_pool = nn.MaxPool2d(4,4) self.fc = nn.Linear(512, num_classes, bias=False) def forward(self, x): x = self.prep_layer(x) x = self.layer_one(x) R1 = self.res_block1(x) x = x + R1 x = self.layer_two(x) x = self.layer_three(x) R2 = self.res_block2(x) x = x + R2 x = self.max_pool(x) x = x.view(x.size(0), -1) x = self.fc(x) return(x) def configure_optimizers(self): optimizer = torch.optim.Adam(self.parameters(), lr=self.hparams.lr, weight_decay=1e-4) scheduler = OneCycleLR( optimizer, max_lr=self.hparams.max_lr, epochs=self.trainer.max_epochs, steps_per_epoch=self.train_loader_len, pct_start=5/self.trainer.max_epochs, div_factor=100, three_phase=False, ) if self.hparams.max_lr==1.45E-03: return(optimizer) else: return([optimizer], [scheduler]) def training_step(self, train_batch, batch_idx): data, target = train_batch y_pred = self(data) loss = self.criterion(y_pred, target) pred = torch.argmax(y_pred.squeeze(), dim=1) acc = accuracy(pred, target, task="multiclass", num_classes=self.hparams.num_classes) self.log('train_loss', loss, prog_bar=True, on_step=False, on_epoch=True) self.log('train_acc', acc, prog_bar=True, on_step=False, on_epoch=True) return(loss) def validation_step(self, batch, batch_idx): return(self.evaluate(batch, 'val')) def test_step(self, batch, batch_idx): return(self.evaluate(batch, 'test')) def evaluate(self, batch, stage=None): data, target = batch y_pred = self(data) loss = self.criterion(y_pred, target).item() pred = torch.argmax(y_pred.squeeze(), dim=1) acc = accuracy(pred, target, task="multiclass", num_classes=self.hparams.num_classes) if stage: self.log(f"{stage}_loss", loss, prog_bar=True, on_step=False, on_epoch=True) self.log(f"{stage}_acc", acc, prog_bar=True, on_step=False, on_epoch=True) return pred, target