readme citation url change

Files changed (12) hide show

.gitignore +3 -0
README.md +70 -0
__init__.py +0 -0
analytics.png +0 -0
analytics.py +23 -0
blocknet10.py +58 -0
config.json +5 -0
dataloader.py +30 -0
figures/eq1.png +0 -0
figures/fig1.png +0 -0
main.py +102 -0
model_state_dict.pth +3 -0

.gitignore ADDED Viewed

	@@ -0,0 +1,3 @@

+data/
+push_to_hf.py
+*.ipynb

README.md ADDED Viewed

	@@ -0,0 +1,70 @@

+# BlockNet10 - CNN for CIFAR-10 dataset
+## Overview
+BlockNet10 is a neural network architecture designed for image classification tasks using the CIFAR-10 dataset. This model implements a sequence of intermediate blocks (B1, B2, ..., BK) followed by an output block (O).
+## Architecture Details
+### Intermediate Block (Bi)
+Each intermediate block receives an input image x and outputs an image x'. The block comprises L independent convolutional layers, denoted as C1, C2, ..., CL.
+Each convolutional layer Cl in a block operates on the input image x and outputs an image Cl(x).
+<div style="display: flex; justify-content: center;">
+  <img src="figures/eq1.png" alt="Equation 1" />
+</div>
+The output image x' is computed as x' = a1C1(x) + a2C2(x) + ... + aLCL(x), where a = [a1, a2, ..., aL]^T is a vector of L coefficients computed by the block.
+The vector a is obtained by computing the average value of each channel of x and passing it through a fully connected layer with the same number of units as convolutional layers in the block.
+<div style="display: flex; justify-content: center;">
+  <img src="figures/fig1.png" alt="Figure 1" />
+</div>
+### Output Block (O)
+The output block processes the final output image from the intermediate blocks for classification.
+## Analytics
+<div style="display: flex; justify-content: center; align-items: center;">
+  <table>
+    <tr>
+      <th>Epoch Number</th>
+      <th>Train Accuracy</th>
+      <th>Test Accuracy</th>
+      <th>Average Loss</th>
+    </tr>
+    <tr>
+      <td>50</td>
+      <td>75.43</td>
+      <td>80.56</td>
+      <td>0.685</td>
+    </tr>
+  </table>
+</div>
+## Clone on GitHub
+You can contribute improvements to this architecture, tune its hyperparameters, or help resolve open issues <a href="https://github.com/siddheshtv/cifar10" target="_blank">here</a>.
+## Citation
+If you use BlockNet10 in your research or work, please cite it as follows:
+```bibtex
+@article{blocknet10,
+  title={BlockNet10: CIFAR-10 Image Classifier},
+  author={Siddhesh Kulthe},
+  year={2024},
+  publisher={Hugging Face},
+  url={https://huggingface.co/siddheshtv/BlockNet10}
+}
+```
+---
+## License
+MIT

__init__.py ADDED Viewed

File without changes

analytics.png ADDED Viewed

analytics.py ADDED Viewed

	@@ -0,0 +1,23 @@

+import matplotlib.pyplot as plt
+def model_analytics(train_losses, train_accuracies, test_accuracies):
+    plt.figure(figsize=(10, 5))
+    plt.subplot(1, 2, 1)
+    plt.plot(train_losses, label='Training Loss')
+    plt.xlabel('Batch')
+    plt.ylabel('Loss')
+    plt.title('Loss per Training Batch')
+    plt.legend()
+    plt.subplot(1, 2, 2)
+    plt.plot(train_accuracies, label='Training Accuracy')
+    plt.plot(test_accuracies, label='Test Accuracy')
+    plt.xlabel('Epoch')
+    plt.ylabel('Accuracy (%)')
+    plt.title('Training and Test Accuracies')
+    plt.legend()
+    plt.tight_layout()
+    plt.savefig("analytics.png")
+    return "✅ Figure saved successfully"

blocknet10.py ADDED Viewed

	@@ -0,0 +1,58 @@

+import torch
+import torch.nn as nn
+import torch.nn.functional as F
+from huggingface_hub import PyTorchModelHubMixin
+class IntermediateBlock(nn.Module):
+    def __init__(self, in_channels, num_conv_layers, conv_params):
+        super(IntermediateBlock, self).__init__()
+        self.conv_layers = nn.ModuleList([nn.Conv2d(in_channels, *conv_params) for _ in range(num_conv_layers)])
+        self.batch_norms = nn.ModuleList([nn.BatchNorm2d(conv_params[0]) for _ in range(num_conv_layers)])
+        out_channels = conv_params[0]
+        self.fc = nn.Linear(in_channels, out_channels)
+    def forward(self, x):
+        batch_size = x.size(0)
+        channel_means = x.mean(dim=[2, 3])
+        a = self.fc(channel_means)
+        x_out = torch.stack([F.leaky_relu(conv(x)) for conv in self.conv_layers], dim=-1).sum(dim=-1)
+        x_out = torch.stack([bn(x_out) for bn in self.batch_norms], dim=-1).sum(dim=-1)
+        return x_out * F.leaky_relu(a.view(batch_size, -1, 1, 1))
+class OutputBlock(nn.Module):
+    def __init__(self, in_channels, num_classes, hidden_sizes=[]):
+        super(OutputBlock, self).__init__()
+        self.fc_layers = nn.ModuleList([nn.Linear(in_channels, hidden_sizes[0])] + [nn.Linear(hidden_sizes[i], hidden_sizes[i+1]) for i in range(len(hidden_sizes)-1)] + [nn.Linear(hidden_sizes[-1], num_classes)])
+        self.batch_norms = nn.ModuleList([nn.BatchNorm1d(size) for size in hidden_sizes])
+    def forward(self, x):
+        channel_means = x.mean(dim=[2, 3])
+        out = F.leaky_relu(channel_means)
+        for fc, bn in zip(self.fc_layers, self.batch_norms):
+            out = F.leaky_relu(bn(fc(out)))
+        return out
+class CustomCIFAR10Net(nn.Module, PyTorchModelHubMixin):
+    def __init__(self, num_classes=10):
+        super(CustomCIFAR10Net, self).__init__()
+        self.intermediate_blocks = nn.ModuleList([
+            IntermediateBlock(3, 3, [64, 3, 3, 1, 1]),
+            IntermediateBlock(64, 3, [128, 3, 3, 1, 1]),
+            IntermediateBlock(128, 3, [256, 3, 3, 1, 1]),
+            IntermediateBlock(256, 3, [512, 3, 3, 1, 1]),
+            IntermediateBlock(512, 3, [1024, 3, 3, 1, 1])
+        ])
+        self.output_block = OutputBlock(1024, num_classes, [512, 256])
+        self.dropout = nn.Dropout(0.5)
+        for m in self.modules():
+            if isinstance(m, nn.Conv2d) or isinstance(m, nn.Linear):
+                nn.init.kaiming_normal_(m.weight, mode='fan_in', nonlinearity='relu')
+    def forward(self, x):
+        for block in self.intermediate_blocks:
+            x = block(x)
+            x = self.dropout(x)
+        x = self.output_block(x)
+        return x

config.json ADDED Viewed

	@@ -0,0 +1,5 @@

+{
+  "architectures": ["BlockNet10"],
+  "hidden_size": 1024,
+  "num_classes": 10
+}

dataloader.py ADDED Viewed

	@@ -0,0 +1,30 @@

+import torch
+from torchvision import datasets
+import torchvision.transforms as transforms
+batch_size = 128  # Mini-batch size used by both loaders built in data_loader().
+def data_transform():
+    transform_train = transforms.Compose([
+    transforms.RandomHorizontalFlip(),
+    transforms.RandomRotation(10),
+    transforms.RandomCrop(32, padding=4),
+    transforms.ColorJitter(brightness=0.2, contrast=0.2, saturation=0.2, hue=0.1),
+    transforms.ToTensor(),
+    transforms.Normalize((0.5, 0.5, 0.5), (0.5, 0.5, 0.5))
+    ])
+    transform_test = transforms.Compose([
+        transforms.ToTensor(),
+        transforms.Normalize((0.5, 0.5, 0.5), (0.5, 0.5, 0.5))
+    ])
+    return transform_train, transform_test
+def data_loader(transform_train, transform_test):
+    train_dataset = datasets.CIFAR10(root='./data', train=True, download=True, transform=transform_train)
+    test_dataset = datasets.CIFAR10(root='./data', train=False, download=True, transform=transform_test)
+    train_loader = torch.utils.data.DataLoader(train_dataset, batch_size=batch_size, shuffle=True, num_workers=2)
+    test_loader = torch.utils.data.DataLoader(test_dataset, batch_size=batch_size, shuffle=False, num_workers=2)
+    return train_loader, test_loader

figures/eq1.png ADDED Viewed

figures/fig1.png ADDED Viewed

main.py ADDED Viewed

	@@ -0,0 +1,102 @@

+import torch
+import torch.nn as nn
+import torch.optim as optim
+import torch.optim.lr_scheduler as lr_scheduler
+from dataloader import batch_size
+from dataloader import data_transform, data_loader
+from blocknet10 import CustomCIFAR10Net
+from analytics import model_analytics
+from push_to_hf import HF
+# Seed PyTorch's global RNG before any model or data loader is created.
+torch.manual_seed(42)
+# Use CUDA when it is available, otherwise fall back to the CPU.
+device = torch.device("cuda" if torch.cuda.is_available() else "cpu")
+print(f"Using device: {device}")
+# Build the transforms and the loaders as soon as the script runs.
+transform_train, transform_test = data_transform()
+train_loader, test_loader = data_loader(transform_train, transform_test)
+def arch_tester():
+    model = CustomCIFAR10Net()
+    input_data = torch.randn(batch_size, 3, 32, 32)
+    output = model(input_data)
+    return output.shape
+# Smoke-test the architecture on random input before training starts.
+arch_tester_output = arch_tester()
+print(arch_tester_output)
+# The model that is actually trained, moved to the selected device.
+model = CustomCIFAR10Net().to(device)
+criterion = nn.CrossEntropyLoss()
+optimizer = optim.AdamW(model.parameters(), lr=0.01, betas=(0.8, 0.95), weight_decay=0.0005, amsgrad=True, eps=1e-8)
+# NOTE(review): T_max is 200 while num_epochs is 50 and the scheduler is
+# stepped once per epoch, so only the first quarter of the cosine period is
+# traversed - confirm this is intended.
+scheduler = lr_scheduler.CosineAnnealingLR(optimizer, T_max=200)
+# Histories handed to model_analytics() after training.
+train_losses = []
+train_accuracies = []
+test_accuracies = []
+num_epochs = 50
+# Total number of optimizer steps; used only in the progress message.
+total_steps = len(train_loader) * num_epochs
+# Global step counter that keeps running across epochs.
+step_count = 0
+for epoch in range(num_epochs):
+    running_loss = 0.0
+    correct_train = 0
+    total_train = 0
+    for i, (inputs, labels) in enumerate(train_loader, 0):
+        inputs, labels = inputs.to(device), labels.to(device)
+        optimizer.zero_grad()
+        outputs = model(inputs)
+        loss = criterion(outputs, labels)
+        loss.backward()
+        optimizer.step()
+        running_loss += loss.item()
+        step_count += 1
+        if step_count % 100 == 0:
+            train_losses.append(running_loss / 100)
+            print(f'[Epoch: {epoch + 1}, Step: {step_count:5d}/{total_steps}] loss: {running_loss / 100:.3f}')
+            running_loss = 0.0
+        if i == len(train_loader) - 1:
+            model.eval()
+            with torch.no_grad():
+                for images, labels in train_loader:
+                    images, labels = images.to(device), labels.to(device)
+                    outputs = model(images)
+                    _, predicted = torch.max(outputs.data, 1)
+                    total_train += labels.size(0)
+                    correct_train += (predicted == labels).sum().item()
+            train_accuracy = 100 * correct_train / total_train
+            train_accuracies.append(train_accuracy)
+    scheduler.step()
+    model.eval()
+    correct_test = 0
+    total_test = 0
+    with torch.no_grad():
+        for images, labels in test_loader:
+            images, labels = images.to(device), labels.to(device)
+            outputs = model(images)
+            _, predicted = torch.max(outputs.data, 1)
+            total_test += labels.size(0)
+            correct_test += (predicted == labels).sum().item()
+    test_accuracy = 100 * correct_test / total_test
+    test_accuracies.append(test_accuracy)
+    print(f'Epoch {epoch + 1}: Test Accuracy = {test_accuracy:.2f}%')
+# Report the most recent value of each history; indexing with [-1] raises
+# IndexError if a list is still empty (e.g. fewer than 100 steps were run).
+print("Last Train Losses:" + str(train_losses[-1]))
+print("Last Train Accuracy:" + str(train_accuracies[-1]))
+print("Last Test Accuracy:" + str(test_accuracies[-1]))
+# Saves the training curves; the returned status string is not used.
+analytics = model_analytics(train_losses, train_accuracies, test_accuracies)
+# NOTE(review): push_to_hf.py is listed in .gitignore, so the HF helper is not
+# part of this commit and its behaviour cannot be checked from here.
+huggingface = HF()
+push_to_face = huggingface.push_to_face(model=model)
+print(push_to_face)

model_state_dict.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:7be1849972498ca04e513cf1cf3a49d626f011f0ba337a404412791c810d0df4
+size 80831147