Jensen-holm committed on
Commit 895afd0
1 Parent(s): 1720a63

Creating a neural network for the men's data, predicting the Win column


Trained for 10k epochs on my M1 MacBook with Metal GPU acceleration.
Next we need to compare this model's performance against a baseline model
that just blindly picks chalk (the better seed) to win.
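
To make that comparison concrete, a minimal sketch of such a chalk baseline could look like the following. This is illustrative only: the Seed / OppSeed column names and the mns_games_df frame are assumptions, not code from this repo.

    import pandas as pd

    def chalk_baseline(games: pd.DataFrame) -> pd.Series:
        # pick chalk: predict a win whenever the team holds the better
        # (lower-numbered) seed; ties are predicted as losses
        return (games["Seed"] < games["OppSeed"]).astype(int)

    # compare against the same Win column the network trains on, e.g.:
    # baseline_acc = (chalk_baseline(mns_games_df) == mns_games_df["Win"]).mean()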

models/{scoreDist30k.pth → nn10k.pth} RENAMED
@@ -1,3 +1,3 @@
  version https://git-lfs.github.com/spec/v1
- oid sha256:d11fcf0f9b0ea5b93de0cbfbbaed4447f48ebc03c53be688981c3ceddbc287f7
- size 39998
+ oid sha256:72062bda8133544b2241172907c3614855527a51357bebddaac0e46a7a9ea29f
+ size 18898
src/nn.ipynb CHANGED
@@ -25,7 +25,7 @@
  "name": "stderr",
  "output_type": "stream",
  "text": [
- "/var/folders/v8/0hd98b512cn3ms2rz146k7jw0000gn/T/ipykernel_23752/685274063.py:1: DtypeWarning: Columns (481,482,483) have mixed types. Specify dtype option on import or set low_memory=False.\n",
+ "/var/folders/v8/0hd98b512cn3ms2rz146k7jw0000gn/T/ipykernel_41770/685274063.py:1: DtypeWarning: Columns (481,482,483) have mixed types. Specify dtype option on import or set low_memory=False.\n",
  " detailed_games_df = pd.read_csv(\n"
  ]
  },
@@ -66,6 +66,13 @@
  "wmns_games_df = detailed_games_df[detailed_games_df[\"League\"] == \"W\"]"
  ]
  },
+ {
+ "cell_type": "markdown",
+ "metadata": {},
+ "source": [
+ "## Define Features, Targets, and register data on device"
+ ]
+ },
  {
  "cell_type": "code",
  "execution_count": 4,
@@ -78,6 +85,11 @@
  "    \"FGMDiff mean reg\",\n",
  "    \"FGM3Diff mean reg\",\n",
  "    \"TODiff mean reg\",\n",
+ "\n",
+ "    \"OppScore mean reg\",\n",
+ "    \"OppFGM mean reg\",\n",
+ "    \"OppFGM3 mean reg\",\n",
+ "    \"OppTO mean reg\",\n",
  "]\n",
  "\n",
  "target_cols = [\"Win\"]"
@@ -108,52 +120,70 @@
  },
  {
  "cell_type": "code",
- "execution_count": 6,
+ "execution_count": null,
  "metadata": {},
  "outputs": [],
  "source": [
  "# convert data to tensor objects and register to device\n",
- "DEVICE = \"cuda\" if torch.cuda.is_available() else \"cpu\"\n",
+ "# DEVICE = \"cuda\" if torch.cuda.is_available() else \"cpu\"\n",
+ "\n",
+ "def get_device() -> str:\n",
+ "    if torch.cuda.is_available():\n",
+ "        return \"cuda\"\n",
+ "    if torch.backends.mps.is_available():\n",
+ "        return \"mps\"\n",
+ "    return \"cpu\"\n",
+ "\n",
+ "DEVICE = get_device()\n",
+ "print(DEVICE)"
+ ]
+ },
+ {
+ "cell_type": "code",
+ "execution_count": 6,
+ "metadata": {},
+ "outputs": [],
+ "source": [
  "\n",
  "MX_train_T = torch.tensor(\n",
- "    MX_train.values,\n",
- "    dtype=float,\n",
+ "    MX_train.astype(float).values,\n",
+ "    dtype=torch.float32,\n",
  ").to(DEVICE)\n",
  "\n",
  "MX_test_T = torch.tensor(\n",
- "    MX_test.values,\n",
- "    dtype=float,\n",
+ "    MX_test.astype(float).values,\n",
+ "    dtype=torch.float32,\n",
  ").to(DEVICE)\n",
  "\n",
  "My_train_T = torch.tensor(\n",
- "    My_train.values,\n",
- "    dtype=float,\n",
+ "    My_train.astype(float).values,\n",
+ "    dtype=torch.float32,\n",
  ").to(DEVICE)\n",
  "\n",
  "My_test_T = torch.tensor(\n",
- "    My_test.values,\n",
- "    dtype=float,\n",
+ "    My_test.astype(float).values,\n",
+ "    dtype=torch.float32,\n",
  ").to(DEVICE)\n",
  "\n",
- "# same for womens data\n",
- "Wy_test_T = torch.tensor(\n",
- "    Wy_test.values,\n",
- "    dtype=float,\n",
+ "# # same for womens data\n",
+ "WX_train_T = torch.tensor(\n",
+ "    WX_train.values,\n",
+ "    dtype=torch.float32,\n",
  ").to(DEVICE)\n",
  "\n",
- "Wy_test_T = torch.tensor(\n",
- "    Wy_test.values,\n",
- "    dtype=float,\n",
+ "WX_test_T = torch.tensor(\n",
+ "    WX_test.values,\n",
+ "    dtype=torch.float32,\n",
  ").to(DEVICE)\n",
  "\n",
- "Wy_test_T = torch.tensor(\n",
- "    My_test.values,\n",
- "    dtype=float,\n",
+ "Wy_train_T = torch.tensor(\n",
+ "    Wy_train.values,\n",
+ "    dtype=torch.float32,\n",
  ").to(DEVICE)\n",
  "\n",
  "Wy_test_T = torch.tensor(\n",
  "    Wy_test.values,\n",
- "    dtype=float,\n",
+ "    dtype=torch.float32,\n",
  ").to(DEVICE)"
  ]
  },
@@ -168,7 +198,7 @@
  },
  {
  "cell_type": "code",
- "execution_count": 9,
+ "execution_count": 8,
  "metadata": {},
  "outputs": [],
  "source": [
@@ -177,13 +207,13 @@
  "class NiglNN(nn.Module):\n",
  "    def __init__(self):\n",
  "        super().__init__()\n",
- "        self.activation_func = nn.ReLU()\n",
+ "        self.activation_func = nn.Sigmoid()\n",
  "        self.layer1 = nn.Linear(num_features, 64) \n",
  "        self.layer2 = nn.Linear(64, 32)\n",
  "        self.layer3 = nn.Linear(32, 16)\n",
  "        self.layer4 = nn.Linear(16, 8)\n",
  "        self.layer5 = nn.Linear(8, 4)\n",
- "        self.layer5 = nn.Linear(4, 1)\n",
+ "        self.layer6 = nn.Linear(4, 1)\n",
  "\n",
  "    def forward(self, x: torch.Tensor):\n",
  "        x = self.layer1(x)\n",
@@ -195,60 +225,93 @@
  "        x = self.layer4(x)\n",
  "        x = self.activation_func(x)\n",
  "        x = self.layer5(x)\n",
+ "        x = self.activation_func(x)\n",
+ "        x = self.layer6(x)\n",
+ "        x = self.activation_func(x)\n",
  "        return x\n"
  ]
  },
  {
  "cell_type": "code",
- "execution_count": 12,
+ "execution_count": 10,
  "metadata": {},
  "outputs": [
  {
- "ename": "RuntimeError",
- "evalue": "mat1 and mat2 must have the same dtype, but got Double and Float",
- "output_type": "error",
- "traceback": [
- "\u001b[0;31m---------------------------------------------------------------------------\u001b[0m",
- "\u001b[0;31mRuntimeError\u001b[0m Traceback (most recent call last)",
- "Cell \u001b[0;32mIn[12], line 11\u001b[0m\n\u001b[1;32m 5\u001b[0m optimizer \u001b[38;5;241m=\u001b[39m optim\u001b[38;5;241m.\u001b[39mAdam(\n\u001b[1;32m 6\u001b[0m lr\u001b[38;5;241m=\u001b[39m\u001b[38;5;241m0.001\u001b[39m,\n\u001b[1;32m 7\u001b[0m params\u001b[38;5;241m=\u001b[39mnigl1k\u001b[38;5;241m.\u001b[39mparameters(),\n\u001b[1;32m 8\u001b[0m )\n\u001b[1;32m 10\u001b[0m \u001b[38;5;28;01mfor\u001b[39;00m i \u001b[38;5;129;01min\u001b[39;00m \u001b[38;5;28mrange\u001b[39m(epochs):\n\u001b[0;32m---> 11\u001b[0m pred \u001b[38;5;241m=\u001b[39m \u001b[43mnigl1k\u001b[49m\u001b[43m(\u001b[49m\u001b[43mMX_train_T\u001b[49m\u001b[43m)\u001b[49m\n\u001b[1;32m 13\u001b[0m optimizer\u001b[38;5;241m.\u001b[39mzero_grad()\n\u001b[1;32m 15\u001b[0m loss \u001b[38;5;241m=\u001b[39m loss_fn(pred, My_test_T) \n",
- "File \u001b[0;32m/opt/homebrew/lib/python3.11/site-packages/torch/nn/modules/module.py:1518\u001b[0m, in \u001b[0;36mModule._wrapped_call_impl\u001b[0;34m(self, *args, **kwargs)\u001b[0m\n\u001b[1;32m 1516\u001b[0m \u001b[38;5;28;01mreturn\u001b[39;00m \u001b[38;5;28mself\u001b[39m\u001b[38;5;241m.\u001b[39m_compiled_call_impl(\u001b[38;5;241m*\u001b[39margs, \u001b[38;5;241m*\u001b[39m\u001b[38;5;241m*\u001b[39mkwargs) \u001b[38;5;66;03m# type: ignore[misc]\u001b[39;00m\n\u001b[1;32m 1517\u001b[0m \u001b[38;5;28;01melse\u001b[39;00m:\n\u001b[0;32m-> 1518\u001b[0m \u001b[38;5;28;01mreturn\u001b[39;00m \u001b[38;5;28;43mself\u001b[39;49m\u001b[38;5;241;43m.\u001b[39;49m\u001b[43m_call_impl\u001b[49m\u001b[43m(\u001b[49m\u001b[38;5;241;43m*\u001b[39;49m\u001b[43margs\u001b[49m\u001b[43m,\u001b[49m\u001b[43m \u001b[49m\u001b[38;5;241;43m*\u001b[39;49m\u001b[38;5;241;43m*\u001b[39;49m\u001b[43mkwargs\u001b[49m\u001b[43m)\u001b[49m\n",
- "File \u001b[0;32m/opt/homebrew/lib/python3.11/site-packages/torch/nn/modules/module.py:1527\u001b[0m, in \u001b[0;36mModule._call_impl\u001b[0;34m(self, *args, **kwargs)\u001b[0m\n\u001b[1;32m 1522\u001b[0m \u001b[38;5;66;03m# If we don't have any hooks, we want to skip the rest of the logic in\u001b[39;00m\n\u001b[1;32m 1523\u001b[0m \u001b[38;5;66;03m# this function, and just call forward.\u001b[39;00m\n\u001b[1;32m 1524\u001b[0m \u001b[38;5;28;01mif\u001b[39;00m \u001b[38;5;129;01mnot\u001b[39;00m (\u001b[38;5;28mself\u001b[39m\u001b[38;5;241m.\u001b[39m_backward_hooks \u001b[38;5;129;01mor\u001b[39;00m \u001b[38;5;28mself\u001b[39m\u001b[38;5;241m.\u001b[39m_backward_pre_hooks \u001b[38;5;129;01mor\u001b[39;00m \u001b[38;5;28mself\u001b[39m\u001b[38;5;241m.\u001b[39m_forward_hooks \u001b[38;5;129;01mor\u001b[39;00m \u001b[38;5;28mself\u001b[39m\u001b[38;5;241m.\u001b[39m_forward_pre_hooks\n\u001b[1;32m 1525\u001b[0m \u001b[38;5;129;01mor\u001b[39;00m _global_backward_pre_hooks \u001b[38;5;129;01mor\u001b[39;00m _global_backward_hooks\n\u001b[1;32m 1526\u001b[0m \u001b[38;5;129;01mor\u001b[39;00m _global_forward_hooks \u001b[38;5;129;01mor\u001b[39;00m _global_forward_pre_hooks):\n\u001b[0;32m-> 1527\u001b[0m \u001b[38;5;28;01mreturn\u001b[39;00m \u001b[43mforward_call\u001b[49m\u001b[43m(\u001b[49m\u001b[38;5;241;43m*\u001b[39;49m\u001b[43margs\u001b[49m\u001b[43m,\u001b[49m\u001b[43m \u001b[49m\u001b[38;5;241;43m*\u001b[39;49m\u001b[38;5;241;43m*\u001b[39;49m\u001b[43mkwargs\u001b[49m\u001b[43m)\u001b[49m\n\u001b[1;32m 1529\u001b[0m \u001b[38;5;28;01mtry\u001b[39;00m:\n\u001b[1;32m 1530\u001b[0m result \u001b[38;5;241m=\u001b[39m \u001b[38;5;28;01mNone\u001b[39;00m\n",
- "Cell \u001b[0;32mIn[9], line 15\u001b[0m, in \u001b[0;36mNiglNN.forward\u001b[0;34m(self, x)\u001b[0m\n\u001b[1;32m 14\u001b[0m \u001b[38;5;28;01mdef\u001b[39;00m \u001b[38;5;21mforward\u001b[39m(\u001b[38;5;28mself\u001b[39m, x: torch\u001b[38;5;241m.\u001b[39mTensor):\n\u001b[0;32m---> 15\u001b[0m x \u001b[38;5;241m=\u001b[39m \u001b[38;5;28;43mself\u001b[39;49m\u001b[38;5;241;43m.\u001b[39;49m\u001b[43mlayer1\u001b[49m\u001b[43m(\u001b[49m\u001b[43mx\u001b[49m\u001b[43m)\u001b[49m\n\u001b[1;32m 16\u001b[0m x \u001b[38;5;241m=\u001b[39m \u001b[38;5;28mself\u001b[39m\u001b[38;5;241m.\u001b[39mactivation_func(x)\n\u001b[1;32m 17\u001b[0m x \u001b[38;5;241m=\u001b[39m \u001b[38;5;28mself\u001b[39m\u001b[38;5;241m.\u001b[39mlayer2(x)\n",
- "File \u001b[0;32m/opt/homebrew/lib/python3.11/site-packages/torch/nn/modules/module.py:1518\u001b[0m, in \u001b[0;36mModule._wrapped_call_impl\u001b[0;34m(self, *args, **kwargs)\u001b[0m\n\u001b[1;32m 1516\u001b[0m \u001b[38;5;28;01mreturn\u001b[39;00m \u001b[38;5;28mself\u001b[39m\u001b[38;5;241m.\u001b[39m_compiled_call_impl(\u001b[38;5;241m*\u001b[39margs, \u001b[38;5;241m*\u001b[39m\u001b[38;5;241m*\u001b[39mkwargs) \u001b[38;5;66;03m# type: ignore[misc]\u001b[39;00m\n\u001b[1;32m 1517\u001b[0m \u001b[38;5;28;01melse\u001b[39;00m:\n\u001b[0;32m-> 1518\u001b[0m \u001b[38;5;28;01mreturn\u001b[39;00m \u001b[38;5;28;43mself\u001b[39;49m\u001b[38;5;241;43m.\u001b[39;49m\u001b[43m_call_impl\u001b[49m\u001b[43m(\u001b[49m\u001b[38;5;241;43m*\u001b[39;49m\u001b[43margs\u001b[49m\u001b[43m,\u001b[49m\u001b[43m \u001b[49m\u001b[38;5;241;43m*\u001b[39;49m\u001b[38;5;241;43m*\u001b[39;49m\u001b[43mkwargs\u001b[49m\u001b[43m)\u001b[49m\n",
- "File \u001b[0;32m/opt/homebrew/lib/python3.11/site-packages/torch/nn/modules/module.py:1527\u001b[0m, in \u001b[0;36mModule._call_impl\u001b[0;34m(self, *args, **kwargs)\u001b[0m\n\u001b[1;32m 1522\u001b[0m \u001b[38;5;66;03m# If we don't have any hooks, we want to skip the rest of the logic in\u001b[39;00m\n\u001b[1;32m 1523\u001b[0m \u001b[38;5;66;03m# this function, and just call forward.\u001b[39;00m\n\u001b[1;32m 1524\u001b[0m \u001b[38;5;28;01mif\u001b[39;00m \u001b[38;5;129;01mnot\u001b[39;00m (\u001b[38;5;28mself\u001b[39m\u001b[38;5;241m.\u001b[39m_backward_hooks \u001b[38;5;129;01mor\u001b[39;00m \u001b[38;5;28mself\u001b[39m\u001b[38;5;241m.\u001b[39m_backward_pre_hooks \u001b[38;5;129;01mor\u001b[39;00m \u001b[38;5;28mself\u001b[39m\u001b[38;5;241m.\u001b[39m_forward_hooks \u001b[38;5;129;01mor\u001b[39;00m \u001b[38;5;28mself\u001b[39m\u001b[38;5;241m.\u001b[39m_forward_pre_hooks\n\u001b[1;32m 1525\u001b[0m \u001b[38;5;129;01mor\u001b[39;00m _global_backward_pre_hooks \u001b[38;5;129;01mor\u001b[39;00m _global_backward_hooks\n\u001b[1;32m 1526\u001b[0m \u001b[38;5;129;01mor\u001b[39;00m _global_forward_hooks \u001b[38;5;129;01mor\u001b[39;00m _global_forward_pre_hooks):\n\u001b[0;32m-> 1527\u001b[0m \u001b[38;5;28;01mreturn\u001b[39;00m \u001b[43mforward_call\u001b[49m\u001b[43m(\u001b[49m\u001b[38;5;241;43m*\u001b[39;49m\u001b[43margs\u001b[49m\u001b[43m,\u001b[49m\u001b[43m \u001b[49m\u001b[38;5;241;43m*\u001b[39;49m\u001b[38;5;241;43m*\u001b[39;49m\u001b[43mkwargs\u001b[49m\u001b[43m)\u001b[49m\n\u001b[1;32m 1529\u001b[0m \u001b[38;5;28;01mtry\u001b[39;00m:\n\u001b[1;32m 1530\u001b[0m result \u001b[38;5;241m=\u001b[39m \u001b[38;5;28;01mNone\u001b[39;00m\n",
- "File \u001b[0;32m/opt/homebrew/lib/python3.11/site-packages/torch/nn/modules/linear.py:114\u001b[0m, in \u001b[0;36mLinear.forward\u001b[0;34m(self, input)\u001b[0m\n\u001b[1;32m 113\u001b[0m \u001b[38;5;28;01mdef\u001b[39;00m \u001b[38;5;21mforward\u001b[39m(\u001b[38;5;28mself\u001b[39m, \u001b[38;5;28minput\u001b[39m: Tensor) \u001b[38;5;241m-\u001b[39m\u001b[38;5;241m>\u001b[39m Tensor:\n\u001b[0;32m--> 114\u001b[0m \u001b[38;5;28;01mreturn\u001b[39;00m \u001b[43mF\u001b[49m\u001b[38;5;241;43m.\u001b[39;49m\u001b[43mlinear\u001b[49m\u001b[43m(\u001b[49m\u001b[38;5;28;43minput\u001b[39;49m\u001b[43m,\u001b[49m\u001b[43m \u001b[49m\u001b[38;5;28;43mself\u001b[39;49m\u001b[38;5;241;43m.\u001b[39;49m\u001b[43mweight\u001b[49m\u001b[43m,\u001b[49m\u001b[43m \u001b[49m\u001b[38;5;28;43mself\u001b[39;49m\u001b[38;5;241;43m.\u001b[39;49m\u001b[43mbias\u001b[49m\u001b[43m)\u001b[49m\n",
- "\u001b[0;31mRuntimeError\u001b[0m: mat1 and mat2 must have the same dtype, but got Double and Float"
+ "name": "stdout",
+ "output_type": "stream",
+ "text": [
+ "[1000 / 10000] Binary Cross Entropy: 0.6770758628845215\n",
+ "[2000 / 10000] Binary Cross Entropy: 0.6671037077903748\n",
+ "[3000 / 10000] Binary Cross Entropy: 0.6648934483528137\n",
+ "[4000 / 10000] Binary Cross Entropy: 0.6640341281890869\n",
+ "[5000 / 10000] Binary Cross Entropy: 0.663619875907898\n",
+ "[6000 / 10000] Binary Cross Entropy: 0.6633755564689636\n",
+ "[7000 / 10000] Binary Cross Entropy: 0.6631807088851929\n",
+ "[8000 / 10000] Binary Cross Entropy: 0.663043200969696\n",
+ "[9000 / 10000] Binary Cross Entropy: 0.6629269123077393\n",
+ "[10000 / 10000] Binary Cross Entropy: 0.6629060506820679\n"
  ]
  }
  ],
  "source": [
  "# mens training loop\n",
- "epochs = 1_000\n",
- "nigl1k = NiglNN()\n",
- "loss_fn = nn.MSELoss()\n",
+ "torch.manual_seed(2)\n",
+ "\n",
+ "epochs = 10_000\n",
+ "nigl10k = NiglNN().to(DEVICE)\n",
+ "loss_fn = nn.BCEWithLogitsLoss()\n",
  "optimizer = optim.Adam(\n",
  "    lr=0.001,\n",
- "    params=nigl1k.parameters(),\n",
+ "    params=nigl10k.parameters(),\n",
  ")\n",
  "\n",
- "for i in range(epochs):\n",
- "    pred = nigl1k(MX_train_T)\n",
+ "for epoch in range(1, epochs + 1):\n",
  "    optimizer.zero_grad()\n",
- "\n",
- "    loss = loss_fn(pred, My_test_T) \n",
+ "    pred = nigl10k(MX_train_T)\n",
+ "    loss = loss_fn(pred, My_train_T) \n",
  "    loss.backward()\n",
- "\n",
  "    optimizer.step()\n",
- "    if i % epochs == 0:\n",
- "        print(f\"[{i} / {epochs}] loss = {loss.item()}\")\n"
+ "\n",
+ "    if epoch % 1_000 == 0:\n",
+ "        print(f\"[{epoch} / {epochs}] Binary Cross Entropy: {loss.item()}\")\n"
  ]
  },
  {
  "cell_type": "code",
- "execution_count": null,
+ "execution_count": 11,
+ "metadata": {},
+ "outputs": [
+ {
+ "name": "stdout",
+ "output_type": "stream",
+ "text": [
+ "Binary Cross Entropy: 0.6655928492546082\n"
+ ]
+ }
+ ],
+ "source": [
+ "nigl10k.eval()\n",
+ "\n",
+ "with torch.no_grad():\n",
+ "    pred = nigl10k(MX_test_T)\n",
+ "    loss = loss_fn(pred, My_test_T)\n",
+ "    print(f\"Binary Cross Entropy: {loss.item()}\")"
+ ]
+ },
+ {
+ "cell_type": "code",
+ "execution_count": 12,
  "metadata": {},
  "outputs": [],
- "source": []
+ "source": [
+ "# save model\n",
+ "MODEL_DIR = os.path.join(\"..\", \"models\")\n",
+ "\n",
+ "torch.save(\n",
+ "    nigl10k,\n",
+ "    os.path.join(MODEL_DIR, \"nn10k.pth\"),\n",
+ ")"
+ ]
  }
  ],
  "metadata": {