{ "cells": [ { "cell_type": "code", "execution_count": 362, "metadata": { "id": "Vvcj31qpfCwY" }, "outputs": [], "source": [ "import pandas as pd\n", "import numpy as np\n", "from sklearn.model_selection import train_test_split\n", "from sklearn.naive_bayes import GaussianNB, MultinomialNB, BernoulliNB\n", "from sklearn.metrics import classification_report, confusion_matrix\n", "import seaborn as sns\n", "import matplotlib.pyplot as plt\n", "import pickle " ] }, { "cell_type": "code", "execution_count": 363, "metadata": { "id": "frLJTPPefM7G" }, "outputs": [], "source": [ "# Load the dataset\n", "data = pd.read_csv('indeed.csv')" ] }, { "cell_type": "code", "execution_count": 364, "metadata": {}, "outputs": [], "source": [ "# from sklearn.preprocessing import MinMaxScaler\n", "# import pandas as pd\n", "\n", "# # Create a MinMaxScaler object\n", "# scaler = MinMaxScaler()\n", "\n", "# # Apply the scaler to the 'New Salary' column\n", "# data['New Salary'] = scaler.fit_transform(data['New Salary'].values.reshape(-1, 1))\n", "\n", "# # Print the normalized data\n", "# print(data)" ] }, { "cell_type": "code", "execution_count": 365, "metadata": { "id": "-9bDf-NOfOLo" }, "outputs": [], "source": [ "# seperate features and label\n", "X = data[[\"New Salary\",\"Experience\"]]\n", "y = data[\"Job_Pos\"]" ] }, { "cell_type": "code", "execution_count": 366, "metadata": { "id": "83HqtwnBfP0F" }, "outputs": [], "source": [ "X_train, X_test,y_train,y_test = train_test_split(x,y, test_size=0.3, random_state=42)" ] }, { "cell_type": "code", "execution_count": 367, "metadata": {}, "outputs": [], "source": [ "# for bernoulli\n", "a_train = X_train\n", "a_test = X_test\n", "b_train = y_train.astype(int)\n", "b_test = y_test.astype(int)" ] }, { "cell_type": "code", "execution_count": 368, "metadata": {}, "outputs": [], "source": [ "class_prob = [0.25,0.25,0.25,0.25]" ] }, { "attachments": {}, "cell_type": "markdown", "metadata": { "id": "lnd1249Ig9ov" }, "source": [ "# **MultinomialNB**" ] }, { "cell_type": "code", "execution_count": 369, "metadata": {}, "outputs": [ { "data": { "text/html": [ "
MultinomialNB(alpha=10.0, class_prior=[0.25, 0.25, 0.25, 0.25], fit_prior=False)In a Jupyter environment, please rerun this cell to show the HTML representation or trust the notebook.
MultinomialNB(alpha=10.0, class_prior=[0.25, 0.25, 0.25, 0.25], fit_prior=False)