{ "cells": [ { "cell_type": "code", "execution_count": 1, "id": "048bb88a-9e50-4f77-af52-cc0ca8d43079", "metadata": {}, "outputs": [], "source": [ "import pandas as pd\n", "import numpy as np\n" ] }, { "cell_type": "code", "execution_count": 2, "id": "c798af35-9b68-4648-8c39-b48b02c9e206", "metadata": {}, "outputs": [ { "data": { "text/html": [ "
\n", "\n", "\n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", "
namecompanyyearPricekms_drivenfuel_type
0Hyundai Santro Xing XO eRLX Euro IIIHyundai200780,00045,000 kmsPetrol
1Mahindra Jeep CL550 MDIMahindra20064,25,00040 kmsDiesel
2Maruti Suzuki Alto 800 VxiMaruti2018Ask For Price22,000 kmsPetrol
3Hyundai Grand i10 Magna 1.2 Kappa VTVTHyundai20143,25,00028,000 kmsPetrol
4Ford EcoSport Titanium 1.5L TDCiFord20145,75,00036,000 kmsDiesel
\n", "
" ], "text/plain": [ " name company year Price \\\n", "0 Hyundai Santro Xing XO eRLX Euro III Hyundai 2007 80,000 \n", "1 Mahindra Jeep CL550 MDI Mahindra 2006 4,25,000 \n", "2 Maruti Suzuki Alto 800 Vxi Maruti 2018 Ask For Price \n", "3 Hyundai Grand i10 Magna 1.2 Kappa VTVT Hyundai 2014 3,25,000 \n", "4 Ford EcoSport Titanium 1.5L TDCi Ford 2014 5,75,000 \n", "\n", " kms_driven fuel_type \n", "0 45,000 kms Petrol \n", "1 40 kms Diesel \n", "2 22,000 kms Petrol \n", "3 28,000 kms Petrol \n", "4 36,000 kms Diesel " ] }, "execution_count": 2, "metadata": {}, "output_type": "execute_result" } ], "source": [ "car=pd.read_csv(\"quikr_car.csv\")\n", "car.head()" ] }, { "cell_type": "code", "execution_count": 3, "id": "ef324a73-1679-4c63-9a13-13e605592bb7", "metadata": {}, "outputs": [ { "data": { "text/plain": [ "(892, 6)" ] }, "execution_count": 3, "metadata": {}, "output_type": "execute_result" } ], "source": [ "car.shape" ] }, { "cell_type": "code", "execution_count": 4, "id": "87591cbb-33dc-45d5-99d8-c5985ed58a00", "metadata": {}, "outputs": [ { "name": "stdout", "output_type": "stream", "text": [ "\n", "RangeIndex: 892 entries, 0 to 891\n", "Data columns (total 6 columns):\n", " # Column Non-Null Count Dtype \n", "--- ------ -------------- ----- \n", " 0 name 892 non-null object\n", " 1 company 892 non-null object\n", " 2 year 892 non-null object\n", " 3 Price 892 non-null object\n", " 4 kms_driven 840 non-null object\n", " 5 fuel_type 837 non-null object\n", "dtypes: object(6)\n", "memory usage: 41.9+ KB\n" ] } ], "source": [ "car.info()" ] }, { "cell_type": "code", "execution_count": 5, "id": "bab6df5c-0d21-4fab-93c6-6979baaa0259", "metadata": {}, "outputs": [ { "data": { "text/plain": [ "array(['2007', '2006', '2018', '2014', '2015', '2012', '2013', '2016',\n", " '2010', '2017', '2008', '2011', '2019', '2009', '2005', '2000',\n", " '...', '150k', 'TOUR', '2003', 'r 15', '2004', 'Zest', '/-Rs',\n", " 'sale', '1995', 'ara)', '2002', 'SELL', '2001', 'tion', 
'odel',\n", " '2 bs', 'arry', 'Eon', 'o...', 'ture', 'emi', 'car', 'able', 'no.',\n", " 'd...', 'SALE', 'digo', 'sell', 'd Ex', 'n...', 'e...', 'D...',\n", " ', Ac', 'go .', 'k...', 'o c4', 'zire', 'cent', 'Sumo', 'cab',\n", " 't xe', 'EV2', 'r...', 'zest'], dtype=object)" ] }, "execution_count": 5, "metadata": {}, "output_type": "execute_result" } ], "source": [ "car['year'].unique()" ] }, { "cell_type": "code", "execution_count": 6, "id": "51a2307c-85d9-409d-a6db-136e70eacbe4", "metadata": {}, "outputs": [ { "data": { "text/plain": [ "array(['80,000', '4,25,000', 'Ask For Price', '3,25,000', '5,75,000',\n", " '1,75,000', '1,90,000', '8,30,000', '2,50,000', '1,82,000',\n", " '3,15,000', '4,15,000', '3,20,000', '10,00,000', '5,00,000',\n", " '3,50,000', '1,60,000', '3,10,000', '75,000', '1,00,000',\n", " '2,90,000', '95,000', '1,80,000', '3,85,000', '1,05,000',\n", " '6,50,000', '6,89,999', '4,48,000', '5,49,000', '5,01,000',\n", " '4,89,999', '2,80,000', '3,49,999', '2,84,999', '3,45,000',\n", " '4,99,999', '2,35,000', '2,49,999', '14,75,000', '3,95,000',\n", " '2,20,000', '1,70,000', '85,000', '2,00,000', '5,70,000',\n", " '1,10,000', '4,48,999', '18,91,111', '1,59,500', '3,44,999',\n", " '4,49,999', '8,65,000', '6,99,000', '3,75,000', '2,24,999',\n", " '12,00,000', '1,95,000', '3,51,000', '2,40,000', '90,000',\n", " '1,55,000', '6,00,000', '1,89,500', '2,10,000', '3,90,000',\n", " '1,35,000', '16,00,000', '7,01,000', '2,65,000', '5,25,000',\n", " '3,72,000', '6,35,000', '5,50,000', '4,85,000', '3,29,500',\n", " '2,51,111', '5,69,999', '69,999', '2,99,999', '3,99,999',\n", " '4,50,000', '2,70,000', '1,58,400', '1,79,000', '1,25,000',\n", " '2,99,000', '1,50,000', '2,75,000', '2,85,000', '3,40,000',\n", " '70,000', '2,89,999', '8,49,999', '7,49,999', '2,74,999',\n", " '9,84,999', '5,99,999', '2,44,999', '4,74,999', '2,45,000',\n", " '1,69,500', '3,70,000', '1,68,000', '1,45,000', '98,500',\n", " '2,09,000', '1,85,000', '9,00,000', '6,99,999', '1,99,999',\n", " 
'5,44,999', '1,99,000', '5,40,000', '49,000', '7,00,000', '55,000',\n", " '8,95,000', '3,55,000', '5,65,000', '3,65,000', '40,000',\n", " '4,00,000', '3,30,000', '5,80,000', '3,79,000', '2,19,000',\n", " '5,19,000', '7,30,000', '20,00,000', '21,00,000', '14,00,000',\n", " '3,11,000', '8,55,000', '5,35,000', '1,78,000', '3,00,000',\n", " '2,55,000', '5,49,999', '3,80,000', '57,000', '4,10,000',\n", " '2,25,000', '1,20,000', '59,000', '5,99,000', '6,75,000', '72,500',\n", " '6,10,000', '2,30,000', '5,20,000', '5,24,999', '4,24,999',\n", " '6,44,999', '5,84,999', '7,99,999', '4,44,999', '6,49,999',\n", " '9,44,999', '5,74,999', '3,74,999', '1,30,000', '4,01,000',\n", " '13,50,000', '1,74,999', '2,39,999', '99,999', '3,24,999',\n", " '10,74,999', '11,30,000', '1,49,000', '7,70,000', '30,000',\n", " '3,35,000', '3,99,000', '65,000', '1,69,999', '1,65,000',\n", " '5,60,000', '9,50,000', '7,15,000', '45,000', '9,40,000',\n", " '1,55,555', '15,00,000', '4,95,000', '8,00,000', '12,99,000',\n", " '5,30,000', '14,99,000', '32,000', '4,05,000', '7,60,000',\n", " '7,50,000', '4,19,000', '1,40,000', '15,40,000', '1,23,000',\n", " '4,98,000', '4,80,000', '4,88,000', '15,25,000', '5,48,900',\n", " '7,25,000', '99,000', '52,000', '28,00,000', '4,99,000',\n", " '3,81,000', '2,78,000', '6,90,000', '2,60,000', '90,001',\n", " '1,15,000', '15,99,000', '1,59,000', '51,999', '2,15,000',\n", " '35,000', '11,50,000', '2,69,000', '60,000', '4,30,000',\n", " '85,00,003', '4,01,919', '4,90,000', '4,24,000', '2,05,000',\n", " '5,49,900', '3,71,500', '4,35,000', '1,89,700', '3,89,700',\n", " '3,60,000', '2,95,000', '1,14,990', '10,65,000', '4,70,000',\n", " '48,000', '1,88,000', '4,65,000', '1,79,999', '21,90,000',\n", " '23,90,000', '10,75,000', '4,75,000', '10,25,000', '6,15,000',\n", " '19,00,000', '14,90,000', '15,10,000', '18,50,000', '7,90,000',\n", " '17,25,000', '12,25,000', '68,000', '9,70,000', '31,00,000',\n", " '8,99,000', '88,000', '53,000', '5,68,500', '71,000', '5,90,000',\n", " 
'7,95,000', '42,000', '1,89,000', '1,62,000', '35,999',\n", " '29,00,000', '39,999', '50,500', '5,10,000', '8,60,000',\n", " '5,00,001'], dtype=object)" ] }, "execution_count": 6, "metadata": {}, "output_type": "execute_result" } ], "source": [ "car['Price'].unique()" ] }, { "cell_type": "code", "execution_count": 7, "id": "11c4a15e-82e8-4fd8-a1f1-e2068a5f62e8", "metadata": {}, "outputs": [ { "data": { "text/plain": [ "array(['45,000 kms', '40 kms', '22,000 kms', '28,000 kms', '36,000 kms',\n", " '59,000 kms', '41,000 kms', '25,000 kms', '24,530 kms',\n", " '60,000 kms', '30,000 kms', '32,000 kms', '48,660 kms',\n", " '4,000 kms', '16,934 kms', '43,000 kms', '35,550 kms',\n", " '39,522 kms', '39,000 kms', '55,000 kms', '72,000 kms',\n", " '15,975 kms', '70,000 kms', '23,452 kms', '35,522 kms',\n", " '48,508 kms', '15,487 kms', '82,000 kms', '20,000 kms',\n", " '68,000 kms', '38,000 kms', '27,000 kms', '33,000 kms',\n", " '46,000 kms', '16,000 kms', '47,000 kms', '35,000 kms',\n", " '30,874 kms', '15,000 kms', '29,685 kms', '1,30,000 kms',\n", " '19,000 kms', nan, '54,000 kms', '13,000 kms', '38,200 kms',\n", " '50,000 kms', '13,500 kms', '3,600 kms', '45,863 kms',\n", " '60,500 kms', '12,500 kms', '18,000 kms', '13,349 kms',\n", " '29,000 kms', '44,000 kms', '42,000 kms', '14,000 kms',\n", " '49,000 kms', '36,200 kms', '51,000 kms', '1,04,000 kms',\n", " '33,333 kms', '33,600 kms', '5,600 kms', '7,500 kms', '26,000 kms',\n", " '24,330 kms', '65,480 kms', '28,028 kms', '2,00,000 kms',\n", " '99,000 kms', '2,800 kms', '21,000 kms', '11,000 kms',\n", " '66,000 kms', '3,000 kms', '7,000 kms', '38,500 kms', '37,200 kms',\n", " '43,200 kms', '24,800 kms', '45,872 kms', '40,000 kms',\n", " '11,400 kms', '97,200 kms', '52,000 kms', '31,000 kms',\n", " '1,75,430 kms', '37,000 kms', '65,000 kms', '3,350 kms',\n", " '75,000 kms', '62,000 kms', '73,000 kms', '2,200 kms',\n", " '54,870 kms', '34,580 kms', '97,000 kms', '60 kms', '80,200 kms',\n", " '3,200 kms', '0,000 kms', 
'5,000 kms', '588 kms', '71,200 kms',\n", " '1,75,400 kms', '9,300 kms', '56,758 kms', '10,000 kms',\n", " '56,450 kms', '56,000 kms', '32,700 kms', '9,000 kms', '73 kms',\n", " '1,60,000 kms', '84,000 kms', '58,559 kms', '57,000 kms',\n", " '1,70,000 kms', '80,000 kms', '6,821 kms', '23,000 kms',\n", " '34,000 kms', '1,800 kms', '4,00,000 kms', '48,000 kms',\n", " '90,000 kms', '12,000 kms', '69,900 kms', '1,66,000 kms',\n", " '122 kms', '0 kms', '24,000 kms', '36,469 kms', '7,800 kms',\n", " '24,695 kms', '15,141 kms', '59,910 kms', '1,00,000 kms',\n", " '4,500 kms', '1,29,000 kms', '300 kms', '1,31,000 kms',\n", " '1,11,111 kms', '59,466 kms', '25,500 kms', '44,005 kms',\n", " '2,110 kms', '43,222 kms', '1,00,200 kms', '65 kms',\n", " '1,40,000 kms', '1,03,553 kms', '58,000 kms', '1,20,000 kms',\n", " '49,800 kms', '100 kms', '81,876 kms', '6,020 kms', '55,700 kms',\n", " '18,500 kms', '1,80,000 kms', '53,000 kms', '35,500 kms',\n", " '22,134 kms', '1,000 kms', '8,500 kms', '87,000 kms', '6,000 kms',\n", " '15,574 kms', '8,000 kms', '55,800 kms', '56,400 kms',\n", " '72,160 kms', '11,500 kms', '1,33,000 kms', '2,000 kms',\n", " '88,000 kms', '65,422 kms', '1,17,000 kms', '1,50,000 kms',\n", " '10,750 kms', '6,800 kms', '5 kms', '9,800 kms', '57,923 kms',\n", " '30,201 kms', '6,200 kms', '37,518 kms', '24,652 kms', '383 kms',\n", " '95,000 kms', '3,528 kms', '52,500 kms', '47,900 kms',\n", " '52,800 kms', '1,95,000 kms', '48,008 kms', '48,247 kms',\n", " '9,400 kms', '64,000 kms', '2,137 kms', '10,544 kms', '49,500 kms',\n", " '1,47,000 kms', '90,001 kms', '48,006 kms', '74,000 kms',\n", " '85,000 kms', '29,500 kms', '39,700 kms', '67,000 kms',\n", " '19,336 kms', '60,105 kms', '45,933 kms', '1,02,563 kms',\n", " '28,600 kms', '41,800 kms', '1,16,000 kms', '42,590 kms',\n", " '7,400 kms', '54,500 kms', '76,000 kms', '00 kms', '11,523 kms',\n", " '38,600 kms', '95,500 kms', '37,458 kms', '85,960 kms',\n", " '12,516 kms', '30,600 kms', '2,550 kms', '62,500 
kms',\n", " '69,000 kms', '28,400 kms', '68,485 kms', '3,500 kms',\n", " '85,455 kms', '63,000 kms', '1,600 kms', '77,000 kms',\n", " '26,500 kms', '2,875 kms', '13,900 kms', '1,500 kms', '2,450 kms',\n", " '1,625 kms', '33,400 kms', '60,123 kms', '38,900 kms',\n", " '1,37,495 kms', '91,200 kms', '1,46,000 kms', '1,00,800 kms',\n", " '2,100 kms', '2,500 kms', '1,32,000 kms', 'Petrol'], dtype=object)" ] }, "execution_count": 7, "metadata": {}, "output_type": "execute_result" } ], "source": [ "car['kms_driven'].unique()" ] }, { "cell_type": "code", "execution_count": 8, "id": "0e7f715a-351b-4256-bf5d-cd7863a3ce47", "metadata": {}, "outputs": [ { "data": { "text/plain": [ "array(['Petrol', 'Diesel', nan, 'LPG'], dtype=object)" ] }, "execution_count": 8, "metadata": {}, "output_type": "execute_result" } ], "source": [ "car['fuel_type'].unique()" ] }, { "cell_type": "code", "execution_count": 9, "id": "5649ebaa-41af-48d8-a12a-c150d66b86dd", "metadata": {}, "outputs": [ { "data": { "text/plain": [ "array(['Hyundai Santro Xing XO eRLX Euro III', 'Mahindra Jeep CL550 MDI',\n", " 'Maruti Suzuki Alto 800 Vxi',\n", " 'Hyundai Grand i10 Magna 1.2 Kappa VTVT',\n", " 'Ford EcoSport Titanium 1.5L TDCi', 'Ford Figo', 'Hyundai Eon',\n", " 'Ford EcoSport Ambiente 1.5L TDCi',\n", " 'Maruti Suzuki Alto K10 VXi AMT', 'Skoda Fabia Classic 1.2 MPI',\n", " 'Maruti Suzuki Stingray VXi', 'Hyundai Elite i20 Magna 1.2',\n", " 'Mahindra Scorpio SLE BS IV', 'Audi A8', 'Audi Q7',\n", " 'Mahindra Scorpio S10', 'Maruti Suzuki Alto 800',\n", " 'Hyundai i20 Sportz 1.2', 'Maruti Suzuki Alto 800 Lx',\n", " 'Maruti Suzuki Vitara Brezza ZDi', 'Maruti Suzuki Alto LX',\n", " 'Mahindra Bolero DI', 'Maruti Suzuki Swift Dzire ZDi',\n", " 'Mahindra Scorpio S10 4WD', 'Maruti Suzuki Swift Vdi BSIII',\n", " 'Maruti Suzuki Wagon R VXi BS III',\n", " 'Maruti Suzuki Wagon R VXi Minor',\n", " 'Toyota Innova 2.0 G 8 STR BS IV', 'Renault Lodgy 85 PS RXL',\n", " 'Skoda Yeti Ambition 2.0 TDI CR 4x2',\n", " 'Maruti 
Suzuki Baleno Delta 1.2',\n", " 'Renault Duster 110 PS RxZ Diesel Plus',\n", " 'Renault Duster 85 PS RxE Diesel', 'Honda City 1.5 S MT',\n", " 'Maruti Suzuki Dzire', 'Honda Amaze', 'Honda Amaze 1.5 SX i DTEC',\n", " 'Honda City', 'Datsun Redi GO S', 'Maruti Suzuki SX4 ZXI MT',\n", " 'Mitsubishi Pajero Sport Limited Edition',\n", " 'Maruti Suzuki Swift VXi 1.2 ABS BS IV', 'Honda City ZX CVT',\n", " 'Maruti Suzuki Wagon R LX BS IV', 'Tata Indigo eCS LS CR4 BS IV',\n", " 'Volkswagen Polo Highline Exquisite P',\n", " 'I want to sell my car Tata Zest', 'Chevrolet Spark LS 1.0',\n", " 'Renault Duster 110PS Diesel RxZ', 'Mini Cooper S 1.6',\n", " 'Skoda Fabia 1.2L Diesel Ambiente', 'Renault Duster',\n", " 'Mahindra Scorpio S4', 'Mahindra Scorpio VLX 2WD BS IV',\n", " 'Mahindra Quanto C8', 'Ford EcoSport', 'Honda Brio',\n", " 'Volkswagen Vento Highline Plus 1.5 Diesel AT',\n", " 'Hyundai i20 Magna', 'Toyota Corolla Altis Diesel D4DG',\n", " 'Hyundai Verna Transform SX VTVT',\n", " 'Toyota Corolla Altis Petrol Ltd', 'Honda City 1.5 EXi New',\n", " 'Skoda Fabia 1.2L Diesel Elegance', 'BMW 3 Series 320i',\n", " 'Maruti Suzuki A Star Lxi', 'Toyota Etios GD',\n", " 'Ford Figo Diesel EXI Option',\n", " 'Maruti Suzuki Swift Dzire VXi 1.2 BS IV',\n", " 'Chevrolet Beat LT Diesel', 'BMW 7 Series 740Li Sedan',\n", " 'Mahindra XUV500 W8 AWD 2013', 'Hyundai i10 Magna 1.2',\n", " 'Hyundai Verna Fluidic New', 'Maruti Suzuki Swift VXi 1.2 BS IV',\n", " 'Maruti Suzuki Ertiga ZXI Plus', 'Maruti Suzuki Ertiga Vxi',\n", " 'Maruti Suzuki Ertiga VDi', 'Maruti Suzuki Alto LXi BS III',\n", " 'Hyundai Grand i10 Asta 1.1 CRDi', 'Honda Amaze 1.2 S i VTEC',\n", " 'Hyundai i20 Asta 1.4 CRDI 6 Speed', 'Ford Figo Diesel EXI',\n", " 'Maruti Suzuki Eeco 5 STR WITH AC HTR', 'Maruti Suzuki Ertiga ZXi',\n", " 'Maruti Suzuki Esteem LXi BS III', 'Maruti Suzuki Ritz VXI',\n", " 'Maruti Suzuki Ritz LDi', 'Maruti Suzuki Dzire VDI',\n", " 'Toyota Etios Liva G', 'Hyundai i20 Sportz 1.4 CRDI',\n", " 'Chevrolet 
Spark', 'Nissan Micra XV', 'Maruti Suzuki Swift',\n", " 'Honda Amaze 1.5 S i DTEC', 'Chevrolet Beat', 'Toyota Corolla',\n", " 'Honda City 1.5 V MT', 'Ford EcoSport Trend 1.5L TDCi',\n", " 'Hyundai i20 Asta 1.2', 'Tata Indica V2 eLS',\n", " 'Maruti Suzuki Alto 800 Lxi', 'Hindustan Motors Ambassador',\n", " 'Toyota Corolla Altis 1.8 GL', 'Toyota Corolla Altis 1.8 J',\n", " 'Toyota Innova 2.5 GX BS IV 7 STR',\n", " 'Volkswagen Jetta Highline TDI AT',\n", " 'Volkswagen Polo Comfortline 1.2L P', 'Volkswagen Polo',\n", " 'Mahindra Scorpio', 'Nissan Sunny', 'Hyundai Elite i20',\n", " 'Renault Kwid', 'Mahindra Scorpio VLX Airbag',\n", " 'Chevrolet Spark LT 1.0', 'Datsun Redi GO T O',\n", " 'Maruti Suzuki Swift RS VDI', 'Fiat Punto Emotion 1.2',\n", " 'Hyundai i10 Sportz 1.2', 'Chevrolet Beat LT Opt Diesel',\n", " 'Chevrolet Beat LS Diesel', 'Tata Indigo CS',\n", " 'Maruti Suzuki Swift VDi', 'Hyundai Eon Era Plus',\n", " 'Mahindra XUV500', 'Ford Fiesta', 'Maruti Suzuki Wagon R',\n", " 'Hyundai i20', 'Tata Indigo eCS LX TDI BS III',\n", " 'Hyundai Fluidic Verna 1.6 CRDi SX',\n", " 'Commercial , DZire LDI, 2016, for sale', 'Fiat Petra ELX 1.2 PS',\n", " 'Hyundai Santro Xing XS', 'Maruti Suzuki Ciaz VXi Plus',\n", " 'Maruti Suzuki Zen VX', 'Hyundai Creta 1.6 SX Plus Petrol',\n", " 'Tata indigo ecs LX, 201', 'Mahindra Scorpio SLX',\n", " 'Toyota Innova 2.5 G BS III 8 STR',\n", " 'Maruti Suzuki Wagon R LXI BS IV', 'Tata Nano Cx BSIV',\n", " 'Maruti Suzuki Alto Std BS IV', 'Maruti Suzuki Wagon R LXi BS III',\n", " 'Maruti Suzuki Swift VXI BSIII',\n", " 'Tata Sumo Victa EX 10 by 7 Str BSIII', 'MARUTI SUZUKI DESI',\n", " 'Volkswagen Passat Diesel Comfortline AT',\n", " 'Renault Scala RxL Diesel Travelogue',\n", " 'Hyundai Grand i10 Sportz O 1.2 Kappa VTVT',\n", " 'Hyundai i20 Active 1.2 SX', 'Mahindra Xylo E4',\n", " 'Mahindra Jeep MM 550 XDB', 'Mahindra Bolero SLE BS IV',\n", " 'Force Motors Force One LX ABS 7 STR', 'Maruti Suzuki SX4',\n", " 'Toyota Etios', 'Honda City ZX 
VTEC',\n", " 'Maruti Suzuki Wagon R LX BS III', 'Honda City VX O MT Diesel',\n", " 'Mahindra Thar CRDe 4x4 AC',\n", " 'Audi A4 1.8 TFSI Multitronic Premium Plus',\n", " 'Mercedes Benz GLA Class 200 CDI Sport',\n", " 'Land Rover Freelander 2 SE', 'Renault Kwid RXT',\n", " 'Tata Aria Pleasure 4X2', 'Mercedes Benz B Class B180 Sports',\n", " 'Datsun GO T O', 'Honda Jazz VX MT',\n", " 'Hyundai i20 Active 1.4L SX O', 'Mini Cooper S',\n", " 'Maruti Suzuki Ciaz ZXI Plus', 'Chevrolet Tavera Neo',\n", " 'Hyundai Eon Sportz', 'Tata Sumo Gold Select Variant',\n", " 'Maruti Suzuki Wagon R 1.0', 'Maruti Suzuki Esteem VXi BS III',\n", " 'Chevrolet Enjoy 1.4 LS 8 STR', 'Maruti Suzuki Wagon R 1.0 VXi',\n", " 'Nissan Terrano XL D Plus', 'Renault Duster 85 PS RxL Diesel',\n", " 'Maruti Suzuki Dzire ZXI', 'Renault Kwid RXT Opt',\n", " 'Maruti Suzuki Maruti 800 Std', 'Renault Kwid 1.0 RXT AMT',\n", " 'Renault Scala RxL Diesel',\n", " 'Hyundai Grand i10 Asta 1.2 Kappa VTVT O',\n", " 'Chevrolet Beat LS Petrol', 'Hyundai Accent GLX', 'Yama',\n", " 'Maruti Suzuki Swift LDi', 'Mahindra TUV300 T4 Plus',\n", " 'Tata Indica V2 Xeta e GLE', 'Tata Indigo CS LS DiCOR',\n", " 'Mahindra Scorpio VLX Special Edition BS III',\n", " 'Tata Indica eV2 LS', 'Honda Accord',\n", " 'Ford EcoSport Titanium 1.5 TDCi', 'Maruti Suzuki Ertiga',\n", " 'Mahindra Scorpio 2.6 CRDe', 'Honda Mobilio',\n", " 'Toyota Corolla Altis', 'Skoda Laura', 'Hyundai Verna Fluidic',\n", " 'Maruti Suzuki Vitara Brezza', 'Tata Manza Aura Quadrajet',\n", " 'Chevrolet Sail UVA Petrol LT ABS',\n", " 'Hyundai Verna Fluidic 1.6 VTVT SX',\n", " 'Audi A4 2.0 TDI 177bhp Premium', 'Hyundai Elantra SX',\n", " 'Mahindra Scorpio VLX 4WD Airbag', 'Mahindra KUV100 K8 D 6 STR',\n", " 'Hyundai Grand i10', 'Hyundai i10', 'Hyundai i20 Active',\n", " 'Datsun Redi GO', 'Toyota Etios Liva', 'Hyundai Accent',\n", " 'Hyundai Verna', 'Toyota Fortuner', 'Hyundai i10 Sportz',\n", " 'Mahindra Bolero Power Plus SLE', 'selling car Ta',\n", " 'Honda City 1.5 V 
MT Exclusive', 'Chevrolet Spark LT 1.0 Airbag',\n", " 'Tata Indigo eCS VX CR4 BS IV', 'Tata Zest 90',\n", " 'Skoda Rapid Elegance 1.6 TDI CR MT', 'Tata Vista Quadrajet VX',\n", " 'Maruti Suzuki Alto K10 VXi AT', 'Maruti Suzuki Zen LXi BS III',\n", " 'Maruti Suzuki Swift Dzire Tour LDi', 'Honda City ZX EXi',\n", " 'Chevrolet Beat Diesel', 'Maruti Suzuki Swift Dzire car',\n", " 'Hyundai Verna 1.4 VTVT', 'Toyota Innova 2.5 E MS 7 STR BS IV',\n", " 'Maruti Suzuki Maruti 800 Std – Befo',\n", " 'Hyundai Elite i20 Asta 1.4 CRDI',\n", " 'Maruti Suzuki Swift Dzire Tour (Gat',\n", " 'Maruti Suzuki Versa DX2 8 SEATER BSIII',\n", " 'Tata Indigo LX TDI BS III',\n", " 'Volkswagen Vento Konekt Diesel Highline',\n", " 'Mercedes Benz C Class 200 CDI Classic', 'URJE',\n", " 'Hyundai Santro Xing GLS', 'Maruti Suzuki Omni Limited Edition',\n", " 'Hyundai Sonata Transform 2.4 GDi MT',\n", " 'Hyundai Elite i20 Sportz 1.2', 'Honda Jazz S MT',\n", " 'Hyundai Grand i10 Sportz 1.2 Kappa VTVT',\n", " 'Maruti Suzuki Zen LXi BSII',\n", " 'Mahindra Scorpio W Turbo 2.6DX 9 Seater',\n", " 'Swift Dzire Tour 27 Dec 2016 Regis', 'Maruti Suzuki Alto K10 VXi',\n", " 'Hyundai Grand i10 Asta 1.2 Kappa VTVT', 'Mahindra XUV500 W8',\n", " 'Hyundai i20 Magna O 1.2', 'Renault Duster 85 PS RxL Explore LE',\n", " 'Honda Brio V MT', 'Mahindra TUV300 T8',\n", " 'Nissan X Trail Select Variant', 'Ford Ikon 1.3 CLXi NXt Finesse',\n", " 'Toyota Fortuner 3.0 4x4 MT', 'Tata Manza ELAN Quadrajet',\n", " 'Tata zest x', 'Mahindra xyl',\n", " 'Mercedes Benz A Class A 180 Sport Petrol', 'Tata Indigo LS',\n", " 'Hyundai i20 Magna 1.2', 'Used Commercial Maruti Omn',\n", " 'Honda Amaze 1.5 E i DTEC', 'Hyundai Verna 1.6 EX VTVT',\n", " 'BMW 5 Series 520d Sedan', 'Skoda Superb 1.8 TFSI AT',\n", " 'Audi Q3 2.0 TDI quattro Premium', 'Mahindra Bolero DI BSII',\n", " 'Maruti Suzuki Zen Estilo LXI Green CNG',\n", " 'Ford Figo Duratorq Diesel Titanium 1.4',\n", " 'Maruti Suzuki Wagon R VXI BS IV', 'Mahindra Logan Diesel 1.5 DLS',\n", 
" 'Tata Nano GenX XMA', 'Honda City SV', 'Ford Figo Petrol LXI',\n", " 'Hyundai i10 Magna 1.2 Kappa2', 'Toyota Corolla H2',\n", " 'Maruti Suzuki Swift Dzire Tour VXi', 'Tata Indigo CS eLS BS IV',\n", " 'Hyundai Xcent Base 1.1 CRDi', 'Hyundai Accent Executive Edition',\n", " 'Tata Zest XE 75 PS Diesel', 'Maruti Suzuki Dzire LDI',\n", " 'Tata Sumo Gold LX BS IV', 'Toyota Corolla Altis GL Petrol',\n", " 'Maruti Suzuki Eeco 7 STR', 'Toyota Fortuner 3.0 4x2 MT',\n", " 'Mahindra XUV500 W6', 'Tata Tigor Revotron XZ',\n", " 'Maruti Suzuki 800', 'Honda Mobilio S i DTEC',\n", " 'Hyundai Verna 1.6 CRDI E', 'Maruti Suzuki Omni Select Variant',\n", " 'Tata Indica', 'Hyundai Santro Xing', 'Maruti Suzuki Zen Estilo',\n", " 'Honda Brio VX AT', 'Maruti Suzuki Wagon R Select Variant',\n", " 'Tata Nano Lx BSIV', 'Jaguar XE XE Portfolio',\n", " 'Hyundai Xcent S 1.2', 'Hyundai Eon Magna Plus',\n", " 'Maruti Suzuki Ritz GENUS VXI',\n", " 'Hyundai Grand i10 Magna AT 1.2 Kappa VTVT',\n", " 'Hyundai Eon D Lite Plus', 'Honda Amaze 1.2 VX i VTEC',\n", " 'Maruti Suzuki Estilo VXi ABS BS IV',\n", " 'Maruti Suzuki Vitara Brezza LDi O', 'Toyota Innova 2.0 V',\n", " 'Hyundai Creta 1.6 SX Plus Petrol AT', 'Mahindra Scorpio Vlx BSIV',\n", " 'Mitsubishi Lancer 1.8 LXi', 'Maruti Suzuki Maruti 800 AC',\n", " 'Maruti Suzuki Alto 800 LXI CNG O', 'Ford Fiesta SXi 1.6 ABS',\n", " 'Maruti Suzuki Ritz VDi', 'Maruti Suzuki Estilo LX BS IV',\n", " 'Audi A6 2.0 TDI Premium', 'Maruti Suzuki Alto',\n", " 'Maruti Suzuki Baleno Sigma 1.2', 'Hyundai Verna 1.6 SX VTVT AT',\n", " 'Maruti Suzuki Swift GLAM', 'Hyundai Getz Prime 1.3 GVS',\n", " 'Hyundai Santro', 'Hyundai Getz Prime 1.3 GLX',\n", " 'Chevrolet Beat PS Diesel', 'Ford EcoSport Trend 1.5 Ti VCT',\n", " 'Tata Indica V2 DLG', 'BMW X1 xDrive20d xLine',\n", " 'Honda City 1.5 V AT', 'Tata Nano', 'Chevrolet Cruze LTZ AT',\n", " 'Hyun', 'Maruti Suzuki Swift Dzire VDi', 'Mahindra XUV500 W10',\n", " 'Maruti Suzuki Alto K10 LXi CNG', 'Hyundai Accent GLE',\n", " 
'Force Motors One SUV', 'Datsun Go Plus T O',\n", " 'Chevrolet Spark 1.0 LT', 'Toyota Etios Liva GD',\n", " 'Renault Duster 85PS Diesel RxL Optional with Nav',\n", " 'Chevrolet Enjoy', 'BMW 5 Series 530i', 'Chevrolet Cruze LTZ',\n", " 'Jeep Wrangler Unlimited 4x4 Diesel',\n", " 'Hyundai Verna VGT CRDi SX ABS', 'Maruti Suzuki Omni',\n", " 'Maruti Suzuki Celerio VDi', 'Tata Zest Quadrajet 1.3',\n", " 'Tata Indigo CS eLX BS IV', 'Hyundai i10 Era',\n", " 'Tata Indigo eCS LX CR4 BS IV', 'Tata Indigo Marina LS',\n", " 'Commercial Chevrolet Sail Hatchback ca', 'Hyundai Xcent SX 1.2',\n", " 'Tata Nano LX Special Edition', 'Commercial Car Ta',\n", " 'Renault Duster 110 PS RxZ Diesel',\n", " 'Maruti Suzuki Wagon R AX BSIV', 'Maruti Suzuki Alto K10 New',\n", " 'tata Indica', 'Mahindra Xylo E8', 'Tata Manza Aqua Quadrajet',\n", " 'Used bt new conditions ta', 'Renault Kwid 1.0', 'Sale tata',\n", " 'Tata Venture EX 8 STR', 'Maruti Suzuki Swift Dzire Tour LXi',\n", " 'Maruti Suzuki Alto LX BSII', 'Skoda Octavia Classic 1.9 TDI MT',\n", " 'Maruti Suzuki Omni LPG BS IV', 'Tata Sumo Gold EX BS IV',\n", " 'Tata indigo 2017 top model..', 'Hyundai Verna 1.6 CRDI SX',\n", " 'Mahindra Scorpio SLX 2.6 Turbo 8 Str', 'Ford Ikon 1.6 Nxt',\n", " 'Tata indigo', 'Toyota Innova 2.5 V 7 STR', 'Nissan Sunny XL',\n", " 'Maruti Suzuki Swift VDi BS IV',\n", " 'very good condition tata bolts are av', 'Toyota Innova 2.0 G4',\n", " 'Sale Hyundai xcent commerc', 'Maruti Suzuki Swift VDi ABS',\n", " 'Hyundai Elite i20 Asta 1.2', 'Volkswagen Polo Trendline 1.5L D',\n", " 'Toyota Etios Liva Diesel', 'Maruti Suzuki Ciaz ZXi Plus RS',\n", " 'Hyundai Elantra 1.8 S', 'Ford EcoSport Trend 1.5L Ti VCT',\n", " 'Jaguar XF 2.2 Diesel Luxury',\n", " 'Audi Q5 2.0 TDI quattro Premium Plus', 'BMW 3 Series 320d Sedan',\n", " 'Maruti Suzuki Swift ZXi 1.2 BS IV', 'BMW X1 sDrive20d',\n", " 'Maruti Suzuki S Cross Sigma 1.3', 'Maruti Suzuki Ertiga LDi',\n", " 'Volkswagen Vento Comfortline Petrol', 'Mahindra KUV100',\n", " 
'Maruti Suzuki Swift Dzire Tour VDi', 'Mahindra Scorpio 2.6 SLX',\n", " 'Maruti Suzuki Omni 8 STR BS III',\n", " 'Volkswagen Jetta Comfortline 1.9 TDI AT', 'Volvo S80 Summum D4',\n", " 'Toyota Corolla Altis VL AT Petrol',\n", " 'Mitsubishi Pajero Sport 2.5 AT', 'Chevrolet Beat LT Petrol',\n", " 'BMW X1', 'Mercedes Benz C Class C 220 CDI Avantgarde',\n", " 'Volkswagen Vento Comfortline Diesel', 'Tata Indigo CS GLS',\n", " 'Ford Figo Petrol Titanium', 'Honda City ZX GXi',\n", " 'Maruti Suzuki Wagon R Duo Lxi', 'Maruti Suzuki Zen LX BSII',\n", " 'Renault Duster RxL Petrol', 'Maruti Suzuki Baleno Zeta 1.2',\n", " 'Honda WR V S MT Petrol', 'Renault Duster 110 PS RxL Diesel',\n", " 'Mahindra Scorpio LX BS III',\n", " 'Maruti Suzuki SX4 Celebration Diesel',\n", " 'Audi A3 Cabriolet 40 TFSI',\n", " 'I want to sell my commercial car due t',\n", " 'Hyundai Santro AE GLS Audio',\n", " 'i want sale my car.no emi....uber atta', 'Tata ZEST 6 month old',\n", " 'Mahindra Xylo D2 BS IV', 'Hyundai Getz GLE',\n", " 'Hyundai Creta 1.6 SX', 'Hyundai Santro Xing XL AT eRLX Euro III',\n", " 'Hyundai Santro Xing XL eRLX Euro III',\n", " 'Tata Indica V2 DLS BS III', 'Honda City 1.5 E MT',\n", " 'Nissan Micra XL', 'Honda City 1.5 S Inspire',\n", " 'Tata Indica eV2 eXeta eGLX', 'Maruti Suzuki Omni E 8 STR BS IV',\n", " 'MARUTI SUZUKI ERTIGA F', 'Hyundai Verna 1.6 CRDI SX Plus AT',\n", " 'Chevrolet Tavera LS B3 10 Seats BSII', 'Tata Tiago Revotron XM',\n", " 'Tata Tiago Revotorq XZ', 'Tata Nexon', 'Tata',\n", " 'Hindustan Motors Ambassador Classic Mark 4 – Befo',\n", " 'Ford Fusion 1.4 TDCi Diesel',\n", " 'Fiat Linea Emotion 1.4 L T Jet Petrol',\n", " 'Ford Ikon 1.3 Flair Josh 100', 'Tata Indica V2 LS',\n", " 'Mahindra Xylo D2', 'Hyundai Eon Magna',\n", " 'Tata Sumo Grande MKII GX', 'Volkswagen Polo Highline1.2L P',\n", " 'Tata Tiago Revotron XZ', 'Tata Indigo eCS',\n", " '2012 Tata Sumo Gold f', 'Mahindra Xylo E8 BS IV',\n", " 'Well mentained Tata Sumo',\n", " 'all paper updated tata indica 
v2 and u',\n", " 'Maruti Ertiga showroom condition with',\n", " '7 SEATER MAHINDRA BOLERO IN VERY GOOD', '9 SEATER MAHINDRA BOL',\n", " 'scratch less Tata I', 'Maruti Suzuki swift dzire for sale in',\n", " 'Commercial Chevrolet beat for sale in',\n", " 'urgent sell my Mahindra qu', 'Tata Sumo Gold FX BSIII',\n", " 'sell my car Maruti Suzuki Swif',\n", " 'Maruti Suzuki Swift Dzire good car fo', 'Hyunda',\n", " 'Commercial Maruti Suzuki Alto Lxi 800', 'urgent sale Ta',\n", " 'Maruti Suzuki Alto vxi t', 'tata', 'TATA INDI', 'Hyundai Creta',\n", " 'Tata Bolt XM Petrol', 'Hyundai Venue', 'Maruti Suzuki Ritz',\n", " 'Renault Lodgy', 'Hyundai i20 Asta',\n", " 'Maruti Suzuki Swift Select Variant', 'Tata Indica V2 DLX BS III',\n", " 'Mahindra Scorpio VLX 2.2 mHawk Airbag BSIV',\n", " 'Toyota Innova 2.5 E 8 STR', 'Mahindra KUV100 K8 6 STR',\n", " 'Datsun Go Plus', 'Ford Endeavor 4x4 Thunder Plus',\n", " 'Tata Indica V2', 'Hyundai Santro Xing GL',\n", " 'Toyota Innova 2.5 Z Diesel 7 Seater',\n", " 'Any type car avaiabel hare...comercica', 'Maruti Suzuki Alto AX',\n", " 'Mahindra Logan', 'Maruti Suzuki 800 Std BS III',\n", " 'Chevrolet Sail 1.2 LS',\n", " 'Volkswagen Vento Highline Plus 1.5 Diesel', 'Tata Manza',\n", " 'Toyota Innova 2.0 G1 Petrol 8seater', 'Toyota Etios G',\n", " 'Toyota Qualis', 'Mahindra Quanto C4', 'Maruti Suzuki Swift Dzire',\n", " 'Hyundai i20 Select Variant', 'Honda City VX Petrol',\n", " 'Hyundai Getz', 'Mercedes Benz C Class 200 K MT', 'Skoda Fabia',\n", " 'Maruti Suzuki Alto 800 Select Variant',\n", " 'Maruti Suzuki Ritz VXI ABS', 'tata zest 2017 f',\n", " 'Tata Indica V2 DLE BS III', 'Ta', 'Tata Zest XM Diesel',\n", " 'Honda Amaze 1.2 E i VTEC', 'Chevrolet Sail 1.2 LT ABS'],\n", " dtype=object)" ] }, "execution_count": 9, "metadata": {}, "output_type": "execute_result" } ], "source": [ "car['name'].unique()" ] }, { "cell_type": "markdown", "id": "470f179e-4860-4f34-992a-b8b4f9189199", "metadata": {}, "source": [ "## Quality\n", "- Year has many 
non-year values.\n", "- Year is stored as object (string); it needs to be converted to int.\n", "- Price contains the placeholder 'Ask For Price'; these rows need to be removed.\n", "- Price is stored as object (string with comma separators); it needs to be converted to int.\n", "- kms_driven contains the stray value 'Petrol', and its numeric values carry commas and a ' kms' suffix.\n", "- kms_driven is stored as object (string); it needs to be converted to int.\n", "- kms_driven has NaN values.\n", "- fuel_type has NaN values.\n", " " ] }, { "cell_type": "markdown", "id": "f31c659d-4396-49fe-a7dd-e656123eacc5", "metadata": {}, "source": [ "## Cleaning\n" ] }, { "cell_type": "code", "execution_count": 10, "id": "86612423-3219-4e12-9d0a-e6ed251ceb11", "metadata": {}, "outputs": [], "source": [ "backup=car.copy()" ] }, { "cell_type": "code", "execution_count": 11, "id": "07338540-2e4f-4394-884d-dfc23116325a", "metadata": {}, "outputs": [ { "data": { "text/plain": [ "0 True\n", "1 True\n", "2 True\n", "3 True\n", "4 True\n", " ... \n", "887 False\n", "888 True\n", "889 True\n", "890 True\n", "891 True\n", "Name: year, Length: 892, dtype: bool" ] }, "execution_count": 11, "metadata": {}, "output_type": "execute_result" } ], "source": [ "car['year'].str.isnumeric()" ] }, { "cell_type": "code", "execution_count": 12, "id": "93d7be11-9c9e-4f48-8f82-949e7924dd31", "metadata": {}, "outputs": [ { "data": { "text/html": [ "
\n", "\n", "\n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", "
namecompanyyearPricekms_drivenfuel_type
0Hyundai Santro Xing XO eRLX Euro IIIHyundai200780,00045,000 kmsPetrol
1Mahindra Jeep CL550 MDIMahindra20064,25,00040 kmsDiesel
2Maruti Suzuki Alto 800 VxiMaruti2018Ask For Price22,000 kmsPetrol
3Hyundai Grand i10 Magna 1.2 Kappa VTVTHyundai20143,25,00028,000 kmsPetrol
4Ford EcoSport Titanium 1.5L TDCiFord20145,75,00036,000 kmsDiesel
\n", "
" ], "text/plain": [ " name company year Price \\\n", "0 Hyundai Santro Xing XO eRLX Euro III Hyundai 2007 80,000 \n", "1 Mahindra Jeep CL550 MDI Mahindra 2006 4,25,000 \n", "2 Maruti Suzuki Alto 800 Vxi Maruti 2018 Ask For Price \n", "3 Hyundai Grand i10 Magna 1.2 Kappa VTVT Hyundai 2014 3,25,000 \n", "4 Ford EcoSport Titanium 1.5L TDCi Ford 2014 5,75,000 \n", "\n", " kms_driven fuel_type \n", "0 45,000 kms Petrol \n", "1 40 kms Diesel \n", "2 22,000 kms Petrol \n", "3 28,000 kms Petrol \n", "4 36,000 kms Diesel " ] }, "execution_count": 12, "metadata": {}, "output_type": "execute_result" } ], "source": [ "# Keep only rows whose year is purely numeric. The explicit .copy() gives car1 its own data,\n", "# so the column assignments in the following cells do not raise pandas' SettingWithCopyWarning.\n", "car1=car[car['year'].str.isnumeric()].copy()\n", "car1.head()" ] }, { "cell_type": "code", "execution_count": 13, "id": "24309923-9157-47d6-a839-4a95f2f28315", "metadata": {}, "outputs": [ { "name": "stdout", "output_type": "stream", "text": [ "\n", "Index: 842 entries, 0 to 891\n", "Data columns (total 6 columns):\n", " # Column Non-Null Count Dtype \n", "--- ------ -------------- ----- \n", " 0 name 842 non-null object\n", " 1 company 842 non-null object\n", " 2 year 842 non-null int32 \n", " 3 Price 842 non-null object\n", " 4 kms_driven 840 non-null object\n", " 5 fuel_type 837 non-null object\n", "dtypes: int32(1), object(5)\n", "memory usage: 42.8+ KB\n" ] } ], "source": [ "car1['year']=car1['year'].astype(int)\n", "car1.info()" ] }, { "cell_type": "code", "execution_count": 14, "id": "8d6a21de-4c3d-410c-8889-66a0e36d604a", "metadata": {}, "outputs": [], "source": [ 
"car1=car1[car1['Price']!='Ask For Price']" ] }, { "cell_type": "code", "execution_count": 15, "id": "70e840b6-c6bb-407e-bc5a-e069d6d07d3b", "metadata": {}, "outputs": [ { "data": { "text/plain": [ "0 80000\n", "1 425000\n", "3 325000\n", "4 575000\n", "6 175000\n", " ... \n", "886 300000\n", "888 260000\n", "889 390000\n", "890 180000\n", "891 160000\n", "Name: Price, Length: 819, dtype: int32" ] }, "execution_count": 15, "metadata": {}, "output_type": "execute_result" } ], "source": [ "car1['Price'].str.replace(',','').astype(int)" ] }, { "cell_type": "code", "execution_count": 16, "id": "3bd863ce-b208-4af4-8340-1bd27b337846", "metadata": {}, "outputs": [ { "name": "stdout", "output_type": "stream", "text": [ "\n", "Index: 819 entries, 0 to 891\n", "Data columns (total 6 columns):\n", " # Column Non-Null Count Dtype \n", "--- ------ -------------- ----- \n", " 0 name 819 non-null object\n", " 1 company 819 non-null object\n", " 2 year 819 non-null int32 \n", " 3 Price 819 non-null int32 \n", " 4 kms_driven 819 non-null object\n", " 5 fuel_type 816 non-null object\n", "dtypes: int32(2), object(4)\n", "memory usage: 38.4+ KB\n" ] } ], "source": [ "car1['Price']=car1['Price'].str.replace(',','').astype(int)\n", "car1.info()" ] }, { "cell_type": "code", "execution_count": 17, "id": "573a7047-be9a-4dc5-a87e-d8f401abb111", "metadata": {}, "outputs": [ { "data": { "text/plain": [ "0 45000\n", "1 40\n", "3 28000\n", "4 36000\n", "6 41000\n", " ... 
\n", "886 132000\n", "888 27000\n", "889 40000\n", "890 Petrol\n", "891 Petrol\n", "Name: kms_driven, Length: 819, dtype: object" ] }, "execution_count": 17, "metadata": {}, "output_type": "execute_result" } ], "source": [ "car1['kms_driven'].str.split(\" \").str.get(0).str.replace(',','')" ] }, { "cell_type": "code", "execution_count": 18, "id": "8237c462-8263-449d-adc5-ba7204367670", "metadata": {}, "outputs": [ { "name": "stdout", "output_type": "stream", "text": [ "\n", "Index: 819 entries, 0 to 891\n", "Data columns (total 6 columns):\n", " # Column Non-Null Count Dtype \n", "--- ------ -------------- ----- \n", " 0 name 819 non-null object\n", " 1 company 819 non-null object\n", " 2 year 819 non-null int32 \n", " 3 Price 819 non-null int32 \n", " 4 kms_driven 819 non-null object\n", " 5 fuel_type 816 non-null object\n", "dtypes: int32(2), object(4)\n", "memory usage: 38.4+ KB\n" ] } ], "source": [ "car1['kms_driven']=car1['kms_driven'].str.split(\" \").str.get(0).str.replace(',','')\n", "car1.info()" ] }, { "cell_type": "code", "execution_count": 19, "id": "0215efc1-e276-4a5a-b0bc-fa1798ee0069", "metadata": {}, "outputs": [ { "data": { "text/html": [ "
\n", "\n", "\n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", "
namecompanyyearPricekms_drivenfuel_type
0Hyundai Santro Xing XO eRLX Euro IIIHyundai20078000045000Petrol
1Mahindra Jeep CL550 MDIMahindra200642500040Diesel
3Hyundai Grand i10 Magna 1.2 Kappa VTVTHyundai201432500028000Petrol
4Ford EcoSport Titanium 1.5L TDCiFord201457500036000Diesel
6Ford FigoFord201217500041000Diesel
\n", "
" ], "text/plain": [ " name company year Price kms_driven \\\n", "0 Hyundai Santro Xing XO eRLX Euro III Hyundai 2007 80000 45000 \n", "1 Mahindra Jeep CL550 MDI Mahindra 2006 425000 40 \n", "3 Hyundai Grand i10 Magna 1.2 Kappa VTVT Hyundai 2014 325000 28000 \n", "4 Ford EcoSport Titanium 1.5L TDCi Ford 2014 575000 36000 \n", "6 Ford Figo Ford 2012 175000 41000 \n", "\n", " fuel_type \n", "0 Petrol \n", "1 Diesel \n", "3 Petrol \n", "4 Diesel \n", "6 Diesel " ] }, "execution_count": 19, "metadata": {}, "output_type": "execute_result" } ], "source": [ "car1=car1[car1[\"kms_driven\"].str.isnumeric()]\n", "car1.head()" ] }, { "cell_type": "code", "execution_count": 20, "id": "29aa5e23-9d2f-4ddd-84a5-a4db9b908423", "metadata": {}, "outputs": [ { "name": "stdout", "output_type": "stream", "text": [ "\n", "Index: 817 entries, 0 to 889\n", "Data columns (total 6 columns):\n", " # Column Non-Null Count Dtype \n", "--- ------ -------------- ----- \n", " 0 name 817 non-null object\n", " 1 company 817 non-null object\n", " 2 year 817 non-null int32 \n", " 3 Price 817 non-null int32 \n", " 4 kms_driven 817 non-null object\n", " 5 fuel_type 816 non-null object\n", "dtypes: int32(2), object(4)\n", "memory usage: 38.3+ KB\n" ] } ], "source": [ "car1.info()" ] }, { "cell_type": "code", "execution_count": 21, "id": "a7e12b08-540f-413b-a4eb-3b1df9ed1c33", "metadata": {}, "outputs": [ { "name": "stdout", "output_type": "stream", "text": [ "\n", "Index: 817 entries, 0 to 889\n", "Data columns (total 6 columns):\n", " # Column Non-Null Count Dtype \n", "--- ------ -------------- ----- \n", " 0 name 817 non-null object\n", " 1 company 817 non-null object\n", " 2 year 817 non-null int32 \n", " 3 Price 817 non-null int32 \n", " 4 kms_driven 817 non-null int32 \n", " 5 fuel_type 816 non-null object\n", "dtypes: int32(3), object(3)\n", "memory usage: 35.1+ KB\n" ] } ], "source": [ "car1[\"kms_driven\"]=car1[\"kms_driven\"].astype(int)\n", "car1.info()" ] }, { "cell_type": "code", 
"execution_count": 22, "id": "4cc50942-7b1b-492c-88b2-1c5e43eb9c51", "metadata": {}, "outputs": [ { "data": { "text/html": [ "
\n", "\n", "\n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", "
namecompanyyearPricekms_drivenfuel_type
0Hyundai Santro Xing XO eRLX Euro IIIHyundai20078000045000Petrol
1Mahindra Jeep CL550 MDIMahindra200642500040Diesel
3Hyundai Grand i10 Magna 1.2 Kappa VTVTHyundai201432500028000Petrol
4Ford EcoSport Titanium 1.5L TDCiFord201457500036000Diesel
6Ford FigoFord201217500041000Diesel
.....................
883Maruti Suzuki Ritz VXI ABSMaruti201127000050000Petrol
885Tata Indica V2 DLE BS IIITata200911000030000Diesel
886Toyota Corolla AltisToyota2009300000132000Petrol
888Tata Zest XM DieselTata201826000027000Diesel
889Mahindra Quanto C8Mahindra201339000040000Diesel
\n", "

816 rows × 6 columns

\n", "
" ], "text/plain": [ " name company year Price \\\n", "0 Hyundai Santro Xing XO eRLX Euro III Hyundai 2007 80000 \n", "1 Mahindra Jeep CL550 MDI Mahindra 2006 425000 \n", "3 Hyundai Grand i10 Magna 1.2 Kappa VTVT Hyundai 2014 325000 \n", "4 Ford EcoSport Titanium 1.5L TDCi Ford 2014 575000 \n", "6 Ford Figo Ford 2012 175000 \n", ".. ... ... ... ... \n", "883 Maruti Suzuki Ritz VXI ABS Maruti 2011 270000 \n", "885 Tata Indica V2 DLE BS III Tata 2009 110000 \n", "886 Toyota Corolla Altis Toyota 2009 300000 \n", "888 Tata Zest XM Diesel Tata 2018 260000 \n", "889 Mahindra Quanto C8 Mahindra 2013 390000 \n", "\n", " kms_driven fuel_type \n", "0 45000 Petrol \n", "1 40 Diesel \n", "3 28000 Petrol \n", "4 36000 Diesel \n", "6 41000 Diesel \n", ".. ... ... \n", "883 50000 Petrol \n", "885 30000 Diesel \n", "886 132000 Petrol \n", "888 27000 Diesel \n", "889 40000 Diesel \n", "\n", "[816 rows x 6 columns]" ] }, "execution_count": 22, "metadata": {}, "output_type": "execute_result" } ], "source": [ "car1=car1[~car1['fuel_type'].isna()]\n", "car1" ] }, { "cell_type": "code", "execution_count": 23, "id": "04e9108c-9177-4052-94a9-9e47c1ad7472", "metadata": {}, "outputs": [ { "data": { "text/plain": [ "0 Hyundai Santro Xing\n", "1 Mahindra Jeep CL550\n", "3 Hyundai Grand i10\n", "4 Ford EcoSport Titanium\n", "6 Ford Figo\n", " ... \n", "883 Maruti Suzuki Ritz\n", "885 Tata Indica V2\n", "886 Toyota Corolla Altis\n", "888 Tata Zest XM\n", "889 Mahindra Quanto C8\n", "Name: name, Length: 816, dtype: object" ] }, "execution_count": 23, "metadata": {}, "output_type": "execute_result" } ], "source": [ "car1['name']=car1['name'].str.split(\" \").str.slice(0,3).str.join(' ')\n", "car1['name']" ] }, { "cell_type": "code", "execution_count": 24, "id": "28accf05-4846-45eb-a67e-1ea487920dbd", "metadata": {}, "outputs": [ { "data": { "text/html": [ "
\n", "\n", "\n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", "
namecompanyyearPricekms_drivenfuel_type
0Hyundai Santro XingHyundai20078000045000Petrol
1Mahindra Jeep CL550Mahindra200642500040Diesel
3Hyundai Grand i10Hyundai201432500028000Petrol
4Ford EcoSport TitaniumFord201457500036000Diesel
6Ford FigoFord201217500041000Diesel
.....................
883Maruti Suzuki RitzMaruti201127000050000Petrol
885Tata Indica V2Tata200911000030000Diesel
886Toyota Corolla AltisToyota2009300000132000Petrol
888Tata Zest XMTata201826000027000Diesel
889Mahindra Quanto C8Mahindra201339000040000Diesel
\n", "

816 rows × 6 columns

\n", "
" ], "text/plain": [ " name company year Price kms_driven fuel_type\n", "0 Hyundai Santro Xing Hyundai 2007 80000 45000 Petrol\n", "1 Mahindra Jeep CL550 Mahindra 2006 425000 40 Diesel\n", "3 Hyundai Grand i10 Hyundai 2014 325000 28000 Petrol\n", "4 Ford EcoSport Titanium Ford 2014 575000 36000 Diesel\n", "6 Ford Figo Ford 2012 175000 41000 Diesel\n", ".. ... ... ... ... ... ...\n", "883 Maruti Suzuki Ritz Maruti 2011 270000 50000 Petrol\n", "885 Tata Indica V2 Tata 2009 110000 30000 Diesel\n", "886 Toyota Corolla Altis Toyota 2009 300000 132000 Petrol\n", "888 Tata Zest XM Tata 2018 260000 27000 Diesel\n", "889 Mahindra Quanto C8 Mahindra 2013 390000 40000 Diesel\n", "\n", "[816 rows x 6 columns]" ] }, "execution_count": 24, "metadata": {}, "output_type": "execute_result" } ], "source": [ "car1" ] }, { "cell_type": "code", "execution_count": 25, "id": "f7dbe6fb-1714-41b3-a08f-9d1e48a05317", "metadata": {}, "outputs": [ { "data": { "text/html": [ "
\n", "\n", "\n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", "
namecompanyyearPricekms_drivenfuel_type
0Hyundai Santro XingHyundai20078000045000Petrol
1Mahindra Jeep CL550Mahindra200642500040Diesel
2Hyundai Grand i10Hyundai201432500028000Petrol
3Ford EcoSport TitaniumFord201457500036000Diesel
4Ford FigoFord201217500041000Diesel
.....................
811Maruti Suzuki RitzMaruti201127000050000Petrol
812Tata Indica V2Tata200911000030000Diesel
813Toyota Corolla AltisToyota2009300000132000Petrol
814Tata Zest XMTata201826000027000Diesel
815Mahindra Quanto C8Mahindra201339000040000Diesel
\n", "

816 rows × 6 columns

\n", "
" ], "text/plain": [ " name company year Price kms_driven fuel_type\n", "0 Hyundai Santro Xing Hyundai 2007 80000 45000 Petrol\n", "1 Mahindra Jeep CL550 Mahindra 2006 425000 40 Diesel\n", "2 Hyundai Grand i10 Hyundai 2014 325000 28000 Petrol\n", "3 Ford EcoSport Titanium Ford 2014 575000 36000 Diesel\n", "4 Ford Figo Ford 2012 175000 41000 Diesel\n", ".. ... ... ... ... ... ...\n", "811 Maruti Suzuki Ritz Maruti 2011 270000 50000 Petrol\n", "812 Tata Indica V2 Tata 2009 110000 30000 Diesel\n", "813 Toyota Corolla Altis Toyota 2009 300000 132000 Petrol\n", "814 Tata Zest XM Tata 2018 260000 27000 Diesel\n", "815 Mahindra Quanto C8 Mahindra 2013 390000 40000 Diesel\n", "\n", "[816 rows x 6 columns]" ] }, "execution_count": 25, "metadata": {}, "output_type": "execute_result" } ], "source": [ "car1=car1.reset_index(drop=True)\n", "car1" ] }, { "cell_type": "code", "execution_count": 26, "id": "5d244c24-6905-4701-8db2-cf1026f3e434", "metadata": {}, "outputs": [ { "name": "stdout", "output_type": "stream", "text": [ "\n", "RangeIndex: 816 entries, 0 to 815\n", "Data columns (total 6 columns):\n", " # Column Non-Null Count Dtype \n", "--- ------ -------------- ----- \n", " 0 name 816 non-null object\n", " 1 company 816 non-null object\n", " 2 year 816 non-null int32 \n", " 3 Price 816 non-null int32 \n", " 4 kms_driven 816 non-null int32 \n", " 5 fuel_type 816 non-null object\n", "dtypes: int32(3), object(3)\n", "memory usage: 28.8+ KB\n" ] } ], "source": [ "car1.info()" ] }, { "cell_type": "code", "execution_count": 27, "id": "16a17659-162a-4457-831f-df64d6d98d1f", "metadata": {}, "outputs": [ { "data": { "text/html": [ "
\n", "\n", "\n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", "
yearPricekms_driven
count816.0000008.160000e+02816.000000
mean2012.4448534.117176e+0546275.531863
std4.0029924.751844e+0534297.428044
min1995.0000003.000000e+040.000000
25%2010.0000001.750000e+0527000.000000
50%2013.0000002.999990e+0541000.000000
75%2015.0000004.912500e+0556818.500000
max2019.0000008.500003e+06400000.000000
\n", "
" ], "text/plain": [ " year Price kms_driven\n", "count 816.000000 8.160000e+02 816.000000\n", "mean 2012.444853 4.117176e+05 46275.531863\n", "std 4.002992 4.751844e+05 34297.428044\n", "min 1995.000000 3.000000e+04 0.000000\n", "25% 2010.000000 1.750000e+05 27000.000000\n", "50% 2013.000000 2.999990e+05 41000.000000\n", "75% 2015.000000 4.912500e+05 56818.500000\n", "max 2019.000000 8.500003e+06 400000.000000" ] }, "execution_count": 27, "metadata": {}, "output_type": "execute_result" } ], "source": [ "car1.describe()" ] }, { "cell_type": "code", "execution_count": 28, "id": "c556a939-a9a1-42ad-b6cf-15c2cc41fd61", "metadata": {}, "outputs": [], "source": [ "# Drop the price outlier: keep Price < 6e6 (i.e. below 60,00,000 / 60 lakh)\n", "car2=car1[car1['Price']<6e6].reset_index(drop=True)" ] }, { "cell_type": "code", "execution_count": 29, "id": "f75fa5c2-5640-42e6-8564-5e8d9ad8da4b", "metadata": {}, "outputs": [ { "data": { "text/html": [ "
\n", "\n", "\n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", "
namecompanyyearPricekms_drivenfuel_type
0Hyundai Santro XingHyundai20078000045000Petrol
1Mahindra Jeep CL550Mahindra200642500040Diesel
2Hyundai Grand i10Hyundai201432500028000Petrol
3Ford EcoSport TitaniumFord201457500036000Diesel
4Ford FigoFord201217500041000Diesel
.....................
810Maruti Suzuki RitzMaruti201127000050000Petrol
811Tata Indica V2Tata200911000030000Diesel
812Toyota Corolla AltisToyota2009300000132000Petrol
813Tata Zest XMTata201826000027000Diesel
814Mahindra Quanto C8Mahindra201339000040000Diesel
\n", "

815 rows × 6 columns

\n", "
" ], "text/plain": [ " name company year Price kms_driven fuel_type\n", "0 Hyundai Santro Xing Hyundai 2007 80000 45000 Petrol\n", "1 Mahindra Jeep CL550 Mahindra 2006 425000 40 Diesel\n", "2 Hyundai Grand i10 Hyundai 2014 325000 28000 Petrol\n", "3 Ford EcoSport Titanium Ford 2014 575000 36000 Diesel\n", "4 Ford Figo Ford 2012 175000 41000 Diesel\n", ".. ... ... ... ... ... ...\n", "810 Maruti Suzuki Ritz Maruti 2011 270000 50000 Petrol\n", "811 Tata Indica V2 Tata 2009 110000 30000 Diesel\n", "812 Toyota Corolla Altis Toyota 2009 300000 132000 Petrol\n", "813 Tata Zest XM Tata 2018 260000 27000 Diesel\n", "814 Mahindra Quanto C8 Mahindra 2013 390000 40000 Diesel\n", "\n", "[815 rows x 6 columns]" ] }, "execution_count": 29, "metadata": {}, "output_type": "execute_result" } ], "source": [ "car2" ] }, { "cell_type": "code", "execution_count": 30, "id": "916ca498-707d-44b5-a79a-231f6b30827b", "metadata": {}, "outputs": [], "source": [ "car2.to_csv(\"cleaned_data.csv\")" ] }, { "cell_type": "markdown", "id": "214c6fc5-4ae7-4ef9-b516-60aaa484ad1c", "metadata": {}, "source": [ "## Model" ] }, { "cell_type": "code", "execution_count": 31, "id": "acb98641-4025-414a-9dff-515f2d99c702", "metadata": {}, "outputs": [], "source": [ "X=car2.drop(columns='Price')\n", "y=car2['Price']\n" ] }, { "cell_type": "code", "execution_count": 32, "id": "7eb49274-fc9b-48ff-a17c-0a37c79348c5", "metadata": {}, "outputs": [], "source": [ "from sklearn.model_selection import train_test_split\n", "X_train,X_test,y_train,y_test=train_test_split(X,y,test_size=0.2)" ] }, { "cell_type": "code", "execution_count": 33, "id": "fe9dce09-7921-4680-b781-16d386cf8ce1", "metadata": {}, "outputs": [], "source": [ "from sklearn.linear_model import LinearRegression\n", "from sklearn.metrics import r2_score\n", "from sklearn.preprocessing import OneHotEncoder\n", "from sklearn.compose import make_column_transformer\n", "from sklearn.pipeline import make_pipeline" ] }, { "cell_type": "code", "execution_count": 
34, "id": "0066fbf5-6709-4c6f-8565-7a273e59f6c8", "metadata": {}, "outputs": [ { "data": { "text/html": [ "
OneHotEncoder()
In a Jupyter environment, please rerun this cell to show the HTML representation or trust the notebook.
On GitHub, the HTML representation is unable to render, please try loading this page with nbviewer.org.
" ], "text/plain": [ "OneHotEncoder()" ] }, "execution_count": 34, "metadata": {}, "output_type": "execute_result" } ], "source": [ "ohe=OneHotEncoder()\n", "ohe.fit(X[['name','company','fuel_type']])" ] }, { "cell_type": "code", "execution_count": 35, "id": "9c04e9cd-32f7-4502-bc3f-a6f455bbf5ab", "metadata": {}, "outputs": [ { "data": { "text/plain": [ "[array(['Audi A3 Cabriolet', 'Audi A4 1.8', 'Audi A4 2.0', 'Audi A6 2.0',\n", " 'Audi A8', 'Audi Q3 2.0', 'Audi Q5 2.0', 'Audi Q7', 'BMW 3 Series',\n", " 'BMW 5 Series', 'BMW 7 Series', 'BMW X1', 'BMW X1 sDrive20d',\n", " 'BMW X1 xDrive20d', 'Chevrolet Beat', 'Chevrolet Beat Diesel',\n", " 'Chevrolet Beat LS', 'Chevrolet Beat LT', 'Chevrolet Beat PS',\n", " 'Chevrolet Cruze LTZ', 'Chevrolet Enjoy', 'Chevrolet Enjoy 1.4',\n", " 'Chevrolet Sail 1.2', 'Chevrolet Sail UVA', 'Chevrolet Spark',\n", " 'Chevrolet Spark 1.0', 'Chevrolet Spark LS', 'Chevrolet Spark LT',\n", " 'Chevrolet Tavera LS', 'Chevrolet Tavera Neo', 'Datsun GO T',\n", " 'Datsun Go Plus', 'Datsun Redi GO', 'Fiat Linea Emotion',\n", " 'Fiat Petra ELX', 'Fiat Punto Emotion', 'Force Motors Force',\n", " 'Force Motors One', 'Ford EcoSport', 'Ford EcoSport Ambiente',\n", " 'Ford EcoSport Titanium', 'Ford EcoSport Trend',\n", " 'Ford Endeavor 4x4', 'Ford Fiesta', 'Ford Fiesta SXi', 'Ford Figo',\n", " 'Ford Figo Diesel', 'Ford Figo Duratorq', 'Ford Figo Petrol',\n", " 'Ford Fusion 1.4', 'Ford Ikon 1.3', 'Ford Ikon 1.6',\n", " 'Hindustan Motors Ambassador', 'Honda Accord', 'Honda Amaze',\n", " 'Honda Amaze 1.2', 'Honda Amaze 1.5', 'Honda Brio', 'Honda Brio V',\n", " 'Honda Brio VX', 'Honda City', 'Honda City 1.5', 'Honda City SV',\n", " 'Honda City VX', 'Honda City ZX', 'Honda Jazz S', 'Honda Jazz VX',\n", " 'Honda Mobilio', 'Honda Mobilio S', 'Honda WR V', 'Hyundai Accent',\n", " 'Hyundai Accent Executive', 'Hyundai Accent GLE',\n", " 'Hyundai Accent GLX', 'Hyundai Creta', 'Hyundai Creta 1.6',\n", " 'Hyundai Elantra 1.8', 'Hyundai Elantra SX', 'Hyundai Elite 
i20',\n", " 'Hyundai Eon', 'Hyundai Eon D', 'Hyundai Eon Era',\n", " 'Hyundai Eon Magna', 'Hyundai Eon Sportz', 'Hyundai Fluidic Verna',\n", " 'Hyundai Getz', 'Hyundai Getz GLE', 'Hyundai Getz Prime',\n", " 'Hyundai Grand i10', 'Hyundai Santro', 'Hyundai Santro AE',\n", " 'Hyundai Santro Xing', 'Hyundai Sonata Transform', 'Hyundai Verna',\n", " 'Hyundai Verna 1.4', 'Hyundai Verna 1.6', 'Hyundai Verna Fluidic',\n", " 'Hyundai Verna Transform', 'Hyundai Verna VGT',\n", " 'Hyundai Xcent Base', 'Hyundai Xcent SX', 'Hyundai i10',\n", " 'Hyundai i10 Era', 'Hyundai i10 Magna', 'Hyundai i10 Sportz',\n", " 'Hyundai i20', 'Hyundai i20 Active', 'Hyundai i20 Asta',\n", " 'Hyundai i20 Magna', 'Hyundai i20 Select', 'Hyundai i20 Sportz',\n", " 'Jaguar XE XE', 'Jaguar XF 2.2', 'Jeep Wrangler Unlimited',\n", " 'Land Rover Freelander', 'Mahindra Bolero DI',\n", " 'Mahindra Bolero Power', 'Mahindra Bolero SLE',\n", " 'Mahindra Jeep CL550', 'Mahindra Jeep MM', 'Mahindra KUV100',\n", " 'Mahindra KUV100 K8', 'Mahindra Logan', 'Mahindra Logan Diesel',\n", " 'Mahindra Quanto C4', 'Mahindra Quanto C8', 'Mahindra Scorpio',\n", " 'Mahindra Scorpio 2.6', 'Mahindra Scorpio LX',\n", " 'Mahindra Scorpio S10', 'Mahindra Scorpio S4',\n", " 'Mahindra Scorpio SLE', 'Mahindra Scorpio SLX',\n", " 'Mahindra Scorpio VLX', 'Mahindra Scorpio Vlx',\n", " 'Mahindra Scorpio W', 'Mahindra TUV300 T4', 'Mahindra TUV300 T8',\n", " 'Mahindra Thar CRDe', 'Mahindra XUV500', 'Mahindra XUV500 W10',\n", " 'Mahindra XUV500 W6', 'Mahindra XUV500 W8', 'Mahindra Xylo D2',\n", " 'Mahindra Xylo E4', 'Mahindra Xylo E8', 'Maruti Suzuki 800',\n", " 'Maruti Suzuki A', 'Maruti Suzuki Alto', 'Maruti Suzuki Baleno',\n", " 'Maruti Suzuki Celerio', 'Maruti Suzuki Ciaz',\n", " 'Maruti Suzuki Dzire', 'Maruti Suzuki Eeco',\n", " 'Maruti Suzuki Ertiga', 'Maruti Suzuki Esteem',\n", " 'Maruti Suzuki Estilo', 'Maruti Suzuki Maruti',\n", " 'Maruti Suzuki Omni', 'Maruti Suzuki Ritz', 'Maruti Suzuki S',\n", " 'Maruti Suzuki SX4', 'Maruti 
Suzuki Stingray',\n", " 'Maruti Suzuki Swift', 'Maruti Suzuki Versa',\n", " 'Maruti Suzuki Vitara', 'Maruti Suzuki Wagon', 'Maruti Suzuki Zen',\n", " 'Mercedes Benz A', 'Mercedes Benz B', 'Mercedes Benz C',\n", " 'Mercedes Benz GLA', 'Mini Cooper S', 'Mitsubishi Lancer 1.8',\n", " 'Mitsubishi Pajero Sport', 'Nissan Micra XL', 'Nissan Micra XV',\n", " 'Nissan Sunny', 'Nissan Sunny XL', 'Nissan Terrano XL',\n", " 'Nissan X Trail', 'Renault Duster', 'Renault Duster 110',\n", " 'Renault Duster 110PS', 'Renault Duster 85', 'Renault Duster 85PS',\n", " 'Renault Duster RxL', 'Renault Kwid', 'Renault Kwid 1.0',\n", " 'Renault Kwid RXT', 'Renault Lodgy 85', 'Renault Scala RxL',\n", " 'Skoda Fabia', 'Skoda Fabia 1.2L', 'Skoda Fabia Classic',\n", " 'Skoda Laura', 'Skoda Octavia Classic', 'Skoda Rapid Elegance',\n", " 'Skoda Superb 1.8', 'Skoda Yeti Ambition', 'Tata Aria Pleasure',\n", " 'Tata Bolt XM', 'Tata Indica', 'Tata Indica V2', 'Tata Indica eV2',\n", " 'Tata Indigo CS', 'Tata Indigo LS', 'Tata Indigo LX',\n", " 'Tata Indigo Marina', 'Tata Indigo eCS', 'Tata Manza',\n", " 'Tata Manza Aqua', 'Tata Manza Aura', 'Tata Manza ELAN',\n", " 'Tata Nano', 'Tata Nano Cx', 'Tata Nano GenX', 'Tata Nano LX',\n", " 'Tata Nano Lx', 'Tata Sumo Gold', 'Tata Sumo Grande',\n", " 'Tata Sumo Victa', 'Tata Tiago Revotorq', 'Tata Tiago Revotron',\n", " 'Tata Tigor Revotron', 'Tata Venture EX', 'Tata Vista Quadrajet',\n", " 'Tata Zest Quadrajet', 'Tata Zest XE', 'Tata Zest XM',\n", " 'Toyota Corolla', 'Toyota Corolla Altis', 'Toyota Corolla H2',\n", " 'Toyota Etios', 'Toyota Etios G', 'Toyota Etios GD',\n", " 'Toyota Etios Liva', 'Toyota Fortuner', 'Toyota Fortuner 3.0',\n", " 'Toyota Innova 2.0', 'Toyota Innova 2.5', 'Toyota Qualis',\n", " 'Volkswagen Jetta Comfortline', 'Volkswagen Jetta Highline',\n", " 'Volkswagen Passat Diesel', 'Volkswagen Polo',\n", " 'Volkswagen Polo Comfortline', 'Volkswagen Polo Highline',\n", " 'Volkswagen Polo Highline1.2L', 'Volkswagen Polo Trendline',\n", " 
'Volkswagen Vento Comfortline', 'Volkswagen Vento Highline',\n", " 'Volkswagen Vento Konekt', 'Volvo S80 Summum'], dtype=object),\n", " array(['Audi', 'BMW', 'Chevrolet', 'Datsun', 'Fiat', 'Force', 'Ford',\n", " 'Hindustan', 'Honda', 'Hyundai', 'Jaguar', 'Jeep', 'Land',\n", " 'Mahindra', 'Maruti', 'Mercedes', 'Mini', 'Mitsubishi', 'Nissan',\n", " 'Renault', 'Skoda', 'Tata', 'Toyota', 'Volkswagen', 'Volvo'],\n", " dtype=object),\n", " array(['Diesel', 'LPG', 'Petrol'], dtype=object)]" ] }, "execution_count": 35, "metadata": {}, "output_type": "execute_result" } ], "source": [ "ohe.categories_" ] }, { "cell_type": "code", "execution_count": 36, "id": "fa7df93b-6d7f-4524-aa5a-23e4d1cec0af", "metadata": {}, "outputs": [], "source": [ "# SimpleImputer removes nan values. But, there are no nan values.\n", "column_trans=make_column_transformer((OneHotEncoder(categories=ohe.categories_),['name','company','fuel_type']),remainder='passthrough')" ] }, { "cell_type": "code", "execution_count": 37, "id": "6d555173-9ee9-4e64-b1fd-bb17709b0b7a", "metadata": {}, "outputs": [], "source": [ "lr=LinearRegression()" ] }, { "cell_type": "code", "execution_count": 38, "id": "65bff1f9-a80b-492e-82f7-5ac9e70ca5c4", "metadata": {}, "outputs": [], "source": [ "pipe=make_pipeline(column_trans,lr) #" ] }, { "cell_type": "code", "execution_count": 39, "id": "a6b6a1d1-faa2-4713-b143-f60910820785", "metadata": {}, "outputs": [ { "data": { "text/html": [ "
Pipeline(steps=[('columntransformer',\n",
       "                 ColumnTransformer(remainder='passthrough',\n",
       "                                   transformers=[('onehotencoder',\n",
       "                                                  OneHotEncoder(categories=[array(['Audi A3 Cabriolet', 'Audi A4 1.8', 'Audi A4 2.0', 'Audi A6 2.0',\n",
       "       'Audi A8', 'Audi Q3 2.0', 'Audi Q5 2.0', 'Audi Q7', 'BMW 3 Series',\n",
       "       'BMW 5 Series', 'BMW 7 Series', 'BMW X1', 'BMW X1 sDrive20d',\n",
       "       'BMW X1 xDrive20d', 'Chevrolet Beat', 'Chevrolet Beat...\n",
       "                                                                            array(['Audi', 'BMW', 'Chevrolet', 'Datsun', 'Fiat', 'Force', 'Ford',\n",
       "       'Hindustan', 'Honda', 'Hyundai', 'Jaguar', 'Jeep', 'Land',\n",
       "       'Mahindra', 'Maruti', 'Mercedes', 'Mini', 'Mitsubishi', 'Nissan',\n",
       "       'Renault', 'Skoda', 'Tata', 'Toyota', 'Volkswagen', 'Volvo'],\n",
       "      dtype=object),\n",
       "                                                                            array(['Diesel', 'LPG', 'Petrol'], dtype=object)]),\n",
       "                                                  ['name', 'company',\n",
       "                                                   'fuel_type'])])),\n",
       "                ('linearregression', LinearRegression())])
In a Jupyter environment, please rerun this cell to show the HTML representation or trust the notebook.
On GitHub, the HTML representation is unable to render, please try loading this page with nbviewer.org.
" ], "text/plain": [ "Pipeline(steps=[('columntransformer',\n", " ColumnTransformer(remainder='passthrough',\n", " transformers=[('onehotencoder',\n", " OneHotEncoder(categories=[array(['Audi A3 Cabriolet', 'Audi A4 1.8', 'Audi A4 2.0', 'Audi A6 2.0',\n", " 'Audi A8', 'Audi Q3 2.0', 'Audi Q5 2.0', 'Audi Q7', 'BMW 3 Series',\n", " 'BMW 5 Series', 'BMW 7 Series', 'BMW X1', 'BMW X1 sDrive20d',\n", " 'BMW X1 xDrive20d', 'Chevrolet Beat', 'Chevrolet Beat...\n", " array(['Audi', 'BMW', 'Chevrolet', 'Datsun', 'Fiat', 'Force', 'Ford',\n", " 'Hindustan', 'Honda', 'Hyundai', 'Jaguar', 'Jeep', 'Land',\n", " 'Mahindra', 'Maruti', 'Mercedes', 'Mini', 'Mitsubishi', 'Nissan',\n", " 'Renault', 'Skoda', 'Tata', 'Toyota', 'Volkswagen', 'Volvo'],\n", " dtype=object),\n", " array(['Diesel', 'LPG', 'Petrol'], dtype=object)]),\n", " ['name', 'company',\n", " 'fuel_type'])])),\n", " ('linearregression', LinearRegression())])" ] }, "execution_count": 39, "metadata": {}, "output_type": "execute_result" } ], "source": [ "pipe.fit(X_train,y_train)" ] }, { "cell_type": "code", "execution_count": 40, "id": "33efbdff-b161-48c9-b61b-db0371e4fb96", "metadata": {}, "outputs": [], "source": [ "y_pred=pipe.predict(X_test)" ] }, { "cell_type": "code", "execution_count": 41, "id": "d73f8459-6343-4cce-bd59-2393eb9db8ce", "metadata": {}, "outputs": [ { "data": { "text/plain": [ "array([ 437483.17106583, 433422.85604516, 445431.29966525,\n", " 546803.77651766, 243783.16921484, 526613.18702689,\n", " 647953.1457932 , 230576.07304794, 317149.18590167,\n", " 490649.38797615, 479535.7193726 , 328607.98385943,\n", " 411720.64410387, 48563.37056129, 260370.3146277 ,\n", " 162046.01695599, 446516.63639759, 578373.91851465,\n", " 483409.8529231 , 380971.21042756, 435947.22098751,\n", " 302193.29084413, 322466.18897489, 665816.3124464 ,\n", " 567189.34019008, 229948.22004309, 547811.22435239,\n", " 404330.83861122, -21586.84055102, 270975.25911233,\n", " 102634.03610943, 237364.22739295, -159391.81424545,\n", " 
616206.03733011, 199705.12217447, 322721.20220497,\n", " 99044.1423015 , 420783.68180992, 421784.61815254,\n", " -148552.40329967, 424803.5809817 , 577388.24913502,\n", " 253191.75121272, 623202.60164183, 276582.13617052,\n", " 184030.55628867, 227117.37279161, 265096.43514005,\n", " 217793.69513094, 307517.63523864, 480112.68225301,\n", " 261119.18083314, 278561.9603409 , 693321.06213455,\n", " 499593.55614746, 581489.53691532, 382488.62267945,\n", " 1416999.58901817, 547192.77908992, 363673.49972148,\n", " 50319.89510283, 418290.30378696, 420891.2638486 ,\n", " 299652.96458083, 393800.93044288, 351402.01381317,\n", " 38554.07573153, 454728.83006706, 420539.99150132,\n", " 576320.77660997, 266918.1221726 , 341285.81289955,\n", " 86967.84198052, 220814.1518578 , 313400.13671596,\n", " 385774.82548904, 413268.92488509, -200095.21920821,\n", " -99875.79927235, 43976.6225077 , 307813.07810994,\n", " 400021.59746041, -79975.78336611, 53832.61857565,\n", " 302193.29084413, 443438.26678829, 310018.56627681,\n", " 68544.71569878, 199235.37219493, 604881.21655153,\n", " 182523.79617567, 329704.2465662 , 159713.52317488,\n", " 124297.40627 , 570391.59567919, 398139.21996466,\n", " 624412.60168596, 79531.24391118, 454425.70317206,\n", " 626741.42777619, 588005.09419163, 455207.98223708,\n", " 383735.30598595, 195704.21129712, 451637.67120919,\n", " 721619.39247876, 229100.9711124 , 698770.91549752,\n", " 362706.0054514 , 451356.78660558, 258037.80370089,\n", " 222652.39167847, 557806.48453031, 776416.77102363,\n", " -61157.2925593 , 268755.04577304, 256837.97895057,\n", " 288569.13733117, 327300.43698683, 313033.26748906,\n", " 451356.78660558, 217167.22741045, 601310.86492204,\n", " 472146.42292207, 98655.15841171, 2073506.97540331,\n", " 547192.77908992, 194727.20007504, 521156.34510817,\n", " 546113.35016768, 194940.09240673, 480251.84046125,\n", " 148999.93080177, 512432.7220112 , 178718.59204444,\n", " 448799.68524299, 330359.96459238, 550868.49401304,\n", " 
419680.17786598, 349805.32132552, 2073506.97540331,\n",
       " 301613.95213237, 19809.94388594, 364140.46017395,\n",
       " 105430.9122521 , 213663.93590553, 253901.39231834,\n",
       " 114479.70778652, 287688.22640482, 1115373.62574654,\n",
       " 218709.98818254, 520274.35749836, 2073506.97540331,\n",
       " 451356.78660558, 325549.96197601, 199568.57527158,\n",
       " 272892.28037125, 248390.82843892, 668083.89310887,\n",
       " 513660.23141772, 1143907.15847366, 290496.03587839,\n",
       " 298049.05987287])"
      ]
     },
     "execution_count": 41,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "y_pred"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 42,
   "id": "fa394194-da85-42ae-9981-46ea62f49bee",
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "0.6218079421120855"
      ]
     },
     "execution_count": 42,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "# R^2 of y_pred against the held-out targets of the current split.\n",
    "r2_score(y_test,y_pred)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 43,
   "id": "3c949bfc-915d-490d-ac90-be9dd7b4c3fb",
   "metadata": {},
   "outputs": [],
   "source": [
    "# Refit the same pipeline on 1000 train/test splits (random_state 0..999)\n",
    "# and record the test-set R^2 of each one, in seed order.\n",
    "scores=[]\n",
    "for seed in range(1000):\n",
    "    X_train,X_test,y_train,y_test=train_test_split(X,y,test_size=0.2,random_state=seed)\n",
    "    lr=LinearRegression()\n",
    "    pipe=make_pipeline(column_trans,lr).fit(X_train,y_train)\n",
    "    y_pred=pipe.predict(X_test)\n",
    "    scores.append(r2_score(y_test,y_pred))"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 44,
   "id": "8375ee43-a1d9-4396-86c7-703e077caaf6",
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "433"
      ]
     },
     "execution_count": 44,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "# Position of the highest score; scores were appended in seed order,\n",
    "# so this index is also the random_state that produced it.\n",
    "np.argmax(scores)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 45,
   "id": "033d0eac-3439-4bb5-9865-76f755c8e536",
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "0.8457059012561223"
      ]
     },
     "execution_count": 45,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "# The highest test-set R^2 found by the seed search.\n",
    "scores[np.argmax(scores)]"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 46,
   "id": "c33941c1-a97a-4cce-93bc-57d0716fe0fc",
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "0.8457059012561223"
      ]
     },
     "execution_count": 46,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "# Rebuild the split and the model for the best-scoring seed in `scores`.\n",
    "# NOTE(review): that seed was picked by its test-set R^2, so the value shown\n",
    "# here is an optimistic estimate of performance - confirm on unseen data.\n",
    "best_seed=int(np.argmax(scores))\n",
    "X_train,X_test,y_train,y_test=train_test_split(X,y,test_size=0.2,random_state=best_seed)\n",
    "lr=LinearRegression()\n",
    "pipe=make_pipeline(column_trans,lr)\n",
    "pipe.fit(X_train,y_train)\n",
    "y_pred=pipe.predict(X_test)\n",
    "r2_score(y_test,y_pred)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 47,
   "id": "2466d013-7217-4ca9-b6f1-9d678a33bce2",
   "metadata": {},
   "outputs": [],
   "source": [
    "import pickle\n"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 48,
   "id": "ea9e302f-910f-4a1a-9a7d-487c02fed87a",
   "metadata": {},
   "outputs": [],
   "source": [
    "# Persist the fitted pipeline; the with-block guarantees the file is\n",
    "# flushed and closed even if pickling raises.\n",
    "with open('LinearRegressionModel.pkl','wb') as model_file:\n",
    "    pickle.dump(pipe,model_file)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 49,
   "id": "c3a59047-b9ee-4f74-bf85-6980c333d2a9",
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "array([458894.10960853])"
      ]
     },
     "execution_count": 49,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "# Smoke test: run the fitted pipeline on a single hand-built row.\n",
    "pipe.predict(pd.DataFrame([['Maruti Suzuki Swift','Maruti',2019,100,'Petrol']],columns=['name','company','year','kms_driven','fuel_type']))"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "10c3b9b8-cf2a-46b2-94be-e9bfb49952b3",
   "metadata": {},
   "outputs": [],
   "source": []
  }
 ],
 "metadata": {
  "kernelspec": {
   "display_name": "Python 3 (ipykernel)",
   "language": "python",
   "name": "python3"
  },
  "language_info": {
   "codemirror_mode": {
    "name": "ipython",
    "version": 3
   },
   "file_extension": ".py",
   "mimetype": "text/x-python",
   "name": "python",
   "nbconvert_exporter": "python",
   "pygments_lexer": "ipython3",
   "version": "3.11.5"
  }
 },
 "nbformat": 4,
 "nbformat_minor": 5
}