diff --git a/Capstone_Final (1).ipynb b/Capstone_Final (1).ipynb new file mode 100644 index 0000000..b0afdd1 --- /dev/null +++ b/Capstone_Final (1).ipynb @@ -0,0 +1,6166 @@ +{ + "cells": [ + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "## Import Libraries" + ] + }, + { + "cell_type": "code", + "execution_count": 224, + "metadata": {}, + "outputs": [], + "source": [ + "import numpy as np # linear algebra\n", + "import pandas as pd # data processing, CSV file\n", + "import matplotlib.pyplot as plt\n", + "import seaborn as sns\n", + "from sklearn.linear_model import LinearRegression\n", + "from sklearn import svm\n", + "from sklearn.ensemble import RandomForestRegressor\n", + "from sklearn import linear_model\n", + "from sklearn.preprocessing import PolynomialFeatures \n", + "from sklearn.linear_model import LinearRegression\n", + "from sklearn.metrics import mean_squared_error\n", + "from sklearn.metrics import mean_absolute_error\n", + "from math import sqrt\n", + "from sklearn.preprocessing import StandardScaler" + ] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "## Read data file as dataframe" + ] + }, + { + "cell_type": "code", + "execution_count": 225, + "metadata": {}, + "outputs": [ + { + "data": { + "text/html": [ + "
\n", + " | Unnamed: 0 | \n", + "ID | \n", + "Salary | \n", + "DOJ | \n", + "DOL | \n", + "Designation | \n", + "JobCity | \n", + "Gender | \n", + "DOB | \n", + "10percentage | \n", + "... | \n", + "ComputerScience | \n", + "MechanicalEngg | \n", + "ElectricalEngg | \n", + "TelecomEngg | \n", + "CivilEngg | \n", + "conscientiousness | \n", + "agreeableness | \n", + "extraversion | \n", + "nueroticism | \n", + "openess_to_experience | \n", + "
---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
0 | \n", + "train | \n", + "203097 | \n", + "420000.0 | \n", + "01-06-2012 00:00 | \n", + "present | \n", + "senior quality engineer | \n", + "Bangalore | \n", + "f | \n", + "19-02-1990 00:00 | \n", + "84.3 | \n", + "... | \n", + "-1 | \n", + "-1 | \n", + "-1 | \n", + "-1 | \n", + "-1 | \n", + "0.9737 | \n", + "0.8128 | \n", + "0.5269 | \n", + "1.35490 | \n", + "-0.4455 | \n", + "
1 | \n", + "train | \n", + "579905 | \n", + "500000.0 | \n", + "01-09-2013 00:00 | \n", + "present | \n", + "assistant manager | \n", + "Indore | \n", + "m | \n", + "04-10-1989 00:00 | \n", + "85.4 | \n", + "... | \n", + "-1 | \n", + "-1 | \n", + "-1 | \n", + "-1 | \n", + "-1 | \n", + "-0.7335 | \n", + "0.3789 | \n", + "1.2396 | \n", + "-0.10760 | \n", + "0.8637 | \n", + "
2 | \n", + "train | \n", + "810601 | \n", + "325000.0 | \n", + "01-06-2014 00:00 | \n", + "present | \n", + "systems engineer | \n", + "Chennai | \n", + "f | \n", + "03-08-1992 00:00 | \n", + "85.0 | \n", + "... | \n", + "-1 | \n", + "-1 | \n", + "-1 | \n", + "-1 | \n", + "-1 | \n", + "0.2718 | \n", + "1.7109 | \n", + "0.1637 | \n", + "-0.86820 | \n", + "0.6721 | \n", + "
3 | \n", + "train | \n", + "267447 | \n", + "1100000.0 | \n", + "01-07-2011 00:00 | \n", + "present | \n", + "senior software engineer | \n", + "Gurgaon | \n", + "m | \n", + "05-12-1989 00:00 | \n", + "85.6 | \n", + "... | \n", + "-1 | \n", + "-1 | \n", + "-1 | \n", + "-1 | \n", + "-1 | \n", + "0.0464 | \n", + "0.3448 | \n", + "-0.3440 | \n", + "-0.40780 | \n", + "-0.9194 | \n", + "
4 | \n", + "train | \n", + "343523 | \n", + "200000.0 | \n", + "01-03-2014 00:00 | \n", + "01-03-2015 00:00 | \n", + "get | \n", + "Manesar | \n", + "m | \n", + "27-02-1991 00:00 | \n", + "78.0 | \n", + "... | \n", + "-1 | \n", + "-1 | \n", + "-1 | \n", + "-1 | \n", + "-1 | \n", + "-0.8810 | \n", + "-0.2793 | \n", + "-1.0697 | \n", + "0.09163 | \n", + "-0.1295 | \n", + "
5 rows × 39 columns
\n", + "\n", + " | ID | \n", + "Salary | \n", + "JobCity | \n", + "Gender | \n", + "10percentage | \n", + "12graduation | \n", + "12percentage | \n", + "12board | \n", + "CollegeTier | \n", + "Degree | \n", + "... | \n", + "CollegeCityTier | \n", + "GraduationYear | \n", + "Domain | \n", + "Age | \n", + "Experience | \n", + "Cognitive Test Scores | \n", + "10 Board | \n", + "12 Board | \n", + "Personality Trait Score | \n", + "Designations | \n", + "
---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
0 | \n", + "203097 | \n", + "420000.0 | \n", + "Bangalore | \n", + "f | \n", + "84.3 | \n", + "2007 | \n", + "95.8 | \n", + "board of intermediate education,ap | \n", + "2 | \n", + "B.Tech/B.E. | \n", + "... | \n", + "0 | \n", + "2011 | \n", + "0.635979 | \n", + "25 | \n", + "3 | \n", + "63.591794 | \n", + "State Board | \n", + "State Board | \n", + "0.644560 | \n", + "others | \n", + "
1 | \n", + "579905 | \n", + "500000.0 | \n", + "Indore | \n", + "m | \n", + "85.4 | \n", + "2007 | \n", + "85.0 | \n", + "cbse | \n", + "2 | \n", + "B.Tech/B.E. | \n", + "... | \n", + "0 | \n", + "2012 | \n", + "0.960603 | \n", + "26 | \n", + "2 | \n", + "80.941599 | \n", + "CBSE | \n", + "CBSE | \n", + "0.328220 | \n", + "manager | \n", + "
2 | \n", + "810601 | \n", + "325000.0 | \n", + "Chennai | \n", + "f | \n", + "85.0 | \n", + "2010 | \n", + "68.2 | \n", + "cbse | \n", + "2 | \n", + "B.Tech/B.E. | \n", + "... | \n", + "0 | \n", + "2014 | \n", + "0.450877 | \n", + "23 | \n", + "1 | \n", + "59.983428 | \n", + "CBSE | \n", + "CBSE | \n", + "0.390060 | \n", + "engineer | \n", + "
3 | \n", + "267447 | \n", + "1100000.0 | \n", + "Gurgaon | \n", + "m | \n", + "85.6 | \n", + "2007 | \n", + "83.6 | \n", + "cbse | \n", + "1 | \n", + "B.Tech/B.E. | \n", + "... | \n", + "1 | \n", + "2011 | \n", + "0.974396 | \n", + "26 | \n", + "4 | \n", + "71.866926 | \n", + "CBSE | \n", + "CBSE | \n", + "-0.256000 | \n", + "others | \n", + "
4 | \n", + "343523 | \n", + "200000.0 | \n", + "Manesar | \n", + "m | \n", + "78.0 | \n", + "2008 | \n", + "76.8 | \n", + "cbse | \n", + "2 | \n", + "B.Tech/B.E. | \n", + "... | \n", + "0 | \n", + "2012 | \n", + "0.124502 | \n", + "24 | \n", + "1 | \n", + "64.189578 | \n", + "CBSE | \n", + "CBSE | \n", + "-0.453574 | \n", + "others | \n", + "
5 rows × 23 columns
\n", + "