{ "nbformat": 4, "nbformat_minor": 0, "metadata": { "colab": { "name": "Salary_ML_Project.ipynb", "provenance": [], "collapsed_sections": [] }, "kernelspec": { "display_name": "Python 3", "name": "python3" }, "language_info": { "name": "python" } }, "cells": [ { "cell_type": "markdown", "metadata": { "id": "LXy6hmTOhed1" }, "source": [ "### Setting up Colab" ] }, { "cell_type": "code", "metadata": { "colab": { "base_uri": "https://localhost:8080/" }, "id": "PiiiSef_6tle", "outputId": "7fedf5f1-1b59-441c-d6ff-a32fd9987468" }, "source": [ "from google.colab import drive\n", "\n", "drive.mount('/content/drive', force_remount = True)" ], "execution_count": 132, "outputs": [ { "output_type": "stream", "name": "stdout", "text": [ "Mounted at /content/drive\n" ] } ] }, { "cell_type": "markdown", "metadata": { "id": "NIraf5LmHxm-" }, "source": [ "### Read Dataset" ] }, { "cell_type": "code", "metadata": { "colab": { "base_uri": "https://localhost:8080/", "height": 307 }, "id": "6YndzY3swBQj", "outputId": "a342b5b8-cc12-4979-ec15-4a09000d3151" }, "source": [ "import pandas as pd\n", "df = pd.read_csv('/content/drive/MyDrive/ML Salary Project /Data/project-final.csv')\n", "df.head()" ], "execution_count": 133, "outputs": [ { "output_type": "execute_result", "data": { "text/html": [ "
\n", " | SalaryUSD | \n", "Country | \n", "PrimaryDatabase | \n", "YearsWithThisDatabase | \n", "EmploymentStatus | \n", "JobTitle | \n", "ManageStaff | \n", "YearsWithThisTypeOfJob | \n", "HowManyCompanies | \n", "OtherPeopleOnYourTeam | \n", "EmploymentSector | \n", "CareerPlansThisYear | \n", "Gender | \n", "DatabaseServers | \n", "Education | \n", "Certifications | \n", "HoursWorkedPerWeek | \n", "TelecommuteDaysPerWeek | \n", "
---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
0 | \n", "Low | \n", "Sweden | \n", "M | \n", "4 | \n", "E | \n", "D | \n", "Y | \n", "4 | \n", "1.0 | \n", "0 | \n", "PB | \n", "S | \n", "M | \n", "373.411662 | \n", "'Bachelors (4 years)' | \n", "N | \n", "43.16509 | \n", "zero | \n", "
1 | \n", "High | \n", "USA | \n", "M | \n", "15 | \n", "E | \n", "DBAP | \n", "N | \n", "25 | \n", "5.0 | \n", "0 | \n", "PB | \n", "S | \n", "M | \n", "373.411662 | \n", "'Bachelors (4 years)' | \n", "N | \n", "43.16509 | \n", "zero | \n", "
2 | \n", "High-Mid | \n", "USA | \n", "M | \n", "12 | \n", "E | \n", "DBAG | \n", "Y | \n", "6 | \n", "4.0 | \n", "1 | \n", "PB | \n", "S | \n", "M | \n", "373.411662 | \n", "'Bachelors (4 years)' | \n", "N | \n", "43.16509 | \n", "zero | \n", "
3 | \n", "Low | \n", "UK | \n", "M | \n", "10 | \n", "E | \n", "DBAP | \n", "N | \n", "5 | \n", "2.0 | \n", "0 | \n", "E | \n", "S | \n", "M | \n", "373.411662 | \n", "'Bachelors (4 years)' | \n", "N | \n", "43.16509 | \n", "zero | \n", "
4 | \n", "High-Mid | \n", "USA | \n", "M | \n", "5 | \n", "E | \n", "D | \n", "N | \n", "5 | \n", "1.0 | \n", "0 | \n", "PB | \n", "S | \n", "M | \n", "373.411662 | \n", "'Bachelors (4 years)' | \n", "N | \n", "43.16509 | \n", "zero | \n", "
\n", " | 0 | \n", "1 | \n", "2 | \n", "3 | \n", "
---|---|---|---|---|
0 | \n", "-4.138638 | \n", "-4.141160 | \n", "-1.060148 | \n", "-0.344151 | \n", "
1 | \n", "-12.162499 | \n", "1.815431 | \n", "-0.994463 | \n", "-0.261570 | \n", "
2 | \n", "-12.157918 | \n", "0.826832 | \n", "-1.003102 | \n", "-0.267811 | \n", "
3 | \n", "-11.176152 | \n", "1.820139 | \n", "-1.147436 | \n", "0.215920 | \n", "
4 | \n", "-12.138983 | \n", "-4.182848 | \n", "-1.095431 | \n", "-0.348160 | \n", "
... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "
10334 | \n", "-11.146052 | \n", "-2.188204 | \n", "-0.909104 | \n", "-0.143865 | \n", "
10335 | \n", "3.841024 | \n", "-2.151027 | \n", "1.931727 | \n", "-0.344638 | \n", "
10336 | \n", "17.828090 | \n", "0.889711 | \n", "2.020452 | \n", "-0.317144 | \n", "
10337 | \n", "-12.161796 | \n", "-2.293752 | \n", "4.563015 | \n", "0.136997 | \n", "
10338 | \n", "8.880702 | \n", "-8.122048 | \n", "-0.633003 | \n", "-0.221737 | \n", "
10339 rows × 4 columns
\n", "