From 35de4681aa98335afba38ad1f5d2f7f24ecfa645 Mon Sep 17 00:00:00 2001 From: AtharvInamdar <90698481+AtharvInamdar@users.noreply.github.com> Date: Thu, 24 Feb 2022 22:22:39 +0530 Subject: [PATCH 1/2] Add files via upload --- setdataset.ipynb | 2116 ++++++++++++++++++++++++++++++++++++++++++++++ 1 file changed, 2116 insertions(+) create mode 100644 setdataset.ipynb diff --git a/setdataset.ipynb b/setdataset.ipynb new file mode 100644 index 0000000..db0a3e9 --- /dev/null +++ b/setdataset.ipynb @@ -0,0 +1,2116 @@ +{ + "nbformat": 4, + "nbformat_minor": 0, + "metadata": { + "colab": { + "name": "setdataset.ipynb", + "provenance": [], + "collapsed_sections": [] + }, + "kernelspec": { + "name": "python3", + "display_name": "Python 3" + }, + "language_info": { + "name": "python" + } + }, + "cells": [ + { + "cell_type": "code", + "execution_count": 1, + "metadata": { + "id": "cXAaaqUMtXeK" + }, + "outputs": [], + "source": [ + "# Importing the libraries\n", + "import pandas as pd\n", + "import numpy as np\n", + "from sklearn.model_selection import train_test_split\n", + "from sklearn.linear_model import LinearRegression\n", + "from sklearn.metrics import mean_squared_error" + ] + }, + { + "cell_type": "code", + "source": [ + "# Importing the dataset\n", + "df=pd.read_csv('day.csv')" + ], + "metadata": { + "id": "ShNt4BLht4Wb" + }, + "execution_count": 2, + "outputs": [] + }, + { + "cell_type": "code", + "source": [ + "df\n" + ], + "metadata": { + "colab": { + "base_uri": "https://localhost:8080/", + "height": 424 + }, + "id": "dFiagtGFt-5o", + "outputId": "8f76f919-b13e-45ce-9165-d3c56af1cee8" + }, + "execution_count": 3, + "outputs": [ + { + "output_type": "execute_result", + "data": { + "text/html": [ + "\n", + "
\n", + "
\n", + "
\n", + "\n", + "\n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " 
\n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + "
instantdtedayseasonyrmnthholidayweekdayworkingdayweathersittempatemphumwindspeedcasualregisteredcnt
012011-01-0110106020.3441670.3636250.8058330.160446331654985
122011-01-0210100020.3634780.3537390.6960870.248539131670801
232011-01-0310101110.1963640.1894050.4372730.24830912012291349
342011-01-0410102110.2000000.2121220.5904350.16029610814541562
452011-01-0510103110.2269570.2292700.4369570.1869008215181600
...................................................
7267272012-12-27111204120.2541670.2266420.6529170.35013324718672114
7277282012-12-28111205120.2533330.2550460.5900000.15547164424513095
7287292012-12-29111206020.2533330.2424000.7529170.12438315911821341
7297302012-12-30111200010.2558330.2317000.4833330.35075436414321796
7307312012-12-31111201120.2158330.2234870.5775000.15484643922902729
\n", + "

731 rows × 16 columns

\n", + "
\n", + " \n", + " \n", + " \n", + "\n", + " \n", + "
\n", + "
\n", + " " + ], + "text/plain": [ + " instant dteday season yr ... windspeed casual registered cnt\n", + "0 1 2011-01-01 1 0 ... 0.160446 331 654 985\n", + "1 2 2011-01-02 1 0 ... 0.248539 131 670 801\n", + "2 3 2011-01-03 1 0 ... 0.248309 120 1229 1349\n", + "3 4 2011-01-04 1 0 ... 0.160296 108 1454 1562\n", + "4 5 2011-01-05 1 0 ... 0.186900 82 1518 1600\n", + ".. ... ... ... .. ... ... ... ... ...\n", + "726 727 2012-12-27 1 1 ... 0.350133 247 1867 2114\n", + "727 728 2012-12-28 1 1 ... 0.155471 644 2451 3095\n", + "728 729 2012-12-29 1 1 ... 0.124383 159 1182 1341\n", + "729 730 2012-12-30 1 1 ... 0.350754 364 1432 1796\n", + "730 731 2012-12-31 1 1 ... 0.154846 439 2290 2729\n", + "\n", + "[731 rows x 16 columns]" + ] + }, + "metadata": {}, + "execution_count": 3 + } + ] + }, + { + "cell_type": "code", + "source": [ + "# Shape of dataset\n", + "df.shape" + ], + "metadata": { + "colab": { + "base_uri": "https://localhost:8080/" + }, + "id": "1Qtm2RU9uFs2", + "outputId": "ee3904b0-0b3c-47c0-f147-53dfdbfbeefd" + }, + "execution_count": 4, + "outputs": [ + { + "output_type": "execute_result", + "data": { + "text/plain": [ + "(731, 16)" + ] + }, + "metadata": {}, + "execution_count": 4 + } + ] + }, + { + "cell_type": "code", + "source": [ + "# Using isna() function to check NaN values in dataframe\n", + "df.isna()" + ], + "metadata": { + "colab": { + "base_uri": "https://localhost:8080/", + "height": 424 + }, + "id": "KqguTf_ZukyV", + "outputId": "8a39a3c6-cb92-4e43-d03b-3a0f0070ed3c" + }, + "execution_count": 5, + "outputs": [ + { + "output_type": "execute_result", + "data": { + "text/html": [ + "\n", + "
\n", + "
\n", + "
\n", + "\n", + "\n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " 
\n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + "
instantdtedayseasonyrmnthholidayweekdayworkingdayweathersittempatemphumwindspeedcasualregisteredcnt
0FalseFalseFalseFalseFalseFalseFalseFalseFalseFalseFalseFalseFalseFalseFalseFalse
1FalseFalseFalseFalseFalseFalseFalseFalseFalseFalseFalseFalseFalseFalseFalseFalse
2FalseFalseFalseFalseFalseFalseFalseFalseFalseFalseFalseFalseFalseFalseFalseFalse
3FalseFalseFalseFalseFalseFalseFalseFalseFalseFalseFalseFalseFalseFalseFalseFalse
4FalseFalseFalseFalseFalseFalseFalseFalseFalseFalseFalseFalseFalseFalseFalseFalse
...................................................
726FalseFalseFalseFalseFalseFalseFalseFalseFalseFalseFalseFalseFalseFalseFalseFalse
727FalseFalseFalseFalseFalseFalseFalseFalseFalseFalseFalseFalseFalseFalseFalseFalse
728FalseFalseFalseFalseFalseFalseFalseFalseFalseFalseFalseFalseFalseFalseFalseFalse
729FalseFalseFalseFalseFalseFalseFalseFalseFalseFalseFalseFalseFalseFalseFalseFalse
730FalseFalseFalseFalseFalseFalseFalseFalseFalseFalseFalseFalseFalseFalseFalseFalse
\n", + "

731 rows × 16 columns

\n", + "
\n", + " \n", + " \n", + " \n", + "\n", + " \n", + "
\n", + "
\n", + " " + ], + "text/plain": [ + " instant dteday season yr ... windspeed casual registered cnt\n", + "0 False False False False ... False False False False\n", + "1 False False False False ... False False False False\n", + "2 False False False False ... False False False False\n", + "3 False False False False ... False False False False\n", + "4 False False False False ... False False False False\n", + ".. ... ... ... ... ... ... ... ... ...\n", + "726 False False False False ... False False False False\n", + "727 False False False False ... False False False False\n", + "728 False False False False ... False False False False\n", + "729 False False False False ... False False False False\n", + "730 False False False False ... False False False False\n", + "\n", + "[731 rows x 16 columns]" + ] + }, + "metadata": {}, + "execution_count": 5 + } + ] + }, + { + "cell_type": "code", + "source": [ + "# Drop columns which are not necessary\n", + "df=df.drop(['dteday', 'casual', 'registered'],axis=1)" + ], + "metadata": { + "id": "zHn1NMA4uqee" + }, + "execution_count": 7, + "outputs": [] + }, + { + "cell_type": "code", + "source": [ + "df=df.drop(['instant'],axis=1)" + ], + "metadata": { + "id": "6DC65BtvwHhw" + }, + "execution_count": 8, + "outputs": [] + }, + { + "cell_type": "code", + "source": [ + "df" + ], + "metadata": { + "colab": { + "base_uri": "https://localhost:8080/", + "height": 424 + }, + "id": "LcDh5wIGwNlc", + "outputId": "333cd0fc-e686-4714-8c96-d3169ba01c0c" + }, + "execution_count": 9, + "outputs": [ + { + "output_type": "execute_result", + "data": { + "text/html": [ + "\n", + "
\n", + "
\n", + "
\n", + "\n", + "\n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + "
seasonyrmnthholidayweekdayworkingdayweathersittempatemphumwindspeedcnt
010106020.3441670.3636250.8058330.160446985
110100020.3634780.3537390.6960870.248539801
210101110.1963640.1894050.4372730.2483091349
310102110.2000000.2121220.5904350.1602961562
410103110.2269570.2292700.4369570.1869001600
.......................................
726111204120.2541670.2266420.6529170.3501332114
727111205120.2533330.2550460.5900000.1554713095
728111206020.2533330.2424000.7529170.1243831341
729111200010.2558330.2317000.4833330.3507541796
730111201120.2158330.2234870.5775000.1548462729
\n", + "

731 rows × 12 columns

\n", + "
\n", + " \n", + " \n", + " \n", + "\n", + " \n", + "
\n", + "
\n", + " " + ], + "text/plain": [ + " season yr mnth holiday ... atemp hum windspeed cnt\n", + "0 1 0 1 0 ... 0.363625 0.805833 0.160446 985\n", + "1 1 0 1 0 ... 0.353739 0.696087 0.248539 801\n", + "2 1 0 1 0 ... 0.189405 0.437273 0.248309 1349\n", + "3 1 0 1 0 ... 0.212122 0.590435 0.160296 1562\n", + "4 1 0 1 0 ... 0.229270 0.436957 0.186900 1600\n", + ".. ... .. ... ... ... ... ... ... ...\n", + "726 1 1 12 0 ... 0.226642 0.652917 0.350133 2114\n", + "727 1 1 12 0 ... 0.255046 0.590000 0.155471 3095\n", + "728 1 1 12 0 ... 0.242400 0.752917 0.124383 1341\n", + "729 1 1 12 0 ... 0.231700 0.483333 0.350754 1796\n", + "730 1 1 12 0 ... 0.223487 0.577500 0.154846 2729\n", + "\n", + "[731 rows x 12 columns]" + ] + }, + "metadata": {}, + "execution_count": 9 + } + ] + }, + { + "cell_type": "code", + "source": [ + "df.shape" + ], + "metadata": { + "colab": { + "base_uri": "https://localhost:8080/" + }, + "id": "uAp54NZywT-I", + "outputId": "a077a4b1-a96d-4930-e319-bb03c6fdc98c" + }, + "execution_count": 10, + "outputs": [ + { + "output_type": "execute_result", + "data": { + "text/plain": [ + "(731, 12)" + ] + }, + "metadata": {}, + "execution_count": 10 + } + ] + }, + { + "cell_type": "code", + "source": [ + "# Remove rows which have null values\n", + "df=df.dropna()" + ], + "metadata": { + "id": "67S5NTBEwZ9D" + }, + "execution_count": 12, + "outputs": [] + }, + { + "cell_type": "code", + "source": [ + "df" + ], + "metadata": { + "colab": { + "base_uri": "https://localhost:8080/", + "height": 424 + }, + "id": "yhWrvRzQwhvg", + "outputId": "009af491-d653-453d-c911-47c125aa494f" + }, + "execution_count": 13, + "outputs": [ + { + "output_type": "execute_result", + "data": { + "text/html": [ + "\n", + "
\n", + "
\n", + "
\n", + "\n", + "\n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + "
seasonyrmnthholidayweekdayworkingdayweathersittempatemphumwindspeedcnt
010106020.3441670.3636250.8058330.160446985
110100020.3634780.3537390.6960870.248539801
210101110.1963640.1894050.4372730.2483091349
310102110.2000000.2121220.5904350.1602961562
410103110.2269570.2292700.4369570.1869001600
.......................................
726111204120.2541670.2266420.6529170.3501332114
727111205120.2533330.2550460.5900000.1554713095
728111206020.2533330.2424000.7529170.1243831341
729111200010.2558330.2317000.4833330.3507541796
730111201120.2158330.2234870.5775000.1548462729
\n", + "

731 rows × 12 columns

\n", + "
\n", + " \n", + " \n", + " \n", + "\n", + " \n", + "
\n", + "
\n", + " " + ], + "text/plain": [ + " season yr mnth holiday ... atemp hum windspeed cnt\n", + "0 1 0 1 0 ... 0.363625 0.805833 0.160446 985\n", + "1 1 0 1 0 ... 0.353739 0.696087 0.248539 801\n", + "2 1 0 1 0 ... 0.189405 0.437273 0.248309 1349\n", + "3 1 0 1 0 ... 0.212122 0.590435 0.160296 1562\n", + "4 1 0 1 0 ... 0.229270 0.436957 0.186900 1600\n", + ".. ... .. ... ... ... ... ... ... ...\n", + "726 1 1 12 0 ... 0.226642 0.652917 0.350133 2114\n", + "727 1 1 12 0 ... 0.255046 0.590000 0.155471 3095\n", + "728 1 1 12 0 ... 0.242400 0.752917 0.124383 1341\n", + "729 1 1 12 0 ... 0.231700 0.483333 0.350754 1796\n", + "730 1 1 12 0 ... 0.223487 0.577500 0.154846 2729\n", + "\n", + "[731 rows x 12 columns]" + ] + }, + "metadata": {}, + "execution_count": 13 + } + ] + }, + { + "cell_type": "code", + "source": [ + "df.columns" + ], + "metadata": { + "colab": { + "base_uri": "https://localhost:8080/" + }, + "id": "EnW8izPJwlbl", + "outputId": "1dbf3c84-c844-4021-868f-ffa01797308c" + }, + "execution_count": 14, + "outputs": [ + { + "output_type": "execute_result", + "data": { + "text/plain": [ + "Index(['season', 'yr', 'mnth', 'holiday', 'weekday', 'workingday',\n", + " 'weathersit', 'temp', 'atemp', 'hum', 'windspeed', 'cnt'],\n", + " dtype='object')" + ] + }, + "metadata": {}, + "execution_count": 14 + } + ] + }, + { + "cell_type": "code", + "source": [ + "for col in df:\n", + " print(df[col].value_counts(ascending=False), '\\n\\n\\n')" + ], + "metadata": { + "colab": { + "base_uri": "https://localhost:8080/" + }, + "id": "AhKPKfVuwprY", + "outputId": "5a7f7986-98b8-45f1-d5c1-b33d2b5be156" + }, + "execution_count": 15, + "outputs": [ + { + "output_type": "stream", + "name": "stdout", + "text": [ + "3 188\n", + "2 184\n", + "1 181\n", + "4 178\n", + "Name: season, dtype: int64 \n", + "\n", + "\n", + "\n", + "1 366\n", + "0 365\n", + "Name: yr, dtype: int64 \n", + "\n", + "\n", + "\n", + "1 62\n", + "3 62\n", + "5 62\n", + "7 62\n", + "8 62\n", + "10 62\n", + "12 
62\n", + "4 60\n", + "6 60\n", + "9 60\n", + "11 60\n", + "2 57\n", + "Name: mnth, dtype: int64 \n", + "\n", + "\n", + "\n", + "0 710\n", + "1 21\n", + "Name: holiday, dtype: int64 \n", + "\n", + "\n", + "\n", + "6 105\n", + "0 105\n", + "1 105\n", + "2 104\n", + "3 104\n", + "4 104\n", + "5 104\n", + "Name: weekday, dtype: int64 \n", + "\n", + "\n", + "\n", + "1 500\n", + "0 231\n", + "Name: workingday, dtype: int64 \n", + "\n", + "\n", + "\n", + "1 463\n", + "2 247\n", + "3 21\n", + "Name: weathersit, dtype: int64 \n", + "\n", + "\n", + "\n", + "0.635000 5\n", + "0.265833 5\n", + "0.680000 4\n", + "0.710833 4\n", + "0.564167 4\n", + " ..\n", + "0.669167 1\n", + "0.643333 1\n", + "0.707059 1\n", + "0.700000 1\n", + "0.215833 1\n", + "Name: temp, Length: 499, dtype: int64 \n", + "\n", + "\n", + "\n", + "0.654688 4\n", + "0.375621 3\n", + "0.637008 3\n", + "0.571975 2\n", + "0.466525 2\n", + " ..\n", + "0.578946 1\n", + "0.609229 1\n", + "0.602130 1\n", + "0.626900 1\n", + "0.223487 1\n", + "Name: atemp, Length: 690, dtype: int64 \n", + "\n", + "\n", + "\n", + "0.613333 4\n", + "0.605000 3\n", + "0.590000 3\n", + "0.538333 3\n", + "0.690000 3\n", + " ..\n", + "0.548333 1\n", + "0.561765 1\n", + "0.850000 1\n", + "0.761250 1\n", + "0.577500 1\n", + "Name: hum, Length: 595, dtype: int64 \n", + "\n", + "\n", + "\n", + "0.134954 3\n", + "0.228858 3\n", + "0.136817 3\n", + "0.110700 3\n", + "0.118792 3\n", + " ..\n", + "0.206467 1\n", + "0.212696 1\n", + "0.343943 1\n", + "0.097021 1\n", + "0.154846 1\n", + "Name: windspeed, Length: 650, dtype: int64 \n", + "\n", + "\n", + "\n", + "5409 2\n", + "2424 2\n", + "5698 2\n", + "4459 2\n", + "5119 2\n", + " ..\n", + "5046 1\n", + "4713 1\n", + "4763 1\n", + "4785 1\n", + "2729 1\n", + "Name: cnt, Length: 696, dtype: int64 \n", + "\n", + "\n", + "\n" + ] + } + ] + }, + { + "cell_type": "code", + "source": [ + "# Replace negative values in dataframe with 0\n", + "num = df._get_numeric_data()\n", + "num[num < 0] = 0" + ], + 
"metadata": { + "id": "68Ye1KI8xKtd" + }, + "execution_count": 16, + "outputs": [] + }, + { + "cell_type": "code", + "source": [ + "for col in df:\n", + " print(df[col].value_counts(ascending=False), '\\n\\n\\n')" + ], + "metadata": { + "colab": { + "base_uri": "https://localhost:8080/" + }, + "id": "nHcHZB5vxSk9", + "outputId": "77a47af2-3b70-4ccd-d34c-5b2c3e835e76" + }, + "execution_count": 17, + "outputs": [ + { + "output_type": "stream", + "name": "stdout", + "text": [ + "3 188\n", + "2 184\n", + "1 181\n", + "4 178\n", + "Name: season, dtype: int64 \n", + "\n", + "\n", + "\n", + "1 366\n", + "0 365\n", + "Name: yr, dtype: int64 \n", + "\n", + "\n", + "\n", + "1 62\n", + "3 62\n", + "5 62\n", + "7 62\n", + "8 62\n", + "10 62\n", + "12 62\n", + "4 60\n", + "6 60\n", + "9 60\n", + "11 60\n", + "2 57\n", + "Name: mnth, dtype: int64 \n", + "\n", + "\n", + "\n", + "0 710\n", + "1 21\n", + "Name: holiday, dtype: int64 \n", + "\n", + "\n", + "\n", + "6 105\n", + "0 105\n", + "1 105\n", + "2 104\n", + "3 104\n", + "4 104\n", + "5 104\n", + "Name: weekday, dtype: int64 \n", + "\n", + "\n", + "\n", + "1 500\n", + "0 231\n", + "Name: workingday, dtype: int64 \n", + "\n", + "\n", + "\n", + "1 463\n", + "2 247\n", + "3 21\n", + "Name: weathersit, dtype: int64 \n", + "\n", + "\n", + "\n", + "0.635000 5\n", + "0.265833 5\n", + "0.680000 4\n", + "0.710833 4\n", + "0.564167 4\n", + " ..\n", + "0.669167 1\n", + "0.643333 1\n", + "0.707059 1\n", + "0.700000 1\n", + "0.215833 1\n", + "Name: temp, Length: 499, dtype: int64 \n", + "\n", + "\n", + "\n", + "0.654688 4\n", + "0.375621 3\n", + "0.637008 3\n", + "0.571975 2\n", + "0.466525 2\n", + " ..\n", + "0.578946 1\n", + "0.609229 1\n", + "0.602130 1\n", + "0.626900 1\n", + "0.223487 1\n", + "Name: atemp, Length: 690, dtype: int64 \n", + "\n", + "\n", + "\n", + "0.613333 4\n", + "0.605000 3\n", + "0.590000 3\n", + "0.538333 3\n", + "0.690000 3\n", + " ..\n", + "0.548333 1\n", + "0.561765 1\n", + "0.850000 1\n", + "0.761250 1\n", + 
"0.577500 1\n", + "Name: hum, Length: 595, dtype: int64 \n", + "\n", + "\n", + "\n", + "0.134954 3\n", + "0.228858 3\n", + "0.136817 3\n", + "0.110700 3\n", + "0.118792 3\n", + " ..\n", + "0.206467 1\n", + "0.212696 1\n", + "0.343943 1\n", + "0.097021 1\n", + "0.154846 1\n", + "Name: windspeed, Length: 650, dtype: int64 \n", + "\n", + "\n", + "\n", + "5409 2\n", + "2424 2\n", + "5698 2\n", + "4459 2\n", + "5119 2\n", + " ..\n", + "5046 1\n", + "4713 1\n", + "4763 1\n", + "4785 1\n", + "2729 1\n", + "Name: cnt, Length: 696, dtype: int64 \n", + "\n", + "\n", + "\n" + ] + } + ] + }, + { + "cell_type": "code", + "source": [ + "Independant_variables=df.drop(['temp'],axis=1)\n", + "Dependant_variable=df['temp']" + ], + "metadata": { + "id": "dOFiEnjIxaTs" + }, + "execution_count": 18, + "outputs": [] + }, + { + "cell_type": "code", + "source": [ + "# train test split\n", + "X_train,X_test,y_train,y_test=train_test_split(Independant_variables,Dependant_variable,test_size=0.3)" + ], + "metadata": { + "id": "jkEFQVV4xzhw" + }, + "execution_count": 19, + "outputs": [] + }, + { + "cell_type": "code", + "source": [ + "print(X_train.shape,y_train.shape)\n", + "print(X_test.shape,y_test.shape)" + ], + "metadata": { + "colab": { + "base_uri": "https://localhost:8080/" + }, + "id": "mDO7x-Alxzdx", + "outputId": "98d4004b-d3ec-4a19-d14d-19a85af98f69" + }, + "execution_count": 21, + "outputs": [ + { + "output_type": "stream", + "name": "stdout", + "text": [ + "(511, 11) (511,)\n", + "(220, 11) (220,)\n" + ] + } + ] + }, + { + "cell_type": "code", + "source": [ + "# Fitting Linear Regression to the dataset\n", + "model=LinearRegression()\n", + "model.fit(X_train,y_train)" + ], + "metadata": { + "colab": { + "base_uri": "https://localhost:8080/" + }, + "id": "vhO3VaYcyAm7", + "outputId": "a2fb51a1-d627-4460-c240-d68ca85ac56b" + }, + "execution_count": 22, + "outputs": [ + { + "output_type": "execute_result", + "data": { + "text/plain": [ + "LinearRegression()" + ] + }, + "metadata": 
{}, + "execution_count": 22 + } + ] + }, + { + "cell_type": "code", + "source": [ + "model.score(X_test,y_test)" + ], + "metadata": { + "colab": { + "base_uri": "https://localhost:8080/" + }, + "id": "kTeRNOulyDvy", + "outputId": "b4c40c1b-523e-4285-c1cc-585f2e297174" + }, + "execution_count": 23, + "outputs": [ + { + "output_type": "execute_result", + "data": { + "text/plain": [ + "0.9618679848468319" + ] + }, + "metadata": {}, + "execution_count": 23 + } + ] + }, + { + "cell_type": "code", + "source": [ + "y_pred = model.predict(X_test)\n", + "print(\"Predicted values:\")\n", + "print(y_pred)" + ], + "metadata": { + "colab": { + "base_uri": "https://localhost:8080/" + }, + "id": "yn4_5gFzyLaj", + "outputId": "01d497a6-adc0-4503-8b08-89c5bfc8d018" + }, + "execution_count": 24, + "outputs": [ + { + "output_type": "stream", + "name": "stdout", + "text": [ + "Predicted values:\n", + "[0.26139833 0.24843521 0.57131762 0.46340071 0.73222751 0.42925864\n", + " 0.65221116 0.30942026 0.27721202 0.33599549 0.24746918 0.5244218\n", + " 0.72728082 0.707459 0.5515109 0.79293599 0.69154659 0.59194944\n", + " 0.53415555 0.24943123 0.42990328 0.4123266 0.1686194 0.75294334\n", + " 0.27959153 0.57164315 0.69695136 0.62093264 0.65262078 0.21879391\n", + " 0.75169612 0.78289948 0.39884028 0.25300551 0.22447105 0.6078554\n", + " 0.2495403 0.58064256 0.62074778 0.41619943 0.39082596 0.60387529\n", + " 0.54512197 0.61977368 0.38064467 0.30284106 0.28435554 0.6628038\n", + " 0.69963989 0.32409023 0.43345099 0.75005181 0.63043925 0.6819958\n", + " 0.47599378 0.69343173 0.31038888 0.25798883 0.7767981 0.31584768\n", + " 0.69432705 0.55722329 0.39954645 0.25184504 0.18177377 0.36186834\n", + " 0.5507138 0.18857743 0.75539344 0.31570068 0.52105538 0.6341357\n", + " 0.67282208 0.50166654 0.29392652 0.62884028 0.32604945 0.63985031\n", + " 0.27612366 0.53013777 0.23698819 0.33029211 0.50623254 0.56397112\n", + " 0.59818857 0.71825545 0.25223548 0.6706068 0.17602199 0.39689776\n", + " 
0.64003218 0.43404124 0.67042189 0.07511919 0.4623536 0.61195081\n", + " 0.38719967 0.28576807 0.5443404 0.42866563 0.50813055 0.31119618\n", + " 0.5429557 0.36574452 0.6747021 0.17484689 0.19794907 0.24638034\n", + " 0.57279308 0.69141186 0.5743126 0.77497681 0.7871679 0.23044344\n", + " 0.26007091 0.35365621 0.3260192 0.70599096 0.68252517 0.35467262\n", + " 0.36480047 0.38318989 0.47098053 0.24829875 0.75243295 0.43966285\n", + " 0.43548234 0.43655537 0.16437059 0.3196555 0.33029807 0.49144516\n", + " 0.30761803 0.53357889 0.39495703 0.72686136 0.31485003 0.44623891\n", + " 0.73364368 0.41215329 0.71067627 0.70796604 0.65106689 0.29479719\n", + " 0.78771798 0.37393705 0.16841837 0.43583229 0.4703323 0.80768506\n", + " 0.3452518 0.38323456 0.40320437 0.5779206 0.27402613 0.29245606\n", + " 0.76606316 0.55641492 0.75096604 0.39289307 0.76567483 0.45508641\n", + " 0.25216835 0.72826098 0.47814245 0.2186926 0.54514164 0.47080859\n", + " 0.47248718 0.62200077 0.53283727 0.51041735 0.45235661 0.38388501\n", + " 0.81835626 0.45301072 0.62550536 0.09873213 0.21604778 0.25129175\n", + " 0.35903034 0.69031484 0.69331629 0.33627929 0.3912977 0.69414387\n", + " 0.44862737 0.34760098 0.5940439 0.58038327 0.64867188 0.35062691\n", + " 0.57461317 0.59909018 0.40147666 0.5974061 0.71063735 0.32438582\n", + " 0.23513132 0.79521049 0.2489857 0.44528626 0.68370916 0.26047469\n", + " 0.5500718 0.51146117 0.54201142 0.46168646 0.46735153 0.69765124\n", + " 0.3259509 0.52784103 0.7553458 0.72303439 0.41283342 0.70875842\n", + " 0.69221006 0.24677735 0.61404769 0.7626857 ]\n" + ] + } + ] + }, + { + "cell_type": "code", + "source": [ + "mean_squared_error(y_test,y_pred)" + ], + "metadata": { + "colab": { + "base_uri": "https://localhost:8080/" + }, + "id": "bNEN2Pf2yLWB", + "outputId": "471cdb61-c180-48ff-8fb8-a2249db7ff10" + }, + "execution_count": 25, + "outputs": [ + { + "output_type": "execute_result", + "data": { + "text/plain": [ + "0.0012685416562742769" + ] + }, + "metadata": 
{}, + "execution_count": 25 + } + ] + }, + { + "cell_type": "code", + "source": [ + "import matplotlib.pyplot as plt\n", + "\n", + "plt.xlabel('y_test')\n", + "plt.ylabel('y_pred')\n", + "plt.scatter(y_test,y_pred)" + ], + "metadata": { + "colab": { + "base_uri": "https://localhost:8080/", + "height": 297 + }, + "id": "_iOuMT79yTic", + "outputId": "bcecedd3-5152-4d34-c8eb-548130c2fbd3" + }, + "execution_count": 26, + "outputs": [ + { + "output_type": "execute_result", + "data": { + "text/plain": [ + "" + ] + }, + "metadata": {}, + "execution_count": 26 + }, + { + "output_type": "display_data", + "data": { + "image/png": "\n", + "text/plain": [ + "
" + ] + }, + "metadata": { + "needs_background": "light" + } + } + ] + } + ] +} \ No newline at end of file From 78fd733b8d77980c4ee4cec7668e11d06a27c50f Mon Sep 17 00:00:00 2001 From: AtharvInamdar <90698481+AtharvInamdar@users.noreply.github.com> Date: Thu, 24 Feb 2022 22:24:12 +0530 Subject: [PATCH 2/2] Update Student assignment updates.txt --- Student assignment updates.txt | 3 +++ 1 file changed, 3 insertions(+) diff --git a/Student assignment updates.txt b/Student assignment updates.txt index 9979d7c..9ad8571 100644 --- a/Student assignment updates.txt +++ b/Student assignment updates.txt @@ -1,2 +1,5 @@ Write your name and PRN no Hello Updated + +Name-Inamdar Atharv Nitin +PRN-2019BTECS00051