diff --git a/files_for_lab/csv_files/.ipynb_checkpoints/[lab-customer-analysis-round-5] Sara-checkpoint.ipynb b/files_for_lab/csv_files/.ipynb_checkpoints/[lab-customer-analysis-round-5] Sara-checkpoint.ipynb new file mode 100644 index 0000000..21ce233 --- /dev/null +++ b/files_for_lab/csv_files/.ipynb_checkpoints/[lab-customer-analysis-round-5] Sara-checkpoint.ipynb @@ -0,0 +1,1307 @@ +{ + "cells": [ + { + "cell_type": "raw", + "id": "ca62338e", + "metadata": {}, + "source": [ + "LAB 5\n", + "\n", + "DA PT 2023\n", + "\n", + "Sara Ferreira da Silva" + ] + }, + { + "cell_type": "code", + "execution_count": 1, + "id": "57638365", + "metadata": {}, + "outputs": [ + { + "data": { + "text/html": [ + "
\n", + "\n", + "\n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + "
CustomerStateCustomer Lifetime ValueResponseCoverageEducationEffective To DateEmploymentStatusGenderIncome...Months Since Policy InceptionNumber of Open ComplaintsNumber of PoliciesPolicy TypePolicyRenew Offer TypeSales ChannelTotal Claim AmountVehicle ClassVehicle Size
0BU79786Washington2763.519279NoBasicBachelor2/24/11EmployedF56274...501Corporate AutoCorporate L3Offer1Agent384.811147Two-Door CarMedsize
1QZ44356Arizona6979.535903NoExtendedBachelor1/31/11UnemployedF0...4208Personal AutoPersonal L3Offer3Agent1131.464935Four-Door CarMedsize
2AI49188Nevada12887.431650NoPremiumBachelor2/19/11EmployedF48767...3802Personal AutoPersonal L3Offer1Agent566.472247Two-Door CarMedsize
3WW63253California7645.861827NoBasicBachelor1/20/11UnemployedM0...6507Corporate AutoCorporate L2Offer1Call Center529.881344SUVMedsize
4HB64268Washington2813.692575NoBasicBachelor2/3/11EmployedM43836...4401Personal AutoPersonal L1Offer1Agent138.130879Four-Door CarMedsize
..................................................................
9129LA72316California23405.987980NoBasicBachelor2/10/11EmployedM71941...8902Personal AutoPersonal L1Offer2Web198.234764Four-Door CarMedsize
9130PK87824California3096.511217YesExtendedCollege2/12/11EmployedF21604...2801Corporate AutoCorporate L3Offer1Branch379.200000Four-Door CarMedsize
9131TD14365California8163.890428NoExtendedBachelor2/6/11UnemployedM0...3732Corporate AutoCorporate L2Offer1Branch790.784983Four-Door CarMedsize
9132UP19263California7524.442436NoExtendedCollege2/3/11EmployedM21941...303Personal AutoPersonal L2Offer3Branch691.200000Four-Door CarLarge
9133Y167826California2611.836866NoExtendedCollege2/14/11UnemployedM0...9001Corporate AutoCorporate L3Offer4Call Center369.600000Two-Door CarMedsize
\n", + "

9134 rows × 24 columns

\n", + "
" + ], + "text/plain": [ + " Customer State Customer Lifetime Value Response Coverage \\\n", + "0 BU79786 Washington 2763.519279 No Basic \n", + "1 QZ44356 Arizona 6979.535903 No Extended \n", + "2 AI49188 Nevada 12887.431650 No Premium \n", + "3 WW63253 California 7645.861827 No Basic \n", + "4 HB64268 Washington 2813.692575 No Basic \n", + "... ... ... ... ... ... \n", + "9129 LA72316 California 23405.987980 No Basic \n", + "9130 PK87824 California 3096.511217 Yes Extended \n", + "9131 TD14365 California 8163.890428 No Extended \n", + "9132 UP19263 California 7524.442436 No Extended \n", + "9133 Y167826 California 2611.836866 No Extended \n", + "\n", + " Education Effective To Date EmploymentStatus Gender Income ... \\\n", + "0 Bachelor 2/24/11 Employed F 56274 ... \n", + "1 Bachelor 1/31/11 Unemployed F 0 ... \n", + "2 Bachelor 2/19/11 Employed F 48767 ... \n", + "3 Bachelor 1/20/11 Unemployed M 0 ... \n", + "4 Bachelor 2/3/11 Employed M 43836 ... \n", + "... ... ... ... ... ... ... \n", + "9129 Bachelor 2/10/11 Employed M 71941 ... \n", + "9130 College 2/12/11 Employed F 21604 ... \n", + "9131 Bachelor 2/6/11 Unemployed M 0 ... \n", + "9132 College 2/3/11 Employed M 21941 ... \n", + "9133 College 2/14/11 Unemployed M 0 ... \n", + "\n", + " Months Since Policy Inception Number of Open Complaints \\\n", + "0 5 0 \n", + "1 42 0 \n", + "2 38 0 \n", + "3 65 0 \n", + "4 44 0 \n", + "... ... ... \n", + "9129 89 0 \n", + "9130 28 0 \n", + "9131 37 3 \n", + "9132 3 0 \n", + "9133 90 0 \n", + "\n", + " Number of Policies Policy Type Policy Renew Offer Type \\\n", + "0 1 Corporate Auto Corporate L3 Offer1 \n", + "1 8 Personal Auto Personal L3 Offer3 \n", + "2 2 Personal Auto Personal L3 Offer1 \n", + "3 7 Corporate Auto Corporate L2 Offer1 \n", + "4 1 Personal Auto Personal L1 Offer1 \n", + "... ... ... ... ... \n", + "9129 2 Personal Auto Personal L1 Offer2 \n", + "9130 1 Corporate Auto Corporate L3 Offer1 \n", + "9131 2 Corporate Auto Corporate L2 Offer1 \n", + "9132 3 Personal Auto Personal L2 Offer3 \n", + "9133 1 Corporate Auto Corporate L3 Offer4 \n", + "\n", + " Sales Channel Total Claim Amount Vehicle Class Vehicle Size \n", + "0 Agent 384.811147 Two-Door Car Medsize \n", + "1 Agent 1131.464935 Four-Door Car Medsize \n", + "2 Agent 566.472247 Two-Door Car Medsize \n", + "3 Call Center 529.881344 SUV Medsize \n", + "4 Agent 138.130879 Four-Door Car Medsize \n", + "... ... ... ... ... \n", + "9129 Web 198.234764 Four-Door Car Medsize \n", + "9130 Branch 379.200000 Four-Door Car Medsize \n", + "9131 Branch 790.784983 Four-Door Car Medsize \n", + "9132 Branch 691.200000 Four-Door Car Large \n", + "9133 Call Center 369.600000 Two-Door Car Medsize \n", + "\n", + "[9134 rows x 24 columns]" + ] + }, + "execution_count": 1, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "# Pre work: Importing libraries\n", + "\n", + "import pandas as pd\n", + "from sklearn.preprocessing import MinMaxScaler\n", + "\n", + "# Import data\n", + "\n", + "mc = pd.read_csv('marketing_customer_analysis.csv')\n", + "mc" + ] + }, + { + "cell_type": "code", + "execution_count": 2, + "id": "ce2f994d", + "metadata": {}, + "outputs": [], + "source": [ + "# X-y split\n", + "# Normalize (numerical)" + ] + }, + { + "cell_type": "code", + "execution_count": 3, + "id": "64385983", + "metadata": {}, + "outputs": [ + { + "data": { + "text/html": [ + "
\n", + "\n", + "\n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + "
CustomerStateCustomer Lifetime ValueResponseCoverageEducationEffective To DateEmploymentStatusGenderIncome...Months Since Last ClaimMonths Since Policy InceptionNumber of Open ComplaintsNumber of PoliciesPolicy TypePolicyRenew Offer TypeSales ChannelVehicle ClassVehicle Size
0BU79786Washington2763.519279NoBasicBachelor2/24/11EmployedF56274...32501Corporate AutoCorporate L3Offer1AgentTwo-Door CarMedsize
1QZ44356Arizona6979.535903NoExtendedBachelor1/31/11UnemployedF0...134208Personal AutoPersonal L3Offer3AgentFour-Door CarMedsize
2AI49188Nevada12887.431650NoPremiumBachelor2/19/11EmployedF48767...183802Personal AutoPersonal L3Offer1AgentTwo-Door CarMedsize
3WW63253California7645.861827NoBasicBachelor1/20/11UnemployedM0...186507Corporate AutoCorporate L2Offer1Call CenterSUVMedsize
4HB64268Washington2813.692575NoBasicBachelor2/3/11EmployedM43836...124401Personal AutoPersonal L1Offer1AgentFour-Door CarMedsize
..................................................................
9129LA72316California23405.987980NoBasicBachelor2/10/11EmployedM71941...188902Personal AutoPersonal L1Offer2WebFour-Door CarMedsize
9130PK87824California3096.511217YesExtendedCollege2/12/11EmployedF21604...142801Corporate AutoCorporate L3Offer1BranchFour-Door CarMedsize
9131TD14365California8163.890428NoExtendedBachelor2/6/11UnemployedM0...93732Corporate AutoCorporate L2Offer1BranchFour-Door CarMedsize
9132UP19263California7524.442436NoExtendedCollege2/3/11EmployedM21941...34303Personal AutoPersonal L2Offer3BranchFour-Door CarLarge
9133Y167826California2611.836866NoExtendedCollege2/14/11UnemployedM0...39001Corporate AutoCorporate L3Offer4Call CenterTwo-Door CarMedsize
\n", + "

9134 rows × 23 columns

\n", + "
" + ], + "text/plain": [ + " Customer State Customer Lifetime Value Response Coverage \\\n", + "0 BU79786 Washington 2763.519279 No Basic \n", + "1 QZ44356 Arizona 6979.535903 No Extended \n", + "2 AI49188 Nevada 12887.431650 No Premium \n", + "3 WW63253 California 7645.861827 No Basic \n", + "4 HB64268 Washington 2813.692575 No Basic \n", + "... ... ... ... ... ... \n", + "9129 LA72316 California 23405.987980 No Basic \n", + "9130 PK87824 California 3096.511217 Yes Extended \n", + "9131 TD14365 California 8163.890428 No Extended \n", + "9132 UP19263 California 7524.442436 No Extended \n", + "9133 Y167826 California 2611.836866 No Extended \n", + "\n", + " Education Effective To Date EmploymentStatus Gender Income ... \\\n", + "0 Bachelor 2/24/11 Employed F 56274 ... \n", + "1 Bachelor 1/31/11 Unemployed F 0 ... \n", + "2 Bachelor 2/19/11 Employed F 48767 ... \n", + "3 Bachelor 1/20/11 Unemployed M 0 ... \n", + "4 Bachelor 2/3/11 Employed M 43836 ... \n", + "... ... ... ... ... ... ... \n", + "9129 Bachelor 2/10/11 Employed M 71941 ... \n", + "9130 College 2/12/11 Employed F 21604 ... \n", + "9131 Bachelor 2/6/11 Unemployed M 0 ... \n", + "9132 College 2/3/11 Employed M 21941 ... \n", + "9133 College 2/14/11 Unemployed M 0 ... \n", + "\n", + " Months Since Last Claim Months Since Policy Inception \\\n", + "0 32 5 \n", + "1 13 42 \n", + "2 18 38 \n", + "3 18 65 \n", + "4 12 44 \n", + "... ... ... \n", + "9129 18 89 \n", + "9130 14 28 \n", + "9131 9 37 \n", + "9132 34 3 \n", + "9133 3 90 \n", + "\n", + " Number of Open Complaints Number of Policies Policy Type \\\n", + "0 0 1 Corporate Auto \n", + "1 0 8 Personal Auto \n", + "2 0 2 Personal Auto \n", + "3 0 7 Corporate Auto \n", + "4 0 1 Personal Auto \n", + "... ... ... ... \n", + "9129 0 2 Personal Auto \n", + "9130 0 1 Corporate Auto \n", + "9131 3 2 Corporate Auto \n", + "9132 0 3 Personal Auto \n", + "9133 0 1 Corporate Auto \n", + "\n", + " Policy Renew Offer Type Sales Channel Vehicle Class Vehicle Size \n", + "0 Corporate L3 Offer1 Agent Two-Door Car Medsize \n", + "1 Personal L3 Offer3 Agent Four-Door Car Medsize \n", + "2 Personal L3 Offer1 Agent Two-Door Car Medsize \n", + "3 Corporate L2 Offer1 Call Center SUV Medsize \n", + "4 Personal L1 Offer1 Agent Four-Door Car Medsize \n", + "... ... ... ... ... ... \n", + "9129 Personal L1 Offer2 Web Four-Door Car Medsize \n", + "9130 Corporate L3 Offer1 Branch Four-Door Car Medsize \n", + "9131 Corporate L2 Offer1 Branch Four-Door Car Medsize \n", + "9132 Personal L2 Offer3 Branch Four-Door Car Large \n", + "9133 Corporate L3 Offer4 Call Center Two-Door Car Medsize \n", + "\n", + "[9134 rows x 23 columns]" + ] + }, + "execution_count": 3, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "X = mc.drop('Total Claim Amount', axis=1)\n", + "y = mc['Total Claim Amount']\n", + "X" + ] + }, + { + "cell_type": "code", + "execution_count": 4, + "id": "8eb3e61d", + "metadata": {}, + "outputs": [], + "source": [ + "scaler = MinMaxScaler()" + ] + }, + { + "cell_type": "code", + "execution_count": 5, + "id": "8d03d5c1", + "metadata": {}, + "outputs": [ + { + "data": { + "text/html": [ + "
\n", + "\n", + "\n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + "
Customer Lifetime ValueIncomeMonthly Premium AutoMonths Since Last ClaimMonths Since Policy InceptionNumber of Open ComplaintsNumber of PoliciesTotal Claim Amount
02763.519279562746932501384.811147
16979.5359030941342081131.464935
212887.43165048767108183802566.472247
37645.8618270106186507529.881344
42813.6925754383673124401138.130879
...........................
912923405.9879807194173188902198.234764
91303096.5112172160479142801379.200000
91318163.89042808593732790.784983
91327524.442436219419634303691.200000
91332611.83686607739001369.600000
\n", + "

9134 rows × 8 columns

\n", + "
" + ], + "text/plain": [ + " Customer Lifetime Value Income Monthly Premium Auto \\\n", + "0 2763.519279 56274 69 \n", + "1 6979.535903 0 94 \n", + "2 12887.431650 48767 108 \n", + "3 7645.861827 0 106 \n", + "4 2813.692575 43836 73 \n", + "... ... ... ... \n", + "9129 23405.987980 71941 73 \n", + "9130 3096.511217 21604 79 \n", + "9131 8163.890428 0 85 \n", + "9132 7524.442436 21941 96 \n", + "9133 2611.836866 0 77 \n", + "\n", + " Months Since Last Claim Months Since Policy Inception \\\n", + "0 32 5 \n", + "1 13 42 \n", + "2 18 38 \n", + "3 18 65 \n", + "4 12 44 \n", + "... ... ... \n", + "9129 18 89 \n", + "9130 14 28 \n", + "9131 9 37 \n", + "9132 34 3 \n", + "9133 3 90 \n", + "\n", + " Number of Open Complaints Number of Policies Total Claim Amount \n", + "0 0 1 384.811147 \n", + "1 0 8 1131.464935 \n", + "2 0 2 566.472247 \n", + "3 0 7 529.881344 \n", + "4 0 1 138.130879 \n", + "... ... ... ... \n", + "9129 0 2 198.234764 \n", + "9130 0 1 379.200000 \n", + "9131 3 2 790.784983 \n", + "9132 0 3 691.200000 \n", + "9133 0 1 369.600000 \n", + "\n", + "[9134 rows x 8 columns]" + ] + }, + "execution_count": 5, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "mc_n = mc.select_dtypes(include = 'number')\n", + "mc_n" + ] + }, + { + "cell_type": "code", + "execution_count": 7, + "id": "df2ff8d5", + "metadata": {}, + "outputs": [ + { + "data": { + "text/html": [ + "
\n", + "\n", + "\n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + "
Customer Lifetime ValueIncomeMonthly Premium AutoMonths Since Last ClaimMonths Since Policy InceptionNumber of Open ComplaintsNumber of PoliciesTotal Claim Amount
00.0106290.5628470.0337550.9142860.0505050.00.0000.132974
10.0624060.0000000.1392410.3714290.4242420.00.8750.391051
20.1349600.4877630.1983120.5142860.3838380.00.1250.195764
30.0705890.0000000.1898730.5142860.6565660.00.7500.183117
40.0112450.4384430.0506330.3428570.4444440.00.0000.047710
...........................
91290.2641370.7195470.0506330.5142860.8989900.00.1250.068485
91300.0147190.2160810.0759490.4000000.2828280.00.0000.131034
91310.0769510.0000000.1012660.2571430.3737370.60.1250.273297
91320.0690980.2194520.1476790.9714290.0303030.00.2500.238876
91330.0087660.0000000.0675110.0857140.9090910.00.0000.127716
\n", + "

9134 rows × 8 columns

\n", + "
" + ], + "text/plain": [ + " Customer Lifetime Value Income Monthly Premium Auto \\\n", + "0 0.010629 0.562847 0.033755 \n", + "1 0.062406 0.000000 0.139241 \n", + "2 0.134960 0.487763 0.198312 \n", + "3 0.070589 0.000000 0.189873 \n", + "4 0.011245 0.438443 0.050633 \n", + "... ... ... ... \n", + "9129 0.264137 0.719547 0.050633 \n", + "9130 0.014719 0.216081 0.075949 \n", + "9131 0.076951 0.000000 0.101266 \n", + "9132 0.069098 0.219452 0.147679 \n", + "9133 0.008766 0.000000 0.067511 \n", + "\n", + " Months Since Last Claim Months Since Policy Inception \\\n", + "0 0.914286 0.050505 \n", + "1 0.371429 0.424242 \n", + "2 0.514286 0.383838 \n", + "3 0.514286 0.656566 \n", + "4 0.342857 0.444444 \n", + "... ... ... \n", + "9129 0.514286 0.898990 \n", + "9130 0.400000 0.282828 \n", + "9131 0.257143 0.373737 \n", + "9132 0.971429 0.030303 \n", + "9133 0.085714 0.909091 \n", + "\n", + " Number of Open Complaints Number of Policies Total Claim Amount \n", + "0 0.0 0.000 0.132974 \n", + "1 0.0 0.875 0.391051 \n", + "2 0.0 0.125 0.195764 \n", + "3 0.0 0.750 0.183117 \n", + "4 0.0 0.000 0.047710 \n", + "... ... ... ... \n", + "9129 0.0 0.125 0.068485 \n", + "9130 0.0 0.000 0.131034 \n", + "9131 0.6 0.125 0.273297 \n", + "9132 0.0 0.250 0.238876 \n", + "9133 0.0 0.000 0.127716 \n", + "\n", + "[9134 rows x 8 columns]" + ] + }, + "execution_count": 7, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "normalized_mc = scaler.fit_transform(mc_n)\n", + "normalized_mc = pd.DataFrame(normalized_mc, columns = mc_n.columns)\n", + "normalized_mc" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "id": "f045dbde", + "metadata": {}, + "outputs": [], + "source": [] + } + ], + "metadata": { + "kernelspec": { + "display_name": "Python 3 (ipykernel)", + "language": "python", + "name": "python3" + }, + "language_info": { + "codemirror_mode": { + "name": "ipython", + "version": 3 + }, + "file_extension": ".py", + "mimetype": "text/x-python", + "name": "python", + "nbconvert_exporter": "python", + "pygments_lexer": "ipython3", + "version": "3.11.4" + } + }, + "nbformat": 4, + "nbformat_minor": 5 +} diff --git a/files_for_lab/csv_files/[lab-customer-analysis-round-5] Sara.ipynb b/files_for_lab/csv_files/[lab-customer-analysis-round-5] Sara.ipynb new file mode 100644 index 0000000..21ce233 --- /dev/null +++ b/files_for_lab/csv_files/[lab-customer-analysis-round-5] Sara.ipynb @@ -0,0 +1,1307 @@ +{ + "cells": [ + { + "cell_type": "raw", + "id": "ca62338e", + "metadata": {}, + "source": [ + "LAB 5\n", + "\n", + "DA PT 2023\n", + "\n", + "Sara Ferreira da Silva" + ] + }, + { + "cell_type": "code", + "execution_count": 1, + "id": "57638365", + "metadata": {}, + "outputs": [ + { + "data": { + "text/html": [ + "
\n", + "\n", + "\n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + "
CustomerStateCustomer Lifetime ValueResponseCoverageEducationEffective To DateEmploymentStatusGenderIncome...Months Since Policy InceptionNumber of Open ComplaintsNumber of PoliciesPolicy TypePolicyRenew Offer TypeSales ChannelTotal Claim AmountVehicle ClassVehicle Size
0BU79786Washington2763.519279NoBasicBachelor2/24/11EmployedF56274...501Corporate AutoCorporate L3Offer1Agent384.811147Two-Door CarMedsize
1QZ44356Arizona6979.535903NoExtendedBachelor1/31/11UnemployedF0...4208Personal AutoPersonal L3Offer3Agent1131.464935Four-Door CarMedsize
2AI49188Nevada12887.431650NoPremiumBachelor2/19/11EmployedF48767...3802Personal AutoPersonal L3Offer1Agent566.472247Two-Door CarMedsize
3WW63253California7645.861827NoBasicBachelor1/20/11UnemployedM0...6507Corporate AutoCorporate L2Offer1Call Center529.881344SUVMedsize
4HB64268Washington2813.692575NoBasicBachelor2/3/11EmployedM43836...4401Personal AutoPersonal L1Offer1Agent138.130879Four-Door CarMedsize
..................................................................
9129LA72316California23405.987980NoBasicBachelor2/10/11EmployedM71941...8902Personal AutoPersonal L1Offer2Web198.234764Four-Door CarMedsize
9130PK87824California3096.511217YesExtendedCollege2/12/11EmployedF21604...2801Corporate AutoCorporate L3Offer1Branch379.200000Four-Door CarMedsize
9131TD14365California8163.890428NoExtendedBachelor2/6/11UnemployedM0...3732Corporate AutoCorporate L2Offer1Branch790.784983Four-Door CarMedsize
9132UP19263California7524.442436NoExtendedCollege2/3/11EmployedM21941...303Personal AutoPersonal L2Offer3Branch691.200000Four-Door CarLarge
9133Y167826California2611.836866NoExtendedCollege2/14/11UnemployedM0...9001Corporate AutoCorporate L3Offer4Call Center369.600000Two-Door CarMedsize
\n", + "

9134 rows × 24 columns

\n", + "
" + ], + "text/plain": [ + " Customer State Customer Lifetime Value Response Coverage \\\n", + "0 BU79786 Washington 2763.519279 No Basic \n", + "1 QZ44356 Arizona 6979.535903 No Extended \n", + "2 AI49188 Nevada 12887.431650 No Premium \n", + "3 WW63253 California 7645.861827 No Basic \n", + "4 HB64268 Washington 2813.692575 No Basic \n", + "... ... ... ... ... ... \n", + "9129 LA72316 California 23405.987980 No Basic \n", + "9130 PK87824 California 3096.511217 Yes Extended \n", + "9131 TD14365 California 8163.890428 No Extended \n", + "9132 UP19263 California 7524.442436 No Extended \n", + "9133 Y167826 California 2611.836866 No Extended \n", + "\n", + " Education Effective To Date EmploymentStatus Gender Income ... \\\n", + "0 Bachelor 2/24/11 Employed F 56274 ... \n", + "1 Bachelor 1/31/11 Unemployed F 0 ... \n", + "2 Bachelor 2/19/11 Employed F 48767 ... \n", + "3 Bachelor 1/20/11 Unemployed M 0 ... \n", + "4 Bachelor 2/3/11 Employed M 43836 ... \n", + "... ... ... ... ... ... ... \n", + "9129 Bachelor 2/10/11 Employed M 71941 ... \n", + "9130 College 2/12/11 Employed F 21604 ... \n", + "9131 Bachelor 2/6/11 Unemployed M 0 ... \n", + "9132 College 2/3/11 Employed M 21941 ... \n", + "9133 College 2/14/11 Unemployed M 0 ... \n", + "\n", + " Months Since Policy Inception Number of Open Complaints \\\n", + "0 5 0 \n", + "1 42 0 \n", + "2 38 0 \n", + "3 65 0 \n", + "4 44 0 \n", + "... ... ... \n", + "9129 89 0 \n", + "9130 28 0 \n", + "9131 37 3 \n", + "9132 3 0 \n", + "9133 90 0 \n", + "\n", + " Number of Policies Policy Type Policy Renew Offer Type \\\n", + "0 1 Corporate Auto Corporate L3 Offer1 \n", + "1 8 Personal Auto Personal L3 Offer3 \n", + "2 2 Personal Auto Personal L3 Offer1 \n", + "3 7 Corporate Auto Corporate L2 Offer1 \n", + "4 1 Personal Auto Personal L1 Offer1 \n", + "... ... ... ... ... \n", + "9129 2 Personal Auto Personal L1 Offer2 \n", + "9130 1 Corporate Auto Corporate L3 Offer1 \n", + "9131 2 Corporate Auto Corporate L2 Offer1 \n", + "9132 3 Personal Auto Personal L2 Offer3 \n", + "9133 1 Corporate Auto Corporate L3 Offer4 \n", + "\n", + " Sales Channel Total Claim Amount Vehicle Class Vehicle Size \n", + "0 Agent 384.811147 Two-Door Car Medsize \n", + "1 Agent 1131.464935 Four-Door Car Medsize \n", + "2 Agent 566.472247 Two-Door Car Medsize \n", + "3 Call Center 529.881344 SUV Medsize \n", + "4 Agent 138.130879 Four-Door Car Medsize \n", + "... ... ... ... ... \n", + "9129 Web 198.234764 Four-Door Car Medsize \n", + "9130 Branch 379.200000 Four-Door Car Medsize \n", + "9131 Branch 790.784983 Four-Door Car Medsize \n", + "9132 Branch 691.200000 Four-Door Car Large \n", + "9133 Call Center 369.600000 Two-Door Car Medsize \n", + "\n", + "[9134 rows x 24 columns]" + ] + }, + "execution_count": 1, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "# Pre work: Importing libraries\n", + "\n", + "import pandas as pd\n", + "from sklearn.preprocessing import MinMaxScaler\n", + "\n", + "# Import data\n", + "\n", + "mc = pd.read_csv('marketing_customer_analysis.csv')\n", + "mc" + ] + }, + { + "cell_type": "code", + "execution_count": 2, + "id": "ce2f994d", + "metadata": {}, + "outputs": [], + "source": [ + "# X-y split\n", + "# Normalize (numerical)" + ] + }, + { + "cell_type": "code", + "execution_count": 3, + "id": "64385983", + "metadata": {}, + "outputs": [ + { + "data": { + "text/html": [ + "
\n", + "\n", + "\n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + "
CustomerStateCustomer Lifetime ValueResponseCoverageEducationEffective To DateEmploymentStatusGenderIncome...Months Since Last ClaimMonths Since Policy InceptionNumber of Open ComplaintsNumber of PoliciesPolicy TypePolicyRenew Offer TypeSales ChannelVehicle ClassVehicle Size
0BU79786Washington2763.519279NoBasicBachelor2/24/11EmployedF56274...32501Corporate AutoCorporate L3Offer1AgentTwo-Door CarMedsize
1QZ44356Arizona6979.535903NoExtendedBachelor1/31/11UnemployedF0...134208Personal AutoPersonal L3Offer3AgentFour-Door CarMedsize
2AI49188Nevada12887.431650NoPremiumBachelor2/19/11EmployedF48767...183802Personal AutoPersonal L3Offer1AgentTwo-Door CarMedsize
3WW63253California7645.861827NoBasicBachelor1/20/11UnemployedM0...186507Corporate AutoCorporate L2Offer1Call CenterSUVMedsize
4HB64268Washington2813.692575NoBasicBachelor2/3/11EmployedM43836...124401Personal AutoPersonal L1Offer1AgentFour-Door CarMedsize
..................................................................
9129LA72316California23405.987980NoBasicBachelor2/10/11EmployedM71941...188902Personal AutoPersonal L1Offer2WebFour-Door CarMedsize
9130PK87824California3096.511217YesExtendedCollege2/12/11EmployedF21604...142801Corporate AutoCorporate L3Offer1BranchFour-Door CarMedsize
9131TD14365California8163.890428NoExtendedBachelor2/6/11UnemployedM0...93732Corporate AutoCorporate L2Offer1BranchFour-Door CarMedsize
9132UP19263California7524.442436NoExtendedCollege2/3/11EmployedM21941...34303Personal AutoPersonal L2Offer3BranchFour-Door CarLarge
9133Y167826California2611.836866NoExtendedCollege2/14/11UnemployedM0...39001Corporate AutoCorporate L3Offer4Call CenterTwo-Door CarMedsize
\n", + "

9134 rows × 23 columns

\n", + "
" + ], + "text/plain": [ + " Customer State Customer Lifetime Value Response Coverage \\\n", + "0 BU79786 Washington 2763.519279 No Basic \n", + "1 QZ44356 Arizona 6979.535903 No Extended \n", + "2 AI49188 Nevada 12887.431650 No Premium \n", + "3 WW63253 California 7645.861827 No Basic \n", + "4 HB64268 Washington 2813.692575 No Basic \n", + "... ... ... ... ... ... \n", + "9129 LA72316 California 23405.987980 No Basic \n", + "9130 PK87824 California 3096.511217 Yes Extended \n", + "9131 TD14365 California 8163.890428 No Extended \n", + "9132 UP19263 California 7524.442436 No Extended \n", + "9133 Y167826 California 2611.836866 No Extended \n", + "\n", + " Education Effective To Date EmploymentStatus Gender Income ... \\\n", + "0 Bachelor 2/24/11 Employed F 56274 ... \n", + "1 Bachelor 1/31/11 Unemployed F 0 ... \n", + "2 Bachelor 2/19/11 Employed F 48767 ... \n", + "3 Bachelor 1/20/11 Unemployed M 0 ... \n", + "4 Bachelor 2/3/11 Employed M 43836 ... \n", + "... ... ... ... ... ... ... \n", + "9129 Bachelor 2/10/11 Employed M 71941 ... \n", + "9130 College 2/12/11 Employed F 21604 ... \n", + "9131 Bachelor 2/6/11 Unemployed M 0 ... \n", + "9132 College 2/3/11 Employed M 21941 ... \n", + "9133 College 2/14/11 Unemployed M 0 ... \n", + "\n", + " Months Since Last Claim Months Since Policy Inception \\\n", + "0 32 5 \n", + "1 13 42 \n", + "2 18 38 \n", + "3 18 65 \n", + "4 12 44 \n", + "... ... ... \n", + "9129 18 89 \n", + "9130 14 28 \n", + "9131 9 37 \n", + "9132 34 3 \n", + "9133 3 90 \n", + "\n", + " Number of Open Complaints Number of Policies Policy Type \\\n", + "0 0 1 Corporate Auto \n", + "1 0 8 Personal Auto \n", + "2 0 2 Personal Auto \n", + "3 0 7 Corporate Auto \n", + "4 0 1 Personal Auto \n", + "... ... ... ... \n", + "9129 0 2 Personal Auto \n", + "9130 0 1 Corporate Auto \n", + "9131 3 2 Corporate Auto \n", + "9132 0 3 Personal Auto \n", + "9133 0 1 Corporate Auto \n", + "\n", + " Policy Renew Offer Type Sales Channel Vehicle Class Vehicle Size \n", + "0 Corporate L3 Offer1 Agent Two-Door Car Medsize \n", + "1 Personal L3 Offer3 Agent Four-Door Car Medsize \n", + "2 Personal L3 Offer1 Agent Two-Door Car Medsize \n", + "3 Corporate L2 Offer1 Call Center SUV Medsize \n", + "4 Personal L1 Offer1 Agent Four-Door Car Medsize \n", + "... ... ... ... ... ... \n", + "9129 Personal L1 Offer2 Web Four-Door Car Medsize \n", + "9130 Corporate L3 Offer1 Branch Four-Door Car Medsize \n", + "9131 Corporate L2 Offer1 Branch Four-Door Car Medsize \n", + "9132 Personal L2 Offer3 Branch Four-Door Car Large \n", + "9133 Corporate L3 Offer4 Call Center Two-Door Car Medsize \n", + "\n", + "[9134 rows x 23 columns]" + ] + }, + "execution_count": 3, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "X = mc.drop('Total Claim Amount', axis=1)\n", + "y = mc['Total Claim Amount']\n", + "X" + ] + }, + { + "cell_type": "code", + "execution_count": 4, + "id": "8eb3e61d", + "metadata": {}, + "outputs": [], + "source": [ + "scaler = MinMaxScaler()" + ] + }, + { + "cell_type": "code", + "execution_count": 5, + "id": "8d03d5c1", + "metadata": {}, + "outputs": [ + { + "data": { + "text/html": [ + "
\n", + "\n", + "\n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + "
Customer Lifetime ValueIncomeMonthly Premium AutoMonths Since Last ClaimMonths Since Policy InceptionNumber of Open ComplaintsNumber of PoliciesTotal Claim Amount
02763.519279562746932501384.811147
16979.5359030941342081131.464935
212887.43165048767108183802566.472247
37645.8618270106186507529.881344
42813.6925754383673124401138.130879
...........................
912923405.9879807194173188902198.234764
91303096.5112172160479142801379.200000
91318163.89042808593732790.784983
91327524.442436219419634303691.200000
91332611.83686607739001369.600000
\n", + "

9134 rows × 8 columns

\n", + "
" + ], + "text/plain": [ + " Customer Lifetime Value Income Monthly Premium Auto \\\n", + "0 2763.519279 56274 69 \n", + "1 6979.535903 0 94 \n", + "2 12887.431650 48767 108 \n", + "3 7645.861827 0 106 \n", + "4 2813.692575 43836 73 \n", + "... ... ... ... \n", + "9129 23405.987980 71941 73 \n", + "9130 3096.511217 21604 79 \n", + "9131 8163.890428 0 85 \n", + "9132 7524.442436 21941 96 \n", + "9133 2611.836866 0 77 \n", + "\n", + " Months Since Last Claim Months Since Policy Inception \\\n", + "0 32 5 \n", + "1 13 42 \n", + "2 18 38 \n", + "3 18 65 \n", + "4 12 44 \n", + "... ... ... \n", + "9129 18 89 \n", + "9130 14 28 \n", + "9131 9 37 \n", + "9132 34 3 \n", + "9133 3 90 \n", + "\n", + " Number of Open Complaints Number of Policies Total Claim Amount \n", + "0 0 1 384.811147 \n", + "1 0 8 1131.464935 \n", + "2 0 2 566.472247 \n", + "3 0 7 529.881344 \n", + "4 0 1 138.130879 \n", + "... ... ... ... \n", + "9129 0 2 198.234764 \n", + "9130 0 1 379.200000 \n", + "9131 3 2 790.784983 \n", + "9132 0 3 691.200000 \n", + "9133 0 1 369.600000 \n", + "\n", + "[9134 rows x 8 columns]" + ] + }, + "execution_count": 5, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "mc_n = mc.select_dtypes(include = 'number')\n", + "mc_n" + ] + }, + { + "cell_type": "code", + "execution_count": 7, + "id": "df2ff8d5", + "metadata": {}, + "outputs": [ + { + "data": { + "text/html": [ + "
\n", + "\n", + "\n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + "
Customer Lifetime ValueIncomeMonthly Premium AutoMonths Since Last ClaimMonths Since Policy InceptionNumber of Open ComplaintsNumber of PoliciesTotal Claim Amount
00.0106290.5628470.0337550.9142860.0505050.00.0000.132974
10.0624060.0000000.1392410.3714290.4242420.00.8750.391051
20.1349600.4877630.1983120.5142860.3838380.00.1250.195764
30.0705890.0000000.1898730.5142860.6565660.00.7500.183117
40.0112450.4384430.0506330.3428570.4444440.00.0000.047710
...........................
91290.2641370.7195470.0506330.5142860.8989900.00.1250.068485
91300.0147190.2160810.0759490.4000000.2828280.00.0000.131034
91310.0769510.0000000.1012660.2571430.3737370.60.1250.273297
91320.0690980.2194520.1476790.9714290.0303030.00.2500.238876
91330.0087660.0000000.0675110.0857140.9090910.00.0000.127716
\n", + "

9134 rows × 8 columns

\n", + "
" + ], + "text/plain": [ + " Customer Lifetime Value Income Monthly Premium Auto \\\n", + "0 0.010629 0.562847 0.033755 \n", + "1 0.062406 0.000000 0.139241 \n", + "2 0.134960 0.487763 0.198312 \n", + "3 0.070589 0.000000 0.189873 \n", + "4 0.011245 0.438443 0.050633 \n", + "... ... ... ... \n", + "9129 0.264137 0.719547 0.050633 \n", + "9130 0.014719 0.216081 0.075949 \n", + "9131 0.076951 0.000000 0.101266 \n", + "9132 0.069098 0.219452 0.147679 \n", + "9133 0.008766 0.000000 0.067511 \n", + "\n", + " Months Since Last Claim Months Since Policy Inception \\\n", + "0 0.914286 0.050505 \n", + "1 0.371429 0.424242 \n", + "2 0.514286 0.383838 \n", + "3 0.514286 0.656566 \n", + "4 0.342857 0.444444 \n", + "... ... ... \n", + "9129 0.514286 0.898990 \n", + "9130 0.400000 0.282828 \n", + "9131 0.257143 0.373737 \n", + "9132 0.971429 0.030303 \n", + "9133 0.085714 0.909091 \n", + "\n", + " Number of Open Complaints Number of Policies Total Claim Amount \n", + "0 0.0 0.000 0.132974 \n", + "1 0.0 0.875 0.391051 \n", + "2 0.0 0.125 0.195764 \n", + "3 0.0 0.750 0.183117 \n", + "4 0.0 0.000 0.047710 \n", + "... ... ... ... \n", + "9129 0.0 0.125 0.068485 \n", + "9130 0.0 0.000 0.131034 \n", + "9131 0.6 0.125 0.273297 \n", + "9132 0.0 0.250 0.238876 \n", + "9133 0.0 0.000 0.127716 \n", + "\n", + "[9134 rows x 8 columns]" + ] + }, + "execution_count": 7, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "normalized_mc = scaler.fit_transform(mc_n)\n", + "normalized_mc = pd.DataFrame(normalized_mc, columns = mc_n.columns)\n", + "normalized_mc" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "id": "f045dbde", + "metadata": {}, + "outputs": [], + "source": [] + } + ], + "metadata": { + "kernelspec": { + "display_name": "Python 3 (ipykernel)", + "language": "python", + "name": "python3" + }, + "language_info": { + "codemirror_mode": { + "name": "ipython", + "version": 3 + }, + "file_extension": ".py", + "mimetype": "text/x-python", + "name": "python", + "nbconvert_exporter": "python", + "pygments_lexer": "ipython3", + "version": "3.11.4" + } + }, + "nbformat": 4, + "nbformat_minor": 5 +}