diff --git a/lab-customer-analysis-round-1-checkpoint.ipynb b/lab-customer-analysis-round-1-checkpoint.ipynb
new file mode 100644
index 0000000..0fa7fff
--- /dev/null
+++ b/lab-customer-analysis-round-1-checkpoint.ipynb
@@ -0,0 +1,2543 @@
+{
+ "cells": [
+ {
+ "cell_type": "code",
+ "execution_count": 101,
+ "id": "c43915d2",
+ "metadata": {},
+ "outputs": [
+ {
+ "data": {
+ "text/html": [
+ "
\n",
+ "\n",
+ "
\n",
+ " \n",
+ " \n",
+ " | \n",
+ " Customer | \n",
+ " ST | \n",
+ " GENDER | \n",
+ " Education | \n",
+ " Customer Lifetime Value | \n",
+ " Income | \n",
+ " Monthly Premium Auto | \n",
+ " Number of Open Complaints | \n",
+ " Policy Type | \n",
+ " Vehicle Class | \n",
+ " Total Claim Amount | \n",
+ "
\n",
+ " \n",
+ " \n",
+ " \n",
+ " 0 | \n",
+ " RB50392 | \n",
+ " Washington | \n",
+ " NaN | \n",
+ " Master | \n",
+ " NaN | \n",
+ " 0.0 | \n",
+ " 1000.0 | \n",
+ " 1/0/00 | \n",
+ " Personal Auto | \n",
+ " Four-Door Car | \n",
+ " 2.704934 | \n",
+ "
\n",
+ " \n",
+ " 1 | \n",
+ " QZ44356 | \n",
+ " Arizona | \n",
+ " F | \n",
+ " Bachelor | \n",
+ " 697953.59% | \n",
+ " 0.0 | \n",
+ " 94.0 | \n",
+ " 1/0/00 | \n",
+ " Personal Auto | \n",
+ " Four-Door Car | \n",
+ " 1131.464935 | \n",
+ "
\n",
+ " \n",
+ " 2 | \n",
+ " AI49188 | \n",
+ " Nevada | \n",
+ " F | \n",
+ " Bachelor | \n",
+ " 1288743.17% | \n",
+ " 48767.0 | \n",
+ " 108.0 | \n",
+ " 1/0/00 | \n",
+ " Personal Auto | \n",
+ " Two-Door Car | \n",
+ " 566.472247 | \n",
+ "
\n",
+ " \n",
+ " 3 | \n",
+ " WW63253 | \n",
+ " California | \n",
+ " M | \n",
+ " Bachelor | \n",
+ " 764586.18% | \n",
+ " 0.0 | \n",
+ " 106.0 | \n",
+ " 1/0/00 | \n",
+ " Corporate Auto | \n",
+ " SUV | \n",
+ " 529.881344 | \n",
+ "
\n",
+ " \n",
+ " 4 | \n",
+ " GA49547 | \n",
+ " Washington | \n",
+ " M | \n",
+ " High School or Below | \n",
+ " 536307.65% | \n",
+ " 36357.0 | \n",
+ " 68.0 | \n",
+ " 1/0/00 | \n",
+ " Personal Auto | \n",
+ " Four-Door Car | \n",
+ " 17.269323 | \n",
+ "
\n",
+ " \n",
+ " ... | \n",
+ " ... | \n",
+ " ... | \n",
+ " ... | \n",
+ " ... | \n",
+ " ... | \n",
+ " ... | \n",
+ " ... | \n",
+ " ... | \n",
+ " ... | \n",
+ " ... | \n",
+ " ... | \n",
+ "
\n",
+ " \n",
+ " 4003 | \n",
+ " NaN | \n",
+ " NaN | \n",
+ " NaN | \n",
+ " NaN | \n",
+ " NaN | \n",
+ " NaN | \n",
+ " NaN | \n",
+ " NaN | \n",
+ " NaN | \n",
+ " NaN | \n",
+ " NaN | \n",
+ "
\n",
+ " \n",
+ " 4004 | \n",
+ " NaN | \n",
+ " NaN | \n",
+ " NaN | \n",
+ " NaN | \n",
+ " NaN | \n",
+ " NaN | \n",
+ " NaN | \n",
+ " NaN | \n",
+ " NaN | \n",
+ " NaN | \n",
+ " NaN | \n",
+ "
\n",
+ " \n",
+ " 4005 | \n",
+ " NaN | \n",
+ " NaN | \n",
+ " NaN | \n",
+ " NaN | \n",
+ " NaN | \n",
+ " NaN | \n",
+ " NaN | \n",
+ " NaN | \n",
+ " NaN | \n",
+ " NaN | \n",
+ " NaN | \n",
+ "
\n",
+ " \n",
+ " 4006 | \n",
+ " NaN | \n",
+ " NaN | \n",
+ " NaN | \n",
+ " NaN | \n",
+ " NaN | \n",
+ " NaN | \n",
+ " NaN | \n",
+ " NaN | \n",
+ " NaN | \n",
+ " NaN | \n",
+ " NaN | \n",
+ "
\n",
+ " \n",
+ " 4007 | \n",
+ " NaN | \n",
+ " NaN | \n",
+ " NaN | \n",
+ " NaN | \n",
+ " NaN | \n",
+ " NaN | \n",
+ " NaN | \n",
+ " NaN | \n",
+ " NaN | \n",
+ " NaN | \n",
+ " NaN | \n",
+ "
\n",
+ " \n",
+ "
\n",
+ "
4008 rows × 11 columns
\n",
+ "
"
+ ],
+ "text/plain": [
+ " Customer ST GENDER Education \\\n",
+ "0 RB50392 Washington NaN Master \n",
+ "1 QZ44356 Arizona F Bachelor \n",
+ "2 AI49188 Nevada F Bachelor \n",
+ "3 WW63253 California M Bachelor \n",
+ "4 GA49547 Washington M High School or Below \n",
+ "... ... ... ... ... \n",
+ "4003 NaN NaN NaN NaN \n",
+ "4004 NaN NaN NaN NaN \n",
+ "4005 NaN NaN NaN NaN \n",
+ "4006 NaN NaN NaN NaN \n",
+ "4007 NaN NaN NaN NaN \n",
+ "\n",
+ " Customer Lifetime Value Income Monthly Premium Auto \\\n",
+ "0 NaN 0.0 1000.0 \n",
+ "1 697953.59% 0.0 94.0 \n",
+ "2 1288743.17% 48767.0 108.0 \n",
+ "3 764586.18% 0.0 106.0 \n",
+ "4 536307.65% 36357.0 68.0 \n",
+ "... ... ... ... \n",
+ "4003 NaN NaN NaN \n",
+ "4004 NaN NaN NaN \n",
+ "4005 NaN NaN NaN \n",
+ "4006 NaN NaN NaN \n",
+ "4007 NaN NaN NaN \n",
+ "\n",
+ " Number of Open Complaints Policy Type Vehicle Class \\\n",
+ "0 1/0/00 Personal Auto Four-Door Car \n",
+ "1 1/0/00 Personal Auto Four-Door Car \n",
+ "2 1/0/00 Personal Auto Two-Door Car \n",
+ "3 1/0/00 Corporate Auto SUV \n",
+ "4 1/0/00 Personal Auto Four-Door Car \n",
+ "... ... ... ... \n",
+ "4003 NaN NaN NaN \n",
+ "4004 NaN NaN NaN \n",
+ "4005 NaN NaN NaN \n",
+ "4006 NaN NaN NaN \n",
+ "4007 NaN NaN NaN \n",
+ "\n",
+ " Total Claim Amount \n",
+ "0 2.704934 \n",
+ "1 1131.464935 \n",
+ "2 566.472247 \n",
+ "3 529.881344 \n",
+ "4 17.269323 \n",
+ "... ... \n",
+ "4003 NaN \n",
+ "4004 NaN \n",
+ "4005 NaN \n",
+ "4006 NaN \n",
+ "4007 NaN \n",
+ "\n",
+ "[4008 rows x 11 columns]"
+ ]
+ },
+ "execution_count": 101,
+ "metadata": {},
+ "output_type": "execute_result"
+ }
+ ],
+ "source": [
+ "# Load file1.csv into a DataFrame and display it.\n",
+ "import pandas as pd\n",
+ "\n",
+ "# NOTE(review): absolute, machine-specific path - confirm whether a path\n",
+ "# relative to the notebook should be used instead.\n",
+ "file1_path = r'C:\\Users\\david\\OneDrive\\Ambiente de Trabalho\\Iron Hack\\ficheiros para LAB PANDA 1\\file1.csv'\n",
+ "tab1_data = pd.read_csv(file1_path)\n",
+ "\n",
+ "# Last expression of the cell: the notebook renders it as the cell output.\n",
+ "tab1_data"
+ ]
+ },
+ {
+ "cell_type": "code",
+ "execution_count": 102,
+ "id": "297404d5",
+ "metadata": {},
+ "outputs": [
+ {
+ "data": {
+ "text/html": [
+ "\n",
+ "\n",
+ "
\n",
+ " \n",
+ " \n",
+ " | \n",
+ " Customer | \n",
+ " ST | \n",
+ " GENDER | \n",
+ " Education | \n",
+ " Customer Lifetime Value | \n",
+ " Income | \n",
+ " Monthly Premium Auto | \n",
+ " Number of Open Complaints | \n",
+ " Total Claim Amount | \n",
+ " Policy Type | \n",
+ " Vehicle Class | \n",
+ "
\n",
+ " \n",
+ " \n",
+ " \n",
+ " 0 | \n",
+ " GS98873 | \n",
+ " Arizona | \n",
+ " F | \n",
+ " Bachelor | \n",
+ " 323912.47% | \n",
+ " 16061 | \n",
+ " 88 | \n",
+ " 1/0/00 | \n",
+ " 633.600000 | \n",
+ " Personal Auto | \n",
+ " Four-Door Car | \n",
+ "
\n",
+ " \n",
+ " 1 | \n",
+ " CW49887 | \n",
+ " California | \n",
+ " F | \n",
+ " Master | \n",
+ " 462680.11% | \n",
+ " 79487 | \n",
+ " 114 | \n",
+ " 1/0/00 | \n",
+ " 547.200000 | \n",
+ " Special Auto | \n",
+ " SUV | \n",
+ "
\n",
+ " \n",
+ " 2 | \n",
+ " MY31220 | \n",
+ " California | \n",
+ " F | \n",
+ " College | \n",
+ " 899704.02% | \n",
+ " 54230 | \n",
+ " 112 | \n",
+ " 1/0/00 | \n",
+ " 537.600000 | \n",
+ " Personal Auto | \n",
+ " Two-Door Car | \n",
+ "
\n",
+ " \n",
+ " 3 | \n",
+ " UH35128 | \n",
+ " Oregon | \n",
+ " F | \n",
+ " College | \n",
+ " 2580706.30% | \n",
+ " 71210 | \n",
+ " 214 | \n",
+ " 1/1/00 | \n",
+ " 1027.200000 | \n",
+ " Personal Auto | \n",
+ " Luxury Car | \n",
+ "
\n",
+ " \n",
+ " 4 | \n",
+ " WH52799 | \n",
+ " Arizona | \n",
+ " F | \n",
+ " College | \n",
+ " 380812.21% | \n",
+ " 94903 | \n",
+ " 94 | \n",
+ " 1/0/00 | \n",
+ " 451.200000 | \n",
+ " Corporate Auto | \n",
+ " Two-Door Car | \n",
+ "
\n",
+ " \n",
+ " ... | \n",
+ " ... | \n",
+ " ... | \n",
+ " ... | \n",
+ " ... | \n",
+ " ... | \n",
+ " ... | \n",
+ " ... | \n",
+ " ... | \n",
+ " ... | \n",
+ " ... | \n",
+ " ... | \n",
+ "
\n",
+ " \n",
+ " 991 | \n",
+ " HV85198 | \n",
+ " Arizona | \n",
+ " M | \n",
+ " Master | \n",
+ " 847141.75% | \n",
+ " 63513 | \n",
+ " 70 | \n",
+ " 1/0/00 | \n",
+ " 185.667213 | \n",
+ " Personal Auto | \n",
+ " Four-Door Car | \n",
+ "
\n",
+ " \n",
+ " 992 | \n",
+ " BS91566 | \n",
+ " Arizona | \n",
+ " F | \n",
+ " College | \n",
+ " 543121.91% | \n",
+ " 58161 | \n",
+ " 68 | \n",
+ " 1/0/00 | \n",
+ " 140.747286 | \n",
+ " Corporate Auto | \n",
+ " Four-Door Car | \n",
+ "
\n",
+ " \n",
+ " 993 | \n",
+ " IL40123 | \n",
+ " Nevada | \n",
+ " F | \n",
+ " College | \n",
+ " 568964.41% | \n",
+ " 83640 | \n",
+ " 70 | \n",
+ " 1/0/00 | \n",
+ " 471.050488 | \n",
+ " Corporate Auto | \n",
+ " Two-Door Car | \n",
+ "
\n",
+ " \n",
+ " 994 | \n",
+ " MY32149 | \n",
+ " California | \n",
+ " F | \n",
+ " Master | \n",
+ " 368672.38% | \n",
+ " 0 | \n",
+ " 96 | \n",
+ " 1/0/00 | \n",
+ " 28.460568 | \n",
+ " Personal Auto | \n",
+ " Two-Door Car | \n",
+ "
\n",
+ " \n",
+ " 995 | \n",
+ " SA91515 | \n",
+ " California | \n",
+ " M | \n",
+ " Bachelor | \n",
+ " 399258.39% | \n",
+ " 0 | \n",
+ " 111 | \n",
+ " 1/0/00 | \n",
+ " 700.349052 | \n",
+ " Personal Auto | \n",
+ " SUV | \n",
+ "
\n",
+ " \n",
+ "
\n",
+ "
996 rows × 11 columns
\n",
+ "
"
+ ],
+ "text/plain": [
+ " Customer ST GENDER Education Customer Lifetime Value Income \\\n",
+ "0 GS98873 Arizona F Bachelor 323912.47% 16061 \n",
+ "1 CW49887 California F Master 462680.11% 79487 \n",
+ "2 MY31220 California F College 899704.02% 54230 \n",
+ "3 UH35128 Oregon F College 2580706.30% 71210 \n",
+ "4 WH52799 Arizona F College 380812.21% 94903 \n",
+ ".. ... ... ... ... ... ... \n",
+ "991 HV85198 Arizona M Master 847141.75% 63513 \n",
+ "992 BS91566 Arizona F College 543121.91% 58161 \n",
+ "993 IL40123 Nevada F College 568964.41% 83640 \n",
+ "994 MY32149 California F Master 368672.38% 0 \n",
+ "995 SA91515 California M Bachelor 399258.39% 0 \n",
+ "\n",
+ " Monthly Premium Auto Number of Open Complaints Total Claim Amount \\\n",
+ "0 88 1/0/00 633.600000 \n",
+ "1 114 1/0/00 547.200000 \n",
+ "2 112 1/0/00 537.600000 \n",
+ "3 214 1/1/00 1027.200000 \n",
+ "4 94 1/0/00 451.200000 \n",
+ ".. ... ... ... \n",
+ "991 70 1/0/00 185.667213 \n",
+ "992 68 1/0/00 140.747286 \n",
+ "993 70 1/0/00 471.050488 \n",
+ "994 96 1/0/00 28.460568 \n",
+ "995 111 1/0/00 700.349052 \n",
+ "\n",
+ " Policy Type Vehicle Class \n",
+ "0 Personal Auto Four-Door Car \n",
+ "1 Special Auto SUV \n",
+ "2 Personal Auto Two-Door Car \n",
+ "3 Personal Auto Luxury Car \n",
+ "4 Corporate Auto Two-Door Car \n",
+ ".. ... ... \n",
+ "991 Personal Auto Four-Door Car \n",
+ "992 Corporate Auto Four-Door Car \n",
+ "993 Corporate Auto Two-Door Car \n",
+ "994 Personal Auto Two-Door Car \n",
+ "995 Personal Auto SUV \n",
+ "\n",
+ "[996 rows x 11 columns]"
+ ]
+ },
+ "execution_count": 102,
+ "metadata": {},
+ "output_type": "execute_result"
+ }
+ ],
+ "source": [
+ "# Load file2.csv into a DataFrame and display it.\n",
+ "# NOTE(review): absolute, machine-specific path - confirm whether a path\n",
+ "# relative to the notebook should be used instead.\n",
+ "file2_path = r'C:\\Users\\david\\OneDrive\\Ambiente de Trabalho\\Iron Hack\\ficheiros para LAB PANDA 1\\file2.csv'\n",
+ "tab2_data = pd.read_csv(file2_path)\n",
+ "\n",
+ "# Last expression of the cell: the notebook renders it as the cell output.\n",
+ "tab2_data"
+ ]
+ },
+ {
+ "cell_type": "code",
+ "execution_count": 103,
+ "id": "5698462b",
+ "metadata": {},
+ "outputs": [
+ {
+ "data": {
+ "text/html": [
+ "\n",
+ "\n",
+ "
\n",
+ " \n",
+ " \n",
+ " | \n",
+ " Customer | \n",
+ " State | \n",
+ " Customer Lifetime Value | \n",
+ " Education | \n",
+ " Gender | \n",
+ " Income | \n",
+ " Monthly Premium Auto | \n",
+ " Number of Open Complaints | \n",
+ " Policy Type | \n",
+ " Total Claim Amount | \n",
+ " Vehicle Class | \n",
+ "
\n",
+ " \n",
+ " \n",
+ " \n",
+ " 0 | \n",
+ " SA25987 | \n",
+ " Washington | \n",
+ " 3479.137523 | \n",
+ " High School or Below | \n",
+ " M | \n",
+ " 0 | \n",
+ " 104 | \n",
+ " 0 | \n",
+ " Personal Auto | \n",
+ " 499.200000 | \n",
+ " Two-Door Car | \n",
+ "
\n",
+ " \n",
+ " 1 | \n",
+ " TB86706 | \n",
+ " Arizona | \n",
+ " 2502.637401 | \n",
+ " Master | \n",
+ " M | \n",
+ " 0 | \n",
+ " 66 | \n",
+ " 0 | \n",
+ " Personal Auto | \n",
+ " 3.468912 | \n",
+ " Two-Door Car | \n",
+ "
\n",
+ " \n",
+ " 2 | \n",
+ " ZL73902 | \n",
+ " Nevada | \n",
+ " 3265.156348 | \n",
+ " Bachelor | \n",
+ " F | \n",
+ " 25820 | \n",
+ " 82 | \n",
+ " 0 | \n",
+ " Personal Auto | \n",
+ " 393.600000 | \n",
+ " Four-Door Car | \n",
+ "
\n",
+ " \n",
+ " 3 | \n",
+ " KX23516 | \n",
+ " California | \n",
+ " 4455.843406 | \n",
+ " High School or Below | \n",
+ " F | \n",
+ " 0 | \n",
+ " 121 | \n",
+ " 0 | \n",
+ " Personal Auto | \n",
+ " 699.615192 | \n",
+ " SUV | \n",
+ "
\n",
+ " \n",
+ " 4 | \n",
+ " FN77294 | \n",
+ " California | \n",
+ " 7704.958480 | \n",
+ " High School or Below | \n",
+ " M | \n",
+ " 30366 | \n",
+ " 101 | \n",
+ " 2 | \n",
+ " Personal Auto | \n",
+ " 484.800000 | \n",
+ " SUV | \n",
+ "
\n",
+ " \n",
+ " ... | \n",
+ " ... | \n",
+ " ... | \n",
+ " ... | \n",
+ " ... | \n",
+ " ... | \n",
+ " ... | \n",
+ " ... | \n",
+ " ... | \n",
+ " ... | \n",
+ " ... | \n",
+ " ... | \n",
+ "
\n",
+ " \n",
+ " 7065 | \n",
+ " LA72316 | \n",
+ " California | \n",
+ " 23405.987980 | \n",
+ " Bachelor | \n",
+ " M | \n",
+ " 71941 | \n",
+ " 73 | \n",
+ " 0 | \n",
+ " Personal Auto | \n",
+ " 198.234764 | \n",
+ " Four-Door Car | \n",
+ "
\n",
+ " \n",
+ " 7066 | \n",
+ " PK87824 | \n",
+ " California | \n",
+ " 3096.511217 | \n",
+ " College | \n",
+ " F | \n",
+ " 21604 | \n",
+ " 79 | \n",
+ " 0 | \n",
+ " Corporate Auto | \n",
+ " 379.200000 | \n",
+ " Four-Door Car | \n",
+ "
\n",
+ " \n",
+ " 7067 | \n",
+ " TD14365 | \n",
+ " California | \n",
+ " 8163.890428 | \n",
+ " Bachelor | \n",
+ " M | \n",
+ " 0 | \n",
+ " 85 | \n",
+ " 3 | \n",
+ " Corporate Auto | \n",
+ " 790.784983 | \n",
+ " Four-Door Car | \n",
+ "
\n",
+ " \n",
+ " 7068 | \n",
+ " UP19263 | \n",
+ " California | \n",
+ " 7524.442436 | \n",
+ " College | \n",
+ " M | \n",
+ " 21941 | \n",
+ " 96 | \n",
+ " 0 | \n",
+ " Personal Auto | \n",
+ " 691.200000 | \n",
+ " Four-Door Car | \n",
+ "
\n",
+ " \n",
+ " 7069 | \n",
+ " Y167826 | \n",
+ " California | \n",
+ " 2611.836866 | \n",
+ " College | \n",
+ " M | \n",
+ " 0 | \n",
+ " 77 | \n",
+ " 0 | \n",
+ " Corporate Auto | \n",
+ " 369.600000 | \n",
+ " Two-Door Car | \n",
+ "
\n",
+ " \n",
+ "
\n",
+ "
7070 rows × 11 columns
\n",
+ "
"
+ ],
+ "text/plain": [
+ " Customer State Customer Lifetime Value Education \\\n",
+ "0 SA25987 Washington 3479.137523 High School or Below \n",
+ "1 TB86706 Arizona 2502.637401 Master \n",
+ "2 ZL73902 Nevada 3265.156348 Bachelor \n",
+ "3 KX23516 California 4455.843406 High School or Below \n",
+ "4 FN77294 California 7704.958480 High School or Below \n",
+ "... ... ... ... ... \n",
+ "7065 LA72316 California 23405.987980 Bachelor \n",
+ "7066 PK87824 California 3096.511217 College \n",
+ "7067 TD14365 California 8163.890428 Bachelor \n",
+ "7068 UP19263 California 7524.442436 College \n",
+ "7069 Y167826 California 2611.836866 College \n",
+ "\n",
+ " Gender Income Monthly Premium Auto Number of Open Complaints \\\n",
+ "0 M 0 104 0 \n",
+ "1 M 0 66 0 \n",
+ "2 F 25820 82 0 \n",
+ "3 F 0 121 0 \n",
+ "4 M 30366 101 2 \n",
+ "... ... ... ... ... \n",
+ "7065 M 71941 73 0 \n",
+ "7066 F 21604 79 0 \n",
+ "7067 M 0 85 3 \n",
+ "7068 M 21941 96 0 \n",
+ "7069 M 0 77 0 \n",
+ "\n",
+ " Policy Type Total Claim Amount Vehicle Class \n",
+ "0 Personal Auto 499.200000 Two-Door Car \n",
+ "1 Personal Auto 3.468912 Two-Door Car \n",
+ "2 Personal Auto 393.600000 Four-Door Car \n",
+ "3 Personal Auto 699.615192 SUV \n",
+ "4 Personal Auto 484.800000 SUV \n",
+ "... ... ... ... \n",
+ "7065 Personal Auto 198.234764 Four-Door Car \n",
+ "7066 Corporate Auto 379.200000 Four-Door Car \n",
+ "7067 Corporate Auto 790.784983 Four-Door Car \n",
+ "7068 Personal Auto 691.200000 Four-Door Car \n",
+ "7069 Corporate Auto 369.600000 Two-Door Car \n",
+ "\n",
+ "[7070 rows x 11 columns]"
+ ]
+ },
+ "execution_count": 103,
+ "metadata": {},
+ "output_type": "execute_result"
+ }
+ ],
+ "source": [
+ "# Load file3.csv into a DataFrame and display it.\n",
+ "# NOTE(review): absolute, machine-specific path - confirm whether a path\n",
+ "# relative to the notebook should be used instead.\n",
+ "file3_path = r'C:\\Users\\david\\OneDrive\\Ambiente de Trabalho\\Iron Hack\\ficheiros para LAB PANDA 1\\file3.csv'\n",
+ "tab3_data = pd.read_csv(file3_path)\n",
+ "\n",
+ "# Last expression of the cell: the notebook renders it as the cell output.\n",
+ "tab3_data"
+ ]
+ },
+ {
+ "cell_type": "code",
+ "execution_count": 104,
+ "id": "10a878b6",
+ "metadata": {},
+ "outputs": [
+ {
+ "data": {
+ "text/plain": [
+ "((4008, 11), (996, 11), (7070, 11))"
+ ]
+ },
+ "execution_count": 104,
+ "metadata": {},
+ "output_type": "execute_result"
+ }
+ ],
+ "source": [
+ "# Show the shape (rows, columns) of each of the three loaded DataFrames.\n",
+ "# A notebook cell only echoes the value of its last expression, so the three\n",
+ "# shapes are combined into one tuple; as separate statements only the shape\n",
+ "# of tab3_data would be displayed.\n",
+ "tab1_data.shape, tab2_data.shape, tab3_data.shape"
+ ]
+ },
+ {
+ "cell_type": "code",
+ "execution_count": 105,
+ "id": "7eaccb15",
+ "metadata": {},
+ "outputs": [
+ {
+ "data": {
+ "text/html": [
+ "\n",
+ "\n",
+ "
\n",
+ " \n",
+ " \n",
+ " | \n",
+ " customer | \n",
+ " st | \n",
+ " gender | \n",
+ " education | \n",
+ " customer_lifetime_value | \n",
+ " income | \n",
+ " monthly_premium_auto | \n",
+ " number_of_open_complaints | \n",
+ " policy_type | \n",
+ " vehicle_class | \n",
+ " total_claim_amount | \n",
+ "
\n",
+ " \n",
+ " \n",
+ " \n",
+ " 0 | \n",
+ " RB50392 | \n",
+ " Washington | \n",
+ " NaN | \n",
+ " Master | \n",
+ " NaN | \n",
+ " 0.0 | \n",
+ " 1000.0 | \n",
+ " 1/0/00 | \n",
+ " Personal Auto | \n",
+ " Four-Door Car | \n",
+ " 2.704934 | \n",
+ "
\n",
+ " \n",
+ " 1 | \n",
+ " QZ44356 | \n",
+ " Arizona | \n",
+ " F | \n",
+ " Bachelor | \n",
+ " 697953.59% | \n",
+ " 0.0 | \n",
+ " 94.0 | \n",
+ " 1/0/00 | \n",
+ " Personal Auto | \n",
+ " Four-Door Car | \n",
+ " 1131.464935 | \n",
+ "
\n",
+ " \n",
+ " 2 | \n",
+ " AI49188 | \n",
+ " Nevada | \n",
+ " F | \n",
+ " Bachelor | \n",
+ " 1288743.17% | \n",
+ " 48767.0 | \n",
+ " 108.0 | \n",
+ " 1/0/00 | \n",
+ " Personal Auto | \n",
+ " Two-Door Car | \n",
+ " 566.472247 | \n",
+ "
\n",
+ " \n",
+ " 3 | \n",
+ " WW63253 | \n",
+ " California | \n",
+ " M | \n",
+ " Bachelor | \n",
+ " 764586.18% | \n",
+ " 0.0 | \n",
+ " 106.0 | \n",
+ " 1/0/00 | \n",
+ " Corporate Auto | \n",
+ " SUV | \n",
+ " 529.881344 | \n",
+ "
\n",
+ " \n",
+ " 4 | \n",
+ " GA49547 | \n",
+ " Washington | \n",
+ " M | \n",
+ " High School or Below | \n",
+ " 536307.65% | \n",
+ " 36357.0 | \n",
+ " 68.0 | \n",
+ " 1/0/00 | \n",
+ " Personal Auto | \n",
+ " Four-Door Car | \n",
+ " 17.269323 | \n",
+ "
\n",
+ " \n",
+ " ... | \n",
+ " ... | \n",
+ " ... | \n",
+ " ... | \n",
+ " ... | \n",
+ " ... | \n",
+ " ... | \n",
+ " ... | \n",
+ " ... | \n",
+ " ... | \n",
+ " ... | \n",
+ " ... | \n",
+ "
\n",
+ " \n",
+ " 4003 | \n",
+ " NaN | \n",
+ " NaN | \n",
+ " NaN | \n",
+ " NaN | \n",
+ " NaN | \n",
+ " NaN | \n",
+ " NaN | \n",
+ " NaN | \n",
+ " NaN | \n",
+ " NaN | \n",
+ " NaN | \n",
+ "
\n",
+ " \n",
+ " 4004 | \n",
+ " NaN | \n",
+ " NaN | \n",
+ " NaN | \n",
+ " NaN | \n",
+ " NaN | \n",
+ " NaN | \n",
+ " NaN | \n",
+ " NaN | \n",
+ " NaN | \n",
+ " NaN | \n",
+ " NaN | \n",
+ "
\n",
+ " \n",
+ " 4005 | \n",
+ " NaN | \n",
+ " NaN | \n",
+ " NaN | \n",
+ " NaN | \n",
+ " NaN | \n",
+ " NaN | \n",
+ " NaN | \n",
+ " NaN | \n",
+ " NaN | \n",
+ " NaN | \n",
+ " NaN | \n",
+ "
\n",
+ " \n",
+ " 4006 | \n",
+ " NaN | \n",
+ " NaN | \n",
+ " NaN | \n",
+ " NaN | \n",
+ " NaN | \n",
+ " NaN | \n",
+ " NaN | \n",
+ " NaN | \n",
+ " NaN | \n",
+ " NaN | \n",
+ " NaN | \n",
+ "
\n",
+ " \n",
+ " 4007 | \n",
+ " NaN | \n",
+ " NaN | \n",
+ " NaN | \n",
+ " NaN | \n",
+ " NaN | \n",
+ " NaN | \n",
+ " NaN | \n",
+ " NaN | \n",
+ " NaN | \n",
+ " NaN | \n",
+ " NaN | \n",
+ "
\n",
+ " \n",
+ "
\n",
+ "
4008 rows × 11 columns
\n",
+ "
"
+ ],
+ "text/plain": [
+ " customer st gender education \\\n",
+ "0 RB50392 Washington NaN Master \n",
+ "1 QZ44356 Arizona F Bachelor \n",
+ "2 AI49188 Nevada F Bachelor \n",
+ "3 WW63253 California M Bachelor \n",
+ "4 GA49547 Washington M High School or Below \n",
+ "... ... ... ... ... \n",
+ "4003 NaN NaN NaN NaN \n",
+ "4004 NaN NaN NaN NaN \n",
+ "4005 NaN NaN NaN NaN \n",
+ "4006 NaN NaN NaN NaN \n",
+ "4007 NaN NaN NaN NaN \n",
+ "\n",
+ " customer_lifetime_value income monthly_premium_auto \\\n",
+ "0 NaN 0.0 1000.0 \n",
+ "1 697953.59% 0.0 94.0 \n",
+ "2 1288743.17% 48767.0 108.0 \n",
+ "3 764586.18% 0.0 106.0 \n",
+ "4 536307.65% 36357.0 68.0 \n",
+ "... ... ... ... \n",
+ "4003 NaN NaN NaN \n",
+ "4004 NaN NaN NaN \n",
+ "4005 NaN NaN NaN \n",
+ "4006 NaN NaN NaN \n",
+ "4007 NaN NaN NaN \n",
+ "\n",
+ " number_of_open_complaints policy_type vehicle_class \\\n",
+ "0 1/0/00 Personal Auto Four-Door Car \n",
+ "1 1/0/00 Personal Auto Four-Door Car \n",
+ "2 1/0/00 Personal Auto Two-Door Car \n",
+ "3 1/0/00 Corporate Auto SUV \n",
+ "4 1/0/00 Personal Auto Four-Door Car \n",
+ "... ... ... ... \n",
+ "4003 NaN NaN NaN \n",
+ "4004 NaN NaN NaN \n",
+ "4005 NaN NaN NaN \n",
+ "4006 NaN NaN NaN \n",
+ "4007 NaN NaN NaN \n",
+ "\n",
+ " total_claim_amount \n",
+ "0 2.704934 \n",
+ "1 1131.464935 \n",
+ "2 566.472247 \n",
+ "3 529.881344 \n",
+ "4 17.269323 \n",
+ "... ... \n",
+ "4003 NaN \n",
+ "4004 NaN \n",
+ "4005 NaN \n",
+ "4006 NaN \n",
+ "4007 NaN \n",
+ "\n",
+ "[4008 rows x 11 columns]"
+ ]
+ },
+ "execution_count": 105,
+ "metadata": {},
+ "output_type": "execute_result"
+ }
+ ],
+ "source": [
+ "# Standardize the header names of table 1: lower-case, spaces -> underscores.\n",
+ "# Iterate over the column labels directly instead of indexing by position.\n",
+ "# `cols` stays a notebook-level name in case a later cell reads it.\n",
+ "cols = [name.lower().replace(' ', '_') for name in tab1_data.columns]\n",
+ "tab1_data.columns = cols\n",
+ "\n",
+ "# NOTE(review): this table's state column comes out as 'st' while table 3 uses\n",
+ "# 'state' - confirm the two are aligned before the tables are combined.\n",
+ "tab1_data"
+ ]
+ },
+ {
+ "cell_type": "code",
+ "execution_count": 106,
+ "id": "bb444eec",
+ "metadata": {},
+ "outputs": [
+ {
+ "data": {
+ "text/html": [
+ "\n",
+ "\n",
+ "
\n",
+ " \n",
+ " \n",
+ " | \n",
+ " customer | \n",
+ " st | \n",
+ " gender | \n",
+ " education | \n",
+ " customer_lifetime_value | \n",
+ " income | \n",
+ " monthly_premium_auto | \n",
+ " number_of_open_complaints | \n",
+ " total_claim_amount | \n",
+ " policy_type | \n",
+ " vehicle_class | \n",
+ "
\n",
+ " \n",
+ " \n",
+ " \n",
+ " 0 | \n",
+ " GS98873 | \n",
+ " Arizona | \n",
+ " F | \n",
+ " Bachelor | \n",
+ " 323912.47% | \n",
+ " 16061 | \n",
+ " 88 | \n",
+ " 1/0/00 | \n",
+ " 633.600000 | \n",
+ " Personal Auto | \n",
+ " Four-Door Car | \n",
+ "
\n",
+ " \n",
+ " 1 | \n",
+ " CW49887 | \n",
+ " California | \n",
+ " F | \n",
+ " Master | \n",
+ " 462680.11% | \n",
+ " 79487 | \n",
+ " 114 | \n",
+ " 1/0/00 | \n",
+ " 547.200000 | \n",
+ " Special Auto | \n",
+ " SUV | \n",
+ "
\n",
+ " \n",
+ " 2 | \n",
+ " MY31220 | \n",
+ " California | \n",
+ " F | \n",
+ " College | \n",
+ " 899704.02% | \n",
+ " 54230 | \n",
+ " 112 | \n",
+ " 1/0/00 | \n",
+ " 537.600000 | \n",
+ " Personal Auto | \n",
+ " Two-Door Car | \n",
+ "
\n",
+ " \n",
+ " 3 | \n",
+ " UH35128 | \n",
+ " Oregon | \n",
+ " F | \n",
+ " College | \n",
+ " 2580706.30% | \n",
+ " 71210 | \n",
+ " 214 | \n",
+ " 1/1/00 | \n",
+ " 1027.200000 | \n",
+ " Personal Auto | \n",
+ " Luxury Car | \n",
+ "
\n",
+ " \n",
+ " 4 | \n",
+ " WH52799 | \n",
+ " Arizona | \n",
+ " F | \n",
+ " College | \n",
+ " 380812.21% | \n",
+ " 94903 | \n",
+ " 94 | \n",
+ " 1/0/00 | \n",
+ " 451.200000 | \n",
+ " Corporate Auto | \n",
+ " Two-Door Car | \n",
+ "
\n",
+ " \n",
+ " ... | \n",
+ " ... | \n",
+ " ... | \n",
+ " ... | \n",
+ " ... | \n",
+ " ... | \n",
+ " ... | \n",
+ " ... | \n",
+ " ... | \n",
+ " ... | \n",
+ " ... | \n",
+ " ... | \n",
+ "
\n",
+ " \n",
+ " 991 | \n",
+ " HV85198 | \n",
+ " Arizona | \n",
+ " M | \n",
+ " Master | \n",
+ " 847141.75% | \n",
+ " 63513 | \n",
+ " 70 | \n",
+ " 1/0/00 | \n",
+ " 185.667213 | \n",
+ " Personal Auto | \n",
+ " Four-Door Car | \n",
+ "
\n",
+ " \n",
+ " 992 | \n",
+ " BS91566 | \n",
+ " Arizona | \n",
+ " F | \n",
+ " College | \n",
+ " 543121.91% | \n",
+ " 58161 | \n",
+ " 68 | \n",
+ " 1/0/00 | \n",
+ " 140.747286 | \n",
+ " Corporate Auto | \n",
+ " Four-Door Car | \n",
+ "
\n",
+ " \n",
+ " 993 | \n",
+ " IL40123 | \n",
+ " Nevada | \n",
+ " F | \n",
+ " College | \n",
+ " 568964.41% | \n",
+ " 83640 | \n",
+ " 70 | \n",
+ " 1/0/00 | \n",
+ " 471.050488 | \n",
+ " Corporate Auto | \n",
+ " Two-Door Car | \n",
+ "
\n",
+ " \n",
+ " 994 | \n",
+ " MY32149 | \n",
+ " California | \n",
+ " F | \n",
+ " Master | \n",
+ " 368672.38% | \n",
+ " 0 | \n",
+ " 96 | \n",
+ " 1/0/00 | \n",
+ " 28.460568 | \n",
+ " Personal Auto | \n",
+ " Two-Door Car | \n",
+ "
\n",
+ " \n",
+ " 995 | \n",
+ " SA91515 | \n",
+ " California | \n",
+ " M | \n",
+ " Bachelor | \n",
+ " 399258.39% | \n",
+ " 0 | \n",
+ " 111 | \n",
+ " 1/0/00 | \n",
+ " 700.349052 | \n",
+ " Personal Auto | \n",
+ " SUV | \n",
+ "
\n",
+ " \n",
+ "
\n",
+ "
996 rows × 11 columns
\n",
+ "
"
+ ],
+ "text/plain": [
+ " customer st gender education customer_lifetime_value income \\\n",
+ "0 GS98873 Arizona F Bachelor 323912.47% 16061 \n",
+ "1 CW49887 California F Master 462680.11% 79487 \n",
+ "2 MY31220 California F College 899704.02% 54230 \n",
+ "3 UH35128 Oregon F College 2580706.30% 71210 \n",
+ "4 WH52799 Arizona F College 380812.21% 94903 \n",
+ ".. ... ... ... ... ... ... \n",
+ "991 HV85198 Arizona M Master 847141.75% 63513 \n",
+ "992 BS91566 Arizona F College 543121.91% 58161 \n",
+ "993 IL40123 Nevada F College 568964.41% 83640 \n",
+ "994 MY32149 California F Master 368672.38% 0 \n",
+ "995 SA91515 California M Bachelor 399258.39% 0 \n",
+ "\n",
+ " monthly_premium_auto number_of_open_complaints total_claim_amount \\\n",
+ "0 88 1/0/00 633.600000 \n",
+ "1 114 1/0/00 547.200000 \n",
+ "2 112 1/0/00 537.600000 \n",
+ "3 214 1/1/00 1027.200000 \n",
+ "4 94 1/0/00 451.200000 \n",
+ ".. ... ... ... \n",
+ "991 70 1/0/00 185.667213 \n",
+ "992 68 1/0/00 140.747286 \n",
+ "993 70 1/0/00 471.050488 \n",
+ "994 96 1/0/00 28.460568 \n",
+ "995 111 1/0/00 700.349052 \n",
+ "\n",
+ " policy_type vehicle_class \n",
+ "0 Personal Auto Four-Door Car \n",
+ "1 Special Auto SUV \n",
+ "2 Personal Auto Two-Door Car \n",
+ "3 Personal Auto Luxury Car \n",
+ "4 Corporate Auto Two-Door Car \n",
+ ".. ... ... \n",
+ "991 Personal Auto Four-Door Car \n",
+ "992 Corporate Auto Four-Door Car \n",
+ "993 Corporate Auto Two-Door Car \n",
+ "994 Personal Auto Two-Door Car \n",
+ "995 Personal Auto SUV \n",
+ "\n",
+ "[996 rows x 11 columns]"
+ ]
+ },
+ "execution_count": 106,
+ "metadata": {},
+ "output_type": "execute_result"
+ }
+ ],
+ "source": [
+ "# Standardize the header names of table 2: lower-case, spaces -> underscores.\n",
+ "# Iterate over the column labels directly instead of indexing by position.\n",
+ "# `cols` stays a notebook-level name in case a later cell reads it.\n",
+ "cols = [name.lower().replace(' ', '_') for name in tab2_data.columns]\n",
+ "tab2_data.columns = cols\n",
+ "\n",
+ "# NOTE(review): this table's state column comes out as 'st' while table 3 uses\n",
+ "# 'state' - confirm the two are aligned before the tables are combined.\n",
+ "tab2_data"
+ ]
+ },
+ {
+ "cell_type": "code",
+ "execution_count": 107,
+ "id": "0fcf53af",
+ "metadata": {},
+ "outputs": [
+ {
+ "data": {
+ "text/html": [
+ "\n",
+ "\n",
+ "
\n",
+ " \n",
+ " \n",
+ " | \n",
+ " customer | \n",
+ " state | \n",
+ " customer_lifetime_value | \n",
+ " education | \n",
+ " gender | \n",
+ " income | \n",
+ " monthly_premium_auto | \n",
+ " number_of_open_complaints | \n",
+ " policy_type | \n",
+ " total_claim_amount | \n",
+ " vehicle_class | \n",
+ "
\n",
+ " \n",
+ " \n",
+ " \n",
+ " 0 | \n",
+ " SA25987 | \n",
+ " Washington | \n",
+ " 3479.137523 | \n",
+ " High School or Below | \n",
+ " M | \n",
+ " 0 | \n",
+ " 104 | \n",
+ " 0 | \n",
+ " Personal Auto | \n",
+ " 499.200000 | \n",
+ " Two-Door Car | \n",
+ "
\n",
+ " \n",
+ " 1 | \n",
+ " TB86706 | \n",
+ " Arizona | \n",
+ " 2502.637401 | \n",
+ " Master | \n",
+ " M | \n",
+ " 0 | \n",
+ " 66 | \n",
+ " 0 | \n",
+ " Personal Auto | \n",
+ " 3.468912 | \n",
+ " Two-Door Car | \n",
+ "
\n",
+ " \n",
+ " 2 | \n",
+ " ZL73902 | \n",
+ " Nevada | \n",
+ " 3265.156348 | \n",
+ " Bachelor | \n",
+ " F | \n",
+ " 25820 | \n",
+ " 82 | \n",
+ " 0 | \n",
+ " Personal Auto | \n",
+ " 393.600000 | \n",
+ " Four-Door Car | \n",
+ "
\n",
+ " \n",
+ " 3 | \n",
+ " KX23516 | \n",
+ " California | \n",
+ " 4455.843406 | \n",
+ " High School or Below | \n",
+ " F | \n",
+ " 0 | \n",
+ " 121 | \n",
+ " 0 | \n",
+ " Personal Auto | \n",
+ " 699.615192 | \n",
+ " SUV | \n",
+ "
\n",
+ " \n",
+ " 4 | \n",
+ " FN77294 | \n",
+ " California | \n",
+ " 7704.958480 | \n",
+ " High School or Below | \n",
+ " M | \n",
+ " 30366 | \n",
+ " 101 | \n",
+ " 2 | \n",
+ " Personal Auto | \n",
+ " 484.800000 | \n",
+ " SUV | \n",
+ "
\n",
+ " \n",
+ " ... | \n",
+ " ... | \n",
+ " ... | \n",
+ " ... | \n",
+ " ... | \n",
+ " ... | \n",
+ " ... | \n",
+ " ... | \n",
+ " ... | \n",
+ " ... | \n",
+ " ... | \n",
+ " ... | \n",
+ "
\n",
+ " \n",
+ " 7065 | \n",
+ " LA72316 | \n",
+ " California | \n",
+ " 23405.987980 | \n",
+ " Bachelor | \n",
+ " M | \n",
+ " 71941 | \n",
+ " 73 | \n",
+ " 0 | \n",
+ " Personal Auto | \n",
+ " 198.234764 | \n",
+ " Four-Door Car | \n",
+ "
\n",
+ " \n",
+ " 7066 | \n",
+ " PK87824 | \n",
+ " California | \n",
+ " 3096.511217 | \n",
+ " College | \n",
+ " F | \n",
+ " 21604 | \n",
+ " 79 | \n",
+ " 0 | \n",
+ " Corporate Auto | \n",
+ " 379.200000 | \n",
+ " Four-Door Car | \n",
+ "
\n",
+ " \n",
+ " 7067 | \n",
+ " TD14365 | \n",
+ " California | \n",
+ " 8163.890428 | \n",
+ " Bachelor | \n",
+ " M | \n",
+ " 0 | \n",
+ " 85 | \n",
+ " 3 | \n",
+ " Corporate Auto | \n",
+ " 790.784983 | \n",
+ " Four-Door Car | \n",
+ "
\n",
+ " \n",
+ " 7068 | \n",
+ " UP19263 | \n",
+ " California | \n",
+ " 7524.442436 | \n",
+ " College | \n",
+ " M | \n",
+ " 21941 | \n",
+ " 96 | \n",
+ " 0 | \n",
+ " Personal Auto | \n",
+ " 691.200000 | \n",
+ " Four-Door Car | \n",
+ "
\n",
+ " \n",
+ " 7069 | \n",
+ " Y167826 | \n",
+ " California | \n",
+ " 2611.836866 | \n",
+ " College | \n",
+ " M | \n",
+ " 0 | \n",
+ " 77 | \n",
+ " 0 | \n",
+ " Corporate Auto | \n",
+ " 369.600000 | \n",
+ " Two-Door Car | \n",
+ "
\n",
+ " \n",
+ "
\n",
+ "
7070 rows × 11 columns
\n",
+ "
"
+ ],
+ "text/plain": [
+ " customer state customer_lifetime_value education \\\n",
+ "0 SA25987 Washington 3479.137523 High School or Below \n",
+ "1 TB86706 Arizona 2502.637401 Master \n",
+ "2 ZL73902 Nevada 3265.156348 Bachelor \n",
+ "3 KX23516 California 4455.843406 High School or Below \n",
+ "4 FN77294 California 7704.958480 High School or Below \n",
+ "... ... ... ... ... \n",
+ "7065 LA72316 California 23405.987980 Bachelor \n",
+ "7066 PK87824 California 3096.511217 College \n",
+ "7067 TD14365 California 8163.890428 Bachelor \n",
+ "7068 UP19263 California 7524.442436 College \n",
+ "7069 Y167826 California 2611.836866 College \n",
+ "\n",
+ " gender income monthly_premium_auto number_of_open_complaints \\\n",
+ "0 M 0 104 0 \n",
+ "1 M 0 66 0 \n",
+ "2 F 25820 82 0 \n",
+ "3 F 0 121 0 \n",
+ "4 M 30366 101 2 \n",
+ "... ... ... ... ... \n",
+ "7065 M 71941 73 0 \n",
+ "7066 F 21604 79 0 \n",
+ "7067 M 0 85 3 \n",
+ "7068 M 21941 96 0 \n",
+ "7069 M 0 77 0 \n",
+ "\n",
+ " policy_type total_claim_amount vehicle_class \n",
+ "0 Personal Auto 499.200000 Two-Door Car \n",
+ "1 Personal Auto 3.468912 Two-Door Car \n",
+ "2 Personal Auto 393.600000 Four-Door Car \n",
+ "3 Personal Auto 699.615192 SUV \n",
+ "4 Personal Auto 484.800000 SUV \n",
+ "... ... ... ... \n",
+ "7065 Personal Auto 198.234764 Four-Door Car \n",
+ "7066 Corporate Auto 379.200000 Four-Door Car \n",
+ "7067 Corporate Auto 790.784983 Four-Door Car \n",
+ "7068 Personal Auto 691.200000 Four-Door Car \n",
+ "7069 Corporate Auto 369.600000 Two-Door Car \n",
+ "\n",
+ "[7070 rows x 11 columns]"
+ ]
+ },
+ "execution_count": 107,
+ "metadata": {},
+ "output_type": "execute_result"
+ }
+ ],
+ "source": [
+ "# Standardize the header names of table 3: lower-case, spaces -> underscores.\n",
+ "# Iterate over the column labels directly instead of indexing by position.\n",
+ "# `cols` stays a notebook-level name in case a later cell reads it.\n",
+ "cols = [name.lower().replace(' ', '_') for name in tab3_data.columns]\n",
+ "tab3_data.columns = cols\n",
+ "\n",
+ "# NOTE(review): this table's state column is 'state' while tables 1 and 2 use\n",
+ "# 'st' - confirm the two are aligned before the tables are combined.\n",
+ "tab3_data"
+ ]
+ },
+ {
+ "cell_type": "code",
+ "execution_count": 90,
+ "id": "552a0b18",
+ "metadata": {},
+ "outputs": [],
+ "source": [
+ "# REARRANGE THE COLUMNS IN THE DATAFRAME AS NEEDED\n",
+ "\n",
+ "\n",
+ "\n",
+ "\n"
+ ]
+ },
+ {
+ "cell_type": "code",
+ "execution_count": 108,
+ "id": "a57f4cef",
+ "metadata": {},
+ "outputs": [
+ {
+ "data": {
+ "text/html": [
+ "\n",
+ "\n",
+ "
\n",
+ " \n",
+ " \n",
+ " | \n",
+ " customer | \n",
+ " st | \n",
+ " gender | \n",
+ " education | \n",
+ " customer_lifetime_value | \n",
+ " income | \n",
+ " monthly_premium_auto | \n",
+ " number_of_open_complaints | \n",
+ " policy_type | \n",
+ " vehicle_class | \n",
+ " total_claim_amount | \n",
+ " state | \n",
+ "
\n",
+ " \n",
+ " \n",
+ " \n",
+ " 0 | \n",
+ " RB50392 | \n",
+ " Washington | \n",
+ " NaN | \n",
+ " Master | \n",
+ " NaN | \n",
+ " 0.0 | \n",
+ " 1000.0 | \n",
+ " 1/0/00 | \n",
+ " Personal Auto | \n",
+ " Four-Door Car | \n",
+ " 2.704934 | \n",
+ " NaN | \n",
+ "
\n",
+ " \n",
+ " 1 | \n",
+ " QZ44356 | \n",
+ " Arizona | \n",
+ " F | \n",
+ " Bachelor | \n",
+ " 697953.59% | \n",
+ " 0.0 | \n",
+ " 94.0 | \n",
+ " 1/0/00 | \n",
+ " Personal Auto | \n",
+ " Four-Door Car | \n",
+ " 1131.464935 | \n",
+ " NaN | \n",
+ "
\n",
+ " \n",
+ " 2 | \n",
+ " AI49188 | \n",
+ " Nevada | \n",
+ " F | \n",
+ " Bachelor | \n",
+ " 1288743.17% | \n",
+ " 48767.0 | \n",
+ " 108.0 | \n",
+ " 1/0/00 | \n",
+ " Personal Auto | \n",
+ " Two-Door Car | \n",
+ " 566.472247 | \n",
+ " NaN | \n",
+ "
\n",
+ " \n",
+ " 3 | \n",
+ " WW63253 | \n",
+ " California | \n",
+ " M | \n",
+ " Bachelor | \n",
+ " 764586.18% | \n",
+ " 0.0 | \n",
+ " 106.0 | \n",
+ " 1/0/00 | \n",
+ " Corporate Auto | \n",
+ " SUV | \n",
+ " 529.881344 | \n",
+ " NaN | \n",
+ "
\n",
+ " \n",
+ " 4 | \n",
+ " GA49547 | \n",
+ " Washington | \n",
+ " M | \n",
+ " High School or Below | \n",
+ " 536307.65% | \n",
+ " 36357.0 | \n",
+ " 68.0 | \n",
+ " 1/0/00 | \n",
+ " Personal Auto | \n",
+ " Four-Door Car | \n",
+ " 17.269323 | \n",
+ " NaN | \n",
+ "
\n",
+ " \n",
+ " ... | \n",
+ " ... | \n",
+ " ... | \n",
+ " ... | \n",
+ " ... | \n",
+ " ... | \n",
+ " ... | \n",
+ " ... | \n",
+ " ... | \n",
+ " ... | \n",
+ " ... | \n",
+ " ... | \n",
+ " ... | \n",
+ "
\n",
+ " \n",
+ " 7065 | \n",
+ " LA72316 | \n",
+ " NaN | \n",
+ " M | \n",
+ " Bachelor | \n",
+ " 23405.98798 | \n",
+ " 71941.0 | \n",
+ " 73.0 | \n",
+ " 0 | \n",
+ " Personal Auto | \n",
+ " Four-Door Car | \n",
+ " 198.234764 | \n",
+ " California | \n",
+ "
\n",
+ " \n",
+ " 7066 | \n",
+ " PK87824 | \n",
+ " NaN | \n",
+ " F | \n",
+ " College | \n",
+ " 3096.511217 | \n",
+ " 21604.0 | \n",
+ " 79.0 | \n",
+ " 0 | \n",
+ " Corporate Auto | \n",
+ " Four-Door Car | \n",
+ " 379.200000 | \n",
+ " California | \n",
+ "
\n",
+ " \n",
+ " 7067 | \n",
+ " TD14365 | \n",
+ " NaN | \n",
+ " M | \n",
+ " Bachelor | \n",
+ " 8163.890428 | \n",
+ " 0.0 | \n",
+ " 85.0 | \n",
+ " 3 | \n",
+ " Corporate Auto | \n",
+ " Four-Door Car | \n",
+ " 790.784983 | \n",
+ " California | \n",
+ "
\n",
+ " \n",
+ " 7068 | \n",
+ " UP19263 | \n",
+ " NaN | \n",
+ " M | \n",
+ " College | \n",
+ " 7524.442436 | \n",
+ " 21941.0 | \n",
+ " 96.0 | \n",
+ " 0 | \n",
+ " Personal Auto | \n",
+ " Four-Door Car | \n",
+ " 691.200000 | \n",
+ " California | \n",
+ "
\n",
+ " \n",
+ " 7069 | \n",
+ " Y167826 | \n",
+ " NaN | \n",
+ " M | \n",
+ " College | \n",
+ " 2611.836866 | \n",
+ " 0.0 | \n",
+ " 77.0 | \n",
+ " 0 | \n",
+ " Corporate Auto | \n",
+ " Two-Door Car | \n",
+ " 369.600000 | \n",
+ " California | \n",
+ "
\n",
+ " \n",
+ "
\n",
+ "
12074 rows × 12 columns
\n",
+ "
"
+ ],
+ "text/plain": [
+ " customer st gender education \\\n",
+ "0 RB50392 Washington NaN Master \n",
+ "1 QZ44356 Arizona F Bachelor \n",
+ "2 AI49188 Nevada F Bachelor \n",
+ "3 WW63253 California M Bachelor \n",
+ "4 GA49547 Washington M High School or Below \n",
+ "... ... ... ... ... \n",
+ "7065 LA72316 NaN M Bachelor \n",
+ "7066 PK87824 NaN F College \n",
+ "7067 TD14365 NaN M Bachelor \n",
+ "7068 UP19263 NaN M College \n",
+ "7069 Y167826 NaN M College \n",
+ "\n",
+ " customer_lifetime_value income monthly_premium_auto \\\n",
+ "0 NaN 0.0 1000.0 \n",
+ "1 697953.59% 0.0 94.0 \n",
+ "2 1288743.17% 48767.0 108.0 \n",
+ "3 764586.18% 0.0 106.0 \n",
+ "4 536307.65% 36357.0 68.0 \n",
+ "... ... ... ... \n",
+ "7065 23405.98798 71941.0 73.0 \n",
+ "7066 3096.511217 21604.0 79.0 \n",
+ "7067 8163.890428 0.0 85.0 \n",
+ "7068 7524.442436 21941.0 96.0 \n",
+ "7069 2611.836866 0.0 77.0 \n",
+ "\n",
+ " number_of_open_complaints policy_type vehicle_class \\\n",
+ "0 1/0/00 Personal Auto Four-Door Car \n",
+ "1 1/0/00 Personal Auto Four-Door Car \n",
+ "2 1/0/00 Personal Auto Two-Door Car \n",
+ "3 1/0/00 Corporate Auto SUV \n",
+ "4 1/0/00 Personal Auto Four-Door Car \n",
+ "... ... ... ... \n",
+ "7065 0 Personal Auto Four-Door Car \n",
+ "7066 0 Corporate Auto Four-Door Car \n",
+ "7067 3 Corporate Auto Four-Door Car \n",
+ "7068 0 Personal Auto Four-Door Car \n",
+ "7069 0 Corporate Auto Two-Door Car \n",
+ "\n",
+ " total_claim_amount state \n",
+ "0 2.704934 NaN \n",
+ "1 1131.464935 NaN \n",
+ "2 566.472247 NaN \n",
+ "3 529.881344 NaN \n",
+ "4 17.269323 NaN \n",
+ "... ... ... \n",
+ "7065 198.234764 California \n",
+ "7066 379.200000 California \n",
+ "7067 790.784983 California \n",
+ "7068 691.200000 California \n",
+ "7069 369.600000 California \n",
+ "\n",
+ "[12074 rows x 12 columns]"
+ ]
+ },
+ "execution_count": 108,
+ "metadata": {},
+ "output_type": "execute_result"
+ }
+ ],
+ "source": [
+ "# CONCATENATE THE THREE DATAFRAMES\n",
+ "\n",
+ "# file1/file2 label the state column 'st' while file3 labels it 'state'.\n",
+ "# Align the label first; otherwise concat keeps two half-empty columns (12 instead of 11).\n",
+ "# rename() ignores labels that are absent, so it is safe to apply to all three frames.\n",
+ "frames = [df.rename(columns={'st': 'state'}) for df in (tab1_data, tab2_data, tab3_data)]\n",
+ "datatotal_data = pd.concat(frames, axis = 0)\n",
+ "\n",
+ "datatotal_data\n"
+ ]
+ },
+ {
+ "cell_type": "code",
+ "execution_count": 92,
+ "id": "a2367b94",
+ "metadata": {},
+ "outputs": [
+ {
+ "data": {
+ "text/plain": [
+ "customer object\n",
+ "st object\n",
+ "gender object\n",
+ "education object\n",
+ "customer_lifetime_value object\n",
+ "income float64\n",
+ "monthly_premium_auto float64\n",
+ "number_of_open_complaints object\n",
+ "policy_type object\n",
+ "vehicle_class object\n",
+ "total_claim_amount float64\n",
+ "state object\n",
+ "dtype: object"
+ ]
+ },
+ "execution_count": 92,
+ "metadata": {},
+ "output_type": "execute_result"
+ }
+ ],
+ "source": [
+ "# QUESTION: WHICH COLUMNS ARE NUMERICAL?\n",
+ "# ANSWER: Income, monthly_premium_auto, total_claim_amount\n",
+ "\n",
+ "# QUESTION: WHICH COLUMNS ARE CATEGORICAL?\n",
+ "# ANSWER: customer, st, gender, education, customer_lifetime_value, number_of_open_complaints, policy_type, vehicle_class,state\n",
+ "\n",
+ "# UNDERSTAND THE MEANING OF ALL COLUMNS\n",
+ "# ANSWER:\n",
+ "\n",
+ "datatotal_data.dtypes\n",
+ "\n",
+ "\n"
+ ]
+ },
+ {
+ "cell_type": "code",
+ "execution_count": 93,
+ "id": "32de16d5",
+ "metadata": {},
+ "outputs": [
+ {
+ "data": {
+ "text/html": [
+ "\n",
+ "\n",
+ "
\n",
+ " \n",
+ " \n",
+ " | \n",
+ " customer | \n",
+ " st | \n",
+ " gender | \n",
+ " education | \n",
+ " customer_lifetime_value | \n",
+ " income | \n",
+ " monthly_premium_auto | \n",
+ " policy_type | \n",
+ " vehicle_class | \n",
+ " total_claim_amount | \n",
+ " state | \n",
+ "
\n",
+ " \n",
+ " \n",
+ " \n",
+ " 0 | \n",
+ " RB50392 | \n",
+ " Washington | \n",
+ " NaN | \n",
+ " Master | \n",
+ " NaN | \n",
+ " 0.0 | \n",
+ " 1000.0 | \n",
+ " Personal Auto | \n",
+ " Four-Door Car | \n",
+ " 2.704934 | \n",
+ " NaN | \n",
+ "
\n",
+ " \n",
+ " 1 | \n",
+ " QZ44356 | \n",
+ " Arizona | \n",
+ " F | \n",
+ " Bachelor | \n",
+ " 697953.59% | \n",
+ " 0.0 | \n",
+ " 94.0 | \n",
+ " Personal Auto | \n",
+ " Four-Door Car | \n",
+ " 1131.464935 | \n",
+ " NaN | \n",
+ "
\n",
+ " \n",
+ " 2 | \n",
+ " AI49188 | \n",
+ " Nevada | \n",
+ " F | \n",
+ " Bachelor | \n",
+ " 1288743.17% | \n",
+ " 48767.0 | \n",
+ " 108.0 | \n",
+ " Personal Auto | \n",
+ " Two-Door Car | \n",
+ " 566.472247 | \n",
+ " NaN | \n",
+ "
\n",
+ " \n",
+ " 3 | \n",
+ " WW63253 | \n",
+ " California | \n",
+ " M | \n",
+ " Bachelor | \n",
+ " 764586.18% | \n",
+ " 0.0 | \n",
+ " 106.0 | \n",
+ " Corporate Auto | \n",
+ " SUV | \n",
+ " 529.881344 | \n",
+ " NaN | \n",
+ "
\n",
+ " \n",
+ " 4 | \n",
+ " GA49547 | \n",
+ " Washington | \n",
+ " M | \n",
+ " High School or Below | \n",
+ " 536307.65% | \n",
+ " 36357.0 | \n",
+ " 68.0 | \n",
+ " Personal Auto | \n",
+ " Four-Door Car | \n",
+ " 17.269323 | \n",
+ " NaN | \n",
+ "
\n",
+ " \n",
+ " ... | \n",
+ " ... | \n",
+ " ... | \n",
+ " ... | \n",
+ " ... | \n",
+ " ... | \n",
+ " ... | \n",
+ " ... | \n",
+ " ... | \n",
+ " ... | \n",
+ " ... | \n",
+ " ... | \n",
+ "
\n",
+ " \n",
+ " 7065 | \n",
+ " LA72316 | \n",
+ " NaN | \n",
+ " M | \n",
+ " Bachelor | \n",
+ " 23405.98798 | \n",
+ " 71941.0 | \n",
+ " 73.0 | \n",
+ " Personal Auto | \n",
+ " Four-Door Car | \n",
+ " 198.234764 | \n",
+ " California | \n",
+ "
\n",
+ " \n",
+ " 7066 | \n",
+ " PK87824 | \n",
+ " NaN | \n",
+ " F | \n",
+ " College | \n",
+ " 3096.511217 | \n",
+ " 21604.0 | \n",
+ " 79.0 | \n",
+ " Corporate Auto | \n",
+ " Four-Door Car | \n",
+ " 379.200000 | \n",
+ " California | \n",
+ "
\n",
+ " \n",
+ " 7067 | \n",
+ " TD14365 | \n",
+ " NaN | \n",
+ " M | \n",
+ " Bachelor | \n",
+ " 8163.890428 | \n",
+ " 0.0 | \n",
+ " 85.0 | \n",
+ " Corporate Auto | \n",
+ " Four-Door Car | \n",
+ " 790.784983 | \n",
+ " California | \n",
+ "
\n",
+ " \n",
+ " 7068 | \n",
+ " UP19263 | \n",
+ " NaN | \n",
+ " M | \n",
+ " College | \n",
+ " 7524.442436 | \n",
+ " 21941.0 | \n",
+ " 96.0 | \n",
+ " Personal Auto | \n",
+ " Four-Door Car | \n",
+ " 691.200000 | \n",
+ " California | \n",
+ "
\n",
+ " \n",
+ " 7069 | \n",
+ " Y167826 | \n",
+ " NaN | \n",
+ " M | \n",
+ " College | \n",
+ " 2611.836866 | \n",
+ " 0.0 | \n",
+ " 77.0 | \n",
+ " Corporate Auto | \n",
+ " Two-Door Car | \n",
+ " 369.600000 | \n",
+ " California | \n",
+ "
\n",
+ " \n",
+ "
\n",
+ "
12074 rows × 11 columns
\n",
+ "
"
+ ],
+ "text/plain": [
+ " customer st gender education \\\n",
+ "0 RB50392 Washington NaN Master \n",
+ "1 QZ44356 Arizona F Bachelor \n",
+ "2 AI49188 Nevada F Bachelor \n",
+ "3 WW63253 California M Bachelor \n",
+ "4 GA49547 Washington M High School or Below \n",
+ "... ... ... ... ... \n",
+ "7065 LA72316 NaN M Bachelor \n",
+ "7066 PK87824 NaN F College \n",
+ "7067 TD14365 NaN M Bachelor \n",
+ "7068 UP19263 NaN M College \n",
+ "7069 Y167826 NaN M College \n",
+ "\n",
+ " customer_lifetime_value income monthly_premium_auto policy_type \\\n",
+ "0 NaN 0.0 1000.0 Personal Auto \n",
+ "1 697953.59% 0.0 94.0 Personal Auto \n",
+ "2 1288743.17% 48767.0 108.0 Personal Auto \n",
+ "3 764586.18% 0.0 106.0 Corporate Auto \n",
+ "4 536307.65% 36357.0 68.0 Personal Auto \n",
+ "... ... ... ... ... \n",
+ "7065 23405.98798 71941.0 73.0 Personal Auto \n",
+ "7066 3096.511217 21604.0 79.0 Corporate Auto \n",
+ "7067 8163.890428 0.0 85.0 Corporate Auto \n",
+ "7068 7524.442436 21941.0 96.0 Personal Auto \n",
+ "7069 2611.836866 0.0 77.0 Corporate Auto \n",
+ "\n",
+ " vehicle_class total_claim_amount state \n",
+ "0 Four-Door Car 2.704934 NaN \n",
+ "1 Four-Door Car 1131.464935 NaN \n",
+ "2 Two-Door Car 566.472247 NaN \n",
+ "3 SUV 529.881344 NaN \n",
+ "4 Four-Door Car 17.269323 NaN \n",
+ "... ... ... ... \n",
+ "7065 Four-Door Car 198.234764 California \n",
+ "7066 Four-Door Car 379.200000 California \n",
+ "7067 Four-Door Car 790.784983 California \n",
+ "7068 Four-Door Car 691.200000 California \n",
+ "7069 Two-Door Car 369.600000 California \n",
+ "\n",
+ "[12074 rows x 11 columns]"
+ ]
+ },
+ "execution_count": 93,
+ "metadata": {},
+ "output_type": "execute_result"
+ }
+ ],
+ "source": [
+ "# DELETE THE COLUMN EDUCATION AND THE NUMBER OF OPEN COMPLAINTS FROM THE DATAFRAME\n",
+ "\n",
+ "# Drop both columns in a single call: two separate drops that each start from\n",
+ "# datatotal_data overwrite one another and leave 'education' in the result.\n",
+ "totaldata_data = datatotal_data.drop(columns=['education', 'number_of_open_complaints'])\n",
+ "totaldata_data\n"
+ ]
+ },
+ {
+ "cell_type": "code",
+ "execution_count": 96,
+ "id": "854a8c46",
+ "metadata": {},
+ "outputs": [
+ {
+ "data": {
+ "text/html": [
+ "\n",
+ "\n",
+ "
\n",
+ " \n",
+ " \n",
+ " | \n",
+ " customer | \n",
+ " st | \n",
+ " gender | \n",
+ " education | \n",
+ " customer_lifetime_value | \n",
+ " income | \n",
+ " monthly_premium_auto | \n",
+ " policy_type | \n",
+ " vehicle_class | \n",
+ " total_claim_amount | \n",
+ " state | \n",
+ "
\n",
+ " \n",
+ " \n",
+ " \n",
+ " 0 | \n",
+ " RB50392 | \n",
+ " Washington | \n",
+ " NaN | \n",
+ " Master | \n",
+ " NaN | \n",
+ " 0.0 | \n",
+ " 1000.0 | \n",
+ " Personal Auto | \n",
+ " Four-Door Car | \n",
+ " 2.704934 | \n",
+ " NaN | \n",
+ "
\n",
+ " \n",
+ " 1 | \n",
+ " QZ44356 | \n",
+ " Arizona | \n",
+ " F | \n",
+ " Bachelor | \n",
+ " 697953.59% | \n",
+ " 0.0 | \n",
+ " 94.0 | \n",
+ " Personal Auto | \n",
+ " Four-Door Car | \n",
+ " 1131.464935 | \n",
+ " NaN | \n",
+ "
\n",
+ " \n",
+ " 2 | \n",
+ " AI49188 | \n",
+ " Nevada | \n",
+ " F | \n",
+ " Bachelor | \n",
+ " 1288743.17% | \n",
+ " 48767.0 | \n",
+ " 108.0 | \n",
+ " Personal Auto | \n",
+ " Two-Door Car | \n",
+ " 566.472247 | \n",
+ " NaN | \n",
+ "
\n",
+ " \n",
+ " 3 | \n",
+ " WW63253 | \n",
+ " California | \n",
+ " M | \n",
+ " Bachelor | \n",
+ " 764586.18% | \n",
+ " 0.0 | \n",
+ " 106.0 | \n",
+ " Corporate Auto | \n",
+ " SUV | \n",
+ " 529.881344 | \n",
+ " NaN | \n",
+ "
\n",
+ " \n",
+ " 4 | \n",
+ " GA49547 | \n",
+ " Washington | \n",
+ " M | \n",
+ " High School or Below | \n",
+ " 536307.65% | \n",
+ " 36357.0 | \n",
+ " 68.0 | \n",
+ " Personal Auto | \n",
+ " Four-Door Car | \n",
+ " 17.269323 | \n",
+ " NaN | \n",
+ "
\n",
+ " \n",
+ " ... | \n",
+ " ... | \n",
+ " ... | \n",
+ " ... | \n",
+ " ... | \n",
+ " ... | \n",
+ " ... | \n",
+ " ... | \n",
+ " ... | \n",
+ " ... | \n",
+ " ... | \n",
+ " ... | \n",
+ "
\n",
+ " \n",
+ " 7065 | \n",
+ " LA72316 | \n",
+ " NaN | \n",
+ " M | \n",
+ " Bachelor | \n",
+ " 23405.98798 | \n",
+ " 71941.0 | \n",
+ " 73.0 | \n",
+ " Personal Auto | \n",
+ " Four-Door Car | \n",
+ " 198.234764 | \n",
+ " California | \n",
+ "
\n",
+ " \n",
+ " 7066 | \n",
+ " PK87824 | \n",
+ " NaN | \n",
+ " F | \n",
+ " College | \n",
+ " 3096.511217 | \n",
+ " 21604.0 | \n",
+ " 79.0 | \n",
+ " Corporate Auto | \n",
+ " Four-Door Car | \n",
+ " 379.200000 | \n",
+ " California | \n",
+ "
\n",
+ " \n",
+ " 7067 | \n",
+ " TD14365 | \n",
+ " NaN | \n",
+ " M | \n",
+ " Bachelor | \n",
+ " 8163.890428 | \n",
+ " 0.0 | \n",
+ " 85.0 | \n",
+ " Corporate Auto | \n",
+ " Four-Door Car | \n",
+ " 790.784983 | \n",
+ " California | \n",
+ "
\n",
+ " \n",
+ " 7068 | \n",
+ " UP19263 | \n",
+ " NaN | \n",
+ " M | \n",
+ " College | \n",
+ " 7524.442436 | \n",
+ " 21941.0 | \n",
+ " 96.0 | \n",
+ " Personal Auto | \n",
+ " Four-Door Car | \n",
+ " 691.200000 | \n",
+ " California | \n",
+ "
\n",
+ " \n",
+ " 7069 | \n",
+ " Y167826 | \n",
+ " NaN | \n",
+ " M | \n",
+ " College | \n",
+ " 2611.836866 | \n",
+ " 0.0 | \n",
+ " 77.0 | \n",
+ " Corporate Auto | \n",
+ " Two-Door Car | \n",
+ " 369.600000 | \n",
+ " California | \n",
+ "
\n",
+ " \n",
+ "
\n",
+ "
9135 rows × 11 columns
\n",
+ "
"
+ ],
+ "text/plain": [
+ " customer st gender education \\\n",
+ "0 RB50392 Washington NaN Master \n",
+ "1 QZ44356 Arizona F Bachelor \n",
+ "2 AI49188 Nevada F Bachelor \n",
+ "3 WW63253 California M Bachelor \n",
+ "4 GA49547 Washington M High School or Below \n",
+ "... ... ... ... ... \n",
+ "7065 LA72316 NaN M Bachelor \n",
+ "7066 PK87824 NaN F College \n",
+ "7067 TD14365 NaN M Bachelor \n",
+ "7068 UP19263 NaN M College \n",
+ "7069 Y167826 NaN M College \n",
+ "\n",
+ " customer_lifetime_value income monthly_premium_auto policy_type \\\n",
+ "0 NaN 0.0 1000.0 Personal Auto \n",
+ "1 697953.59% 0.0 94.0 Personal Auto \n",
+ "2 1288743.17% 48767.0 108.0 Personal Auto \n",
+ "3 764586.18% 0.0 106.0 Corporate Auto \n",
+ "4 536307.65% 36357.0 68.0 Personal Auto \n",
+ "... ... ... ... ... \n",
+ "7065 23405.98798 71941.0 73.0 Personal Auto \n",
+ "7066 3096.511217 21604.0 79.0 Corporate Auto \n",
+ "7067 8163.890428 0.0 85.0 Corporate Auto \n",
+ "7068 7524.442436 21941.0 96.0 Personal Auto \n",
+ "7069 2611.836866 0.0 77.0 Corporate Auto \n",
+ "\n",
+ " vehicle_class total_claim_amount state \n",
+ "0 Four-Door Car 2.704934 NaN \n",
+ "1 Four-Door Car 1131.464935 NaN \n",
+ "2 Two-Door Car 566.472247 NaN \n",
+ "3 SUV 529.881344 NaN \n",
+ "4 Four-Door Car 17.269323 NaN \n",
+ "... ... ... ... \n",
+ "7065 Four-Door Car 198.234764 California \n",
+ "7066 Four-Door Car 379.200000 California \n",
+ "7067 Four-Door Car 790.784983 California \n",
+ "7068 Four-Door Car 691.200000 California \n",
+ "7069 Two-Door Car 369.600000 California \n",
+ "\n",
+ "[9135 rows x 11 columns]"
+ ]
+ },
+ "execution_count": 96,
+ "metadata": {},
+ "output_type": "execute_result"
+ }
+ ],
+ "source": [
+ "# CHECK FOR DUPLICATE ROWS IN THE DATA AND REMOVE IF ANY\n",
+ "\n",
+ "# Keep the first occurrence of every fully repeated row and discard the rest.\n",
+ "totaldata_data = totaldata_data.drop_duplicates(keep='first')\n",
+ "totaldata_data\n"
+ ]
+ },
+ {
+ "cell_type": "code",
+ "execution_count": 111,
+ "id": "90edf4ee",
+ "metadata": {},
+ "outputs": [
+ {
+ "data": {
+ "text/html": [
+ "\n",
+ "\n",
+ "
\n",
+ " \n",
+ " \n",
+ " | \n",
+ " customer | \n",
+ " st | \n",
+ " gender | \n",
+ " education | \n",
+ " customer_lifetime_value | \n",
+ " income | \n",
+ " monthly_premium_auto | \n",
+ " number_of_open_complaints | \n",
+ " policy_type | \n",
+ " vehicle_class | \n",
+ " total_claim_amount | \n",
+ " state | \n",
+ "
\n",
+ " \n",
+ " \n",
+ " \n",
+ "
\n",
+ "
"
+ ],
+ "text/plain": [
+ "Empty DataFrame\n",
+ "Columns: [customer, st, gender, education, customer_lifetime_value, income, monthly_premium_auto, number_of_open_complaints, policy_type, vehicle_class, total_claim_amount, state]\n",
+ "Index: []"
+ ]
+ },
+ "execution_count": 111,
+ "metadata": {},
+ "output_type": "execute_result"
+ }
+ ],
+ "source": [
+ "# Filter out the data for customers who have an income of 0 or less.\n",
+ "\n",
+ "# Use '<=' so that customers with an income of exactly 0 are matched as well;\n",
+ "# a strict '<' matches nothing because no income in the data is negative.\n",
+ "datatotal_data[datatotal_data['income'] <= 0]\n"
+ ]
+ }
+ ],
+ "metadata": {
+ "kernelspec": {
+ "display_name": "Python 3 (ipykernel)",
+ "language": "python",
+ "name": "python3"
+ },
+ "language_info": {
+ "codemirror_mode": {
+ "name": "ipython",
+ "version": 3
+ },
+ "file_extension": ".py",
+ "mimetype": "text/x-python",
+ "name": "python",
+ "nbconvert_exporter": "python",
+ "pygments_lexer": "ipython3",
+ "version": "3.11.4"
+ }
+ },
+ "nbformat": 4,
+ "nbformat_minor": 5
+}
diff --git a/lab-customer-analysis-round-1.ipynb b/lab-customer-analysis-round-1.ipynb
new file mode 100644
index 0000000..0fa7fff
--- /dev/null
+++ b/lab-customer-analysis-round-1.ipynb
@@ -0,0 +1,2543 @@
+{
+ "cells": [
+ {
+ "cell_type": "code",
+ "execution_count": 101,
+ "id": "c43915d2",
+ "metadata": {},
+ "outputs": [
+ {
+ "data": {
+ "text/html": [
+ "\n",
+ "\n",
+ "
\n",
+ " \n",
+ " \n",
+ " | \n",
+ " Customer | \n",
+ " ST | \n",
+ " GENDER | \n",
+ " Education | \n",
+ " Customer Lifetime Value | \n",
+ " Income | \n",
+ " Monthly Premium Auto | \n",
+ " Number of Open Complaints | \n",
+ " Policy Type | \n",
+ " Vehicle Class | \n",
+ " Total Claim Amount | \n",
+ "
\n",
+ " \n",
+ " \n",
+ " \n",
+ " 0 | \n",
+ " RB50392 | \n",
+ " Washington | \n",
+ " NaN | \n",
+ " Master | \n",
+ " NaN | \n",
+ " 0.0 | \n",
+ " 1000.0 | \n",
+ " 1/0/00 | \n",
+ " Personal Auto | \n",
+ " Four-Door Car | \n",
+ " 2.704934 | \n",
+ "
\n",
+ " \n",
+ " 1 | \n",
+ " QZ44356 | \n",
+ " Arizona | \n",
+ " F | \n",
+ " Bachelor | \n",
+ " 697953.59% | \n",
+ " 0.0 | \n",
+ " 94.0 | \n",
+ " 1/0/00 | \n",
+ " Personal Auto | \n",
+ " Four-Door Car | \n",
+ " 1131.464935 | \n",
+ "
\n",
+ " \n",
+ " 2 | \n",
+ " AI49188 | \n",
+ " Nevada | \n",
+ " F | \n",
+ " Bachelor | \n",
+ " 1288743.17% | \n",
+ " 48767.0 | \n",
+ " 108.0 | \n",
+ " 1/0/00 | \n",
+ " Personal Auto | \n",
+ " Two-Door Car | \n",
+ " 566.472247 | \n",
+ "
\n",
+ " \n",
+ " 3 | \n",
+ " WW63253 | \n",
+ " California | \n",
+ " M | \n",
+ " Bachelor | \n",
+ " 764586.18% | \n",
+ " 0.0 | \n",
+ " 106.0 | \n",
+ " 1/0/00 | \n",
+ " Corporate Auto | \n",
+ " SUV | \n",
+ " 529.881344 | \n",
+ "
\n",
+ " \n",
+ " 4 | \n",
+ " GA49547 | \n",
+ " Washington | \n",
+ " M | \n",
+ " High School or Below | \n",
+ " 536307.65% | \n",
+ " 36357.0 | \n",
+ " 68.0 | \n",
+ " 1/0/00 | \n",
+ " Personal Auto | \n",
+ " Four-Door Car | \n",
+ " 17.269323 | \n",
+ "
\n",
+ " \n",
+ " ... | \n",
+ " ... | \n",
+ " ... | \n",
+ " ... | \n",
+ " ... | \n",
+ " ... | \n",
+ " ... | \n",
+ " ... | \n",
+ " ... | \n",
+ " ... | \n",
+ " ... | \n",
+ " ... | \n",
+ "
\n",
+ " \n",
+ " 4003 | \n",
+ " NaN | \n",
+ " NaN | \n",
+ " NaN | \n",
+ " NaN | \n",
+ " NaN | \n",
+ " NaN | \n",
+ " NaN | \n",
+ " NaN | \n",
+ " NaN | \n",
+ " NaN | \n",
+ " NaN | \n",
+ "
\n",
+ " \n",
+ " 4004 | \n",
+ " NaN | \n",
+ " NaN | \n",
+ " NaN | \n",
+ " NaN | \n",
+ " NaN | \n",
+ " NaN | \n",
+ " NaN | \n",
+ " NaN | \n",
+ " NaN | \n",
+ " NaN | \n",
+ " NaN | \n",
+ "
\n",
+ " \n",
+ " 4005 | \n",
+ " NaN | \n",
+ " NaN | \n",
+ " NaN | \n",
+ " NaN | \n",
+ " NaN | \n",
+ " NaN | \n",
+ " NaN | \n",
+ " NaN | \n",
+ " NaN | \n",
+ " NaN | \n",
+ " NaN | \n",
+ "
\n",
+ " \n",
+ " 4006 | \n",
+ " NaN | \n",
+ " NaN | \n",
+ " NaN | \n",
+ " NaN | \n",
+ " NaN | \n",
+ " NaN | \n",
+ " NaN | \n",
+ " NaN | \n",
+ " NaN | \n",
+ " NaN | \n",
+ " NaN | \n",
+ "
\n",
+ " \n",
+ " 4007 | \n",
+ " NaN | \n",
+ " NaN | \n",
+ " NaN | \n",
+ " NaN | \n",
+ " NaN | \n",
+ " NaN | \n",
+ " NaN | \n",
+ " NaN | \n",
+ " NaN | \n",
+ " NaN | \n",
+ " NaN | \n",
+ "
\n",
+ " \n",
+ "
\n",
+ "
4008 rows × 11 columns
\n",
+ "
"
+ ],
+ "text/plain": [
+ " Customer ST GENDER Education \\\n",
+ "0 RB50392 Washington NaN Master \n",
+ "1 QZ44356 Arizona F Bachelor \n",
+ "2 AI49188 Nevada F Bachelor \n",
+ "3 WW63253 California M Bachelor \n",
+ "4 GA49547 Washington M High School or Below \n",
+ "... ... ... ... ... \n",
+ "4003 NaN NaN NaN NaN \n",
+ "4004 NaN NaN NaN NaN \n",
+ "4005 NaN NaN NaN NaN \n",
+ "4006 NaN NaN NaN NaN \n",
+ "4007 NaN NaN NaN NaN \n",
+ "\n",
+ " Customer Lifetime Value Income Monthly Premium Auto \\\n",
+ "0 NaN 0.0 1000.0 \n",
+ "1 697953.59% 0.0 94.0 \n",
+ "2 1288743.17% 48767.0 108.0 \n",
+ "3 764586.18% 0.0 106.0 \n",
+ "4 536307.65% 36357.0 68.0 \n",
+ "... ... ... ... \n",
+ "4003 NaN NaN NaN \n",
+ "4004 NaN NaN NaN \n",
+ "4005 NaN NaN NaN \n",
+ "4006 NaN NaN NaN \n",
+ "4007 NaN NaN NaN \n",
+ "\n",
+ " Number of Open Complaints Policy Type Vehicle Class \\\n",
+ "0 1/0/00 Personal Auto Four-Door Car \n",
+ "1 1/0/00 Personal Auto Four-Door Car \n",
+ "2 1/0/00 Personal Auto Two-Door Car \n",
+ "3 1/0/00 Corporate Auto SUV \n",
+ "4 1/0/00 Personal Auto Four-Door Car \n",
+ "... ... ... ... \n",
+ "4003 NaN NaN NaN \n",
+ "4004 NaN NaN NaN \n",
+ "4005 NaN NaN NaN \n",
+ "4006 NaN NaN NaN \n",
+ "4007 NaN NaN NaN \n",
+ "\n",
+ " Total Claim Amount \n",
+ "0 2.704934 \n",
+ "1 1131.464935 \n",
+ "2 566.472247 \n",
+ "3 529.881344 \n",
+ "4 17.269323 \n",
+ "... ... \n",
+ "4003 NaN \n",
+ "4004 NaN \n",
+ "4005 NaN \n",
+ "4006 NaN \n",
+ "4007 NaN \n",
+ "\n",
+ "[4008 rows x 11 columns]"
+ ]
+ },
+ "execution_count": 101,
+ "metadata": {},
+ "output_type": "execute_result"
+ }
+ ],
+ "source": [
+ "import pandas as pd\n",
+ "\n",
+ "tab1_data = pd.read_csv(r'C:\\Users\\david\\OneDrive\\Ambiente de Trabalho\\Iron Hack\\ficheiros para LAB PANDA 1\\file1.csv')\n",
+ "\n",
+ "tab1_data\n",
+ "\n",
+ "\n"
+ ]
+ },
+ {
+ "cell_type": "code",
+ "execution_count": 102,
+ "id": "297404d5",
+ "metadata": {},
+ "outputs": [
+ {
+ "data": {
+ "text/html": [
+ "\n",
+ "\n",
+ "
\n",
+ " \n",
+ " \n",
+ " | \n",
+ " Customer | \n",
+ " ST | \n",
+ " GENDER | \n",
+ " Education | \n",
+ " Customer Lifetime Value | \n",
+ " Income | \n",
+ " Monthly Premium Auto | \n",
+ " Number of Open Complaints | \n",
+ " Total Claim Amount | \n",
+ " Policy Type | \n",
+ " Vehicle Class | \n",
+ "
\n",
+ " \n",
+ " \n",
+ " \n",
+ " 0 | \n",
+ " GS98873 | \n",
+ " Arizona | \n",
+ " F | \n",
+ " Bachelor | \n",
+ " 323912.47% | \n",
+ " 16061 | \n",
+ " 88 | \n",
+ " 1/0/00 | \n",
+ " 633.600000 | \n",
+ " Personal Auto | \n",
+ " Four-Door Car | \n",
+ "
\n",
+ " \n",
+ " 1 | \n",
+ " CW49887 | \n",
+ " California | \n",
+ " F | \n",
+ " Master | \n",
+ " 462680.11% | \n",
+ " 79487 | \n",
+ " 114 | \n",
+ " 1/0/00 | \n",
+ " 547.200000 | \n",
+ " Special Auto | \n",
+ " SUV | \n",
+ "
\n",
+ " \n",
+ " 2 | \n",
+ " MY31220 | \n",
+ " California | \n",
+ " F | \n",
+ " College | \n",
+ " 899704.02% | \n",
+ " 54230 | \n",
+ " 112 | \n",
+ " 1/0/00 | \n",
+ " 537.600000 | \n",
+ " Personal Auto | \n",
+ " Two-Door Car | \n",
+ "
\n",
+ " \n",
+ " 3 | \n",
+ " UH35128 | \n",
+ " Oregon | \n",
+ " F | \n",
+ " College | \n",
+ " 2580706.30% | \n",
+ " 71210 | \n",
+ " 214 | \n",
+ " 1/1/00 | \n",
+ " 1027.200000 | \n",
+ " Personal Auto | \n",
+ " Luxury Car | \n",
+ "
\n",
+ " \n",
+ " 4 | \n",
+ " WH52799 | \n",
+ " Arizona | \n",
+ " F | \n",
+ " College | \n",
+ " 380812.21% | \n",
+ " 94903 | \n",
+ " 94 | \n",
+ " 1/0/00 | \n",
+ " 451.200000 | \n",
+ " Corporate Auto | \n",
+ " Two-Door Car | \n",
+ "
\n",
+ " \n",
+ " ... | \n",
+ " ... | \n",
+ " ... | \n",
+ " ... | \n",
+ " ... | \n",
+ " ... | \n",
+ " ... | \n",
+ " ... | \n",
+ " ... | \n",
+ " ... | \n",
+ " ... | \n",
+ " ... | \n",
+ "
\n",
+ " \n",
+ " 991 | \n",
+ " HV85198 | \n",
+ " Arizona | \n",
+ " M | \n",
+ " Master | \n",
+ " 847141.75% | \n",
+ " 63513 | \n",
+ " 70 | \n",
+ " 1/0/00 | \n",
+ " 185.667213 | \n",
+ " Personal Auto | \n",
+ " Four-Door Car | \n",
+ "
\n",
+ " \n",
+ " 992 | \n",
+ " BS91566 | \n",
+ " Arizona | \n",
+ " F | \n",
+ " College | \n",
+ " 543121.91% | \n",
+ " 58161 | \n",
+ " 68 | \n",
+ " 1/0/00 | \n",
+ " 140.747286 | \n",
+ " Corporate Auto | \n",
+ " Four-Door Car | \n",
+ "
\n",
+ " \n",
+ " 993 | \n",
+ " IL40123 | \n",
+ " Nevada | \n",
+ " F | \n",
+ " College | \n",
+ " 568964.41% | \n",
+ " 83640 | \n",
+ " 70 | \n",
+ " 1/0/00 | \n",
+ " 471.050488 | \n",
+ " Corporate Auto | \n",
+ " Two-Door Car | \n",
+ "
\n",
+ " \n",
+ " 994 | \n",
+ " MY32149 | \n",
+ " California | \n",
+ " F | \n",
+ " Master | \n",
+ " 368672.38% | \n",
+ " 0 | \n",
+ " 96 | \n",
+ " 1/0/00 | \n",
+ " 28.460568 | \n",
+ " Personal Auto | \n",
+ " Two-Door Car | \n",
+ "
\n",
+ " \n",
+ " 995 | \n",
+ " SA91515 | \n",
+ " California | \n",
+ " M | \n",
+ " Bachelor | \n",
+ " 399258.39% | \n",
+ " 0 | \n",
+ " 111 | \n",
+ " 1/0/00 | \n",
+ " 700.349052 | \n",
+ " Personal Auto | \n",
+ " SUV | \n",
+ "
\n",
+ " \n",
+ "
\n",
+ "
996 rows × 11 columns
\n",
+ "
"
+ ],
+ "text/plain": [
+ " Customer ST GENDER Education Customer Lifetime Value Income \\\n",
+ "0 GS98873 Arizona F Bachelor 323912.47% 16061 \n",
+ "1 CW49887 California F Master 462680.11% 79487 \n",
+ "2 MY31220 California F College 899704.02% 54230 \n",
+ "3 UH35128 Oregon F College 2580706.30% 71210 \n",
+ "4 WH52799 Arizona F College 380812.21% 94903 \n",
+ ".. ... ... ... ... ... ... \n",
+ "991 HV85198 Arizona M Master 847141.75% 63513 \n",
+ "992 BS91566 Arizona F College 543121.91% 58161 \n",
+ "993 IL40123 Nevada F College 568964.41% 83640 \n",
+ "994 MY32149 California F Master 368672.38% 0 \n",
+ "995 SA91515 California M Bachelor 399258.39% 0 \n",
+ "\n",
+ " Monthly Premium Auto Number of Open Complaints Total Claim Amount \\\n",
+ "0 88 1/0/00 633.600000 \n",
+ "1 114 1/0/00 547.200000 \n",
+ "2 112 1/0/00 537.600000 \n",
+ "3 214 1/1/00 1027.200000 \n",
+ "4 94 1/0/00 451.200000 \n",
+ ".. ... ... ... \n",
+ "991 70 1/0/00 185.667213 \n",
+ "992 68 1/0/00 140.747286 \n",
+ "993 70 1/0/00 471.050488 \n",
+ "994 96 1/0/00 28.460568 \n",
+ "995 111 1/0/00 700.349052 \n",
+ "\n",
+ " Policy Type Vehicle Class \n",
+ "0 Personal Auto Four-Door Car \n",
+ "1 Special Auto SUV \n",
+ "2 Personal Auto Two-Door Car \n",
+ "3 Personal Auto Luxury Car \n",
+ "4 Corporate Auto Two-Door Car \n",
+ ".. ... ... \n",
+ "991 Personal Auto Four-Door Car \n",
+ "992 Corporate Auto Four-Door Car \n",
+ "993 Corporate Auto Two-Door Car \n",
+ "994 Personal Auto Two-Door Car \n",
+ "995 Personal Auto SUV \n",
+ "\n",
+ "[996 rows x 11 columns]"
+ ]
+ },
+ "execution_count": 102,
+ "metadata": {},
+ "output_type": "execute_result"
+ }
+ ],
+ "source": [
+ "tab2_data = pd.read_csv(r'C:\\Users\\david\\OneDrive\\Ambiente de Trabalho\\Iron Hack\\ficheiros para LAB PANDA 1\\file2.csv')\n",
+ "\n",
+ "tab2_data\n"
+ ]
+ },
+ {
+ "cell_type": "code",
+ "execution_count": 103,
+ "id": "5698462b",
+ "metadata": {},
+ "outputs": [
+ {
+ "data": {
+ "text/html": [
+ "\n",
+ "\n",
+ "
\n",
+ " \n",
+ " \n",
+ " | \n",
+ " Customer | \n",
+ " State | \n",
+ " Customer Lifetime Value | \n",
+ " Education | \n",
+ " Gender | \n",
+ " Income | \n",
+ " Monthly Premium Auto | \n",
+ " Number of Open Complaints | \n",
+ " Policy Type | \n",
+ " Total Claim Amount | \n",
+ " Vehicle Class | \n",
+ "
\n",
+ " \n",
+ " \n",
+ " \n",
+ " 0 | \n",
+ " SA25987 | \n",
+ " Washington | \n",
+ " 3479.137523 | \n",
+ " High School or Below | \n",
+ " M | \n",
+ " 0 | \n",
+ " 104 | \n",
+ " 0 | \n",
+ " Personal Auto | \n",
+ " 499.200000 | \n",
+ " Two-Door Car | \n",
+ "
\n",
+ " \n",
+ " 1 | \n",
+ " TB86706 | \n",
+ " Arizona | \n",
+ " 2502.637401 | \n",
+ " Master | \n",
+ " M | \n",
+ " 0 | \n",
+ " 66 | \n",
+ " 0 | \n",
+ " Personal Auto | \n",
+ " 3.468912 | \n",
+ " Two-Door Car | \n",
+ "
\n",
+ " \n",
+ " 2 | \n",
+ " ZL73902 | \n",
+ " Nevada | \n",
+ " 3265.156348 | \n",
+ " Bachelor | \n",
+ " F | \n",
+ " 25820 | \n",
+ " 82 | \n",
+ " 0 | \n",
+ " Personal Auto | \n",
+ " 393.600000 | \n",
+ " Four-Door Car | \n",
+ "
\n",
+ " \n",
+ " 3 | \n",
+ " KX23516 | \n",
+ " California | \n",
+ " 4455.843406 | \n",
+ " High School or Below | \n",
+ " F | \n",
+ " 0 | \n",
+ " 121 | \n",
+ " 0 | \n",
+ " Personal Auto | \n",
+ " 699.615192 | \n",
+ " SUV | \n",
+ "
\n",
+ " \n",
+ " 4 | \n",
+ " FN77294 | \n",
+ " California | \n",
+ " 7704.958480 | \n",
+ " High School or Below | \n",
+ " M | \n",
+ " 30366 | \n",
+ " 101 | \n",
+ " 2 | \n",
+ " Personal Auto | \n",
+ " 484.800000 | \n",
+ " SUV | \n",
+ "
\n",
+ " \n",
+ " ... | \n",
+ " ... | \n",
+ " ... | \n",
+ " ... | \n",
+ " ... | \n",
+ " ... | \n",
+ " ... | \n",
+ " ... | \n",
+ " ... | \n",
+ " ... | \n",
+ " ... | \n",
+ " ... | \n",
+ "
\n",
+ " \n",
+ " 7065 | \n",
+ " LA72316 | \n",
+ " California | \n",
+ " 23405.987980 | \n",
+ " Bachelor | \n",
+ " M | \n",
+ " 71941 | \n",
+ " 73 | \n",
+ " 0 | \n",
+ " Personal Auto | \n",
+ " 198.234764 | \n",
+ " Four-Door Car | \n",
+ "
\n",
+ " \n",
+ " 7066 | \n",
+ " PK87824 | \n",
+ " California | \n",
+ " 3096.511217 | \n",
+ " College | \n",
+ " F | \n",
+ " 21604 | \n",
+ " 79 | \n",
+ " 0 | \n",
+ " Corporate Auto | \n",
+ " 379.200000 | \n",
+ " Four-Door Car | \n",
+ "
\n",
+ " \n",
+ " 7067 | \n",
+ " TD14365 | \n",
+ " California | \n",
+ " 8163.890428 | \n",
+ " Bachelor | \n",
+ " M | \n",
+ " 0 | \n",
+ " 85 | \n",
+ " 3 | \n",
+ " Corporate Auto | \n",
+ " 790.784983 | \n",
+ " Four-Door Car | \n",
+ "
\n",
+ " \n",
+ " 7068 | \n",
+ " UP19263 | \n",
+ " California | \n",
+ " 7524.442436 | \n",
+ " College | \n",
+ " M | \n",
+ " 21941 | \n",
+ " 96 | \n",
+ " 0 | \n",
+ " Personal Auto | \n",
+ " 691.200000 | \n",
+ " Four-Door Car | \n",
+ "
\n",
+ " \n",
+ " 7069 | \n",
+ " Y167826 | \n",
+ " California | \n",
+ " 2611.836866 | \n",
+ " College | \n",
+ " M | \n",
+ " 0 | \n",
+ " 77 | \n",
+ " 0 | \n",
+ " Corporate Auto | \n",
+ " 369.600000 | \n",
+ " Two-Door Car | \n",
+ "
\n",
+ " \n",
+ "
\n",
+ "
7070 rows × 11 columns
\n",
+ "
"
+ ],
+ "text/plain": [
+ " Customer State Customer Lifetime Value Education \\\n",
+ "0 SA25987 Washington 3479.137523 High School or Below \n",
+ "1 TB86706 Arizona 2502.637401 Master \n",
+ "2 ZL73902 Nevada 3265.156348 Bachelor \n",
+ "3 KX23516 California 4455.843406 High School or Below \n",
+ "4 FN77294 California 7704.958480 High School or Below \n",
+ "... ... ... ... ... \n",
+ "7065 LA72316 California 23405.987980 Bachelor \n",
+ "7066 PK87824 California 3096.511217 College \n",
+ "7067 TD14365 California 8163.890428 Bachelor \n",
+ "7068 UP19263 California 7524.442436 College \n",
+ "7069 Y167826 California 2611.836866 College \n",
+ "\n",
+ " Gender Income Monthly Premium Auto Number of Open Complaints \\\n",
+ "0 M 0 104 0 \n",
+ "1 M 0 66 0 \n",
+ "2 F 25820 82 0 \n",
+ "3 F 0 121 0 \n",
+ "4 M 30366 101 2 \n",
+ "... ... ... ... ... \n",
+ "7065 M 71941 73 0 \n",
+ "7066 F 21604 79 0 \n",
+ "7067 M 0 85 3 \n",
+ "7068 M 21941 96 0 \n",
+ "7069 M 0 77 0 \n",
+ "\n",
+ " Policy Type Total Claim Amount Vehicle Class \n",
+ "0 Personal Auto 499.200000 Two-Door Car \n",
+ "1 Personal Auto 3.468912 Two-Door Car \n",
+ "2 Personal Auto 393.600000 Four-Door Car \n",
+ "3 Personal Auto 699.615192 SUV \n",
+ "4 Personal Auto 484.800000 SUV \n",
+ "... ... ... ... \n",
+ "7065 Personal Auto 198.234764 Four-Door Car \n",
+ "7066 Corporate Auto 379.200000 Four-Door Car \n",
+ "7067 Corporate Auto 790.784983 Four-Door Car \n",
+ "7068 Personal Auto 691.200000 Four-Door Car \n",
+ "7069 Corporate Auto 369.600000 Two-Door Car \n",
+ "\n",
+ "[7070 rows x 11 columns]"
+ ]
+ },
+ "execution_count": 103,
+ "metadata": {},
+ "output_type": "execute_result"
+ }
+ ],
+ "source": [
+ "tab3_data = pd.read_csv(r'C:\\Users\\david\\OneDrive\\Ambiente de Trabalho\\Iron Hack\\ficheiros para LAB PANDA 1\\file3.csv')\n",
+ "\n",
+ "tab3_data\n",
+ "\n"
+ ]
+ },
+ {
+ "cell_type": "code",
+ "execution_count": 104,
+ "id": "10a878b6",
+ "metadata": {},
+ "outputs": [
+ {
+ "data": {
+ "text/plain": [
+ "(7070, 11)"
+ ]
+ },
+ "execution_count": 104,
+ "metadata": {},
+ "output_type": "execute_result"
+ }
+ ],
+ "source": [
+ " # SHOW THE DATAFRAME'S SHAPE\n",
+ "\n",
+ "tab1_data.shape\n",
+ "tab2_data.shape\n",
+ "tab3_data.shape\n"
+ ]
+ },
+ {
+ "cell_type": "code",
+ "execution_count": 105,
+ "id": "7eaccb15",
+ "metadata": {},
+ "outputs": [
+ {
+ "data": {
+ "text/html": [
+ "\n",
+ "\n",
+ "
\n",
+ " \n",
+ " \n",
+ " | \n",
+ " customer | \n",
+ " st | \n",
+ " gender | \n",
+ " education | \n",
+ " customer_lifetime_value | \n",
+ " income | \n",
+ " monthly_premium_auto | \n",
+ " number_of_open_complaints | \n",
+ " policy_type | \n",
+ " vehicle_class | \n",
+ " total_claim_amount | \n",
+ "
\n",
+ " \n",
+ " \n",
+ " \n",
+ " 0 | \n",
+ " RB50392 | \n",
+ " Washington | \n",
+ " NaN | \n",
+ " Master | \n",
+ " NaN | \n",
+ " 0.0 | \n",
+ " 1000.0 | \n",
+ " 1/0/00 | \n",
+ " Personal Auto | \n",
+ " Four-Door Car | \n",
+ " 2.704934 | \n",
+ "
\n",
+ " \n",
+ " 1 | \n",
+ " QZ44356 | \n",
+ " Arizona | \n",
+ " F | \n",
+ " Bachelor | \n",
+ " 697953.59% | \n",
+ " 0.0 | \n",
+ " 94.0 | \n",
+ " 1/0/00 | \n",
+ " Personal Auto | \n",
+ " Four-Door Car | \n",
+ " 1131.464935 | \n",
+ "
\n",
+ " \n",
+ " 2 | \n",
+ " AI49188 | \n",
+ " Nevada | \n",
+ " F | \n",
+ " Bachelor | \n",
+ " 1288743.17% | \n",
+ " 48767.0 | \n",
+ " 108.0 | \n",
+ " 1/0/00 | \n",
+ " Personal Auto | \n",
+ " Two-Door Car | \n",
+ " 566.472247 | \n",
+ "
\n",
+ " \n",
+ " 3 | \n",
+ " WW63253 | \n",
+ " California | \n",
+ " M | \n",
+ " Bachelor | \n",
+ " 764586.18% | \n",
+ " 0.0 | \n",
+ " 106.0 | \n",
+ " 1/0/00 | \n",
+ " Corporate Auto | \n",
+ " SUV | \n",
+ " 529.881344 | \n",
+ "
\n",
+ " \n",
+ " 4 | \n",
+ " GA49547 | \n",
+ " Washington | \n",
+ " M | \n",
+ " High School or Below | \n",
+ " 536307.65% | \n",
+ " 36357.0 | \n",
+ " 68.0 | \n",
+ " 1/0/00 | \n",
+ " Personal Auto | \n",
+ " Four-Door Car | \n",
+ " 17.269323 | \n",
+ "
\n",
+ " \n",
+ " ... | \n",
+ " ... | \n",
+ " ... | \n",
+ " ... | \n",
+ " ... | \n",
+ " ... | \n",
+ " ... | \n",
+ " ... | \n",
+ " ... | \n",
+ " ... | \n",
+ " ... | \n",
+ " ... | \n",
+ "
\n",
+ " \n",
+ " 4003 | \n",
+ " NaN | \n",
+ " NaN | \n",
+ " NaN | \n",
+ " NaN | \n",
+ " NaN | \n",
+ " NaN | \n",
+ " NaN | \n",
+ " NaN | \n",
+ " NaN | \n",
+ " NaN | \n",
+ " NaN | \n",
+ "
\n",
+ " \n",
+ " 4004 | \n",
+ " NaN | \n",
+ " NaN | \n",
+ " NaN | \n",
+ " NaN | \n",
+ " NaN | \n",
+ " NaN | \n",
+ " NaN | \n",
+ " NaN | \n",
+ " NaN | \n",
+ " NaN | \n",
+ " NaN | \n",
+ "
\n",
+ " \n",
+ " 4005 | \n",
+ " NaN | \n",
+ " NaN | \n",
+ " NaN | \n",
+ " NaN | \n",
+ " NaN | \n",
+ " NaN | \n",
+ " NaN | \n",
+ " NaN | \n",
+ " NaN | \n",
+ " NaN | \n",
+ " NaN | \n",
+ "
\n",
+ " \n",
+ " 4006 | \n",
+ " NaN | \n",
+ " NaN | \n",
+ " NaN | \n",
+ " NaN | \n",
+ " NaN | \n",
+ " NaN | \n",
+ " NaN | \n",
+ " NaN | \n",
+ " NaN | \n",
+ " NaN | \n",
+ " NaN | \n",
+ "
\n",
+ " \n",
+ " 4007 | \n",
+ " NaN | \n",
+ " NaN | \n",
+ " NaN | \n",
+ " NaN | \n",
+ " NaN | \n",
+ " NaN | \n",
+ " NaN | \n",
+ " NaN | \n",
+ " NaN | \n",
+ " NaN | \n",
+ " NaN | \n",
+ "
\n",
+ " \n",
+ "
\n",
+ "
4008 rows × 11 columns
\n",
+ "
"
+ ],
+ "text/plain": [
+ " customer st gender education \\\n",
+ "0 RB50392 Washington NaN Master \n",
+ "1 QZ44356 Arizona F Bachelor \n",
+ "2 AI49188 Nevada F Bachelor \n",
+ "3 WW63253 California M Bachelor \n",
+ "4 GA49547 Washington M High School or Below \n",
+ "... ... ... ... ... \n",
+ "4003 NaN NaN NaN NaN \n",
+ "4004 NaN NaN NaN NaN \n",
+ "4005 NaN NaN NaN NaN \n",
+ "4006 NaN NaN NaN NaN \n",
+ "4007 NaN NaN NaN NaN \n",
+ "\n",
+ " customer_lifetime_value income monthly_premium_auto \\\n",
+ "0 NaN 0.0 1000.0 \n",
+ "1 697953.59% 0.0 94.0 \n",
+ "2 1288743.17% 48767.0 108.0 \n",
+ "3 764586.18% 0.0 106.0 \n",
+ "4 536307.65% 36357.0 68.0 \n",
+ "... ... ... ... \n",
+ "4003 NaN NaN NaN \n",
+ "4004 NaN NaN NaN \n",
+ "4005 NaN NaN NaN \n",
+ "4006 NaN NaN NaN \n",
+ "4007 NaN NaN NaN \n",
+ "\n",
+ " number_of_open_complaints policy_type vehicle_class \\\n",
+ "0 1/0/00 Personal Auto Four-Door Car \n",
+ "1 1/0/00 Personal Auto Four-Door Car \n",
+ "2 1/0/00 Personal Auto Two-Door Car \n",
+ "3 1/0/00 Corporate Auto SUV \n",
+ "4 1/0/00 Personal Auto Four-Door Car \n",
+ "... ... ... ... \n",
+ "4003 NaN NaN NaN \n",
+ "4004 NaN NaN NaN \n",
+ "4005 NaN NaN NaN \n",
+ "4006 NaN NaN NaN \n",
+ "4007 NaN NaN NaN \n",
+ "\n",
+ " total_claim_amount \n",
+ "0 2.704934 \n",
+ "1 1131.464935 \n",
+ "2 566.472247 \n",
+ "3 529.881344 \n",
+ "4 17.269323 \n",
+ "... ... \n",
+ "4003 NaN \n",
+ "4004 NaN \n",
+ "4005 NaN \n",
+ "4006 NaN \n",
+ "4007 NaN \n",
+ "\n",
+ "[4008 rows x 11 columns]"
+ ]
+ },
+ "execution_count": 105,
+ "metadata": {},
+ "output_type": "execute_result"
+ }
+ ],
+ "source": [
+    "    # STANDARDIZE HEADER NAMES TABLE 1\n",
+ " \n",
+ "cols = []\n",
+ "for i in range(len(tab1_data.columns)): \n",
+ " cols.append(tab1_data.columns[i].lower().replace(' ', '_')) \n",
+ "tab1_data.columns = cols\n",
+ "tab1_data\n"
+ ]
+ },
+ {
+ "cell_type": "code",
+ "execution_count": 106,
+ "id": "bb444eec",
+ "metadata": {},
+ "outputs": [
+ {
+ "data": {
+ "text/html": [
+ "\n",
+ "\n",
+ "
\n",
+ " \n",
+ " \n",
+ " | \n",
+ " customer | \n",
+ " st | \n",
+ " gender | \n",
+ " education | \n",
+ " customer_lifetime_value | \n",
+ " income | \n",
+ " monthly_premium_auto | \n",
+ " number_of_open_complaints | \n",
+ " total_claim_amount | \n",
+ " policy_type | \n",
+ " vehicle_class | \n",
+ "
\n",
+ " \n",
+ " \n",
+ " \n",
+ " 0 | \n",
+ " GS98873 | \n",
+ " Arizona | \n",
+ " F | \n",
+ " Bachelor | \n",
+ " 323912.47% | \n",
+ " 16061 | \n",
+ " 88 | \n",
+ " 1/0/00 | \n",
+ " 633.600000 | \n",
+ " Personal Auto | \n",
+ " Four-Door Car | \n",
+ "
\n",
+ " \n",
+ " 1 | \n",
+ " CW49887 | \n",
+ " California | \n",
+ " F | \n",
+ " Master | \n",
+ " 462680.11% | \n",
+ " 79487 | \n",
+ " 114 | \n",
+ " 1/0/00 | \n",
+ " 547.200000 | \n",
+ " Special Auto | \n",
+ " SUV | \n",
+ "
\n",
+ " \n",
+ " 2 | \n",
+ " MY31220 | \n",
+ " California | \n",
+ " F | \n",
+ " College | \n",
+ " 899704.02% | \n",
+ " 54230 | \n",
+ " 112 | \n",
+ " 1/0/00 | \n",
+ " 537.600000 | \n",
+ " Personal Auto | \n",
+ " Two-Door Car | \n",
+ "
\n",
+ " \n",
+ " 3 | \n",
+ " UH35128 | \n",
+ " Oregon | \n",
+ " F | \n",
+ " College | \n",
+ " 2580706.30% | \n",
+ " 71210 | \n",
+ " 214 | \n",
+ " 1/1/00 | \n",
+ " 1027.200000 | \n",
+ " Personal Auto | \n",
+ " Luxury Car | \n",
+ "
\n",
+ " \n",
+ " 4 | \n",
+ " WH52799 | \n",
+ " Arizona | \n",
+ " F | \n",
+ " College | \n",
+ " 380812.21% | \n",
+ " 94903 | \n",
+ " 94 | \n",
+ " 1/0/00 | \n",
+ " 451.200000 | \n",
+ " Corporate Auto | \n",
+ " Two-Door Car | \n",
+ "
\n",
+ " \n",
+ " ... | \n",
+ " ... | \n",
+ " ... | \n",
+ " ... | \n",
+ " ... | \n",
+ " ... | \n",
+ " ... | \n",
+ " ... | \n",
+ " ... | \n",
+ " ... | \n",
+ " ... | \n",
+ " ... | \n",
+ "
\n",
+ " \n",
+ " 991 | \n",
+ " HV85198 | \n",
+ " Arizona | \n",
+ " M | \n",
+ " Master | \n",
+ " 847141.75% | \n",
+ " 63513 | \n",
+ " 70 | \n",
+ " 1/0/00 | \n",
+ " 185.667213 | \n",
+ " Personal Auto | \n",
+ " Four-Door Car | \n",
+ "
\n",
+ " \n",
+ " 992 | \n",
+ " BS91566 | \n",
+ " Arizona | \n",
+ " F | \n",
+ " College | \n",
+ " 543121.91% | \n",
+ " 58161 | \n",
+ " 68 | \n",
+ " 1/0/00 | \n",
+ " 140.747286 | \n",
+ " Corporate Auto | \n",
+ " Four-Door Car | \n",
+ "
\n",
+ " \n",
+ " 993 | \n",
+ " IL40123 | \n",
+ " Nevada | \n",
+ " F | \n",
+ " College | \n",
+ " 568964.41% | \n",
+ " 83640 | \n",
+ " 70 | \n",
+ " 1/0/00 | \n",
+ " 471.050488 | \n",
+ " Corporate Auto | \n",
+ " Two-Door Car | \n",
+ "
\n",
+ " \n",
+ " 994 | \n",
+ " MY32149 | \n",
+ " California | \n",
+ " F | \n",
+ " Master | \n",
+ " 368672.38% | \n",
+ " 0 | \n",
+ " 96 | \n",
+ " 1/0/00 | \n",
+ " 28.460568 | \n",
+ " Personal Auto | \n",
+ " Two-Door Car | \n",
+ "
\n",
+ " \n",
+ " 995 | \n",
+ " SA91515 | \n",
+ " California | \n",
+ " M | \n",
+ " Bachelor | \n",
+ " 399258.39% | \n",
+ " 0 | \n",
+ " 111 | \n",
+ " 1/0/00 | \n",
+ " 700.349052 | \n",
+ " Personal Auto | \n",
+ " SUV | \n",
+ "
\n",
+ " \n",
+ "
\n",
+ "
996 rows × 11 columns
\n",
+ "
"
+ ],
+ "text/plain": [
+ " customer st gender education customer_lifetime_value income \\\n",
+ "0 GS98873 Arizona F Bachelor 323912.47% 16061 \n",
+ "1 CW49887 California F Master 462680.11% 79487 \n",
+ "2 MY31220 California F College 899704.02% 54230 \n",
+ "3 UH35128 Oregon F College 2580706.30% 71210 \n",
+ "4 WH52799 Arizona F College 380812.21% 94903 \n",
+ ".. ... ... ... ... ... ... \n",
+ "991 HV85198 Arizona M Master 847141.75% 63513 \n",
+ "992 BS91566 Arizona F College 543121.91% 58161 \n",
+ "993 IL40123 Nevada F College 568964.41% 83640 \n",
+ "994 MY32149 California F Master 368672.38% 0 \n",
+ "995 SA91515 California M Bachelor 399258.39% 0 \n",
+ "\n",
+ " monthly_premium_auto number_of_open_complaints total_claim_amount \\\n",
+ "0 88 1/0/00 633.600000 \n",
+ "1 114 1/0/00 547.200000 \n",
+ "2 112 1/0/00 537.600000 \n",
+ "3 214 1/1/00 1027.200000 \n",
+ "4 94 1/0/00 451.200000 \n",
+ ".. ... ... ... \n",
+ "991 70 1/0/00 185.667213 \n",
+ "992 68 1/0/00 140.747286 \n",
+ "993 70 1/0/00 471.050488 \n",
+ "994 96 1/0/00 28.460568 \n",
+ "995 111 1/0/00 700.349052 \n",
+ "\n",
+ " policy_type vehicle_class \n",
+ "0 Personal Auto Four-Door Car \n",
+ "1 Special Auto SUV \n",
+ "2 Personal Auto Two-Door Car \n",
+ "3 Personal Auto Luxury Car \n",
+ "4 Corporate Auto Two-Door Car \n",
+ ".. ... ... \n",
+ "991 Personal Auto Four-Door Car \n",
+ "992 Corporate Auto Four-Door Car \n",
+ "993 Corporate Auto Two-Door Car \n",
+ "994 Personal Auto Two-Door Car \n",
+ "995 Personal Auto SUV \n",
+ "\n",
+ "[996 rows x 11 columns]"
+ ]
+ },
+ "execution_count": 106,
+ "metadata": {},
+ "output_type": "execute_result"
+ }
+ ],
+ "source": [
+    "# STANDARDIZE HEADER NAMES TABLE 2\n",
+ " \n",
+ "cols = []\n",
+ "for i in range(len(tab2_data.columns)): \n",
+ " cols.append(tab2_data.columns[i].lower().replace(' ', '_')) \n",
+ "tab2_data.columns = cols\n",
+ "tab2_data\n"
+ ]
+ },
+ {
+ "cell_type": "code",
+ "execution_count": 107,
+ "id": "0fcf53af",
+ "metadata": {},
+ "outputs": [
+ {
+ "data": {
+ "text/html": [
+ "\n",
+ "\n",
+ "
\n",
+ " \n",
+ " \n",
+ " | \n",
+ " customer | \n",
+ " state | \n",
+ " customer_lifetime_value | \n",
+ " education | \n",
+ " gender | \n",
+ " income | \n",
+ " monthly_premium_auto | \n",
+ " number_of_open_complaints | \n",
+ " policy_type | \n",
+ " total_claim_amount | \n",
+ " vehicle_class | \n",
+ "
\n",
+ " \n",
+ " \n",
+ " \n",
+ " 0 | \n",
+ " SA25987 | \n",
+ " Washington | \n",
+ " 3479.137523 | \n",
+ " High School or Below | \n",
+ " M | \n",
+ " 0 | \n",
+ " 104 | \n",
+ " 0 | \n",
+ " Personal Auto | \n",
+ " 499.200000 | \n",
+ " Two-Door Car | \n",
+ "
\n",
+ " \n",
+ " 1 | \n",
+ " TB86706 | \n",
+ " Arizona | \n",
+ " 2502.637401 | \n",
+ " Master | \n",
+ " M | \n",
+ " 0 | \n",
+ " 66 | \n",
+ " 0 | \n",
+ " Personal Auto | \n",
+ " 3.468912 | \n",
+ " Two-Door Car | \n",
+ "
\n",
+ " \n",
+ " 2 | \n",
+ " ZL73902 | \n",
+ " Nevada | \n",
+ " 3265.156348 | \n",
+ " Bachelor | \n",
+ " F | \n",
+ " 25820 | \n",
+ " 82 | \n",
+ " 0 | \n",
+ " Personal Auto | \n",
+ " 393.600000 | \n",
+ " Four-Door Car | \n",
+ "
\n",
+ " \n",
+ " 3 | \n",
+ " KX23516 | \n",
+ " California | \n",
+ " 4455.843406 | \n",
+ " High School or Below | \n",
+ " F | \n",
+ " 0 | \n",
+ " 121 | \n",
+ " 0 | \n",
+ " Personal Auto | \n",
+ " 699.615192 | \n",
+ " SUV | \n",
+ "
\n",
+ " \n",
+ " 4 | \n",
+ " FN77294 | \n",
+ " California | \n",
+ " 7704.958480 | \n",
+ " High School or Below | \n",
+ " M | \n",
+ " 30366 | \n",
+ " 101 | \n",
+ " 2 | \n",
+ " Personal Auto | \n",
+ " 484.800000 | \n",
+ " SUV | \n",
+ "
\n",
+ " \n",
+ " ... | \n",
+ " ... | \n",
+ " ... | \n",
+ " ... | \n",
+ " ... | \n",
+ " ... | \n",
+ " ... | \n",
+ " ... | \n",
+ " ... | \n",
+ " ... | \n",
+ " ... | \n",
+ " ... | \n",
+ "
\n",
+ " \n",
+ " 7065 | \n",
+ " LA72316 | \n",
+ " California | \n",
+ " 23405.987980 | \n",
+ " Bachelor | \n",
+ " M | \n",
+ " 71941 | \n",
+ " 73 | \n",
+ " 0 | \n",
+ " Personal Auto | \n",
+ " 198.234764 | \n",
+ " Four-Door Car | \n",
+ "
\n",
+ " \n",
+ " 7066 | \n",
+ " PK87824 | \n",
+ " California | \n",
+ " 3096.511217 | \n",
+ " College | \n",
+ " F | \n",
+ " 21604 | \n",
+ " 79 | \n",
+ " 0 | \n",
+ " Corporate Auto | \n",
+ " 379.200000 | \n",
+ " Four-Door Car | \n",
+ "
\n",
+ " \n",
+ " 7067 | \n",
+ " TD14365 | \n",
+ " California | \n",
+ " 8163.890428 | \n",
+ " Bachelor | \n",
+ " M | \n",
+ " 0 | \n",
+ " 85 | \n",
+ " 3 | \n",
+ " Corporate Auto | \n",
+ " 790.784983 | \n",
+ " Four-Door Car | \n",
+ "
\n",
+ " \n",
+ " 7068 | \n",
+ " UP19263 | \n",
+ " California | \n",
+ " 7524.442436 | \n",
+ " College | \n",
+ " M | \n",
+ " 21941 | \n",
+ " 96 | \n",
+ " 0 | \n",
+ " Personal Auto | \n",
+ " 691.200000 | \n",
+ " Four-Door Car | \n",
+ "
\n",
+ " \n",
+ " 7069 | \n",
+ " Y167826 | \n",
+ " California | \n",
+ " 2611.836866 | \n",
+ " College | \n",
+ " M | \n",
+ " 0 | \n",
+ " 77 | \n",
+ " 0 | \n",
+ " Corporate Auto | \n",
+ " 369.600000 | \n",
+ " Two-Door Car | \n",
+ "
\n",
+ " \n",
+ "
\n",
+ "
7070 rows × 11 columns
\n",
+ "
"
+ ],
+ "text/plain": [
+ " customer state customer_lifetime_value education \\\n",
+ "0 SA25987 Washington 3479.137523 High School or Below \n",
+ "1 TB86706 Arizona 2502.637401 Master \n",
+ "2 ZL73902 Nevada 3265.156348 Bachelor \n",
+ "3 KX23516 California 4455.843406 High School or Below \n",
+ "4 FN77294 California 7704.958480 High School or Below \n",
+ "... ... ... ... ... \n",
+ "7065 LA72316 California 23405.987980 Bachelor \n",
+ "7066 PK87824 California 3096.511217 College \n",
+ "7067 TD14365 California 8163.890428 Bachelor \n",
+ "7068 UP19263 California 7524.442436 College \n",
+ "7069 Y167826 California 2611.836866 College \n",
+ "\n",
+ " gender income monthly_premium_auto number_of_open_complaints \\\n",
+ "0 M 0 104 0 \n",
+ "1 M 0 66 0 \n",
+ "2 F 25820 82 0 \n",
+ "3 F 0 121 0 \n",
+ "4 M 30366 101 2 \n",
+ "... ... ... ... ... \n",
+ "7065 M 71941 73 0 \n",
+ "7066 F 21604 79 0 \n",
+ "7067 M 0 85 3 \n",
+ "7068 M 21941 96 0 \n",
+ "7069 M 0 77 0 \n",
+ "\n",
+ " policy_type total_claim_amount vehicle_class \n",
+ "0 Personal Auto 499.200000 Two-Door Car \n",
+ "1 Personal Auto 3.468912 Two-Door Car \n",
+ "2 Personal Auto 393.600000 Four-Door Car \n",
+ "3 Personal Auto 699.615192 SUV \n",
+ "4 Personal Auto 484.800000 SUV \n",
+ "... ... ... ... \n",
+ "7065 Personal Auto 198.234764 Four-Door Car \n",
+ "7066 Corporate Auto 379.200000 Four-Door Car \n",
+ "7067 Corporate Auto 790.784983 Four-Door Car \n",
+ "7068 Personal Auto 691.200000 Four-Door Car \n",
+ "7069 Corporate Auto 369.600000 Two-Door Car \n",
+ "\n",
+ "[7070 rows x 11 columns]"
+ ]
+ },
+ "execution_count": 107,
+ "metadata": {},
+ "output_type": "execute_result"
+ }
+ ],
+ "source": [
+    "# STANDARDIZE HEADER NAMES TABLE 3\n",
+ " \n",
+ "cols = []\n",
+ "for i in range(len(tab3_data.columns)): \n",
+ " cols.append(tab3_data.columns[i].lower().replace(' ', '_')) \n",
+ "tab3_data.columns = cols\n",
+ "tab3_data\n",
+ "\n"
+ ]
+ },
+ {
+ "cell_type": "code",
+ "execution_count": 90,
+ "id": "552a0b18",
+ "metadata": {},
+ "outputs": [],
+ "source": [
+ "# REARRANGE THE COLUMNS IN THE DATAFRAME AS NEEDED\n",
+ "\n",
+ "\n",
+ "\n",
+ "\n"
+ ]
+ },
+ {
+ "cell_type": "code",
+ "execution_count": 108,
+ "id": "a57f4cef",
+ "metadata": {},
+ "outputs": [
+ {
+ "data": {
+ "text/html": [
+ "\n",
+ "\n",
+ "
\n",
+ " \n",
+ " \n",
+ " | \n",
+ " customer | \n",
+ " st | \n",
+ " gender | \n",
+ " education | \n",
+ " customer_lifetime_value | \n",
+ " income | \n",
+ " monthly_premium_auto | \n",
+ " number_of_open_complaints | \n",
+ " policy_type | \n",
+ " vehicle_class | \n",
+ " total_claim_amount | \n",
+ " state | \n",
+ "
\n",
+ " \n",
+ " \n",
+ " \n",
+ " 0 | \n",
+ " RB50392 | \n",
+ " Washington | \n",
+ " NaN | \n",
+ " Master | \n",
+ " NaN | \n",
+ " 0.0 | \n",
+ " 1000.0 | \n",
+ " 1/0/00 | \n",
+ " Personal Auto | \n",
+ " Four-Door Car | \n",
+ " 2.704934 | \n",
+ " NaN | \n",
+ "
\n",
+ " \n",
+ " 1 | \n",
+ " QZ44356 | \n",
+ " Arizona | \n",
+ " F | \n",
+ " Bachelor | \n",
+ " 697953.59% | \n",
+ " 0.0 | \n",
+ " 94.0 | \n",
+ " 1/0/00 | \n",
+ " Personal Auto | \n",
+ " Four-Door Car | \n",
+ " 1131.464935 | \n",
+ " NaN | \n",
+ "
\n",
+ " \n",
+ " 2 | \n",
+ " AI49188 | \n",
+ " Nevada | \n",
+ " F | \n",
+ " Bachelor | \n",
+ " 1288743.17% | \n",
+ " 48767.0 | \n",
+ " 108.0 | \n",
+ " 1/0/00 | \n",
+ " Personal Auto | \n",
+ " Two-Door Car | \n",
+ " 566.472247 | \n",
+ " NaN | \n",
+ "
\n",
+ " \n",
+ " 3 | \n",
+ " WW63253 | \n",
+ " California | \n",
+ " M | \n",
+ " Bachelor | \n",
+ " 764586.18% | \n",
+ " 0.0 | \n",
+ " 106.0 | \n",
+ " 1/0/00 | \n",
+ " Corporate Auto | \n",
+ " SUV | \n",
+ " 529.881344 | \n",
+ " NaN | \n",
+ "
\n",
+ " \n",
+ " 4 | \n",
+ " GA49547 | \n",
+ " Washington | \n",
+ " M | \n",
+ " High School or Below | \n",
+ " 536307.65% | \n",
+ " 36357.0 | \n",
+ " 68.0 | \n",
+ " 1/0/00 | \n",
+ " Personal Auto | \n",
+ " Four-Door Car | \n",
+ " 17.269323 | \n",
+ " NaN | \n",
+ "
\n",
+ " \n",
+ " ... | \n",
+ " ... | \n",
+ " ... | \n",
+ " ... | \n",
+ " ... | \n",
+ " ... | \n",
+ " ... | \n",
+ " ... | \n",
+ " ... | \n",
+ " ... | \n",
+ " ... | \n",
+ " ... | \n",
+ " ... | \n",
+ "
\n",
+ " \n",
+ " 7065 | \n",
+ " LA72316 | \n",
+ " NaN | \n",
+ " M | \n",
+ " Bachelor | \n",
+ " 23405.98798 | \n",
+ " 71941.0 | \n",
+ " 73.0 | \n",
+ " 0 | \n",
+ " Personal Auto | \n",
+ " Four-Door Car | \n",
+ " 198.234764 | \n",
+ " California | \n",
+ "
\n",
+ " \n",
+ " 7066 | \n",
+ " PK87824 | \n",
+ " NaN | \n",
+ " F | \n",
+ " College | \n",
+ " 3096.511217 | \n",
+ " 21604.0 | \n",
+ " 79.0 | \n",
+ " 0 | \n",
+ " Corporate Auto | \n",
+ " Four-Door Car | \n",
+ " 379.200000 | \n",
+ " California | \n",
+ "
\n",
+ " \n",
+ " 7067 | \n",
+ " TD14365 | \n",
+ " NaN | \n",
+ " M | \n",
+ " Bachelor | \n",
+ " 8163.890428 | \n",
+ " 0.0 | \n",
+ " 85.0 | \n",
+ " 3 | \n",
+ " Corporate Auto | \n",
+ " Four-Door Car | \n",
+ " 790.784983 | \n",
+ " California | \n",
+ "
\n",
+ " \n",
+ " 7068 | \n",
+ " UP19263 | \n",
+ " NaN | \n",
+ " M | \n",
+ " College | \n",
+ " 7524.442436 | \n",
+ " 21941.0 | \n",
+ " 96.0 | \n",
+ " 0 | \n",
+ " Personal Auto | \n",
+ " Four-Door Car | \n",
+ " 691.200000 | \n",
+ " California | \n",
+ "
\n",
+ " \n",
+ " 7069 | \n",
+ " Y167826 | \n",
+ " NaN | \n",
+ " M | \n",
+ " College | \n",
+ " 2611.836866 | \n",
+ " 0.0 | \n",
+ " 77.0 | \n",
+ " 0 | \n",
+ " Corporate Auto | \n",
+ " Two-Door Car | \n",
+ " 369.600000 | \n",
+ " California | \n",
+ "
\n",
+ " \n",
+ "
\n",
+ "
12074 rows × 12 columns
\n",
+ "
"
+ ],
+ "text/plain": [
+ " customer st gender education \\\n",
+ "0 RB50392 Washington NaN Master \n",
+ "1 QZ44356 Arizona F Bachelor \n",
+ "2 AI49188 Nevada F Bachelor \n",
+ "3 WW63253 California M Bachelor \n",
+ "4 GA49547 Washington M High School or Below \n",
+ "... ... ... ... ... \n",
+ "7065 LA72316 NaN M Bachelor \n",
+ "7066 PK87824 NaN F College \n",
+ "7067 TD14365 NaN M Bachelor \n",
+ "7068 UP19263 NaN M College \n",
+ "7069 Y167826 NaN M College \n",
+ "\n",
+ " customer_lifetime_value income monthly_premium_auto \\\n",
+ "0 NaN 0.0 1000.0 \n",
+ "1 697953.59% 0.0 94.0 \n",
+ "2 1288743.17% 48767.0 108.0 \n",
+ "3 764586.18% 0.0 106.0 \n",
+ "4 536307.65% 36357.0 68.0 \n",
+ "... ... ... ... \n",
+ "7065 23405.98798 71941.0 73.0 \n",
+ "7066 3096.511217 21604.0 79.0 \n",
+ "7067 8163.890428 0.0 85.0 \n",
+ "7068 7524.442436 21941.0 96.0 \n",
+ "7069 2611.836866 0.0 77.0 \n",
+ "\n",
+ " number_of_open_complaints policy_type vehicle_class \\\n",
+ "0 1/0/00 Personal Auto Four-Door Car \n",
+ "1 1/0/00 Personal Auto Four-Door Car \n",
+ "2 1/0/00 Personal Auto Two-Door Car \n",
+ "3 1/0/00 Corporate Auto SUV \n",
+ "4 1/0/00 Personal Auto Four-Door Car \n",
+ "... ... ... ... \n",
+ "7065 0 Personal Auto Four-Door Car \n",
+ "7066 0 Corporate Auto Four-Door Car \n",
+ "7067 3 Corporate Auto Four-Door Car \n",
+ "7068 0 Personal Auto Four-Door Car \n",
+ "7069 0 Corporate Auto Two-Door Car \n",
+ "\n",
+ " total_claim_amount state \n",
+ "0 2.704934 NaN \n",
+ "1 1131.464935 NaN \n",
+ "2 566.472247 NaN \n",
+ "3 529.881344 NaN \n",
+ "4 17.269323 NaN \n",
+ "... ... ... \n",
+ "7065 198.234764 California \n",
+ "7066 379.200000 California \n",
+ "7067 790.784983 California \n",
+ "7068 691.200000 California \n",
+ "7069 369.600000 California \n",
+ "\n",
+ "[12074 rows x 12 columns]"
+ ]
+ },
+ "execution_count": 108,
+ "metadata": {},
+ "output_type": "execute_result"
+ }
+ ],
+ "source": [
+ "# CONCATENATE THE THREE DATAFRAMES\n",
+ "\n",
+ "datatotal_data = pd.concat([tab1_data,tab2_data,tab3_data], axis = 0) \n",
+ "\n",
+ "datatotal_data\n",
+ "\n"
+ ]
+ },
+ {
+ "cell_type": "code",
+ "execution_count": 92,
+ "id": "a2367b94",
+ "metadata": {},
+ "outputs": [
+ {
+ "data": {
+ "text/plain": [
+ "customer object\n",
+ "st object\n",
+ "gender object\n",
+ "education object\n",
+ "customer_lifetime_value object\n",
+ "income float64\n",
+ "monthly_premium_auto float64\n",
+ "number_of_open_complaints object\n",
+ "policy_type object\n",
+ "vehicle_class object\n",
+ "total_claim_amount float64\n",
+ "state object\n",
+ "dtype: object"
+ ]
+ },
+ "execution_count": 92,
+ "metadata": {},
+ "output_type": "execute_result"
+ }
+ ],
+ "source": [
+    "# QUESTION: WHICH COLUMNS ARE NUMERICAL?\n",
+ "# ANSWER: Income, monthly_premium_auto, total_claim_amount\n",
+ "\n",
+    "# QUESTION: WHICH COLUMNS ARE CATEGORICAL?\n",
+ "# ANSWER: customer, st, gender, education, customer_lifetime_value, number_of_open_complaints, policy_type, vehicle_class,state\n",
+ "\n",
+ "# UNDERSTAND THE MEANING OF ALL COLUMNS\n",
+ "# ANSWER:\n",
+ "\n",
+ "datatotal_data.dtypes\n",
+ "\n",
+ "\n"
+ ]
+ },
+ {
+ "cell_type": "code",
+ "execution_count": 93,
+ "id": "32de16d5",
+ "metadata": {},
+ "outputs": [
+ {
+ "data": {
+ "text/html": [
+ "\n",
+ "\n",
+ "
\n",
+ " \n",
+ " \n",
+ " | \n",
+ " customer | \n",
+ " st | \n",
+ " gender | \n",
+ " education | \n",
+ " customer_lifetime_value | \n",
+ " income | \n",
+ " monthly_premium_auto | \n",
+ " policy_type | \n",
+ " vehicle_class | \n",
+ " total_claim_amount | \n",
+ " state | \n",
+ "
\n",
+ " \n",
+ " \n",
+ " \n",
+ " 0 | \n",
+ " RB50392 | \n",
+ " Washington | \n",
+ " NaN | \n",
+ " Master | \n",
+ " NaN | \n",
+ " 0.0 | \n",
+ " 1000.0 | \n",
+ " Personal Auto | \n",
+ " Four-Door Car | \n",
+ " 2.704934 | \n",
+ " NaN | \n",
+ "
\n",
+ " \n",
+ " 1 | \n",
+ " QZ44356 | \n",
+ " Arizona | \n",
+ " F | \n",
+ " Bachelor | \n",
+ " 697953.59% | \n",
+ " 0.0 | \n",
+ " 94.0 | \n",
+ " Personal Auto | \n",
+ " Four-Door Car | \n",
+ " 1131.464935 | \n",
+ " NaN | \n",
+ "
\n",
+ " \n",
+ " 2 | \n",
+ " AI49188 | \n",
+ " Nevada | \n",
+ " F | \n",
+ " Bachelor | \n",
+ " 1288743.17% | \n",
+ " 48767.0 | \n",
+ " 108.0 | \n",
+ " Personal Auto | \n",
+ " Two-Door Car | \n",
+ " 566.472247 | \n",
+ " NaN | \n",
+ "
\n",
+ " \n",
+ " 3 | \n",
+ " WW63253 | \n",
+ " California | \n",
+ " M | \n",
+ " Bachelor | \n",
+ " 764586.18% | \n",
+ " 0.0 | \n",
+ " 106.0 | \n",
+ " Corporate Auto | \n",
+ " SUV | \n",
+ " 529.881344 | \n",
+ " NaN | \n",
+ "
\n",
+ " \n",
+ " 4 | \n",
+ " GA49547 | \n",
+ " Washington | \n",
+ " M | \n",
+ " High School or Below | \n",
+ " 536307.65% | \n",
+ " 36357.0 | \n",
+ " 68.0 | \n",
+ " Personal Auto | \n",
+ " Four-Door Car | \n",
+ " 17.269323 | \n",
+ " NaN | \n",
+ "
\n",
+ " \n",
+ " ... | \n",
+ " ... | \n",
+ " ... | \n",
+ " ... | \n",
+ " ... | \n",
+ " ... | \n",
+ " ... | \n",
+ " ... | \n",
+ " ... | \n",
+ " ... | \n",
+ " ... | \n",
+ " ... | \n",
+ "
\n",
+ " \n",
+ " 7065 | \n",
+ " LA72316 | \n",
+ " NaN | \n",
+ " M | \n",
+ " Bachelor | \n",
+ " 23405.98798 | \n",
+ " 71941.0 | \n",
+ " 73.0 | \n",
+ " Personal Auto | \n",
+ " Four-Door Car | \n",
+ " 198.234764 | \n",
+ " California | \n",
+ "
\n",
+ " \n",
+ " 7066 | \n",
+ " PK87824 | \n",
+ " NaN | \n",
+ " F | \n",
+ " College | \n",
+ " 3096.511217 | \n",
+ " 21604.0 | \n",
+ " 79.0 | \n",
+ " Corporate Auto | \n",
+ " Four-Door Car | \n",
+ " 379.200000 | \n",
+ " California | \n",
+ "
\n",
+ " \n",
+ " 7067 | \n",
+ " TD14365 | \n",
+ " NaN | \n",
+ " M | \n",
+ " Bachelor | \n",
+ " 8163.890428 | \n",
+ " 0.0 | \n",
+ " 85.0 | \n",
+ " Corporate Auto | \n",
+ " Four-Door Car | \n",
+ " 790.784983 | \n",
+ " California | \n",
+ "
\n",
+ " \n",
+ " 7068 | \n",
+ " UP19263 | \n",
+ " NaN | \n",
+ " M | \n",
+ " College | \n",
+ " 7524.442436 | \n",
+ " 21941.0 | \n",
+ " 96.0 | \n",
+ " Personal Auto | \n",
+ " Four-Door Car | \n",
+ " 691.200000 | \n",
+ " California | \n",
+ "
\n",
+ " \n",
+ " 7069 | \n",
+ " Y167826 | \n",
+ " NaN | \n",
+ " M | \n",
+ " College | \n",
+ " 2611.836866 | \n",
+ " 0.0 | \n",
+ " 77.0 | \n",
+ " Corporate Auto | \n",
+ " Two-Door Car | \n",
+ " 369.600000 | \n",
+ " California | \n",
+ "
\n",
+ " \n",
+ "
\n",
+ "
12074 rows × 11 columns
\n",
+ "
"
+ ],
+ "text/plain": [
+ " customer st gender education \\\n",
+ "0 RB50392 Washington NaN Master \n",
+ "1 QZ44356 Arizona F Bachelor \n",
+ "2 AI49188 Nevada F Bachelor \n",
+ "3 WW63253 California M Bachelor \n",
+ "4 GA49547 Washington M High School or Below \n",
+ "... ... ... ... ... \n",
+ "7065 LA72316 NaN M Bachelor \n",
+ "7066 PK87824 NaN F College \n",
+ "7067 TD14365 NaN M Bachelor \n",
+ "7068 UP19263 NaN M College \n",
+ "7069 Y167826 NaN M College \n",
+ "\n",
+ " customer_lifetime_value income monthly_premium_auto policy_type \\\n",
+ "0 NaN 0.0 1000.0 Personal Auto \n",
+ "1 697953.59% 0.0 94.0 Personal Auto \n",
+ "2 1288743.17% 48767.0 108.0 Personal Auto \n",
+ "3 764586.18% 0.0 106.0 Corporate Auto \n",
+ "4 536307.65% 36357.0 68.0 Personal Auto \n",
+ "... ... ... ... ... \n",
+ "7065 23405.98798 71941.0 73.0 Personal Auto \n",
+ "7066 3096.511217 21604.0 79.0 Corporate Auto \n",
+ "7067 8163.890428 0.0 85.0 Corporate Auto \n",
+ "7068 7524.442436 21941.0 96.0 Personal Auto \n",
+ "7069 2611.836866 0.0 77.0 Corporate Auto \n",
+ "\n",
+ " vehicle_class total_claim_amount state \n",
+ "0 Four-Door Car 2.704934 NaN \n",
+ "1 Four-Door Car 1131.464935 NaN \n",
+ "2 Two-Door Car 566.472247 NaN \n",
+ "3 SUV 529.881344 NaN \n",
+ "4 Four-Door Car 17.269323 NaN \n",
+ "... ... ... ... \n",
+ "7065 Four-Door Car 198.234764 California \n",
+ "7066 Four-Door Car 379.200000 California \n",
+ "7067 Four-Door Car 790.784983 California \n",
+ "7068 Four-Door Car 691.200000 California \n",
+ "7069 Two-Door Car 369.600000 California \n",
+ "\n",
+ "[12074 rows x 11 columns]"
+ ]
+ },
+ "execution_count": 93,
+ "metadata": {},
+ "output_type": "execute_result"
+ }
+ ],
+ "source": [
+ " # DELETE THE COLUMN EDUCATION AND THE NUMBER OF OPEN COMPLAINTS FROM THE DATAFRAME\n",
+ " \n",
+ "totaldata_data = datatotal_data.drop(['education'], axis = 1)\n",
+ "totaldata_data\n",
+ "\n",
+ "totaldata_data = datatotal_data.drop(['number_of_open_complaints'], axis = 1)\n",
+ "totaldata_data\n"
+ ]
+ },
+ {
+ "cell_type": "code",
+ "execution_count": 96,
+ "id": "854a8c46",
+ "metadata": {},
+ "outputs": [
+ {
+ "data": {
+ "text/html": [
+ "\n",
+ "\n",
+ "
\n",
+ " \n",
+ " \n",
+ " | \n",
+ " customer | \n",
+ " st | \n",
+ " gender | \n",
+ " education | \n",
+ " customer_lifetime_value | \n",
+ " income | \n",
+ " monthly_premium_auto | \n",
+ " policy_type | \n",
+ " vehicle_class | \n",
+ " total_claim_amount | \n",
+ " state | \n",
+ "
\n",
+ " \n",
+ " \n",
+ " \n",
+ " 0 | \n",
+ " RB50392 | \n",
+ " Washington | \n",
+ " NaN | \n",
+ " Master | \n",
+ " NaN | \n",
+ " 0.0 | \n",
+ " 1000.0 | \n",
+ " Personal Auto | \n",
+ " Four-Door Car | \n",
+ " 2.704934 | \n",
+ " NaN | \n",
+ "
\n",
+ " \n",
+ " 1 | \n",
+ " QZ44356 | \n",
+ " Arizona | \n",
+ " F | \n",
+ " Bachelor | \n",
+ " 697953.59% | \n",
+ " 0.0 | \n",
+ " 94.0 | \n",
+ " Personal Auto | \n",
+ " Four-Door Car | \n",
+ " 1131.464935 | \n",
+ " NaN | \n",
+ "
\n",
+ " \n",
+ " 2 | \n",
+ " AI49188 | \n",
+ " Nevada | \n",
+ " F | \n",
+ " Bachelor | \n",
+ " 1288743.17% | \n",
+ " 48767.0 | \n",
+ " 108.0 | \n",
+ " Personal Auto | \n",
+ " Two-Door Car | \n",
+ " 566.472247 | \n",
+ " NaN | \n",
+ "
\n",
+ " \n",
+ " 3 | \n",
+ " WW63253 | \n",
+ " California | \n",
+ " M | \n",
+ " Bachelor | \n",
+ " 764586.18% | \n",
+ " 0.0 | \n",
+ " 106.0 | \n",
+ " Corporate Auto | \n",
+ " SUV | \n",
+ " 529.881344 | \n",
+ " NaN | \n",
+ "
\n",
+ " \n",
+ " 4 | \n",
+ " GA49547 | \n",
+ " Washington | \n",
+ " M | \n",
+ " High School or Below | \n",
+ " 536307.65% | \n",
+ " 36357.0 | \n",
+ " 68.0 | \n",
+ " Personal Auto | \n",
+ " Four-Door Car | \n",
+ " 17.269323 | \n",
+ " NaN | \n",
+ "
\n",
+ " \n",
+ " ... | \n",
+ " ... | \n",
+ " ... | \n",
+ " ... | \n",
+ " ... | \n",
+ " ... | \n",
+ " ... | \n",
+ " ... | \n",
+ " ... | \n",
+ " ... | \n",
+ " ... | \n",
+ " ... | \n",
+ "
\n",
+ " \n",
+ " 7065 | \n",
+ " LA72316 | \n",
+ " NaN | \n",
+ " M | \n",
+ " Bachelor | \n",
+ " 23405.98798 | \n",
+ " 71941.0 | \n",
+ " 73.0 | \n",
+ " Personal Auto | \n",
+ " Four-Door Car | \n",
+ " 198.234764 | \n",
+ " California | \n",
+ "
\n",
+ " \n",
+ " 7066 | \n",
+ " PK87824 | \n",
+ " NaN | \n",
+ " F | \n",
+ " College | \n",
+ " 3096.511217 | \n",
+ " 21604.0 | \n",
+ " 79.0 | \n",
+ " Corporate Auto | \n",
+ " Four-Door Car | \n",
+ " 379.200000 | \n",
+ " California | \n",
+ "
\n",
+ " \n",
+ " 7067 | \n",
+ " TD14365 | \n",
+ " NaN | \n",
+ " M | \n",
+ " Bachelor | \n",
+ " 8163.890428 | \n",
+ " 0.0 | \n",
+ " 85.0 | \n",
+ " Corporate Auto | \n",
+ " Four-Door Car | \n",
+ " 790.784983 | \n",
+ " California | \n",
+ "
\n",
+ " \n",
+ " 7068 | \n",
+ " UP19263 | \n",
+ " NaN | \n",
+ " M | \n",
+ " College | \n",
+ " 7524.442436 | \n",
+ " 21941.0 | \n",
+ " 96.0 | \n",
+ " Personal Auto | \n",
+ " Four-Door Car | \n",
+ " 691.200000 | \n",
+ " California | \n",
+ "
\n",
+ " \n",
+ " 7069 | \n",
+ " Y167826 | \n",
+ " NaN | \n",
+ " M | \n",
+ " College | \n",
+ " 2611.836866 | \n",
+ " 0.0 | \n",
+ " 77.0 | \n",
+ " Corporate Auto | \n",
+ " Two-Door Car | \n",
+ " 369.600000 | \n",
+ " California | \n",
+ "
\n",
+ " \n",
+ "
\n",
+ "
9135 rows × 11 columns
\n",
+ "
"
+ ],
+ "text/plain": [
+ " customer st gender education \\\n",
+ "0 RB50392 Washington NaN Master \n",
+ "1 QZ44356 Arizona F Bachelor \n",
+ "2 AI49188 Nevada F Bachelor \n",
+ "3 WW63253 California M Bachelor \n",
+ "4 GA49547 Washington M High School or Below \n",
+ "... ... ... ... ... \n",
+ "7065 LA72316 NaN M Bachelor \n",
+ "7066 PK87824 NaN F College \n",
+ "7067 TD14365 NaN M Bachelor \n",
+ "7068 UP19263 NaN M College \n",
+ "7069 Y167826 NaN M College \n",
+ "\n",
+ " customer_lifetime_value income monthly_premium_auto policy_type \\\n",
+ "0 NaN 0.0 1000.0 Personal Auto \n",
+ "1 697953.59% 0.0 94.0 Personal Auto \n",
+ "2 1288743.17% 48767.0 108.0 Personal Auto \n",
+ "3 764586.18% 0.0 106.0 Corporate Auto \n",
+ "4 536307.65% 36357.0 68.0 Personal Auto \n",
+ "... ... ... ... ... \n",
+ "7065 23405.98798 71941.0 73.0 Personal Auto \n",
+ "7066 3096.511217 21604.0 79.0 Corporate Auto \n",
+ "7067 8163.890428 0.0 85.0 Corporate Auto \n",
+ "7068 7524.442436 21941.0 96.0 Personal Auto \n",
+ "7069 2611.836866 0.0 77.0 Corporate Auto \n",
+ "\n",
+ " vehicle_class total_claim_amount state \n",
+ "0 Four-Door Car 2.704934 NaN \n",
+ "1 Four-Door Car 1131.464935 NaN \n",
+ "2 Two-Door Car 566.472247 NaN \n",
+ "3 SUV 529.881344 NaN \n",
+ "4 Four-Door Car 17.269323 NaN \n",
+ "... ... ... ... \n",
+ "7065 Four-Door Car 198.234764 California \n",
+ "7066 Four-Door Car 379.200000 California \n",
+ "7067 Four-Door Car 790.784983 California \n",
+ "7068 Four-Door Car 691.200000 California \n",
+ "7069 Two-Door Car 369.600000 California \n",
+ "\n",
+ "[9135 rows x 11 columns]"
+ ]
+ },
+ "execution_count": 96,
+ "metadata": {},
+ "output_type": "execute_result"
+ }
+ ],
+ "source": [
+ "# Check for duplicate rows in the data and remove any that are found.\n",
+ "\n",
+ "# A notebook cell only renders its last expression, so the duplicate count\n",
+ "# is printed explicitly instead of being left as a bare expression.\n",
+ "print('Duplicate rows found:', totaldata_data.duplicated().sum())\n",
+ "\n",
+ "# drop_duplicates() keeps the first occurrence of each fully identical row\n",
+ "# and leaves the original index labels untouched.\n",
+ "totaldata_data = totaldata_data.drop_duplicates()\n",
+ "\n",
+ "# Display the de-duplicated frame as the cell result.\n",
+ "totaldata_data\n"
+ ]
+ },
+ {
+ "cell_type": "code",
+ "execution_count": 111,
+ "id": "90edf4ee",
+ "metadata": {},
+ "outputs": [
+ {
+ "data": {
+ "text/html": [
+ "\n",
+ "\n",
+ "
\n",
+ " \n",
+ " \n",
+ " | \n",
+ " customer | \n",
+ " st | \n",
+ " gender | \n",
+ " education | \n",
+ " customer_lifetime_value | \n",
+ " income | \n",
+ " monthly_premium_auto | \n",
+ " number_of_open_complaints | \n",
+ " policy_type | \n",
+ " vehicle_class | \n",
+ " total_claim_amount | \n",
+ " state | \n",
+ "
\n",
+ " \n",
+ " \n",
+ " \n",
+ "
\n",
+ "
"
+ ],
+ "text/plain": [
+ "Empty DataFrame\n",
+ "Columns: [customer, st, gender, education, customer_lifetime_value, income, monthly_premium_auto, number_of_open_complaints, policy_type, vehicle_class, total_claim_amount, state]\n",
+ "Index: []"
+ ]
+ },
+ "execution_count": 111,
+ "metadata": {},
+ "output_type": "execute_result"
+ }
+ ],
+ "source": [
+ "# Filter out the customers who have an income of 0 or less, i.e. keep only\n",
+ "# the rows with a strictly positive income. Rows whose income is missing are\n",
+ "# excluded as well, because the comparison NaN > 0 evaluates to False.\n",
+ "# The result is only displayed; datatotal_data itself is not reassigned.\n",
+ "datatotal_data[datatotal_data['income'] > 0]\n"
+ ]
+ }
+ ],
+ "metadata": {
+ "kernelspec": {
+ "display_name": "Python 3 (ipykernel)",
+ "language": "python",
+ "name": "python3"
+ },
+ "language_info": {
+ "codemirror_mode": {
+ "name": "ipython",
+ "version": 3
+ },
+ "file_extension": ".py",
+ "mimetype": "text/x-python",
+ "name": "python",
+ "nbconvert_exporter": "python",
+ "pygments_lexer": "ipython3",
+ "version": "3.11.4"
+ }
+ },
+ "nbformat": 4,
+ "nbformat_minor": 5
+}