diff --git a/notebook.ipynb b/notebook.ipynb
index a9725d0..0ebcf6a 100644
--- a/notebook.ipynb
+++ b/notebook.ipynb
@@ -60,7 +60,7 @@
},
{
"cell_type": "code",
- "execution_count": 14,
+ "execution_count": 115,
"metadata": {},
"outputs": [],
"source": [
@@ -88,241 +88,46 @@
},
{
"cell_type": "code",
- "execution_count": 15,
+ "execution_count": 116,
"metadata": {},
"outputs": [],
"source": [
"# Loading data\n",
- "data = pd.read_csv(\"dataset\\dataset.csv\", sep=\"\\t\")"
+ "data = pd.read_csv(\"dataset\\dataset.csv\", sep=\"\\t\")\n"
]
},
{
"cell_type": "code",
- "execution_count": 16,
+ "execution_count": 117,
"metadata": {},
"outputs": [
{
"data": {
- "text/html": [
- "
\n",
- "\n",
- "
\n",
- " \n",
- " \n",
- " | \n",
- " ClientID | \n",
- " BirthYear | \n",
- " AcademicLevel | \n",
- " RelationshipStatus | \n",
- " AnnualIncome | \n",
- " ChildrenAtHome | \n",
- " TeensAtHome | \n",
- " EnrollmentDate | \n",
- " LastPurchaseDays | \n",
- " WineSpending | \n",
- " ... | \n",
- " WebVisitsMonth | \n",
- " Campaign3Success | \n",
- " Campaign4Success | \n",
- " Campaign5Success | \n",
- " Campaign1Success | \n",
- " Campaign2Success | \n",
- " RecentComplaint | \n",
- " Z_CC | \n",
- " Z_R | \n",
- " LastCampaignResponse | \n",
- "
\n",
- " \n",
- " \n",
- " \n",
- " 0 | \n",
- " 5524 | \n",
- " 1957 | \n",
- " Graduation | \n",
- " Single | \n",
- " 58138.0 | \n",
- " 0 | \n",
- " 0 | \n",
- " 04-09-2012 | \n",
- " 58 | \n",
- " 635 | \n",
- " ... | \n",
- " 7 | \n",
- " 0 | \n",
- " 0 | \n",
- " 0 | \n",
- " 0 | \n",
- " 0 | \n",
- " 0 | \n",
- " 3 | \n",
- " 11 | \n",
- " 1 | \n",
- "
\n",
- " \n",
- " 1 | \n",
- " 2174 | \n",
- " 1954 | \n",
- " Graduation | \n",
- " Single | \n",
- " 46344.0 | \n",
- " 1 | \n",
- " 1 | \n",
- " 08-03-2014 | \n",
- " 38 | \n",
- " 11 | \n",
- " ... | \n",
- " 5 | \n",
- " 0 | \n",
- " 0 | \n",
- " 0 | \n",
- " 0 | \n",
- " 0 | \n",
- " 0 | \n",
- " 3 | \n",
- " 11 | \n",
- " 0 | \n",
- "
\n",
- " \n",
- " 2 | \n",
- " 4141 | \n",
- " 1965 | \n",
- " Graduation | \n",
- " Together | \n",
- " 71613.0 | \n",
- " 0 | \n",
- " 0 | \n",
- " 21-08-2013 | \n",
- " 26 | \n",
- " 426 | \n",
- " ... | \n",
- " 4 | \n",
- " 0 | \n",
- " 0 | \n",
- " 0 | \n",
- " 0 | \n",
- " 0 | \n",
- " 0 | \n",
- " 3 | \n",
- " 11 | \n",
- " 0 | \n",
- "
\n",
- " \n",
- " 3 | \n",
- " 6182 | \n",
- " 1984 | \n",
- " Graduation | \n",
- " Together | \n",
- " 26646.0 | \n",
- " 1 | \n",
- " 0 | \n",
- " 10-02-2014 | \n",
- " 26 | \n",
- " 11 | \n",
- " ... | \n",
- " 6 | \n",
- " 0 | \n",
- " 0 | \n",
- " 0 | \n",
- " 0 | \n",
- " 0 | \n",
- " 0 | \n",
- " 3 | \n",
- " 11 | \n",
- " 0 | \n",
- "
\n",
- " \n",
- " 4 | \n",
- " 5324 | \n",
- " 1981 | \n",
- " PhD | \n",
- " Married | \n",
- " 58293.0 | \n",
- " 1 | \n",
- " 0 | \n",
- " 19-01-2014 | \n",
- " 94 | \n",
- " 173 | \n",
- " ... | \n",
- " 5 | \n",
- " 0 | \n",
- " 0 | \n",
- " 0 | \n",
- " 0 | \n",
- " 0 | \n",
- " 0 | \n",
- " 3 | \n",
- " 11 | \n",
- " 0 | \n",
- "
\n",
- " \n",
- "
\n",
- "
5 rows × 29 columns
\n",
- "
"
- ],
"text/plain": [
- " ClientID BirthYear AcademicLevel RelationshipStatus AnnualIncome \\\n",
- "0 5524 1957 Graduation Single 58138.0 \n",
- "1 2174 1954 Graduation Single 46344.0 \n",
- "2 4141 1965 Graduation Together 71613.0 \n",
- "3 6182 1984 Graduation Together 26646.0 \n",
- "4 5324 1981 PhD Married 58293.0 \n",
- "\n",
- " ChildrenAtHome TeensAtHome EnrollmentDate LastPurchaseDays WineSpending \\\n",
- "0 0 0 04-09-2012 58 635 \n",
- "1 1 1 08-03-2014 38 11 \n",
- "2 0 0 21-08-2013 26 426 \n",
- "3 1 0 10-02-2014 26 11 \n",
- "4 1 0 19-01-2014 94 173 \n",
- "\n",
- " ... WebVisitsMonth Campaign3Success Campaign4Success Campaign5Success \\\n",
- "0 ... 7 0 0 0 \n",
- "1 ... 5 0 0 0 \n",
- "2 ... 4 0 0 0 \n",
- "3 ... 6 0 0 0 \n",
- "4 ... 5 0 0 0 \n",
- "\n",
- " Campaign1Success Campaign2Success RecentComplaint Z_CC Z_R \\\n",
- "0 0 0 0 3 11 \n",
- "1 0 0 0 3 11 \n",
- "2 0 0 0 3 11 \n",
- "3 0 0 0 3 11 \n",
- "4 0 0 0 3 11 \n",
- "\n",
- " LastCampaignResponse \n",
- "0 1 \n",
- "1 0 \n",
- "2 0 \n",
- "3 0 \n",
- "4 0 \n",
- "\n",
- "[5 rows x 29 columns]"
+ "Index(['ClientID', 'BirthYear', 'AcademicLevel', 'RelationshipStatus',\n",
+ " 'AnnualIncome', 'ChildrenAtHome', 'TeensAtHome', 'EnrollmentDate',\n",
+ " 'LastPurchaseDays', 'WineSpending', 'FruitSpending', 'MeatSpending',\n",
+ " 'FishSpending', 'SweetSpending', 'GoldSpending', 'DiscountedPurchases',\n",
+ " 'WebPurchases', 'CatalogPurchases', 'StorePurchases', 'WebVisitsMonth',\n",
+ " 'Campaign3Success', 'Campaign4Success', 'Campaign5Success',\n",
+ " 'Campaign1Success', 'Campaign2Success', 'RecentComplaint', 'Z_CC',\n",
+ " 'Z_R', 'LastCampaignResponse'],\n",
+ " dtype='object')"
]
},
- "execution_count": 16,
+ "execution_count": 117,
"metadata": {},
"output_type": "execute_result"
}
],
"source": [
"# Looking at the column names\n",
- "data.head(5)"
+ "data.columns"
]
},
{
"cell_type": "code",
- "execution_count": 17,
+ "execution_count": 118,
"metadata": {},
"outputs": [
{
@@ -534,7 +339,7 @@
"[5 rows x 29 columns]"
]
},
- "execution_count": 17,
+ "execution_count": 118,
"metadata": {},
"output_type": "execute_result"
}
@@ -552,7 +357,7 @@
},
{
"cell_type": "code",
- "execution_count": 18,
+ "execution_count": 119,
"metadata": {},
"outputs": [
{
@@ -851,7 +656,7 @@
"[8 rows x 26 columns]"
]
},
- "execution_count": 18,
+ "execution_count": 119,
"metadata": {},
"output_type": "execute_result"
}
@@ -862,7 +667,7 @@
},
{
"cell_type": "code",
- "execution_count": 19,
+ "execution_count": 120,
"metadata": {},
"outputs": [
{
@@ -924,7 +729,7 @@
},
{
"cell_type": "code",
- "execution_count": 20,
+ "execution_count": 121,
"metadata": {},
"outputs": [],
"source": [
@@ -933,7 +738,7 @@
},
{
"cell_type": "code",
- "execution_count": 21,
+ "execution_count": 122,
"metadata": {},
"outputs": [
{
@@ -971,7 +776,7 @@
"dtype: int64"
]
},
- "execution_count": 21,
+ "execution_count": 122,
"metadata": {},
"output_type": "execute_result"
}
@@ -989,7 +794,7 @@
},
{
"cell_type": "code",
- "execution_count": 22,
+ "execution_count": 123,
"metadata": {},
"outputs": [
{
@@ -1006,7 +811,7 @@
"Name: AnnualIncome, dtype: float64"
]
},
- "execution_count": 22,
+ "execution_count": 123,
"metadata": {},
"output_type": "execute_result"
}
@@ -1017,7 +822,7 @@
},
{
"cell_type": "code",
- "execution_count": 23,
+ "execution_count": 124,
"metadata": {},
"outputs": [
{
@@ -1026,7 +831,7 @@
"7500.0"
]
},
- "execution_count": 23,
+ "execution_count": 124,
"metadata": {},
"output_type": "execute_result"
}
@@ -1038,7 +843,7 @@
},
{
"cell_type": "code",
- "execution_count": 24,
+ "execution_count": 125,
"metadata": {},
"outputs": [
{
@@ -1078,7 +883,7 @@
},
{
"cell_type": "code",
- "execution_count": 25,
+ "execution_count": 126,
"metadata": {},
"outputs": [
{
@@ -1464,7 +1269,7 @@
"[2240 rows x 29 columns]"
]
},
- "execution_count": 25,
+ "execution_count": 126,
"metadata": {},
"output_type": "execute_result"
}
@@ -1476,7 +1281,7 @@
},
{
"cell_type": "code",
- "execution_count": 26,
+ "execution_count": 127,
"metadata": {},
"outputs": [],
"source": [
@@ -1485,7 +1290,7 @@
},
{
"cell_type": "code",
- "execution_count": 27,
+ "execution_count": 128,
"metadata": {},
"outputs": [
{
@@ -1537,7 +1342,7 @@
},
{
"cell_type": "code",
- "execution_count": 28,
+ "execution_count": 129,
"metadata": {},
"outputs": [
{
@@ -1551,7 +1356,7 @@
"Name: EnrollmentDate, dtype: object"
]
},
- "execution_count": 28,
+ "execution_count": 129,
"metadata": {},
"output_type": "execute_result"
}
@@ -1569,7 +1374,7 @@
},
{
"cell_type": "code",
- "execution_count": 29,
+ "execution_count": 130,
"metadata": {},
"outputs": [
{
@@ -1594,7 +1399,7 @@
},
{
"cell_type": "code",
- "execution_count": 30,
+ "execution_count": 131,
"metadata": {},
"outputs": [
{
@@ -1608,7 +1413,7 @@
"Name: EnrollmentDate, dtype: datetime64[ns]"
]
},
- "execution_count": 30,
+ "execution_count": 131,
"metadata": {},
"output_type": "execute_result"
}
@@ -1626,7 +1431,7 @@
},
{
"cell_type": "code",
- "execution_count": 31,
+ "execution_count": 132,
"metadata": {},
"outputs": [],
"source": [
@@ -1657,7 +1462,7 @@
},
{
"cell_type": "code",
- "execution_count": 32,
+ "execution_count": 133,
"metadata": {},
"outputs": [],
"source": [
@@ -1668,7 +1473,7 @@
},
{
"cell_type": "code",
- "execution_count": 33,
+ "execution_count": 134,
"metadata": {},
"outputs": [],
"source": [
@@ -1680,7 +1485,7 @@
},
{
"cell_type": "code",
- "execution_count": 34,
+ "execution_count": 135,
"metadata": {},
"outputs": [],
"source": [
@@ -1691,7 +1496,7 @@
},
{
"cell_type": "code",
- "execution_count": 35,
+ "execution_count": 136,
"metadata": {},
"outputs": [],
"source": [
@@ -1701,7 +1506,7 @@
},
{
"cell_type": "code",
- "execution_count": 36,
+ "execution_count": 137,
"metadata": {},
"outputs": [],
"source": [
@@ -1712,7 +1517,7 @@
},
{
"cell_type": "code",
- "execution_count": 37,
+ "execution_count": 138,
"metadata": {},
"outputs": [],
"source": [
@@ -1722,7 +1527,7 @@
},
{
"cell_type": "code",
- "execution_count": 38,
+ "execution_count": 139,
"metadata": {},
"outputs": [],
"source": [
@@ -1732,7 +1537,7 @@
},
{
"cell_type": "code",
- "execution_count": 39,
+ "execution_count": 140,
"metadata": {},
"outputs": [],
"source": [
@@ -1745,7 +1550,7 @@
},
{
"cell_type": "code",
- "execution_count": 40,
+ "execution_count": 141,
"metadata": {},
"outputs": [],
"source": [
@@ -1755,7 +1560,7 @@
},
{
"cell_type": "code",
- "execution_count": 41,
+ "execution_count": 142,
"metadata": {},
"outputs": [],
"source": [
@@ -1765,7 +1570,7 @@
},
{
"cell_type": "code",
- "execution_count": 42,
+ "execution_count": 143,
"metadata": {},
"outputs": [],
"source": [
@@ -1775,7 +1580,7 @@
},
{
"cell_type": "code",
- "execution_count": 43,
+ "execution_count": 144,
"metadata": {},
"outputs": [],
"source": [
@@ -1791,7 +1596,7 @@
},
{
"cell_type": "code",
- "execution_count": 44,
+ "execution_count": 145,
"metadata": {},
"outputs": [
{
@@ -1996,7 +1801,7 @@
"[5 rows x 36 columns]"
]
},
- "execution_count": 44,
+ "execution_count": 145,
"metadata": {},
"output_type": "execute_result"
}
@@ -2014,13 +1819,509 @@
},
{
"cell_type": "code",
- "execution_count": 45,
+ "execution_count": 146,
"metadata": {},
"outputs": [],
"source": [
"# Plots For The Engineered Features"
]
},
+ {
+ "cell_type": "markdown",
+ "metadata": {},
+ "source": [
+ "Engineered features: ['Age', 'TotalSpent', 'Children',\n",
+ " 'CustomerSince', 'TotalPurchases', 'TotalSuccessfulCampaignsSuccess',\n",
+ " 'Is_Parent', 'AnnualIncome']"
+ ]
+ },
+ {
+ "cell_type": "code",
+ "execution_count": 147,
+ "metadata": {
+ "scrolled": false
+ },
+ "outputs": [
+ {
+ "data": {
+ "image/png": "",
+ "text/plain": [
+ "