{
"cells": [
{
"cell_type": "code",
"execution_count": 1,
"id": "002ba07a",
"metadata": {},
"outputs": [],
"source": [
"\n",
"# Import modules\n",
"import os\n",
"import pandas as pd\n",
"import matplotlib.pyplot as plt\n",
"import seaborn as sns\n",
"import re\n",
"import numpy as np\n",
"from sklearn import tree\n",
"from sklearn.model_selection import train_test_split\n",
"\n",
"# Figures inline and set visualization style\n",
"%matplotlib inline\n",
"sns.set()\n"
]
},
{
"cell_type": "code",
"execution_count": 2,
"id": "2949d944",
"metadata": {},
"outputs": [
{
"name": "stdout",
"output_type": "stream",
"text": [
"(891, 12)\n"
]
},
{
"data": {
"text/html": [
"
\n",
"\n",
"
\n",
" \n",
" \n",
" \n",
" PassengerId \n",
" Survived \n",
" Pclass \n",
" Name \n",
" Sex \n",
" Age \n",
" SibSp \n",
" Parch \n",
" Ticket \n",
" Fare \n",
" Cabin \n",
" Embarked \n",
" \n",
" \n",
" \n",
" \n",
" 0 \n",
" 1 \n",
" 0 \n",
" 3 \n",
" Braund, Mr. Owen Harris \n",
" male \n",
" 22.0 \n",
" 1 \n",
" 0 \n",
" A/5 21171 \n",
" 7.2500 \n",
" NaN \n",
" S \n",
" \n",
" \n",
" 1 \n",
" 2 \n",
" 1 \n",
" 1 \n",
" Cumings, Mrs. John Bradley (Florence Briggs Th... \n",
" female \n",
" 38.0 \n",
" 1 \n",
" 0 \n",
" PC 17599 \n",
" 71.2833 \n",
" C85 \n",
" C \n",
" \n",
" \n",
" 2 \n",
" 3 \n",
" 1 \n",
" 3 \n",
" Heikkinen, Miss. Laina \n",
" female \n",
" 26.0 \n",
" 0 \n",
" 0 \n",
" STON/O2. 3101282 \n",
" 7.9250 \n",
" NaN \n",
" S \n",
" \n",
" \n",
" 3 \n",
" 4 \n",
" 1 \n",
" 1 \n",
" Futrelle, Mrs. Jacques Heath (Lily May Peel) \n",
" female \n",
" 35.0 \n",
" 1 \n",
" 0 \n",
" 113803 \n",
" 53.1000 \n",
" C123 \n",
" S \n",
" \n",
" \n",
" 4 \n",
" 5 \n",
" 0 \n",
" 3 \n",
" Allen, Mr. William Henry \n",
" male \n",
" 35.0 \n",
" 0 \n",
" 0 \n",
" 373450 \n",
" 8.0500 \n",
" NaN \n",
" S \n",
" \n",
" \n",
"
\n",
"
"
],
"text/plain": [
" PassengerId Survived Pclass \\\n",
"0 1 0 3 \n",
"1 2 1 1 \n",
"2 3 1 3 \n",
"3 4 1 1 \n",
"4 5 0 3 \n",
"\n",
" Name Sex Age SibSp \\\n",
"0 Braund, Mr. Owen Harris male 22.0 1 \n",
"1 Cumings, Mrs. John Bradley (Florence Briggs Th... female 38.0 1 \n",
"2 Heikkinen, Miss. Laina female 26.0 0 \n",
"3 Futrelle, Mrs. Jacques Heath (Lily May Peel) female 35.0 1 \n",
"4 Allen, Mr. William Henry male 35.0 0 \n",
"\n",
" Parch Ticket Fare Cabin Embarked \n",
"0 0 A/5 21171 7.2500 NaN S \n",
"1 0 PC 17599 71.2833 C85 C \n",
"2 0 STON/O2. 3101282 7.9250 NaN S \n",
"3 0 113803 53.1000 C123 S \n",
"4 0 373450 8.0500 NaN S "
]
},
"execution_count": 2,
"metadata": {},
"output_type": "execute_result"
}
],
"source": [
"\n",
"\n",
"df_train = pd.read_csv(\"C:/Users/User/Downloads/train.csv\")\n",
"df_test = pd.read_csv(\"C:/Users/User/Downloads/test.csv\")\n",
"\n",
"\n",
"print(df_train.shape)\n",
"df_train.head()"
]
},
{
"cell_type": "code",
"execution_count": 3,
"id": "34b67c3b",
"metadata": {},
"outputs": [
{
"name": "stdout",
"output_type": "stream",
"text": [
"(418, 11)\n"
]
},
{
"data": {
"text/html": [
"\n",
"\n",
"
\n",
" \n",
" \n",
" \n",
" PassengerId \n",
" Pclass \n",
" Name \n",
" Sex \n",
" Age \n",
" SibSp \n",
" Parch \n",
" Ticket \n",
" Fare \n",
" Cabin \n",
" Embarked \n",
" \n",
" \n",
" \n",
" \n",
" 0 \n",
" 892 \n",
" 3 \n",
" Kelly, Mr. James \n",
" male \n",
" 34.5 \n",
" 0 \n",
" 0 \n",
" 330911 \n",
" 7.8292 \n",
" NaN \n",
" Q \n",
" \n",
" \n",
" 1 \n",
" 893 \n",
" 3 \n",
" Wilkes, Mrs. James (Ellen Needs) \n",
" female \n",
" 47.0 \n",
" 1 \n",
" 0 \n",
" 363272 \n",
" 7.0000 \n",
" NaN \n",
" S \n",
" \n",
" \n",
" 2 \n",
" 894 \n",
" 2 \n",
" Myles, Mr. Thomas Francis \n",
" male \n",
" 62.0 \n",
" 0 \n",
" 0 \n",
" 240276 \n",
" 9.6875 \n",
" NaN \n",
" Q \n",
" \n",
" \n",
" 3 \n",
" 895 \n",
" 3 \n",
" Wirz, Mr. Albert \n",
" male \n",
" 27.0 \n",
" 0 \n",
" 0 \n",
" 315154 \n",
" 8.6625 \n",
" NaN \n",
" S \n",
" \n",
" \n",
" 4 \n",
" 896 \n",
" 3 \n",
" Hirvonen, Mrs. Alexander (Helga E Lindqvist) \n",
" female \n",
" 22.0 \n",
" 1 \n",
" 1 \n",
" 3101298 \n",
" 12.2875 \n",
" NaN \n",
" S \n",
" \n",
" \n",
"
\n",
"
"
],
"text/plain": [
" PassengerId Pclass Name Sex \\\n",
"0 892 3 Kelly, Mr. James male \n",
"1 893 3 Wilkes, Mrs. James (Ellen Needs) female \n",
"2 894 2 Myles, Mr. Thomas Francis male \n",
"3 895 3 Wirz, Mr. Albert male \n",
"4 896 3 Hirvonen, Mrs. Alexander (Helga E Lindqvist) female \n",
"\n",
" Age SibSp Parch Ticket Fare Cabin Embarked \n",
"0 34.5 0 0 330911 7.8292 NaN Q \n",
"1 47.0 1 0 363272 7.0000 NaN S \n",
"2 62.0 0 0 240276 9.6875 NaN Q \n",
"3 27.0 0 0 315154 8.6625 NaN S \n",
"4 22.0 1 1 3101298 12.2875 NaN S "
]
},
"execution_count": 3,
"metadata": {},
"output_type": "execute_result"
}
],
"source": [
"print(df_test.shape)\n",
"df_test.head()"
]
},
{
"cell_type": "code",
"execution_count": 4,
"id": "4b1b1011",
"metadata": {},
"outputs": [
{
"data": {
"image/png": "\n",
"text/plain": [
""
]
},
"metadata": {},
"output_type": "display_data"
}
],
"source": [
"sns.countplot(x='Survived', data=df_train);"
]
},
{
"cell_type": "code",
"execution_count": 5,
"id": "d60bf413",
"metadata": {},
"outputs": [
{
"data": {
"image/png": "\n",
"text/plain": [
""
]
},
"metadata": {},
"output_type": "display_data"
}
],
"source": [
"sns.countplot(x='Sex', data=df_train);"
]
},
{
"cell_type": "code",
"execution_count": 6,
"id": "1c2bfb25",
"metadata": {},
"outputs": [
{
"data": {
"image/png": "\n",
"text/plain": [
""
]
},
"metadata": {},
"output_type": "display_data"
}
],
"source": [
"sns.catplot(x='Survived', col='Sex', kind='count', data=df_train);"
]
},
{
"cell_type": "code",
"execution_count": 7,
"id": "dbede04d",
"metadata": {},
"outputs": [
{
"data": {
"text/plain": [
"Sex\n",
"female 233\n",
"male 109\n",
"Name: Survived, dtype: int64"
]
},
"execution_count": 7,
"metadata": {},
"output_type": "execute_result"
}
],
"source": [
"df_train.groupby(['Sex']).Survived.sum()"
]
},
{
"cell_type": "code",
"execution_count": 8,
"id": "eeeb3341",
"metadata": {},
"outputs": [
{
"data": {
"text/plain": [
"342"
]
},
"execution_count": 8,
"metadata": {},
"output_type": "execute_result"
}
],
"source": [
"df_train.Survived.sum()"
]
},
{
"cell_type": "code",
"execution_count": 9,
"id": "937a3084",
"metadata": {},
"outputs": [
{
"name": "stdout",
"output_type": "stream",
"text": [
"0.7420382165605095\n",
"0.18890814558058924\n"
]
}
],
"source": [
"print(df_train[df_train.Sex == 'female'].Survived.sum()/df_train[df_train.Sex == 'female'].Survived.count())\n",
"print(df_train[df_train.Sex == 'male'].Survived.sum()/df_train[df_train.Sex == 'male'].Survived.count())"
]
},
{
"cell_type": "code",
"execution_count": 10,
"id": "864310ff",
"metadata": {},
"outputs": [
{
"data": {
"image/png": "\n",
"text/plain": [
""
]
},
"metadata": {},
"output_type": "display_data"
}
],
"source": [
"sns.catplot(x='Survived', col='Pclass', kind='count', data=df_train);"
]
},
{
"cell_type": "code",
"execution_count": 11,
"id": "4b9782b2",
"metadata": {},
"outputs": [
{
"data": {
"text/html": [
"\n",
"\n",
"
\n",
" \n",
" \n",
" \n",
" PassengerId \n",
" Pclass \n",
" Name \n",
" Sex \n",
" Age \n",
" SibSp \n",
" Parch \n",
" Ticket \n",
" Fare \n",
" Cabin \n",
" Embarked \n",
" \n",
" \n",
" \n",
" \n",
" 413 \n",
" 1305 \n",
" 3 \n",
" Spector, Mr. Woolf \n",
" male \n",
" NaN \n",
" 0 \n",
" 0 \n",
" A.5. 3236 \n",
" 8.0500 \n",
" NaN \n",
" S \n",
" \n",
" \n",
" 414 \n",
" 1306 \n",
" 1 \n",
" Oliva y Ocana, Dona. Fermina \n",
" female \n",
" 39.0 \n",
" 0 \n",
" 0 \n",
" PC 17758 \n",
" 108.9000 \n",
" C105 \n",
" C \n",
" \n",
" \n",
" 415 \n",
" 1307 \n",
" 3 \n",
" Saether, Mr. Simon Sivertsen \n",
" male \n",
" 38.5 \n",
" 0 \n",
" 0 \n",
" SOTON/O.Q. 3101262 \n",
" 7.2500 \n",
" NaN \n",
" S \n",
" \n",
" \n",
" 416 \n",
" 1308 \n",
" 3 \n",
" Ware, Mr. Frederick \n",
" male \n",
" NaN \n",
" 0 \n",
" 0 \n",
" 359309 \n",
" 8.0500 \n",
" NaN \n",
" S \n",
" \n",
" \n",
" 417 \n",
" 1309 \n",
" 3 \n",
" Peter, Master. Michael J \n",
" male \n",
" NaN \n",
" 1 \n",
" 1 \n",
" 2668 \n",
" 22.3583 \n",
" NaN \n",
" C \n",
" \n",
" \n",
"
\n",
"
"
],
"text/plain": [
" PassengerId Pclass Name Sex Age SibSp \\\n",
"413 1305 3 Spector, Mr. Woolf male NaN 0 \n",
"414 1306 1 Oliva y Ocana, Dona. Fermina female 39.0 0 \n",
"415 1307 3 Saether, Mr. Simon Sivertsen male 38.5 0 \n",
"416 1308 3 Ware, Mr. Frederick male NaN 0 \n",
"417 1309 3 Peter, Master. Michael J male NaN 1 \n",
"\n",
" Parch Ticket Fare Cabin Embarked \n",
"413 0 A.5. 3236 8.0500 NaN S \n",
"414 0 PC 17758 108.9000 C105 C \n",
"415 0 SOTON/O.Q. 3101262 7.2500 NaN S \n",
"416 0 359309 8.0500 NaN S \n",
"417 1 2668 22.3583 NaN C "
]
},
"execution_count": 11,
"metadata": {},
"output_type": "execute_result"
}
],
"source": [
"# Store target variable of training data in a safe place\n",
"survived_train = df_train.Survived\n",
"\n",
"# Concatenate training and test sets\n",
"data = pd.concat([df_train.drop(['Survived'], axis=1), df_test])\n",
"data.tail()"
]
},
{
"cell_type": "code",
"execution_count": 12,
"id": "31431041",
"metadata": {},
"outputs": [
{
"data": {
"text/html": [
"\n",
"\n",
"
\n",
" \n",
" \n",
" \n",
" PassengerId \n",
" Pclass \n",
" Name \n",
" Sex \n",
" Age \n",
" SibSp \n",
" Parch \n",
" Ticket \n",
" Fare \n",
" Cabin \n",
" Embarked \n",
" \n",
" \n",
" \n",
" \n",
" 0 \n",
" 892 \n",
" 3 \n",
" Kelly, Mr. James \n",
" male \n",
" 34.5 \n",
" 0 \n",
" 0 \n",
" 330911 \n",
" 7.8292 \n",
" NaN \n",
" Q \n",
" \n",
" \n",
" 1 \n",
" 893 \n",
" 3 \n",
" Wilkes, Mrs. James (Ellen Needs) \n",
" female \n",
" 47.0 \n",
" 1 \n",
" 0 \n",
" 363272 \n",
" 7.0000 \n",
" NaN \n",
" S \n",
" \n",
" \n",
" 2 \n",
" 894 \n",
" 2 \n",
" Myles, Mr. Thomas Francis \n",
" male \n",
" 62.0 \n",
" 0 \n",
" 0 \n",
" 240276 \n",
" 9.6875 \n",
" NaN \n",
" Q \n",
" \n",
" \n",
" 3 \n",
" 895 \n",
" 3 \n",
" Wirz, Mr. Albert \n",
" male \n",
" 27.0 \n",
" 0 \n",
" 0 \n",
" 315154 \n",
" 8.6625 \n",
" NaN \n",
" S \n",
" \n",
" \n",
" 4 \n",
" 896 \n",
" 3 \n",
" Hirvonen, Mrs. Alexander (Helga E Lindqvist) \n",
" female \n",
" 22.0 \n",
" 1 \n",
" 1 \n",
" 3101298 \n",
" 12.2875 \n",
" NaN \n",
" S \n",
" \n",
" \n",
" ... \n",
" ... \n",
" ... \n",
" ... \n",
" ... \n",
" ... \n",
" ... \n",
" ... \n",
" ... \n",
" ... \n",
" ... \n",
" ... \n",
" \n",
" \n",
" 413 \n",
" 1305 \n",
" 3 \n",
" Spector, Mr. Woolf \n",
" male \n",
" NaN \n",
" 0 \n",
" 0 \n",
" A.5. 3236 \n",
" 8.0500 \n",
" NaN \n",
" S \n",
" \n",
" \n",
" 414 \n",
" 1306 \n",
" 1 \n",
" Oliva y Ocana, Dona. Fermina \n",
" female \n",
" 39.0 \n",
" 0 \n",
" 0 \n",
" PC 17758 \n",
" 108.9000 \n",
" C105 \n",
" C \n",
" \n",
" \n",
" 415 \n",
" 1307 \n",
" 3 \n",
" Saether, Mr. Simon Sivertsen \n",
" male \n",
" 38.5 \n",
" 0 \n",
" 0 \n",
" SOTON/O.Q. 3101262 \n",
" 7.2500 \n",
" NaN \n",
" S \n",
" \n",
" \n",
" 416 \n",
" 1308 \n",
" 3 \n",
" Ware, Mr. Frederick \n",
" male \n",
" NaN \n",
" 0 \n",
" 0 \n",
" 359309 \n",
" 8.0500 \n",
" NaN \n",
" S \n",
" \n",
" \n",
" 417 \n",
" 1309 \n",
" 3 \n",
" Peter, Master. Michael J \n",
" male \n",
" NaN \n",
" 1 \n",
" 1 \n",
" 2668 \n",
" 22.3583 \n",
" NaN \n",
" C \n",
" \n",
" \n",
"
\n",
"
418 rows × 11 columns
\n",
"
"
],
"text/plain": [
" PassengerId Pclass Name \\\n",
"0 892 3 Kelly, Mr. James \n",
"1 893 3 Wilkes, Mrs. James (Ellen Needs) \n",
"2 894 2 Myles, Mr. Thomas Francis \n",
"3 895 3 Wirz, Mr. Albert \n",
"4 896 3 Hirvonen, Mrs. Alexander (Helga E Lindqvist) \n",
".. ... ... ... \n",
"413 1305 3 Spector, Mr. Woolf \n",
"414 1306 1 Oliva y Ocana, Dona. Fermina \n",
"415 1307 3 Saether, Mr. Simon Sivertsen \n",
"416 1308 3 Ware, Mr. Frederick \n",
"417 1309 3 Peter, Master. Michael J \n",
"\n",
" Sex Age SibSp Parch Ticket Fare Cabin Embarked \n",
"0 male 34.5 0 0 330911 7.8292 NaN Q \n",
"1 female 47.0 1 0 363272 7.0000 NaN S \n",
"2 male 62.0 0 0 240276 9.6875 NaN Q \n",
"3 male 27.0 0 0 315154 8.6625 NaN S \n",
"4 female 22.0 1 1 3101298 12.2875 NaN S \n",
".. ... ... ... ... ... ... ... ... \n",
"413 male NaN 0 0 A.5. 3236 8.0500 NaN S \n",
"414 female 39.0 0 0 PC 17758 108.9000 C105 C \n",
"415 male 38.5 0 0 SOTON/O.Q. 3101262 7.2500 NaN S \n",
"416 male NaN 0 0 359309 8.0500 NaN S \n",
"417 male NaN 1 1 2668 22.3583 NaN C \n",
"\n",
"[418 rows x 11 columns]"
]
},
"execution_count": 12,
"metadata": {},
"output_type": "execute_result"
}
],
"source": [
"df_test"
]
},
{
"cell_type": "code",
"execution_count": 13,
"id": "ef626cce",
"metadata": {},
"outputs": [
{
"data": {
"text/plain": [
"0 0\n",
"1 1\n",
"2 1\n",
"3 1\n",
"4 0\n",
" ..\n",
"886 0\n",
"887 1\n",
"888 0\n",
"889 1\n",
"890 0\n",
"Name: Survived, Length: 891, dtype: int64"
]
},
"execution_count": 13,
"metadata": {},
"output_type": "execute_result"
}
],
"source": [
"survived_train"
]
},
{
"cell_type": "code",
"execution_count": 14,
"id": "d871eb29",
"metadata": {},
"outputs": [
{
"name": "stdout",
"output_type": "stream",
"text": [
"\n",
"Int64Index: 1309 entries, 0 to 417\n",
"Data columns (total 11 columns):\n",
" # Column Non-Null Count Dtype \n",
"--- ------ -------------- ----- \n",
" 0 PassengerId 1309 non-null int64 \n",
" 1 Pclass 1309 non-null int64 \n",
" 2 Name 1309 non-null object \n",
" 3 Sex 1309 non-null object \n",
" 4 Age 1046 non-null float64\n",
" 5 SibSp 1309 non-null int64 \n",
" 6 Parch 1309 non-null int64 \n",
" 7 Ticket 1309 non-null object \n",
" 8 Fare 1308 non-null float64\n",
" 9 Cabin 295 non-null object \n",
" 10 Embarked 1307 non-null object \n",
"dtypes: float64(2), int64(4), object(5)\n",
"memory usage: 122.7+ KB\n"
]
}
],
"source": [
"data.info()"
]
},
{
"cell_type": "code",
"execution_count": 15,
"id": "7a39497b",
"metadata": {},
"outputs": [
{
"name": "stdout",
"output_type": "stream",
"text": [
"\n",
"Int64Index: 1309 entries, 0 to 417\n",
"Data columns (total 11 columns):\n",
" # Column Non-Null Count Dtype \n",
"--- ------ -------------- ----- \n",
" 0 PassengerId 1309 non-null int64 \n",
" 1 Pclass 1309 non-null int64 \n",
" 2 Name 1309 non-null object \n",
" 3 Sex 1309 non-null object \n",
" 4 Age 1309 non-null float64\n",
" 5 SibSp 1309 non-null int64 \n",
" 6 Parch 1309 non-null int64 \n",
" 7 Ticket 1309 non-null object \n",
" 8 Fare 1309 non-null float64\n",
" 9 Cabin 295 non-null object \n",
" 10 Embarked 1307 non-null object \n",
"dtypes: float64(2), int64(4), object(5)\n",
"memory usage: 122.7+ KB\n"
]
}
],
"source": [
"# Dealing with missing numerical variables\n",
"data['Age'] = data.Age.fillna(data.Age.median())\n",
"data['Fare'] = data.Fare.fillna(data.Fare.median())\n",
"\n",
"# Check out info of data\n",
"data.info()"
]
},
{
"cell_type": "code",
"execution_count": 16,
"id": "d6257a63",
"metadata": {},
"outputs": [
{
"data": {
"text/html": [
"\n",
"\n",
"
\n",
" \n",
" \n",
" \n",
" PassengerId \n",
" Pclass \n",
" Name \n",
" Age \n",
" SibSp \n",
" Parch \n",
" Ticket \n",
" Fare \n",
" Cabin \n",
" Embarked \n",
" Sex_male \n",
" \n",
" \n",
" \n",
" \n",
" 0 \n",
" 1 \n",
" 3 \n",
" Braund, Mr. Owen Harris \n",
" 22.0 \n",
" 1 \n",
" 0 \n",
" A/5 21171 \n",
" 7.2500 \n",
" NaN \n",
" S \n",
" 1 \n",
" \n",
" \n",
" 1 \n",
" 2 \n",
" 1 \n",
" Cumings, Mrs. John Bradley (Florence Briggs Th... \n",
" 38.0 \n",
" 1 \n",
" 0 \n",
" PC 17599 \n",
" 71.2833 \n",
" C85 \n",
" C \n",
" 0 \n",
" \n",
" \n",
" 2 \n",
" 3 \n",
" 3 \n",
" Heikkinen, Miss. Laina \n",
" 26.0 \n",
" 0 \n",
" 0 \n",
" STON/O2. 3101282 \n",
" 7.9250 \n",
" NaN \n",
" S \n",
" 0 \n",
" \n",
" \n",
" 3 \n",
" 4 \n",
" 1 \n",
" Futrelle, Mrs. Jacques Heath (Lily May Peel) \n",
" 35.0 \n",
" 1 \n",
" 0 \n",
" 113803 \n",
" 53.1000 \n",
" C123 \n",
" S \n",
" 0 \n",
" \n",
" \n",
" 4 \n",
" 5 \n",
" 3 \n",
" Allen, Mr. William Henry \n",
" 35.0 \n",
" 0 \n",
" 0 \n",
" 373450 \n",
" 8.0500 \n",
" NaN \n",
" S \n",
" 1 \n",
" \n",
" \n",
"
\n",
"
"
],
"text/plain": [
" PassengerId Pclass Name \\\n",
"0 1 3 Braund, Mr. Owen Harris \n",
"1 2 1 Cumings, Mrs. John Bradley (Florence Briggs Th... \n",
"2 3 3 Heikkinen, Miss. Laina \n",
"3 4 1 Futrelle, Mrs. Jacques Heath (Lily May Peel) \n",
"4 5 3 Allen, Mr. William Henry \n",
"\n",
" Age SibSp Parch Ticket Fare Cabin Embarked Sex_male \n",
"0 22.0 1 0 A/5 21171 7.2500 NaN S 1 \n",
"1 38.0 1 0 PC 17599 71.2833 C85 C 0 \n",
"2 26.0 0 0 STON/O2. 3101282 7.9250 NaN S 0 \n",
"3 35.0 1 0 113803 53.1000 C123 S 0 \n",
"4 35.0 0 0 373450 8.0500 NaN S 1 "
]
},
"execution_count": 16,
"metadata": {},
"output_type": "execute_result"
}
],
"source": [
"data = pd.get_dummies(data, columns=['Sex'], drop_first=True)\n",
"data.head()"
]
},
{
"cell_type": "code",
"execution_count": 17,
"id": "fd501ce5",
"metadata": {},
"outputs": [
{
"data": {
"text/html": [
"\n",
"\n",
"
\n",
" \n",
" \n",
" \n",
" Sex_male \n",
" Fare \n",
" Age \n",
" Pclass \n",
" SibSp \n",
" \n",
" \n",
" \n",
" \n",
" 0 \n",
" 1 \n",
" 7.2500 \n",
" 22.0 \n",
" 3 \n",
" 1 \n",
" \n",
" \n",
" 1 \n",
" 0 \n",
" 71.2833 \n",
" 38.0 \n",
" 1 \n",
" 1 \n",
" \n",
" \n",
" 2 \n",
" 0 \n",
" 7.9250 \n",
" 26.0 \n",
" 3 \n",
" 0 \n",
" \n",
" \n",
" 3 \n",
" 0 \n",
" 53.1000 \n",
" 35.0 \n",
" 1 \n",
" 1 \n",
" \n",
" \n",
" 4 \n",
" 1 \n",
" 8.0500 \n",
" 35.0 \n",
" 3 \n",
" 0 \n",
" \n",
" \n",
"
\n",
"
"
],
"text/plain": [
" Sex_male Fare Age Pclass SibSp\n",
"0 1 7.2500 22.0 3 1\n",
"1 0 71.2833 38.0 1 1\n",
"2 0 7.9250 26.0 3 0\n",
"3 0 53.1000 35.0 1 1\n",
"4 1 8.0500 35.0 3 0"
]
},
"execution_count": 17,
"metadata": {},
"output_type": "execute_result"
}
],
"source": [
"data = data[['Sex_male', 'Fare', 'Age','Pclass', 'SibSp']]\n",
"data.head()"
]
},
{
"cell_type": "code",
"execution_count": 18,
"id": "ac70fa2a",
"metadata": {},
"outputs": [],
"source": [
"data_train = data.iloc[:891]\n",
"data_test = data.iloc[891:]"
]
},
{
"cell_type": "code",
"execution_count": 19,
"id": "f307ca52",
"metadata": {},
"outputs": [],
"source": [
"X = data_train.values\n",
"test = data_test.values\n",
"y = survived_train.values"
]
},
{
"cell_type": "code",
"execution_count": 20,
"id": "3c4de849",
"metadata": {},
"outputs": [
{
"data": {
"text/html": [
"DecisionTreeClassifier() In a Jupyter environment, please rerun this cell to show the HTML representation or trust the notebook. On GitHub, the HTML representation is unable to render, please try loading this page with nbviewer.org. "
],
"text/plain": [
"DecisionTreeClassifier()"
]
},
"execution_count": 20,
"metadata": {},
"output_type": "execute_result"
}
],
"source": [
"clf = tree.DecisionTreeClassifier()\n",
"clf.fit(X, y)\n"
]
},
{
"cell_type": "code",
"execution_count": 35,
"id": "1e9b38a7",
"metadata": {},
"outputs": [
{
"data": {
"image/svg+xml": [
"\n",
"\n",
"\n",
"\n",
"\n",
"\n",
"Tree \n",
" \n",
"\n",
"\n",
"0 \n",
" \n",
"Sex_male ≤ 0.5 \n",
"gini = 0.473 \n",
"samples = 891 \n",
"value = [549, 342] \n",
"class = Survived \n",
" \n",
"\n",
"\n",
"1 \n",
" \n",
"Pclass ≤ 2.5 \n",
"gini = 0.383 \n",
"samples = 314 \n",
"value = [81, 233] \n",
"class = Not Survived \n",
" \n",
"\n",
"\n",
"0->1 \n",
" \n",
" \n",
"True \n",
" \n",
"\n",
"\n",
"138 \n",
" \n",
"Age ≤ 6.5 \n",
"gini = 0.306 \n",
"samples = 577 \n",
"value = [468, 109] \n",
"class = Survived \n",
" \n",
"\n",
"\n",
"0->138 \n",
" \n",
" \n",
"False \n",
" \n",
"\n",
"\n",
"2 \n",
" \n",
"Age ≤ 2.5 \n",
"gini = 0.1 \n",
"samples = 170 \n",
"value = [9, 161] \n",
"class = Not Survived \n",
" \n",
"\n",
"\n",
"1->2 \n",
" \n",
" \n",
" \n",
"\n",
"\n",
"45 \n",
" \n",
"Fare ≤ 23.35 \n",
"gini = 0.5 \n",
"samples = 144 \n",
"value = [72, 72] \n",
"class = Survived \n",
" \n",
"\n",
"\n",
"1->45 \n",
" \n",
" \n",
" \n",
"\n",
"\n",
"3 \n",
" \n",
"Pclass ≤ 1.5 \n",
"gini = 0.5 \n",
"samples = 2 \n",
"value = [1, 1] \n",
"class = Survived \n",
" \n",
"\n",
"\n",
"2->3 \n",
" \n",
" \n",
" \n",
"\n",
"\n",
"6 \n",
" \n",
"Fare ≤ 28.856 \n",
"gini = 0.091 \n",
"samples = 168 \n",
"value = [8, 160] \n",
"class = Not Survived \n",
" \n",
"\n",
"\n",
"2->6 \n",
" \n",
" \n",
" \n",
"\n",
"\n",
"4 \n",
" \n",
"gini = 0.0 \n",
"samples = 1 \n",
"value = [1, 0] \n",
"class = Survived \n",
" \n",
"\n",
"\n",
"3->4 \n",
" \n",
" \n",
" \n",
"\n",
"\n",
"5 \n",
" \n",
"gini = 0.0 \n",
"samples = 1 \n",
"value = [0, 1] \n",
"class = Not Survived \n",
" \n",
"\n",
"\n",
"3->5 \n",
" \n",
" \n",
" \n",
"\n",
"\n",
"7 \n",
" \n",
"Fare ≤ 28.231 \n",
"gini = 0.182 \n",
"samples = 69 \n",
"value = [7, 62] \n",
"class = Not Survived \n",
" \n",
"\n",
"\n",
"6->7 \n",
" \n",
" \n",
" \n",
"\n",
"\n",
"38 \n",
" \n",
"Fare ≤ 149.035 \n",
"gini = 0.02 \n",
"samples = 99 \n",
"value = [1, 98] \n",
"class = Not Survived \n",
" \n",
"\n",
"\n",
"6->38 \n",
" \n",
" \n",
" \n",
"\n",
"\n",
"8 \n",
" \n",
"Age ≤ 56.0 \n",
"gini = 0.161 \n",
"samples = 68 \n",
"value = [6, 62] \n",
"class = Not Survived \n",
" \n",
"\n",
"\n",
"7->8 \n",
" \n",
" \n",
" \n",
"\n",
"\n",
"37 \n",
" \n",
"gini = 0.0 \n",
"samples = 1 \n",
"value = [1, 0] \n",
"class = Survived \n",
" \n",
"\n",
"\n",
"7->37 \n",
" \n",
" \n",
" \n",
"\n",
"\n",
"9 \n",
" \n",
"SibSp ≤ 0.5 \n",
"gini = 0.14 \n",
"samples = 66 \n",
"value = [5, 61] \n",
"class = Not Survived \n",
" \n",
"\n",
"\n",
"8->9 \n",
" \n",
" \n",
" \n",
"\n",
"\n",
"34 \n",
" \n",
"Pclass ≤ 1.5 \n",
"gini = 0.5 \n",
"samples = 2 \n",
"value = [1, 1] \n",
"class = Survived \n",
" \n",
"\n",
"\n",
"8->34 \n",
" \n",
" \n",
" \n",
"\n",
"\n",
"10 \n",
" \n",
"Fare ≤ 13.25 \n",
"gini = 0.085 \n",
"samples = 45 \n",
"value = [2, 43] \n",
"class = Not Survived \n",
" \n",
"\n",
"\n",
"9->10 \n",
" \n",
" \n",
" \n",
"\n",
"\n",
"23 \n",
" \n",
"Age ≤ 25.0 \n",
"gini = 0.245 \n",
"samples = 21 \n",
"value = [3, 18] \n",
"class = Not Survived \n",
" \n",
"\n",
"\n",
"9->23 \n",
" \n",
" \n",
" \n",
"\n",
"\n",
"11 \n",
" \n",
"Fare ≤ 12.825 \n",
"gini = 0.147 \n",
"samples = 25 \n",
"value = [2, 23] \n",
"class = Not Survived \n",
" \n",
"\n",
"\n",
"10->11 \n",
" \n",
" \n",
" \n",
"\n",
"\n",
"22 \n",
" \n",
"gini = 0.0 \n",
"samples = 20 \n",
"value = [0, 20] \n",
"class = Not Survived \n",
" \n",
"\n",
"\n",
"10->22 \n",
" \n",
" \n",
" \n",
"\n",
"\n",
"12 \n",
" \n",
"gini = 0.0 \n",
"samples = 11 \n",
"value = [0, 11] \n",
"class = Not Survived \n",
" \n",
"\n",
"\n",
"11->12 \n",
" \n",
" \n",
" \n",
"\n",
"\n",
"13 \n",
" \n",
"Age ≤ 26.0 \n",
"gini = 0.245 \n",
"samples = 14 \n",
"value = [2, 12] \n",
"class = Not Survived \n",
" \n",
"\n",
"\n",
"11->13 \n",
" \n",
" \n",
" \n",
"\n",
"\n",
"14 \n",
" \n",
"Age ≤ 21.0 \n",
"gini = 0.444 \n",
"samples = 3 \n",
"value = [1, 2] \n",
"class = Not Survived \n",
" \n",
"\n",
"\n",
"13->14 \n",
" \n",
" \n",
" \n",
"\n",
"\n",
"17 \n",
" \n",
"Age ≤ 37.0 \n",
"gini = 0.165 \n",
"samples = 11 \n",
"value = [1, 10] \n",
"class = Not Survived \n",
" \n",
"\n",
"\n",
"13->17 \n",
" \n",
" \n",
" \n",
"\n",
"\n",
"15 \n",
" \n",
"gini = 0.0 \n",
"samples = 1 \n",
"value = [0, 1] \n",
"class = Not Survived \n",
" \n",
"\n",
"\n",
"14->15 \n",
" \n",
" \n",
" \n",
"\n",
"\n",
"16 \n",
" \n",
"gini = 0.5 \n",
"samples = 2 \n",
"value = [1, 1] \n",
"class = Survived \n",
" \n",
"\n",
"\n",
"14->16 \n",
" \n",
" \n",
" \n",
"\n",
"\n",
"18 \n",
" \n",
"gini = 0.0 \n",
"samples = 8 \n",
"value = [0, 8] \n",
"class = Not Survived \n",
" \n",
"\n",
"\n",
"17->18 \n",
" \n",
" \n",
" \n",
"\n",
"\n",
"19 \n",
" \n",
"Age ≤ 39.0 \n",
"gini = 0.444 \n",
"samples = 3 \n",
"value = [1, 2] \n",
"class = Not Survived \n",
" \n",
"\n",
"\n",
"17->19 \n",
" \n",
" \n",
" \n",
"\n",
"\n",
"20 \n",
" \n",
"gini = 0.0 \n",
"samples = 1 \n",
"value = [1, 0] \n",
"class = Survived \n",
" \n",
"\n",
"\n",
"19->20 \n",
" \n",
" \n",
" \n",
"\n",
"\n",
"21 \n",
" \n",
"gini = 0.0 \n",
"samples = 2 \n",
"value = [0, 2] \n",
"class = Not Survived \n",
" \n",
"\n",
"\n",
"19->21 \n",
" \n",
" \n",
" \n",
"\n",
"\n",
"24 \n",
" \n",
"gini = 0.0 \n",
"samples = 6 \n",
"value = [0, 6] \n",
"class = Not Survived \n",
" \n",
"\n",
"\n",
"23->24 \n",
" \n",
" \n",
" \n",
"\n",
"\n",
"25 \n",
" \n",
"Age ≤ 27.5 \n",
"gini = 0.32 \n",
"samples = 15 \n",
"value = [3, 12] \n",
"class = Not Survived \n",
" \n",
"\n",
"\n",
"23->25 \n",
" \n",
" \n",
" \n",
"\n",
"\n",
"26 \n",
" \n",
"Fare ≤ 17.429 \n",
"gini = 0.444 \n",
"samples = 3 \n",
"value = [2, 1] \n",
"class = Survived \n",
" \n",
"\n",
"\n",
"25->26 \n",
" \n",
" \n",
" \n",
"\n",
"\n",
"29 \n",
" \n",
"Age ≤ 43.0 \n",
"gini = 0.153 \n",
"samples = 12 \n",
"value = [1, 11] \n",
"class = Not Survived \n",
" \n",
"\n",
"\n",
"25->29 \n",
" \n",
" \n",
" \n",
"\n",
"\n",
"27 \n",
" \n",
"gini = 0.0 \n",
"samples = 1 \n",
"value = [0, 1] \n",
"class = Not Survived \n",
" \n",
"\n",
"\n",
"26->27 \n",
" \n",
" \n",
" \n",
"\n",
"\n",
"28 \n",
" \n",
"gini = 0.0 \n",
"samples = 2 \n",
"value = [2, 0] \n",
"class = Survived \n",
" \n",
"\n",
"\n",
"26->28 \n",
" \n",
" \n",
" \n",
"\n",
"\n",
"30 \n",
" \n",
"gini = 0.0 \n",
"samples = 9 \n",
"value = [0, 9] \n",
"class = Not Survived \n",
" \n",
"\n",
"\n",
"29->30 \n",
" \n",
" \n",
" \n",
"\n",
"\n",
"31 \n",
" \n",
"Age ≤ 44.5 \n",
"gini = 0.444 \n",
"samples = 3 \n",
"value = [1, 2] \n",
"class = Not Survived \n",
" \n",
"\n",
"\n",
"29->31 \n",
" \n",
" \n",
" \n",
"\n",
"\n",
"32 \n",
" \n",
"gini = 0.0 \n",
"samples = 1 \n",
"value = [1, 0] \n",
"class = Survived \n",
" \n",
"\n",
"\n",
"31->32 \n",
" \n",
" \n",
" \n",
"\n",
"\n",
"33 \n",
" \n",
"gini = 0.0 \n",
"samples = 2 \n",
"value = [0, 2] \n",
"class = Not Survived \n",
" \n",
"\n",
"\n",
"31->33 \n",
" \n",
" \n",
" \n",
"\n",
"\n",
"35 \n",
" \n",
"gini = 0.0 \n",
"samples = 1 \n",
"value = [0, 1] \n",
"class = Not Survived \n",
" \n",
"\n",
"\n",
"34->35 \n",
" \n",
" \n",
" \n",
"\n",
"\n",
"36 \n",
" \n",
"gini = 0.0 \n",
"samples = 1 \n",
"value = [1, 0] \n",
"class = Survived \n",
" \n",
"\n",
"\n",
"34->36 \n",
" \n",
" \n",
" \n",
"\n",
"\n",
"39 \n",
" \n",
"gini = 0.0 \n",
"samples = 81 \n",
"value = [0, 81] \n",
"class = Not Survived \n",
" \n",
"\n",
"\n",
"38->39 \n",
" \n",
" \n",
" \n",
"\n",
"\n",
"40 \n",
" \n",
"Fare ≤ 152.506 \n",
"gini = 0.105 \n",
"samples = 18 \n",
"value = [1, 17] \n",
"class = Not Survived \n",
" \n",
"\n",
"\n",
"38->40 \n",
" \n",
" \n",
" \n",
"\n",
"\n",
"41 \n",
" \n",
"Age ≤ 23.5 \n",
"gini = 0.5 \n",
"samples = 2 \n",
"value = [1, 1] \n",
"class = Survived \n",
" \n",
"\n",
"\n",
"40->41 \n",
" \n",
" \n",
" \n",
"\n",
"\n",
"44 \n",
" \n",
"gini = 0.0 \n",
"samples = 16 \n",
"value = [0, 16] \n",
"class = Not Survived \n",
" \n",
"\n",
"\n",
"40->44 \n",
" \n",
" \n",
" \n",
"\n",
"\n",
"42 \n",
" \n",
"gini = 0.0 \n",
"samples = 1 \n",
"value = [0, 1] \n",
"class = Not Survived \n",
" \n",
"\n",
"\n",
"41->42 \n",
" \n",
" \n",
" \n",
"\n",
"\n",
"43 \n",
" \n",
"gini = 0.0 \n",
"samples = 1 \n",
"value = [1, 0] \n",
"class = Survived \n",
" \n",
"\n",
"\n",
"41->43 \n",
" \n",
" \n",
" \n",
"\n",
"\n",
"46 \n",
" \n",
"Age ≤ 36.5 \n",
"gini = 0.484 \n",
"samples = 117 \n",
"value = [48, 69] \n",
"class = Not Survived \n",
" \n",
"\n",
"\n",
"45->46 \n",
" \n",
" \n",
" \n",
"\n",
"\n",
"125 \n",
" \n",
"Fare ≤ 32.881 \n",
"gini = 0.198 \n",
"samples = 27 \n",
"value = [24, 3] \n",
"class = Survived \n",
" \n",
"\n",
"\n",
"45->125 \n",
" \n",
" \n",
" \n",
"\n",
"\n",
"47 \n",
" \n",
"Fare ≤ 7.888 \n",
"gini = 0.472 \n",
"samples = 110 \n",
"value = [42, 68] \n",
"class = Not Survived \n",
" \n",
"\n",
"\n",
"46->47 \n",
" \n",
" \n",
" \n",
"\n",
"\n",
"122 \n",
" \n",
"Age ≤ 55.0 \n",
"gini = 0.245 \n",
"samples = 7 \n",
"value = [6, 1] \n",
"class = Survived \n",
" \n",
"\n",
"\n",
"46->122 \n",
" \n",
" \n",
" \n",
"\n",
"\n",
"48 \n",
" \n",
"Age ≤ 29.25 \n",
"gini = 0.393 \n",
"samples = 41 \n",
"value = [11, 30] \n",
"class = Not Survived \n",
" \n",
"\n",
"\n",
"47->48 \n",
" \n",
" \n",
" \n",
"\n",
"\n",
"77 \n",
" \n",
"Fare ≤ 10.825 \n",
"gini = 0.495 \n",
"samples = 69 \n",
"value = [31, 38] \n",
"class = Not Survived \n",
" \n",
"\n",
"\n",
"47->77 \n",
" \n",
" \n",
" \n",
"\n",
"\n",
"49 \n",
" \n",
"Fare ≤ 6.987 \n",
"gini = 0.355 \n",
"samples = 39 \n",
"value = [9, 30] \n",
"class = Not Survived \n",
" \n",
"\n",
"\n",
"48->49 \n",
" \n",
" \n",
" \n",
"\n",
"\n",
"76 \n",
" \n",
"gini = 0.0 \n",
"samples = 2 \n",
"value = [2, 0] \n",
"class = Survived \n",
" \n",
"\n",
"\n",
"48->76 \n",
" \n",
" \n",
" \n",
"\n",
"\n",
"50 \n",
" \n",
"gini = 0.0 \n",
"samples = 1 \n",
"value = [1, 0] \n",
"class = Survived \n",
" \n",
"\n",
"\n",
"49->50 \n",
" \n",
" \n",
" \n",
"\n",
"\n",
"51 \n",
" \n",
"Fare ≤ 7.523 \n",
"gini = 0.332 \n",
"samples = 38 \n",
"value = [8, 30] \n",
"class = Not Survived \n",
" \n",
"\n",
"\n",
"49->51 \n",
" \n",
" \n",
" \n",
"\n",
"\n",
"52 \n",
" \n",
"gini = 0.0 \n",
"samples = 6 \n",
"value = [0, 6] \n",
"class = Not Survived \n",
" \n",
"\n",
"\n",
"51->52 \n",
" \n",
" \n",
" \n",
"\n",
"\n",
"53 \n",
" \n",
"Age ≤ 15.0 \n",
"gini = 0.375 \n",
"samples = 32 \n",
"value = [8, 24] \n",
"class = Not Survived \n",
" \n",
"\n",
"\n",
"51->53 \n",
" \n",
" \n",
" \n",
"\n",
"\n",
"54 \n",
" \n",
"gini = 0.0 \n",
"samples = 1 \n",
"value = [1, 0] \n",
"class = Survived \n",
" \n",
"\n",
"\n",
"53->54 \n",
" \n",
" \n",
" \n",
"\n",
"\n",
"55 \n",
" \n",
"Fare ≤ 7.64 \n",
"gini = 0.35 \n",
"samples = 31 \n",
"value = [7, 24] \n",
"class = Not Survived \n",
" \n",
"\n",
"\n",
"53->55 \n",
" \n",
" \n",
" \n",
"\n",
"\n",
"56 \n",
" \n",
"Age ≤ 25.5 \n",
"gini = 0.444 \n",
"samples = 3 \n",
"value = [2, 1] \n",
"class = Survived \n",
" \n",
"\n",
"\n",
"55->56 \n",
" \n",
" \n",
" \n",
"\n",
"\n",
"59 \n",
" \n",
"Fare ≤ 7.781 \n",
"gini = 0.293 \n",
"samples = 28 \n",
"value = [5, 23] \n",
"class = Not Survived \n",
" \n",
"\n",
"\n",
"55->59 \n",
" \n",
" \n",
" \n",
"\n",
"\n",
"57 \n",
" \n",
"gini = 0.0 \n",
"samples = 1 \n",
"value = [0, 1] \n",
"class = Not Survived \n",
" \n",
"\n",
"\n",
"56->57 \n",
" \n",
" \n",
" \n",
"\n",
"\n",
"58 \n",
" \n",
"gini = 0.0 \n",
"samples = 2 \n",
"value = [2, 0] \n",
"class = Survived \n",
" \n",
"\n",
"\n",
"56->58 \n",
" \n",
" \n",
" \n",
"\n",
"\n",
"60 \n",
" \n",
"Fare ≤ 7.763 \n",
"gini = 0.375 \n",
"samples = 20 \n",
"value = [5, 15] \n",
"class = Not Survived \n",
" \n",
"\n",
"\n",
"59->60 \n",
" \n",
" \n",
" \n",
"\n",
"\n",
"75 \n",
" \n",
"gini = 0.0 \n",
"samples = 8 \n",
"value = [0, 8] \n",
"class = Not Survived \n",
" \n",
"\n",
"\n",
"59->75 \n",
" \n",
" \n",
" \n",
"\n",
"\n",
"61 \n",
" \n",
"Fare ≤ 7.744 \n",
"gini = 0.291 \n",
"samples = 17 \n",
"value = [3, 14] \n",
"class = Not Survived \n",
" \n",
"\n",
"\n",
"60->61 \n",
" \n",
" \n",
" \n",
"\n",
"\n",
"70 \n",
" \n",
"Age ≤ 20.0 \n",
"gini = 0.444 \n",
"samples = 3 \n",
"value = [2, 1] \n",
"class = Survived \n",
" \n",
"\n",
"\n",
"60->70 \n",
" \n",
" \n",
" \n",
"\n",
"\n",
"62 \n",
" \n",
"gini = 0.0 \n",
"samples = 4 \n",
"value = [0, 4] \n",
"class = Not Survived \n",
" \n",
"\n",
"\n",
"61->62 \n",
" \n",
" \n",
" \n",
"\n",
"\n",
"63 \n",
" \n",
"Age ≤ 21.5 \n",
"gini = 0.355 \n",
"samples = 13 \n",
"value = [3, 10] \n",
"class = Not Survived \n",
" \n",
"\n",
"\n",
"61->63 \n",
" \n",
" \n",
" \n",
"\n",
"\n",
"64 \n",
" \n",
"Age ≤ 18.5 \n",
"gini = 0.5 \n",
"samples = 2 \n",
"value = [1, 1] \n",
"class = Survived \n",
" \n",
"\n",
"\n",
"63->64 \n",
" \n",
" \n",
" \n",
"\n",
"\n",
"67 \n",
" \n",
"Age ≤ 25.0 \n",
"gini = 0.298 \n",
"samples = 11 \n",
"value = [2, 9] \n",
"class = Not Survived \n",
" \n",
"\n",
"\n",
"63->67 \n",
" \n",
" \n",
" \n",
"\n",
"\n",
"65 \n",
" \n",
"gini = 0.0 \n",
"samples = 1 \n",
"value = [0, 1] \n",
"class = Not Survived \n",
" \n",
"\n",
"\n",
"64->65 \n",
" \n",
" \n",
" \n",
"\n",
"\n",
"66 \n",
" \n",
"gini = 0.0 \n",
"samples = 1 \n",
"value = [1, 0] \n",
"class = Survived \n",
" \n",
"\n",
"\n",
"64->66 \n",
" \n",
" \n",
" \n",
"\n",
"\n",
"68 \n",
" \n",
"gini = 0.0 \n",
"samples = 2 \n",
"value = [0, 2] \n",
"class = Not Survived \n",
" \n",
"\n",
"\n",
"67->68 \n",
" \n",
" \n",
" \n",
"\n",
"\n",
"69 \n",
" \n",
"gini = 0.346 \n",
"samples = 9 \n",
"value = [2, 7] \n",
"class = Not Survived \n",
" \n",
"\n",
"\n",
"67->69 \n",
" \n",
" \n",
" \n",
"\n",
"\n",
"71 \n",
" \n",
"gini = 0.0 \n",
"samples = 1 \n",
"value = [1, 0] \n",
"class = Survived \n",
" \n",
"\n",
"\n",
"70->71 \n",
" \n",
" \n",
" \n",
"\n",
"\n",
"72 \n",
" \n",
"Age ≤ 23.5 \n",
"gini = 0.5 \n",
"samples = 2 \n",
"value = [1, 1] \n",
"class = Survived \n",
" \n",
"\n",
"\n",
"70->72 \n",
" \n",
" \n",
" \n",
"\n",
"\n",
"73 \n",
" \n",
"gini = 0.0 \n",
"samples = 1 \n",
"value = [0, 1] \n",
"class = Not Survived \n",
" \n",
"\n",
"\n",
"72->73 \n",
" \n",
" \n",
" \n",
"\n",
"\n",
"74 \n",
" \n",
"gini = 0.0 \n",
"samples = 1 \n",
"value = [1, 0] \n",
"class = Survived \n",
" \n",
"\n",
"\n",
"72->74 \n",
" \n",
" \n",
" \n",
"\n",
"\n",
"78 \n",
" \n",
"Age ≤ 19.0 \n",
"gini = 0.434 \n",
"samples = 22 \n",
"value = [15, 7] \n",
"class = Survived \n",
" \n",
"\n",
"\n",
"77->78 \n",
" \n",
" \n",
" \n",
"\n",
"\n",
"91 \n",
" \n",
"Fare ≤ 13.908 \n",
"gini = 0.449 \n",
"samples = 47 \n",
"value = [16, 31] \n",
"class = Not Survived \n",
" \n",
"\n",
"\n",
"77->91 \n",
" \n",
" \n",
" \n",
"\n",
"\n",
"79 \n",
" \n",
"Fare ≤ 10.152 \n",
"gini = 0.32 \n",
"samples = 5 \n",
"value = [1, 4] \n",
"class = Not Survived \n",
" \n",
"\n",
"\n",
"78->79 \n",
" \n",
" \n",
" \n",
"\n",
"\n",
"82 \n",
" \n",
"Age ≤ 30.5 \n",
"gini = 0.291 \n",
"samples = 17 \n",
"value = [14, 3] \n",
"class = Survived \n",
" \n",
"\n",
"\n",
"78->82 \n",
" \n",
" \n",
" \n",
"\n",
"\n",
"80 \n",
" \n",
"gini = 0.0 \n",
"samples = 4 \n",
"value = [0, 4] \n",
"class = Not Survived \n",
" \n",
"\n",
"\n",
"79->80 \n",
" \n",
" \n",
" \n",
"\n",
"\n",
"81 \n",
" \n",
"gini = 0.0 \n",
"samples = 1 \n",
"value = [1, 0] \n",
"class = Survived \n",
" \n",
"\n",
"\n",
"79->81 \n",
" \n",
" \n",
" \n",
"\n",
"\n",
"83 \n",
" \n",
"Fare ≤ 7.988 \n",
"gini = 0.219 \n",
"samples = 16 \n",
"value = [14, 2] \n",
"class = Survived \n",
" \n",
"\n",
"\n",
"82->83 \n",
" \n",
" \n",
" \n",
"\n",
"\n",
"90 \n",
" \n",
"gini = 0.0 \n",
"samples = 1 \n",
"value = [0, 1] \n",
"class = Not Survived \n",
" \n",
"\n",
"\n",
"82->90 \n",
" \n",
" \n",
" \n",
"\n",
"\n",
"84 \n",
" \n",
"Age ≤ 25.5 \n",
"gini = 0.48 \n",
"samples = 5 \n",
"value = [3, 2] \n",
"class = Survived \n",
" \n",
"\n",
"\n",
"83->84 \n",
" \n",
" \n",
" \n",
"\n",
"\n",
"89 \n",
" \n",
"gini = 0.0 \n",
"samples = 11 \n",
"value = [11, 0] \n",
"class = Survived \n",
" \n",
"\n",
"\n",
"83->89 \n",
" \n",
" \n",
" \n",
"\n",
"\n",
"85 \n",
" \n",
"gini = 0.0 \n",
"samples = 2 \n",
"value = [2, 0] \n",
"class = Survived \n",
" \n",
"\n",
"\n",
"84->85 \n",
" \n",
" \n",
" \n",
"\n",
"\n",
"86 \n",
" \n",
"Age ≤ 27.5 \n",
"gini = 0.444 \n",
"samples = 3 \n",
"value = [1, 2] \n",
"class = Not Survived \n",
" \n",
"\n",
"\n",
"84->86 \n",
" \n",
" \n",
" \n",
"\n",
"\n",
"87 \n",
" \n",
"gini = 0.0 \n",
"samples = 2 \n",
"value = [0, 2] \n",
"class = Not Survived \n",
" \n",
"\n",
"\n",
"86->87 \n",
" \n",
" \n",
" \n",
"\n",
"\n",
"88 \n",
" \n",
"gini = 0.0 \n",
"samples = 1 \n",
"value = [1, 0] \n",
"class = Survived \n",
" \n",
"\n",
"\n",
"86->88 \n",
" \n",
" \n",
" \n",
"\n",
"\n",
"92 \n",
" \n",
"gini = 0.0 \n",
"samples = 8 \n",
"value = [0, 8] \n",
"class = Not Survived \n",
" \n",
"\n",
"\n",
"91->92 \n",
" \n",
" \n",
" \n",
"\n",
"\n",
"93 \n",
" \n",
"Fare ≤ 15.373 \n",
"gini = 0.484 \n",
"samples = 39 \n",
"value = [16, 23] \n",
"class = Not Survived \n",
" \n",
"\n",
"\n",
"91->93 \n",
" \n",
" \n",
" \n",
"\n",
"\n",
"94 \n",
" \n",
"Age ≤ 28.5 \n",
"gini = 0.32 \n",
"samples = 10 \n",
"value = [8, 2] \n",
"class = Survived \n",
" \n",
"\n",
"\n",
"93->94 \n",
" \n",
" \n",
" \n",
"\n",
"\n",
"101 \n",
" \n",
"SibSp ≤ 2.5 \n",
"gini = 0.4 \n",
"samples = 29 \n",
"value = [8, 21] \n",
"class = Not Survived \n",
" \n",
"\n",
"\n",
"93->101 \n",
" \n",
" \n",
" \n",
"\n",
"\n",
"95 \n",
" \n",
"Age ≤ 16.0 \n",
"gini = 0.198 \n",
"samples = 9 \n",
"value = [8, 1] \n",
"class = Survived \n",
" \n",
"\n",
"\n",
"94->95 \n",
" \n",
" \n",
" \n",
"\n",
"\n",
"100 \n",
" \n",
"gini = 0.0 \n",
"samples = 1 \n",
"value = [0, 1] \n",
"class = Not Survived \n",
" \n",
"\n",
"\n",
"94->100 \n",
" \n",
" \n",
" \n",
"\n",
"\n",
"96 \n",
" \n",
"Age ≤ 14.75 \n",
"gini = 0.444 \n",
"samples = 3 \n",
"value = [2, 1] \n",
"class = Survived \n",
" \n",
"\n",
"\n",
"95->96 \n",
" \n",
" \n",
" \n",
"\n",
"\n",
"99 \n",
" \n",
"gini = 0.0 \n",
"samples = 6 \n",
"value = [6, 0] \n",
"class = Survived \n",
" \n",
"\n",
"\n",
"95->99 \n",
" \n",
" \n",
" \n",
"\n",
"\n",
"97 \n",
" \n",
"gini = 0.0 \n",
"samples = 2 \n",
"value = [2, 0] \n",
"class = Survived \n",
" \n",
"\n",
"\n",
"96->97 \n",
" \n",
" \n",
" \n",
"\n",
"\n",
"98 \n",
" \n",
"gini = 0.0 \n",
"samples = 1 \n",
"value = [0, 1] \n",
"class = Not Survived \n",
" \n",
"\n",
"\n",
"96->98 \n",
" \n",
" \n",
" \n",
"\n",
"\n",
"102 \n",
" \n",
"Age ≤ 28.5 \n",
"gini = 0.355 \n",
"samples = 26 \n",
"value = [6, 20] \n",
"class = Not Survived \n",
" \n",
"\n",
"\n",
"101->102 \n",
" \n",
" \n",
" \n",
"\n",
"\n",
"119 \n",
" \n",
"Fare ≤ 18.463 \n",
"gini = 0.444 \n",
"samples = 3 \n",
"value = [2, 1] \n",
"class = Survived \n",
" \n",
"\n",
"\n",
"101->119 \n",
" \n",
" \n",
" \n",
"\n",
"\n",
"103 \n",
" \n",
"Age ≤ 27.0 \n",
"gini = 0.255 \n",
"samples = 20 \n",
"value = [3, 17] \n",
"class = Not Survived \n",
" \n",
"\n",
"\n",
"102->103 \n",
" \n",
" \n",
" \n",
"\n",
"\n",
"112 \n",
" \n",
"Age ≤ 33.5 \n",
"gini = 0.5 \n",
"samples = 6 \n",
"value = [3, 3] \n",
"class = Survived \n",
" \n",
"\n",
"\n",
"102->112 \n",
" \n",
" \n",
" \n",
"\n",
"\n",
"104 \n",
" \n",
"Age ≤ 11.5 \n",
"gini = 0.375 \n",
"samples = 12 \n",
"value = [3, 9] \n",
"class = Not Survived \n",
" \n",
"\n",
"\n",
"103->104 \n",
" \n",
" \n",
" \n",
"\n",
"\n",
"111 \n",
" \n",
"gini = 0.0 \n",
"samples = 8 \n",
"value = [0, 8] \n",
"class = Not Survived \n",
" \n",
"\n",
"\n",
"103->111 \n",
" \n",
" \n",
" \n",
"\n",
"\n",
"105 \n",
" \n",
"gini = 0.0 \n",
"samples = 6 \n",
"value = [0, 6] \n",
"class = Not Survived \n",
" \n",
"\n",
"\n",
"104->105 \n",
" \n",
" \n",
" \n",
"\n",
"\n",
"106 \n",
" \n",
"SibSp ≤ 0.5 \n",
"gini = 0.5 \n",
"samples = 6 \n",
"value = [3, 3] \n",
"class = Survived \n",
" \n",
"\n",
"\n",
"104->106 \n",
" \n",
" \n",
" \n",
"\n",
"\n",
"107 \n",
" \n",
"gini = 0.0 \n",
"samples = 2 \n",
"value = [0, 2] \n",
"class = Not Survived \n",
" \n",
"\n",
"\n",
"106->107 \n",
" \n",
" \n",
" \n",
"\n",
"\n",
"108 \n",
" \n",
"Fare ≤ 15.975 \n",
"gini = 0.375 \n",
"samples = 4 \n",
"value = [3, 1] \n",
"class = Survived \n",
" \n",
"\n",
"\n",
"106->108 \n",
" \n",
" \n",
" \n",
"\n",
"\n",
"109 \n",
" \n",
"gini = 0.0 \n",
"samples = 1 \n",
"value = [0, 1] \n",
"class = Not Survived \n",
" \n",
"\n",
"\n",
"108->109 \n",
" \n",
" \n",
" \n",
"\n",
"\n",
"110 \n",
" \n",
"gini = 0.0 \n",
"samples = 3 \n",
"value = [3, 0] \n",
"class = Survived \n",
" \n",
"\n",
"\n",
"108->110 \n",
" \n",
" \n",
" \n",
"\n",
"\n",
"113 \n",
" \n",
"Fare ≤ 19.262 \n",
"gini = 0.375 \n",
"samples = 4 \n",
"value = [3, 1] \n",
"class = Survived \n",
" \n",
"\n",
"\n",
"112->113 \n",
" \n",
" \n",
" \n",
"\n",
"\n",
"118 \n",
" \n",
"gini = 0.0 \n",
"samples = 2 \n",
"value = [0, 2] \n",
"class = Not Survived \n",
" \n",
"\n",
"\n",
"112->118 \n",
" \n",
" \n",
" \n",
"\n",
"\n",
"114 \n",
" \n",
"gini = 0.0 \n",
"samples = 2 \n",
"value = [2, 0] \n",
"class = Survived \n",
" \n",
"\n",
"\n",
"113->114 \n",
" \n",
" \n",
" \n",
"\n",
"\n",
"115 \n",
" \n",
"SibSp ≤ 0.5 \n",
"gini = 0.5 \n",
"samples = 2 \n",
"value = [1, 1] \n",
"class = Survived \n",
" \n",
"\n",
"\n",
"113->115 \n",
" \n",
" \n",
" \n",
"\n",
"\n",
"116 \n",
" \n",
"gini = 0.0 \n",
"samples = 1 \n",
"value = [1, 0] \n",
"class = Survived \n",
" \n",
"\n",
"\n",
"115->116 \n",
" \n",
" \n",
" \n",
"\n",
"\n",
"117 \n",
" \n",
"gini = 0.0 \n",
"samples = 1 \n",
"value = [0, 1] \n",
"class = Not Survived \n",
" \n",
"\n",
"\n",
"115->117 \n",
" \n",
" \n",
" \n",
"\n",
"\n",
"120 \n",
" \n",
"gini = 0.0 \n",
"samples = 1 \n",
"value = [0, 1] \n",
"class = Not Survived \n",
" \n",
"\n",
"\n",
"119->120 \n",
" \n",
" \n",
" \n",
"\n",
"\n",
"121 \n",
" \n",
"gini = 0.0 \n",
"samples = 2 \n",
"value = [2, 0] \n",
"class = Survived \n",
" \n",
"\n",
"\n",
"119->121 \n",
" \n",
" \n",
" \n",
"\n",
"\n",
"123 \n",
" \n",
"gini = 0.0 \n",
"samples = 6 \n",
"value = [6, 0] \n",
"class = Survived \n",
" \n",
"\n",
"\n",
"122->123 \n",
" \n",
" \n",
" \n",
"\n",
"\n",
"124 \n",
" \n",
"gini = 0.0 \n",
"samples = 1 \n",
"value = [0, 1] \n",
"class = Not Survived \n",
" \n",
"\n",
"\n",
"122->124 \n",
" \n",
" \n",
" \n",
"\n",
"\n",
"126 \n",
" \n",
"Fare ≤ 31.331 \n",
"gini = 0.278 \n",
"samples = 18 \n",
"value = [15, 3] \n",
"class = Survived \n",
" \n",
"\n",
"\n",
"125->126 \n",
" \n",
" \n",
" \n",
"\n",
"\n",
"137 \n",
" \n",
"gini = 0.0 \n",
"samples = 9 \n",
"value = [9, 0] \n",
"class = Survived \n",
" \n",
"\n",
"\n",
"125->137 \n",
" \n",
" \n",
" \n",
"\n",
"\n",
"127 \n",
" \n",
"Fare ≤ 24.808 \n",
"gini = 0.117 \n",
"samples = 16 \n",
"value = [15, 1] \n",
"class = Survived \n",
" \n",
"\n",
"\n",
"126->127 \n",
" \n",
" \n",
" \n",
"\n",
"\n",
"136 \n",
" \n",
"gini = 0.0 \n",
"samples = 2 \n",
"value = [0, 2] \n",
"class = Not Survived \n",
" \n",
"\n",
"\n",
"126->136 \n",
" \n",
" \n",
" \n",
"\n",
"\n",
"128 \n",
" \n",
"SibSp ≤ 0.5 \n",
"gini = 0.375 \n",
"samples = 4 \n",
"value = [3, 1] \n",
"class = Survived \n",
" \n",
"\n",
"\n",
"127->128 \n",
" \n",
" \n",
" \n",
"\n",
"\n",
"135 \n",
" \n",
"gini = 0.0 \n",
"samples = 12 \n",
"value = [12, 0] \n",
"class = Survived \n",
" \n",
"\n",
"\n",
"127->135 \n",
" \n",
" \n",
" \n",
"\n",
"\n",
"129 \n",
" \n",
"gini = 0.0 \n",
"samples = 1 \n",
"value = [1, 0] \n",
"class = Survived \n",
" \n",
"\n",
"\n",
"128->129 \n",
" \n",
" \n",
" \n",
"\n",
"\n",
"130 \n",
" \n",
"Age ≤ 29.0 \n",
"gini = 0.444 \n",
"samples = 3 \n",
"value = [2, 1] \n",
"class = Survived \n",
" \n",
"\n",
"\n",
"128->130 \n",
" \n",
" \n",
" \n",
"\n",
"\n",
"131 \n",
" \n",
"Fare ≤ 23.8 \n",
"gini = 0.5 \n",
"samples = 2 \n",
"value = [1, 1] \n",
"class = Survived \n",
" \n",
"\n",
"\n",
"130->131 \n",
" \n",
" \n",
" \n",
"\n",
"\n",
"134 \n",
" \n",
"gini = 0.0 \n",
"samples = 1 \n",
"value = [1, 0] \n",
"class = Survived \n",
" \n",
"\n",
"\n",
"130->134 \n",
" \n",
" \n",
" \n",
"\n",
"\n",
"132 \n",
" \n",
"gini = 0.0 \n",
"samples = 1 \n",
"value = [1, 0] \n",
"class = Survived \n",
" \n",
"\n",
"\n",
"131->132 \n",
" \n",
" \n",
" \n",
"\n",
"\n",
"133 \n",
" \n",
"gini = 0.0 \n",
"samples = 1 \n",
"value = [0, 1] \n",
"class = Not Survived \n",
" \n",
"\n",
"\n",
"131->133 \n",
" \n",
" \n",
" \n",
"\n",
"\n",
"139 \n",
" \n",
"SibSp ≤ 2.5 \n",
"gini = 0.444 \n",
"samples = 24 \n",
"value = [8, 16] \n",
"class = Not Survived \n",
" \n",
"\n",
"\n",
"138->139 \n",
" \n",
" \n",
" \n",
"\n",
"\n",
"146 \n",
" \n",
"Pclass ≤ 1.5 \n",
"gini = 0.28 \n",
"samples = 553 \n",
"value = [460, 93] \n",
"class = Survived \n",
" \n",
"\n",
"\n",
"138->146 \n",
" \n",
" \n",
" \n",
"\n",
"\n",
"140 \n",
" \n",
"gini = 0.0 \n",
"samples = 15 \n",
"value = [0, 15] \n",
"class = Not Survived \n",
" \n",
"\n",
"\n",
"139->140 \n",
" \n",
" \n",
" \n",
"\n",
"\n",
"141 \n",
" \n",
"Age ≤ 2.5 \n",
"gini = 0.198 \n",
"samples = 9 \n",
"value = [8, 1] \n",
"class = Survived \n",
" \n",
"\n",
"\n",
"139->141 \n",
" \n",
" \n",
" \n",
"\n",
"\n",
"142 \n",
" \n",
"gini = 0.0 \n",
"samples = 5 \n",
"value = [5, 0] \n",
"class = Survived \n",
" \n",
"\n",
"\n",
"141->142 \n",
" \n",
" \n",
" \n",
"\n",
"\n",
"143 \n",
" \n",
"Age ≤ 3.5 \n",
"gini = 0.375 \n",
"samples = 4 \n",
"value = [3, 1] \n",
"class = Survived \n",
" \n",
"\n",
"\n",
"141->143 \n",
" \n",
" \n",
" \n",
"\n",
"\n",
"144 \n",
" \n",
"gini = 0.0 \n",
"samples = 1 \n",
"value = [0, 1] \n",
"class = Not Survived \n",
" \n",
"\n",
"\n",
"143->144 \n",
" \n",
" \n",
" \n",
"\n",
"\n",
"145 \n",
" \n",
"gini = 0.0 \n",
"samples = 3 \n",
"value = [3, 0] \n",
"class = Survived \n",
" \n",
"\n",
"\n",
"143->145 \n",
" \n",
" \n",
" \n",
"\n",
"\n",
"147 \n",
" \n",
"Fare ≤ 26.144 \n",
"gini = 0.46 \n",
"samples = 120 \n",
"value = [77, 43] \n",
"class = Survived \n",
" \n",
"\n",
"\n",
"146->147 \n",
" \n",
" \n",
" \n",
"\n",
"\n",
"226 \n",
" \n",
"Fare ≤ 51.698 \n",
"gini = 0.204 \n",
"samples = 433 \n",
"value = [383, 50] \n",
"class = Survived \n",
" \n",
"\n",
"\n",
"146->226 \n",
" \n",
" \n",
" \n",
"\n",
"\n",
"148 \n",
" \n",
"gini = 0.0 \n",
"samples = 10 \n",
"value = [10, 0] \n",
"class = Survived \n",
" \n",
"\n",
"\n",
"147->148 \n",
" \n",
" \n",
" \n",
"\n",
"\n",
"149 \n",
" \n",
"Age ≤ 53.0 \n",
"gini = 0.476 \n",
"samples = 110 \n",
"value = [67, 43] \n",
"class = Survived \n",
" \n",
"\n",
"\n",
"147->149 \n",
" \n",
" \n",
" \n",
"\n",
"\n",
"150 \n",
" \n",
"Fare ≤ 27.135 \n",
"gini = 0.495 \n",
"samples = 89 \n",
"value = [49, 40] \n",
"class = Survived \n",
" \n",
"\n",
"\n",
"149->150 \n",
" \n",
" \n",
" \n",
"\n",
"\n",
"215 \n",
" \n",
"Age ≤ 75.5 \n",
"gini = 0.245 \n",
"samples = 21 \n",
"value = [18, 3] \n",
"class = Survived \n",
" \n",
"\n",
"\n",
"149->215 \n",
" \n",
" \n",
" \n",
"\n",
"\n",
"151 \n",
" \n",
"Fare ≤ 26.469 \n",
"gini = 0.26 \n",
"samples = 13 \n",
"value = [2, 11] \n",
"class = Not Survived \n",
" \n",
"\n",
"\n",
"150->151 \n",
" \n",
" \n",
" \n",
"\n",
"\n",
"160 \n",
" \n",
"Fare ≤ 387.665 \n",
"gini = 0.472 \n",
"samples = 76 \n",
"value = [47, 29] \n",
"class = Survived \n",
" \n",
"\n",
"\n",
"150->160 \n",
" \n",
" \n",
" \n",
"\n",
"\n",
"152 \n",
" \n",
"gini = 0.0 \n",
"samples = 4 \n",
"value = [0, 4] \n",
"class = Not Survived \n",
" \n",
"\n",
"\n",
"151->152 \n",
" \n",
" \n",
" \n",
"\n",
"\n",
"153 \n",
" \n",
"Age ≤ 46.5 \n",
"gini = 0.346 \n",
"samples = 9 \n",
"value = [2, 7] \n",
"class = Not Survived \n",
" \n",
"\n",
"\n",
"151->153 \n",
" \n",
" \n",
" \n",
"\n",
"\n",
"154 \n",
" \n",
"Age ≤ 40.0 \n",
"gini = 0.408 \n",
"samples = 7 \n",
"value = [2, 5] \n",
"class = Not Survived \n",
" \n",
"\n",
"\n",
"153->154 \n",
" \n",
" \n",
" \n",
"\n",
"\n",
"159 \n",
" \n",
"gini = 0.0 \n",
"samples = 2 \n",
"value = [0, 2] \n",
"class = Not Survived \n",
" \n",
"\n",
"\n",
"153->159 \n",
" \n",
" \n",
" \n",
"\n",
"\n",
"155 \n",
" \n",
"Age ≤ 31.0 \n",
"gini = 0.32 \n",
"samples = 5 \n",
"value = [1, 4] \n",
"class = Not Survived \n",
" \n",
"\n",
"\n",
"154->155 \n",
" \n",
" \n",
" \n",
"\n",
"\n",
"158 \n",
" \n",
"gini = 0.5 \n",
"samples = 2 \n",
"value = [1, 1] \n",
"class = Survived \n",
" \n",
"\n",
"\n",
"154->158 \n",
" \n",
" \n",
" \n",
"\n",
"\n",
"156 \n",
" \n",
"gini = 0.444 \n",
"samples = 3 \n",
"value = [1, 2] \n",
"class = Not Survived \n",
" \n",
"\n",
"\n",
"155->156 \n",
" \n",
" \n",
" \n",
"\n",
"\n",
"157 \n",
" \n",
"gini = 0.0 \n",
"samples = 2 \n",
"value = [0, 2] \n",
"class = Not Survived \n",
" \n",
"\n",
"\n",
"155->157 \n",
" \n",
" \n",
" \n",
"\n",
"\n",
"161 \n",
" \n",
"Fare ≤ 134.642 \n",
"gini = 0.463 \n",
"samples = 74 \n",
"value = [47, 27] \n",
"class = Survived \n",
" \n",
"\n",
"\n",
"160->161 \n",
" \n",
" \n",
" \n",
"\n",
"\n",
"214 \n",
" \n",
"gini = 0.0 \n",
"samples = 2 \n",
"value = [0, 2] \n",
"class = Not Survived \n",
" \n",
"\n",
"\n",
"160->214 \n",
" \n",
" \n",
" \n",
"\n",
"\n",
"162 \n",
" \n",
"Age ≤ 27.5 \n",
"gini = 0.481 \n",
"samples = 67 \n",
"value = [40, 27] \n",
"class = Survived \n",
" \n",
"\n",
"\n",
"161->162 \n",
" \n",
" \n",
" \n",
"\n",
"\n",
"213 \n",
" \n",
"gini = 0.0 \n",
"samples = 7 \n",
"value = [7, 0] \n",
"class = Survived \n",
" \n",
"\n",
"\n",
"161->213 \n",
" \n",
" \n",
" \n",
"\n",
"\n",
"163 \n",
" \n",
"Age ≤ 24.5 \n",
"gini = 0.426 \n",
"samples = 13 \n",
"value = [4, 9] \n",
"class = Not Survived \n",
" \n",
"\n",
"\n",
"162->163 \n",
" \n",
" \n",
" \n",
"\n",
"\n",
"172 \n",
" \n",
"Fare ≤ 115.442 \n",
"gini = 0.444 \n",
"samples = 54 \n",
"value = [36, 18] \n",
"class = Survived \n",
" \n",
"\n",
"\n",
"162->172 \n",
" \n",
" \n",
" \n",
"\n",
"\n",
"164 \n",
" \n",
"Fare ≤ 109.892 \n",
"gini = 0.49 \n",
"samples = 7 \n",
"value = [4, 3] \n",
"class = Survived \n",
" \n",
"\n",
"\n",
"163->164 \n",
" \n",
" \n",
" \n",
"\n",
"\n",
"171 \n",
" \n",
"gini = 0.0 \n",
"samples = 6 \n",
"value = [0, 6] \n",
"class = Not Survived \n",
" \n",
"\n",
"\n",
"163->171 \n",
" \n",
" \n",
" \n",
"\n",
"\n",
"165 \n",
" \n",
"Age ≤ 22.0 \n",
"gini = 0.32 \n",
"samples = 5 \n",
"value = [4, 1] \n",
"class = Survived \n",
" \n",
"\n",
"\n",
"164->165 \n",
" \n",
" \n",
" \n",
"\n",
"\n",
"170 \n",
" \n",
"gini = 0.0 \n",
"samples = 2 \n",
"value = [0, 2] \n",
"class = Not Survived \n",
" \n",
"\n",
"\n",
"164->170 \n",
" \n",
" \n",
" \n",
"\n",
"\n",
"166 \n",
" \n",
"gini = 0.0 \n",
"samples = 3 \n",
"value = [3, 0] \n",
"class = Survived \n",
" \n",
"\n",
"\n",
"165->166 \n",
" \n",
" \n",
" \n",
"\n",
"\n",
"167 \n",
" \n",
"Fare ≤ 71.279 \n",
"gini = 0.5 \n",
"samples = 2 \n",
"value = [1, 1] \n",
"class = Survived \n",
" \n",
"\n",
"\n",
"165->167 \n",
" \n",
" \n",
" \n",
"\n",
"\n",
"168 \n",
" \n",
"gini = 0.0 \n",
"samples = 1 \n",
"value = [0, 1] \n",
"class = Not Survived \n",
" \n",
"\n",
"\n",
"167->168 \n",
" \n",
" \n",
" \n",
"\n",
"\n",
"169 \n",
" \n",
"gini = 0.0 \n",
"samples = 1 \n",
"value = [1, 0] \n",
"class = Survived \n",
" \n",
"\n",
"\n",
"167->169 \n",
" \n",
" \n",
" \n",
"\n",
"\n",
"173 \n",
" \n",
"Fare ≤ 29.1 \n",
"gini = 0.426 \n",
"samples = 52 \n",
"value = [36, 16] \n",
"class = Survived \n",
" \n",
"\n",
"\n",
"172->173 \n",
" \n",
" \n",
" \n",
"\n",
"\n",
"212 \n",
" \n",
"gini = 0.0 \n",
"samples = 2 \n",
"value = [0, 2] \n",
"class = Not Survived \n",
" \n",
"\n",
"\n",
"172->212 \n",
" \n",
" \n",
" \n",
"\n",
"\n",
"174 \n",
" \n",
"gini = 0.0 \n",
"samples = 5 \n",
"value = [5, 0] \n",
"class = Survived \n",
" \n",
"\n",
"\n",
"173->174 \n",
" \n",
" \n",
" \n",
"\n",
"\n",
"175 \n",
" \n",
"Fare ≤ 30.598 \n",
"gini = 0.449 \n",
"samples = 47 \n",
"value = [31, 16] \n",
"class = Survived \n",
" \n",
"\n",
"\n",
"173->175 \n",
" \n",
" \n",
" \n",
"\n",
"\n",
"176 \n",
" \n",
"Age ≤ 28.5 \n",
"gini = 0.408 \n",
"samples = 7 \n",
"value = [2, 5] \n",
"class = Not Survived \n",
" \n",
"\n",
"\n",
"175->176 \n",
" \n",
" \n",
" \n",
"\n",
"\n",
"181 \n",
" \n",
"SibSp ≤ 0.5 \n",
"gini = 0.399 \n",
"samples = 40 \n",
"value = [29, 11] \n",
"class = Survived \n",
" \n",
"\n",
"\n",
"175->181 \n",
" \n",
" \n",
" \n",
"\n",
"\n",
"177 \n",
" \n",
"gini = 0.0 \n",
"samples = 3 \n",
"value = [0, 3] \n",
"class = Not Survived \n",
" \n",
"\n",
"\n",
"176->177 \n",
" \n",
" \n",
" \n",
"\n",
"\n",
"178 \n",
" \n",
"Fare ≤ 30.25 \n",
"gini = 0.5 \n",
"samples = 4 \n",
"value = [2, 2] \n",
"class = Survived \n",
" \n",
"\n",
"\n",
"176->178 \n",
" \n",
" \n",
" \n",
"\n",
"\n",
"179 \n",
" \n",
"gini = 0.0 \n",
"samples = 2 \n",
"value = [2, 0] \n",
"class = Survived \n",
" \n",
"\n",
"\n",
"178->179 \n",
" \n",
" \n",
" \n",
"\n",
"\n",
"180 \n",
" \n",
"gini = 0.0 \n",
"samples = 2 \n",
"value = [0, 2] \n",
"class = Not Survived \n",
" \n",
"\n",
"\n",
"178->180 \n",
" \n",
" \n",
" \n",
"\n",
"\n",
"182 \n",
" \n",
"Fare ≤ 37.0 \n",
"gini = 0.266 \n",
"samples = 19 \n",
"value = [16, 3] \n",
"class = Survived \n",
" \n",
"\n",
"\n",
"181->182 \n",
" \n",
" \n",
" \n",
"\n",
"\n",
"193 \n",
" \n",
"Age ≤ 49.5 \n",
"gini = 0.472 \n",
"samples = 21 \n",
"value = [13, 8] \n",
"class = Survived \n",
" \n",
"\n",
"\n",
"181->193 \n",
" \n",
" \n",
" \n",
"\n",
"\n",
"183 \n",
" \n",
"Fare ≤ 35.25 \n",
"gini = 0.469 \n",
"samples = 8 \n",
"value = [5, 3] \n",
"class = Survived \n",
" \n",
"\n",
"\n",
"182->183 \n",
" \n",
" \n",
" \n",
"\n",
"\n",
"192 \n",
" \n",
"gini = 0.0 \n",
"samples = 11 \n",
"value = [11, 0] \n",
"class = Survived \n",
" \n",
"\n",
"\n",
"182->192 \n",
" \n",
" \n",
" \n",
"\n",
"\n",
"184 \n",
" \n",
"Age ≤ 34.0 \n",
"gini = 0.32 \n",
"samples = 5 \n",
"value = [4, 1] \n",
"class = Survived \n",
" \n",
"\n",
"\n",
"183->184 \n",
" \n",
" \n",
" \n",
"\n",
"\n",
"189 \n",
" \n",
"Age ≤ 36.5 \n",
"gini = 0.444 \n",
"samples = 3 \n",
"value = [1, 2] \n",
"class = Not Survived \n",
" \n",
"\n",
"\n",
"183->189 \n",
" \n",
" \n",
" \n",
"\n",
"\n",
"185 \n",
" \n",
"gini = 0.0 \n",
"samples = 3 \n",
"value = [3, 0] \n",
"class = Survived \n",
" \n",
"\n",
"\n",
"184->185 \n",
" \n",
" \n",
" \n",
"\n",
"\n",
"186 \n",
" \n",
"Age ≤ 43.5 \n",
"gini = 0.5 \n",
"samples = 2 \n",
"value = [1, 1] \n",
"class = Survived \n",
" \n",
"\n",
"\n",
"184->186 \n",
" \n",
" \n",
" \n",
"\n",
"\n",
"187 \n",
" \n",
"gini = 0.0 \n",
"samples = 1 \n",
"value = [0, 1] \n",
"class = Not Survived \n",
" \n",
"\n",
"\n",
"186->187 \n",
" \n",
" \n",
" \n",
"\n",
"\n",
"188 \n",
" \n",
"gini = 0.0 \n",
"samples = 1 \n",
"value = [1, 0] \n",
"class = Survived \n",
" \n",
"\n",
"\n",
"186->188 \n",
" \n",
" \n",
" \n",
"\n",
"\n",
"190 \n",
" \n",
"gini = 0.0 \n",
"samples = 2 \n",
"value = [0, 2] \n",
"class = Not Survived \n",
" \n",
"\n",
"\n",
"189->190 \n",
" \n",
" \n",
" \n",
"\n",
"\n",
"191 \n",
" \n",
"gini = 0.0 \n",
"samples = 1 \n",
"value = [1, 0] \n",
"class = Survived \n",
" \n",
"\n",
"\n",
"189->191 \n",
" \n",
" \n",
" \n",
"\n",
"\n",
"194 \n",
" \n",
"Age ≤ 47.0 \n",
"gini = 0.494 \n",
"samples = 18 \n",
"value = [10, 8] \n",
"class = Survived \n",
" \n",
"\n",
"\n",
"193->194 \n",
" \n",
" \n",
" \n",
"\n",
"\n",
"211 \n",
" \n",
"gini = 0.0 \n",
"samples = 3 \n",
"value = [3, 0] \n",
"class = Survived \n",
" \n",
"\n",
"\n",
"193->211 \n",
" \n",
" \n",
" \n",
"\n",
"\n",
"195 \n",
" \n",
"Fare ≤ 59.087 \n",
"gini = 0.426 \n",
"samples = 13 \n",
"value = [9, 4] \n",
"class = Survived \n",
" \n",
"\n",
"\n",
"194->195 \n",
" \n",
" \n",
" \n",
"\n",
"\n",
"208 \n",
" \n",
"Fare ≤ 99.994 \n",
"gini = 0.32 \n",
"samples = 5 \n",
"value = [1, 4] \n",
"class = Not Survived \n",
" \n",
"\n",
"\n",
"194->208 \n",
" \n",
" \n",
" \n",
"\n",
"\n",
"196 \n",
" \n",
"Fare ≤ 52.277 \n",
"gini = 0.5 \n",
"samples = 6 \n",
"value = [3, 3] \n",
"class = Survived \n",
" \n",
"\n",
"\n",
"195->196 \n",
" \n",
" \n",
" \n",
"\n",
"\n",
"203 \n",
" \n",
"Fare ≤ 86.737 \n",
"gini = 0.245 \n",
"samples = 7 \n",
"value = [6, 1] \n",
"class = Survived \n",
" \n",
"\n",
"\n",
"195->203 \n",
" \n",
" \n",
" \n",
"\n",
"\n",
"197 \n",
" \n",
"gini = 0.0 \n",
"samples = 2 \n",
"value = [2, 0] \n",
"class = Survived \n",
" \n",
"\n",
"\n",
"196->197 \n",
" \n",
" \n",
" \n",
"\n",
"\n",
"198 \n",
" \n",
"Fare ≤ 52.827 \n",
"gini = 0.375 \n",
"samples = 4 \n",
"value = [1, 3] \n",
"class = Not Survived \n",
" \n",
"\n",
"\n",
"196->198 \n",
" \n",
" \n",
" \n",
"\n",
"\n",
"199 \n",
" \n",
"gini = 0.0 \n",
"samples = 2 \n",
"value = [0, 2] \n",
"class = Not Survived \n",
" \n",
"\n",
"\n",
"198->199 \n",
" \n",
" \n",
" \n",
"\n",
"\n",
"200 \n",
" \n",
"Age ≤ 34.0 \n",
"gini = 0.5 \n",
"samples = 2 \n",
"value = [1, 1] \n",
"class = Survived \n",
" \n",
"\n",
"\n",
"198->200 \n",
" \n",
" \n",
" \n",
"\n",
"\n",
"201 \n",
" \n",
"gini = 0.0 \n",
"samples = 1 \n",
"value = [0, 1] \n",
"class = Not Survived \n",
" \n",
"\n",
"\n",
"200->201 \n",
" \n",
" \n",
" \n",
"\n",
"\n",
"202 \n",
" \n",
"gini = 0.0 \n",
"samples = 1 \n",
"value = [1, 0] \n",
"class = Survived \n",
" \n",
"\n",
"\n",
"200->202 \n",
" \n",
" \n",
" \n",
"\n",
"\n",
"204 \n",
" \n",
"gini = 0.0 \n",
"samples = 5 \n",
"value = [5, 0] \n",
"class = Survived \n",
" \n",
"\n",
"\n",
"203->204 \n",
" \n",
" \n",
" \n",
"\n",
"\n",
"205 \n",
" \n",
"Age ≤ 41.0 \n",
"gini = 0.5 \n",
"samples = 2 \n",
"value = [1, 1] \n",
"class = Survived \n",
" \n",
"\n",
"\n",
"203->205 \n",
" \n",
" \n",
" \n",
"\n",
"\n",
"206 \n",
" \n",
"gini = 0.0 \n",
"samples = 1 \n",
"value = [0, 1] \n",
"class = Not Survived \n",
" \n",
"\n",
"\n",
"205->206 \n",
" \n",
" \n",
" \n",
"\n",
"\n",
"207 \n",
" \n",
"gini = 0.0 \n",
"samples = 1 \n",
"value = [1, 0] \n",
"class = Survived \n",
" \n",
"\n",
"\n",
"205->207 \n",
" \n",
" \n",
" \n",
"\n",
"\n",
"209 \n",
" \n",
"gini = 0.0 \n",
"samples = 4 \n",
"value = [0, 4] \n",
"class = Not Survived \n",
" \n",
"\n",
"\n",
"208->209 \n",
" \n",
" \n",
" \n",
"\n",
"\n",
"210 \n",
" \n",
"gini = 0.0 \n",
"samples = 1 \n",
"value = [1, 0] \n",
"class = Survived \n",
" \n",
"\n",
"\n",
"208->210 \n",
" \n",
" \n",
" \n",
"\n",
"\n",
"216 \n",
" \n",
"Fare ≤ 35.077 \n",
"gini = 0.18 \n",
"samples = 20 \n",
"value = [18, 2] \n",
"class = Survived \n",
" \n",
"\n",
"\n",
"215->216 \n",
" \n",
" \n",
" \n",
"\n",
"\n",
"225 \n",
" \n",
"gini = 0.0 \n",
"samples = 1 \n",
"value = [0, 1] \n",
"class = Not Survived \n",
" \n",
"\n",
"\n",
"215->225 \n",
" \n",
" \n",
" \n",
"\n",
"\n",
"217 \n",
" \n",
"gini = 0.0 \n",
"samples = 11 \n",
"value = [11, 0] \n",
"class = Survived \n",
" \n",
"\n",
"\n",
"216->217 \n",
" \n",
" \n",
" \n",
"\n",
"\n",
"218 \n",
" \n",
"Fare ≤ 42.502 \n",
"gini = 0.346 \n",
"samples = 9 \n",
"value = [7, 2] \n",
"class = Survived \n",
" \n",
"\n",
"\n",
"216->218 \n",
" \n",
" \n",
" \n",
"\n",
"\n",
"219 \n",
" \n",
"gini = 0.0 \n",
"samples = 1 \n",
"value = [0, 1] \n",
"class = Not Survived \n",
" \n",
"\n",
"\n",
"218->219 \n",
" \n",
" \n",
" \n",
"\n",
"\n",
"220 \n",
" \n",
"SibSp ≤ 0.5 \n",
"gini = 0.219 \n",
"samples = 8 \n",
"value = [7, 1] \n",
"class = Survived \n",
" \n",
"\n",
"\n",
"218->220 \n",
" \n",
" \n",
" \n",
"\n",
"\n",
"221 \n",
" \n",
"gini = 0.0 \n",
"samples = 5 \n",
"value = [5, 0] \n",
"class = Survived \n",
" \n",
"\n",
"\n",
"220->221 \n",
" \n",
" \n",
" \n",
"\n",
"\n",
"222 \n",
" \n",
"Age ≤ 62.0 \n",
"gini = 0.444 \n",
"samples = 3 \n",
"value = [2, 1] \n",
"class = Survived \n",
" \n",
"\n",
"\n",
"220->222 \n",
" \n",
" \n",
" \n",
"\n",
"\n",
"223 \n",
" \n",
"gini = 0.0 \n",
"samples = 1 \n",
"value = [0, 1] \n",
"class = Not Survived \n",
" \n",
"\n",
"\n",
"222->223 \n",
" \n",
" \n",
" \n",
"\n",
"\n",
"224 \n",
" \n",
"gini = 0.0 \n",
"samples = 2 \n",
"value = [2, 0] \n",
"class = Survived \n",
" \n",
"\n",
"\n",
"222->224 \n",
" \n",
" \n",
" \n",
"\n",
"\n",
"227 \n",
" \n",
"Age ≤ 13.0 \n",
"gini = 0.193 \n",
"samples = 417 \n",
"value = [372, 45] \n",
"class = Survived \n",
" \n",
"\n",
"\n",
"226->227 \n",
" \n",
" \n",
" \n",
"\n",
"\n",
"404 \n",
" \n",
"Fare ≤ 63.023 \n",
"gini = 0.43 \n",
"samples = 16 \n",
"value = [11, 5] \n",
"class = Survived \n",
" \n",
"\n",
"\n",
"226->404 \n",
" \n",
" \n",
" \n",
"\n",
"\n",
"228 \n",
" \n",
"SibSp ≤ 2.0 \n",
"gini = 0.444 \n",
"samples = 12 \n",
"value = [8, 4] \n",
"class = Survived \n",
" \n",
"\n",
"\n",
"227->228 \n",
" \n",
" \n",
" \n",
"\n",
"\n",
"235 \n",
" \n",
"Age ≤ 32.25 \n",
"gini = 0.182 \n",
"samples = 405 \n",
"value = [364, 41] \n",
"class = Survived \n",
" \n",
"\n",
"\n",
"227->235 \n",
" \n",
" \n",
" \n",
"\n",
"\n",
"229 \n",
" \n",
"SibSp ≤ 0.5 \n",
"gini = 0.32 \n",
"samples = 5 \n",
"value = [1, 4] \n",
"class = Not Survived \n",
" \n",
"\n",
"\n",
"228->229 \n",
" \n",
" \n",
" \n",
"\n",
"\n",
"234 \n",
" \n",
"gini = 0.0 \n",
"samples = 7 \n",
"value = [7, 0] \n",
"class = Survived \n",
" \n",
"\n",
"\n",
"228->234 \n",
" \n",
" \n",
" \n",
"\n",
"\n",
"230 \n",
" \n",
"Age ≤ 10.0 \n",
"gini = 0.5 \n",
"samples = 2 \n",
"value = [1, 1] \n",
"class = Survived \n",
" \n",
"\n",
"\n",
"229->230 \n",
" \n",
" \n",
" \n",
"\n",
"\n",
"233 \n",
" \n",
"gini = 0.0 \n",
"samples = 3 \n",
"value = [0, 3] \n",
"class = Not Survived \n",
" \n",
"\n",
"\n",
"229->233 \n",
" \n",
" \n",
" \n",
"\n",
"\n",
"231 \n",
" \n",
"gini = 0.0 \n",
"samples = 1 \n",
"value = [0, 1] \n",
"class = Not Survived \n",
" \n",
"\n",
"\n",
"230->231 \n",
" \n",
" \n",
" \n",
"\n",
"\n",
"232 \n",
" \n",
"gini = 0.0 \n",
"samples = 1 \n",
"value = [1, 0] \n",
"class = Survived \n",
" \n",
"\n",
"\n",
"230->232 \n",
" \n",
" \n",
" \n",
"\n",
"\n",
"236 \n",
" \n",
"Age ≤ 30.75 \n",
"gini = 0.206 \n",
"samples = 300 \n",
"value = [265, 35] \n",
"class = Survived \n",
" \n",
"\n",
"\n",
"235->236 \n",
" \n",
" \n",
" \n",
"\n",
"\n",
"377 \n",
" \n",
"Fare ≤ 7.91 \n",
"gini = 0.108 \n",
"samples = 105 \n",
"value = [99, 6] \n",
"class = Survived \n",
" \n",
"\n",
"\n",
"235->377 \n",
" \n",
" \n",
" \n",
"\n",
"\n",
"237 \n",
" \n",
"Fare ≤ 23.35 \n",
"gini = 0.185 \n",
"samples = 282 \n",
"value = [253, 29] \n",
"class = Survived \n",
" \n",
"\n",
"\n",
"236->237 \n",
" \n",
" \n",
" \n",
"\n",
"\n",
"356 \n",
" \n",
"Fare ≤ 7.815 \n",
"gini = 0.444 \n",
"samples = 18 \n",
"value = [12, 6] \n",
"class = Survived \n",
" \n",
"\n",
"\n",
"236->356 \n",
" \n",
" \n",
" \n",
"\n",
"\n",
"238 \n",
" \n",
"Fare ≤ 22.887 \n",
"gini = 0.195 \n",
"samples = 265 \n",
"value = [236, 29] \n",
"class = Survived \n",
" \n",
"\n",
"\n",
"237->238 \n",
" \n",
" \n",
" \n",
"\n",
"\n",
"355 \n",
" \n",
"gini = 0.0 \n",
"samples = 17 \n",
"value = [17, 0] \n",
"class = Survived \n",
" \n",
"\n",
"\n",
"237->355 \n",
" \n",
" \n",
" \n",
"\n",
"\n",
"239 \n",
" \n",
"Age ≤ 28.75 \n",
"gini = 0.19 \n",
"samples = 264 \n",
"value = [236, 28] \n",
"class = Survived \n",
" \n",
"\n",
"\n",
"238->239 \n",
" \n",
" \n",
" \n",
"\n",
"\n",
"354 \n",
" \n",
"gini = 0.0 \n",
"samples = 1 \n",
"value = [0, 1] \n",
"class = Not Survived \n",
" \n",
"\n",
"\n",
"238->354 \n",
" \n",
" \n",
" \n",
"\n",
"\n",
"240 \n",
" \n",
"Fare ≤ 15.173 \n",
"gini = 0.179 \n",
"samples = 241 \n",
"value = [217, 24] \n",
"class = Survived \n",
" \n",
"\n",
"\n",
"239->240 \n",
" \n",
" \n",
" \n",
"\n",
"\n",
"339 \n",
" \n",
"Fare ≤ 10.0 \n",
"gini = 0.287 \n",
"samples = 23 \n",
"value = [19, 4] \n",
"class = Survived \n",
" \n",
"\n",
"\n",
"239->339 \n",
" \n",
" \n",
" \n",
"\n",
"\n",
"241 \n",
" \n",
"Fare ≤ 7.798 \n",
"gini = 0.165 \n",
"samples = 220 \n",
"value = [200, 20] \n",
"class = Survived \n",
" \n",
"\n",
"\n",
"240->241 \n",
" \n",
" \n",
" \n",
"\n",
"\n",
"328 \n",
" \n",
"Fare ≤ 15.373 \n",
"gini = 0.308 \n",
"samples = 21 \n",
"value = [17, 4] \n",
"class = Survived \n",
" \n",
"\n",
"\n",
"240->328 \n",
" \n",
" \n",
" \n",
"\n",
"\n",
"242 \n",
" \n",
"Fare ≤ 7.763 \n",
"gini = 0.215 \n",
"samples = 90 \n",
"value = [79, 11] \n",
"class = Survived \n",
" \n",
"\n",
"\n",
"241->242 \n",
" \n",
" \n",
" \n",
"\n",
"\n",
"289 \n",
" \n",
"Age ≤ 20.5 \n",
"gini = 0.129 \n",
"samples = 130 \n",
"value = [121, 9] \n",
"class = Survived \n",
" \n",
"\n",
"\n",
"241->289 \n",
" \n",
" \n",
" \n",
"\n",
"\n",
"243 \n",
" \n",
"Fare ≤ 7.24 \n",
"gini = 0.169 \n",
"samples = 75 \n",
"value = [68, 7] \n",
"class = Survived \n",
" \n",
"\n",
"\n",
"242->243 \n",
" \n",
" \n",
" \n",
"\n",
"\n",
"274 \n",
" \n",
"Age ≤ 20.0 \n",
"gini = 0.391 \n",
"samples = 15 \n",
"value = [11, 4] \n",
"class = Survived \n",
" \n",
"\n",
"\n",
"242->274 \n",
" \n",
" \n",
" \n",
"\n",
"\n",
"244 \n",
" \n",
"Age ≤ 27.5 \n",
"gini = 0.245 \n",
"samples = 42 \n",
"value = [36, 6] \n",
"class = Survived \n",
" \n",
"\n",
"\n",
"243->244 \n",
" \n",
" \n",
" \n",
"\n",
"\n",
"267 \n",
" \n",
"Fare ≤ 7.746 \n",
"gini = 0.059 \n",
"samples = 33 \n",
"value = [32, 1] \n",
"class = Survived \n",
" \n",
"\n",
"\n",
"243->267 \n",
" \n",
" \n",
" \n",
"\n",
"\n",
"245 \n",
" \n",
"Age ≤ 26.0 \n",
"gini = 0.363 \n",
"samples = 21 \n",
"value = [16, 5] \n",
"class = Survived \n",
" \n",
"\n",
"\n",
"244->245 \n",
" \n",
" \n",
" \n",
"\n",
"\n",
"262 \n",
" \n",
"Fare ≤ 7.227 \n",
"gini = 0.091 \n",
"samples = 21 \n",
"value = [20, 1] \n",
"class = Survived \n",
" \n",
"\n",
"\n",
"244->262 \n",
" \n",
" \n",
" \n",
"\n",
"\n",
"246 \n",
" \n",
"Age ≤ 19.5 \n",
"gini = 0.32 \n",
"samples = 20 \n",
"value = [16, 4] \n",
"class = Survived \n",
" \n",
"\n",
"\n",
"245->246 \n",
" \n",
" \n",
" \n",
"\n",
"\n",
"261 \n",
" \n",
"gini = 0.0 \n",
"samples = 1 \n",
"value = [0, 1] \n",
"class = Not Survived \n",
" \n",
"\n",
"\n",
"245->261 \n",
" \n",
" \n",
" \n",
"\n",
"\n",
"247 \n",
" \n",
"gini = 0.0 \n",
"samples = 7 \n",
"value = [7, 0] \n",
"class = Survived \n",
" \n",
"\n",
"\n",
"246->247 \n",
" \n",
" \n",
" \n",
"\n",
"\n",
"248 \n",
" \n",
"Fare ≤ 2.006 \n",
"gini = 0.426 \n",
"samples = 13 \n",
"value = [9, 4] \n",
"class = Survived \n",
" \n",
"\n",
"\n",
"246->248 \n",
" \n",
" \n",
" \n",
"\n",
"\n",
"249 \n",
" \n",
"gini = 0.0 \n",
"samples = 1 \n",
"value = [0, 1] \n",
"class = Not Survived \n",
" \n",
"\n",
"\n",
"248->249 \n",
" \n",
" \n",
" \n",
"\n",
"\n",
"250 \n",
" \n",
"Fare ≤ 7.133 \n",
"gini = 0.375 \n",
"samples = 12 \n",
"value = [9, 3] \n",
"class = Survived \n",
" \n",
"\n",
"\n",
"248->250 \n",
" \n",
" \n",
" \n",
"\n",
"\n",
"251 \n",
" \n",
"gini = 0.0 \n",
"samples = 6 \n",
"value = [6, 0] \n",
"class = Survived \n",
" \n",
"\n",
"\n",
"250->251 \n",
" \n",
" \n",
" \n",
"\n",
"\n",
"252 \n",
" \n",
"Fare ≤ 7.183 \n",
"gini = 0.5 \n",
"samples = 6 \n",
"value = [3, 3] \n",
"class = Survived \n",
" \n",
"\n",
"\n",
"250->252 \n",
" \n",
" \n",
" \n",
"\n",
"\n",
"253 \n",
" \n",
"gini = 0.0 \n",
"samples = 1 \n",
"value = [0, 1] \n",
"class = Not Survived \n",
" \n",
"\n",
"\n",
"252->253 \n",
" \n",
" \n",
" \n",
"\n",
"\n",
"254 \n",
" \n",
"Age ≤ 22.75 \n",
"gini = 0.48 \n",
"samples = 5 \n",
"value = [3, 2] \n",
"class = Survived \n",
" \n",
"\n",
"\n",
"252->254 \n",
" \n",
" \n",
" \n",
"\n",
"\n",
"255 \n",
" \n",
"Age ≤ 21.0 \n",
"gini = 0.444 \n",
"samples = 3 \n",
"value = [1, 2] \n",
"class = Not Survived \n",
" \n",
"\n",
"\n",
"254->255 \n",
" \n",
" \n",
" \n",
"\n",
"\n",
"260 \n",
" \n",
"gini = 0.0 \n",
"samples = 2 \n",
"value = [2, 0] \n",
"class = Survived \n",
" \n",
"\n",
"\n",
"254->260 \n",
" \n",
" \n",
" \n",
"\n",
"\n",
"256 \n",
" \n",
"gini = 0.0 \n",
"samples = 1 \n",
"value = [0, 1] \n",
"class = Not Survived \n",
" \n",
"\n",
"\n",
"255->256 \n",
" \n",
" \n",
" \n",
"\n",
"\n",
"257 \n",
" \n",
"Fare ≤ 7.227 \n",
"gini = 0.5 \n",
"samples = 2 \n",
"value = [1, 1] \n",
"class = Survived \n",
" \n",
"\n",
"\n",
"255->257 \n",
" \n",
" \n",
" \n",
"\n",
"\n",
"258 \n",
" \n",
"gini = 0.0 \n",
"samples = 1 \n",
"value = [0, 1] \n",
"class = Not Survived \n",
" \n",
"\n",
"\n",
"257->258 \n",
" \n",
" \n",
" \n",
"\n",
"\n",
"259 \n",
" \n",
"gini = 0.0 \n",
"samples = 1 \n",
"value = [1, 0] \n",
"class = Survived \n",
" \n",
"\n",
"\n",
"257->259 \n",
" \n",
" \n",
" \n",
"\n",
"\n",
"263 \n",
" \n",
"gini = 0.0 \n",
"samples = 14 \n",
"value = [14, 0] \n",
"class = Survived \n",
" \n",
"\n",
"\n",
"262->263 \n",
" \n",
" \n",
" \n",
"\n",
"\n",
"264 \n",
" \n",
"Age ≤ 28.25 \n",
"gini = 0.245 \n",
"samples = 7 \n",
"value = [6, 1] \n",
"class = Survived \n",
" \n",
"\n",
"\n",
"262->264 \n",
" \n",
" \n",
" \n",
"\n",
"\n",
"265 \n",
" \n",
"gini = 0.278 \n",
"samples = 6 \n",
"value = [5, 1] \n",
"class = Survived \n",
" \n",
"\n",
"\n",
"264->265 \n",
" \n",
" \n",
" \n",
"\n",
"\n",
"266 \n",
" \n",
"gini = 0.0 \n",
"samples = 1 \n",
"value = [1, 0] \n",
"class = Survived \n",
" \n",
"\n",
"\n",
"264->266 \n",
" \n",
" \n",
" \n",
"\n",
"\n",
"268 \n",
" \n",
"gini = 0.0 \n",
"samples = 21 \n",
"value = [21, 0] \n",
"class = Survived \n",
" \n",
"\n",
"\n",
"267->268 \n",
" \n",
" \n",
" \n",
"\n",
"\n",
"269 \n",
" \n",
"Age ≤ 23.0 \n",
"gini = 0.153 \n",
"samples = 12 \n",
"value = [11, 1] \n",
"class = Survived \n",
" \n",
"\n",
"\n",
"267->269 \n",
" \n",
" \n",
" \n",
"\n",
"\n",
"270 \n",
" \n",
"gini = 0.0 \n",
"samples = 1 \n",
"value = [1, 0] \n",
"class = Survived \n",
" \n",
"\n",
"\n",
"269->270 \n",
" \n",
" \n",
" \n",
"\n",
"\n",
"271 \n",
" \n",
"SibSp ≤ 0.5 \n",
"gini = 0.165 \n",
"samples = 11 \n",
"value = [10, 1] \n",
"class = Survived \n",
" \n",
"\n",
"\n",
"269->271 \n",
" \n",
" \n",
" \n",
"\n",
"\n",
"272 \n",
" \n",
"gini = 0.18 \n",
"samples = 10 \n",
"value = [9, 1] \n",
"class = Survived \n",
" \n",
"\n",
"\n",
"271->272 \n",
" \n",
" \n",
" \n",
"\n",
"\n",
"273 \n",
" \n",
"gini = 0.0 \n",
"samples = 1 \n",
"value = [1, 0] \n",
"class = Survived \n",
" \n",
"\n",
"\n",
"271->273 \n",
" \n",
" \n",
" \n",
"\n",
"\n",
"275 \n",
" \n",
"gini = 0.0 \n",
"samples = 4 \n",
"value = [4, 0] \n",
"class = Survived \n",
" \n",
"\n",
"\n",
"274->275 \n",
" \n",
" \n",
" \n",
"\n",
"\n",
"276 \n",
" \n",
"Age ≤ 26.5 \n",
"gini = 0.463 \n",
"samples = 11 \n",
"value = [7, 4] \n",
"class = Survived \n",
" \n",
"\n",
"\n",
"274->276 \n",
" \n",
" \n",
" \n",
"\n",
"\n",
"277 \n",
" \n",
"Age ≤ 21.5 \n",
"gini = 0.408 \n",
"samples = 7 \n",
"value = [5, 2] \n",
"class = Survived \n",
" \n",
"\n",
"\n",
"276->277 \n",
" \n",
" \n",
" \n",
"\n",
"\n",
"284 \n",
" \n",
"Age ≤ 27.5 \n",
"gini = 0.5 \n",
"samples = 4 \n",
"value = [2, 2] \n",
"class = Survived \n",
" \n",
"\n",
"\n",
"276->284 \n",
" \n",
" \n",
" \n",
"\n",
"\n",
"278 \n",
" \n",
"Fare ≤ 7.785 \n",
"gini = 0.5 \n",
"samples = 2 \n",
"value = [1, 1] \n",
"class = Survived \n",
" \n",
"\n",
"\n",
"277->278 \n",
" \n",
" \n",
" \n",
"\n",
"\n",
"281 \n",
" \n",
"SibSp ≤ 0.5 \n",
"gini = 0.32 \n",
"samples = 5 \n",
"value = [4, 1] \n",
"class = Survived \n",
" \n",
"\n",
"\n",
"277->281 \n",
" \n",
" \n",
" \n",
"\n",
"\n",
"279 \n",
" \n",
"gini = 0.0 \n",
"samples = 1 \n",
"value = [1, 0] \n",
"class = Survived \n",
" \n",
"\n",
"\n",
"278->279 \n",
" \n",
" \n",
" \n",
"\n",
"\n",
"280 \n",
" \n",
"gini = 0.0 \n",
"samples = 1 \n",
"value = [0, 1] \n",
"class = Not Survived \n",
" \n",
"\n",
"\n",
"278->280 \n",
" \n",
" \n",
" \n",
"\n",
"\n",
"282 \n",
" \n",
"gini = 0.0 \n",
"samples = 3 \n",
"value = [3, 0] \n",
"class = Survived \n",
" \n",
"\n",
"\n",
"281->282 \n",
" \n",
" \n",
" \n",
"\n",
"\n",
"283 \n",
" \n",
"gini = 0.5 \n",
"samples = 2 \n",
"value = [1, 1] \n",
"class = Survived \n",
" \n",
"\n",
"\n",
"281->283 \n",
" \n",
" \n",
" \n",
"\n",
"\n",
"285 \n",
" \n",
"gini = 0.0 \n",
"samples = 1 \n",
"value = [0, 1] \n",
"class = Not Survived \n",
" \n",
"\n",
"\n",
"284->285 \n",
" \n",
" \n",
" \n",
"\n",
"\n",
"286 \n",
" \n",
"Fare ≤ 7.785 \n",
"gini = 0.444 \n",
"samples = 3 \n",
"value = [2, 1] \n",
"class = Survived \n",
" \n",
"\n",
"\n",
"284->286 \n",
" \n",
" \n",
" \n",
"\n",
"\n",
"287 \n",
" \n",
"gini = 0.5 \n",
"samples = 2 \n",
"value = [1, 1] \n",
"class = Survived \n",
" \n",
"\n",
"\n",
"286->287 \n",
" \n",
" \n",
" \n",
"\n",
"\n",
"288 \n",
" \n",
"gini = 0.0 \n",
"samples = 1 \n",
"value = [1, 0] \n",
"class = Survived \n",
" \n",
"\n",
"\n",
"286->288 \n",
" \n",
" \n",
" \n",
"\n",
"\n",
"290 \n",
" \n",
"Fare ≤ 8.104 \n",
"gini = 0.251 \n",
"samples = 34 \n",
"value = [29, 5] \n",
"class = Survived \n",
" \n",
"\n",
"\n",
"289->290 \n",
" \n",
" \n",
" \n",
"\n",
"\n",
"309 \n",
" \n",
"Fare ≤ 8.081 \n",
"gini = 0.08 \n",
"samples = 96 \n",
"value = [92, 4] \n",
"class = Survived \n",
" \n",
"\n",
"\n",
"289->309 \n",
" \n",
" \n",
" \n",
"\n",
"\n",
"291 \n",
" \n",
"Fare ≤ 7.91 \n",
"gini = 0.408 \n",
"samples = 14 \n",
"value = [10, 4] \n",
"class = Survived \n",
" \n",
"\n",
"\n",
"290->291 \n",
" \n",
" \n",
" \n",
"\n",
"\n",
"302 \n",
" \n",
"Pclass ≤ 2.5 \n",
"gini = 0.095 \n",
"samples = 20 \n",
"value = [19, 1] \n",
"class = Survived \n",
" \n",
"\n",
"\n",
"290->302 \n",
" \n",
" \n",
" \n",
"\n",
"\n",
"292 \n",
" \n",
"gini = 0.0 \n",
"samples = 6 \n",
"value = [6, 0] \n",
"class = Survived \n",
" \n",
"\n",
"\n",
"291->292 \n",
" \n",
" \n",
" \n",
"\n",
"\n",
"293 \n",
" \n",
"SibSp ≤ 0.5 \n",
"gini = 0.5 \n",
"samples = 8 \n",
"value = [4, 4] \n",
"class = Survived \n",
" \n",
"\n",
"\n",
"291->293 \n",
" \n",
" \n",
" \n",
"\n",
"\n",
"294 \n",
" \n",
"Age ≤ 19.5 \n",
"gini = 0.49 \n",
"samples = 7 \n",
"value = [4, 3] \n",
"class = Survived \n",
" \n",
"\n",
"\n",
"293->294 \n",
" \n",
" \n",
" \n",
"\n",
"\n",
"301 \n",
" \n",
"gini = 0.0 \n",
"samples = 1 \n",
"value = [0, 1] \n",
"class = Not Survived \n",
" \n",
"\n",
"\n",
"293->301 \n",
" \n",
" \n",
" \n",
"\n",
"\n",
"295 \n",
" \n",
"Age ≤ 17.0 \n",
"gini = 0.48 \n",
"samples = 5 \n",
"value = [2, 3] \n",
"class = Not Survived \n",
" \n",
"\n",
"\n",
"294->295 \n",
" \n",
" \n",
" \n",
"\n",
"\n",
"300 \n",
" \n",
"gini = 0.0 \n",
"samples = 2 \n",
"value = [2, 0] \n",
"class = Survived \n",
" \n",
"\n",
"\n",
"294->300 \n",
" \n",
" \n",
" \n",
"\n",
"\n",
"296 \n",
" \n",
"gini = 0.5 \n",
"samples = 2 \n",
"value = [1, 1] \n",
"class = Survived \n",
" \n",
"\n",
"\n",
"295->296 \n",
" \n",
" \n",
" \n",
"\n",
"\n",
"297 \n",
" \n",
"Age ≤ 18.5 \n",
"gini = 0.444 \n",
"samples = 3 \n",
"value = [1, 2] \n",
"class = Not Survived \n",
" \n",
"\n",
"\n",
"295->297 \n",
" \n",
" \n",
" \n",
"\n",
"\n",
"298 \n",
" \n",
"gini = 0.0 \n",
"samples = 1 \n",
"value = [0, 1] \n",
"class = Not Survived \n",
" \n",
"\n",
"\n",
"297->298 \n",
" \n",
" \n",
" \n",
"\n",
"\n",
"299 \n",
" \n",
"gini = 0.5 \n",
"samples = 2 \n",
"value = [1, 1] \n",
"class = Survived \n",
" \n",
"\n",
"\n",
"297->299 \n",
" \n",
" \n",
" \n",
"\n",
"\n",
"303 \n",
" \n",
"Age ≤ 18.5 \n",
"gini = 0.245 \n",
"samples = 7 \n",
"value = [6, 1] \n",
"class = Survived \n",
" \n",
"\n",
"\n",
"302->303 \n",
" \n",
" \n",
" \n",
"\n",
"\n",
"308 \n",
" \n",
"gini = 0.0 \n",
"samples = 13 \n",
"value = [13, 0] \n",
"class = Survived \n",
" \n",
"\n",
"\n",
"302->308 \n",
" \n",
" \n",
" \n",
"\n",
"\n",
"304 \n",
" \n",
"gini = 0.0 \n",
"samples = 4 \n",
"value = [4, 0] \n",
"class = Survived \n",
" \n",
"\n",
"\n",
"303->304 \n",
" \n",
" \n",
" \n",
"\n",
"\n",
"305 \n",
" \n",
"Fare ≤ 11.75 \n",
"gini = 0.444 \n",
"samples = 3 \n",
"value = [2, 1] \n",
"class = Survived \n",
" \n",
"\n",
"\n",
"303->305 \n",
" \n",
" \n",
" \n",
"\n",
"\n",
"306 \n",
" \n",
"gini = 0.5 \n",
"samples = 2 \n",
"value = [1, 1] \n",
"class = Survived \n",
" \n",
"\n",
"\n",
"305->306 \n",
" \n",
" \n",
" \n",
"\n",
"\n",
"307 \n",
" \n",
"gini = 0.0 \n",
"samples = 1 \n",
"value = [1, 0] \n",
"class = Survived \n",
" \n",
"\n",
"\n",
"305->307 \n",
" \n",
" \n",
" \n",
"\n",
"\n",
"310 \n",
" \n",
"gini = 0.0 \n",
"samples = 54 \n",
"value = [54, 0] \n",
"class = Survived \n",
" \n",
"\n",
"\n",
"309->310 \n",
" \n",
" \n",
" \n",
"\n",
"\n",
"311 \n",
" \n",
"Fare ≤ 8.273 \n",
"gini = 0.172 \n",
"samples = 42 \n",
"value = [38, 4] \n",
"class = Survived \n",
" \n",
"\n",
"\n",
"309->311 \n",
" \n",
" \n",
" \n",
"\n",
"\n",
"312 \n",
" \n",
"gini = 0.0 \n",
"samples = 1 \n",
"value = [0, 1] \n",
"class = Not Survived \n",
" \n",
"\n",
"\n",
"311->312 \n",
" \n",
" \n",
" \n",
"\n",
"\n",
"313 \n",
" \n",
"Age ≤ 26.5 \n",
"gini = 0.136 \n",
"samples = 41 \n",
"value = [38, 3] \n",
"class = Survived \n",
" \n",
"\n",
"\n",
"311->313 \n",
" \n",
" \n",
" \n",
"\n",
"\n",
"314 \n",
" \n",
"gini = 0.0 \n",
"samples = 21 \n",
"value = [21, 0] \n",
"class = Survived \n",
" \n",
"\n",
"\n",
"313->314 \n",
" \n",
" \n",
" \n",
"\n",
"\n",
"315 \n",
" \n",
"Fare ≤ 14.158 \n",
"gini = 0.255 \n",
"samples = 20 \n",
"value = [17, 3] \n",
"class = Survived \n",
" \n",
"\n",
"\n",
"313->315 \n",
" \n",
" \n",
" \n",
"\n",
"\n",
"316 \n",
" \n",
"Fare ≤ 13.681 \n",
"gini = 0.337 \n",
"samples = 14 \n",
"value = [11, 3] \n",
"class = Survived \n",
" \n",
"\n",
"\n",
"315->316 \n",
" \n",
" \n",
" \n",
"\n",
"\n",
"327 \n",
" \n",
"gini = 0.0 \n",
"samples = 6 \n",
"value = [6, 0] \n",
"class = Survived \n",
" \n",
"\n",
"\n",
"315->327 \n",
" \n",
" \n",
" \n",
"\n",
"\n",
"317 \n",
" \n",
"Age ≤ 27.5 \n",
"gini = 0.26 \n",
"samples = 13 \n",
"value = [11, 2] \n",
"class = Survived \n",
" \n",
"\n",
"\n",
"316->317 \n",
" \n",
" \n",
" \n",
"\n",
"\n",
"326 \n",
" \n",
"gini = 0.0 \n",
"samples = 1 \n",
"value = [0, 1] \n",
"class = Not Survived \n",
" \n",
"\n",
"\n",
"316->326 \n",
" \n",
" \n",
" \n",
"\n",
"\n",
"318 \n",
" \n",
"Fare ≤ 10.831 \n",
"gini = 0.444 \n",
"samples = 3 \n",
"value = [2, 1] \n",
"class = Survived \n",
" \n",
"\n",
"\n",
"317->318 \n",
" \n",
" \n",
" \n",
"\n",
"\n",
"321 \n",
" \n",
"Fare ≤ 11.75 \n",
"gini = 0.18 \n",
"samples = 10 \n",
"value = [9, 1] \n",
"class = Survived \n",
" \n",
"\n",
"\n",
"317->321 \n",
" \n",
" \n",
" \n",
"\n",
"\n",
"319 \n",
" \n",
"gini = 0.0 \n",
"samples = 1 \n",
"value = [0, 1] \n",
"class = Not Survived \n",
" \n",
"\n",
"\n",
"318->319 \n",
" \n",
" \n",
" \n",
"\n",
"\n",
"320 \n",
" \n",
"gini = 0.0 \n",
"samples = 2 \n",
"value = [2, 0] \n",
"class = Survived \n",
" \n",
"\n",
"\n",
"318->320 \n",
" \n",
" \n",
" \n",
"\n",
"\n",
"322 \n",
" \n",
"gini = 0.0 \n",
"samples = 7 \n",
"value = [7, 0] \n",
"class = Survived \n",
" \n",
"\n",
"\n",
"321->322 \n",
" \n",
" \n",
" \n",
"\n",
"\n",
"323 \n",
" \n",
"Fare ≤ 13.25 \n",
"gini = 0.444 \n",
"samples = 3 \n",
"value = [2, 1] \n",
"class = Survived \n",
" \n",
"\n",
"\n",
"321->323 \n",
" \n",
" \n",
" \n",
"\n",
"\n",
"324 \n",
" \n",
"gini = 0.5 \n",
"samples = 2 \n",
"value = [1, 1] \n",
"class = Survived \n",
" \n",
"\n",
"\n",
"323->324 \n",
" \n",
" \n",
" \n",
"\n",
"\n",
"325 \n",
" \n",
"gini = 0.0 \n",
"samples = 1 \n",
"value = [1, 0] \n",
"class = Survived \n",
" \n",
"\n",
"\n",
"323->325 \n",
" \n",
" \n",
" \n",
"\n",
"\n",
"329 \n",
" \n",
"gini = 0.0 \n",
"samples = 2 \n",
"value = [0, 2] \n",
"class = Not Survived \n",
" \n",
"\n",
"\n",
"328->329 \n",
" \n",
" \n",
" \n",
"\n",
"\n",
"330 \n",
" \n",
"Age ≤ 27.0 \n",
"gini = 0.188 \n",
"samples = 19 \n",
"value = [17, 2] \n",
"class = Survived \n",
" \n",
"\n",
"\n",
"328->330 \n",
" \n",
" \n",
" \n",
"\n",
"\n",
"331 \n",
" \n",
"Fare ≤ 15.921 \n",
"gini = 0.346 \n",
"samples = 9 \n",
"value = [7, 2] \n",
"class = Survived \n",
" \n",
"\n",
"\n",
"330->331 \n",
" \n",
" \n",
" \n",
"\n",
"\n",
"338 \n",
" \n",
"gini = 0.0 \n",
"samples = 10 \n",
"value = [10, 0] \n",
"class = Survived \n",
" \n",
"\n",
"\n",
"330->338 \n",
" \n",
" \n",
" \n",
"\n",
"\n",
"332 \n",
" \n",
"gini = 0.0 \n",
"samples = 1 \n",
"value = [0, 1] \n",
"class = Not Survived \n",
" \n",
"\n",
"\n",
"331->332 \n",
" \n",
" \n",
" \n",
"\n",
"\n",
"333 \n",
" \n",
"Age ≤ 25.5 \n",
"gini = 0.219 \n",
"samples = 8 \n",
"value = [7, 1] \n",
"class = Survived \n",
" \n",
"\n",
"\n",
"331->333 \n",
" \n",
" \n",
" \n",
"\n",
"\n",
"334 \n",
" \n",
"gini = 0.0 \n",
"samples = 6 \n",
"value = [6, 0] \n",
"class = Survived \n",
" \n",
"\n",
"\n",
"333->334 \n",
" \n",
" \n",
" \n",
"\n",
"\n",
"335 \n",
" \n",
"SibSp ≤ 0.5 \n",
"gini = 0.5 \n",
"samples = 2 \n",
"value = [1, 1] \n",
"class = Survived \n",
" \n",
"\n",
"\n",
"333->335 \n",
" \n",
" \n",
" \n",
"\n",
"\n",
"336 \n",
" \n",
"gini = 0.0 \n",
"samples = 1 \n",
"value = [0, 1] \n",
"class = Not Survived \n",
" \n",
"\n",
"\n",
"335->336 \n",
" \n",
" \n",
" \n",
"\n",
"\n",
"337 \n",
" \n",
"gini = 0.0 \n",
"samples = 1 \n",
"value = [1, 0] \n",
"class = Survived \n",
" \n",
"\n",
"\n",
"335->337 \n",
" \n",
" \n",
" \n",
"\n",
"\n",
"340 \n",
" \n",
"Fare ≤ 9.492 \n",
"gini = 0.375 \n",
"samples = 16 \n",
"value = [12, 4] \n",
"class = Survived \n",
" \n",
"\n",
"\n",
"339->340 \n",
" \n",
" \n",
" \n",
"\n",
"\n",
"353 \n",
" \n",
"gini = 0.0 \n",
"samples = 7 \n",
"value = [7, 0] \n",
"class = Survived \n",
" \n",
"\n",
"\n",
"339->353 \n",
" \n",
" \n",
" \n",
"\n",
"\n",
"341 \n",
" \n",
"Age ≤ 29.5 \n",
"gini = 0.245 \n",
"samples = 14 \n",
"value = [12, 2] \n",
"class = Survived \n",
" \n",
"\n",
"\n",
"340->341 \n",
" \n",
" \n",
" \n",
"\n",
"\n",
"352 \n",
" \n",
"gini = 0.0 \n",
"samples = 2 \n",
"value = [0, 2] \n",
"class = Not Survived \n",
" \n",
"\n",
"\n",
"340->352 \n",
" \n",
" \n",
" \n",
"\n",
"\n",
"342 \n",
" \n",
"Fare ≤ 7.973 \n",
"gini = 0.408 \n",
"samples = 7 \n",
"value = [5, 2] \n",
"class = Survived \n",
" \n",
"\n",
"\n",
"341->342 \n",
" \n",
" \n",
" \n",
"\n",
"\n",
"351 \n",
" \n",
"gini = 0.0 \n",
"samples = 7 \n",
"value = [7, 0] \n",
"class = Survived \n",
" \n",
"\n",
"\n",
"341->351 \n",
" \n",
" \n",
" \n",
"\n",
"\n",
"343 \n",
" \n",
"Fare ≤ 7.885 \n",
"gini = 0.48 \n",
"samples = 5 \n",
"value = [3, 2] \n",
"class = Survived \n",
" \n",
"\n",
"\n",
"342->343 \n",
" \n",
" \n",
" \n",
"\n",
"\n",
"350 \n",
" \n",
"gini = 0.0 \n",
"samples = 2 \n",
"value = [2, 0] \n",
"class = Survived \n",
" \n",
"\n",
"\n",
"342->350 \n",
" \n",
" \n",
" \n",
"\n",
"\n",
"344 \n",
" \n",
"Fare ≤ 7.763 \n",
"gini = 0.375 \n",
"samples = 4 \n",
"value = [3, 1] \n",
"class = Survived \n",
" \n",
"\n",
"\n",
"343->344 \n",
" \n",
" \n",
" \n",
"\n",
"\n",
"349 \n",
" \n",
"gini = 0.0 \n",
"samples = 1 \n",
"value = [0, 1] \n",
"class = Not Survived \n",
" \n",
"\n",
"\n",
"343->349 \n",
" \n",
" \n",
" \n",
"\n",
"\n",
"345 \n",
" \n",
"SibSp ≤ 0.5 \n",
"gini = 0.5 \n",
"samples = 2 \n",
"value = [1, 1] \n",
"class = Survived \n",
" \n",
"\n",
"\n",
"344->345 \n",
" \n",
" \n",
" \n",
"\n",
"\n",
"348 \n",
" \n",
"gini = 0.0 \n",
"samples = 2 \n",
"value = [2, 0] \n",
"class = Survived \n",
" \n",
"\n",
"\n",
"344->348 \n",
" \n",
" \n",
" \n",
"\n",
"\n",
"346 \n",
" \n",
"gini = 0.0 \n",
"samples = 1 \n",
"value = [0, 1] \n",
"class = Not Survived \n",
" \n",
"\n",
"\n",
"345->346 \n",
" \n",
" \n",
" \n",
"\n",
"\n",
"347 \n",
" \n",
"gini = 0.0 \n",
"samples = 1 \n",
"value = [1, 0] \n",
"class = Survived \n",
" \n",
"\n",
"\n",
"345->347 \n",
" \n",
" \n",
" \n",
"\n",
"\n",
"357 \n",
" \n",
"gini = 0.0 \n",
"samples = 3 \n",
"value = [3, 0] \n",
"class = Survived \n",
" \n",
"\n",
"\n",
"356->357 \n",
" \n",
" \n",
" \n",
"\n",
"\n",
"358 \n",
" \n",
"Fare ≤ 7.875 \n",
"gini = 0.48 \n",
"samples = 15 \n",
"value = [9, 6] \n",
"class = Survived \n",
" \n",
"\n",
"\n",
"356->358 \n",
" \n",
" \n",
" \n",
"\n",
"\n",
"359 \n",
" \n",
"gini = 0.0 \n",
"samples = 1 \n",
"value = [0, 1] \n",
"class = Not Survived \n",
" \n",
"\n",
"\n",
"358->359 \n",
" \n",
" \n",
" \n",
"\n",
"\n",
"360 \n",
" \n",
"Fare ≤ 26.125 \n",
"gini = 0.459 \n",
"samples = 14 \n",
"value = [9, 5] \n",
"class = Survived \n",
" \n",
"\n",
"\n",
"358->360 \n",
" \n",
" \n",
" \n",
"\n",
"\n",
"361 \n",
" \n",
"Fare ≤ 20.925 \n",
"gini = 0.486 \n",
"samples = 12 \n",
"value = [7, 5] \n",
"class = Survived \n",
" \n",
"\n",
"\n",
"360->361 \n",
" \n",
" \n",
" \n",
"\n",
"\n",
"376 \n",
" \n",
"gini = 0.0 \n",
"samples = 2 \n",
"value = [2, 0] \n",
"class = Survived \n",
" \n",
"\n",
"\n",
"360->376 \n",
" \n",
" \n",
" \n",
"\n",
"\n",
"362 \n",
" \n",
"Age ≤ 31.5 \n",
"gini = 0.463 \n",
"samples = 11 \n",
"value = [7, 4] \n",
"class = Survived \n",
" \n",
"\n",
"\n",
"361->362 \n",
" \n",
" \n",
" \n",
"\n",
"\n",
"375 \n",
" \n",
"gini = 0.0 \n",
"samples = 1 \n",
"value = [0, 1] \n",
"class = Not Survived \n",
" \n",
"\n",
"\n",
"361->375 \n",
" \n",
" \n",
" \n",
"\n",
"\n",
"363 \n",
" \n",
"Fare ≤ 9.213 \n",
"gini = 0.444 \n",
"samples = 3 \n",
"value = [1, 2] \n",
"class = Not Survived \n",
" \n",
"\n",
"\n",
"362->363 \n",
" \n",
" \n",
" \n",
"\n",
"\n",
"368 \n",
" \n",
"Fare ≤ 8.206 \n",
"gini = 0.375 \n",
"samples = 8 \n",
"value = [6, 2] \n",
"class = Survived \n",
" \n",
"\n",
"\n",
"362->368 \n",
" \n",
" \n",
" \n",
"\n",
"\n",
"364 \n",
" \n",
"gini = 0.0 \n",
"samples = 1 \n",
"value = [0, 1] \n",
"class = Not Survived \n",
" \n",
"\n",
"\n",
"363->364 \n",
" \n",
" \n",
" \n",
"\n",
"\n",
"365 \n",
" \n",
"Fare ≤ 11.75 \n",
"gini = 0.5 \n",
"samples = 2 \n",
"value = [1, 1] \n",
"class = Survived \n",
" \n",
"\n",
"\n",
"363->365 \n",
" \n",
" \n",
" \n",
"\n",
"\n",
"366 \n",
" \n",
"gini = 0.0 \n",
"samples = 1 \n",
"value = [1, 0] \n",
"class = Survived \n",
" \n",
"\n",
"\n",
"365->366 \n",
" \n",
" \n",
" \n",
"\n",
"\n",
"367 \n",
" \n",
"gini = 0.0 \n",
"samples = 1 \n",
"value = [0, 1] \n",
"class = Not Survived \n",
" \n",
"\n",
"\n",
"365->367 \n",
" \n",
" \n",
" \n",
"\n",
"\n",
"369 \n",
" \n",
"Fare ≤ 7.988 \n",
"gini = 0.48 \n",
"samples = 5 \n",
"value = [3, 2] \n",
"class = Survived \n",
" \n",
"\n",
"\n",
"368->369 \n",
" \n",
" \n",
" \n",
"\n",
"\n",
"374 \n",
" \n",
"gini = 0.0 \n",
"samples = 3 \n",
"value = [3, 0] \n",
"class = Survived \n",
" \n",
"\n",
"\n",
"368->374 \n",
" \n",
" \n",
" \n",
"\n",
"\n",
"370 \n",
" \n",
"Fare ≤ 7.91 \n",
"gini = 0.375 \n",
"samples = 4 \n",
"value = [3, 1] \n",
"class = Survived \n",
" \n",
"\n",
"\n",
"369->370 \n",
" \n",
" \n",
" \n",
"\n",
"\n",
"373 \n",
" \n",
"gini = 0.0 \n",
"samples = 1 \n",
"value = [0, 1] \n",
"class = Not Survived \n",
" \n",
"\n",
"\n",
"369->373 \n",
" \n",
" \n",
" \n",
"\n",
"\n",
"371 \n",
" \n",
"gini = 0.0 \n",
"samples = 1 \n",
"value = [1, 0] \n",
"class = Survived \n",
" \n",
"\n",
"\n",
"370->371 \n",
" \n",
" \n",
" \n",
"\n",
"\n",
"372 \n",
" \n",
"gini = 0.444 \n",
"samples = 3 \n",
"value = [2, 1] \n",
"class = Survived \n",
" \n",
"\n",
"\n",
"370->372 \n",
" \n",
" \n",
" \n",
"\n",
"\n",
"378 \n",
" \n",
"gini = 0.0 \n",
"samples = 32 \n",
"value = [32, 0] \n",
"class = Survived \n",
" \n",
"\n",
"\n",
"377->378 \n",
" \n",
" \n",
" \n",
"\n",
"\n",
"379 \n",
" \n",
"Fare ≤ 7.988 \n",
"gini = 0.151 \n",
"samples = 73 \n",
"value = [67, 6] \n",
"class = Survived \n",
" \n",
"\n",
"\n",
"377->379 \n",
" \n",
" \n",
" \n",
"\n",
"\n",
"380 \n",
" \n",
"SibSp ≤ 1.0 \n",
"gini = 0.5 \n",
"samples = 4 \n",
"value = [2, 2] \n",
"class = Survived \n",
" \n",
"\n",
"\n",
"379->380 \n",
" \n",
" \n",
" \n",
"\n",
"\n",
"385 \n",
" \n",
"Age ≤ 61.0 \n",
"gini = 0.109 \n",
"samples = 69 \n",
"value = [65, 4] \n",
"class = Survived \n",
" \n",
"\n",
"\n",
"379->385 \n",
" \n",
" \n",
" \n",
"\n",
"\n",
"381 \n",
" \n",
"Age ≤ 41.5 \n",
"gini = 0.444 \n",
"samples = 3 \n",
"value = [1, 2] \n",
"class = Not Survived \n",
" \n",
"\n",
"\n",
"380->381 \n",
" \n",
" \n",
" \n",
"\n",
"\n",
"384 \n",
" \n",
"gini = 0.0 \n",
"samples = 1 \n",
"value = [1, 0] \n",
"class = Survived \n",
" \n",
"\n",
"\n",
"380->384 \n",
" \n",
" \n",
" \n",
"\n",
"\n",
"382 \n",
" \n",
"gini = 0.5 \n",
"samples = 2 \n",
"value = [1, 1] \n",
"class = Survived \n",
" \n",
"\n",
"\n",
"381->382 \n",
" \n",
" \n",
" \n",
"\n",
"\n",
"383 \n",
" \n",
"gini = 0.0 \n",
"samples = 1 \n",
"value = [0, 1] \n",
"class = Not Survived \n",
" \n",
"\n",
"\n",
"381->383 \n",
" \n",
" \n",
" \n",
"\n",
"\n",
"386 \n",
" \n",
"Fare ≤ 13.25 \n",
"gini = 0.087 \n",
"samples = 66 \n",
"value = [63, 3] \n",
"class = Survived \n",
" \n",
"\n",
"\n",
"385->386 \n",
" \n",
" \n",
" \n",
"\n",
"\n",
"401 \n",
" \n",
"Age ≤ 64.0 \n",
"gini = 0.444 \n",
"samples = 3 \n",
"value = [2, 1] \n",
"class = Survived \n",
" \n",
"\n",
"\n",
"385->401 \n",
" \n",
" \n",
" \n",
"\n",
"\n",
"387 \n",
" \n",
"Fare ≤ 12.938 \n",
"gini = 0.157 \n",
"samples = 35 \n",
"value = [32, 3] \n",
"class = Survived \n",
" \n",
"\n",
"\n",
"386->387 \n",
" \n",
" \n",
" \n",
"\n",
"\n",
"400 \n",
" \n",
"gini = 0.0 \n",
"samples = 31 \n",
"value = [31, 0] \n",
"class = Survived \n",
" \n",
"\n",
"\n",
"386->400 \n",
" \n",
" \n",
" \n",
"\n",
"\n",
"388 \n",
" \n",
"Age ≤ 44.5 \n",
"gini = 0.08 \n",
"samples = 24 \n",
"value = [23, 1] \n",
"class = Survived \n",
" \n",
"\n",
"\n",
"387->388 \n",
" \n",
" \n",
" \n",
"\n",
"\n",
"393 \n",
" \n",
"Age ≤ 45.0 \n",
"gini = 0.298 \n",
"samples = 11 \n",
"value = [9, 2] \n",
"class = Survived \n",
" \n",
"\n",
"\n",
"387->393 \n",
" \n",
" \n",
" \n",
"\n",
"\n",
"389 \n",
" \n",
"gini = 0.0 \n",
"samples = 17 \n",
"value = [17, 0] \n",
"class = Survived \n",
" \n",
"\n",
"\n",
"388->389 \n",
" \n",
" \n",
" \n",
"\n",
"\n",
"390 \n",
" \n",
"Age ≤ 46.0 \n",
"gini = 0.245 \n",
"samples = 7 \n",
"value = [6, 1] \n",
"class = Survived \n",
" \n",
"\n",
"\n",
"388->390 \n",
" \n",
" \n",
" \n",
"\n",
"\n",
"391 \n",
" \n",
"gini = 0.0 \n",
"samples = 1 \n",
"value = [0, 1] \n",
"class = Not Survived \n",
" \n",
"\n",
"\n",
"390->391 \n",
" \n",
" \n",
" \n",
"\n",
"\n",
"392 \n",
" \n",
"gini = 0.0 \n",
"samples = 6 \n",
"value = [6, 0] \n",
"class = Survived \n",
" \n",
"\n",
"\n",
"390->392 \n",
" \n",
" \n",
" \n",
"\n",
"\n",
"394 \n",
" \n",
"Age ≤ 40.5 \n",
"gini = 0.375 \n",
"samples = 8 \n",
"value = [6, 2] \n",
"class = Survived \n",
" \n",
"\n",
"\n",
"393->394 \n",
" \n",
" \n",
" \n",
"\n",
"\n",
"399 \n",
" \n",
"gini = 0.0 \n",
"samples = 3 \n",
"value = [3, 0] \n",
"class = Survived \n",
" \n",
"\n",
"\n",
"393->399 \n",
" \n",
" \n",
" \n",
"\n",
"\n",
"395 \n",
" \n",
"Age ≤ 35.0 \n",
"gini = 0.278 \n",
"samples = 6 \n",
"value = [5, 1] \n",
"class = Survived \n",
" \n",
"\n",
"\n",
"394->395 \n",
" \n",
" \n",
" \n",
"\n",
"\n",
"398 \n",
" \n",
"gini = 0.5 \n",
"samples = 2 \n",
"value = [1, 1] \n",
"class = Survived \n",
" \n",
"\n",
"\n",
"394->398 \n",
" \n",
" \n",
" \n",
"\n",
"\n",
"396 \n",
" \n",
"gini = 0.444 \n",
"samples = 3 \n",
"value = [2, 1] \n",
"class = Survived \n",
" \n",
"\n",
"\n",
"395->396 \n",
" \n",
" \n",
" \n",
"\n",
"\n",
"397 \n",
" \n",
"gini = 0.0 \n",
"samples = 3 \n",
"value = [3, 0] \n",
"class = Survived \n",
" \n",
"\n",
"\n",
"395->397 \n",
" \n",
" \n",
" \n",
"\n",
"\n",
"402 \n",
" \n",
"gini = 0.0 \n",
"samples = 1 \n",
"value = [0, 1] \n",
"class = Not Survived \n",
" \n",
"\n",
"\n",
"401->402 \n",
" \n",
" \n",
" \n",
"\n",
"\n",
"403 \n",
" \n",
"gini = 0.0 \n",
"samples = 2 \n",
"value = [2, 0] \n",
"class = Survived \n",
" \n",
"\n",
"\n",
"401->403 \n",
" \n",
" \n",
" \n",
"\n",
"\n",
"405 \n",
" \n",
"Age ≤ 30.0 \n",
"gini = 0.408 \n",
"samples = 7 \n",
"value = [2, 5] \n",
"class = Not Survived \n",
" \n",
"\n",
"\n",
"404->405 \n",
" \n",
" \n",
" \n",
"\n",
"\n",
"410 \n",
" \n",
"gini = 0.0 \n",
"samples = 9 \n",
"value = [9, 0] \n",
"class = Survived \n",
" \n",
"\n",
"\n",
"404->410 \n",
" \n",
" \n",
" \n",
"\n",
"\n",
"406 \n",
" \n",
"Age ≤ 27.0 \n",
"gini = 0.48 \n",
"samples = 5 \n",
"value = [2, 3] \n",
"class = Not Survived \n",
" \n",
"\n",
"\n",
"405->406 \n",
" \n",
" \n",
" \n",
"\n",
"\n",
"409 \n",
" \n",
"gini = 0.0 \n",
"samples = 2 \n",
"value = [0, 2] \n",
"class = Not Survived \n",
" \n",
"\n",
"\n",
"405->409 \n",
" \n",
" \n",
" \n",
"\n",
"\n",
"407 \n",
" \n",
"gini = 0.0 \n",
"samples = 1 \n",
"value = [0, 1] \n",
"class = Not Survived \n",
" \n",
"\n",
"\n",
"406->407 \n",
" \n",
" \n",
" \n",
"\n",
"\n",
"408 \n",
" \n",
"gini = 0.5 \n",
"samples = 4 \n",
"value = [2, 2] \n",
"class = Survived \n",
" \n",
"\n",
"\n",
"406->408 \n",
" \n",
" \n",
" \n",
" \n",
" \n"
],
"text/plain": [
""
]
},
"execution_count": 35,
"metadata": {},
"output_type": "execute_result"
}
],
"source": [
"import graphviz\n",
"from PIL import Image  # NOTE(review): not used in this cell; kept in case other cells rely on it\n",
"\n",
"# First pass: export the fitted tree without labels and render it to disk\n",
"# under the name 'Titanic' (graphviz saves the DOT source and its rendering).\n",
"dot_data = tree.export_graphviz(clf, out_file=None)\n",
"graph = graphviz.Source(dot_data)\n",
"graph.render(\"Titanic\")\n",
"\n",
"# Second pass: labelled, colour-filled tree for inline display.\n",
"# class_names must be given in ascending order of the class labels. The target is\n",
"# presumably the 0/1 'Survived' column, so index 0 -> 'Not Survived' and\n",
"# index 1 -> 'Survived'. The previous order was reversed, which labelled nodes\n",
"# dominated by class 0 as 'Survived'.\n",
"dot_data = tree.export_graphviz(clf, out_file=None,\n",
"                                feature_names=data_train.columns.values,\n",
"                                class_names=['Not Survived', 'Survived'],\n",
"                                filled=True, rounded=True,\n",
"                                special_characters=True)\n",
"graph = graphviz.Source(dot_data)\n",
"graph"
]
},
{
"cell_type": "code",
"execution_count": 22,
"id": "8ad7b604",
"metadata": {},
"outputs": [
{
"data": {
"text/plain": [
"0.978675645342312"
]
},
"execution_count": 22,
"metadata": {},
"output_type": "execute_result"
}
],
"source": [
"# Make predictions and store in 'Survived' column of df_test\n",
"Y_pred = clf.predict(test)\n",
"df_test['Survived'] = Y_pred\n",
"clf.score(X, y)"
]
},
{
"cell_type": "code",
"execution_count": 23,
"id": "0d0f2be2",
"metadata": {},
"outputs": [],
"source": [
"# Write the submission relative to the current working directory instead of a\n",
"# machine-specific absolute path, so the cell runs on any machine.\n",
"SUBMISSION_PATH = 'dt.csv'\n",
"df_test[['PassengerId', 'Survived']].to_csv(SUBMISSION_PATH, index=False)"
]
},
{
"cell_type": "code",
"execution_count": 34,
"id": "ae505ffa",
"metadata": {},
"outputs": [
{
"data": {
"text/plain": [
"'Source.gv.pdf'"
]
},
"execution_count": 34,
"metadata": {},
"output_type": "execute_result"
}
],
"source": [
"# Build a graphviz Source from the DOT text and open its rendering in the default viewer.\n",
"tree_source = graphviz.Source(dot_data)\n",
"tree_source.view()"
]
},
{
"cell_type": "code",
"execution_count": null,
"id": "e046624a",
"metadata": {},
"outputs": [],
"source": []
}
],
"metadata": {
"kernelspec": {
"display_name": "ml",
"language": "python",
"name": "ml"
},
"language_info": {
"codemirror_mode": {
"name": "ipython",
"version": 3
},
"file_extension": ".py",
"mimetype": "text/x-python",
"name": "python",
"nbconvert_exporter": "python",
"pygments_lexer": "ipython3",
"version": "3.9.15"
}
},
"nbformat": 4,
"nbformat_minor": 5
}