{ "cells": [ { "cell_type": "code", "execution_count": 1, "id": "002ba07a", "metadata": {}, "outputs": [], "source": [ "\n", "# Import modules\n", "import os\n", "import pandas as pd\n", "import matplotlib.pyplot as plt\n", "import seaborn as sns\n", "import re\n", "import numpy as np\n", "from sklearn import tree\n", "from sklearn.model_selection import train_test_split\n", "\n", "# Figures inline and set visualization style\n", "%matplotlib inline\n", "sns.set()\n" ] }, { "cell_type": "code", "execution_count": 2, "id": "2949d944", "metadata": {}, "outputs": [ { "name": "stdout", "output_type": "stream", "text": [ "(891, 12)\n" ] }, { "data": { "text/html": [ "
\n", "\n", "\n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", "
PassengerIdSurvivedPclassNameSexAgeSibSpParchTicketFareCabinEmbarked
0103Braund, Mr. Owen Harrismale22.010A/5 211717.2500NaNS
1211Cumings, Mrs. John Bradley (Florence Briggs Th...female38.010PC 1759971.2833C85C
2313Heikkinen, Miss. Lainafemale26.000STON/O2. 31012827.9250NaNS
3411Futrelle, Mrs. Jacques Heath (Lily May Peel)female35.01011380353.1000C123S
4503Allen, Mr. William Henrymale35.0003734508.0500NaNS
\n", "
" ], "text/plain": [ " PassengerId Survived Pclass \\\n", "0 1 0 3 \n", "1 2 1 1 \n", "2 3 1 3 \n", "3 4 1 1 \n", "4 5 0 3 \n", "\n", " Name Sex Age SibSp \\\n", "0 Braund, Mr. Owen Harris male 22.0 1 \n", "1 Cumings, Mrs. John Bradley (Florence Briggs Th... female 38.0 1 \n", "2 Heikkinen, Miss. Laina female 26.0 0 \n", "3 Futrelle, Mrs. Jacques Heath (Lily May Peel) female 35.0 1 \n", "4 Allen, Mr. William Henry male 35.0 0 \n", "\n", " Parch Ticket Fare Cabin Embarked \n", "0 0 A/5 21171 7.2500 NaN S \n", "1 0 PC 17599 71.2833 C85 C \n", "2 0 STON/O2. 3101282 7.9250 NaN S \n", "3 0 113803 53.1000 C123 S \n", "4 0 373450 8.0500 NaN S " ] }, "execution_count": 2, "metadata": {}, "output_type": "execute_result" } ], "source": [ "# Folder holding train.csv and test.csv. Set the TITANIC_DATA_DIR environment\n", "# variable to point somewhere else; the fallback is the folder this notebook\n", "# was originally written against, so existing setups keep working unchanged.\n", "DATA_DIR = os.environ.get(\"TITANIC_DATA_DIR\", \"C:/Users/User/Downloads\")\n", "\n", "df_train = pd.read_csv(os.path.join(DATA_DIR, \"train.csv\"))\n", "df_test = pd.read_csv(os.path.join(DATA_DIR, \"test.csv\"))\n", "\n", "# Report the training-set dimensions, then preview its first rows\n", "print(df_train.shape)\n", "df_train.head()" ] }, { "cell_type": "code", "execution_count": 3, "id": "34b67c3b", "metadata": {}, "outputs": [ { "name": "stdout", "output_type": "stream", "text": [ "(418, 11)\n" ] }, { "data": { "text/html": [ "
\n", "\n", "\n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", "
PassengerIdPclassNameSexAgeSibSpParchTicketFareCabinEmbarked
08923Kelly, Mr. Jamesmale34.5003309117.8292NaNQ
18933Wilkes, Mrs. James (Ellen Needs)female47.0103632727.0000NaNS
28942Myles, Mr. Thomas Francismale62.0002402769.6875NaNQ
38953Wirz, Mr. Albertmale27.0003151548.6625NaNS
48963Hirvonen, Mrs. Alexander (Helga E Lindqvist)female22.011310129812.2875NaNS
\n", "
" ], "text/plain": [ " PassengerId Pclass Name Sex \\\n", "0 892 3 Kelly, Mr. James male \n", "1 893 3 Wilkes, Mrs. James (Ellen Needs) female \n", "2 894 2 Myles, Mr. Thomas Francis male \n", "3 895 3 Wirz, Mr. Albert male \n", "4 896 3 Hirvonen, Mrs. Alexander (Helga E Lindqvist) female \n", "\n", " Age SibSp Parch Ticket Fare Cabin Embarked \n", "0 34.5 0 0 330911 7.8292 NaN Q \n", "1 47.0 1 0 363272 7.0000 NaN S \n", "2 62.0 0 0 240276 9.6875 NaN Q \n", "3 27.0 0 0 315154 8.6625 NaN S \n", "4 22.0 1 1 3101298 12.2875 NaN S " ] }, "execution_count": 3, "metadata": {}, "output_type": "execute_result" } ], "source": [ "# Dimensions of the test set, followed by a preview of its first five rows\n", "print(df_test.shape)\n", "df_test.head(n=5)" ] }, { "cell_type": "code", "execution_count": 4, "id": "4b1b1011", "metadata": {}, "outputs": [ { "data": { "image/png": "\n", "text/plain": [ "
" ] }, "metadata": {}, "output_type": "display_data" } ], "source": [ "# Number of training passengers for each value of Survived\n", "sns.countplot(data=df_train, x='Survived');" ] }, { "cell_type": "code", "execution_count": 5, "id": "d60bf413", "metadata": {}, "outputs": [ { "data": { "image/png": "\n", "text/plain": [ "
" ] }, "metadata": {}, "output_type": "display_data" } ], "source": [ "# Number of training passengers for each value of Sex\n", "sns.countplot(data=df_train, x='Sex');" ] }, { "cell_type": "code", "execution_count": 6, "id": "1c2bfb25", "metadata": {}, "outputs": [ { "data": { "image/png": "\n", "text/plain": [ "
" ] }, "metadata": {}, "output_type": "display_data" } ], "source": [ "# Survived counts drawn as one panel per value of Sex\n", "sns.catplot(x='Survived', col='Sex', kind='count', data=df_train);" ] }, { "cell_type": "code", "execution_count": 7, "id": "dbede04d", "metadata": {}, "outputs": [ { "data": { "text/plain": [ "Sex\n", "female 233\n", "male 109\n", "Name: Survived, dtype: int64" ] }, "execution_count": 7, "metadata": {}, "output_type": "execute_result" } ], "source": [ "# Sum of the Survived column within each Sex group\n", "df_train.groupby(['Sex']).Survived.sum()" ] }, { "cell_type": "code", "execution_count": 8, "id": "eeeb3341", "metadata": {}, "outputs": [ { "data": { "text/plain": [ "342" ] }, "execution_count": 8, "metadata": {}, "output_type": "execute_result" } ], "source": [ "# Sum of the Survived column over the whole training set\n", "df_train.Survived.sum()" ] }, { "cell_type": "code", "execution_count": 9, "id": "937a3084", "metadata": {}, "outputs": [ { "name": "stdout", "output_type": "stream", "text": [ "0.7420382165605095\n", "0.18890814558058924\n" ] } ], "source": [ "# Survival rate per sex. The mean of Survived over the selected rows equals\n", "# sum()/count() on those rows, so one filter per sex replaces the repeated ones.\n", "for sex in ('female', 'male'):\n", "    print(df_train.loc[df_train.Sex == sex, 'Survived'].mean())" ] }, { "cell_type": "code", "execution_count": 10, "id": "864310ff", "metadata": {}, "outputs": [ { "data": { "image/png": "\n", "text/plain": [ "
" ] }, "metadata": {}, "output_type": "display_data" } ], "source": [ "# Survived counts drawn as one panel per value of Pclass\n", "sns.catplot(data=df_train, x='Survived', col='Pclass', kind='count');" ] }, { "cell_type": "code", "execution_count": 11, "id": "4b9782b2", "metadata": {}, "outputs": [ { "data": { "text/html": [ "
\n", "\n", "\n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", "
PassengerIdPclassNameSexAgeSibSpParchTicketFareCabinEmbarked
41313053Spector, Mr. WoolfmaleNaN00A.5. 32368.0500NaNS
41413061Oliva y Ocana, Dona. Ferminafemale39.000PC 17758108.9000C105C
41513073Saether, Mr. Simon Sivertsenmale38.500SOTON/O.Q. 31012627.2500NaNS
41613083Ware, Mr. FrederickmaleNaN003593098.0500NaNS
41713093Peter, Master. Michael JmaleNaN11266822.3583NaNC
\n", "
" ], "text/plain": [ " PassengerId Pclass Name Sex Age SibSp \\\n", "413 1305 3 Spector, Mr. Woolf male NaN 0 \n", "414 1306 1 Oliva y Ocana, Dona. Fermina female 39.0 0 \n", "415 1307 3 Saether, Mr. Simon Sivertsen male 38.5 0 \n", "416 1308 3 Ware, Mr. Frederick male NaN 0 \n", "417 1309 3 Peter, Master. Michael J male NaN 1 \n", "\n", " Parch Ticket Fare Cabin Embarked \n", "413 0 A.5. 3236 8.0500 NaN S \n", "414 0 PC 17758 108.9000 C105 C \n", "415 0 SOTON/O.Q. 3101262 7.2500 NaN S \n", "416 0 359309 8.0500 NaN S \n", "417 1 2668 22.3583 NaN C " ] }, "execution_count": 11, "metadata": {}, "output_type": "execute_result" } ], "source": [ "# Keep the training labels aside before the label column is dropped\n", "survived_train = df_train['Survived']\n", "\n", "# Stack the label-free training rows on top of the test rows. The row labels\n", "# are not reset here, so each frame keeps its own labels in the result.\n", "data = pd.concat([df_train.drop(columns=['Survived']), df_test])\n", "data.tail()" ] }, { "cell_type": "code", "execution_count": 12, "id": "31431041", "metadata": {}, "outputs": [ { "data": { "text/html": [ "
\n", "\n", "\n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", "
PassengerIdPclassNameSexAgeSibSpParchTicketFareCabinEmbarked
08923Kelly, Mr. Jamesmale34.5003309117.8292NaNQ
18933Wilkes, Mrs. James (Ellen Needs)female47.0103632727.0000NaNS
28942Myles, Mr. Thomas Francismale62.0002402769.6875NaNQ
38953Wirz, Mr. Albertmale27.0003151548.6625NaNS
48963Hirvonen, Mrs. Alexander (Helga E Lindqvist)female22.011310129812.2875NaNS
....................................
41313053Spector, Mr. WoolfmaleNaN00A.5. 32368.0500NaNS
41413061Oliva y Ocana, Dona. Ferminafemale39.000PC 17758108.9000C105C
41513073Saether, Mr. Simon Sivertsenmale38.500SOTON/O.Q. 31012627.2500NaNS
41613083Ware, Mr. FrederickmaleNaN003593098.0500NaNS
41713093Peter, Master. Michael JmaleNaN11266822.3583NaNC
\n", "

418 rows × 11 columns

\n", "
" ], "text/plain": [ " PassengerId Pclass Name \\\n", "0 892 3 Kelly, Mr. James \n", "1 893 3 Wilkes, Mrs. James (Ellen Needs) \n", "2 894 2 Myles, Mr. Thomas Francis \n", "3 895 3 Wirz, Mr. Albert \n", "4 896 3 Hirvonen, Mrs. Alexander (Helga E Lindqvist) \n", ".. ... ... ... \n", "413 1305 3 Spector, Mr. Woolf \n", "414 1306 1 Oliva y Ocana, Dona. Fermina \n", "415 1307 3 Saether, Mr. Simon Sivertsen \n", "416 1308 3 Ware, Mr. Frederick \n", "417 1309 3 Peter, Master. Michael J \n", "\n", " Sex Age SibSp Parch Ticket Fare Cabin Embarked \n", "0 male 34.5 0 0 330911 7.8292 NaN Q \n", "1 female 47.0 1 0 363272 7.0000 NaN S \n", "2 male 62.0 0 0 240276 9.6875 NaN Q \n", "3 male 27.0 0 0 315154 8.6625 NaN S \n", "4 female 22.0 1 1 3101298 12.2875 NaN S \n", ".. ... ... ... ... ... ... ... ... \n", "413 male NaN 0 0 A.5. 3236 8.0500 NaN S \n", "414 female 39.0 0 0 PC 17758 108.9000 C105 C \n", "415 male 38.5 0 0 SOTON/O.Q. 3101262 7.2500 NaN S \n", "416 male NaN 0 0 359309 8.0500 NaN S \n", "417 male NaN 1 1 2668 22.3583 NaN C \n", "\n", "[418 rows x 11 columns]" ] }, "execution_count": 12, "metadata": {}, "output_type": "execute_result" } ], "source": [ "# Display the test frame as loaded (it was read from test.csv and has not been modified)\n", "df_test" ] }, { "cell_type": "code", "execution_count": 13, "id": "ef626cce", "metadata": {}, "outputs": [ { "data": { "text/plain": [ "0 0\n", "1 1\n", "2 1\n", "3 1\n", "4 0\n", " ..\n", "886 0\n", "887 1\n", "888 0\n", "889 1\n", "890 0\n", "Name: Survived, Length: 891, dtype: int64" ] }, "execution_count": 13, "metadata": {}, "output_type": "execute_result" } ], "source": [ "# Display the training labels that were set aside before concatenation\n", "survived_train" ] }, { "cell_type": "code", "execution_count": 14, "id": "d871eb29", "metadata": {}, "outputs": [ { "name": "stdout", "output_type": "stream", "text": [ "\n", "Int64Index: 1309 entries, 0 to 417\n", "Data columns (total 11 columns):\n", " # Column Non-Null Count Dtype \n", "--- ------ -------------- ----- \n", " 0 PassengerId 1309 non-null int64 \n", " 1 Pclass 1309 non-null int64 \n", " 2 Name 1309 non-null object \n", " 3 
Sex 1309 non-null object \n", " 4 Age 1046 non-null float64\n", " 5 SibSp 1309 non-null int64 \n", " 6 Parch 1309 non-null int64 \n", " 7 Ticket 1309 non-null object \n", " 8 Fare 1308 non-null float64\n", " 9 Cabin 295 non-null object \n", " 10 Embarked 1307 non-null object \n", "dtypes: float64(2), int64(4), object(5)\n", "memory usage: 122.7+ KB\n" ] } ], "source": [ "# Column dtypes and non-null counts of the combined frame\n", "data.info()" ] }, { "cell_type": "code", "execution_count": 15, "id": "7a39497b", "metadata": {}, "outputs": [ { "name": "stdout", "output_type": "stream", "text": [ "\n", "Int64Index: 1309 entries, 0 to 417\n", "Data columns (total 11 columns):\n", " # Column Non-Null Count Dtype \n", "--- ------ -------------- ----- \n", " 0 PassengerId 1309 non-null int64 \n", " 1 Pclass 1309 non-null int64 \n", " 2 Name 1309 non-null object \n", " 3 Sex 1309 non-null object \n", " 4 Age 1309 non-null float64\n", " 5 SibSp 1309 non-null int64 \n", " 6 Parch 1309 non-null int64 \n", " 7 Ticket 1309 non-null object \n", " 8 Fare 1309 non-null float64\n", " 9 Cabin 295 non-null object \n", " 10 Embarked 1307 non-null object \n", "dtypes: float64(2), int64(4), object(5)\n", "memory usage: 122.7+ KB\n" ] } ], "source": [ "# Fill the gaps in the two numeric columns with that column's median.\n", "# The median is taken over `data`, i.e. whatever rows the frame holds here.\n", "for column in ('Age', 'Fare'):\n", "    data[column] = data[column].fillna(data[column].median())\n", "\n", "# Re-check the non-null counts after filling\n", "data.info()" ] }, { "cell_type": "code", "execution_count": 16, "id": "d6257a63", "metadata": {}, "outputs": [ { "data": { "text/html": [ "
\n", "\n", "\n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", "
PassengerIdPclassNameAgeSibSpParchTicketFareCabinEmbarkedSex_male
013Braund, Mr. Owen Harris22.010A/5 211717.2500NaNS1
121Cumings, Mrs. John Bradley (Florence Briggs Th...38.010PC 1759971.2833C85C0
233Heikkinen, Miss. Laina26.000STON/O2. 31012827.9250NaNS0
341Futrelle, Mrs. Jacques Heath (Lily May Peel)35.01011380353.1000C123S0
453Allen, Mr. William Henry35.0003734508.0500NaNS1
\n", "
" ], "text/plain": [ " PassengerId Pclass Name \\\n", "0 1 3 Braund, Mr. Owen Harris \n", "1 2 1 Cumings, Mrs. John Bradley (Florence Briggs Th... \n", "2 3 3 Heikkinen, Miss. Laina \n", "3 4 1 Futrelle, Mrs. Jacques Heath (Lily May Peel) \n", "4 5 3 Allen, Mr. William Henry \n", "\n", " Age SibSp Parch Ticket Fare Cabin Embarked Sex_male \n", "0 22.0 1 0 A/5 21171 7.2500 NaN S 1 \n", "1 38.0 1 0 PC 17599 71.2833 C85 C 0 \n", "2 26.0 0 0 STON/O2. 3101282 7.9250 NaN S 0 \n", "3 35.0 1 0 113803 53.1000 C123 S 0 \n", "4 35.0 0 0 373450 8.0500 NaN S 1 " ] }, "execution_count": 16, "metadata": {}, "output_type": "execute_result" } ], "source": [ "# Replace the text column Sex with a single indicator column, Sex_male\n", "# (drop_first=True removes the redundant first level).\n", "# dtype=int pins the indicator to integers: pandas 2.0 and later default to\n", "# bool here, which would turn the later mixed-column .values into an object array.\n", "data = pd.get_dummies(data, columns=['Sex'], drop_first=True, dtype=int)\n", "data.head()" ] }, { "cell_type": "code", "execution_count": 17, "id": "fd501ce5", "metadata": {}, "outputs": [ { "data": { "text/html": [ "
\n", "\n", "\n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", "
Sex_maleFareAgePclassSibSp
017.250022.031
1071.283338.011
207.925026.030
3053.100035.011
418.050035.030
\n", "
" ], "text/plain": [ " Sex_male Fare Age Pclass SibSp\n", "0 1 7.2500 22.0 3 1\n", "1 0 71.2833 38.0 1 1\n", "2 0 7.9250 26.0 3 0\n", "3 0 53.1000 35.0 1 1\n", "4 1 8.0500 35.0 3 0" ] }, "execution_count": 17, "metadata": {}, "output_type": "execute_result" } ], "source": [ "# Keep only the five columns used as model features\n", "data = data[['Sex_male', 'Fare', 'Age','Pclass', 'SibSp']]\n", "data.head()" ] }, { "cell_type": "code", "execution_count": 18, "id": "ac70fa2a", "metadata": {}, "outputs": [], "source": [ "# Split the combined frame back apart by position. The training rows were\n", "# concatenated first, so there are as many of them as there are training\n", "# labels; deriving the cut from the labels avoids a hard-coded row count.\n", "n_train = len(survived_train)\n", "data_train = data.iloc[:n_train]\n", "data_test = data.iloc[n_train:]" ] }, { "cell_type": "code", "execution_count": 19, "id": "f307ca52", "metadata": {}, "outputs": [], "source": [ "# Plain arrays for scikit-learn: training features, test features, training labels\n", "X = data_train.values\n", "test = data_test.values\n", "y = survived_train.values" ] }, { "cell_type": "code", "execution_count": 20, "id": "3c4de849", "metadata": {}, "outputs": [ { "data": { "text/html": [ "
DecisionTreeClassifier()
In a Jupyter environment, please rerun this cell to show the HTML representation or trust the notebook.
On GitHub, the HTML representation is unable to render, please try loading this page with nbviewer.org.
" ], "text/plain": [ "DecisionTreeClassifier()" ] }, "execution_count": 20, "metadata": {}, "output_type": "execute_result" } ], "source": [ "# Fit a decision tree on the training features and labels.\n", "# random_state is fixed because scikit-learn permutes the features at every\n", "# split, so equally good splits could otherwise yield a different tree per run.\n", "clf = tree.DecisionTreeClassifier(random_state=42)\n", "clf.fit(X, y)\n" ] }, { "cell_type": "code", "execution_count": 35, "id": "1e9b38a7", "metadata": {}, "outputs": [ { "data": { "image/svg+xml": [ "\n", "\n", "\n", "\n", "\n", "\n", "Tree\n", "\n", "\n", "\n", "0\n", "\n", "Sex_male ≤ 0.5\n", "gini = 0.473\n", "samples = 891\n", "value = [549, 342]\n", "class = Survived\n", "\n", "\n", "\n", "1\n", "\n", "Pclass ≤ 2.5\n", "gini = 0.383\n", "samples = 314\n", "value = [81, 233]\n", "class = Not Survived\n", "\n", "\n", "\n", "0->1\n", "\n", "\n", "True\n", "\n", "\n", "\n", "138\n", "\n", "Age ≤ 6.5\n", "gini = 0.306\n", "samples = 577\n", "value = [468, 109]\n", "class = Survived\n", "\n", "\n", "\n", "0->138\n", "\n", "\n", "False\n", "\n", "\n", "\n", "2\n", "\n", "Age ≤ 2.5\n", "gini = 0.1\n", "samples = 170\n", "value = [9, 161]\n", "class = Not Survived\n", "\n", "\n", "\n", "1->2\n", "\n", "\n", "\n", "\n", "\n", "45\n", "\n", "Fare ≤ 23.35\n", "gini = 0.5\n", "samples = 144\n", "value = [72, 72]\n", "class = Survived\n", "\n", "\n", "\n", "1->45\n", "\n", "\n", "\n", "\n", "\n", "3\n", "\n", "Pclass ≤ 1.5\n", "gini = 0.5\n", "samples = 2\n", "value = [1, 1]\n", "class = Survived\n", "\n", "\n", "\n", "2->3\n", "\n", "\n", "\n", "\n", "\n", "6\n", "\n", "Fare ≤ 28.856\n", "gini = 0.091\n", "samples = 168\n", "value = [8, 160]\n", "class = Not Survived\n", "\n", "\n", "\n", "2->6\n", "\n", "\n", "\n", "\n", "\n", "4\n", "\n", "gini = 0.0\n", "samples = 1\n", "value = [1, 0]\n", "class = Survived\n", "\n", "\n", "\n", "3->4\n", "\n", "\n", "\n", "\n", "\n", "5\n", "\n", "gini = 0.0\n", "samples = 1\n", "value = [0, 1]\n", "class = Not Survived\n", "\n", "\n", "\n", "3->5\n", "\n", "\n", "\n", "\n", "\n", "7\n", "\n", "Fare ≤ 28.231\n", "gini = 0.182\n", "samples = 69\n", "value = [7, 62]\n", "class = Not Survived\n", "\n", "\n", 
"\n", "6->7\n", "\n", "\n", "\n", "\n", "\n", "38\n", "\n", "Fare ≤ 149.035\n", "gini = 0.02\n", "samples = 99\n", "value = [1, 98]\n", "class = Not Survived\n", "\n", "\n", "\n", "6->38\n", "\n", "\n", "\n", "\n", "\n", "8\n", "\n", "Age ≤ 56.0\n", "gini = 0.161\n", "samples = 68\n", "value = [6, 62]\n", "class = Not Survived\n", "\n", "\n", "\n", "7->8\n", "\n", "\n", "\n", "\n", "\n", "37\n", "\n", "gini = 0.0\n", "samples = 1\n", "value = [1, 0]\n", "class = Survived\n", "\n", "\n", "\n", "7->37\n", "\n", "\n", "\n", "\n", "\n", "9\n", "\n", "SibSp ≤ 0.5\n", "gini = 0.14\n", "samples = 66\n", "value = [5, 61]\n", "class = Not Survived\n", "\n", "\n", "\n", "8->9\n", "\n", "\n", "\n", "\n", "\n", "34\n", "\n", "Pclass ≤ 1.5\n", "gini = 0.5\n", "samples = 2\n", "value = [1, 1]\n", "class = Survived\n", "\n", "\n", "\n", "8->34\n", "\n", "\n", "\n", "\n", "\n", "10\n", "\n", "Fare ≤ 13.25\n", "gini = 0.085\n", "samples = 45\n", "value = [2, 43]\n", "class = Not Survived\n", "\n", "\n", "\n", "9->10\n", "\n", "\n", "\n", "\n", "\n", "23\n", "\n", "Age ≤ 25.0\n", "gini = 0.245\n", "samples = 21\n", "value = [3, 18]\n", "class = Not Survived\n", "\n", "\n", "\n", "9->23\n", "\n", "\n", "\n", "\n", "\n", "11\n", "\n", "Fare ≤ 12.825\n", "gini = 0.147\n", "samples = 25\n", "value = [2, 23]\n", "class = Not Survived\n", "\n", "\n", "\n", "10->11\n", "\n", "\n", "\n", "\n", "\n", "22\n", "\n", "gini = 0.0\n", "samples = 20\n", "value = [0, 20]\n", "class = Not Survived\n", "\n", "\n", "\n", "10->22\n", "\n", "\n", "\n", "\n", "\n", "12\n", "\n", "gini = 0.0\n", "samples = 11\n", "value = [0, 11]\n", "class = Not Survived\n", "\n", "\n", "\n", "11->12\n", "\n", "\n", "\n", "\n", "\n", "13\n", "\n", "Age ≤ 26.0\n", "gini = 0.245\n", "samples = 14\n", "value = [2, 12]\n", "class = Not Survived\n", "\n", "\n", "\n", "11->13\n", "\n", "\n", "\n", "\n", "\n", "14\n", "\n", "Age ≤ 21.0\n", "gini = 0.444\n", "samples = 3\n", "value = [1, 2]\n", "class = Not Survived\n", "\n", 
"\n", "\n", "13->14\n", "\n", "\n", "\n", "\n", "\n", "17\n", "\n", "Age ≤ 37.0\n", "gini = 0.165\n", "samples = 11\n", "value = [1, 10]\n", "class = Not Survived\n", "\n", "\n", "\n", "13->17\n", "\n", "\n", "\n", "\n", "\n", "15\n", "\n", "gini = 0.0\n", "samples = 1\n", "value = [0, 1]\n", "class = Not Survived\n", "\n", "\n", "\n", "14->15\n", "\n", "\n", "\n", "\n", "\n", "16\n", "\n", "gini = 0.5\n", "samples = 2\n", "value = [1, 1]\n", "class = Survived\n", "\n", "\n", "\n", "14->16\n", "\n", "\n", "\n", "\n", "\n", "18\n", "\n", "gini = 0.0\n", "samples = 8\n", "value = [0, 8]\n", "class = Not Survived\n", "\n", "\n", "\n", "17->18\n", "\n", "\n", "\n", "\n", "\n", "19\n", "\n", "Age ≤ 39.0\n", "gini = 0.444\n", "samples = 3\n", "value = [1, 2]\n", "class = Not Survived\n", "\n", "\n", "\n", "17->19\n", "\n", "\n", "\n", "\n", "\n", "20\n", "\n", "gini = 0.0\n", "samples = 1\n", "value = [1, 0]\n", "class = Survived\n", "\n", "\n", "\n", "19->20\n", "\n", "\n", "\n", "\n", "\n", "21\n", "\n", "gini = 0.0\n", "samples = 2\n", "value = [0, 2]\n", "class = Not Survived\n", "\n", "\n", "\n", "19->21\n", "\n", "\n", "\n", "\n", "\n", "24\n", "\n", "gini = 0.0\n", "samples = 6\n", "value = [0, 6]\n", "class = Not Survived\n", "\n", "\n", "\n", "23->24\n", "\n", "\n", "\n", "\n", "\n", "25\n", "\n", "Age ≤ 27.5\n", "gini = 0.32\n", "samples = 15\n", "value = [3, 12]\n", "class = Not Survived\n", "\n", "\n", "\n", "23->25\n", "\n", "\n", "\n", "\n", "\n", "26\n", "\n", "Fare ≤ 17.429\n", "gini = 0.444\n", "samples = 3\n", "value = [2, 1]\n", "class = Survived\n", "\n", "\n", "\n", "25->26\n", "\n", "\n", "\n", "\n", "\n", "29\n", "\n", "Age ≤ 43.0\n", "gini = 0.153\n", "samples = 12\n", "value = [1, 11]\n", "class = Not Survived\n", "\n", "\n", "\n", "25->29\n", "\n", "\n", "\n", "\n", "\n", "27\n", "\n", "gini = 0.0\n", "samples = 1\n", "value = [0, 1]\n", "class = Not Survived\n", "\n", "\n", "\n", "26->27\n", "\n", "\n", "\n", "\n", "\n", "28\n", "\n", "gini = 
0.0\n", "samples = 2\n", "value = [2, 0]\n", "class = Survived\n", "\n", "\n", "\n", "26->28\n", "\n", "\n", "\n", "\n", "\n", "30\n", "\n", "gini = 0.0\n", "samples = 9\n", "value = [0, 9]\n", "class = Not Survived\n", "\n", "\n", "\n", "29->30\n", "\n", "\n", "\n", "\n", "\n", "31\n", "\n", "Age ≤ 44.5\n", "gini = 0.444\n", "samples = 3\n", "value = [1, 2]\n", "class = Not Survived\n", "\n", "\n", "\n", "29->31\n", "\n", "\n", "\n", "\n", "\n", "32\n", "\n", "gini = 0.0\n", "samples = 1\n", "value = [1, 0]\n", "class = Survived\n", "\n", "\n", "\n", "31->32\n", "\n", "\n", "\n", "\n", "\n", "33\n", "\n", "gini = 0.0\n", "samples = 2\n", "value = [0, 2]\n", "class = Not Survived\n", "\n", "\n", "\n", "31->33\n", "\n", "\n", "\n", "\n", "\n", "35\n", "\n", "gini = 0.0\n", "samples = 1\n", "value = [0, 1]\n", "class = Not Survived\n", "\n", "\n", "\n", "34->35\n", "\n", "\n", "\n", "\n", "\n", "36\n", "\n", "gini = 0.0\n", "samples = 1\n", "value = [1, 0]\n", "class = Survived\n", "\n", "\n", "\n", "34->36\n", "\n", "\n", "\n", "\n", "\n", "39\n", "\n", "gini = 0.0\n", "samples = 81\n", "value = [0, 81]\n", "class = Not Survived\n", "\n", "\n", "\n", "38->39\n", "\n", "\n", "\n", "\n", "\n", "40\n", "\n", "Fare ≤ 152.506\n", "gini = 0.105\n", "samples = 18\n", "value = [1, 17]\n", "class = Not Survived\n", "\n", "\n", "\n", "38->40\n", "\n", "\n", "\n", "\n", "\n", "41\n", "\n", "Age ≤ 23.5\n", "gini = 0.5\n", "samples = 2\n", "value = [1, 1]\n", "class = Survived\n", "\n", "\n", "\n", "40->41\n", "\n", "\n", "\n", "\n", "\n", "44\n", "\n", "gini = 0.0\n", "samples = 16\n", "value = [0, 16]\n", "class = Not Survived\n", "\n", "\n", "\n", "40->44\n", "\n", "\n", "\n", "\n", "\n", "42\n", "\n", "gini = 0.0\n", "samples = 1\n", "value = [0, 1]\n", "class = Not Survived\n", "\n", "\n", "\n", "41->42\n", "\n", "\n", "\n", "\n", "\n", "43\n", "\n", "gini = 0.0\n", "samples = 1\n", "value = [1, 0]\n", "class = Survived\n", "\n", "\n", "\n", "41->43\n", "\n", "\n", "\n", 
"\n", "\n", "46\n", "\n", "Age ≤ 36.5\n", "gini = 0.484\n", "samples = 117\n", "value = [48, 69]\n", "class = Not Survived\n", "\n", "\n", "\n", "45->46\n", "\n", "\n", "\n", "\n", "\n", "125\n", "\n", "Fare ≤ 32.881\n", "gini = 0.198\n", "samples = 27\n", "value = [24, 3]\n", "class = Survived\n", "\n", "\n", "\n", "45->125\n", "\n", "\n", "\n", "\n", "\n", "47\n", "\n", "Fare ≤ 7.888\n", "gini = 0.472\n", "samples = 110\n", "value = [42, 68]\n", "class = Not Survived\n", "\n", "\n", "\n", "46->47\n", "\n", "\n", "\n", "\n", "\n", "122\n", "\n", "Age ≤ 55.0\n", "gini = 0.245\n", "samples = 7\n", "value = [6, 1]\n", "class = Survived\n", "\n", "\n", "\n", "46->122\n", "\n", "\n", "\n", "\n", "\n", "48\n", "\n", "Age ≤ 29.25\n", "gini = 0.393\n", "samples = 41\n", "value = [11, 30]\n", "class = Not Survived\n", "\n", "\n", "\n", "47->48\n", "\n", "\n", "\n", "\n", "\n", "77\n", "\n", "Fare ≤ 10.825\n", "gini = 0.495\n", "samples = 69\n", "value = [31, 38]\n", "class = Not Survived\n", "\n", "\n", "\n", "47->77\n", "\n", "\n", "\n", "\n", "\n", "49\n", "\n", "Fare ≤ 6.987\n", "gini = 0.355\n", "samples = 39\n", "value = [9, 30]\n", "class = Not Survived\n", "\n", "\n", "\n", "48->49\n", "\n", "\n", "\n", "\n", "\n", "76\n", "\n", "gini = 0.0\n", "samples = 2\n", "value = [2, 0]\n", "class = Survived\n", "\n", "\n", "\n", "48->76\n", "\n", "\n", "\n", "\n", "\n", "50\n", "\n", "gini = 0.0\n", "samples = 1\n", "value = [1, 0]\n", "class = Survived\n", "\n", "\n", "\n", "49->50\n", "\n", "\n", "\n", "\n", "\n", "51\n", "\n", "Fare ≤ 7.523\n", "gini = 0.332\n", "samples = 38\n", "value = [8, 30]\n", "class = Not Survived\n", "\n", "\n", "\n", "49->51\n", "\n", "\n", "\n", "\n", "\n", "52\n", "\n", "gini = 0.0\n", "samples = 6\n", "value = [0, 6]\n", "class = Not Survived\n", "\n", "\n", "\n", "51->52\n", "\n", "\n", "\n", "\n", "\n", "53\n", "\n", "Age ≤ 15.0\n", "gini = 0.375\n", "samples = 32\n", "value = [8, 24]\n", "class = Not Survived\n", "\n", "\n", "\n", 
"51->53\n", "\n", "\n", "\n", "\n", "\n", "54\n", "\n", "gini = 0.0\n", "samples = 1\n", "value = [1, 0]\n", "class = Survived\n", "\n", "\n", "\n", "53->54\n", "\n", "\n", "\n", "\n", "\n", "55\n", "\n", "Fare ≤ 7.64\n", "gini = 0.35\n", "samples = 31\n", "value = [7, 24]\n", "class = Not Survived\n", "\n", "\n", "\n", "53->55\n", "\n", "\n", "\n", "\n", "\n", "56\n", "\n", "Age ≤ 25.5\n", "gini = 0.444\n", "samples = 3\n", "value = [2, 1]\n", "class = Survived\n", "\n", "\n", "\n", "55->56\n", "\n", "\n", "\n", "\n", "\n", "59\n", "\n", "Fare ≤ 7.781\n", "gini = 0.293\n", "samples = 28\n", "value = [5, 23]\n", "class = Not Survived\n", "\n", "\n", "\n", "55->59\n", "\n", "\n", "\n", "\n", "\n", "57\n", "\n", "gini = 0.0\n", "samples = 1\n", "value = [0, 1]\n", "class = Not Survived\n", "\n", "\n", "\n", "56->57\n", "\n", "\n", "\n", "\n", "\n", "58\n", "\n", "gini = 0.0\n", "samples = 2\n", "value = [2, 0]\n", "class = Survived\n", "\n", "\n", "\n", "56->58\n", "\n", "\n", "\n", "\n", "\n", "60\n", "\n", "Fare ≤ 7.763\n", "gini = 0.375\n", "samples = 20\n", "value = [5, 15]\n", "class = Not Survived\n", "\n", "\n", "\n", "59->60\n", "\n", "\n", "\n", "\n", "\n", "75\n", "\n", "gini = 0.0\n", "samples = 8\n", "value = [0, 8]\n", "class = Not Survived\n", "\n", "\n", "\n", "59->75\n", "\n", "\n", "\n", "\n", "\n", "61\n", "\n", "Fare ≤ 7.744\n", "gini = 0.291\n", "samples = 17\n", "value = [3, 14]\n", "class = Not Survived\n", "\n", "\n", "\n", "60->61\n", "\n", "\n", "\n", "\n", "\n", "70\n", "\n", "Age ≤ 20.0\n", "gini = 0.444\n", "samples = 3\n", "value = [2, 1]\n", "class = Survived\n", "\n", "\n", "\n", "60->70\n", "\n", "\n", "\n", "\n", "\n", "62\n", "\n", "gini = 0.0\n", "samples = 4\n", "value = [0, 4]\n", "class = Not Survived\n", "\n", "\n", "\n", "61->62\n", "\n", "\n", "\n", "\n", "\n", "63\n", "\n", "Age ≤ 21.5\n", "gini = 0.355\n", "samples = 13\n", "value = [3, 10]\n", "class = Not Survived\n", "\n", "\n", "\n", "61->63\n", "\n", "\n", "\n", "\n", 
"\n", "64\n", "\n", "Age ≤ 18.5\n", "gini = 0.5\n", "samples = 2\n", "value = [1, 1]\n", "class = Survived\n", "\n", "\n", "\n", "63->64\n", "\n", "\n", "\n", "\n", "\n", "67\n", "\n", "Age ≤ 25.0\n", "gini = 0.298\n", "samples = 11\n", "value = [2, 9]\n", "class = Not Survived\n", "\n", "\n", "\n", "63->67\n", "\n", "\n", "\n", "\n", "\n", "65\n", "\n", "gini = 0.0\n", "samples = 1\n", "value = [0, 1]\n", "class = Not Survived\n", "\n", "\n", "\n", "64->65\n", "\n", "\n", "\n", "\n", "\n", "66\n", "\n", "gini = 0.0\n", "samples = 1\n", "value = [1, 0]\n", "class = Survived\n", "\n", "\n", "\n", "64->66\n", "\n", "\n", "\n", "\n", "\n", "68\n", "\n", "gini = 0.0\n", "samples = 2\n", "value = [0, 2]\n", "class = Not Survived\n", "\n", "\n", "\n", "67->68\n", "\n", "\n", "\n", "\n", "\n", "69\n", "\n", "gini = 0.346\n", "samples = 9\n", "value = [2, 7]\n", "class = Not Survived\n", "\n", "\n", "\n", "67->69\n", "\n", "\n", "\n", "\n", "\n", "71\n", "\n", "gini = 0.0\n", "samples = 1\n", "value = [1, 0]\n", "class = Survived\n", "\n", "\n", "\n", "70->71\n", "\n", "\n", "\n", "\n", "\n", "72\n", "\n", "Age ≤ 23.5\n", "gini = 0.5\n", "samples = 2\n", "value = [1, 1]\n", "class = Survived\n", "\n", "\n", "\n", "70->72\n", "\n", "\n", "\n", "\n", "\n", "73\n", "\n", "gini = 0.0\n", "samples = 1\n", "value = [0, 1]\n", "class = Not Survived\n", "\n", "\n", "\n", "72->73\n", "\n", "\n", "\n", "\n", "\n", "74\n", "\n", "gini = 0.0\n", "samples = 1\n", "value = [1, 0]\n", "class = Survived\n", "\n", "\n", "\n", "72->74\n", "\n", "\n", "\n", "\n", "\n", "78\n", "\n", "Age ≤ 19.0\n", "gini = 0.434\n", "samples = 22\n", "value = [15, 7]\n", "class = Survived\n", "\n", "\n", "\n", "77->78\n", "\n", "\n", "\n", "\n", "\n", "91\n", "\n", "Fare ≤ 13.908\n", "gini = 0.449\n", "samples = 47\n", "value = [16, 31]\n", "class = Not Survived\n", "\n", "\n", "\n", "77->91\n", "\n", "\n", "\n", "\n", "\n", "79\n", "\n", "Fare ≤ 10.152\n", "gini = 0.32\n", "samples = 5\n", "value = [1, 
4]\n", "class = Not Survived\n", "\n", "\n", "\n", "78->79\n", "\n", "\n", "\n", "\n", "\n", "82\n", "\n", "Age ≤ 30.5\n", "gini = 0.291\n", "samples = 17\n", "value = [14, 3]\n", "class = Survived\n", "\n", "\n", "\n", "78->82\n", "\n", "\n", "\n", "\n", "\n", "80\n", "\n", "gini = 0.0\n", "samples = 4\n", "value = [0, 4]\n", "class = Not Survived\n", "\n", "\n", "\n", "79->80\n", "\n", "\n", "\n", "\n", "\n", "81\n", "\n", "gini = 0.0\n", "samples = 1\n", "value = [1, 0]\n", "class = Survived\n", "\n", "\n", "\n", "79->81\n", "\n", "\n", "\n", "\n", "\n", "83\n", "\n", "Fare ≤ 7.988\n", "gini = 0.219\n", "samples = 16\n", "value = [14, 2]\n", "class = Survived\n", "\n", "\n", "\n", "82->83\n", "\n", "\n", "\n", "\n", "\n", "90\n", "\n", "gini = 0.0\n", "samples = 1\n", "value = [0, 1]\n", "class = Not Survived\n", "\n", "\n", "\n", "82->90\n", "\n", "\n", "\n", "\n", "\n", "84\n", "\n", "Age ≤ 25.5\n", "gini = 0.48\n", "samples = 5\n", "value = [3, 2]\n", "class = Survived\n", "\n", "\n", "\n", "83->84\n", "\n", "\n", "\n", "\n", "\n", "89\n", "\n", "gini = 0.0\n", "samples = 11\n", "value = [11, 0]\n", "class = Survived\n", "\n", "\n", "\n", "83->89\n", "\n", "\n", "\n", "\n", "\n", "85\n", "\n", "gini = 0.0\n", "samples = 2\n", "value = [2, 0]\n", "class = Survived\n", "\n", "\n", "\n", "84->85\n", "\n", "\n", "\n", "\n", "\n", "86\n", "\n", "Age ≤ 27.5\n", "gini = 0.444\n", "samples = 3\n", "value = [1, 2]\n", "class = Not Survived\n", "\n", "\n", "\n", "84->86\n", "\n", "\n", "\n", "\n", "\n", "87\n", "\n", "gini = 0.0\n", "samples = 2\n", "value = [0, 2]\n", "class = Not Survived\n", "\n", "\n", "\n", "86->87\n", "\n", "\n", "\n", "\n", "\n", "88\n", "\n", "gini = 0.0\n", "samples = 1\n", "value = [1, 0]\n", "class = Survived\n", "\n", "\n", "\n", "86->88\n", "\n", "\n", "\n", "\n", "\n", "92\n", "\n", "gini = 0.0\n", "samples = 8\n", "value = [0, 8]\n", "class = Not Survived\n", "\n", "\n", "\n", "91->92\n", "\n", "\n", "\n", "\n", "\n", "93\n", "\n", "Fare 
≤ 15.373\n", "gini = 0.484\n", "samples = 39\n", "value = [16, 23]\n", "class = Not Survived\n", "\n", "\n", "\n", "91->93\n", "\n", "\n", "\n", "\n", "\n", "94\n", "\n", "Age ≤ 28.5\n", "gini = 0.32\n", "samples = 10\n", "value = [8, 2]\n", "class = Survived\n", "\n", "\n", "\n", "93->94\n", "\n", "\n", "\n", "\n", "\n", "101\n", "\n", "SibSp ≤ 2.5\n", "gini = 0.4\n", "samples = 29\n", "value = [8, 21]\n", "class = Not Survived\n", "\n", "\n", "\n", "93->101\n", "\n", "\n", "\n", "\n", "\n", "95\n", "\n", "Age ≤ 16.0\n", "gini = 0.198\n", "samples = 9\n", "value = [8, 1]\n", "class = Survived\n", "\n", "\n", "\n", "94->95\n", "\n", "\n", "\n", "\n", "\n", "100\n", "\n", "gini = 0.0\n", "samples = 1\n", "value = [0, 1]\n", "class = Not Survived\n", "\n", "\n", "\n", "94->100\n", "\n", "\n", "\n", "\n", "\n", "96\n", "\n", "Age ≤ 14.75\n", "gini = 0.444\n", "samples = 3\n", "value = [2, 1]\n", "class = Survived\n", "\n", "\n", "\n", "95->96\n", "\n", "\n", "\n", "\n", "\n", "99\n", "\n", "gini = 0.0\n", "samples = 6\n", "value = [6, 0]\n", "class = Survived\n", "\n", "\n", "\n", "95->99\n", "\n", "\n", "\n", "\n", "\n", "97\n", "\n", "gini = 0.0\n", "samples = 2\n", "value = [2, 0]\n", "class = Survived\n", "\n", "\n", "\n", "96->97\n", "\n", "\n", "\n", "\n", "\n", "98\n", "\n", "gini = 0.0\n", "samples = 1\n", "value = [0, 1]\n", "class = Not Survived\n", "\n", "\n", "\n", "96->98\n", "\n", "\n", "\n", "\n", "\n", "102\n", "\n", "Age ≤ 28.5\n", "gini = 0.355\n", "samples = 26\n", "value = [6, 20]\n", "class = Not Survived\n", "\n", "\n", "\n", "101->102\n", "\n", "\n", "\n", "\n", "\n", "119\n", "\n", "Fare ≤ 18.463\n", "gini = 0.444\n", "samples = 3\n", "value = [2, 1]\n", "class = Survived\n", "\n", "\n", "\n", "101->119\n", "\n", "\n", "\n", "\n", "\n", "103\n", "\n", "Age ≤ 27.0\n", "gini = 0.255\n", "samples = 20\n", "value = [3, 17]\n", "class = Not Survived\n", "\n", "\n", "\n", "102->103\n", "\n", "\n", "\n", "\n", "\n", "112\n", "\n", "Age ≤ 33.5\n", 
"gini = 0.5\n", "samples = 6\n", "value = [3, 3]\n", "class = Survived\n", "\n", "\n", "\n", "102->112\n", "\n", "\n", "\n", "\n", "\n", "104\n", "\n", "Age ≤ 11.5\n", "gini = 0.375\n", "samples = 12\n", "value = [3, 9]\n", "class = Not Survived\n", "\n", "\n", "\n", "103->104\n", "\n", "\n", "\n", "\n", "\n", "111\n", "\n", "gini = 0.0\n", "samples = 8\n", "value = [0, 8]\n", "class = Not Survived\n", "\n", "\n", "\n", "103->111\n", "\n", "\n", "\n", "\n", "\n", "105\n", "\n", "gini = 0.0\n", "samples = 6\n", "value = [0, 6]\n", "class = Not Survived\n", "\n", "\n", "\n", "104->105\n", "\n", "\n", "\n", "\n", "\n", "106\n", "\n", "SibSp ≤ 0.5\n", "gini = 0.5\n", "samples = 6\n", "value = [3, 3]\n", "class = Survived\n", "\n", "\n", "\n", "104->106\n", "\n", "\n", "\n", "\n", "\n", "107\n", "\n", "gini = 0.0\n", "samples = 2\n", "value = [0, 2]\n", "class = Not Survived\n", "\n", "\n", "\n", "106->107\n", "\n", "\n", "\n", "\n", "\n", "108\n", "\n", "Fare ≤ 15.975\n", "gini = 0.375\n", "samples = 4\n", "value = [3, 1]\n", "class = Survived\n", "\n", "\n", "\n", "106->108\n", "\n", "\n", "\n", "\n", "\n", "109\n", "\n", "gini = 0.0\n", "samples = 1\n", "value = [0, 1]\n", "class = Not Survived\n", "\n", "\n", "\n", "108->109\n", "\n", "\n", "\n", "\n", "\n", "110\n", "\n", "gini = 0.0\n", "samples = 3\n", "value = [3, 0]\n", "class = Survived\n", "\n", "\n", "\n", "108->110\n", "\n", "\n", "\n", "\n", "\n", "113\n", "\n", "Fare ≤ 19.262\n", "gini = 0.375\n", "samples = 4\n", "value = [3, 1]\n", "class = Survived\n", "\n", "\n", "\n", "112->113\n", "\n", "\n", "\n", "\n", "\n", "118\n", "\n", "gini = 0.0\n", "samples = 2\n", "value = [0, 2]\n", "class = Not Survived\n", "\n", "\n", "\n", "112->118\n", "\n", "\n", "\n", "\n", "\n", "114\n", "\n", "gini = 0.0\n", "samples = 2\n", "value = [2, 0]\n", "class = Survived\n", "\n", "\n", "\n", "113->114\n", "\n", "\n", "\n", "\n", "\n", "115\n", "\n", "SibSp ≤ 0.5\n", "gini = 0.5\n", "samples = 2\n", "value = [1, 1]\n", 
"class = Survived\n", "\n", "\n", "\n", "113->115\n", "\n", "\n", "\n", "\n", "\n", "116\n", "\n", "gini = 0.0\n", "samples = 1\n", "value = [1, 0]\n", "class = Survived\n", "\n", "\n", "\n", "115->116\n", "\n", "\n", "\n", "\n", "\n", "117\n", "\n", "gini = 0.0\n", "samples = 1\n", "value = [0, 1]\n", "class = Not Survived\n", "\n", "\n", "\n", "115->117\n", "\n", "\n", "\n", "\n", "\n", "120\n", "\n", "gini = 0.0\n", "samples = 1\n", "value = [0, 1]\n", "class = Not Survived\n", "\n", "\n", "\n", "119->120\n", "\n", "\n", "\n", "\n", "\n", "121\n", "\n", "gini = 0.0\n", "samples = 2\n", "value = [2, 0]\n", "class = Survived\n", "\n", "\n", "\n", "119->121\n", "\n", "\n", "\n", "\n", "\n", "123\n", "\n", "gini = 0.0\n", "samples = 6\n", "value = [6, 0]\n", "class = Survived\n", "\n", "\n", "\n", "122->123\n", "\n", "\n", "\n", "\n", "\n", "124\n", "\n", "gini = 0.0\n", "samples = 1\n", "value = [0, 1]\n", "class = Not Survived\n", "\n", "\n", "\n", "122->124\n", "\n", "\n", "\n", "\n", "\n", "126\n", "\n", "Fare ≤ 31.331\n", "gini = 0.278\n", "samples = 18\n", "value = [15, 3]\n", "class = Survived\n", "\n", "\n", "\n", "125->126\n", "\n", "\n", "\n", "\n", "\n", "137\n", "\n", "gini = 0.0\n", "samples = 9\n", "value = [9, 0]\n", "class = Survived\n", "\n", "\n", "\n", "125->137\n", "\n", "\n", "\n", "\n", "\n", "127\n", "\n", "Fare ≤ 24.808\n", "gini = 0.117\n", "samples = 16\n", "value = [15, 1]\n", "class = Survived\n", "\n", "\n", "\n", "126->127\n", "\n", "\n", "\n", "\n", "\n", "136\n", "\n", "gini = 0.0\n", "samples = 2\n", "value = [0, 2]\n", "class = Not Survived\n", "\n", "\n", "\n", "126->136\n", "\n", "\n", "\n", "\n", "\n", "128\n", "\n", "SibSp ≤ 0.5\n", "gini = 0.375\n", "samples = 4\n", "value = [3, 1]\n", "class = Survived\n", "\n", "\n", "\n", "127->128\n", "\n", "\n", "\n", "\n", "\n", "135\n", "\n", "gini = 0.0\n", "samples = 12\n", "value = [12, 0]\n", "class = Survived\n", "\n", "\n", "\n", "127->135\n", "\n", "\n", "\n", "\n", "\n", "129\n", 
"\n", "gini = 0.0\n", "samples = 1\n", "value = [1, 0]\n", "class = Survived\n", "\n", "\n", "\n", "128->129\n", "\n", "\n", "\n", "\n", "\n", "130\n", "\n", "Age ≤ 29.0\n", "gini = 0.444\n", "samples = 3\n", "value = [2, 1]\n", "class = Survived\n", "\n", "\n", "\n", "128->130\n", "\n", "\n", "\n", "\n", "\n", "131\n", "\n", "Fare ≤ 23.8\n", "gini = 0.5\n", "samples = 2\n", "value = [1, 1]\n", "class = Survived\n", "\n", "\n", "\n", "130->131\n", "\n", "\n", "\n", "\n", "\n", "134\n", "\n", "gini = 0.0\n", "samples = 1\n", "value = [1, 0]\n", "class = Survived\n", "\n", "\n", "\n", "130->134\n", "\n", "\n", "\n", "\n", "\n", "132\n", "\n", "gini = 0.0\n", "samples = 1\n", "value = [1, 0]\n", "class = Survived\n", "\n", "\n", "\n", "131->132\n", "\n", "\n", "\n", "\n", "\n", "133\n", "\n", "gini = 0.0\n", "samples = 1\n", "value = [0, 1]\n", "class = Not Survived\n", "\n", "\n", "\n", "131->133\n", "\n", "\n", "\n", "\n", "\n", "139\n", "\n", "SibSp ≤ 2.5\n", "gini = 0.444\n", "samples = 24\n", "value = [8, 16]\n", "class = Not Survived\n", "\n", "\n", "\n", "138->139\n", "\n", "\n", "\n", "\n", "\n", "146\n", "\n", "Pclass ≤ 1.5\n", "gini = 0.28\n", "samples = 553\n", "value = [460, 93]\n", "class = Survived\n", "\n", "\n", "\n", "138->146\n", "\n", "\n", "\n", "\n", "\n", "140\n", "\n", "gini = 0.0\n", "samples = 15\n", "value = [0, 15]\n", "class = Not Survived\n", "\n", "\n", "\n", "139->140\n", "\n", "\n", "\n", "\n", "\n", "141\n", "\n", "Age ≤ 2.5\n", "gini = 0.198\n", "samples = 9\n", "value = [8, 1]\n", "class = Survived\n", "\n", "\n", "\n", "139->141\n", "\n", "\n", "\n", "\n", "\n", "142\n", "\n", "gini = 0.0\n", "samples = 5\n", "value = [5, 0]\n", "class = Survived\n", "\n", "\n", "\n", "141->142\n", "\n", "\n", "\n", "\n", "\n", "143\n", "\n", "Age ≤ 3.5\n", "gini = 0.375\n", "samples = 4\n", "value = [3, 1]\n", "class = Survived\n", "\n", "\n", "\n", "141->143\n", "\n", "\n", "\n", "\n", "\n", "144\n", "\n", "gini = 0.0\n", "samples = 1\n", "value = 
[0, 1]\n", "class = Not Survived\n", "\n", "\n", "\n", "143->144\n", "\n", "\n", "\n", "\n", "\n", "145\n", "\n", "gini = 0.0\n", "samples = 3\n", "value = [3, 0]\n", "class = Survived\n", "\n", "\n", "\n", "143->145\n", "\n", "\n", "\n", "\n", "\n", "147\n", "\n", "Fare ≤ 26.144\n", "gini = 0.46\n", "samples = 120\n", "value = [77, 43]\n", "class = Survived\n", "\n", "\n", "\n", "146->147\n", "\n", "\n", "\n", "\n", "\n", "226\n", "\n", "Fare ≤ 51.698\n", "gini = 0.204\n", "samples = 433\n", "value = [383, 50]\n", "class = Survived\n", "\n", "\n", "\n", "146->226\n", "\n", "\n", "\n", "\n", "\n", "148\n", "\n", "gini = 0.0\n", "samples = 10\n", "value = [10, 0]\n", "class = Survived\n", "\n", "\n", "\n", "147->148\n", "\n", "\n", "\n", "\n", "\n", "149\n", "\n", "Age ≤ 53.0\n", "gini = 0.476\n", "samples = 110\n", "value = [67, 43]\n", "class = Survived\n", "\n", "\n", "\n", "147->149\n", "\n", "\n", "\n", "\n", "\n", "150\n", "\n", "Fare ≤ 27.135\n", "gini = 0.495\n", "samples = 89\n", "value = [49, 40]\n", "class = Survived\n", "\n", "\n", "\n", "149->150\n", "\n", "\n", "\n", "\n", "\n", "215\n", "\n", "Age ≤ 75.5\n", "gini = 0.245\n", "samples = 21\n", "value = [18, 3]\n", "class = Survived\n", "\n", "\n", "\n", "149->215\n", "\n", "\n", "\n", "\n", "\n", "151\n", "\n", "Fare ≤ 26.469\n", "gini = 0.26\n", "samples = 13\n", "value = [2, 11]\n", "class = Not Survived\n", "\n", "\n", "\n", "150->151\n", "\n", "\n", "\n", "\n", "\n", "160\n", "\n", "Fare ≤ 387.665\n", "gini = 0.472\n", "samples = 76\n", "value = [47, 29]\n", "class = Survived\n", "\n", "\n", "\n", "150->160\n", "\n", "\n", "\n", "\n", "\n", "152\n", "\n", "gini = 0.0\n", "samples = 4\n", "value = [0, 4]\n", "class = Not Survived\n", "\n", "\n", "\n", "151->152\n", "\n", "\n", "\n", "\n", "\n", "153\n", "\n", "Age ≤ 46.5\n", "gini = 0.346\n", "samples = 9\n", "value = [2, 7]\n", "class = Not Survived\n", "\n", "\n", "\n", "151->153\n", "\n", "\n", "\n", "\n", "\n", "154\n", "\n", "Age ≤ 40.0\n", 
"gini = 0.408\n", "samples = 7\n", "value = [2, 5]\n", "class = Not Survived\n", "\n", "\n", "\n", "153->154\n", "\n", "\n", "\n", "\n", "\n", "159\n", "\n", "gini = 0.0\n", "samples = 2\n", "value = [0, 2]\n", "class = Not Survived\n", "\n", "\n", "\n", "153->159\n", "\n", "\n", "\n", "\n", "\n", "155\n", "\n", "Age ≤ 31.0\n", "gini = 0.32\n", "samples = 5\n", "value = [1, 4]\n", "class = Not Survived\n", "\n", "\n", "\n", "154->155\n", "\n", "\n", "\n", "\n", "\n", "158\n", "\n", "gini = 0.5\n", "samples = 2\n", "value = [1, 1]\n", "class = Survived\n", "\n", "\n", "\n", "154->158\n", "\n", "\n", "\n", "\n", "\n", "156\n", "\n", "gini = 0.444\n", "samples = 3\n", "value = [1, 2]\n", "class = Not Survived\n", "\n", "\n", "\n", "155->156\n", "\n", "\n", "\n", "\n", "\n", "157\n", "\n", "gini = 0.0\n", "samples = 2\n", "value = [0, 2]\n", "class = Not Survived\n", "\n", "\n", "\n", "155->157\n", "\n", "\n", "\n", "\n", "\n", "161\n", "\n", "Fare ≤ 134.642\n", "gini = 0.463\n", "samples = 74\n", "value = [47, 27]\n", "class = Survived\n", "\n", "\n", "\n", "160->161\n", "\n", "\n", "\n", "\n", "\n", "214\n", "\n", "gini = 0.0\n", "samples = 2\n", "value = [0, 2]\n", "class = Not Survived\n", "\n", "\n", "\n", "160->214\n", "\n", "\n", "\n", "\n", "\n", "162\n", "\n", "Age ≤ 27.5\n", "gini = 0.481\n", "samples = 67\n", "value = [40, 27]\n", "class = Survived\n", "\n", "\n", "\n", "161->162\n", "\n", "\n", "\n", "\n", "\n", "213\n", "\n", "gini = 0.0\n", "samples = 7\n", "value = [7, 0]\n", "class = Survived\n", "\n", "\n", "\n", "161->213\n", "\n", "\n", "\n", "\n", "\n", "163\n", "\n", "Age ≤ 24.5\n", "gini = 0.426\n", "samples = 13\n", "value = [4, 9]\n", "class = Not Survived\n", "\n", "\n", "\n", "162->163\n", "\n", "\n", "\n", "\n", "\n", "172\n", "\n", "Fare ≤ 115.442\n", "gini = 0.444\n", "samples = 54\n", "value = [36, 18]\n", "class = Survived\n", "\n", "\n", "\n", "162->172\n", "\n", "\n", "\n", "\n", "\n", "164\n", "\n", "Fare ≤ 109.892\n", "gini = 0.49\n", 
"samples = 7\n", "value = [4, 3]\n", "class = Survived\n", "\n", "\n", "\n", "163->164\n", "\n", "\n", "\n", "\n", "\n", "171\n", "\n", "gini = 0.0\n", "samples = 6\n", "value = [0, 6]\n", "class = Not Survived\n", "\n", "\n", "\n", "163->171\n", "\n", "\n", "\n", "\n", "\n", "165\n", "\n", "Age ≤ 22.0\n", "gini = 0.32\n", "samples = 5\n", "value = [4, 1]\n", "class = Survived\n", "\n", "\n", "\n", "164->165\n", "\n", "\n", "\n", "\n", "\n", "170\n", "\n", "gini = 0.0\n", "samples = 2\n", "value = [0, 2]\n", "class = Not Survived\n", "\n", "\n", "\n", "164->170\n", "\n", "\n", "\n", "\n", "\n", "166\n", "\n", "gini = 0.0\n", "samples = 3\n", "value = [3, 0]\n", "class = Survived\n", "\n", "\n", "\n", "165->166\n", "\n", "\n", "\n", "\n", "\n", "167\n", "\n", "Fare ≤ 71.279\n", "gini = 0.5\n", "samples = 2\n", "value = [1, 1]\n", "class = Survived\n", "\n", "\n", "\n", "165->167\n", "\n", "\n", "\n", "\n", "\n", "168\n", "\n", "gini = 0.0\n", "samples = 1\n", "value = [0, 1]\n", "class = Not Survived\n", "\n", "\n", "\n", "167->168\n", "\n", "\n", "\n", "\n", "\n", "169\n", "\n", "gini = 0.0\n", "samples = 1\n", "value = [1, 0]\n", "class = Survived\n", "\n", "\n", "\n", "167->169\n", "\n", "\n", "\n", "\n", "\n", "173\n", "\n", "Fare ≤ 29.1\n", "gini = 0.426\n", "samples = 52\n", "value = [36, 16]\n", "class = Survived\n", "\n", "\n", "\n", "172->173\n", "\n", "\n", "\n", "\n", "\n", "212\n", "\n", "gini = 0.0\n", "samples = 2\n", "value = [0, 2]\n", "class = Not Survived\n", "\n", "\n", "\n", "172->212\n", "\n", "\n", "\n", "\n", "\n", "174\n", "\n", "gini = 0.0\n", "samples = 5\n", "value = [5, 0]\n", "class = Survived\n", "\n", "\n", "\n", "173->174\n", "\n", "\n", "\n", "\n", "\n", "175\n", "\n", "Fare ≤ 30.598\n", "gini = 0.449\n", "samples = 47\n", "value = [31, 16]\n", "class = Survived\n", "\n", "\n", "\n", "173->175\n", "\n", "\n", "\n", "\n", "\n", "176\n", "\n", "Age ≤ 28.5\n", "gini = 0.408\n", "samples = 7\n", "value = [2, 5]\n", "class = Not 
Survived\n", "\n", "\n", "\n", "175->176\n", "\n", "\n", "\n", "\n", "\n", "181\n", "\n", "SibSp ≤ 0.5\n", "gini = 0.399\n", "samples = 40\n", "value = [29, 11]\n", "class = Survived\n", "\n", "\n", "\n", "175->181\n", "\n", "\n", "\n", "\n", "\n", "177\n", "\n", "gini = 0.0\n", "samples = 3\n", "value = [0, 3]\n", "class = Not Survived\n", "\n", "\n", "\n", "176->177\n", "\n", "\n", "\n", "\n", "\n", "178\n", "\n", "Fare ≤ 30.25\n", "gini = 0.5\n", "samples = 4\n", "value = [2, 2]\n", "class = Survived\n", "\n", "\n", "\n", "176->178\n", "\n", "\n", "\n", "\n", "\n", "179\n", "\n", "gini = 0.0\n", "samples = 2\n", "value = [2, 0]\n", "class = Survived\n", "\n", "\n", "\n", "178->179\n", "\n", "\n", "\n", "\n", "\n", "180\n", "\n", "gini = 0.0\n", "samples = 2\n", "value = [0, 2]\n", "class = Not Survived\n", "\n", "\n", "\n", "178->180\n", "\n", "\n", "\n", "\n", "\n", "182\n", "\n", "Fare ≤ 37.0\n", "gini = 0.266\n", "samples = 19\n", "value = [16, 3]\n", "class = Survived\n", "\n", "\n", "\n", "181->182\n", "\n", "\n", "\n", "\n", "\n", "193\n", "\n", "Age ≤ 49.5\n", "gini = 0.472\n", "samples = 21\n", "value = [13, 8]\n", "class = Survived\n", "\n", "\n", "\n", "181->193\n", "\n", "\n", "\n", "\n", "\n", "183\n", "\n", "Fare ≤ 35.25\n", "gini = 0.469\n", "samples = 8\n", "value = [5, 3]\n", "class = Survived\n", "\n", "\n", "\n", "182->183\n", "\n", "\n", "\n", "\n", "\n", "192\n", "\n", "gini = 0.0\n", "samples = 11\n", "value = [11, 0]\n", "class = Survived\n", "\n", "\n", "\n", "182->192\n", "\n", "\n", "\n", "\n", "\n", "184\n", "\n", "Age ≤ 34.0\n", "gini = 0.32\n", "samples = 5\n", "value = [4, 1]\n", "class = Survived\n", "\n", "\n", "\n", "183->184\n", "\n", "\n", "\n", "\n", "\n", "189\n", "\n", "Age ≤ 36.5\n", "gini = 0.444\n", "samples = 3\n", "value = [1, 2]\n", "class = Not Survived\n", "\n", "\n", "\n", "183->189\n", "\n", "\n", "\n", "\n", "\n", "185\n", "\n", "gini = 0.0\n", "samples = 3\n", "value = [3, 0]\n", "class = Survived\n", "\n", "\n", 
"\n", "184->185\n", "\n", "\n", "\n", "\n", "\n", "186\n", "\n", "Age ≤ 43.5\n", "gini = 0.5\n", "samples = 2\n", "value = [1, 1]\n", "class = Survived\n", "\n", "\n", "\n", "184->186\n", "\n", "\n", "\n", "\n", "\n", "187\n", "\n", "gini = 0.0\n", "samples = 1\n", "value = [0, 1]\n", "class = Not Survived\n", "\n", "\n", "\n", "186->187\n", "\n", "\n", "\n", "\n", "\n", "188\n", "\n", "gini = 0.0\n", "samples = 1\n", "value = [1, 0]\n", "class = Survived\n", "\n", "\n", "\n", "186->188\n", "\n", "\n", "\n", "\n", "\n", "190\n", "\n", "gini = 0.0\n", "samples = 2\n", "value = [0, 2]\n", "class = Not Survived\n", "\n", "\n", "\n", "189->190\n", "\n", "\n", "\n", "\n", "\n", "191\n", "\n", "gini = 0.0\n", "samples = 1\n", "value = [1, 0]\n", "class = Survived\n", "\n", "\n", "\n", "189->191\n", "\n", "\n", "\n", "\n", "\n", "194\n", "\n", "Age ≤ 47.0\n", "gini = 0.494\n", "samples = 18\n", "value = [10, 8]\n", "class = Survived\n", "\n", "\n", "\n", "193->194\n", "\n", "\n", "\n", "\n", "\n", "211\n", "\n", "gini = 0.0\n", "samples = 3\n", "value = [3, 0]\n", "class = Survived\n", "\n", "\n", "\n", "193->211\n", "\n", "\n", "\n", "\n", "\n", "195\n", "\n", "Fare ≤ 59.087\n", "gini = 0.426\n", "samples = 13\n", "value = [9, 4]\n", "class = Survived\n", "\n", "\n", "\n", "194->195\n", "\n", "\n", "\n", "\n", "\n", "208\n", "\n", "Fare ≤ 99.994\n", "gini = 0.32\n", "samples = 5\n", "value = [1, 4]\n", "class = Not Survived\n", "\n", "\n", "\n", "194->208\n", "\n", "\n", "\n", "\n", "\n", "196\n", "\n", "Fare ≤ 52.277\n", "gini = 0.5\n", "samples = 6\n", "value = [3, 3]\n", "class = Survived\n", "\n", "\n", "\n", "195->196\n", "\n", "\n", "\n", "\n", "\n", "203\n", "\n", "Fare ≤ 86.737\n", "gini = 0.245\n", "samples = 7\n", "value = [6, 1]\n", "class = Survived\n", "\n", "\n", "\n", "195->203\n", "\n", "\n", "\n", "\n", "\n", "197\n", "\n", "gini = 0.0\n", "samples = 2\n", "value = [2, 0]\n", "class = Survived\n", "\n", "\n", "\n", "196->197\n", "\n", "\n", "\n", "\n", 
"\n", "198\n", "\n", "Fare ≤ 52.827\n", "gini = 0.375\n", "samples = 4\n", "value = [1, 3]\n", "class = Not Survived\n", "\n", "\n", "\n", "196->198\n", "\n", "\n", "\n", "\n", "\n", "199\n", "\n", "gini = 0.0\n", "samples = 2\n", "value = [0, 2]\n", "class = Not Survived\n", "\n", "\n", "\n", "198->199\n", "\n", "\n", "\n", "\n", "\n", "200\n", "\n", "Age ≤ 34.0\n", "gini = 0.5\n", "samples = 2\n", "value = [1, 1]\n", "class = Survived\n", "\n", "\n", "\n", "198->200\n", "\n", "\n", "\n", "\n", "\n", "201\n", "\n", "gini = 0.0\n", "samples = 1\n", "value = [0, 1]\n", "class = Not Survived\n", "\n", "\n", "\n", "200->201\n", "\n", "\n", "\n", "\n", "\n", "202\n", "\n", "gini = 0.0\n", "samples = 1\n", "value = [1, 0]\n", "class = Survived\n", "\n", "\n", "\n", "200->202\n", "\n", "\n", "\n", "\n", "\n", "204\n", "\n", "gini = 0.0\n", "samples = 5\n", "value = [5, 0]\n", "class = Survived\n", "\n", "\n", "\n", "203->204\n", "\n", "\n", "\n", "\n", "\n", "205\n", "\n", "Age ≤ 41.0\n", "gini = 0.5\n", "samples = 2\n", "value = [1, 1]\n", "class = Survived\n", "\n", "\n", "\n", "203->205\n", "\n", "\n", "\n", "\n", "\n", "206\n", "\n", "gini = 0.0\n", "samples = 1\n", "value = [0, 1]\n", "class = Not Survived\n", "\n", "\n", "\n", "205->206\n", "\n", "\n", "\n", "\n", "\n", "207\n", "\n", "gini = 0.0\n", "samples = 1\n", "value = [1, 0]\n", "class = Survived\n", "\n", "\n", "\n", "205->207\n", "\n", "\n", "\n", "\n", "\n", "209\n", "\n", "gini = 0.0\n", "samples = 4\n", "value = [0, 4]\n", "class = Not Survived\n", "\n", "\n", "\n", "208->209\n", "\n", "\n", "\n", "\n", "\n", "210\n", "\n", "gini = 0.0\n", "samples = 1\n", "value = [1, 0]\n", "class = Survived\n", "\n", "\n", "\n", "208->210\n", "\n", "\n", "\n", "\n", "\n", "216\n", "\n", "Fare ≤ 35.077\n", "gini = 0.18\n", "samples = 20\n", "value = [18, 2]\n", "class = Survived\n", "\n", "\n", "\n", "215->216\n", "\n", "\n", "\n", "\n", "\n", "225\n", "\n", "gini = 0.0\n", "samples = 1\n", "value = [0, 1]\n", "class 
= Not Survived\n", "\n", "\n", "\n", "215->225\n", "\n", "\n", "\n", "\n", "\n", "217\n", "\n", "gini = 0.0\n", "samples = 11\n", "value = [11, 0]\n", "class = Survived\n", "\n", "\n", "\n", "216->217\n", "\n", "\n", "\n", "\n", "\n", "218\n", "\n", "Fare ≤ 42.502\n", "gini = 0.346\n", "samples = 9\n", "value = [7, 2]\n", "class = Survived\n", "\n", "\n", "\n", "216->218\n", "\n", "\n", "\n", "\n", "\n", "219\n", "\n", "gini = 0.0\n", "samples = 1\n", "value = [0, 1]\n", "class = Not Survived\n", "\n", "\n", "\n", "218->219\n", "\n", "\n", "\n", "\n", "\n", "220\n", "\n", "SibSp ≤ 0.5\n", "gini = 0.219\n", "samples = 8\n", "value = [7, 1]\n", "class = Survived\n", "\n", "\n", "\n", "218->220\n", "\n", "\n", "\n", "\n", "\n", "221\n", "\n", "gini = 0.0\n", "samples = 5\n", "value = [5, 0]\n", "class = Survived\n", "\n", "\n", "\n", "220->221\n", "\n", "\n", "\n", "\n", "\n", "222\n", "\n", "Age ≤ 62.0\n", "gini = 0.444\n", "samples = 3\n", "value = [2, 1]\n", "class = Survived\n", "\n", "\n", "\n", "220->222\n", "\n", "\n", "\n", "\n", "\n", "223\n", "\n", "gini = 0.0\n", "samples = 1\n", "value = [0, 1]\n", "class = Not Survived\n", "\n", "\n", "\n", "222->223\n", "\n", "\n", "\n", "\n", "\n", "224\n", "\n", "gini = 0.0\n", "samples = 2\n", "value = [2, 0]\n", "class = Survived\n", "\n", "\n", "\n", "222->224\n", "\n", "\n", "\n", "\n", "\n", "227\n", "\n", "Age ≤ 13.0\n", "gini = 0.193\n", "samples = 417\n", "value = [372, 45]\n", "class = Survived\n", "\n", "\n", "\n", "226->227\n", "\n", "\n", "\n", "\n", "\n", "404\n", "\n", "Fare ≤ 63.023\n", "gini = 0.43\n", "samples = 16\n", "value = [11, 5]\n", "class = Survived\n", "\n", "\n", "\n", "226->404\n", "\n", "\n", "\n", "\n", "\n", "228\n", "\n", "SibSp ≤ 2.0\n", "gini = 0.444\n", "samples = 12\n", "value = [8, 4]\n", "class = Survived\n", "\n", "\n", "\n", "227->228\n", "\n", "\n", "\n", "\n", "\n", "235\n", "\n", "Age ≤ 32.25\n", "gini = 0.182\n", "samples = 405\n", "value = [364, 41]\n", "class = Survived\n", 
"\n", "\n", "\n", "227->235\n", "\n", "\n", "\n", "\n", "\n", "229\n", "\n", "SibSp ≤ 0.5\n", "gini = 0.32\n", "samples = 5\n", "value = [1, 4]\n", "class = Not Survived\n", "\n", "\n", "\n", "228->229\n", "\n", "\n", "\n", "\n", "\n", "234\n", "\n", "gini = 0.0\n", "samples = 7\n", "value = [7, 0]\n", "class = Survived\n", "\n", "\n", "\n", "228->234\n", "\n", "\n", "\n", "\n", "\n", "230\n", "\n", "Age ≤ 10.0\n", "gini = 0.5\n", "samples = 2\n", "value = [1, 1]\n", "class = Survived\n", "\n", "\n", "\n", "229->230\n", "\n", "\n", "\n", "\n", "\n", "233\n", "\n", "gini = 0.0\n", "samples = 3\n", "value = [0, 3]\n", "class = Not Survived\n", "\n", "\n", "\n", "229->233\n", "\n", "\n", "\n", "\n", "\n", "231\n", "\n", "gini = 0.0\n", "samples = 1\n", "value = [0, 1]\n", "class = Not Survived\n", "\n", "\n", "\n", "230->231\n", "\n", "\n", "\n", "\n", "\n", "232\n", "\n", "gini = 0.0\n", "samples = 1\n", "value = [1, 0]\n", "class = Survived\n", "\n", "\n", "\n", "230->232\n", "\n", "\n", "\n", "\n", "\n", "236\n", "\n", "Age ≤ 30.75\n", "gini = 0.206\n", "samples = 300\n", "value = [265, 35]\n", "class = Survived\n", "\n", "\n", "\n", "235->236\n", "\n", "\n", "\n", "\n", "\n", "377\n", "\n", "Fare ≤ 7.91\n", "gini = 0.108\n", "samples = 105\n", "value = [99, 6]\n", "class = Survived\n", "\n", "\n", "\n", "235->377\n", "\n", "\n", "\n", "\n", "\n", "237\n", "\n", "Fare ≤ 23.35\n", "gini = 0.185\n", "samples = 282\n", "value = [253, 29]\n", "class = Survived\n", "\n", "\n", "\n", "236->237\n", "\n", "\n", "\n", "\n", "\n", "356\n", "\n", "Fare ≤ 7.815\n", "gini = 0.444\n", "samples = 18\n", "value = [12, 6]\n", "class = Survived\n", "\n", "\n", "\n", "236->356\n", "\n", "\n", "\n", "\n", "\n", "238\n", "\n", "Fare ≤ 22.887\n", "gini = 0.195\n", "samples = 265\n", "value = [236, 29]\n", "class = Survived\n", "\n", "\n", "\n", "237->238\n", "\n", "\n", "\n", "\n", "\n", "355\n", "\n", "gini = 0.0\n", "samples = 17\n", "value = [17, 0]\n", "class = Survived\n", "\n", 
"\n", "\n", "237->355\n", "\n", "\n", "\n", "\n", "\n", "239\n", "\n", "Age ≤ 28.75\n", "gini = 0.19\n", "samples = 264\n", "value = [236, 28]\n", "class = Survived\n", "\n", "\n", "\n", "238->239\n", "\n", "\n", "\n", "\n", "\n", "354\n", "\n", "gini = 0.0\n", "samples = 1\n", "value = [0, 1]\n", "class = Not Survived\n", "\n", "\n", "\n", "238->354\n", "\n", "\n", "\n", "\n", "\n", "240\n", "\n", "Fare ≤ 15.173\n", "gini = 0.179\n", "samples = 241\n", "value = [217, 24]\n", "class = Survived\n", "\n", "\n", "\n", "239->240\n", "\n", "\n", "\n", "\n", "\n", "339\n", "\n", "Fare ≤ 10.0\n", "gini = 0.287\n", "samples = 23\n", "value = [19, 4]\n", "class = Survived\n", "\n", "\n", "\n", "239->339\n", "\n", "\n", "\n", "\n", "\n", "241\n", "\n", "Fare ≤ 7.798\n", "gini = 0.165\n", "samples = 220\n", "value = [200, 20]\n", "class = Survived\n", "\n", "\n", "\n", "240->241\n", "\n", "\n", "\n", "\n", "\n", "328\n", "\n", "Fare ≤ 15.373\n", "gini = 0.308\n", "samples = 21\n", "value = [17, 4]\n", "class = Survived\n", "\n", "\n", "\n", "240->328\n", "\n", "\n", "\n", "\n", "\n", "242\n", "\n", "Fare ≤ 7.763\n", "gini = 0.215\n", "samples = 90\n", "value = [79, 11]\n", "class = Survived\n", "\n", "\n", "\n", "241->242\n", "\n", "\n", "\n", "\n", "\n", "289\n", "\n", "Age ≤ 20.5\n", "gini = 0.129\n", "samples = 130\n", "value = [121, 9]\n", "class = Survived\n", "\n", "\n", "\n", "241->289\n", "\n", "\n", "\n", "\n", "\n", "243\n", "\n", "Fare ≤ 7.24\n", "gini = 0.169\n", "samples = 75\n", "value = [68, 7]\n", "class = Survived\n", "\n", "\n", "\n", "242->243\n", "\n", "\n", "\n", "\n", "\n", "274\n", "\n", "Age ≤ 20.0\n", "gini = 0.391\n", "samples = 15\n", "value = [11, 4]\n", "class = Survived\n", "\n", "\n", "\n", "242->274\n", "\n", "\n", "\n", "\n", "\n", "244\n", "\n", "Age ≤ 27.5\n", "gini = 0.245\n", "samples = 42\n", "value = [36, 6]\n", "class = Survived\n", "\n", "\n", "\n", "243->244\n", "\n", "\n", "\n", "\n", "\n", "267\n", "\n", "Fare ≤ 7.746\n", "gini = 
0.059\n", "samples = 33\n", "value = [32, 1]\n", "class = Survived\n", "\n", "\n", "\n", "243->267\n", "\n", "\n", "\n", "\n", "\n", "245\n", "\n", "Age ≤ 26.0\n", "gini = 0.363\n", "samples = 21\n", "value = [16, 5]\n", "class = Survived\n", "\n", "\n", "\n", "244->245\n", "\n", "\n", "\n", "\n", "\n", "262\n", "\n", "Fare ≤ 7.227\n", "gini = 0.091\n", "samples = 21\n", "value = [20, 1]\n", "class = Survived\n", "\n", "\n", "\n", "244->262\n", "\n", "\n", "\n", "\n", "\n", "246\n", "\n", "Age ≤ 19.5\n", "gini = 0.32\n", "samples = 20\n", "value = [16, 4]\n", "class = Survived\n", "\n", "\n", "\n", "245->246\n", "\n", "\n", "\n", "\n", "\n", "261\n", "\n", "gini = 0.0\n", "samples = 1\n", "value = [0, 1]\n", "class = Not Survived\n", "\n", "\n", "\n", "245->261\n", "\n", "\n", "\n", "\n", "\n", "247\n", "\n", "gini = 0.0\n", "samples = 7\n", "value = [7, 0]\n", "class = Survived\n", "\n", "\n", "\n", "246->247\n", "\n", "\n", "\n", "\n", "\n", "248\n", "\n", "Fare ≤ 2.006\n", "gini = 0.426\n", "samples = 13\n", "value = [9, 4]\n", "class = Survived\n", "\n", "\n", "\n", "246->248\n", "\n", "\n", "\n", "\n", "\n", "249\n", "\n", "gini = 0.0\n", "samples = 1\n", "value = [0, 1]\n", "class = Not Survived\n", "\n", "\n", "\n", "248->249\n", "\n", "\n", "\n", "\n", "\n", "250\n", "\n", "Fare ≤ 7.133\n", "gini = 0.375\n", "samples = 12\n", "value = [9, 3]\n", "class = Survived\n", "\n", "\n", "\n", "248->250\n", "\n", "\n", "\n", "\n", "\n", "251\n", "\n", "gini = 0.0\n", "samples = 6\n", "value = [6, 0]\n", "class = Survived\n", "\n", "\n", "\n", "250->251\n", "\n", "\n", "\n", "\n", "\n", "252\n", "\n", "Fare ≤ 7.183\n", "gini = 0.5\n", "samples = 6\n", "value = [3, 3]\n", "class = Survived\n", "\n", "\n", "\n", "250->252\n", "\n", "\n", "\n", "\n", "\n", "253\n", "\n", "gini = 0.0\n", "samples = 1\n", "value = [0, 1]\n", "class = Not Survived\n", "\n", "\n", "\n", "252->253\n", "\n", "\n", "\n", "\n", "\n", "254\n", "\n", "Age ≤ 22.75\n", "gini = 0.48\n", "samples = 
5\n", "value = [3, 2]\n", "class = Survived\n", "\n", "\n", "\n", "252->254\n", "\n", "\n", "\n", "\n", "\n", "255\n", "\n", "Age ≤ 21.0\n", "gini = 0.444\n", "samples = 3\n", "value = [1, 2]\n", "class = Not Survived\n", "\n", "\n", "\n", "254->255\n", "\n", "\n", "\n", "\n", "\n", "260\n", "\n", "gini = 0.0\n", "samples = 2\n", "value = [2, 0]\n", "class = Survived\n", "\n", "\n", "\n", "254->260\n", "\n", "\n", "\n", "\n", "\n", "256\n", "\n", "gini = 0.0\n", "samples = 1\n", "value = [0, 1]\n", "class = Not Survived\n", "\n", "\n", "\n", "255->256\n", "\n", "\n", "\n", "\n", "\n", "257\n", "\n", "Fare ≤ 7.227\n", "gini = 0.5\n", "samples = 2\n", "value = [1, 1]\n", "class = Survived\n", "\n", "\n", "\n", "255->257\n", "\n", "\n", "\n", "\n", "\n", "258\n", "\n", "gini = 0.0\n", "samples = 1\n", "value = [0, 1]\n", "class = Not Survived\n", "\n", "\n", "\n", "257->258\n", "\n", "\n", "\n", "\n", "\n", "259\n", "\n", "gini = 0.0\n", "samples = 1\n", "value = [1, 0]\n", "class = Survived\n", "\n", "\n", "\n", "257->259\n", "\n", "\n", "\n", "\n", "\n", "263\n", "\n", "gini = 0.0\n", "samples = 14\n", "value = [14, 0]\n", "class = Survived\n", "\n", "\n", "\n", "262->263\n", "\n", "\n", "\n", "\n", "\n", "264\n", "\n", "Age ≤ 28.25\n", "gini = 0.245\n", "samples = 7\n", "value = [6, 1]\n", "class = Survived\n", "\n", "\n", "\n", "262->264\n", "\n", "\n", "\n", "\n", "\n", "265\n", "\n", "gini = 0.278\n", "samples = 6\n", "value = [5, 1]\n", "class = Survived\n", "\n", "\n", "\n", "264->265\n", "\n", "\n", "\n", "\n", "\n", "266\n", "\n", "gini = 0.0\n", "samples = 1\n", "value = [1, 0]\n", "class = Survived\n", "\n", "\n", "\n", "264->266\n", "\n", "\n", "\n", "\n", "\n", "268\n", "\n", "gini = 0.0\n", "samples = 21\n", "value = [21, 0]\n", "class = Survived\n", "\n", "\n", "\n", "267->268\n", "\n", "\n", "\n", "\n", "\n", "269\n", "\n", "Age ≤ 23.0\n", "gini = 0.153\n", "samples = 12\n", "value = [11, 1]\n", "class = Survived\n", "\n", "\n", "\n", "267->269\n", 
"\n", "\n", "\n", "\n", "\n", "270\n", "\n", "gini = 0.0\n", "samples = 1\n", "value = [1, 0]\n", "class = Survived\n", "\n", "\n", "\n", "269->270\n", "\n", "\n", "\n", "\n", "\n", "271\n", "\n", "SibSp ≤ 0.5\n", "gini = 0.165\n", "samples = 11\n", "value = [10, 1]\n", "class = Survived\n", "\n", "\n", "\n", "269->271\n", "\n", "\n", "\n", "\n", "\n", "272\n", "\n", "gini = 0.18\n", "samples = 10\n", "value = [9, 1]\n", "class = Survived\n", "\n", "\n", "\n", "271->272\n", "\n", "\n", "\n", "\n", "\n", "273\n", "\n", "gini = 0.0\n", "samples = 1\n", "value = [1, 0]\n", "class = Survived\n", "\n", "\n", "\n", "271->273\n", "\n", "\n", "\n", "\n", "\n", "275\n", "\n", "gini = 0.0\n", "samples = 4\n", "value = [4, 0]\n", "class = Survived\n", "\n", "\n", "\n", "274->275\n", "\n", "\n", "\n", "\n", "\n", "276\n", "\n", "Age ≤ 26.5\n", "gini = 0.463\n", "samples = 11\n", "value = [7, 4]\n", "class = Survived\n", "\n", "\n", "\n", "274->276\n", "\n", "\n", "\n", "\n", "\n", "277\n", "\n", "Age ≤ 21.5\n", "gini = 0.408\n", "samples = 7\n", "value = [5, 2]\n", "class = Survived\n", "\n", "\n", "\n", "276->277\n", "\n", "\n", "\n", "\n", "\n", "284\n", "\n", "Age ≤ 27.5\n", "gini = 0.5\n", "samples = 4\n", "value = [2, 2]\n", "class = Survived\n", "\n", "\n", "\n", "276->284\n", "\n", "\n", "\n", "\n", "\n", "278\n", "\n", "Fare ≤ 7.785\n", "gini = 0.5\n", "samples = 2\n", "value = [1, 1]\n", "class = Survived\n", "\n", "\n", "\n", "277->278\n", "\n", "\n", "\n", "\n", "\n", "281\n", "\n", "SibSp ≤ 0.5\n", "gini = 0.32\n", "samples = 5\n", "value = [4, 1]\n", "class = Survived\n", "\n", "\n", "\n", "277->281\n", "\n", "\n", "\n", "\n", "\n", "279\n", "\n", "gini = 0.0\n", "samples = 1\n", "value = [1, 0]\n", "class = Survived\n", "\n", "\n", "\n", "278->279\n", "\n", "\n", "\n", "\n", "\n", "280\n", "\n", "gini = 0.0\n", "samples = 1\n", "value = [0, 1]\n", "class = Not Survived\n", "\n", "\n", "\n", "278->280\n", "\n", "\n", "\n", "\n", "\n", "282\n", "\n", "gini = 
0.0\n", "samples = 3\n", "value = [3, 0]\n", "class = Survived\n", "\n", "\n", "\n", "281->282\n", "\n", "\n", "\n", "\n", "\n", "283\n", "\n", "gini = 0.5\n", "samples = 2\n", "value = [1, 1]\n", "class = Survived\n", "\n", "\n", "\n", "281->283\n", "\n", "\n", "\n", "\n", "\n", "285\n", "\n", "gini = 0.0\n", "samples = 1\n", "value = [0, 1]\n", "class = Not Survived\n", "\n", "\n", "\n", "284->285\n", "\n", "\n", "\n", "\n", "\n", "286\n", "\n", "Fare ≤ 7.785\n", "gini = 0.444\n", "samples = 3\n", "value = [2, 1]\n", "class = Survived\n", "\n", "\n", "\n", "284->286\n", "\n", "\n", "\n", "\n", "\n", "287\n", "\n", "gini = 0.5\n", "samples = 2\n", "value = [1, 1]\n", "class = Survived\n", "\n", "\n", "\n", "286->287\n", "\n", "\n", "\n", "\n", "\n", "288\n", "\n", "gini = 0.0\n", "samples = 1\n", "value = [1, 0]\n", "class = Survived\n", "\n", "\n", "\n", "286->288\n", "\n", "\n", "\n", "\n", "\n", "290\n", "\n", "Fare ≤ 8.104\n", "gini = 0.251\n", "samples = 34\n", "value = [29, 5]\n", "class = Survived\n", "\n", "\n", "\n", "289->290\n", "\n", "\n", "\n", "\n", "\n", "309\n", "\n", "Fare ≤ 8.081\n", "gini = 0.08\n", "samples = 96\n", "value = [92, 4]\n", "class = Survived\n", "\n", "\n", "\n", "289->309\n", "\n", "\n", "\n", "\n", "\n", "291\n", "\n", "Fare ≤ 7.91\n", "gini = 0.408\n", "samples = 14\n", "value = [10, 4]\n", "class = Survived\n", "\n", "\n", "\n", "290->291\n", "\n", "\n", "\n", "\n", "\n", "302\n", "\n", "Pclass ≤ 2.5\n", "gini = 0.095\n", "samples = 20\n", "value = [19, 1]\n", "class = Survived\n", "\n", "\n", "\n", "290->302\n", "\n", "\n", "\n", "\n", "\n", "292\n", "\n", "gini = 0.0\n", "samples = 6\n", "value = [6, 0]\n", "class = Survived\n", "\n", "\n", "\n", "291->292\n", "\n", "\n", "\n", "\n", "\n", "293\n", "\n", "SibSp ≤ 0.5\n", "gini = 0.5\n", "samples = 8\n", "value = [4, 4]\n", "class = Survived\n", "\n", "\n", "\n", "291->293\n", "\n", "\n", "\n", "\n", "\n", "294\n", "\n", "Age ≤ 19.5\n", "gini = 0.49\n", "samples = 7\n", "value 
= [4, 3]\n", "class = Survived\n", "\n", "\n", "\n", "293->294\n", "\n", "\n", "\n", "\n", "\n", "301\n", "\n", "gini = 0.0\n", "samples = 1\n", "value = [0, 1]\n", "class = Not Survived\n", "\n", "\n", "\n", "293->301\n", "\n", "\n", "\n", "\n", "\n", "295\n", "\n", "Age ≤ 17.0\n", "gini = 0.48\n", "samples = 5\n", "value = [2, 3]\n", "class = Not Survived\n", "\n", "\n", "\n", "294->295\n", "\n", "\n", "\n", "\n", "\n", "300\n", "\n", "gini = 0.0\n", "samples = 2\n", "value = [2, 0]\n", "class = Survived\n", "\n", "\n", "\n", "294->300\n", "\n", "\n", "\n", "\n", "\n", "296\n", "\n", "gini = 0.5\n", "samples = 2\n", "value = [1, 1]\n", "class = Survived\n", "\n", "\n", "\n", "295->296\n", "\n", "\n", "\n", "\n", "\n", "297\n", "\n", "Age ≤ 18.5\n", "gini = 0.444\n", "samples = 3\n", "value = [1, 2]\n", "class = Not Survived\n", "\n", "\n", "\n", "295->297\n", "\n", "\n", "\n", "\n", "\n", "298\n", "\n", "gini = 0.0\n", "samples = 1\n", "value = [0, 1]\n", "class = Not Survived\n", "\n", "\n", "\n", "297->298\n", "\n", "\n", "\n", "\n", "\n", "299\n", "\n", "gini = 0.5\n", "samples = 2\n", "value = [1, 1]\n", "class = Survived\n", "\n", "\n", "\n", "297->299\n", "\n", "\n", "\n", "\n", "\n", "303\n", "\n", "Age ≤ 18.5\n", "gini = 0.245\n", "samples = 7\n", "value = [6, 1]\n", "class = Survived\n", "\n", "\n", "\n", "302->303\n", "\n", "\n", "\n", "\n", "\n", "308\n", "\n", "gini = 0.0\n", "samples = 13\n", "value = [13, 0]\n", "class = Survived\n", "\n", "\n", "\n", "302->308\n", "\n", "\n", "\n", "\n", "\n", "304\n", "\n", "gini = 0.0\n", "samples = 4\n", "value = [4, 0]\n", "class = Survived\n", "\n", "\n", "\n", "303->304\n", "\n", "\n", "\n", "\n", "\n", "305\n", "\n", "Fare ≤ 11.75\n", "gini = 0.444\n", "samples = 3\n", "value = [2, 1]\n", "class = Survived\n", "\n", "\n", "\n", "303->305\n", "\n", "\n", "\n", "\n", "\n", "306\n", "\n", "gini = 0.5\n", "samples = 2\n", "value = [1, 1]\n", "class = Survived\n", "\n", "\n", "\n", "305->306\n", "\n", "\n", "\n", 
"\n", "\n", "307\n", "\n", "gini = 0.0\n", "samples = 1\n", "value = [1, 0]\n", "class = Survived\n", "\n", "\n", "\n", "305->307\n", "\n", "\n", "\n", "\n", "\n", "310\n", "\n", "gini = 0.0\n", "samples = 54\n", "value = [54, 0]\n", "class = Survived\n", "\n", "\n", "\n", "309->310\n", "\n", "\n", "\n", "\n", "\n", "311\n", "\n", "Fare ≤ 8.273\n", "gini = 0.172\n", "samples = 42\n", "value = [38, 4]\n", "class = Survived\n", "\n", "\n", "\n", "309->311\n", "\n", "\n", "\n", "\n", "\n", "312\n", "\n", "gini = 0.0\n", "samples = 1\n", "value = [0, 1]\n", "class = Not Survived\n", "\n", "\n", "\n", "311->312\n", "\n", "\n", "\n", "\n", "\n", "313\n", "\n", "Age ≤ 26.5\n", "gini = 0.136\n", "samples = 41\n", "value = [38, 3]\n", "class = Survived\n", "\n", "\n", "\n", "311->313\n", "\n", "\n", "\n", "\n", "\n", "314\n", "\n", "gini = 0.0\n", "samples = 21\n", "value = [21, 0]\n", "class = Survived\n", "\n", "\n", "\n", "313->314\n", "\n", "\n", "\n", "\n", "\n", "315\n", "\n", "Fare ≤ 14.158\n", "gini = 0.255\n", "samples = 20\n", "value = [17, 3]\n", "class = Survived\n", "\n", "\n", "\n", "313->315\n", "\n", "\n", "\n", "\n", "\n", "316\n", "\n", "Fare ≤ 13.681\n", "gini = 0.337\n", "samples = 14\n", "value = [11, 3]\n", "class = Survived\n", "\n", "\n", "\n", "315->316\n", "\n", "\n", "\n", "\n", "\n", "327\n", "\n", "gini = 0.0\n", "samples = 6\n", "value = [6, 0]\n", "class = Survived\n", "\n", "\n", "\n", "315->327\n", "\n", "\n", "\n", "\n", "\n", "317\n", "\n", "Age ≤ 27.5\n", "gini = 0.26\n", "samples = 13\n", "value = [11, 2]\n", "class = Survived\n", "\n", "\n", "\n", "316->317\n", "\n", "\n", "\n", "\n", "\n", "326\n", "\n", "gini = 0.0\n", "samples = 1\n", "value = [0, 1]\n", "class = Not Survived\n", "\n", "\n", "\n", "316->326\n", "\n", "\n", "\n", "\n", "\n", "318\n", "\n", "Fare ≤ 10.831\n", "gini = 0.444\n", "samples = 3\n", "value = [2, 1]\n", "class = Survived\n", "\n", "\n", "\n", "317->318\n", "\n", "\n", "\n", "\n", "\n", "321\n", "\n", "Fare ≤ 
11.75\n", "gini = 0.18\n", "samples = 10\n", "value = [9, 1]\n", "class = Survived\n", "\n", "\n", "\n", "317->321\n", "\n", "\n", "\n", "\n", "\n", "319\n", "\n", "gini = 0.0\n", "samples = 1\n", "value = [0, 1]\n", "class = Not Survived\n", "\n", "\n", "\n", "318->319\n", "\n", "\n", "\n", "\n", "\n", "320\n", "\n", "gini = 0.0\n", "samples = 2\n", "value = [2, 0]\n", "class = Survived\n", "\n", "\n", "\n", "318->320\n", "\n", "\n", "\n", "\n", "\n", "322\n", "\n", "gini = 0.0\n", "samples = 7\n", "value = [7, 0]\n", "class = Survived\n", "\n", "\n", "\n", "321->322\n", "\n", "\n", "\n", "\n", "\n", "323\n", "\n", "Fare ≤ 13.25\n", "gini = 0.444\n", "samples = 3\n", "value = [2, 1]\n", "class = Survived\n", "\n", "\n", "\n", "321->323\n", "\n", "\n", "\n", "\n", "\n", "324\n", "\n", "gini = 0.5\n", "samples = 2\n", "value = [1, 1]\n", "class = Survived\n", "\n", "\n", "\n", "323->324\n", "\n", "\n", "\n", "\n", "\n", "325\n", "\n", "gini = 0.0\n", "samples = 1\n", "value = [1, 0]\n", "class = Survived\n", "\n", "\n", "\n", "323->325\n", "\n", "\n", "\n", "\n", "\n", "329\n", "\n", "gini = 0.0\n", "samples = 2\n", "value = [0, 2]\n", "class = Not Survived\n", "\n", "\n", "\n", "328->329\n", "\n", "\n", "\n", "\n", "\n", "330\n", "\n", "Age ≤ 27.0\n", "gini = 0.188\n", "samples = 19\n", "value = [17, 2]\n", "class = Survived\n", "\n", "\n", "\n", "328->330\n", "\n", "\n", "\n", "\n", "\n", "331\n", "\n", "Fare ≤ 15.921\n", "gini = 0.346\n", "samples = 9\n", "value = [7, 2]\n", "class = Survived\n", "\n", "\n", "\n", "330->331\n", "\n", "\n", "\n", "\n", "\n", "338\n", "\n", "gini = 0.0\n", "samples = 10\n", "value = [10, 0]\n", "class = Survived\n", "\n", "\n", "\n", "330->338\n", "\n", "\n", "\n", "\n", "\n", "332\n", "\n", "gini = 0.0\n", "samples = 1\n", "value = [0, 1]\n", "class = Not Survived\n", "\n", "\n", "\n", "331->332\n", "\n", "\n", "\n", "\n", "\n", "333\n", "\n", "Age ≤ 25.5\n", "gini = 0.219\n", "samples = 8\n", "value = [7, 1]\n", "class = 
Survived\n", "\n", "\n", "\n", "331->333\n", "\n", "\n", "\n", "\n", "\n", "334\n", "\n", "gini = 0.0\n", "samples = 6\n", "value = [6, 0]\n", "class = Survived\n", "\n", "\n", "\n", "333->334\n", "\n", "\n", "\n", "\n", "\n", "335\n", "\n", "SibSp ≤ 0.5\n", "gini = 0.5\n", "samples = 2\n", "value = [1, 1]\n", "class = Survived\n", "\n", "\n", "\n", "333->335\n", "\n", "\n", "\n", "\n", "\n", "336\n", "\n", "gini = 0.0\n", "samples = 1\n", "value = [0, 1]\n", "class = Not Survived\n", "\n", "\n", "\n", "335->336\n", "\n", "\n", "\n", "\n", "\n", "337\n", "\n", "gini = 0.0\n", "samples = 1\n", "value = [1, 0]\n", "class = Survived\n", "\n", "\n", "\n", "335->337\n", "\n", "\n", "\n", "\n", "\n", "340\n", "\n", "Fare ≤ 9.492\n", "gini = 0.375\n", "samples = 16\n", "value = [12, 4]\n", "class = Survived\n", "\n", "\n", "\n", "339->340\n", "\n", "\n", "\n", "\n", "\n", "353\n", "\n", "gini = 0.0\n", "samples = 7\n", "value = [7, 0]\n", "class = Survived\n", "\n", "\n", "\n", "339->353\n", "\n", "\n", "\n", "\n", "\n", "341\n", "\n", "Age ≤ 29.5\n", "gini = 0.245\n", "samples = 14\n", "value = [12, 2]\n", "class = Survived\n", "\n", "\n", "\n", "340->341\n", "\n", "\n", "\n", "\n", "\n", "352\n", "\n", "gini = 0.0\n", "samples = 2\n", "value = [0, 2]\n", "class = Not Survived\n", "\n", "\n", "\n", "340->352\n", "\n", "\n", "\n", "\n", "\n", "342\n", "\n", "Fare ≤ 7.973\n", "gini = 0.408\n", "samples = 7\n", "value = [5, 2]\n", "class = Survived\n", "\n", "\n", "\n", "341->342\n", "\n", "\n", "\n", "\n", "\n", "351\n", "\n", "gini = 0.0\n", "samples = 7\n", "value = [7, 0]\n", "class = Survived\n", "\n", "\n", "\n", "341->351\n", "\n", "\n", "\n", "\n", "\n", "343\n", "\n", "Fare ≤ 7.885\n", "gini = 0.48\n", "samples = 5\n", "value = [3, 2]\n", "class = Survived\n", "\n", "\n", "\n", "342->343\n", "\n", "\n", "\n", "\n", "\n", "350\n", "\n", "gini = 0.0\n", "samples = 2\n", "value = [2, 0]\n", "class = Survived\n", "\n", "\n", "\n", "342->350\n", "\n", "\n", "\n", "\n", 
"\n", "344\n", "\n", "Fare ≤ 7.763\n", "gini = 0.375\n", "samples = 4\n", "value = [3, 1]\n", "class = Survived\n", "\n", "\n", "\n", "343->344\n", "\n", "\n", "\n", "\n", "\n", "349\n", "\n", "gini = 0.0\n", "samples = 1\n", "value = [0, 1]\n", "class = Not Survived\n", "\n", "\n", "\n", "343->349\n", "\n", "\n", "\n", "\n", "\n", "345\n", "\n", "SibSp ≤ 0.5\n", "gini = 0.5\n", "samples = 2\n", "value = [1, 1]\n", "class = Survived\n", "\n", "\n", "\n", "344->345\n", "\n", "\n", "\n", "\n", "\n", "348\n", "\n", "gini = 0.0\n", "samples = 2\n", "value = [2, 0]\n", "class = Survived\n", "\n", "\n", "\n", "344->348\n", "\n", "\n", "\n", "\n", "\n", "346\n", "\n", "gini = 0.0\n", "samples = 1\n", "value = [0, 1]\n", "class = Not Survived\n", "\n", "\n", "\n", "345->346\n", "\n", "\n", "\n", "\n", "\n", "347\n", "\n", "gini = 0.0\n", "samples = 1\n", "value = [1, 0]\n", "class = Survived\n", "\n", "\n", "\n", "345->347\n", "\n", "\n", "\n", "\n", "\n", "357\n", "\n", "gini = 0.0\n", "samples = 3\n", "value = [3, 0]\n", "class = Survived\n", "\n", "\n", "\n", "356->357\n", "\n", "\n", "\n", "\n", "\n", "358\n", "\n", "Fare ≤ 7.875\n", "gini = 0.48\n", "samples = 15\n", "value = [9, 6]\n", "class = Survived\n", "\n", "\n", "\n", "356->358\n", "\n", "\n", "\n", "\n", "\n", "359\n", "\n", "gini = 0.0\n", "samples = 1\n", "value = [0, 1]\n", "class = Not Survived\n", "\n", "\n", "\n", "358->359\n", "\n", "\n", "\n", "\n", "\n", "360\n", "\n", "Fare ≤ 26.125\n", "gini = 0.459\n", "samples = 14\n", "value = [9, 5]\n", "class = Survived\n", "\n", "\n", "\n", "358->360\n", "\n", "\n", "\n", "\n", "\n", "361\n", "\n", "Fare ≤ 20.925\n", "gini = 0.486\n", "samples = 12\n", "value = [7, 5]\n", "class = Survived\n", "\n", "\n", "\n", "360->361\n", "\n", "\n", "\n", "\n", "\n", "376\n", "\n", "gini = 0.0\n", "samples = 2\n", "value = [2, 0]\n", "class = Survived\n", "\n", "\n", "\n", "360->376\n", "\n", "\n", "\n", "\n", "\n", "362\n", "\n", "Age ≤ 31.5\n", "gini = 0.463\n", 
"samples = 11\n", "value = [7, 4]\n", "class = Survived\n", "\n", "\n", "\n", "361->362\n", "\n", "\n", "\n", "\n", "\n", "375\n", "\n", "gini = 0.0\n", "samples = 1\n", "value = [0, 1]\n", "class = Not Survived\n", "\n", "\n", "\n", "361->375\n", "\n", "\n", "\n", "\n", "\n", "363\n", "\n", "Fare ≤ 9.213\n", "gini = 0.444\n", "samples = 3\n", "value = [1, 2]\n", "class = Not Survived\n", "\n", "\n", "\n", "362->363\n", "\n", "\n", "\n", "\n", "\n", "368\n", "\n", "Fare ≤ 8.206\n", "gini = 0.375\n", "samples = 8\n", "value = [6, 2]\n", "class = Survived\n", "\n", "\n", "\n", "362->368\n", "\n", "\n", "\n", "\n", "\n", "364\n", "\n", "gini = 0.0\n", "samples = 1\n", "value = [0, 1]\n", "class = Not Survived\n", "\n", "\n", "\n", "363->364\n", "\n", "\n", "\n", "\n", "\n", "365\n", "\n", "Fare ≤ 11.75\n", "gini = 0.5\n", "samples = 2\n", "value = [1, 1]\n", "class = Survived\n", "\n", "\n", "\n", "363->365\n", "\n", "\n", "\n", "\n", "\n", "366\n", "\n", "gini = 0.0\n", "samples = 1\n", "value = [1, 0]\n", "class = Survived\n", "\n", "\n", "\n", "365->366\n", "\n", "\n", "\n", "\n", "\n", "367\n", "\n", "gini = 0.0\n", "samples = 1\n", "value = [0, 1]\n", "class = Not Survived\n", "\n", "\n", "\n", "365->367\n", "\n", "\n", "\n", "\n", "\n", "369\n", "\n", "Fare ≤ 7.988\n", "gini = 0.48\n", "samples = 5\n", "value = [3, 2]\n", "class = Survived\n", "\n", "\n", "\n", "368->369\n", "\n", "\n", "\n", "\n", "\n", "374\n", "\n", "gini = 0.0\n", "samples = 3\n", "value = [3, 0]\n", "class = Survived\n", "\n", "\n", "\n", "368->374\n", "\n", "\n", "\n", "\n", "\n", "370\n", "\n", "Fare ≤ 7.91\n", "gini = 0.375\n", "samples = 4\n", "value = [3, 1]\n", "class = Survived\n", "\n", "\n", "\n", "369->370\n", "\n", "\n", "\n", "\n", "\n", "373\n", "\n", "gini = 0.0\n", "samples = 1\n", "value = [0, 1]\n", "class = Not Survived\n", "\n", "\n", "\n", "369->373\n", "\n", "\n", "\n", "\n", "\n", "371\n", "\n", "gini = 0.0\n", "samples = 1\n", "value = [1, 0]\n", "class = Survived\n", 
"\n", "\n", "\n", "370->371\n", "\n", "\n", "\n", "\n", "\n", "372\n", "\n", "gini = 0.444\n", "samples = 3\n", "value = [2, 1]\n", "class = Survived\n", "\n", "\n", "\n", "370->372\n", "\n", "\n", "\n", "\n", "\n", "378\n", "\n", "gini = 0.0\n", "samples = 32\n", "value = [32, 0]\n", "class = Survived\n", "\n", "\n", "\n", "377->378\n", "\n", "\n", "\n", "\n", "\n", "379\n", "\n", "Fare ≤ 7.988\n", "gini = 0.151\n", "samples = 73\n", "value = [67, 6]\n", "class = Survived\n", "\n", "\n", "\n", "377->379\n", "\n", "\n", "\n", "\n", "\n", "380\n", "\n", "SibSp ≤ 1.0\n", "gini = 0.5\n", "samples = 4\n", "value = [2, 2]\n", "class = Survived\n", "\n", "\n", "\n", "379->380\n", "\n", "\n", "\n", "\n", "\n", "385\n", "\n", "Age ≤ 61.0\n", "gini = 0.109\n", "samples = 69\n", "value = [65, 4]\n", "class = Survived\n", "\n", "\n", "\n", "379->385\n", "\n", "\n", "\n", "\n", "\n", "381\n", "\n", "Age ≤ 41.5\n", "gini = 0.444\n", "samples = 3\n", "value = [1, 2]\n", "class = Not Survived\n", "\n", "\n", "\n", "380->381\n", "\n", "\n", "\n", "\n", "\n", "384\n", "\n", "gini = 0.0\n", "samples = 1\n", "value = [1, 0]\n", "class = Survived\n", "\n", "\n", "\n", "380->384\n", "\n", "\n", "\n", "\n", "\n", "382\n", "\n", "gini = 0.5\n", "samples = 2\n", "value = [1, 1]\n", "class = Survived\n", "\n", "\n", "\n", "381->382\n", "\n", "\n", "\n", "\n", "\n", "383\n", "\n", "gini = 0.0\n", "samples = 1\n", "value = [0, 1]\n", "class = Not Survived\n", "\n", "\n", "\n", "381->383\n", "\n", "\n", "\n", "\n", "\n", "386\n", "\n", "Fare ≤ 13.25\n", "gini = 0.087\n", "samples = 66\n", "value = [63, 3]\n", "class = Survived\n", "\n", "\n", "\n", "385->386\n", "\n", "\n", "\n", "\n", "\n", "401\n", "\n", "Age ≤ 64.0\n", "gini = 0.444\n", "samples = 3\n", "value = [2, 1]\n", "class = Survived\n", "\n", "\n", "\n", "385->401\n", "\n", "\n", "\n", "\n", "\n", "387\n", "\n", "Fare ≤ 12.938\n", "gini = 0.157\n", "samples = 35\n", "value = [32, 3]\n", "class = Survived\n", "\n", "\n", "\n", 
"386->387\n", "\n", "\n", "\n", "\n", "\n", "400\n", "\n", "gini = 0.0\n", "samples = 31\n", "value = [31, 0]\n", "class = Survived\n", "\n", "\n", "\n", "386->400\n", "\n", "\n", "\n", "\n", "\n", "388\n", "\n", "Age ≤ 44.5\n", "gini = 0.08\n", "samples = 24\n", "value = [23, 1]\n", "class = Survived\n", "\n", "\n", "\n", "387->388\n", "\n", "\n", "\n", "\n", "\n", "393\n", "\n", "Age ≤ 45.0\n", "gini = 0.298\n", "samples = 11\n", "value = [9, 2]\n", "class = Survived\n", "\n", "\n", "\n", "387->393\n", "\n", "\n", "\n", "\n", "\n", "389\n", "\n", "gini = 0.0\n", "samples = 17\n", "value = [17, 0]\n", "class = Survived\n", "\n", "\n", "\n", "388->389\n", "\n", "\n", "\n", "\n", "\n", "390\n", "\n", "Age ≤ 46.0\n", "gini = 0.245\n", "samples = 7\n", "value = [6, 1]\n", "class = Survived\n", "\n", "\n", "\n", "388->390\n", "\n", "\n", "\n", "\n", "\n", "391\n", "\n", "gini = 0.0\n", "samples = 1\n", "value = [0, 1]\n", "class = Not Survived\n", "\n", "\n", "\n", "390->391\n", "\n", "\n", "\n", "\n", "\n", "392\n", "\n", "gini = 0.0\n", "samples = 6\n", "value = [6, 0]\n", "class = Survived\n", "\n", "\n", "\n", "390->392\n", "\n", "\n", "\n", "\n", "\n", "394\n", "\n", "Age ≤ 40.5\n", "gini = 0.375\n", "samples = 8\n", "value = [6, 2]\n", "class = Survived\n", "\n", "\n", "\n", "393->394\n", "\n", "\n", "\n", "\n", "\n", "399\n", "\n", "gini = 0.0\n", "samples = 3\n", "value = [3, 0]\n", "class = Survived\n", "\n", "\n", "\n", "393->399\n", "\n", "\n", "\n", "\n", "\n", "395\n", "\n", "Age ≤ 35.0\n", "gini = 0.278\n", "samples = 6\n", "value = [5, 1]\n", "class = Survived\n", "\n", "\n", "\n", "394->395\n", "\n", "\n", "\n", "\n", "\n", "398\n", "\n", "gini = 0.5\n", "samples = 2\n", "value = [1, 1]\n", "class = Survived\n", "\n", "\n", "\n", "394->398\n", "\n", "\n", "\n", "\n", "\n", "396\n", "\n", "gini = 0.444\n", "samples = 3\n", "value = [2, 1]\n", "class = Survived\n", "\n", "\n", "\n", "395->396\n", "\n", "\n", "\n", "\n", "\n", "397\n", "\n", "gini = 
0.0\n", "samples = 3\n", "value = [3, 0]\n", "class = Survived\n", "\n", "\n", "\n", "395->397\n", "\n", "\n", "\n", "\n", "\n", "402\n", "\n", "gini = 0.0\n", "samples = 1\n", "value = [0, 1]\n", "class = Not Survived\n", "\n", "\n", "\n", "401->402\n", "\n", "\n", "\n", "\n", "\n", "403\n", "\n", "gini = 0.0\n", "samples = 2\n", "value = [2, 0]\n", "class = Survived\n", "\n", "\n", "\n", "401->403\n", "\n", "\n", "\n", "\n", "\n", "405\n", "\n", "Age ≤ 30.0\n", "gini = 0.408\n", "samples = 7\n", "value = [2, 5]\n", "class = Not Survived\n", "\n", "\n", "\n", "404->405\n", "\n", "\n", "\n", "\n", "\n", "410\n", "\n", "gini = 0.0\n", "samples = 9\n", "value = [9, 0]\n", "class = Survived\n", "\n", "\n", "\n", "404->410\n", "\n", "\n", "\n", "\n", "\n", "406\n", "\n", "Age ≤ 27.0\n", "gini = 0.48\n", "samples = 5\n", "value = [2, 3]\n", "class = Not Survived\n", "\n", "\n", "\n", "405->406\n", "\n", "\n", "\n", "\n", "\n", "409\n", "\n", "gini = 0.0\n", "samples = 2\n", "value = [0, 2]\n", "class = Not Survived\n", "\n", "\n", "\n", "405->409\n", "\n", "\n", "\n", "\n", "\n", "407\n", "\n", "gini = 0.0\n", "samples = 1\n", "value = [0, 1]\n", "class = Not Survived\n", "\n", "\n", "\n", "406->407\n", "\n", "\n", "\n", "\n", "\n", "408\n", "\n", "gini = 0.5\n", "samples = 4\n", "value = [2, 2]\n", "class = Survived\n", "\n", "\n", "\n", "406->408\n", "\n", "\n", "\n", "\n", "\n" ], "text/plain": [ "" ] }, "execution_count": 35, "metadata": {}, "output_type": "execute_result" } ], "source": [ "import graphviz \n", "from PIL import Image\n", "dot_data = tree.export_graphviz(clf, out_file=None) \n", "graph = graphviz.Source(dot_data) \n", "graph.render(\"Titanic\") \n", "\n", "dot_data = tree.export_graphviz(clf, out_file=None, \n", " feature_names=data_train.columns.values, \n", " class_names=['Survived','Not Survived'], \n", " filled=True, rounded=True, \n", " special_characters=True) \n", "graph = graphviz.Source(dot_data) \n", "graph " ] }, { "cell_type": "code", 
"execution_count": 22, "id": "8ad7b604", "metadata": {}, "outputs": [ { "data": { "text/plain": [ "0.978675645342312" ] }, "execution_count": 22, "metadata": {}, "output_type": "execute_result" } ], "source": [ "# Make predictions and store in 'Survived' column of df_test\n", "Y_pred = clf.predict(test)\n", "df_test['Survived'] = Y_pred\n", "clf.score(X, y)" ] }, { "cell_type": "code", "execution_count": 23, "id": "0d0f2be2", "metadata": {}, "outputs": [], "source": [ "df_test[['PassengerId', 'Survived']].to_csv('C:/Users/User/Desktop/dt.csv', index=False)" ] }, { "cell_type": "code", "execution_count": 34, "id": "ae505ffa", "metadata": {}, "outputs": [ { "data": { "text/plain": [ "'Source.gv.pdf'" ] }, "execution_count": 34, "metadata": {}, "output_type": "execute_result" } ], "source": [ "src = graphviz.Source(dot_data)\n", "src.view()" ] }, { "cell_type": "code", "execution_count": null, "id": "e046624a", "metadata": {}, "outputs": [], "source": [] } ], "metadata": { "kernelspec": { "display_name": "ml", "language": "python", "name": "ml" }, "language_info": { "codemirror_mode": { "name": "ipython", "version": 3 }, "file_extension": ".py", "mimetype": "text/x-python", "name": "python", "nbconvert_exporter": "python", "pygments_lexer": "ipython3", "version": "3.9.15" } }, "nbformat": 4, "nbformat_minor": 5 }