Decision Tree and EDA With Functions: Import Pandas As PD
Decision Tree and EDA With Functions: Import Pandas As PD
In [56]: data.head()
Out[56]:
Boat Unnamed:
Name Age Class/Dept Ticket Joined Job
[Body] 7
AB??-AL-
MUN??, Mr 3rd Class 2699?18
0 27 Cherbourg ? 15? NaN
N??s??f Passenger 15s 9d
Q??sim
ABBOTT,
3rd Class CA2673?
2 Mrs Rhoda 39 Southampton ? A? NaN
Passenger 20 5s
Mary 'Rosa'
ABBOTT, Mr
3rd Class CA2673?
3 Rossmore 16 Southampton Jeweller ? ?[190] NaN
Passenger 20 5s
Edward
ABBOTT, Mr
3rd Class CA2673?
4 Eugene 13 Southampton Scholar ? ?? NaN
Passenger 20 5s
Joseph
file:///D:/KOMAL/SIMPLILEARN/MY%20COURSES/IN%20PROGRESS/My%20Codes_ML_DS/pdf%20conversion/htmls/komal_DT1_EDAWithFunctio… 1/9
9/20/2018 komal_DT1_EDAWithFunctions_Titanic
data['Age'] = data['Age'].apply(pd.to_numeric,errors='coerce')
data.head()
Out[58]:
Boat Unnamed:
Name Age Class/Dept Ticket Joined Job
[Body] 7
AB -AL-
3rd Class 2699?18
0 MUN , Mr N 27.0 Cherbourg ? 15 NaN
Passenger 15s 9d
s f Q sim
ABBOTT,
3rd Class CA2673?
2 Mrs Rhoda 39.0 Southampton ? A NaN
Passenger 20 5s
Mary 'Rosa'
ABBOTT, Mr
3rd Class CA2673?
3 Rossmore 16.0 Southampton Jeweller ? [190] NaN
Passenger 20 5s
Edward
ABBOTT, Mr
3rd Class CA2673?
4 Eugene 13.0 Southampton Scholar ? NaN
Passenger 20 5s
Joseph
Out[59]:
Name Age Class/Dept Boat [Body]
file:///D:/KOMAL/SIMPLILEARN/MY%20COURSES/IN%20PROGRESS/My%20Codes_ML_DS/pdf%20conversion/htmls/komal_DT1_EDAWithFunctio… 2/9
9/20/2018 komal_DT1_EDAWithFunctions_Titanic
data["Crew/Pass"]=data["Class/Dept"].apply(checkPass)
data.head()
Out[60]:
Name Age Class/Dept Boat [Body] Crew/Pass
2 ABBOTT, Mrs Rhoda Mary 'Rosa' 39.0 3rd Class Passenger A Passenger
data['Class'] = data['Class/Dept'].apply(class_person)
data.head()
Out[61]:
Boat
Name Age Class/Dept Crew/Pass Class
[Body]
3rd Class
0 AB -AL-MUN , Mr N s f Q sim 27.0 15 Passenger 3rd
Passenger
3rd Class
1 ABBING, Mr Anthony 42.0 Passenger 3rd
Passenger
3rd Class
4 ABBOTT, Mr Eugene Joseph 13.0 Passenger 3rd
Passenger
file:///D:/KOMAL/SIMPLILEARN/MY%20COURSES/IN%20PROGRESS/My%20Codes_ML_DS/pdf%20conversion/htmls/komal_DT1_EDAWithFunctio… 3/9
9/20/2018 komal_DT1_EDAWithFunctions_Titanic
data['Adult/Child'] = data['Age'].apply(child_class)
data.head()
Out[62]:
Boat
Name Age Class/Dept Crew/Pass Class Adult/Child
[Body]
3rd Class
1 ABBING, Mr Anthony 42.0 Passenger 3rd adult
Passenger
file:///D:/KOMAL/SIMPLILEARN/MY%20COURSES/IN%20PROGRESS/My%20Codes_ML_DS/pdf%20conversion/htmls/komal_DT1_EDAWithFunctio… 4/9
9/20/2018 komal_DT1_EDAWithFunctions_Titanic
data['Gender'] = data['Name'].apply(gender_determiner)
data.head()
Out[63]:
Boat
Name Age Class/Dept Crew/Pass Class Adult/Child Gender
[Body]
ABBOTT, Mrs
3rd Class
2 Rhoda Mary 39.0 A Passenger 3rd adult Female
Passenger
'Rosa'
ABBOTT, Mr
3rd Class
3 Rossmore 16.0 [190] Passenger 3rd child Male
Passenger
Edward
file:///D:/KOMAL/SIMPLILEARN/MY%20COURSES/IN%20PROGRESS/My%20Codes_ML_DS/pdf%20conversion/htmls/komal_DT1_EDAWithFunctio… 5/9
9/20/2018 komal_DT1_EDAWithFunctions_Titanic
data["Survival"]=data["Boat [Body]"].apply(checkSurvival)
data.head()
Out[65]:
Boat
Name Age Class/Dept Crew/Pass Class Adult/Child Gender Survival
[Body]
AB -AL-
MUN , Mr 3rd Class
0 27.0 15 Passenger 3rd adult Male 1
NsfQ Passenger
sim
ABBING,
3rd Class
1 Mr 42.0 Passenger 3rd adult Male 1
Passenger
Anthony
ABBOTT,
Mrs
3rd Class
2 Rhoda 39.0 A Passenger 3rd adult Female 1
Passenger
Mary
'Rosa'
ABBOTT,
Mr 3rd Class
3 16.0 [190] Passenger 3rd child Male 0
Rossmore Passenger
Edward
ABBOTT,
Mr 3rd Class
4 13.0 Passenger 3rd child Male 1
Eugene Passenger
Joseph
In [67]: data.groupby(['Crew/Pass'])['Survival'].sum()*100/data.groupby(['Crew/Pass'])[
'Survival'].count()
Out[67]: Crew/Pass
Crew 90.217391
Passenger 90.310651
Name: Survival, dtype: float64
file:///D:/KOMAL/SIMPLILEARN/MY%20COURSES/IN%20PROGRESS/My%20Codes_ML_DS/pdf%20conversion/htmls/komal_DT1_EDAWithFunctio… 6/9
9/20/2018 komal_DT1_EDAWithFunctions_Titanic
compare("Class",data)
Out[69]: Class
1st 89.714286
2nd 88.395904
3rd 91.396333
crew 90.217391
Name: Survival, dtype: float64
In [70]: compare("Gender",data)
Out[70]: Gender
Female 95.840555
Male 88.557743
Name: Survival, dtype: float64
In [71]: compare("Adult/Child",data)
Out[71]: Adult/Child
adult 89.699955
child 95.964126
Name: Survival, dtype: float64
In [72]: trainingData=data[["Age","Crew/Pass","Class","Adult/Child","Gender","Survival"
]]
trainingData.head()
Out[72]:
Age Crew/Pass Class Adult/Child Gender Survival
file:///D:/KOMAL/SIMPLILEARN/MY%20COURSES/IN%20PROGRESS/My%20Codes_ML_DS/pdf%20conversion/htmls/komal_DT1_EDAWithFunctio… 7/9
9/20/2018 komal_DT1_EDAWithFunctions_Titanic
catData=trainingData[["Crew/Pass","Class","Adult/Child","Gender"]].apply(catTo
Num)
trainingData[["Crew/Pass","Class","Adult/Child","Gender"]]=catData
trainingData.head()
C:\Users\hariz\Anaconda3\lib\site-packages\pandas\core\frame.py:3137: Setting
WithCopyWarning:
A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead
0 27.0 1 2 0 1 1
1 42.0 1 2 0 1 1
2 39.0 1 2 0 0 1
3 16.0 1 2 1 1 0
4 13.0 1 2 1 1 1
In [74]: len(trainingData)
Out[74]: 2456
Out[75]: 2426
In [77]: len(train)
Out[77]: 1940
In [78]: len(test)
Out[78]: 486
file:///D:/KOMAL/SIMPLILEARN/MY%20COURSES/IN%20PROGRESS/My%20Codes_ML_DS/pdf%20conversion/htmls/komal_DT1_EDAWithFunctio… 8/9
9/20/2018 komal_DT1_EDAWithFunctions_Titanic
In [81]: clf
In [82]: clf.feature_importances_
Out[89]: 0.8847736625514403
file:///D:/KOMAL/SIMPLILEARN/MY%20COURSES/IN%20PROGRESS/My%20Codes_ML_DS/pdf%20conversion/htmls/komal_DT1_EDAWithFunctio… 9/9