生活随笔
收集整理的這篇文章主要介紹了
泰坦尼克灾难-可视化
小編覺得挺不錯的,現(xiàn)在分享給大家,幫大家做個參考.
前言:沒有具體的解釋,只有步驟,需要熟練哦
df
['Embarked']=df
['Embarked'].fillna
('S')
age_mean
= df
['Age'].mean
()
df
['Age'] = df
['Age'].fillna
(age_mean
)
def sex2value(Sex
):if Sex
=='male':return 1else:return 0df
['Sex']=df
['Sex'].apply(sex2value
)
survice_passenger_df
=df
[df
['Survived']==1]
survice_passenger_df
.head
(10)
np
.warnings
.filterwarnings
('ignore', category
=np
.VisibleDeprecationWarning
)
df_sexl
=df
['Sex'][df
['Survived']==1]
df_sex0
=df
['Sex'][df
['Survived']==0]
plt
.hist
([df_sexl
,df_sex0
],stacked
=True,label
=['Rescued','not saved'])
plt
.xticks
([-1,0,1,2],[-1,'F','M',2])
plt
.legend
()
plt
.title
('Sex_Survived')
df_classl
=df
['Pclass'][df
['Survived']==1]
df_class0
=df
['Pclass'][df
['Survived']==0]
plt
.hist
([df_classl
,df_class0
],stacked
=True,label
=['Rescued','not saved'])
plt
.xticks
([1,2,3],['Upper','Middle','lower'])
plt
.legend
()
plt
.title
('Pclass_Survived')
df_Agel
= df
['Age'][df
['Survived']==1]
df_Age0
= df
['Age'][df
['Survived']==0]
plt
.hist
([df_Agel
,df_Age0
],stacked
=True,label
=['Rescued','not saved'])
plt
.legend
()
plt
.title
('Age_Survived')
def age_duan(age
):if age
<=18:return 1elif age
<=40:return 2else:return 3
df
['Age']=df
['Age'].apply(age_duan
)
df_sex1
=df
['Age'][df
['Survived']==1]
df_sex0
=df
['Age'][df
['Survived']==0]
plt
.hist
([df_sex1
,df_sex0
],stacked
=True,label
=['Rescued','not saved'])
plt
.xticks
([1,2,3],['child','youth','elderly'])
plt
.legend
()
plt
.title
('Age_Survived')
group_all
=df
.groupby
(['Sex','Pclass']).count
()['PassengerId']
survives_passenger_df
=df
[df
['Survived']==1]
survives_passenger_group
= survives_passenger_df
.groupby
(['Sex','Pclass']).count
()['PassengerId']
survives_passenger_radio
= survives_passenger_group
/group_all
survives_passenger_radio
bar
= survives_passenger_radio
.plot
.bar
(title
="性別和乘客等級共同對生還率的影響")
for p
in bar
.patches
:bar
.text
(p
.get_x
()*1.005,p
.get_height
()*1.005,'%.2f%%'%(p
.get_height
()*100))
def passenger_survived_ratio(data
,cols
):passenger_group
= data
.groupby
(cols
)[cols
[0]].count
()surived_info
=df
[cols
][df
['Survived']==1]surived_group
= surived_info
.groupby
(cols
)[cols
[0]].count
()return surived_group
/passenger_group
def print_bar(data
,title
=""):bar
=data
.plot
.bar
(title
=title
)for p
in bar
.patches
:bar
.text
(p
.get_x
()*1.005,p
.get_height
()*1.005,'%.2f%%'%(p
.get_height
()*100))
print_bar
(passenger_survived_ratio
(df
,['Age','Sex']))
總結(jié)
以上是生活随笔為你收集整理的泰坦尼克灾难-可视化的全部內(nèi)容,希望文章能夠幫你解決所遇到的問題。
如果覺得生活随笔網(wǎng)站內(nèi)容還不錯,歡迎將生活随笔推薦給好友。