In [1]:
import pandas as pd
import matplotlib.pyplot as plt
import seaborn as sns
%matplotlib inline
sns.set()

train = pd.read_csv('../../COALA_DS_DATA/COALA_DS_DATA/week2/data/train.csv')
train
Out[1]:
PassengerId Survived Pclass Name Sex Age SibSp Parch Ticket Fare Cabin Embarked
0 1 0 3 Braund, Mr. Owen Harris male 22.0 1 0 A/5 21171 7.2500 NaN S
1 2 1 1 Cumings, Mrs. John Bradley (Florence Briggs Th... female 38.0 1 0 PC 17599 71.2833 C85 C
2 3 1 3 Heikkinen, Miss. Laina female 26.0 0 0 STON/O2. 3101282 7.9250 NaN S
3 4 1 1 Futrelle, Mrs. Jacques Heath (Lily May Peel) female 35.0 1 0 113803 53.1000 C123 S
4 5 0 3 Allen, Mr. William Henry male 35.0 0 0 373450 8.0500 NaN S
... ... ... ... ... ... ... ... ... ... ... ... ...
886 887 0 2 Montvila, Rev. Juozas male 27.0 0 0 211536 13.0000 NaN S
887 888 1 1 Graham, Miss. Margaret Edith female 19.0 0 0 112053 30.0000 B42 S
888 889 0 3 Johnston, Miss. Catherine Helen "Carrie" female NaN 1 2 W./C. 6607 23.4500 NaN S
889 890 1 1 Behr, Mr. Karl Howell male 26.0 0 0 111369 30.0000 C148 C
890 891 0 3 Dooley, Mr. Patrick male 32.0 0 0 370376 7.7500 NaN Q

891 rows × 12 columns

In [19]:
surv_male = train.loc[(train["Sex"] == "male") & (train['Survived'] == 1), "PassengerId"].count()
surv_female = train.loc[(train["Sex"] == "female") & (train['Survived'] == 1), "PassengerId"].count()

_male = train.loc[(train['Sex'] == "male") & (train['Survived'] == 0), "PassengerId"].count()
_female = train.loc[(train['Sex'] == "male") & (train['Survived'] == 0), "PassengerId"].count()

pd.DataFrame({
    "male" : [surv_male, _male],
    "female" : [surv_female, _female]
}, index=['Dead', 'Survived'])
Out[19]:
male female
Dead 109 233
Survived 468 468