import
pandas as pd
import
numpy as np
import
seaborn as sns
import
matplotlib.pyplot as plt
%
matplotlib inline
# Load the passenger table. The file keeps its '.csv.xls' name but is parsed
# as plain CSV by pd.read_csv. The assignment must sit on one logical line:
# a bare `=` on its own line is a SyntaxError.
titanic_dataset = pd.read_csv('tested.csv.xls')
# Preview of the first rows; a bare expression is only echoed in an
# interactive session (notebook/REPL), it prints nothing in a script.
titanic_dataset.head()
# Remove the columns that are not used by the rest of the analysis.
# The frame is modified in place, so no reassignment is needed.
titanic_dataset.drop(
    columns=['Name', 'Ticket', 'Cabin', 'PassengerId'],
    inplace=True,
)
# Inspect the remaining column dtypes and the distinct labels of the two
# columns that are label-encoded later in the script. These bare expressions
# are only echoed in an interactive session.
titanic_dataset.dtypes
titanic_dataset['Embarked'].unique()
titanic_dataset['Sex'].unique()

# Fill missing values with the per-column mean, in place.
# numeric_only=True restricts the mean to numeric columns: on pandas >= 2.0
# the default (numeric_only=False) raises TypeError when the frame still has
# non-numeric columns, and 'Sex'/'Embarked' have not been encoded yet here.
# Columns without a computed mean are left untouched by fillna.
titanic_dataset.fillna(titanic_dataset.mean(numeric_only=True), inplace=True)
# Replace the labels in 'Sex' and 'Embarked' with integer category codes.
# The .cat accessor exists only on category-dtype Series, so each column is
# converted with astype("category") first; calling .cat on a column straight
# from read_csv raises AttributeError. The conversion is a no-op if the
# column is already categorical.
# NOTE: pandas assigns code -1 to missing values in a categorical column.
titanic_dataset["Sex"] = titanic_dataset["Sex"].astype("category").cat.codes
titanic_dataset["Embarked"] = (
    titanic_dataset["Embarked"].astype("category").cat.codes
)
# Preview the encoded frame (echoed only in an interactive session).
titanic_dataset.head()
# Point colour for each value of the 'Survived' column
# (presumably 0 = did not survive, 1 = survived; confirm against the data).
survive_colors = {0: 'orange', 1: 'blue'}

# Pairwise scatter plots of every column in the frame, with each point
# coloured by that row's 'Survived' value. The lookup must use
# `survive_colors`: the original referenced an undefined name `colors`,
# which raised NameError before anything was drawn.
pd.plotting.scatter_matrix(
    titanic_dataset,
    figsize=(20, 20),
    grid=True,
    marker='o',
    c=titanic_dataset['Survived'].map(survive_colors),
)
# Switch seaborn to its "ticks" theme, then draw a pair plot of the frame
# with the points grouped (hue) by the 'Survived' column.
sns.set_theme(style="ticks")
sns.pairplot(data=titanic_dataset, hue='Survived')