19: Data Visualisation with Seaborn#
import numpy as np
import matplotlib.pyplot as plt
import pandas as pd
import seaborn as sns
%matplotlib inline
iris = sns.load_dataset('iris')
iris.head()
sepal_length | sepal_width | petal_length | petal_width | species | |
---|---|---|---|---|---|
0 | 5.1 | 3.5 | 1.4 | 0.2 | setosa |
1 | 4.9 | 3.0 | 1.4 | 0.2 | setosa |
2 | 4.7 | 3.2 | 1.3 | 0.2 | setosa |
3 | 4.6 | 3.1 | 1.5 | 0.2 | setosa |
4 | 5.0 | 3.6 | 1.4 | 0.2 | setosa |
1. Pairplot() : Global pictrue#
sns.pairplot(iris, hue='species')
<seaborn.axisgrid.PairGrid at 0x7fc6e4b54670>
data:image/s3,"s3://crabby-images/f803e/f803e105e9f7ba82abcadcd8cce08655361b0044" alt="../../../_images/f58ea6c7e1490a8af4306e93ba8cc014d86cf4d612900750b26d6e7f8093833d.png"
2. Categories Viewing#
titanic = sns.load_dataset('titanic')
titanic.drop(['alone', 'alive', 'who', 'adult_male', 'embark_town', 'class'], axis=1, inplace=True)
titanic.dropna(axis=0, inplace=True)
titanic.head()
survived | pclass | sex | age | sibsp | parch | fare | embarked | deck | |
---|---|---|---|---|---|---|---|---|---|
1 | 1 | 1 | female | 38.0 | 1 | 0 | 71.2833 | C | C |
3 | 1 | 1 | female | 35.0 | 1 | 0 | 53.1000 | S | C |
6 | 0 | 1 | male | 54.0 | 0 | 0 | 51.8625 | S | E |
10 | 1 | 3 | female | 4.0 | 1 | 1 | 16.7000 | S | G |
11 | 1 | 1 | female | 58.0 | 0 | 0 | 26.5500 | S | C |
sns.catplot(x='survived', y='age', data=titanic, hue='sex')
<seaborn.axisgrid.FacetGrid at 0x7fc6dfc6eaf0>
data:image/s3,"s3://crabby-images/fa746/fa7469b0c115a93845fb1fbdb2013b86ccd31240" alt="../../../_images/baa98a9c8166169fb55c4720e3b85b2eb8ff771746cecebcf09b7445ec837fdf.png"
plt.figure(figsize=(32, 8))
sns.boxplot(x='age', y='fare', data=titanic, hue='sex')
<AxesSubplot:xlabel='age', ylabel='fare'>
data:image/s3,"s3://crabby-images/51822/5182279f65fe902a3ece8dd49592551b559851d4" alt="../../../_images/acc785afc255c60f5e13998f840d743bd1af5daca8f8a152c53475b2b42f2b18.png"
3. Visualisation de Distributions#
sns.distplot(titanic['fare'])
/home/ubuntu/Documents/Projects/msci_data/.venv/lib/python3.9/site-packages/seaborn/distributions.py:2619: FutureWarning: `distplot` is a deprecated function and will be removed in a future version. Please adapt your code to use either `displot` (a figure-level function with similar flexibility) or `histplot` (an axes-level function for histograms).
warnings.warn(msg, FutureWarning)
<AxesSubplot:xlabel='fare', ylabel='Density'>
data:image/s3,"s3://crabby-images/1b4d4/1b4d481f95f3d9977dab7ca909d613a1dc698776" alt="../../../_images/a2929bc4bad82d00707729dd52da603a5e4f13634c2c181e82ae3a5636ad1b19.png"
sns.jointplot('age', 'fare', data=titanic, kind='hex')
/home/ubuntu/Documents/Projects/msci_data/.venv/lib/python3.9/site-packages/seaborn/_decorators.py:36: FutureWarning: Pass the following variables as keyword args: x, y. From version 0.12, the only valid positional argument will be `data`, and passing other arguments without an explicit keyword will result in an error or misinterpretation.
warnings.warn(
<seaborn.axisgrid.JointGrid at 0x7fc6dfc8bc40>
data:image/s3,"s3://crabby-images/8f9ce/8f9ceff74e7ff8f81d278ae550b0dd860ac05f3e" alt="../../../_images/e7c83890b52ec70ec561129d4ed497de572ab383c95898d0fd8e4e0cb7618525.png"
sns.heatmap(titanic.corr())
<AxesSubplot:>
data:image/s3,"s3://crabby-images/da61f/da61f5c516f8f28680e03995340cd83767a52989" alt="../../../_images/694c37b366030b98b1f8b21e6c56a5f139c3f0590396ce43fbe8732b2e4710a1.png"