{ "cells": [ { "cell_type": "code", "execution_count": 1, "source": [ "import pandas as pd\n", "import numpy as np\n", "\n", "import matplotlib.pyplot as plt\n", "import seaborn as sns\n", "%matplotlib inline\n", "\n", "import plotly.graph_objects as go\n" ], "outputs": [], "metadata": { "tags": [] } }, { "cell_type": "markdown", "source": [ "# Basic Visualizations" ], "metadata": {} }, { "cell_type": "markdown", "source": [ "In this subchapter, we will go over some key types of plots, as well as how to create them using two of the most common plotting libraries in Python: `matplotlib` and `seaborn`. However, first we will need to load in the dataset we will be using for this analysis. \n", "\n", "For this analysis, we will be loading in a subset of the [World Bank's Education Statistics (EdStats) Dataset](https://datatopics.worldbank.org/education/). The subset we will be working with has data on a bunch of education metrics/indicators for 25 regions from 1970-2014. We have cleaned this dataset to ensure we don't have any missing data points. There are too many indicators to even begin describing them all. We highly encourage you to explore the World Bank's data directly if you're interested!" ], "metadata": {} }, { "cell_type": "code", "execution_count": 2, "source": [ "wb_df = pd.read_csv('data/wb_educ.csv')\n", "wb_df" ], "outputs": [ { "output_type": "execute_result", "data": { "text/html": [ "
\n", " | Country Name | \n", "Country Code | \n", "Indicator Name | \n", "Indicator Code | \n", "1970 | \n", "1971 | \n", "1972 | \n", "1973 | \n", "1974 | \n", "1975 | \n", "... | \n", "2005 | \n", "2006 | \n", "2007 | \n", "2008 | \n", "2009 | \n", "2010 | \n", "2011 | \n", "2012 | \n", "2013 | \n", "2014 | \n", "
---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
0 | \n", "Arab World | \n", "ARB | \n", "Adjusted net enrolment rate, primary, both sex... | \n", "SE.PRM.TENR | \n", "5.482212e+01 | \n", "5.489414e+01 | \n", "5.620944e+01 | \n", "5.726711e+01 | \n", "5.799114e+01 | \n", "5.936554e+01 | \n", "... | \n", "8.248949e+01 | \n", "8.268551e+01 | \n", "8.328034e+01 | \n", "8.401187e+01 | \n", "8.419596e+01 | \n", "8.521200e+01 | \n", "8.524514e+01 | \n", "8.610167e+01 | \n", "8.551194e+01 | \n", "8.532015e+01 | \n", "
1 | \n", "Arab World | \n", "ARB | \n", "Adjusted net enrolment rate, primary, female (%) | \n", "SE.PRM.TENR.FE | \n", "4.335110e+01 | \n", "4.331815e+01 | \n", "4.464070e+01 | \n", "4.584572e+01 | \n", "4.644950e+01 | \n", "4.836389e+01 | \n", "... | \n", "7.947577e+01 | \n", "7.960833e+01 | \n", "8.058242e+01 | \n", "8.147380e+01 | \n", "8.169569e+01 | \n", "8.287165e+01 | \n", "8.286139e+01 | \n", "8.440141e+01 | \n", "8.391403e+01 | \n", "8.382083e+01 | \n", "
2 | \n", "Arab World | \n", "ARB | \n", "Adjusted net enrolment rate, primary, gender p... | \n", "UIS.NERA.1.GPI | \n", "6.585700e-01 | \n", "6.564000e-01 | \n", "6.632900e-01 | \n", "6.720400e-01 | \n", "6.726100e-01 | \n", "6.917600e-01 | \n", "... | \n", "9.308400e-01 | \n", "9.296200e-01 | \n", "9.384600e-01 | \n", "9.425000e-01 | \n", "9.434700e-01 | \n", "9.476200e-01 | \n", "9.467000e-01 | \n", "9.620800e-01 | \n", "9.640900e-01 | \n", "9.662000e-01 | \n", "
3 | \n", "Arab World | \n", "ARB | \n", "Adjusted net enrolment rate, primary, male (%) | \n", "SE.PRM.TENR.MA | \n", "6.582623e+01 | \n", "6.599358e+01 | \n", "6.730186e+01 | \n", "6.821908e+01 | \n", "6.905901e+01 | \n", "6.991455e+01 | \n", "... | \n", "8.538029e+01 | \n", "8.563508e+01 | \n", "8.586669e+01 | \n", "8.644414e+01 | \n", "8.659069e+01 | \n", "8.745258e+01 | \n", "8.752652e+01 | \n", "8.772817e+01 | \n", "8.703988e+01 | \n", "8.675339e+01 | \n", "
4 | \n", "Arab World | \n", "ARB | \n", "Adjusted net intake rate to Grade 1 of primary... | \n", "UIS.NIRA.1 | \n", "5.244892e+01 | \n", "5.248975e+01 | \n", "5.263559e+01 | \n", "5.332700e+01 | \n", "5.418465e+01 | \n", "5.486563e+01 | \n", "... | \n", "7.613177e+01 | \n", "7.522256e+01 | \n", "7.559570e+01 | \n", "7.489394e+01 | \n", "7.481455e+01 | \n", "7.619704e+01 | \n", "7.647497e+01 | \n", "7.731937e+01 | \n", "7.656671e+01 | \n", "7.662057e+01 | \n", "
... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "
3395 | \n", "World | \n", "WLD | \n", "Survival rate to the last grade of primary edu... | \n", "SE.PRM.PRSL.MA.ZS | \n", "6.707542e+01 | \n", "6.657861e+01 | \n", "6.629349e+01 | \n", "6.593887e+01 | \n", "6.625532e+01 | \n", "6.682665e+01 | \n", "... | \n", "6.825568e+01 | \n", "6.920012e+01 | \n", "6.931534e+01 | \n", "7.040000e+01 | \n", "6.939960e+01 | \n", "6.849098e+01 | \n", "6.795392e+01 | \n", "6.678090e+01 | \n", "6.694540e+01 | \n", "7.019475e+01 | \n", "
3396 | \n", "World | \n", "WLD | \n", "Teachers in primary education, both sexes (num... | \n", "SE.PRM.TCHR | \n", "1.428878e+07 | \n", "1.459513e+07 | \n", "1.529481e+07 | \n", "1.582020e+07 | \n", "1.627415e+07 | \n", "1.674470e+07 | \n", "... | \n", "2.688926e+07 | \n", "2.709888e+07 | \n", "2.752526e+07 | \n", "2.777079e+07 | \n", "2.814018e+07 | \n", "2.864318e+07 | \n", "2.910380e+07 | \n", "2.938328e+07 | \n", "3.047234e+07 | \n", "3.067875e+07 | \n", "
3397 | \n", "World | \n", "WLD | \n", "Teachers in primary education, female (number) | \n", "SE.PRM.TCHR.FE | \n", "7.874428e+06 | \n", "8.001568e+06 | \n", "8.262296e+06 | \n", "8.498361e+06 | \n", "8.663721e+06 | \n", "8.810588e+06 | \n", "... | \n", "1.665298e+07 | \n", "1.679720e+07 | \n", "1.703848e+07 | \n", "1.723032e+07 | \n", "1.753421e+07 | \n", "1.796218e+07 | \n", "1.832742e+07 | \n", "1.859735e+07 | \n", "1.931428e+07 | \n", "1.952334e+07 | \n", "
3398 | \n", "World | \n", "WLD | \n", "Teachers in secondary education, both sexes (n... | \n", "SE.SEC.TCHR | \n", "1.172561e+07 | \n", "1.213650e+07 | \n", "1.269944e+07 | \n", "1.330712e+07 | \n", "1.374928e+07 | \n", "1.413025e+07 | \n", "... | \n", "2.843753e+07 | \n", "2.910475e+07 | \n", "3.010238e+07 | \n", "3.105815e+07 | \n", "3.162800e+07 | \n", "3.221992e+07 | \n", "3.249828e+07 | \n", "3.269860e+07 | \n", "3.235300e+07 | \n", "3.286152e+07 | \n", "
3399 | \n", "World | \n", "WLD | \n", "Teachers in tertiary education programmes, bot... | \n", "SE.TER.TCHR | \n", "2.752715e+06 | \n", "2.815567e+06 | \n", "2.938241e+06 | \n", "3.047319e+06 | \n", "3.181207e+06 | \n", "3.332724e+06 | \n", "... | \n", "9.191711e+06 | \n", "9.480116e+06 | \n", "1.000710e+07 | \n", "1.054032e+07 | \n", "1.069500e+07 | \n", "1.113321e+07 | \n", "1.158810e+07 | \n", "1.190016e+07 | \n", "1.216735e+07 | \n", "1.264785e+07 | \n", "
3400 rows × 49 columns
\n", "\n", " | Continent | \n", "Country | \n", "Primary completion rate: Male: % of relevant age group: 2015 | \n", "Primary completion rate: Female: % of relevant age group: 2015 | \n", "Lower secondary completion rate: Male: % of relevant age group: 2015 | \n", "Lower secondary completion rate: Female: % of relevant age group: 2015 | \n", "Youth literacy rate: Male: % of ages 15-24: 2005-14 | \n", "Youth literacy rate: Female: % of ages 15-24: 2005-14 | \n", "Adult literacy rate: Male: % ages 15 and older: 2005-14 | \n", "Adult literacy rate: Female: % ages 15 and older: 2005-14 | \n", "... | \n", "Access to improved sanitation facilities: % of population: 1990 | \n", "Access to improved sanitation facilities: % of population: 2015 | \n", "Child immunization rate: Measles: % of children ages 12-23 months: 2015 | \n", "Child immunization rate: DTP3: % of children ages 12-23 months: 2015 | \n", "Children with acute respiratory infection taken to health provider: % of children under age 5 with ARI: 2009-2016 | \n", "Children with diarrhea who received oral rehydration and continuous feeding: % of children under age 5 with diarrhea: 2009-2016 | \n", "Children sleeping under treated bed nets: % of children under age 5: 2009-2016 | \n", "Children with fever receiving antimalarial drugs: % of children under age 5 with fever: 2009-2016 | \n", "Tuberculosis: Treatment success rate: % of new cases: 2014 | \n", "Tuberculosis: Cases detection rate: % of new estimated cases: 2015 | \n", "
---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
0 | \n", "Africa | \n", "Algeria | \n", "106.0 | \n", "105.0 | \n", "68.0 | \n", "85.0 | \n", "96.0 | \n", "92.0 | \n", "83.0 | \n", "68.0 | \n", "... | \n", "80.0 | \n", "88.0 | \n", "95.0 | \n", "95.0 | \n", "66.0 | \n", "42.0 | \n", "NaN | \n", "NaN | \n", "88.0 | \n", "80.0 | \n", "
1 | \n", "Africa | \n", "Angola | \n", "NaN | \n", "NaN | \n", "NaN | \n", "NaN | \n", "79.0 | \n", "67.0 | \n", "82.0 | \n", "60.0 | \n", "... | \n", "22.0 | \n", "52.0 | \n", "55.0 | \n", "64.0 | \n", "NaN | \n", "NaN | \n", "25.9 | \n", "28.3 | \n", "34.0 | \n", "64.0 | \n", "
2 | \n", "Africa | \n", "Benin | \n", "83.0 | \n", "73.0 | \n", "50.0 | \n", "37.0 | \n", "55.0 | \n", "31.0 | \n", "41.0 | \n", "18.0 | \n", "... | \n", "7.0 | \n", "20.0 | \n", "75.0 | \n", "79.0 | \n", "23.0 | \n", "33.0 | \n", "72.7 | \n", "25.9 | \n", "89.0 | \n", "61.0 | \n", "
3 | \n", "Africa | \n", "Botswana | \n", "98.0 | \n", "101.0 | \n", "86.0 | \n", "87.0 | \n", "96.0 | \n", "99.0 | \n", "87.0 | \n", "89.0 | \n", "... | \n", "39.0 | \n", "63.0 | \n", "97.0 | \n", "95.0 | \n", "NaN | \n", "NaN | \n", "NaN | \n", "NaN | \n", "77.0 | \n", "62.0 | \n", "
4 | \n", "Africa | \n", "Burundi | \n", "58.0 | \n", "66.0 | \n", "35.0 | \n", "30.0 | \n", "90.0 | \n", "88.0 | \n", "89.0 | \n", "85.0 | \n", "... | \n", "42.0 | \n", "48.0 | \n", "93.0 | \n", "94.0 | \n", "55.0 | \n", "43.0 | \n", "53.8 | \n", "25.4 | \n", "91.0 | \n", "51.0 | \n", "
... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "
161 | \n", "S. America | \n", "Guyana | \n", "87.0 | \n", "81.0 | \n", "NaN | \n", "NaN | \n", "92.0 | \n", "94.0 | \n", "82.0 | \n", "87.0 | \n", "... | \n", "76.0 | \n", "84.0 | \n", "99.0 | \n", "95.0 | \n", "84.0 | \n", "29.0 | \n", "7.4 | \n", "7.4 | \n", "69.0 | \n", "80.0 | \n", "
162 | \n", "S. America | \n", "Paraguay | \n", "89.0 | \n", "90.0 | \n", "71.0 | \n", "77.0 | \n", "99.0 | \n", "98.0 | \n", "96.0 | \n", "94.0 | \n", "... | \n", "52.0 | \n", "89.0 | \n", "83.0 | \n", "93.0 | \n", "NaN | \n", "NaN | \n", "NaN | \n", "NaN | \n", "71.0 | \n", "87.0 | \n", "
163 | \n", "S. America | \n", "Peru | \n", "99.0 | \n", "100.0 | \n", "84.0 | \n", "87.0 | \n", "99.0 | \n", "99.0 | \n", "97.0 | \n", "90.0 | \n", "... | \n", "53.0 | \n", "76.0 | \n", "92.0 | \n", "90.0 | \n", "60.0 | \n", "57.0 | \n", "NaN | \n", "NaN | \n", "87.0 | \n", "80.0 | \n", "
164 | \n", "S. America | \n", "Suriname | \n", "90.0 | \n", "99.0 | \n", "36.0 | \n", "65.0 | \n", "98.0 | \n", "99.0 | \n", "95.0 | \n", "94.0 | \n", "... | \n", "NaN | \n", "79.0 | \n", "94.0 | \n", "89.0 | \n", "76.0 | \n", "61.0 | \n", "43.4 | \n", "0.0 | \n", "77.0 | \n", "80.0 | \n", "
165 | \n", "S. America | \n", "Uruguay | \n", "103.0 | \n", "104.0 | \n", "54.0 | \n", "68.0 | \n", "98.0 | \n", "99.0 | \n", "98.0 | \n", "99.0 | \n", "... | \n", "92.0 | \n", "96.0 | \n", "96.0 | \n", "95.0 | \n", "NaN | \n", "NaN | \n", "NaN | \n", "NaN | \n", "75.0 | \n", "87.0 | \n", "
166 rows × 47 columns
\n", "