{ "cells": [ { "cell_type": "code", "execution_count": 1, "metadata": {}, "outputs": [], "source": [ "import pandas as pd\n", "import numpy as np\n", "import matplotlib.pyplot as plt\n", "import seaborn as sns" ] }, { "cell_type": "code", "execution_count": 2, "metadata": {}, "outputs": [], "source": [ "# Set the style and the figure size in a single call: a bare sns.set(rc=...) resets the\n", "# style to its default (\"darkgrid\"), which would silently undo an earlier set_style(\"whitegrid\").\n", "sns.set(style=\"whitegrid\", rc={'figure.figsize': (12, 8)})\n", "# sns.set_context(\"paper\")" ] }, { "cell_type": "markdown", "metadata": {}, "source": [ "## Download the data\n", "\n", "First, we download the data from the [Johns Hopkins GitHub](https://raw.githubusercontent.com/CSSEGISandData/COVID-19/master/csse_covid_19_data/csse_covid_19_time_series/time_series_covid19_confirmed_global.csv) and inspect its columns:" ] }, { "cell_type": "code", "execution_count": 3, "metadata": {}, "outputs": [], "source": [ "# Global confirmed-cases time series from the CSSEGISandData/COVID-19 repository.\n", "# Read live from the master branch, so the contents can differ between runs.\n", "url = \"https://raw.githubusercontent.com/CSSEGISandData/COVID-19/master/csse_covid_19_data/csse_covid_19_time_series/time_series_covid19_confirmed_global.csv\"\n", "raw_data = pd.read_csv(url)" ] }, { "cell_type": "markdown", "metadata": {}, "source": [ "Now we can inspect the data:" ] }, { "cell_type": "code", "execution_count": 4, "metadata": {}, "outputs": [ { "data": { "text/html": [ "
\n", " | Province/State | \n", "Country/Region | \n", "Lat | \n", "Long | \n", "1/22/20 | \n", "1/23/20 | \n", "1/24/20 | \n", "1/25/20 | \n", "1/26/20 | \n", "1/27/20 | \n", "... | \n", "9/13/21 | \n", "9/14/21 | \n", "9/15/21 | \n", "9/16/21 | \n", "9/17/21 | \n", "9/18/21 | \n", "9/19/21 | \n", "9/20/21 | \n", "9/21/21 | \n", "9/22/21 | \n", "
---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
0 | \n", "NaN | \n", "Afghanistan | \n", "33.939110 | \n", "67.709953 | \n", "0 | \n", "0 | \n", "0 | \n", "0 | \n", "0 | \n", "0 | \n", "... | \n", "154094 | \n", "154180 | \n", "154283 | \n", "154361 | \n", "154487 | \n", "154487 | \n", "154487 | \n", "154585 | \n", "154712 | \n", "154757 | \n", "
1 | \n", "NaN | \n", "Albania | \n", "41.153300 | \n", "20.168300 | \n", "0 | \n", "0 | \n", "0 | \n", "0 | \n", "0 | \n", "0 | \n", "... | \n", "157436 | \n", "158431 | \n", "159423 | \n", "160365 | \n", "161324 | \n", "162173 | \n", "162953 | \n", "163404 | \n", "164276 | \n", "165096 | \n", "
2 | \n", "NaN | \n", "Algeria | \n", "28.033900 | \n", "1.659600 | \n", "0 | \n", "0 | \n", "0 | \n", "0 | \n", "0 | \n", "0 | \n", "... | \n", "200301 | \n", "200528 | \n", "200770 | \n", "200989 | \n", "201224 | \n", "201425 | \n", "201600 | \n", "201766 | \n", "201948 | \n", "202122 | \n", "
3 | \n", "NaN | \n", "Andorra | \n", "42.506300 | \n", "1.521800 | \n", "0 | \n", "0 | \n", "0 | \n", "0 | \n", "0 | \n", "0 | \n", "... | \n", "15096 | \n", "15099 | \n", "15108 | \n", "15113 | \n", "15124 | \n", "15124 | \n", "15124 | \n", "15140 | \n", "15140 | \n", "15153 | \n", "
4 | \n", "NaN | \n", "Angola | \n", "-11.202700 | \n", "17.873900 | \n", "0 | \n", "0 | \n", "0 | \n", "0 | \n", "0 | \n", "0 | \n", "... | \n", "50738 | \n", "51047 | \n", "51407 | \n", "51827 | \n", "52208 | \n", "52307 | \n", "52307 | \n", "52644 | \n", "52968 | \n", "53387 | \n", "
... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "
274 | \n", "NaN | \n", "Vietnam | \n", "14.058324 | \n", "108.277199 | \n", "0 | \n", "2 | \n", "2 | \n", "2 | \n", "2 | \n", "2 | \n", "... | \n", "624547 | \n", "635055 | \n", "645640 | \n", "656129 | \n", "667650 | \n", "677023 | \n", "687063 | \n", "695744 | \n", "707436 | \n", "718963 | \n", "
275 | \n", "NaN | \n", "West Bank and Gaza | \n", "31.952200 | \n", "35.233200 | \n", "0 | \n", "0 | \n", "0 | \n", "0 | \n", "0 | \n", "0 | \n", "... | \n", "372108 | \n", "374768 | \n", "377134 | \n", "379635 | \n", "381854 | \n", "382584 | \n", "384390 | \n", "386493 | \n", "388470 | \n", "390369 | \n", "
276 | \n", "NaN | \n", "Yemen | \n", "15.552727 | \n", "48.516388 | \n", "0 | \n", "0 | \n", "0 | \n", "0 | \n", "0 | \n", "0 | \n", "... | \n", "8452 | \n", "8502 | \n", "8527 | \n", "8557 | \n", "8593 | \n", "8630 | \n", "8667 | \n", "8718 | \n", "8752 | \n", "8789 | \n", "
277 | \n", "NaN | \n", "Zambia | \n", "-13.133897 | \n", "27.849332 | \n", "0 | \n", "0 | \n", "0 | \n", "0 | \n", "0 | \n", "0 | \n", "... | \n", "207960 | \n", "208049 | \n", "208161 | \n", "208267 | \n", "208353 | \n", "208422 | \n", "208469 | \n", "208502 | \n", "208599 | \n", "208676 | \n", "
278 | \n", "NaN | \n", "Zimbabwe | \n", "-19.015438 | \n", "29.154857 | \n", "0 | \n", "0 | \n", "0 | \n", "0 | \n", "0 | \n", "0 | \n", "... | \n", "126399 | \n", "126817 | \n", "127083 | \n", "127368 | \n", "127632 | \n", "127739 | \n", "127938 | \n", "128186 | \n", "128186 | \n", "128804 | \n", "
279 rows × 614 columns
\n", "\n", " | Province/State | \n", "Country/Region | \n", "1/22/20 | \n", "1/23/20 | \n", "1/24/20 | \n", "1/25/20 | \n", "1/26/20 | \n", "1/27/20 | \n", "1/28/20 | \n", "1/29/20 | \n", "... | \n", "9/13/21 | \n", "9/14/21 | \n", "9/15/21 | \n", "9/16/21 | \n", "9/17/21 | \n", "9/18/21 | \n", "9/19/21 | \n", "9/20/21 | \n", "9/21/21 | \n", "9/22/21 | \n", "
---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
0 | \n", "NaN | \n", "Afghanistan | \n", "0 | \n", "0 | \n", "0 | \n", "0 | \n", "0 | \n", "0 | \n", "0 | \n", "0 | \n", "... | \n", "154094 | \n", "154180 | \n", "154283 | \n", "154361 | \n", "154487 | \n", "154487 | \n", "154487 | \n", "154585 | \n", "154712 | \n", "154757 | \n", "
1 | \n", "NaN | \n", "Albania | \n", "0 | \n", "0 | \n", "0 | \n", "0 | \n", "0 | \n", "0 | \n", "0 | \n", "0 | \n", "... | \n", "157436 | \n", "158431 | \n", "159423 | \n", "160365 | \n", "161324 | \n", "162173 | \n", "162953 | \n", "163404 | \n", "164276 | \n", "165096 | \n", "
2 | \n", "NaN | \n", "Algeria | \n", "0 | \n", "0 | \n", "0 | \n", "0 | \n", "0 | \n", "0 | \n", "0 | \n", "0 | \n", "... | \n", "200301 | \n", "200528 | \n", "200770 | \n", "200989 | \n", "201224 | \n", "201425 | \n", "201600 | \n", "201766 | \n", "201948 | \n", "202122 | \n", "
3 | \n", "NaN | \n", "Andorra | \n", "0 | \n", "0 | \n", "0 | \n", "0 | \n", "0 | \n", "0 | \n", "0 | \n", "0 | \n", "... | \n", "15096 | \n", "15099 | \n", "15108 | \n", "15113 | \n", "15124 | \n", "15124 | \n", "15124 | \n", "15140 | \n", "15140 | \n", "15153 | \n", "
4 | \n", "NaN | \n", "Angola | \n", "0 | \n", "0 | \n", "0 | \n", "0 | \n", "0 | \n", "0 | \n", "0 | \n", "0 | \n", "... | \n", "50738 | \n", "51047 | \n", "51407 | \n", "51827 | \n", "52208 | \n", "52307 | \n", "52307 | \n", "52644 | \n", "52968 | \n", "53387 | \n", "
... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "
274 | \n", "NaN | \n", "Vietnam | \n", "0 | \n", "2 | \n", "2 | \n", "2 | \n", "2 | \n", "2 | \n", "2 | \n", "2 | \n", "... | \n", "624547 | \n", "635055 | \n", "645640 | \n", "656129 | \n", "667650 | \n", "677023 | \n", "687063 | \n", "695744 | \n", "707436 | \n", "718963 | \n", "
275 | \n", "NaN | \n", "West Bank and Gaza | \n", "0 | \n", "0 | \n", "0 | \n", "0 | \n", "0 | \n", "0 | \n", "0 | \n", "0 | \n", "... | \n", "372108 | \n", "374768 | \n", "377134 | \n", "379635 | \n", "381854 | \n", "382584 | \n", "384390 | \n", "386493 | \n", "388470 | \n", "390369 | \n", "
276 | \n", "NaN | \n", "Yemen | \n", "0 | \n", "0 | \n", "0 | \n", "0 | \n", "0 | \n", "0 | \n", "0 | \n", "0 | \n", "... | \n", "8452 | \n", "8502 | \n", "8527 | \n", "8557 | \n", "8593 | \n", "8630 | \n", "8667 | \n", "8718 | \n", "8752 | \n", "8789 | \n", "
277 | \n", "NaN | \n", "Zambia | \n", "0 | \n", "0 | \n", "0 | \n", "0 | \n", "0 | \n", "0 | \n", "0 | \n", "0 | \n", "... | \n", "207960 | \n", "208049 | \n", "208161 | \n", "208267 | \n", "208353 | \n", "208422 | \n", "208469 | \n", "208502 | \n", "208599 | \n", "208676 | \n", "
278 | \n", "NaN | \n", "Zimbabwe | \n", "0 | \n", "0 | \n", "0 | \n", "0 | \n", "0 | \n", "0 | \n", "0 | \n", "0 | \n", "... | \n", "126399 | \n", "126817 | \n", "127083 | \n", "127368 | \n", "127632 | \n", "127739 | \n", "127938 | \n", "128186 | \n", "128186 | \n", "128804 | \n", "
279 rows × 612 columns
\n", "\n", " | Province/State | \n", "Country/Region | \n", "1/22/20 | \n", "1/23/20 | \n", "1/24/20 | \n", "1/25/20 | \n", "1/26/20 | \n", "1/27/20 | \n", "1/28/20 | \n", "1/29/20 | \n", "... | \n", "9/13/21 | \n", "9/14/21 | \n", "9/15/21 | \n", "9/16/21 | \n", "9/17/21 | \n", "9/18/21 | \n", "9/19/21 | \n", "9/20/21 | \n", "9/21/21 | \n", "9/22/21 | \n", "
---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
0 | \n", "NaN | \n", "Afghanistan | \n", "0 | \n", "0 | \n", "0 | \n", "0 | \n", "0 | \n", "0 | \n", "0 | \n", "0 | \n", "... | \n", "154094 | \n", "154180 | \n", "154283 | \n", "154361 | \n", "154487 | \n", "154487 | \n", "154487 | \n", "154585 | \n", "154712 | \n", "154757 | \n", "
1 | \n", "NaN | \n", "Albania | \n", "0 | \n", "0 | \n", "0 | \n", "0 | \n", "0 | \n", "0 | \n", "0 | \n", "0 | \n", "... | \n", "157436 | \n", "158431 | \n", "159423 | \n", "160365 | \n", "161324 | \n", "162173 | \n", "162953 | \n", "163404 | \n", "164276 | \n", "165096 | \n", "
2 | \n", "NaN | \n", "Algeria | \n", "0 | \n", "0 | \n", "0 | \n", "0 | \n", "0 | \n", "0 | \n", "0 | \n", "0 | \n", "... | \n", "200301 | \n", "200528 | \n", "200770 | \n", "200989 | \n", "201224 | \n", "201425 | \n", "201600 | \n", "201766 | \n", "201948 | \n", "202122 | \n", "
3 | \n", "NaN | \n", "Andorra | \n", "0 | \n", "0 | \n", "0 | \n", "0 | \n", "0 | \n", "0 | \n", "0 | \n", "0 | \n", "... | \n", "15096 | \n", "15099 | \n", "15108 | \n", "15113 | \n", "15124 | \n", "15124 | \n", "15124 | \n", "15140 | \n", "15140 | \n", "15153 | \n", "
4 | \n", "NaN | \n", "Angola | \n", "0 | \n", "0 | \n", "0 | \n", "0 | \n", "0 | \n", "0 | \n", "0 | \n", "0 | \n", "... | \n", "50738 | \n", "51047 | \n", "51407 | \n", "51827 | \n", "52208 | \n", "52307 | \n", "52307 | \n", "52644 | \n", "52968 | \n", "53387 | \n", "
... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "
274 | \n", "NaN | \n", "Vietnam | \n", "0 | \n", "2 | \n", "2 | \n", "2 | \n", "2 | \n", "2 | \n", "2 | \n", "2 | \n", "... | \n", "624547 | \n", "635055 | \n", "645640 | \n", "656129 | \n", "667650 | \n", "677023 | \n", "687063 | \n", "695744 | \n", "707436 | \n", "718963 | \n", "
275 | \n", "NaN | \n", "West Bank and Gaza | \n", "0 | \n", "0 | \n", "0 | \n", "0 | \n", "0 | \n", "0 | \n", "0 | \n", "0 | \n", "... | \n", "372108 | \n", "374768 | \n", "377134 | \n", "379635 | \n", "381854 | \n", "382584 | \n", "384390 | \n", "386493 | \n", "388470 | \n", "390369 | \n", "
276 | \n", "NaN | \n", "Yemen | \n", "0 | \n", "0 | \n", "0 | \n", "0 | \n", "0 | \n", "0 | \n", "0 | \n", "0 | \n", "... | \n", "8452 | \n", "8502 | \n", "8527 | \n", "8557 | \n", "8593 | \n", "8630 | \n", "8667 | \n", "8718 | \n", "8752 | \n", "8789 | \n", "
277 | \n", "NaN | \n", "Zambia | \n", "0 | \n", "0 | \n", "0 | \n", "0 | \n", "0 | \n", "0 | \n", "0 | \n", "0 | \n", "... | \n", "207960 | \n", "208049 | \n", "208161 | \n", "208267 | \n", "208353 | \n", "208422 | \n", "208469 | \n", "208502 | \n", "208599 | \n", "208676 | \n", "
278 | \n", "NaN | \n", "Zimbabwe | \n", "0 | \n", "0 | \n", "0 | \n", "0 | \n", "0 | \n", "0 | \n", "0 | \n", "0 | \n", "... | \n", "126399 | \n", "126817 | \n", "127083 | \n", "127368 | \n", "127632 | \n", "127739 | \n", "127938 | \n", "128186 | \n", "128186 | \n", "128804 | \n", "
279 rows × 612 columns
\n", "\n", " | 1/22/20 | \n", "1/23/20 | \n", "1/24/20 | \n", "1/25/20 | \n", "1/26/20 | \n", "1/27/20 | \n", "1/28/20 | \n", "1/29/20 | \n", "1/30/20 | \n", "1/31/20 | \n", "... | \n", "9/13/21 | \n", "9/14/21 | \n", "9/15/21 | \n", "9/16/21 | \n", "9/17/21 | \n", "9/18/21 | \n", "9/19/21 | \n", "9/20/21 | \n", "9/21/21 | \n", "9/22/21 | \n", "
---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
Country/Region | \n", "\n", " | \n", " | \n", " | \n", " | \n", " | \n", " | \n", " | \n", " | \n", " | \n", " | \n", " | \n", " | \n", " | \n", " | \n", " | \n", " | \n", " | \n", " | \n", " | \n", " | \n", " |
Afghanistan | \n", "0 | \n", "0 | \n", "0 | \n", "0 | \n", "0 | \n", "0 | \n", "0 | \n", "0 | \n", "0 | \n", "0 | \n", "... | \n", "154094 | \n", "154180 | \n", "154283 | \n", "154361 | \n", "154487 | \n", "154487 | \n", "154487 | \n", "154585 | \n", "154712 | \n", "154757 | \n", "
Albania | \n", "0 | \n", "0 | \n", "0 | \n", "0 | \n", "0 | \n", "0 | \n", "0 | \n", "0 | \n", "0 | \n", "0 | \n", "... | \n", "157436 | \n", "158431 | \n", "159423 | \n", "160365 | \n", "161324 | \n", "162173 | \n", "162953 | \n", "163404 | \n", "164276 | \n", "165096 | \n", "
Algeria | \n", "0 | \n", "0 | \n", "0 | \n", "0 | \n", "0 | \n", "0 | \n", "0 | \n", "0 | \n", "0 | \n", "0 | \n", "... | \n", "200301 | \n", "200528 | \n", "200770 | \n", "200989 | \n", "201224 | \n", "201425 | \n", "201600 | \n", "201766 | \n", "201948 | \n", "202122 | \n", "
Andorra | \n", "0 | \n", "0 | \n", "0 | \n", "0 | \n", "0 | \n", "0 | \n", "0 | \n", "0 | \n", "0 | \n", "0 | \n", "... | \n", "15096 | \n", "15099 | \n", "15108 | \n", "15113 | \n", "15124 | \n", "15124 | \n", "15124 | \n", "15140 | \n", "15140 | \n", "15153 | \n", "
Angola | \n", "0 | \n", "0 | \n", "0 | \n", "0 | \n", "0 | \n", "0 | \n", "0 | \n", "0 | \n", "0 | \n", "0 | \n", "... | \n", "50738 | \n", "51047 | \n", "51407 | \n", "51827 | \n", "52208 | \n", "52307 | \n", "52307 | \n", "52644 | \n", "52968 | \n", "53387 | \n", "
5 rows × 610 columns
\n", "