{ "cells": [ { "cell_type": "code", "execution_count": 1, "metadata": {}, "outputs": [], "source": [ "%matplotlib inline\n", "import matplotlib.pyplot as plt\n", "import pandas as pd\n", "import isoweek\n", "import os.path\n", "import requests" ] }, { "cell_type": "markdown", "metadata": {}, "source": [ "# Data analysis of Covid-19 cumulative cases by country\n", "\n", "Les données de l'incidence du Covid-19 sont disponibles sur le site Web du [Johns Hopkins University Center for Systems Science and Engineering (JHU CSSE)](https://systems.jhu.edu/). Nous les récupérons sous forme d'un fichier au format CSV dont chaque ligne correspond à une région ou un pays. Nous téléchargeons le jeu de données complet s'il n'est pas déjà présent en local dans le dépôt git. Le jeu de données commence le 22 janvier 2020 avec les données quotidiennes des cas cumulés par région." ] }, { "cell_type": "code", "execution_count": 17, "metadata": {}, "outputs": [], "source": [ "data_url = \"https://raw.githubusercontent.com/CSSEGISandData/COVID-19/master/csse_covid_19_data/csse_covid_19_time_series/time_series_covid19_confirmed_global.csv\"\n", "local_file_name = './local_data_covid.csv'\n", "\n", "# Download the dataset only when no local copy exists, so re-runs reuse the cached file.\n", "if not os.path.isfile(local_file_name):\n", "    print('file does not exist, downloading...')\n", "    # A timeout keeps the cell from hanging forever on a stalled connection.\n", "    resource = requests.get(data_url, allow_redirects=True, timeout=30)\n", "    print(resource)\n", "    # Stop on HTTP errors: otherwise an error page would be saved as the CSV and\n", "    # silently reused on every later run, because the local file would then exist.\n", "    resource.raise_for_status()\n", "    # The context manager closes the file even if the write fails.\n", "    with open(local_file_name, \"wb\") as output:\n", "        output.write(resource.content)\n", "    print('local file saved with name : ', local_file_name)" ] }, { "cell_type": "code", "execution_count": 31, "metadata": {}, "outputs": [ { "data": { "text/html": [ "
\n", " | Province/State | \n", "Country/Region | \n", "Lat | \n", "Long | \n", "1/22/20 | \n", "1/23/20 | \n", "1/24/20 | \n", "1/25/20 | \n", "1/26/20 | \n", "1/27/20 | \n", "... | \n", "8/1/21 | \n", "8/2/21 | \n", "8/3/21 | \n", "8/4/21 | \n", "8/5/21 | \n", "8/6/21 | \n", "8/7/21 | \n", "8/8/21 | \n", "8/9/21 | \n", "8/10/21 | \n", "
---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
0 | \n", "NaN | \n", "Afghanistan | \n", "33.93911 | \n", "67.709953 | \n", "0 | \n", "0 | \n", "0 | \n", "0 | \n", "0 | \n", "0 | \n", "... | \n", "146523 | \n", "147985 | \n", "148572 | \n", "148933 | \n", "149361 | \n", "149810 | \n", "149810 | \n", "149810 | \n", "150778 | \n", "151013 | \n", "
1 | \n", "NaN | \n", "Albania | \n", "41.15330 | \n", "20.168300 | \n", "0 | \n", "0 | \n", "0 | \n", "0 | \n", "0 | \n", "0 | \n", "... | \n", "133121 | \n", "133146 | \n", "133211 | \n", "133310 | \n", "133442 | \n", "133591 | \n", "133730 | \n", "133912 | \n", "133981 | \n", "134201 | \n", "
2 | \n", "NaN | \n", "Algeria | \n", "28.03390 | \n", "1.659600 | \n", "0 | \n", "0 | \n", "0 | \n", "0 | \n", "0 | \n", "0 | \n", "... | \n", "172564 | \n", "173922 | \n", "175229 | \n", "176724 | \n", "178013 | \n", "179216 | \n", "180356 | \n", "181376 | \n", "182368 | \n", "183347 | \n", "
3 | \n", "NaN | \n", "Andorra | \n", "42.50630 | \n", "1.521800 | \n", "0 | \n", "0 | \n", "0 | \n", "0 | \n", "0 | \n", "0 | \n", "... | \n", "14678 | \n", "14747 | \n", "14766 | \n", "14797 | \n", "14809 | \n", "14836 | \n", "14836 | \n", "14836 | \n", "14836 | \n", "14873 | \n", "
4 | \n", "NaN | \n", "Angola | \n", "-11.20270 | \n", "17.873900 | \n", "0 | \n", "0 | \n", "0 | \n", "0 | \n", "0 | \n", "0 | \n", "... | \n", "42815 | \n", "42970 | \n", "43070 | \n", "43158 | \n", "43269 | \n", "43487 | \n", "43592 | \n", "43662 | \n", "43747 | \n", "43890 | \n", "
5 rows × 571 columns
\n", "\n", " | Province/State | \n", "Country/Region | \n", "Lat | \n", "Long | \n", "1/22/20 | \n", "1/23/20 | \n", "1/24/20 | \n", "1/25/20 | \n", "1/26/20 | \n", "1/27/20 | \n", "... | \n", "8/1/21 | \n", "8/2/21 | \n", "8/3/21 | \n", "8/4/21 | \n", "8/5/21 | \n", "8/6/21 | \n", "8/7/21 | \n", "8/8/21 | \n", "8/9/21 | \n", "8/10/21 | \n", "
---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
0 | \n", "NaN | \n", "Afghanistan | \n", "33.93911 | \n", "67.709953 | \n", "0 | \n", "0 | \n", "0 | \n", "0 | \n", "0 | \n", "0 | \n", "... | \n", "146523 | \n", "147985 | \n", "148572 | \n", "148933 | \n", "149361 | \n", "149810 | \n", "149810 | \n", "149810 | \n", "150778 | \n", "151013 | \n", "
1 | \n", "NaN | \n", "Albania | \n", "41.15330 | \n", "20.168300 | \n", "0 | \n", "0 | \n", "0 | \n", "0 | \n", "0 | \n", "0 | \n", "... | \n", "133121 | \n", "133146 | \n", "133211 | \n", "133310 | \n", "133442 | \n", "133591 | \n", "133730 | \n", "133912 | \n", "133981 | \n", "134201 | \n", "
2 | \n", "NaN | \n", "Algeria | \n", "28.03390 | \n", "1.659600 | \n", "0 | \n", "0 | \n", "0 | \n", "0 | \n", "0 | \n", "0 | \n", "... | \n", "172564 | \n", "173922 | \n", "175229 | \n", "176724 | \n", "178013 | \n", "179216 | \n", "180356 | \n", "181376 | \n", "182368 | \n", "183347 | \n", "
3 | \n", "NaN | \n", "Andorra | \n", "42.50630 | \n", "1.521800 | \n", "0 | \n", "0 | \n", "0 | \n", "0 | \n", "0 | \n", "0 | \n", "... | \n", "14678 | \n", "14747 | \n", "14766 | \n", "14797 | \n", "14809 | \n", "14836 | \n", "14836 | \n", "14836 | \n", "14836 | \n", "14873 | \n", "
4 | \n", "NaN | \n", "Angola | \n", "-11.20270 | \n", "17.873900 | \n", "0 | \n", "0 | \n", "0 | \n", "0 | \n", "0 | \n", "0 | \n", "... | \n", "42815 | \n", "42970 | \n", "43070 | \n", "43158 | \n", "43269 | \n", "43487 | \n", "43592 | \n", "43662 | \n", "43747 | \n", "43890 | \n", "
5 rows × 571 columns
\n", "\n", " | Province/State | \n", "Country/Region | \n", "Lat | \n", "Long | \n", "1/22/20 | \n", "1/23/20 | \n", "1/24/20 | \n", "1/25/20 | \n", "1/26/20 | \n", "1/27/20 | \n", "... | \n", "8/1/21 | \n", "8/2/21 | \n", "8/3/21 | \n", "8/4/21 | \n", "8/5/21 | \n", "8/6/21 | \n", "8/7/21 | \n", "8/8/21 | \n", "8/9/21 | \n", "8/10/21 | \n", "
---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
70 | \n", "Hong Kong | \n", "China | \n", "22.3 | \n", "114.2 | \n", "0 | \n", "2 | \n", "2 | \n", "5 | \n", "8 | \n", "8 | \n", "... | \n", "11987 | \n", "11990 | \n", "11994 | \n", "11996 | \n", "12002 | \n", "12004 | \n", "12011 | \n", "12013 | \n", "12015 | \n", "12019 | \n", "
1 rows × 571 columns
\n", "\n", " | Province/State | \n", "Country/Region | \n", "Lat | \n", "Long | \n", "1/22/20 | \n", "1/23/20 | \n", "1/24/20 | \n", "1/25/20 | \n", "1/26/20 | \n", "1/27/20 | \n", "... | \n", "8/2/21 | \n", "8/3/21 | \n", "8/4/21 | \n", "8/5/21 | \n", "8/6/21 | \n", "8/7/21 | \n", "8/8/21 | \n", "8/9/21 | \n", "8/10/21 | \n", "70 | \n", "
---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
70 | \n", "Hong Kong | \n", "Hong Kong | \n", "22.3 | \n", "114.2 | \n", "0.0 | \n", "2.0 | \n", "2.0 | \n", "5.0 | \n", "8.0 | \n", "8.0 | \n", "... | \n", "11990.0 | \n", "11994.0 | \n", "11996.0 | \n", "12002.0 | \n", "12004.0 | \n", "12011.0 | \n", "12013.0 | \n", "12015.0 | \n", "12019.0 | \n", "NaN | \n", "
1 rows × 572 columns
\n", "