diff --git a/module3/exo3/exercice_sarscov.ipynb b/module3/exo3/exercice_sarscov.ipynb
index c5869ee0c910801361af5661821ada8f8a4f48ec..cd46ffa735ff707039c556586b02795ae0fd83f9 100644
--- a/module3/exo3/exercice_sarscov.ipynb
+++ b/module3/exo3/exercice_sarscov.ipynb
@@ -15,7 +15,7 @@
"cell_type": "markdown",
"metadata": {},
"source": [
- "## Téléchargement des données\n",
+ "## Téléchargement et traitement des données\n",
"\n",
"Les données relevées sont stockées dans un fichier. Celles-ci sont à la date du 22 juin 2021."
]
@@ -49,405 +49,13 @@
},
{
"cell_type": "code",
- "execution_count": 6,
+ "execution_count": 2,
"metadata": {},
- "outputs": [
- {
- "data": {
- "text/html": [
- "
\n",
- "\n",
- "
\n",
- " \n",
- " \n",
- " | \n",
- " Province/State | \n",
- " Country/Region | \n",
- " Lat | \n",
- " Long | \n",
- " 1/22/20 | \n",
- " 1/23/20 | \n",
- " 1/24/20 | \n",
- " 1/25/20 | \n",
- " 1/26/20 | \n",
- " 1/27/20 | \n",
- " ... | \n",
- " 6/12/21 | \n",
- " 6/13/21 | \n",
- " 6/14/21 | \n",
- " 6/15/21 | \n",
- " 6/16/21 | \n",
- " 6/17/21 | \n",
- " 6/18/21 | \n",
- " 6/19/21 | \n",
- " 6/20/21 | \n",
- " 6/21/21 | \n",
- "
\n",
- " \n",
- " \n",
- " \n",
- " | 119 | \n",
- " French Guiana | \n",
- " France | \n",
- " 3.933900 | \n",
- " -53.125800 | \n",
- " 0 | \n",
- " 0 | \n",
- " 0 | \n",
- " 0 | \n",
- " 0 | \n",
- " 0 | \n",
- " ... | \n",
- " 25506 | \n",
- " 25506 | \n",
- " 25506 | \n",
- " 25788 | \n",
- " 25950 | \n",
- " 26143 | \n",
- " 26143 | \n",
- " 26143 | \n",
- " 26143 | \n",
- " 26450 | \n",
- "
\n",
- " \n",
- " | 120 | \n",
- " French Polynesia | \n",
- " France | \n",
- " -17.679700 | \n",
- " 149.406800 | \n",
- " 0 | \n",
- " 0 | \n",
- " 0 | \n",
- " 0 | \n",
- " 0 | \n",
- " 0 | \n",
- " ... | \n",
- " 18930 | \n",
- " 18930 | \n",
- " 18939 | \n",
- " 18947 | \n",
- " 18952 | \n",
- " 18957 | \n",
- " 18963 | \n",
- " 18963 | \n",
- " 18963 | \n",
- " 18972 | \n",
- "
\n",
- " \n",
- " | 121 | \n",
- " Guadeloupe | \n",
- " France | \n",
- " 16.265000 | \n",
- " -61.551000 | \n",
- " 0 | \n",
- " 0 | \n",
- " 0 | \n",
- " 0 | \n",
- " 0 | \n",
- " 0 | \n",
- " ... | \n",
- " 17108 | \n",
- " 17288 | \n",
- " 17288 | \n",
- " 17288 | \n",
- " 17288 | \n",
- " 17288 | \n",
- " 17288 | \n",
- " 17288 | \n",
- " 17288 | \n",
- " 17427 | \n",
- "
\n",
- " \n",
- " | 122 | \n",
- " Martinique | \n",
- " France | \n",
- " 14.641500 | \n",
- " -61.024200 | \n",
- " 0 | \n",
- " 0 | \n",
- " 0 | \n",
- " 0 | \n",
- " 0 | \n",
- " 0 | \n",
- " ... | \n",
- " 12060 | \n",
- " 12130 | \n",
- " 12130 | \n",
- " 12130 | \n",
- " 12130 | \n",
- " 12130 | \n",
- " 12130 | \n",
- " 12130 | \n",
- " 12130 | \n",
- " 12199 | \n",
- "
\n",
- " \n",
- " | 123 | \n",
- " Mayotte | \n",
- " France | \n",
- " -12.827500 | \n",
- " 45.166244 | \n",
- " 0 | \n",
- " 0 | \n",
- " 0 | \n",
- " 0 | \n",
- " 0 | \n",
- " 0 | \n",
- " ... | \n",
- " 19373 | \n",
- " 19373 | \n",
- " 19378 | \n",
- " 19378 | \n",
- " 19378 | \n",
- " 19378 | \n",
- " 19389 | \n",
- " 19389 | \n",
- " 19389 | \n",
- " 19389 | \n",
- "
\n",
- " \n",
- " | 124 | \n",
- " New Caledonia | \n",
- " France | \n",
- " -20.904305 | \n",
- " 165.618042 | \n",
- " 0 | \n",
- " 0 | \n",
- " 0 | \n",
- " 0 | \n",
- " 0 | \n",
- " 0 | \n",
- " ... | \n",
- " 128 | \n",
- " 128 | \n",
- " 128 | \n",
- " 128 | \n",
- " 128 | \n",
- " 128 | \n",
- " 128 | \n",
- " 128 | \n",
- " 129 | \n",
- " 129 | \n",
- "
\n",
- " \n",
- " | 125 | \n",
- " Reunion | \n",
- " France | \n",
- " -21.115100 | \n",
- " 55.536400 | \n",
- " 0 | \n",
- " 0 | \n",
- " 0 | \n",
- " 0 | \n",
- " 0 | \n",
- " 0 | \n",
- " ... | \n",
- " 27235 | \n",
- " 27235 | \n",
- " 27235 | \n",
- " 27235 | \n",
- " 28441 | \n",
- " 28441 | \n",
- " 28441 | \n",
- " 28441 | \n",
- " 28441 | \n",
- " 28441 | \n",
- "
\n",
- " \n",
- " | 126 | \n",
- " Saint Barthelemy | \n",
- " France | \n",
- " 17.900000 | \n",
- " -62.833300 | \n",
- " 0 | \n",
- " 0 | \n",
- " 0 | \n",
- " 0 | \n",
- " 0 | \n",
- " 0 | \n",
- " ... | \n",
- " 1005 | \n",
- " 1005 | \n",
- " 1005 | \n",
- " 1005 | \n",
- " 1005 | \n",
- " 1005 | \n",
- " 1005 | \n",
- " 1005 | \n",
- " 1005 | \n",
- " 1005 | \n",
- "
\n",
- " \n",
- " | 127 | \n",
- " Saint Pierre and Miquelon | \n",
- " France | \n",
- " 46.885200 | \n",
- " -56.315900 | \n",
- " 0 | \n",
- " 0 | \n",
- " 0 | \n",
- " 0 | \n",
- " 0 | \n",
- " 0 | \n",
- " ... | \n",
- " 25 | \n",
- " 25 | \n",
- " 25 | \n",
- " 25 | \n",
- " 26 | \n",
- " 26 | \n",
- " 26 | \n",
- " 26 | \n",
- " 26 | \n",
- " 26 | \n",
- "
\n",
- " \n",
- " | 128 | \n",
- " St Martin | \n",
- " France | \n",
- " 18.070800 | \n",
- " -63.050100 | \n",
- " 0 | \n",
- " 0 | \n",
- " 0 | \n",
- " 0 | \n",
- " 0 | \n",
- " 0 | \n",
- " ... | \n",
- " 2040 | \n",
- " 2040 | \n",
- " 2040 | \n",
- " 2040 | \n",
- " 2040 | \n",
- " 2133 | \n",
- " 2133 | \n",
- " 2133 | \n",
- " 2133 | \n",
- " 2133 | \n",
- "
\n",
- " \n",
- " | 129 | \n",
- " Wallis and Futuna | \n",
- " France | \n",
- " -14.293800 | \n",
- " -178.116500 | \n",
- " 0 | \n",
- " 0 | \n",
- " 0 | \n",
- " 0 | \n",
- " 0 | \n",
- " 0 | \n",
- " ... | \n",
- " 445 | \n",
- " 445 | \n",
- " 445 | \n",
- " 445 | \n",
- " 445 | \n",
- " 445 | \n",
- " 445 | \n",
- " 445 | \n",
- " 445 | \n",
- " 445 | \n",
- "
\n",
- " \n",
- " | 130 | \n",
- " NaN | \n",
- " France | \n",
- " 46.227600 | \n",
- " 2.213700 | \n",
- " 0 | \n",
- " 0 | \n",
- " 2 | \n",
- " 3 | \n",
- " 3 | \n",
- " 3 | \n",
- " ... | \n",
- " 5675604 | \n",
- " 5678209 | \n",
- " 5678893 | \n",
- " 5681846 | \n",
- " 5683536 | \n",
- " 5685387 | \n",
- " 5688557 | \n",
- " 5691181 | \n",
- " 5692996 | \n",
- " 5692968 | \n",
- "
\n",
- " \n",
- "
\n",
- "
12 rows × 521 columns
\n",
- "
"
- ],
- "text/plain": [
- " Province/State Country/Region Lat Long 1/22/20 \\\n",
- "119 French Guiana France 3.933900 -53.125800 0 \n",
- "120 French Polynesia France -17.679700 149.406800 0 \n",
- "121 Guadeloupe France 16.265000 -61.551000 0 \n",
- "122 Martinique France 14.641500 -61.024200 0 \n",
- "123 Mayotte France -12.827500 45.166244 0 \n",
- "124 New Caledonia France -20.904305 165.618042 0 \n",
- "125 Reunion France -21.115100 55.536400 0 \n",
- "126 Saint Barthelemy France 17.900000 -62.833300 0 \n",
- "127 Saint Pierre and Miquelon France 46.885200 -56.315900 0 \n",
- "128 St Martin France 18.070800 -63.050100 0 \n",
- "129 Wallis and Futuna France -14.293800 -178.116500 0 \n",
- "130 NaN France 46.227600 2.213700 0 \n",
- "\n",
- " 1/23/20 1/24/20 1/25/20 1/26/20 1/27/20 ... 6/12/21 6/13/21 \\\n",
- "119 0 0 0 0 0 ... 25506 25506 \n",
- "120 0 0 0 0 0 ... 18930 18930 \n",
- "121 0 0 0 0 0 ... 17108 17288 \n",
- "122 0 0 0 0 0 ... 12060 12130 \n",
- "123 0 0 0 0 0 ... 19373 19373 \n",
- "124 0 0 0 0 0 ... 128 128 \n",
- "125 0 0 0 0 0 ... 27235 27235 \n",
- "126 0 0 0 0 0 ... 1005 1005 \n",
- "127 0 0 0 0 0 ... 25 25 \n",
- "128 0 0 0 0 0 ... 2040 2040 \n",
- "129 0 0 0 0 0 ... 445 445 \n",
- "130 0 2 3 3 3 ... 5675604 5678209 \n",
- "\n",
- " 6/14/21 6/15/21 6/16/21 6/17/21 6/18/21 6/19/21 6/20/21 6/21/21 \n",
- "119 25506 25788 25950 26143 26143 26143 26143 26450 \n",
- "120 18939 18947 18952 18957 18963 18963 18963 18972 \n",
- "121 17288 17288 17288 17288 17288 17288 17288 17427 \n",
- "122 12130 12130 12130 12130 12130 12130 12130 12199 \n",
- "123 19378 19378 19378 19378 19389 19389 19389 19389 \n",
- "124 128 128 128 128 128 128 129 129 \n",
- "125 27235 27235 28441 28441 28441 28441 28441 28441 \n",
- "126 1005 1005 1005 1005 1005 1005 1005 1005 \n",
- "127 25 25 26 26 26 26 26 26 \n",
- "128 2040 2040 2040 2133 2133 2133 2133 2133 \n",
- "129 445 445 445 445 445 445 445 445 \n",
- "130 5678893 5681846 5683536 5685387 5688557 5691181 5692996 5692968 \n",
- "\n",
- "[12 rows x 521 columns]"
- ]
- },
- "execution_count": 6,
- "metadata": {},
- "output_type": "execute_result"
- }
- ],
+ "outputs": [],
"source": [
- "%matplotlib inline\n",
- "import matplotlib.pyplot as plt\n",
"import pandas as pd\n",
"\n",
- "raw_data = pd.read_csv(data_file, sep=',')\n",
- "raw_data[raw_data['Country/Region'] == 'France']"
+ "# The comma is read_csv's default separator, so it does not need to be spelled out\n",
+ "raw_data = pd.read_csv(data_file)"
]
},
{
@@ -475,7 +83,7 @@
" # South Korea is labelled 'Korea, South' in the JHU CSSE time series; the previous\n",
" # spelling 'Korea,South' (no space) matched no row, so the country was silently dropped.\n",
" 'Japan', 'Korea, South', 'Netherlands', 'Portugal', 'Spain',\n",
" 'United Kingdom', 'US']\n",
"\n",
- "data = raw_data[raw_data['Country/Region'].isin(selectedCountries)]"
+ "# Keep only the rows whose country is one of the selected countries\n",
+ "selectedData = raw_data.loc[raw_data['Country/Region'].isin(selectedCountries)]"
]
},
{
@@ -489,6 +97,31 @@
"cell_type": "code",
"execution_count": 4,
"metadata": {},
+ "outputs": [],
+ "source": [
+ "# All rows whose country is China (the table lists China province by province)\n",
+ "dataChina = selectedData.loc[selectedData['Country/Region'] == 'China']"
+ ]
+ },
+ {
+ "cell_type": "code",
+ "execution_count": 5,
+ "metadata": {},
+ "outputs": [],
+ "source": [
+ "# Rows with no Province/State value (NaN) are the country-level rows\n",
+ "dataOther = selectedData[selectedData['Province/State'].isna()]"
+ ]
+ },
+ {
+ "cell_type": "markdown",
+ "metadata": {},
+ "source": [
+ "On peut finalement concaténer ces deux jeux de données."
+ ]
+ },
+ {
+ "cell_type": "code",
+ "execution_count": 6,
+ "metadata": {},
"outputs": [
{
"data": {
@@ -536,11 +169,35 @@
" \n",
" \n",
" \n",
+ " | 23 | \n",
+ " NaN | \n",
+ " Belgium | \n",
+ " 50.833300 | \n",
+ " 4.469936 | \n",
+ " 0 | \n",
+ " 0 | \n",
+ " 0 | \n",
+ " 0 | \n",
+ " 0 | \n",
+ " 0 | \n",
+ " ... | \n",
+ " 1075765 | \n",
+ " 1076338 | \n",
+ " 1076579 | \n",
+ " 1077087 | \n",
+ " 1077758 | \n",
+ " 1078251 | \n",
+ " 1078251 | \n",
+ " 1079084 | \n",
+ " 1079415 | \n",
+ " 1079640 | \n",
+ "
\n",
+ " \n",
" | 58 | \n",
" Anhui | \n",
" China | \n",
- " 31.8257 | \n",
- " 117.2264 | \n",
+ " 31.825700 | \n",
+ " 117.226400 | \n",
" 1 | \n",
" 9 | \n",
" 15 | \n",
@@ -563,8 +220,8 @@
" 59 | \n",
" Beijing | \n",
" China | \n",
- " 40.1824 | \n",
- " 116.4142 | \n",
+ " 40.182400 | \n",
+ " 116.414200 | \n",
" 14 | \n",
" 22 | \n",
" 36 | \n",
@@ -587,8 +244,8 @@
" 60 | \n",
" Chongqing | \n",
" China | \n",
- " 30.0572 | \n",
- " 107.8740 | \n",
+ " 30.057200 | \n",
+ " 107.874000 | \n",
" 6 | \n",
" 9 | \n",
" 27 | \n",
@@ -611,8 +268,8 @@
" 61 | \n",
" Fujian | \n",
" China | \n",
- " 26.0789 | \n",
- " 117.9874 | \n",
+ " 26.078900 | \n",
+ " 117.987400 | \n",
" 1 | \n",
" 5 | \n",
" 10 | \n",
@@ -635,8 +292,8 @@
" 62 | \n",
" Gansu | \n",
" China | \n",
- " 35.7518 | \n",
- " 104.2861 | \n",
+ " 35.751800 | \n",
+ " 104.286100 | \n",
" 0 | \n",
" 2 | \n",
" 2 | \n",
@@ -659,8 +316,8 @@
" 63 | \n",
" Guangdong | \n",
" China | \n",
- " 23.3417 | \n",
- " 113.4244 | \n",
+ " 23.341700 | \n",
+ " 113.424400 | \n",
" 26 | \n",
" 32 | \n",
" 53 | \n",
@@ -683,8 +340,8 @@
" 64 | \n",
" Guangxi | \n",
" China | \n",
- " 23.8298 | \n",
- " 108.7881 | \n",
+ " 23.829800 | \n",
+ " 108.788100 | \n",
" 2 | \n",
" 5 | \n",
" 23 | \n",
@@ -707,8 +364,8 @@
" 65 | \n",
" Guizhou | \n",
" China | \n",
- " 26.8154 | \n",
- " 106.8748 | \n",
+ " 26.815400 | \n",
+ " 106.874800 | \n",
" 1 | \n",
" 3 | \n",
" 3 | \n",
@@ -731,8 +388,8 @@
" 66 | \n",
" Hainan | \n",
" China | \n",
- " 19.1959 | \n",
- " 109.7453 | \n",
+ " 19.195900 | \n",
+ " 109.745300 | \n",
" 4 | \n",
" 5 | \n",
" 8 | \n",
@@ -755,8 +412,8 @@
" 67 | \n",
" Hebei | \n",
" China | \n",
- " 39.5490 | \n",
- " 116.1306 | \n",
+ " 39.549000 | \n",
+ " 116.130600 | \n",
" 1 | \n",
" 1 | \n",
" 2 | \n",
@@ -779,8 +436,8 @@
" 68 | \n",
" Heilongjiang | \n",
" China | \n",
- " 47.8620 | \n",
- " 127.7615 | \n",
+ " 47.862000 | \n",
+ " 127.761500 | \n",
" 0 | \n",
" 2 | \n",
" 4 | \n",
@@ -803,8 +460,8 @@
" 69 | \n",
" Henan | \n",
" China | \n",
- " 37.8957 | \n",
- " 114.9042 | \n",
+ " 37.895700 | \n",
+ " 114.904200 | \n",
" 5 | \n",
" 5 | \n",
" 9 | \n",
@@ -827,8 +484,8 @@
" 70 | \n",
" Hong Kong | \n",
" China | \n",
- " 22.3000 | \n",
- " 114.2000 | \n",
+ " 22.300000 | \n",
+ " 114.200000 | \n",
" 0 | \n",
" 2 | \n",
" 2 | \n",
@@ -851,8 +508,8 @@
" 71 | \n",
" Hubei | \n",
" China | \n",
- " 30.9756 | \n",
- " 112.2707 | \n",
+ " 30.975600 | \n",
+ " 112.270700 | \n",
" 444 | \n",
" 444 | \n",
" 549 | \n",
@@ -875,8 +532,8 @@
" 72 | \n",
" Hunan | \n",
" China | \n",
- " 27.6104 | \n",
- " 111.7088 | \n",
+ " 27.610400 | \n",
+ " 111.708800 | \n",
" 4 | \n",
" 9 | \n",
" 24 | \n",
@@ -899,8 +556,8 @@
" 73 | \n",
" Inner Mongolia | \n",
" China | \n",
- " 44.0935 | \n",
- " 113.9448 | \n",
+ " 44.093500 | \n",
+ " 113.944800 | \n",
" 0 | \n",
" 0 | \n",
" 1 | \n",
@@ -923,8 +580,8 @@
" 74 | \n",
" Jiangsu | \n",
" China | \n",
- " 32.9711 | \n",
- " 119.4550 | \n",
+ " 32.971100 | \n",
+ " 119.455000 | \n",
" 1 | \n",
" 5 | \n",
" 9 | \n",
@@ -947,8 +604,8 @@
" 75 | \n",
" Jiangxi | \n",
" China | \n",
- " 27.6140 | \n",
- " 115.7221 | \n",
+ " 27.614000 | \n",
+ " 115.722100 | \n",
" 2 | \n",
" 7 | \n",
" 18 | \n",
@@ -971,8 +628,8 @@
" 76 | \n",
" Jilin | \n",
" China | \n",
- " 43.6661 | \n",
- " 126.1923 | \n",
+ " 43.666100 | \n",
+ " 126.192300 | \n",
" 0 | \n",
" 1 | \n",
" 3 | \n",
@@ -995,8 +652,8 @@
" 77 | \n",
" Liaoning | \n",
" China | \n",
- " 41.2956 | \n",
- " 122.6085 | \n",
+ " 41.295600 | \n",
+ " 122.608500 | \n",
" 2 | \n",
" 3 | \n",
" 4 | \n",
@@ -1019,8 +676,8 @@
" 78 | \n",
" Macau | \n",
" China | \n",
- " 22.1667 | \n",
- " 113.5500 | \n",
+ " 22.166700 | \n",
+ " 113.550000 | \n",
" 1 | \n",
" 2 | \n",
" 2 | \n",
@@ -1043,8 +700,8 @@
" 79 | \n",
" Ningxia | \n",
" China | \n",
- " 37.2692 | \n",
- " 106.1655 | \n",
+ " 37.269200 | \n",
+ " 106.165500 | \n",
" 1 | \n",
" 1 | \n",
" 2 | \n",
@@ -1067,8 +724,8 @@
" 80 | \n",
" Qinghai | \n",
" China | \n",
- " 35.7452 | \n",
- " 95.9956 | \n",
+ " 35.745200 | \n",
+ " 95.995600 | \n",
" 0 | \n",
" 0 | \n",
" 0 | \n",
@@ -1091,8 +748,8 @@
" 81 | \n",
" Shaanxi | \n",
" China | \n",
- " 35.1917 | \n",
- " 108.8701 | \n",
+ " 35.191700 | \n",
+ " 108.870100 | \n",
" 0 | \n",
" 3 | \n",
" 5 | \n",
@@ -1115,8 +772,8 @@
" 82 | \n",
" Shandong | \n",
" China | \n",
- " 36.3427 | \n",
- " 118.1498 | \n",
+ " 36.342700 | \n",
+ " 118.149800 | \n",
" 2 | \n",
" 6 | \n",
" 15 | \n",
@@ -1139,8 +796,8 @@
" 83 | \n",
" Shanghai | \n",
" China | \n",
- " 31.2020 | \n",
- " 121.4491 | \n",
+ " 31.202000 | \n",
+ " 121.449100 | \n",
" 9 | \n",
" 16 | \n",
" 20 | \n",
@@ -1163,8 +820,8 @@
" 84 | \n",
" Shanxi | \n",
" China | \n",
- " 37.5777 | \n",
- " 112.2922 | \n",
+ " 37.577700 | \n",
+ " 112.292200 | \n",
" 1 | \n",
" 1 | \n",
" 1 | \n",
@@ -1187,8 +844,8 @@
" 85 | \n",
" Sichuan | \n",
" China | \n",
- " 30.6171 | \n",
- " 102.7103 | \n",
+ " 30.617100 | \n",
+ " 102.710300 | \n",
" 5 | \n",
" 8 | \n",
" 15 | \n",
@@ -1211,8 +868,8 @@
" 86 | \n",
" Tianjin | \n",
" China | \n",
- " 39.3054 | \n",
- " 117.3230 | \n",
+ " 39.305400 | \n",
+ " 117.323000 | \n",
" 4 | \n",
" 4 | \n",
" 8 | \n",
@@ -1235,8 +892,8 @@
" 87 | \n",
" Tibet | \n",
" China | \n",
- " 31.6927 | \n",
- " 88.0924 | \n",
+ " 31.692700 | \n",
+ " 88.092400 | \n",
" 0 | \n",
" 0 | \n",
" 0 | \n",
@@ -1283,8 +940,8 @@
" 89 | \n",
" Xinjiang | \n",
" China | \n",
- " 41.1129 | \n",
- " 85.2401 | \n",
+ " 41.112900 | \n",
+ " 85.240100 | \n",
" 0 | \n",
" 2 | \n",
" 2 | \n",
@@ -1307,8 +964,8 @@
" 90 | \n",
" Yunnan | \n",
" China | \n",
- " 24.9740 | \n",
- " 101.4870 | \n",
+ " 24.974000 | \n",
+ " 101.487000 | \n",
" 1 | \n",
" 2 | \n",
" 5 | \n",
@@ -1331,8 +988,8 @@
" 91 | \n",
" Zhejiang | \n",
" China | \n",
- " 29.1832 | \n",
- " 120.0934 | \n",
+ " 29.183200 | \n",
+ " 120.093400 | \n",
" 10 | \n",
" 27 | \n",
" 43 | \n",
@@ -1351,207 +1008,6 @@
" 1379 | \n",
" 1383 | \n",
"
\n",
- " \n",
- "\n",
- "34 rows × 521 columns
\n",
- ""
- ],
- "text/plain": [
- " Province/State Country/Region Lat Long 1/22/20 1/23/20 \\\n",
- "58 Anhui China 31.8257 117.2264 1 9 \n",
- "59 Beijing China 40.1824 116.4142 14 22 \n",
- "60 Chongqing China 30.0572 107.8740 6 9 \n",
- "61 Fujian China 26.0789 117.9874 1 5 \n",
- "62 Gansu China 35.7518 104.2861 0 2 \n",
- "63 Guangdong China 23.3417 113.4244 26 32 \n",
- "64 Guangxi China 23.8298 108.7881 2 5 \n",
- "65 Guizhou China 26.8154 106.8748 1 3 \n",
- "66 Hainan China 19.1959 109.7453 4 5 \n",
- "67 Hebei China 39.5490 116.1306 1 1 \n",
- "68 Heilongjiang China 47.8620 127.7615 0 2 \n",
- "69 Henan China 37.8957 114.9042 5 5 \n",
- "70 Hong Kong China 22.3000 114.2000 0 2 \n",
- "71 Hubei China 30.9756 112.2707 444 444 \n",
- "72 Hunan China 27.6104 111.7088 4 9 \n",
- "73 Inner Mongolia China 44.0935 113.9448 0 0 \n",
- "74 Jiangsu China 32.9711 119.4550 1 5 \n",
- "75 Jiangxi China 27.6140 115.7221 2 7 \n",
- "76 Jilin China 43.6661 126.1923 0 1 \n",
- "77 Liaoning China 41.2956 122.6085 2 3 \n",
- "78 Macau China 22.1667 113.5500 1 2 \n",
- "79 Ningxia China 37.2692 106.1655 1 1 \n",
- "80 Qinghai China 35.7452 95.9956 0 0 \n",
- "81 Shaanxi China 35.1917 108.8701 0 3 \n",
- "82 Shandong China 36.3427 118.1498 2 6 \n",
- "83 Shanghai China 31.2020 121.4491 9 16 \n",
- "84 Shanxi China 37.5777 112.2922 1 1 \n",
- "85 Sichuan China 30.6171 102.7103 5 8 \n",
- "86 Tianjin China 39.3054 117.3230 4 4 \n",
- "87 Tibet China 31.6927 88.0924 0 0 \n",
- "88 Unknown China NaN NaN 0 0 \n",
- "89 Xinjiang China 41.1129 85.2401 0 2 \n",
- "90 Yunnan China 24.9740 101.4870 1 2 \n",
- "91 Zhejiang China 29.1832 120.0934 10 27 \n",
- "\n",
- " 1/24/20 1/25/20 1/26/20 1/27/20 ... 6/12/21 6/13/21 6/14/21 \\\n",
- "58 15 39 60 70 ... 1004 1004 1004 \n",
- "59 36 41 68 80 ... 1069 1070 1071 \n",
- "60 27 57 75 110 ... 598 598 598 \n",
- "61 10 18 35 59 ... 637 637 638 \n",
- "62 2 4 7 14 ... 194 194 194 \n",
- "63 53 78 111 151 ... 2618 2625 2635 \n",
- "64 23 23 36 46 ... 275 275 275 \n",
- "65 3 4 5 7 ... 147 147 147 \n",
- "66 8 19 22 33 ... 188 188 188 \n",
- "67 2 8 13 18 ... 1317 1317 1317 \n",
- "68 4 9 15 21 ... 1612 1612 1612 \n",
- "69 9 32 83 128 ... 1316 1316 1316 \n",
- "70 2 5 8 8 ... 11877 11877 11878 \n",
- "71 549 761 1058 1423 ... 68159 68159 68159 \n",
- "72 24 43 69 100 ... 1051 1051 1051 \n",
- "73 1 7 7 11 ... 390 393 393 \n",
- "74 9 18 33 47 ... 735 736 736 \n",
- "75 18 18 36 72 ... 937 937 937 \n",
- "76 3 4 4 6 ... 573 573 573 \n",
- "77 4 17 21 27 ... 426 426 426 \n",
- "78 2 2 5 6 ... 52 52 52 \n",
- "79 2 3 4 7 ... 76 76 76 \n",
- "80 0 1 1 6 ... 18 18 18 \n",
- "81 5 15 22 35 ... 622 622 622 \n",
- "82 15 27 46 75 ... 883 883 883 \n",
- "83 20 33 40 53 ... 2155 2160 2165 \n",
- "84 1 6 9 13 ... 253 253 253 \n",
- "85 15 28 44 69 ... 1050 1054 1055 \n",
- "86 8 10 14 23 ... 398 398 398 \n",
- "87 0 0 0 0 ... 1 1 1 \n",
- "88 0 0 0 0 ... 0 0 0 \n",
- "89 2 3 4 5 ... 980 980 980 \n",
- "90 5 11 16 26 ... 374 376 377 \n",
- "91 43 62 104 128 ... 1372 1372 1373 \n",
- "\n",
- " 6/15/21 6/16/21 6/17/21 6/18/21 6/19/21 6/20/21 6/21/21 \n",
- "58 1004 1004 1004 1004 1004 1004 1004 \n",
- "59 1071 1072 1072 1073 1073 1075 1075 \n",
- "60 598 598 598 598 598 598 598 \n",
- "61 638 641 646 650 651 652 659 \n",
- "62 194 194 194 194 194 194 194 \n",
- "63 2650 2657 2666 2680 2692 2699 2706 \n",
- "64 275 275 275 275 275 275 275 \n",
- "65 147 147 147 147 147 147 147 \n",
- "66 188 188 188 188 188 188 188 \n",
- "67 1317 1317 1317 1317 1317 1317 1317 \n",
- "68 1612 1612 1612 1612 1612 1612 1612 \n",
- "69 1316 1316 1316 1316 1316 1317 1317 \n",
- "70 11880 11881 11881 11884 11885 11886 11889 \n",
- "71 68159 68160 68160 68160 68160 68160 68160 \n",
- "72 1051 1051 1051 1051 1051 1051 1051 \n",
- "73 393 393 393 393 393 393 394 \n",
- "74 738 739 739 739 739 740 740 \n",
- "75 937 937 937 937 937 937 937 \n",
- "76 573 573 573 573 573 573 573 \n",
- "77 426 426 426 426 426 426 426 \n",
- "78 52 52 52 53 53 53 53 \n",
- "79 76 76 76 76 76 76 76 \n",
- "80 18 18 18 18 18 18 18 \n",
- "81 622 622 622 624 624 624 624 \n",
- "82 883 883 883 883 883 883 883 \n",
- "83 2168 2170 2173 2179 2182 2183 2184 \n",
- "84 253 253 253 253 253 253 253 \n",
- "85 1056 1057 1057 1057 1058 1059 1064 \n",
- "86 398 398 399 399 399 399 399 \n",
- "87 1 1 1 1 1 1 1 \n",
- "88 0 0 0 0 0 0 0 \n",
- "89 980 980 980 980 980 980 980 \n",
- "90 377 380 382 384 388 391 391 \n",
- "91 1373 1373 1376 1377 1379 1379 1383 \n",
- "\n",
- "[34 rows x 521 columns]"
- ]
- },
- "execution_count": 4,
- "metadata": {},
- "output_type": "execute_result"
- }
- ],
- "source": [
- "dataChina = data[data['Country/Region'] == 'China']\n",
- "dataChina"
- ]
- },
- {
- "cell_type": "code",
- "execution_count": 7,
- "metadata": {},
- "outputs": [
- {
- "data": {
- "text/html": [
- "\n",
- "\n",
- "
\n",
- " \n",
- " \n",
- " | \n",
- " Province/State | \n",
- " Country/Region | \n",
- " Lat | \n",
- " Long | \n",
- " 1/22/20 | \n",
- " 1/23/20 | \n",
- " 1/24/20 | \n",
- " 1/25/20 | \n",
- " 1/26/20 | \n",
- " 1/27/20 | \n",
- " ... | \n",
- " 6/12/21 | \n",
- " 6/13/21 | \n",
- " 6/14/21 | \n",
- " 6/15/21 | \n",
- " 6/16/21 | \n",
- " 6/17/21 | \n",
- " 6/18/21 | \n",
- " 6/19/21 | \n",
- " 6/20/21 | \n",
- " 6/21/21 | \n",
- "
\n",
- " \n",
- " \n",
- " \n",
- " | 23 | \n",
- " NaN | \n",
- " Belgium | \n",
- " 50.833300 | \n",
- " 4.469936 | \n",
- " 0 | \n",
- " 0 | \n",
- " 0 | \n",
- " 0 | \n",
- " 0 | \n",
- " 0 | \n",
- " ... | \n",
- " 1075765 | \n",
- " 1076338 | \n",
- " 1076579 | \n",
- " 1077087 | \n",
- " 1077758 | \n",
- " 1078251 | \n",
- " 1078251 | \n",
- " 1079084 | \n",
- " 1079415 | \n",
- " 1079640 | \n",
- "
\n",
" \n",
" | 130 | \n",
" NaN | \n",
@@ -1794,25 +1250,93 @@
"
\n",
" \n",
"
\n",
- "
11 rows × 521 columns
\n",
+ "
45 rows × 521 columns
\n",
"
"
],
"text/plain": [
- " Province/State Country/Region Lat Long 1/22/20 1/23/20 \\\n",
- "23 NaN Belgium 50.833300 4.469936 0 0 \n",
- "130 NaN France 46.227600 2.213700 0 0 \n",
- "134 NaN Germany 51.165691 10.451526 0 0 \n",
- "149 NaN Iran 32.427908 53.688046 0 0 \n",
- "153 NaN Italy 41.871940 12.567380 0 0 \n",
- "155 NaN Japan 36.204824 138.252924 2 2 \n",
- "197 NaN Netherlands 52.132600 5.291300 0 0 \n",
- "214 NaN Portugal 39.399900 -8.224500 0 0 \n",
- "237 NaN Spain 40.463667 -3.749220 0 0 \n",
- "253 NaN US 40.000000 -100.000000 1 1 \n",
- "268 NaN United Kingdom 55.378100 -3.436000 0 0 \n",
+ " Province/State Country/Region Lat Long 1/22/20 1/23/20 \\\n",
+ "23 NaN Belgium 50.833300 4.469936 0 0 \n",
+ "58 Anhui China 31.825700 117.226400 1 9 \n",
+ "59 Beijing China 40.182400 116.414200 14 22 \n",
+ "60 Chongqing China 30.057200 107.874000 6 9 \n",
+ "61 Fujian China 26.078900 117.987400 1 5 \n",
+ "62 Gansu China 35.751800 104.286100 0 2 \n",
+ "63 Guangdong China 23.341700 113.424400 26 32 \n",
+ "64 Guangxi China 23.829800 108.788100 2 5 \n",
+ "65 Guizhou China 26.815400 106.874800 1 3 \n",
+ "66 Hainan China 19.195900 109.745300 4 5 \n",
+ "67 Hebei China 39.549000 116.130600 1 1 \n",
+ "68 Heilongjiang China 47.862000 127.761500 0 2 \n",
+ "69 Henan China 37.895700 114.904200 5 5 \n",
+ "70 Hong Kong China 22.300000 114.200000 0 2 \n",
+ "71 Hubei China 30.975600 112.270700 444 444 \n",
+ "72 Hunan China 27.610400 111.708800 4 9 \n",
+ "73 Inner Mongolia China 44.093500 113.944800 0 0 \n",
+ "74 Jiangsu China 32.971100 119.455000 1 5 \n",
+ "75 Jiangxi China 27.614000 115.722100 2 7 \n",
+ "76 Jilin China 43.666100 126.192300 0 1 \n",
+ "77 Liaoning China 41.295600 122.608500 2 3 \n",
+ "78 Macau China 22.166700 113.550000 1 2 \n",
+ "79 Ningxia China 37.269200 106.165500 1 1 \n",
+ "80 Qinghai China 35.745200 95.995600 0 0 \n",
+ "81 Shaanxi China 35.191700 108.870100 0 3 \n",
+ "82 Shandong China 36.342700 118.149800 2 6 \n",
+ "83 Shanghai China 31.202000 121.449100 9 16 \n",
+ "84 Shanxi China 37.577700 112.292200 1 1 \n",
+ "85 Sichuan China 30.617100 102.710300 5 8 \n",
+ "86 Tianjin China 39.305400 117.323000 4 4 \n",
+ "87 Tibet China 31.692700 88.092400 0 0 \n",
+ "88 Unknown China NaN NaN 0 0 \n",
+ "89 Xinjiang China 41.112900 85.240100 0 2 \n",
+ "90 Yunnan China 24.974000 101.487000 1 2 \n",
+ "91 Zhejiang China 29.183200 120.093400 10 27 \n",
+ "130 NaN France 46.227600 2.213700 0 0 \n",
+ "134 NaN Germany 51.165691 10.451526 0 0 \n",
+ "149 NaN Iran 32.427908 53.688046 0 0 \n",
+ "153 NaN Italy 41.871940 12.567380 0 0 \n",
+ "155 NaN Japan 36.204824 138.252924 2 2 \n",
+ "197 NaN Netherlands 52.132600 5.291300 0 0 \n",
+ "214 NaN Portugal 39.399900 -8.224500 0 0 \n",
+ "237 NaN Spain 40.463667 -3.749220 0 0 \n",
+ "253 NaN US 40.000000 -100.000000 1 1 \n",
+ "268 NaN United Kingdom 55.378100 -3.436000 0 0 \n",
"\n",
" 1/24/20 1/25/20 1/26/20 1/27/20 ... 6/12/21 6/13/21 \\\n",
"23 0 0 0 0 ... 1075765 1076338 \n",
+ "58 15 39 60 70 ... 1004 1004 \n",
+ "59 36 41 68 80 ... 1069 1070 \n",
+ "60 27 57 75 110 ... 598 598 \n",
+ "61 10 18 35 59 ... 637 637 \n",
+ "62 2 4 7 14 ... 194 194 \n",
+ "63 53 78 111 151 ... 2618 2625 \n",
+ "64 23 23 36 46 ... 275 275 \n",
+ "65 3 4 5 7 ... 147 147 \n",
+ "66 8 19 22 33 ... 188 188 \n",
+ "67 2 8 13 18 ... 1317 1317 \n",
+ "68 4 9 15 21 ... 1612 1612 \n",
+ "69 9 32 83 128 ... 1316 1316 \n",
+ "70 2 5 8 8 ... 11877 11877 \n",
+ "71 549 761 1058 1423 ... 68159 68159 \n",
+ "72 24 43 69 100 ... 1051 1051 \n",
+ "73 1 7 7 11 ... 390 393 \n",
+ "74 9 18 33 47 ... 735 736 \n",
+ "75 18 18 36 72 ... 937 937 \n",
+ "76 3 4 4 6 ... 573 573 \n",
+ "77 4 17 21 27 ... 426 426 \n",
+ "78 2 2 5 6 ... 52 52 \n",
+ "79 2 3 4 7 ... 76 76 \n",
+ "80 0 1 1 6 ... 18 18 \n",
+ "81 5 15 22 35 ... 622 622 \n",
+ "82 15 27 46 75 ... 883 883 \n",
+ "83 20 33 40 53 ... 2155 2160 \n",
+ "84 1 6 9 13 ... 253 253 \n",
+ "85 15 28 44 69 ... 1050 1054 \n",
+ "86 8 10 14 23 ... 398 398 \n",
+ "87 0 0 0 0 ... 1 1 \n",
+ "88 0 0 0 0 ... 0 0 \n",
+ "89 2 3 4 5 ... 980 980 \n",
+ "90 5 11 16 26 ... 374 376 \n",
+ "91 43 62 104 128 ... 1372 1372 \n",
"130 2 3 3 3 ... 5675604 5678209 \n",
"134 0 0 0 1 ... 3722295 3723295 \n",
"149 0 0 0 0 ... 3020522 3028717 \n",
@@ -1826,6 +1350,40 @@
"\n",
" 6/14/21 6/15/21 6/16/21 6/17/21 6/18/21 6/19/21 6/20/21 \\\n",
"23 1076579 1077087 1077758 1078251 1078251 1079084 1079415 \n",
+ "58 1004 1004 1004 1004 1004 1004 1004 \n",
+ "59 1071 1071 1072 1072 1073 1073 1075 \n",
+ "60 598 598 598 598 598 598 598 \n",
+ "61 638 638 641 646 650 651 652 \n",
+ "62 194 194 194 194 194 194 194 \n",
+ "63 2635 2650 2657 2666 2680 2692 2699 \n",
+ "64 275 275 275 275 275 275 275 \n",
+ "65 147 147 147 147 147 147 147 \n",
+ "66 188 188 188 188 188 188 188 \n",
+ "67 1317 1317 1317 1317 1317 1317 1317 \n",
+ "68 1612 1612 1612 1612 1612 1612 1612 \n",
+ "69 1316 1316 1316 1316 1316 1316 1317 \n",
+ "70 11878 11880 11881 11881 11884 11885 11886 \n",
+ "71 68159 68159 68160 68160 68160 68160 68160 \n",
+ "72 1051 1051 1051 1051 1051 1051 1051 \n",
+ "73 393 393 393 393 393 393 393 \n",
+ "74 736 738 739 739 739 739 740 \n",
+ "75 937 937 937 937 937 937 937 \n",
+ "76 573 573 573 573 573 573 573 \n",
+ "77 426 426 426 426 426 426 426 \n",
+ "78 52 52 52 52 53 53 53 \n",
+ "79 76 76 76 76 76 76 76 \n",
+ "80 18 18 18 18 18 18 18 \n",
+ "81 622 622 622 622 624 624 624 \n",
+ "82 883 883 883 883 883 883 883 \n",
+ "83 2165 2168 2170 2173 2179 2182 2183 \n",
+ "84 253 253 253 253 253 253 253 \n",
+ "85 1055 1056 1057 1057 1057 1058 1059 \n",
+ "86 398 398 398 399 399 399 399 \n",
+ "87 1 1 1 1 1 1 1 \n",
+ "88 0 0 0 0 0 0 0 \n",
+ "89 980 980 980 980 980 980 980 \n",
+ "90 377 377 380 382 384 388 391 \n",
+ "91 1373 1373 1373 1376 1377 1379 1379 \n",
"130 5678893 5681846 5683536 5685387 5688557 5691181 5692996 \n",
"134 3724168 3725328 3726767 3727668 3728601 3729597 3730126 \n",
"149 3039432 3049648 3060135 3070426 3080526 3086974 3095135 \n",
@@ -1839,6 +1397,40 @@
"\n",
" 6/21/21 \n",
"23 1079640 \n",
+ "58 1004 \n",
+ "59 1075 \n",
+ "60 598 \n",
+ "61 659 \n",
+ "62 194 \n",
+ "63 2706 \n",
+ "64 275 \n",
+ "65 147 \n",
+ "66 188 \n",
+ "67 1317 \n",
+ "68 1612 \n",
+ "69 1317 \n",
+ "70 11889 \n",
+ "71 68160 \n",
+ "72 1051 \n",
+ "73 394 \n",
+ "74 740 \n",
+ "75 937 \n",
+ "76 573 \n",
+ "77 426 \n",
+ "78 53 \n",
+ "79 76 \n",
+ "80 18 \n",
+ "81 624 \n",
+ "82 883 \n",
+ "83 2184 \n",
+ "84 253 \n",
+ "85 1064 \n",
+ "86 399 \n",
+ "87 1 \n",
+ "88 0 \n",
+ "89 980 \n",
+ "90 391 \n",
+ "91 1383 \n",
"130 5692968 \n",
"134 3730619 \n",
"149 3105620 \n",
@@ -1850,17 +1442,113 @@
"253 33554275 \n",
"268 4640507 \n",
"\n",
- "[11 rows x 521 columns]"
+ "[45 rows x 521 columns]"
]
},
- "execution_count": 7,
+ "execution_count": 6,
"metadata": {},
"output_type": "execute_result"
}
],
"source": [
- "dataOther = data[data['Province/State'] != data['Province/State']]\n",
- "dataOther"
+ "# Stack the country-level rows and the Chinese provinces, then sort the rows by index\n",
+ "data = pd.concat((dataOther, dataChina), axis=0).sort_index()\n",
+ "data"
+ ]
+ },
+ {
+ "cell_type": "markdown",
+ "metadata": {},
+ "source": [
+ "On remarque d'ailleurs, pour la Chine (`index 88`), une ligne vide sans intérêt pour la suite de nos travaux car pleine de *zéros* ; on la supprime."
+ ]
+ },
+ {
+ "cell_type": "code",
+ "execution_count": 7,
+ "metadata": {},
+ "outputs": [],
+ "source": [
+ "# errors='ignore' keeps this cell re-runnable: once row 88 is gone, dropping it again is a no-op\n",
+ "data = data.drop([88], errors='ignore')"
+ ]
+ },
+ {
+ "cell_type": "markdown",
+ "metadata": {},
+ "source": [
+ "## Visualisation des données\n",
+ "\n",
+ "On cherche à visualiser le nombre cumulé de cas à chaque date disponible.\n",
+ "Présentons dans un premier temps les données telles quelles."
+ ]
+ },
+ {
+ "cell_type": "code",
+ "execution_count": 8,
+ "metadata": {},
+ "outputs": [],
+ "source": [
+ "%matplotlib inline\n",
+ "import matplotlib.pyplot as plt\n",
+ "\n",
+ "# Split the table into date labels, locations and cumulative case counts.\n",
+ "# `.values` replaces `DataFrame.get_values()`, which was deprecated in pandas 0.25\n",
+ "# and removed in pandas 1.0.\n",
+ "dates = data.columns[4:]          # date labels (columns 0-3 are Province/State, Country/Region, Lat, Long)\n",
+ "place = data.iloc[:, :2].values   # one [Province/State, Country/Region] pair per row\n",
+ "cases = data.iloc[:, 4:].values   # cumulative case counts: one row per location, one column per date"
+ ]
+ },
+ {
+ "cell_type": "markdown",
+ "metadata": {},
+ "source": [
+ "Reformatons les noms des différents pays/régions pour plus de lisibilité. Passons ainsi du format\n",
+ " `[Province, Country]`\n",
+ "au format\n",
+ " `[Country (-Province?)]`\n",
+ "où l'on ne précise la province que si c'est nécessaire."
+ ]
+ },
+ {
+ "cell_type": "code",
+ "execution_count": 9,
+ "metadata": {},
+ "outputs": [],
+ "source": [
+ "def convert_location_names(place) :\n",
+ "    \"\"\"Build one display label per (province, country) row.\n",
+ "\n",
+ "    place: 2-D array-like whose rows are (province, country) pairs; the province\n",
+ "    is NaN when the row describes a whole country.\n",
+ "\n",
+ "    Returns a list of strings: 'Country - Province' when a province is given,\n",
+ "    plain 'Country' otherwise.\n",
+ "    \"\"\"\n",
+ "    labels = []\n",
+ "    for province, country in place :\n",
+ "        if pd.isna(province) :\n",
+ "            labels.append(country)\n",
+ "        else :\n",
+ "            labels.append(country + \" - \" + province)\n",
+ "    return labels\n",
+ "\n",
+ "# Rebuild the labels from `data` rather than from `place` itself, so that this cell can be\n",
+ "# re-executed safely (feeding the resulting list of labels back into the function would fail).\n",
+ "place = convert_location_names(data.iloc[:, :2].values)"
+ ]
+ },
+ {
+ "cell_type": "code",
+ "execution_count": 16,
+ "metadata": {},
+ "outputs": [
+ {
+ "data": {
+ "image/png": "\n",
+ "text/plain": [
+ ""
+ ]
+ },
+ "metadata": {
+ "needs_background": "light"
+ },
+ "output_type": "display_data"
+ }
+ ],
+ "source": [
+ "# Column labels look like '1/22/20' (month/day/year). Turning them into real dates lets\n",
+ "# matplotlib choose a small number of readable ticks instead of printing every date.\n",
+ "plot_dates = pd.to_datetime(dates, format='%m/%d/%y').to_pydatetime()\n",
+ "\n",
+ "fig, ax = plt.subplots(figsize=(14, 7))\n",
+ "for i, p in enumerate(place) :\n",
+ "    ax.plot(plot_dates, cases[i, :], label=p)\n",
+ "\n",
+ "ax.set_xlabel('Date')\n",
+ "ax.set_ylabel('Nombre cumulé de cas')\n",
+ "ax.set_title('Nombre cumulé de cas par pays / région')\n",
+ "# The curve labels are only visible once a legend is drawn; it is placed outside the axes\n",
+ "# so that it does not hide the curves.\n",
+ "ax.legend(loc='center left', bbox_to_anchor=(1.0, 0.5), ncol=2, fontsize='small')\n",
+ "fig.autofmt_xdate()\n",
+ "\n",
+ "plt.show()"
]
},
{