"Looks good so lets draw the \"graph showing the evolution of the cumulative number of cases over time for: Belgium, China (all provinces except Hong Kong), China, Hong-Kong, France except Dom/Tom, Germany, Iran, Italy, Japan, Korea South, Netherlands without the colonies, Portugal, Spain, United Kingdom without the colonies, US.\"\n",
"\n",
"Unfortunately we cannot take the data as is as there are some special cases:"
]
},
{
"cell_type": "code",
"execution_count": 7,
"metadata": {},
"outputs": [
{
"data": {
"text/html": [
"<div>\n",
"<style scoped>\n",
" .dataframe tbody tr th:only-of-type {\n",
" vertical-align: middle;\n",
" }\n",
"\n",
" .dataframe tbody tr th {\n",
" vertical-align: top;\n",
" }\n",
"\n",
" .dataframe thead th {\n",
" text-align: right;\n",
" }\n",
"</style>\n",
"<table border=\"1\" class=\"dataframe\">\n",
" <thead>\n",
" <tr style=\"text-align: right;\">\n",
" <th></th>\n",
" <th>Province/State</th>\n",
" <th>Country/Region</th>\n",
" <th>Lat</th>\n",
" <th>Long</th>\n",
" <th>1/22/20</th>\n",
" <th>1/23/20</th>\n",
" <th>1/24/20</th>\n",
" <th>1/25/20</th>\n",
" <th>1/26/20</th>\n",
" <th>1/27/20</th>\n",
" <th>...</th>\n",
" <th>5/10/20</th>\n",
" <th>5/11/20</th>\n",
" <th>5/12/20</th>\n",
" <th>5/13/20</th>\n",
" <th>5/14/20</th>\n",
" <th>5/15/20</th>\n",
" <th>5/16/20</th>\n",
" <th>5/17/20</th>\n",
" <th>5/18/20</th>\n",
" <th>5/19/20</th>\n",
" </tr>\n",
" </thead>\n",
" <tbody>\n",
" <tr>\n",
" <th>107</th>\n",
" <td>French Guiana</td>\n",
" <td>France</td>\n",
" <td>3.9339</td>\n",
" <td>-53.1258</td>\n",
" <td>0</td>\n",
" <td>0</td>\n",
" <td>0</td>\n",
" <td>0</td>\n",
" <td>0</td>\n",
" <td>0</td>\n",
" <td>...</td>\n",
" <td>144</td>\n",
" <td>144</td>\n",
" <td>144</td>\n",
" <td>153</td>\n",
" <td>164</td>\n",
" <td>189</td>\n",
" <td>197</td>\n",
" <td>197</td>\n",
" <td>210</td>\n",
" <td>218</td>\n",
" </tr>\n",
" <tr>\n",
" <th>108</th>\n",
" <td>French Polynesia</td>\n",
" <td>France</td>\n",
" <td>-17.6797</td>\n",
" <td>149.4068</td>\n",
" <td>0</td>\n",
" <td>0</td>\n",
" <td>0</td>\n",
" <td>0</td>\n",
" <td>0</td>\n",
" <td>0</td>\n",
" <td>...</td>\n",
" <td>60</td>\n",
" <td>60</td>\n",
" <td>60</td>\n",
" <td>60</td>\n",
" <td>60</td>\n",
" <td>60</td>\n",
" <td>60</td>\n",
" <td>60</td>\n",
" <td>60</td>\n",
" <td>60</td>\n",
" </tr>\n",
" <tr>\n",
" <th>109</th>\n",
" <td>Guadeloupe</td>\n",
" <td>France</td>\n",
" <td>16.2500</td>\n",
" <td>-61.5833</td>\n",
" <td>0</td>\n",
" <td>0</td>\n",
" <td>0</td>\n",
" <td>0</td>\n",
" <td>0</td>\n",
" <td>0</td>\n",
" <td>...</td>\n",
" <td>154</td>\n",
" <td>154</td>\n",
" <td>155</td>\n",
" <td>155</td>\n",
" <td>155</td>\n",
" <td>155</td>\n",
" <td>155</td>\n",
" <td>155</td>\n",
" <td>155</td>\n",
" <td>155</td>\n",
" </tr>\n",
" <tr>\n",
" <th>110</th>\n",
" <td>Mayotte</td>\n",
" <td>France</td>\n",
" <td>-12.8275</td>\n",
" <td>45.1662</td>\n",
" <td>0</td>\n",
" <td>0</td>\n",
" <td>0</td>\n",
" <td>0</td>\n",
" <td>0</td>\n",
" <td>0</td>\n",
" <td>...</td>\n",
" <td>1023</td>\n",
" <td>1023</td>\n",
" <td>1095</td>\n",
" <td>1143</td>\n",
" <td>1210</td>\n",
" <td>1210</td>\n",
" <td>1312</td>\n",
" <td>1342</td>\n",
" <td>1370</td>\n",
" <td>1370</td>\n",
" </tr>\n",
" <tr>\n",
" <th>111</th>\n",
" <td>New Caledonia</td>\n",
" <td>France</td>\n",
" <td>-20.9043</td>\n",
" <td>165.6180</td>\n",
" <td>0</td>\n",
" <td>0</td>\n",
" <td>0</td>\n",
" <td>0</td>\n",
" <td>0</td>\n",
" <td>0</td>\n",
" <td>...</td>\n",
" <td>18</td>\n",
" <td>18</td>\n",
" <td>18</td>\n",
" <td>18</td>\n",
" <td>18</td>\n",
" <td>18</td>\n",
" <td>18</td>\n",
" <td>18</td>\n",
" <td>18</td>\n",
" <td>18</td>\n",
" </tr>\n",
" <tr>\n",
" <th>112</th>\n",
" <td>Reunion</td>\n",
" <td>France</td>\n",
" <td>-21.1351</td>\n",
" <td>55.2471</td>\n",
" <td>0</td>\n",
" <td>0</td>\n",
" <td>0</td>\n",
" <td>0</td>\n",
" <td>0</td>\n",
" <td>0</td>\n",
" <td>...</td>\n",
" <td>436</td>\n",
" <td>436</td>\n",
" <td>437</td>\n",
" <td>439</td>\n",
" <td>440</td>\n",
" <td>441</td>\n",
" <td>443</td>\n",
" <td>443</td>\n",
" <td>446</td>\n",
" <td>446</td>\n",
" </tr>\n",
" <tr>\n",
" <th>113</th>\n",
" <td>Saint Barthelemy</td>\n",
" <td>France</td>\n",
" <td>17.9000</td>\n",
" <td>-62.8333</td>\n",
" <td>0</td>\n",
" <td>0</td>\n",
" <td>0</td>\n",
" <td>0</td>\n",
" <td>0</td>\n",
" <td>0</td>\n",
" <td>...</td>\n",
" <td>6</td>\n",
" <td>6</td>\n",
" <td>6</td>\n",
" <td>6</td>\n",
" <td>6</td>\n",
" <td>6</td>\n",
" <td>6</td>\n",
" <td>6</td>\n",
" <td>6</td>\n",
" <td>6</td>\n",
" </tr>\n",
" <tr>\n",
" <th>114</th>\n",
" <td>St Martin</td>\n",
" <td>France</td>\n",
" <td>18.0708</td>\n",
" <td>-63.0501</td>\n",
" <td>0</td>\n",
" <td>0</td>\n",
" <td>0</td>\n",
" <td>0</td>\n",
" <td>0</td>\n",
" <td>0</td>\n",
" <td>...</td>\n",
" <td>39</td>\n",
" <td>39</td>\n",
" <td>39</td>\n",
" <td>39</td>\n",
" <td>39</td>\n",
" <td>39</td>\n",
" <td>39</td>\n",
" <td>39</td>\n",
" <td>39</td>\n",
" <td>39</td>\n",
" </tr>\n",
" <tr>\n",
" <th>115</th>\n",
" <td>Martinique</td>\n",
" <td>France</td>\n",
" <td>14.6415</td>\n",
" <td>-61.0242</td>\n",
" <td>0</td>\n",
" <td>0</td>\n",
" <td>0</td>\n",
" <td>0</td>\n",
" <td>0</td>\n",
" <td>0</td>\n",
" <td>...</td>\n",
" <td>186</td>\n",
" <td>187</td>\n",
" <td>187</td>\n",
" <td>189</td>\n",
" <td>189</td>\n",
" <td>192</td>\n",
" <td>192</td>\n",
" <td>192</td>\n",
" <td>192</td>\n",
" <td>192</td>\n",
" </tr>\n",
" <tr>\n",
" <th>116</th>\n",
" <td>NaN</td>\n",
" <td>France</td>\n",
" <td>46.2276</td>\n",
" <td>2.2137</td>\n",
" <td>0</td>\n",
" <td>0</td>\n",
" <td>2</td>\n",
" <td>3</td>\n",
" <td>3</td>\n",
" <td>3</td>\n",
" <td>...</td>\n",
" <td>175027</td>\n",
" <td>175479</td>\n",
" <td>176207</td>\n",
" <td>175981</td>\n",
" <td>176712</td>\n",
" <td>177319</td>\n",
" <td>177207</td>\n",
" <td>177240</td>\n",
" <td>177554</td>\n",
" <td>178428</td>\n",
" </tr>\n",
" <tr>\n",
" <th>258</th>\n",
" <td>Saint Pierre and Miquelon</td>\n",
" <td>France</td>\n",
" <td>46.8852</td>\n",
" <td>-56.3159</td>\n",
" <td>0</td>\n",
" <td>0</td>\n",
" <td>0</td>\n",
" <td>0</td>\n",
" <td>0</td>\n",
" <td>0</td>\n",
" <td>...</td>\n",
" <td>1</td>\n",
" <td>1</td>\n",
" <td>1</td>\n",
" <td>1</td>\n",
" <td>1</td>\n",
" <td>1</td>\n",
" <td>1</td>\n",
" <td>1</td>\n",
" <td>1</td>\n",
" <td>1</td>\n",
" </tr>\n",
" </tbody>\n",
"</table>\n",
"<p>11 rows × 123 columns</p>\n",
"</div>"
],
"text/plain": [
" Province/State Country/Region Lat Long 1/22/20 \\\n",
"107 French Guiana France 3.9339 -53.1258 0 \n",
"108 French Polynesia France -17.6797 149.4068 0 \n",
"109 Guadeloupe France 16.2500 -61.5833 0 \n",
"110 Mayotte France -12.8275 45.1662 0 \n",
"111 New Caledonia France -20.9043 165.6180 0 \n",
"112 Reunion France -21.1351 55.2471 0 \n",
"113 Saint Barthelemy France 17.9000 -62.8333 0 \n",
"114 St Martin France 18.0708 -63.0501 0 \n",
"115 Martinique France 14.6415 -61.0242 0 \n",
"116 NaN France 46.2276 2.2137 0 \n",
"258 Saint Pierre and Miquelon France 46.8852 -56.3159 0 \n",
"Filtering like this leaves the question unanswered if line 116 contains the cases only for France except Dom/Tom or not.\n",
"As for other countries there is no extra line for the country itself we assume for now The France line is France except Dom/Tom but we will check it later again."
]
},
{
"cell_type": "code",
"execution_count": 46,
"metadata": {},
"outputs": [
{
"name": "stderr",
"output_type": "stream",
"text": [
"/opt/conda/lib/python3.6/site-packages/ipykernel_launcher.py:12: UserWarning: Boolean Series key will be reindexed to match DataFrame index.\n",
" if sys.path[0] == '':\n"
]
},
{
"name": "stdout",
"output_type": "stream",
"text": [
"{'Belgium': 23\n",
"1/22/20 0\n",
"1/23/20 0\n",
"1/24/20 0\n",
"1/25/20 0\n",
"1/26/20 0\n",
"1/27/20 0\n",
"1/28/20 0\n",
"1/29/20 0\n",
"1/30/20 0\n",
"1/31/20 0\n",
"2/1/20 0\n",
"2/2/20 0\n",
"2/3/20 0\n",
"2/4/20 1\n",
"2/5/20 1\n",
"2/6/20 1\n",
"2/7/20 1\n",
"2/8/20 1\n",
"2/9/20 1\n",
"2/10/20 1\n",
"2/11/20 1\n",
"2/12/20 1\n",
"2/13/20 1\n",
"2/14/20 1\n",
"2/15/20 1\n",
"2/16/20 1\n",
"2/17/20 1\n",
"2/18/20 1\n",
"2/19/20 1\n",
"2/20/20 1\n",
"... ...\n",
"4/20/20 39983\n",
"4/21/20 40956\n",
"4/22/20 41889\n",
"4/23/20 42797\n",
"4/24/20 44293\n",
"4/25/20 45325\n",
"4/26/20 46134\n",
"4/27/20 46687\n",
"4/28/20 47334\n",
"4/29/20 47859\n",
"4/30/20 48519\n",
"5/1/20 49032\n",
"5/2/20 49517\n",
"5/3/20 49906\n",
"5/4/20 50267\n",
"5/5/20 50509\n",
"5/6/20 50781\n",
"5/7/20 51420\n",
"5/8/20 52011\n",
"5/9/20 52596\n",
"5/10/20 53081\n",
"5/11/20 53449\n",
"5/12/20 53779\n",
"5/13/20 53981\n",
"5/14/20 54288\n",
"5/15/20 54644\n",
"5/16/20 54989\n",
"5/17/20 55280\n",
"5/18/20 55559\n",
"5/19/20 55791\n",
"\n",
"[119 rows x 1 columns], 'France except Dom/Tom': 116\n",
"1/22/20 0\n",
"1/23/20 0\n",
"1/24/20 2\n",
"1/25/20 3\n",
"1/26/20 3\n",
"1/27/20 3\n",
"1/28/20 4\n",
"1/29/20 5\n",
"1/30/20 5\n",
"1/31/20 5\n",
"2/1/20 6\n",
"2/2/20 6\n",
"2/3/20 6\n",
"2/4/20 6\n",
"2/5/20 6\n",
"2/6/20 6\n",
"2/7/20 6\n",
"2/8/20 11\n",
"2/9/20 11\n",
"2/10/20 11\n",
"2/11/20 11\n",
"2/12/20 11\n",
"2/13/20 11\n",
"2/14/20 11\n",
"2/15/20 12\n",
"2/16/20 12\n",
"2/17/20 12\n",
"2/18/20 12\n",
"2/19/20 12\n",
"2/20/20 12\n",
"... ...\n",
"4/20/20 154188\n",
"4/21/20 156921\n",
"4/22/20 154715\n",
"4/23/20 157026\n",
"4/24/20 158636\n",
"4/25/20 160292\n",
"4/26/20 160847\n",
"4/27/20 164589\n",
"4/28/20 167605\n",
"4/29/20 165093\n",
"4/30/20 165764\n",
"5/1/20 165764\n",
"5/2/20 166976\n",
"5/3/20 167272\n",
"5/4/20 167886\n",
"5/5/20 168935\n",
"5/6/20 172465\n",
"5/7/20 173040\n",
"5/8/20 174318\n",
"5/9/20 174758\n",
"5/10/20 175027\n",
"5/11/20 175479\n",
"5/12/20 176207\n",
"5/13/20 175981\n",
"5/14/20 176712\n",
"5/15/20 177319\n",
"5/16/20 177207\n",
"5/17/20 177240\n",
"5/18/20 177554\n",
"5/19/20 178428\n",
"\n",
"[119 rows x 1 columns], 'Germany': 120\n",
"1/22/20 0\n",
"1/23/20 0\n",
"1/24/20 0\n",
"1/25/20 0\n",
"1/26/20 0\n",
"1/27/20 1\n",
"1/28/20 4\n",
"1/29/20 4\n",
"1/30/20 4\n",
"1/31/20 5\n",
"2/1/20 8\n",
"2/2/20 10\n",
"2/3/20 12\n",
"2/4/20 12\n",
"2/5/20 12\n",
"2/6/20 12\n",
"2/7/20 13\n",
"2/8/20 13\n",
"2/9/20 14\n",
"2/10/20 14\n",
"2/11/20 16\n",
"2/12/20 16\n",
"2/13/20 16\n",
"2/14/20 16\n",
"2/15/20 16\n",
"2/16/20 16\n",
"2/17/20 16\n",
"2/18/20 16\n",
"2/19/20 16\n",
"2/20/20 16\n",
"... ...\n",
"4/20/20 147065\n",
"4/21/20 148291\n",
"4/22/20 150648\n",
"4/23/20 153129\n",
"4/24/20 154999\n",
"4/25/20 156513\n",
"4/26/20 157770\n",
"4/27/20 158758\n",
"4/28/20 159912\n",
"4/29/20 161539\n",
"4/30/20 163009\n",
"5/1/20 164077\n",
"5/2/20 164967\n",
"5/3/20 165664\n",
"5/4/20 166152\n",
"5/5/20 167007\n",
"5/6/20 168162\n",
"5/7/20 169430\n",
"5/8/20 170588\n",
"5/9/20 171324\n",
"5/10/20 171879\n",
"5/11/20 172576\n",
"5/12/20 173171\n",
"5/13/20 174098\n",
"5/14/20 174478\n",
"5/15/20 175233\n",
"5/16/20 175752\n",
"5/17/20 176369\n",
"5/18/20 176551\n",
"5/19/20 177778\n",
"\n",
"[119 rows x 1 columns], 'Iran': 133\n",
"1/22/20 0\n",
"1/23/20 0\n",
"1/24/20 0\n",
"1/25/20 0\n",
"1/26/20 0\n",
"1/27/20 0\n",
"1/28/20 0\n",
"1/29/20 0\n",
"1/30/20 0\n",
"1/31/20 0\n",
"2/1/20 0\n",
"2/2/20 0\n",
"2/3/20 0\n",
"2/4/20 0\n",
"2/5/20 0\n",
"2/6/20 0\n",
"2/7/20 0\n",
"2/8/20 0\n",
"2/9/20 0\n",
"2/10/20 0\n",
"2/11/20 0\n",
"2/12/20 0\n",
"2/13/20 0\n",
"2/14/20 0\n",
"2/15/20 0\n",
"2/16/20 0\n",
"2/17/20 0\n",
"2/18/20 0\n",
"2/19/20 2\n",
"2/20/20 5\n",
"... ...\n",
"4/20/20 83505\n",
"4/21/20 84802\n",
"4/22/20 85996\n",
"4/23/20 87026\n",
"4/24/20 88194\n",
"4/25/20 89328\n",
"4/26/20 90481\n",
"4/27/20 91472\n",
"4/28/20 92584\n",
"4/29/20 93657\n",
"4/30/20 94640\n",
"5/1/20 95646\n",
"5/2/20 96448\n",
"5/3/20 97424\n",
"5/4/20 98647\n",
"5/5/20 99970\n",
"5/6/20 101650\n",
"5/7/20 103135\n",
"5/8/20 104691\n",
"5/9/20 106220\n",
"5/10/20 107603\n",
"5/11/20 109286\n",
"5/12/20 110767\n",
"5/13/20 112725\n",
"5/14/20 114533\n",
"5/15/20 116635\n",
"5/16/20 118392\n",
"5/17/20 120198\n",
"5/18/20 122492\n",
"5/19/20 124603\n",
"\n",
"[119 rows x 1 columns], 'Italy': 137\n",
"1/22/20 0\n",
"1/23/20 0\n",
"1/24/20 0\n",
"1/25/20 0\n",
"1/26/20 0\n",
"1/27/20 0\n",
"1/28/20 0\n",
"1/29/20 0\n",
"1/30/20 0\n",
"1/31/20 2\n",
"2/1/20 2\n",
"2/2/20 2\n",
"2/3/20 2\n",
"2/4/20 2\n",
"2/5/20 2\n",
"2/6/20 2\n",
"2/7/20 3\n",
"2/8/20 3\n",
"2/9/20 3\n",
"2/10/20 3\n",
"2/11/20 3\n",
"2/12/20 3\n",
"2/13/20 3\n",
"2/14/20 3\n",
"2/15/20 3\n",
"2/16/20 3\n",
"2/17/20 3\n",
"2/18/20 3\n",
"2/19/20 3\n",
"2/20/20 3\n",
"... ...\n",
"4/20/20 181228\n",
"4/21/20 183957\n",
"4/22/20 187327\n",
"4/23/20 189973\n",
"4/24/20 192994\n",
"4/25/20 195351\n",
"4/26/20 197675\n",
"4/27/20 199414\n",
"4/28/20 201505\n",
"4/29/20 203591\n",
"4/30/20 205463\n",
"5/1/20 207428\n",
"5/2/20 209328\n",
"5/3/20 210717\n",
"5/4/20 211938\n",
"5/5/20 213013\n",
"5/6/20 214457\n",
"5/7/20 215858\n",
"5/8/20 217185\n",
"5/9/20 218268\n",
"5/10/20 219070\n",
"5/11/20 219814\n",
"5/12/20 221216\n",
"5/13/20 222104\n",
"5/14/20 223096\n",
"5/15/20 223885\n",
"5/16/20 224760\n",
"5/17/20 225435\n",
"5/18/20 225886\n",
"5/19/20 226699\n",
"\n",
"[119 rows x 1 columns], 'Japan': 139\n",
"1/22/20 2\n",
"1/23/20 2\n",
"1/24/20 2\n",
"1/25/20 2\n",
"1/26/20 4\n",
"1/27/20 4\n",
"1/28/20 7\n",
"1/29/20 7\n",
"1/30/20 11\n",
"1/31/20 15\n",
"2/1/20 20\n",
"2/2/20 20\n",
"2/3/20 20\n",
"2/4/20 22\n",
"2/5/20 22\n",
"2/6/20 22\n",
"2/7/20 25\n",
"2/8/20 25\n",
"2/9/20 26\n",
"2/10/20 26\n",
"2/11/20 26\n",
"2/12/20 28\n",
"2/13/20 28\n",
"2/14/20 29\n",
"2/15/20 43\n",
"2/16/20 59\n",
"2/17/20 66\n",
"2/18/20 74\n",
"2/19/20 84\n",
"2/20/20 94\n",
"... ...\n",
"4/20/20 10797\n",
"4/21/20 11135\n",
"4/22/20 11512\n",
"4/23/20 12368\n",
"4/24/20 12829\n",
"4/25/20 13231\n",
"4/26/20 13441\n",
"4/27/20 14153\n",
"4/28/20 13736\n",
"4/29/20 13895\n",
"4/30/20 14088\n",
"5/1/20 14305\n",
"5/2/20 14571\n",
"5/3/20 14877\n",
"5/4/20 15078\n",
"5/5/20 15253\n",
"5/6/20 15253\n",
"5/7/20 15477\n",
"5/8/20 15575\n",
"5/9/20 15663\n",
"5/10/20 15777\n",
"5/11/20 15847\n",
"5/12/20 15968\n",
"5/13/20 16049\n",
"5/14/20 16120\n",
"5/15/20 16203\n",
"5/16/20 16237\n",
"5/17/20 16285\n",
"5/18/20 16305\n",
"5/19/20 16367\n",
"\n",
"[119 rows x 1 columns], 'Netherlands without the colonies': 169\n",
"\u001b[0;32m<ipython-input-41-5b37c91e0548>\u001b[0m in \u001b[0;36m<module>\u001b[0;34m\u001b[0m\n\u001b[0;32m----> 1\u001b[0;31m \u001b[0mto_plot\u001b[0m\u001b[0;34m[\u001b[0m\u001b[0;34m\"France\"\u001b[0m\u001b[0;34m]\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[0m",