{ "cells": [ { "cell_type": "code", "execution_count": 18, "metadata": {}, "outputs": [], "source": [ "%matplotlib inline\n", "import matplotlib.pyplot as plt\n", "import pandas as pd\n", "import isoweek" ] }, { "cell_type": "code", "execution_count": 2, "metadata": {}, "outputs": [], "source": [ "data_url = \"http://www.sentiweb.fr/datasets/incidence-PAY-7.csv\"" ] }, { "cell_type": "code", "execution_count": 3, "metadata": {}, "outputs": [ { "data": { "text/html": [ "
\n", "\n", "\n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " 
\n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", 
" \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", "
weekindicatorincinc_lowinc_upinc100inc100_lowinc100_upgeo_inseegeo_name
02021257920559751243514919FRFrance
1202124711949883215066181323FRFrance
220212379116642011812141018FRFrance
320212274817275268827410FRFrance
420212176092345887269513FRFrance
52021207748546011036911715FRFrance
6202119766544370893810713FRFrance
72021187391221105714639FRFrance
820211774686287864947410FRFrance
920211674780289166697410FRFrance
10202115711215762714803171222FRFrance
11202114711197799414400171222FRFrance
1220211379714628913139151020FRFrance
13202112711520841514625171222FRFrance
1420211179386667812094141018FRFrance
1520211079056645211660141018FRFrance
16202109710988793814038171222FRFrance
17202108711281836114201171321FRFrance
182021077135611031516807211626FRFrance
19202106713401981016992201525FRFrance
20202105712210898815432181323FRFrance
21202104712026882615226181323FRFrance
222021037891363751145113917FRFrance
232021027779554301016012816FRFrance
24202101710525775013300161220FRFrance
25202053711978840615550181323FRFrance
26202052712012828515739181224FRFrance
27202051710564757413554161121FRFrance
28202050770634744938211715FRFrance
2920204975026314569078511FRFrance
.................................
15651991267176081130423912312042FRFrance
15661991257161691070021638281838FRFrance
15671991247161711007122271281739FRFrance
1568199123711947767116223211329FRFrance
1569199122715452995320951271737FRFrance
1570199121714903897520831261636FRFrance
15711991207190531274225364342345FRFrance
15721991197167391124622232291939FRFrance
15731991187213851388228888382551FRFrance
1574199117713462887718047241632FRFrance
15751991167148571006819646261834FRFrance
1576199115713975978118169251832FRFrance
1577199114712265768416846221430FRFrance
157819911379567604113093171123FRFrance
1579199112710864733114397191325FRFrance
15801991117155741118419964271935FRFrance
15811991107166431137221914292038FRFrance
1582199109713741878018702241533FRFrance
1583199108713289881317765231531FRFrance
1584199107712337807716597221529FRFrance
1585199106710877701314741191226FRFrance
1586199105710442654414340181125FRFrance
15871991047791345631126314820FRFrance
15881991037153871048420290271836FRFrance
15891991027162771104621508292038FRFrance
15901991017155651027120859271836FRFrance
15911990527193751329525455342345FRFrance
15921990517190801380724353342543FRFrance
1593199050711079666015498201228FRFrance
15941990497114302610205FRFrance
\n", "

1595 rows × 10 columns

\n", "
" ], "text/plain": [ " week indicator inc inc_low inc_up inc100 inc100_low \\\n", "0 202125 7 9205 5975 12435 14 9 \n", "1 202124 7 11949 8832 15066 18 13 \n", "2 202123 7 9116 6420 11812 14 10 \n", "3 202122 7 4817 2752 6882 7 4 \n", "4 202121 7 6092 3458 8726 9 5 \n", "5 202120 7 7485 4601 10369 11 7 \n", "6 202119 7 6654 4370 8938 10 7 \n", "7 202118 7 3912 2110 5714 6 3 \n", "8 202117 7 4686 2878 6494 7 4 \n", "9 202116 7 4780 2891 6669 7 4 \n", "10 202115 7 11215 7627 14803 17 12 \n", "11 202114 7 11197 7994 14400 17 12 \n", "12 202113 7 9714 6289 13139 15 10 \n", "13 202112 7 11520 8415 14625 17 12 \n", "14 202111 7 9386 6678 12094 14 10 \n", "15 202110 7 9056 6452 11660 14 10 \n", "16 202109 7 10988 7938 14038 17 12 \n", "17 202108 7 11281 8361 14201 17 13 \n", "18 202107 7 13561 10315 16807 21 16 \n", "19 202106 7 13401 9810 16992 20 15 \n", "20 202105 7 12210 8988 15432 18 13 \n", "21 202104 7 12026 8826 15226 18 13 \n", "22 202103 7 8913 6375 11451 13 9 \n", "23 202102 7 7795 5430 10160 12 8 \n", "24 202101 7 10525 7750 13300 16 12 \n", "25 202053 7 11978 8406 15550 18 13 \n", "26 202052 7 12012 8285 15739 18 12 \n", "27 202051 7 10564 7574 13554 16 11 \n", "28 202050 7 7063 4744 9382 11 7 \n", "29 202049 7 5026 3145 6907 8 5 \n", "... ... ... ... ... ... ... ... 
\n", "1565 199126 7 17608 11304 23912 31 20 \n", "1566 199125 7 16169 10700 21638 28 18 \n", "1567 199124 7 16171 10071 22271 28 17 \n", "1568 199123 7 11947 7671 16223 21 13 \n", "1569 199122 7 15452 9953 20951 27 17 \n", "1570 199121 7 14903 8975 20831 26 16 \n", "1571 199120 7 19053 12742 25364 34 23 \n", "1572 199119 7 16739 11246 22232 29 19 \n", "1573 199118 7 21385 13882 28888 38 25 \n", "1574 199117 7 13462 8877 18047 24 16 \n", "1575 199116 7 14857 10068 19646 26 18 \n", "1576 199115 7 13975 9781 18169 25 18 \n", "1577 199114 7 12265 7684 16846 22 14 \n", "1578 199113 7 9567 6041 13093 17 11 \n", "1579 199112 7 10864 7331 14397 19 13 \n", "1580 199111 7 15574 11184 19964 27 19 \n", "1581 199110 7 16643 11372 21914 29 20 \n", "1582 199109 7 13741 8780 18702 24 15 \n", "1583 199108 7 13289 8813 17765 23 15 \n", "1584 199107 7 12337 8077 16597 22 15 \n", "1585 199106 7 10877 7013 14741 19 12 \n", "1586 199105 7 10442 6544 14340 18 11 \n", "1587 199104 7 7913 4563 11263 14 8 \n", "1588 199103 7 15387 10484 20290 27 18 \n", "1589 199102 7 16277 11046 21508 29 20 \n", "1590 199101 7 15565 10271 20859 27 18 \n", "1591 199052 7 19375 13295 25455 34 23 \n", "1592 199051 7 19080 13807 24353 34 25 \n", "1593 199050 7 11079 6660 15498 20 12 \n", "1594 199049 7 1143 0 2610 2 0 \n", "\n", " inc100_up geo_insee geo_name \n", "0 19 FR France \n", "1 23 FR France \n", "2 18 FR France \n", "3 10 FR France \n", "4 13 FR France \n", "5 15 FR France \n", "6 13 FR France \n", "7 9 FR France \n", "8 10 FR France \n", "9 10 FR France \n", "10 22 FR France \n", "11 22 FR France \n", "12 20 FR France \n", "13 22 FR France \n", "14 18 FR France \n", "15 18 FR France \n", "16 22 FR France \n", "17 21 FR France \n", "18 26 FR France \n", "19 25 FR France \n", "20 23 FR France \n", "21 23 FR France \n", "22 17 FR France \n", "23 16 FR France \n", "24 20 FR France \n", "25 23 FR France \n", "26 24 FR France \n", "27 21 FR France \n", "28 15 FR France \n", "29 11 FR France \n", "... ... 
... ... \n", "1565 42 FR France \n", "1566 38 FR France \n", "1567 39 FR France \n", "1568 29 FR France \n", "1569 37 FR France \n", "1570 36 FR France \n", "1571 45 FR France \n", "1572 39 FR France \n", "1573 51 FR France \n", "1574 32 FR France \n", "1575 34 FR France \n", "1576 32 FR France \n", "1577 30 FR France \n", "1578 23 FR France \n", "1579 25 FR France \n", "1580 35 FR France \n", "1581 38 FR France \n", "1582 33 FR France \n", "1583 31 FR France \n", "1584 29 FR France \n", "1585 26 FR France \n", "1586 25 FR France \n", "1587 20 FR France \n", "1588 36 FR France \n", "1589 38 FR France \n", "1590 36 FR France \n", "1591 45 FR France \n", "1592 43 FR France \n", "1593 28 FR France \n", "1594 5 FR France \n", "\n", "[1595 rows x 10 columns]" ] }, "execution_count": 3, "metadata": {}, "output_type": "execute_result" } ], "source": [ "raw_data = pd.read_csv(data_url, skiprows=1)\n", "raw_data" ] }, { "cell_type": "code", "execution_count": 19, "metadata": {}, "outputs": [ { "data": { "text/html": [ "
\n", "\n", "\n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", "
weekindicatorincinc_lowinc_upinc100inc100_lowinc100_upgeo_inseegeo_name
\n", "
" ], "text/plain": [ "Empty DataFrame\n", "Columns: [week, indicator, inc, inc_low, inc_up, inc100, inc100_low, inc100_up, geo_insee, geo_name]\n", "Index: []" ] }, "execution_count": 19, "metadata": {}, "output_type": "execute_result" } ], "source": [ "raw_data[raw_data.isnull().any(axis=1)]" ] }, { "cell_type": "code", "execution_count": 20, "metadata": {}, "outputs": [ { "data": { "text/html": [ "
\n", "\n", "\n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " 
\n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", 
" \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", "
weekindicatorincinc_lowinc_upinc100inc100_lowinc100_upgeo_inseegeo_name
02021257920559751243514919FRFrance
1202124711949883215066181323FRFrance
220212379116642011812141018FRFrance
320212274817275268827410FRFrance
420212176092345887269513FRFrance
52021207748546011036911715FRFrance
6202119766544370893810713FRFrance
72021187391221105714639FRFrance
820211774686287864947410FRFrance
920211674780289166697410FRFrance
10202115711215762714803171222FRFrance
11202114711197799414400171222FRFrance
1220211379714628913139151020FRFrance
13202112711520841514625171222FRFrance
1420211179386667812094141018FRFrance
1520211079056645211660141018FRFrance
16202109710988793814038171222FRFrance
17202108711281836114201171321FRFrance
182021077135611031516807211626FRFrance
19202106713401981016992201525FRFrance
20202105712210898815432181323FRFrance
21202104712026882615226181323FRFrance
222021037891363751145113917FRFrance
232021027779554301016012816FRFrance
24202101710525775013300161220FRFrance
25202053711978840615550181323FRFrance
26202052712012828515739181224FRFrance
27202051710564757413554161121FRFrance
28202050770634744938211715FRFrance
2920204975026314569078511FRFrance
.................................
15651991267176081130423912312042FRFrance
15661991257161691070021638281838FRFrance
15671991247161711007122271281739FRFrance
1568199123711947767116223211329FRFrance
1569199122715452995320951271737FRFrance
1570199121714903897520831261636FRFrance
15711991207190531274225364342345FRFrance
15721991197167391124622232291939FRFrance
15731991187213851388228888382551FRFrance
1574199117713462887718047241632FRFrance
15751991167148571006819646261834FRFrance
1576199115713975978118169251832FRFrance
1577199114712265768416846221430FRFrance
157819911379567604113093171123FRFrance
1579199112710864733114397191325FRFrance
15801991117155741118419964271935FRFrance
15811991107166431137221914292038FRFrance
1582199109713741878018702241533FRFrance
1583199108713289881317765231531FRFrance
1584199107712337807716597221529FRFrance
1585199106710877701314741191226FRFrance
1586199105710442654414340181125FRFrance
15871991047791345631126314820FRFrance
15881991037153871048420290271836FRFrance
15891991027162771104621508292038FRFrance
15901991017155651027120859271836FRFrance
15911990527193751329525455342345FRFrance
15921990517190801380724353342543FRFrance
1593199050711079666015498201228FRFrance
15941990497114302610205FRFrance
\n", "

1595 rows × 10 columns

\n", "
" ], "text/plain": [ " week indicator inc inc_low inc_up inc100 inc100_low \\\n", "0 202125 7 9205 5975 12435 14 9 \n", "1 202124 7 11949 8832 15066 18 13 \n", "2 202123 7 9116 6420 11812 14 10 \n", "3 202122 7 4817 2752 6882 7 4 \n", "4 202121 7 6092 3458 8726 9 5 \n", "5 202120 7 7485 4601 10369 11 7 \n", "6 202119 7 6654 4370 8938 10 7 \n", "7 202118 7 3912 2110 5714 6 3 \n", "8 202117 7 4686 2878 6494 7 4 \n", "9 202116 7 4780 2891 6669 7 4 \n", "10 202115 7 11215 7627 14803 17 12 \n", "11 202114 7 11197 7994 14400 17 12 \n", "12 202113 7 9714 6289 13139 15 10 \n", "13 202112 7 11520 8415 14625 17 12 \n", "14 202111 7 9386 6678 12094 14 10 \n", "15 202110 7 9056 6452 11660 14 10 \n", "16 202109 7 10988 7938 14038 17 12 \n", "17 202108 7 11281 8361 14201 17 13 \n", "18 202107 7 13561 10315 16807 21 16 \n", "19 202106 7 13401 9810 16992 20 15 \n", "20 202105 7 12210 8988 15432 18 13 \n", "21 202104 7 12026 8826 15226 18 13 \n", "22 202103 7 8913 6375 11451 13 9 \n", "23 202102 7 7795 5430 10160 12 8 \n", "24 202101 7 10525 7750 13300 16 12 \n", "25 202053 7 11978 8406 15550 18 13 \n", "26 202052 7 12012 8285 15739 18 12 \n", "27 202051 7 10564 7574 13554 16 11 \n", "28 202050 7 7063 4744 9382 11 7 \n", "29 202049 7 5026 3145 6907 8 5 \n", "... ... ... ... ... ... ... ... 
\n", "1565 199126 7 17608 11304 23912 31 20 \n", "1566 199125 7 16169 10700 21638 28 18 \n", "1567 199124 7 16171 10071 22271 28 17 \n", "1568 199123 7 11947 7671 16223 21 13 \n", "1569 199122 7 15452 9953 20951 27 17 \n", "1570 199121 7 14903 8975 20831 26 16 \n", "1571 199120 7 19053 12742 25364 34 23 \n", "1572 199119 7 16739 11246 22232 29 19 \n", "1573 199118 7 21385 13882 28888 38 25 \n", "1574 199117 7 13462 8877 18047 24 16 \n", "1575 199116 7 14857 10068 19646 26 18 \n", "1576 199115 7 13975 9781 18169 25 18 \n", "1577 199114 7 12265 7684 16846 22 14 \n", "1578 199113 7 9567 6041 13093 17 11 \n", "1579 199112 7 10864 7331 14397 19 13 \n", "1580 199111 7 15574 11184 19964 27 19 \n", "1581 199110 7 16643 11372 21914 29 20 \n", "1582 199109 7 13741 8780 18702 24 15 \n", "1583 199108 7 13289 8813 17765 23 15 \n", "1584 199107 7 12337 8077 16597 22 15 \n", "1585 199106 7 10877 7013 14741 19 12 \n", "1586 199105 7 10442 6544 14340 18 11 \n", "1587 199104 7 7913 4563 11263 14 8 \n", "1588 199103 7 15387 10484 20290 27 18 \n", "1589 199102 7 16277 11046 21508 29 20 \n", "1590 199101 7 15565 10271 20859 27 18 \n", "1591 199052 7 19375 13295 25455 34 23 \n", "1592 199051 7 19080 13807 24353 34 25 \n", "1593 199050 7 11079 6660 15498 20 12 \n", "1594 199049 7 1143 0 2610 2 0 \n", "\n", " inc100_up geo_insee geo_name \n", "0 19 FR France \n", "1 23 FR France \n", "2 18 FR France \n", "3 10 FR France \n", "4 13 FR France \n", "5 15 FR France \n", "6 13 FR France \n", "7 9 FR France \n", "8 10 FR France \n", "9 10 FR France \n", "10 22 FR France \n", "11 22 FR France \n", "12 20 FR France \n", "13 22 FR France \n", "14 18 FR France \n", "15 18 FR France \n", "16 22 FR France \n", "17 21 FR France \n", "18 26 FR France \n", "19 25 FR France \n", "20 23 FR France \n", "21 23 FR France \n", "22 17 FR France \n", "23 16 FR France \n", "24 20 FR France \n", "25 23 FR France \n", "26 24 FR France \n", "27 21 FR France \n", "28 15 FR France \n", "29 11 FR France \n", "... ... 
... ... \n", "1565 42 FR France \n", "1566 38 FR France \n", "1567 39 FR France \n", "1568 29 FR France \n", "1569 37 FR France \n", "1570 36 FR France \n", "1571 45 FR France \n", "1572 39 FR France \n", "1573 51 FR France \n", "1574 32 FR France \n", "1575 34 FR France \n", "1576 32 FR France \n", "1577 30 FR France \n", "1578 23 FR France \n", "1579 25 FR France \n", "1580 35 FR France \n", "1581 38 FR France \n", "1582 33 FR France \n", "1583 31 FR France \n", "1584 29 FR France \n", "1585 26 FR France \n", "1586 25 FR France \n", "1587 20 FR France \n", "1588 36 FR France \n", "1589 38 FR France \n", "1590 36 FR France \n", "1591 45 FR France \n", "1592 43 FR France \n", "1593 28 FR France \n", "1594 5 FR France \n", "\n", "[1595 rows x 10 columns]" ] }, "execution_count": 20, "metadata": {}, "output_type": "execute_result" } ], "source": [ "data = raw_data.dropna().copy()\n", "data" ] }, { "cell_type": "code", "execution_count": 21, "metadata": {}, "outputs": [], "source": [ "def convert_week(year_and_week_int):\n", "    \"\"\"Convert a ``yyyyww`` integer week code into a weekly ``pd.Period``.\n", "\n", "    The first four digits are taken as the year and the remaining digits\n", "    as the week number of an ``isoweek.Week``; the result is the weekly\n", "    period that contains day 0 of that week.\n", "    \"\"\"\n", "    year_and_week_str = str(year_and_week_int)\n", "    year = int(year_and_week_str[:4])\n", "    week = int(year_and_week_str[4:])\n", "    w = isoweek.Week(year, week)\n", "    return pd.Period(w.day(0), 'W')\n", "\n", "\n", "# Attach the matching weekly period to every row of the table.\n", "data['period'] = [convert_week(yw) for yw in data['week']]" ] }, { "cell_type": "code", "execution_count": 22, "metadata": {}, "outputs": [], "source": [ "sorted_data = data.set_index('period').sort_index()" ] }, { "cell_type": "code", "execution_count": 24, "metadata": {}, "outputs": [], "source": [ "# Print every pair of consecutive periods that are not contiguous, i.e.\n", "# where the later one starts more than one second after the earlier ends.\n", "# No printed line means the weekly series has no gap.\n", "periods = sorted_data.index\n", "for p1, p2 in zip(periods[:-1], periods[1:]):\n", "    delta = p2.to_timestamp() - p1.end_time\n", "    if delta > pd.Timedelta('1s'):\n", "        print(p1, p2)" ] }, { "cell_type": "code", "execution_count": 25, "metadata": {}, "outputs": [ { "data": { "text/plain": [ "" ] }, "execution_count": 25, "metadata": {}, "output_type": "execute_result" }, { "data": { "image/png": "\n", "text/plain": [ "
" ] }, "metadata": { "needs_background": "light" }, "output_type": "display_data" } ], "source": [ "sorted_data['inc'].plot()" ] }, { "cell_type": "code", "execution_count": 12, "metadata": {}, "outputs": [ { "data": { "text/plain": [ "" ] }, "execution_count": 12, "metadata": {}, "output_type": "execute_result" }, { "data": { "image/png": "\n", "text/plain": [ "
" ] }, "metadata": { "needs_background": "light" }, "output_type": "display_data" } ], "source": [ "sorted_data['inc'][-200:].plot()" ] }, { "cell_type": "code", "execution_count": 26, "metadata": {}, "outputs": [], "source": [ "# One weekly period per year: the week containing August 1st.\n", "# Only weeks that lie inside the observed data are kept, so every pair of\n", "# consecutive entries delimits a year that is fully covered.  Starting at a\n", "# fixed year instead would sum a truncated first year whenever the series\n", "# begins after August 1st of that year.\n", "first_week, last_week = sorted_data.index[0], sorted_data.index[-1]\n", "august_weeks = (pd.Period(pd.Timestamp(y, 8, 1), 'W')\n", "                for y in range(first_week.year, last_week.year + 1))\n", "first_august_week = [week for week in august_weeks\n", "                     if first_week <= week <= last_week]" ] }, { "cell_type": "code", "execution_count": 33, "metadata": {}, "outputs": [], "source": [ "# Sum the weekly incidence over each August-to-August year; a year is\n", "# labelled with the calendar year in which it ends.\n", "year = []\n", "yearly_incidence = []\n", "for week1, week2 in zip(first_august_week[:-1],\n", "                        first_august_week[1:]):\n", "    # week2 opens the next year, so the slice stops one week before it.\n", "    one_year = sorted_data['inc'][week1:week2-1]\n", "    # Two consecutive first-weeks-of-August are 52 or 53 weeks apart;\n", "    # any other length means weeks are missing and the sum would be biased.\n", "    assert abs(len(one_year) - 52) < 2, (\n", "        'incomplete year ending in {}: {} weeks'.format(week2.year,\n", "                                                        len(one_year)))\n", "    yearly_incidence.append(one_year.sum())\n", "    year.append(week2.year)\n", "yearly_incidence = pd.Series(data=yearly_incidence, index=year)" ] }, { "cell_type": "code", "execution_count": 34, "metadata": {}, "outputs": [ { "data": { "text/plain": [ "" ] }, "execution_count": 34, "metadata": {}, "output_type": "execute_result" }, { "data": { "image/png": "\n", "text/plain": [ "
" ] }, "metadata": { "needs_background": "light" }, "output_type": "display_data" } ], "source": [ "yearly_incidence.plot(style='*')" ] }, { "cell_type": "code", "execution_count": 35, "metadata": {}, "outputs": [ { "data": { "text/plain": [ "2020 229363\n", "2002 502271\n", "2018 543281\n", "1996 553859\n", "2017 557449\n", "2019 584926\n", "2000 605096\n", "2015 613286\n", "2012 620315\n", "2011 645042\n", "1995 648598\n", "2001 650660\n", "1993 653058\n", "2005 654308\n", "2006 657482\n", "1998 660316\n", "2014 673458\n", "1997 679308\n", "1994 682920\n", "2007 701566\n", "2013 708874\n", "2004 736266\n", "2008 745701\n", "2003 770211\n", "2016 780645\n", "1999 784963\n", "1992 821558\n", "2009 822819\n", "2010 848236\n", "dtype: int64" ] }, "execution_count": 35, "metadata": {}, "output_type": "execute_result" } ], "source": [ "yearly_incidence.sort_values()" ] }, { "cell_type": "code", "execution_count": null, "metadata": {}, "outputs": [], "source": [] } ], "metadata": { "kernelspec": { "display_name": "Python 3", "language": "python", "name": "python3" }, "language_info": { "codemirror_mode": { "name": "ipython", "version": 3 }, "file_extension": ".py", "mimetype": "text/x-python", "name": "python", "nbconvert_exporter": "python", "pygments_lexer": "ipython3", "version": "3.6.4" } }, "nbformat": 4, "nbformat_minor": 2 }