{ "cells": [ { "cell_type": "code", "execution_count": 1, "metadata": {}, "outputs": [], "source": [ "%matplotlib inline\n", "import pandas as pd\n", "import matplotlib.pyplot as plt\n", "import isoweek\n", "\n", "raw_data = pd.read_csv(\"https://www.sentiweb.fr/datasets/incidence-PAY-7.csv\", skiprows=1)" ] }, { "cell_type": "code", "execution_count": 2, "metadata": {}, "outputs": [ { "data": { "text/html": [ "
\n", "\n", "\n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " 
\n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", 
" \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", "
weekindicatorincinc_lowinc_upinc100inc100_lowinc100_upgeo_inseegeo_name
0202015719316823180315FRFrance
12020147387922275531639FRFrance
2202013773265236941611814FRFrance
32020127812357901045612816FRFrance
4202011710198756812828151119FRFrance
520201079011669111331141018FRFrance
62020097136311054416718211626FRFrance
7202008710424770813140161220FRFrance
820200778959657411344141018FRFrance
920200679264692511603141018FRFrance
1020200578505631410696131016FRFrance
112020047799158311015112915FRFrance
1220200375968410078369612FRFrance
13202002765344530853810713FRFrance
1420200179835701912651151119FRFrance
152019527794152461063612816FRFrance
1620195175823367579719612FRFrance
17201950764244276857210713FRFrance
18201949766214540870210713FRFrance
1920194875542338377018511FRFrance
202019477753650581001411715FRFrance
212019467263813163960426FRFrance
2220194574492261563697410FRFrance
2320194475728362778299612FRFrance
2420194374834275169177410FRFrance
25201942762793989856910713FRFrance
262019417413020306230639FRFrance
272019407421122186204639FRFrance
282019397313713104964528FRFrance
292019387307814164740528FRFrance
.................................
15021991267176081130423912312042FRFrance
15031991257161691070021638281838FRFrance
15041991247161711007122271281739FRFrance
1505199123711947767116223211329FRFrance
1506199122715452995320951271737FRFrance
1507199121714903897520831261636FRFrance
15081991207190531274225364342345FRFrance
15091991197167391124622232291939FRFrance
15101991187213851388228888382551FRFrance
1511199117713462887718047241632FRFrance
15121991167148571006819646261834FRFrance
1513199115713975978118169251832FRFrance
1514199114712265768416846221430FRFrance
151519911379567604113093171123FRFrance
1516199112710864733114397191325FRFrance
15171991117155741118419964271935FRFrance
15181991107166431137221914292038FRFrance
1519199109713741878018702241533FRFrance
1520199108713289881317765231531FRFrance
1521199107712337807716597221529FRFrance
1522199106710877701314741191226FRFrance
1523199105710442654414340181125FRFrance
15241991047791345631126314820FRFrance
15251991037153871048420290271836FRFrance
15261991027162771104621508292038FRFrance
15271991017155651027120859271836FRFrance
15281990527193751329525455342345FRFrance
15291990517190801380724353342543FRFrance
1530199050711079666015498201228FRFrance
15311990497114302610205FRFrance
\n", "

1532 rows × 10 columns

\n", "
" ], "text/plain": [ " week indicator inc inc_low inc_up inc100 inc100_low \\\n", "0 202015 7 1931 682 3180 3 1 \n", "1 202014 7 3879 2227 5531 6 3 \n", "2 202013 7 7326 5236 9416 11 8 \n", "3 202012 7 8123 5790 10456 12 8 \n", "4 202011 7 10198 7568 12828 15 11 \n", "5 202010 7 9011 6691 11331 14 10 \n", "6 202009 7 13631 10544 16718 21 16 \n", "7 202008 7 10424 7708 13140 16 12 \n", "8 202007 7 8959 6574 11344 14 10 \n", "9 202006 7 9264 6925 11603 14 10 \n", "10 202005 7 8505 6314 10696 13 10 \n", "11 202004 7 7991 5831 10151 12 9 \n", "12 202003 7 5968 4100 7836 9 6 \n", "13 202002 7 6534 4530 8538 10 7 \n", "14 202001 7 9835 7019 12651 15 11 \n", "15 201952 7 7941 5246 10636 12 8 \n", "16 201951 7 5823 3675 7971 9 6 \n", "17 201950 7 6424 4276 8572 10 7 \n", "18 201949 7 6621 4540 8702 10 7 \n", "19 201948 7 5542 3383 7701 8 5 \n", "20 201947 7 7536 5058 10014 11 7 \n", "21 201946 7 2638 1316 3960 4 2 \n", "22 201945 7 4492 2615 6369 7 4 \n", "23 201944 7 5728 3627 7829 9 6 \n", "24 201943 7 4834 2751 6917 7 4 \n", "25 201942 7 6279 3989 8569 10 7 \n", "26 201941 7 4130 2030 6230 6 3 \n", "27 201940 7 4211 2218 6204 6 3 \n", "28 201939 7 3137 1310 4964 5 2 \n", "29 201938 7 3078 1416 4740 5 2 \n", "... ... ... ... ... ... ... ... 
\n", "1502 199126 7 17608 11304 23912 31 20 \n", "1503 199125 7 16169 10700 21638 28 18 \n", "1504 199124 7 16171 10071 22271 28 17 \n", "1505 199123 7 11947 7671 16223 21 13 \n", "1506 199122 7 15452 9953 20951 27 17 \n", "1507 199121 7 14903 8975 20831 26 16 \n", "1508 199120 7 19053 12742 25364 34 23 \n", "1509 199119 7 16739 11246 22232 29 19 \n", "1510 199118 7 21385 13882 28888 38 25 \n", "1511 199117 7 13462 8877 18047 24 16 \n", "1512 199116 7 14857 10068 19646 26 18 \n", "1513 199115 7 13975 9781 18169 25 18 \n", "1514 199114 7 12265 7684 16846 22 14 \n", "1515 199113 7 9567 6041 13093 17 11 \n", "1516 199112 7 10864 7331 14397 19 13 \n", "1517 199111 7 15574 11184 19964 27 19 \n", "1518 199110 7 16643 11372 21914 29 20 \n", "1519 199109 7 13741 8780 18702 24 15 \n", "1520 199108 7 13289 8813 17765 23 15 \n", "1521 199107 7 12337 8077 16597 22 15 \n", "1522 199106 7 10877 7013 14741 19 12 \n", "1523 199105 7 10442 6544 14340 18 11 \n", "1524 199104 7 7913 4563 11263 14 8 \n", "1525 199103 7 15387 10484 20290 27 18 \n", "1526 199102 7 16277 11046 21508 29 20 \n", "1527 199101 7 15565 10271 20859 27 18 \n", "1528 199052 7 19375 13295 25455 34 23 \n", "1529 199051 7 19080 13807 24353 34 25 \n", "1530 199050 7 11079 6660 15498 20 12 \n", "1531 199049 7 1143 0 2610 2 0 \n", "\n", " inc100_up geo_insee geo_name \n", "0 5 FR France \n", "1 9 FR France \n", "2 14 FR France \n", "3 16 FR France \n", "4 19 FR France \n", "5 18 FR France \n", "6 26 FR France \n", "7 20 FR France \n", "8 18 FR France \n", "9 18 FR France \n", "10 16 FR France \n", "11 15 FR France \n", "12 12 FR France \n", "13 13 FR France \n", "14 19 FR France \n", "15 16 FR France \n", "16 12 FR France \n", "17 13 FR France \n", "18 13 FR France \n", "19 11 FR France \n", "20 15 FR France \n", "21 6 FR France \n", "22 10 FR France \n", "23 12 FR France \n", "24 10 FR France \n", "25 13 FR France \n", "26 9 FR France \n", "27 9 FR France \n", "28 8 FR France \n", "29 8 FR France \n", "... ... ... 
... \n", "1502 42 FR France \n", "1503 38 FR France \n", "1504 39 FR France \n", "1505 29 FR France \n", "1506 37 FR France \n", "1507 36 FR France \n", "1508 45 FR France \n", "1509 39 FR France \n", "1510 51 FR France \n", "1511 32 FR France \n", "1512 34 FR France \n", "1513 32 FR France \n", "1514 30 FR France \n", "1515 23 FR France \n", "1516 25 FR France \n", "1517 35 FR France \n", "1518 38 FR France \n", "1519 33 FR France \n", "1520 31 FR France \n", "1521 29 FR France \n", "1522 26 FR France \n", "1523 25 FR France \n", "1524 20 FR France \n", "1525 36 FR France \n", "1526 38 FR France \n", "1527 36 FR France \n", "1528 45 FR France \n", "1529 43 FR France \n", "1530 28 FR France \n", "1531 5 FR France \n", "\n", "[1532 rows x 10 columns]" ] }, "execution_count": 2, "metadata": {}, "output_type": "execute_result" } ], "source": [ "raw_data" ] }, { "cell_type": "code", "execution_count": 3, "metadata": {}, "outputs": [ { "data": { "text/html": [ "
\n", "\n", "\n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", "
weekindicatorincinc_lowinc_upinc100inc100_lowinc100_upgeo_inseegeo_name
\n", "
" ], "text/plain": [ "Empty DataFrame\n", "Columns: [week, indicator, inc, inc_low, inc_up, inc100, inc100_low, inc100_up, geo_insee, geo_name]\n", "Index: []" ] }, "execution_count": 3, "metadata": {}, "output_type": "execute_result" } ], "source": [ "raw_data[raw_data.isnull().any(axis=1)]" ] }, { "cell_type": "code", "execution_count": 4, "metadata": {}, "outputs": [], "source": [ "def convert_week(date):\n", "    \"\"\"Turn a ``yyyyww`` week code into the matching weekly ``pd.Period``.\n", "\n", "    ``date`` is a value of the ``week`` column: its first four characters\n", "    are read as the ISO year and the remaining ones as the ISO week number\n", "    (e.g. 202015 is week 15 of 2020).  The returned period is the weekly\n", "    pandas Period that contains the Monday of that ISO week.\n", "    \"\"\"\n", "    code = str(date)\n", "    iso_year, iso_week = int(code[:4]), int(code[4:])\n", "    # isoweek numbers the days of a week from 0, so day(0) is its Monday.\n", "    monday = isoweek.Week(iso_year, iso_week).day(0)\n", "    return pd.Period(monday, 'W')" ] }, { "cell_type": "code", "execution_count": 5, "metadata": {}, "outputs": [], "source": [ "raw_data['period'] = [convert_week(yw) for yw in raw_data['week']]" ] }, { "cell_type": "code", "execution_count": 6, "metadata": { "scrolled": true }, "outputs": [ { "data": { "text/html": [ "
\n", "\n", "\n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " 
\n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", 
" \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", "
weekindicatorincinc_lowinc_upinc100inc100_lowinc100_upgeo_inseegeo_name
period
1990-12-03/1990-12-091990497114302610205FRFrance
1990-12-10/1990-12-16199050711079666015498201228FRFrance
1990-12-17/1990-12-231990517190801380724353342543FRFrance
1990-12-24/1990-12-301990527193751329525455342345FRFrance
1990-12-31/1991-01-061991017155651027120859271836FRFrance
1991-01-07/1991-01-131991027162771104621508292038FRFrance
1991-01-14/1991-01-201991037153871048420290271836FRFrance
1991-01-21/1991-01-271991047791345631126314820FRFrance
1991-01-28/1991-02-03199105710442654414340181125FRFrance
1991-02-04/1991-02-10199106710877701314741191226FRFrance
1991-02-11/1991-02-17199107712337807716597221529FRFrance
1991-02-18/1991-02-24199108713289881317765231531FRFrance
1991-02-25/1991-03-03199109713741878018702241533FRFrance
1991-03-04/1991-03-101991107166431137221914292038FRFrance
1991-03-11/1991-03-171991117155741118419964271935FRFrance
1991-03-18/1991-03-24199112710864733114397191325FRFrance
1991-03-25/1991-03-3119911379567604113093171123FRFrance
1991-04-01/1991-04-07199114712265768416846221430FRFrance
1991-04-08/1991-04-14199115713975978118169251832FRFrance
1991-04-15/1991-04-211991167148571006819646261834FRFrance
1991-04-22/1991-04-28199117713462887718047241632FRFrance
1991-04-29/1991-05-051991187213851388228888382551FRFrance
1991-05-06/1991-05-121991197167391124622232291939FRFrance
1991-05-13/1991-05-191991207190531274225364342345FRFrance
1991-05-20/1991-05-26199121714903897520831261636FRFrance
1991-05-27/1991-06-02199122715452995320951271737FRFrance
1991-06-03/1991-06-09199123711947767116223211329FRFrance
1991-06-10/1991-06-161991247161711007122271281739FRFrance
1991-06-17/1991-06-231991257161691070021638281838FRFrance
1991-06-24/1991-06-301991267176081130423912312042FRFrance
.................................
2019-09-16/2019-09-222019387307814164740528FRFrance
2019-09-23/2019-09-292019397313713104964528FRFrance
2019-09-30/2019-10-062019407421122186204639FRFrance
2019-10-07/2019-10-132019417413020306230639FRFrance
2019-10-14/2019-10-20201942762793989856910713FRFrance
2019-10-21/2019-10-2720194374834275169177410FRFrance
2019-10-28/2019-11-0320194475728362778299612FRFrance
2019-11-04/2019-11-1020194574492261563697410FRFrance
2019-11-11/2019-11-172019467263813163960426FRFrance
2019-11-18/2019-11-242019477753650581001411715FRFrance
2019-11-25/2019-12-0120194875542338377018511FRFrance
2019-12-02/2019-12-08201949766214540870210713FRFrance
2019-12-09/2019-12-15201950764244276857210713FRFrance
2019-12-16/2019-12-2220195175823367579719612FRFrance
2019-12-23/2019-12-292019527794152461063612816FRFrance
2019-12-30/2020-01-0520200179835701912651151119FRFrance
2020-01-06/2020-01-12202002765344530853810713FRFrance
2020-01-13/2020-01-1920200375968410078369612FRFrance
2020-01-20/2020-01-262020047799158311015112915FRFrance
2020-01-27/2020-02-0220200578505631410696131016FRFrance
2020-02-03/2020-02-0920200679264692511603141018FRFrance
2020-02-10/2020-02-1620200778959657411344141018FRFrance
2020-02-17/2020-02-23202008710424770813140161220FRFrance
2020-02-24/2020-03-012020097136311054416718211626FRFrance
2020-03-02/2020-03-0820201079011669111331141018FRFrance
2020-03-09/2020-03-15202011710198756812828151119FRFrance
2020-03-16/2020-03-222020127812357901045612816FRFrance
2020-03-23/2020-03-29202013773265236941611814FRFrance
2020-03-30/2020-04-052020147387922275531639FRFrance
2020-04-06/2020-04-12202015719316823180315FRFrance
\n", "

1532 rows × 10 columns

\n", "
" ], "text/plain": [ " week indicator inc inc_low inc_up inc100 \\\n", "period \n", "1990-12-03/1990-12-09 199049 7 1143 0 2610 2 \n", "1990-12-10/1990-12-16 199050 7 11079 6660 15498 20 \n", "1990-12-17/1990-12-23 199051 7 19080 13807 24353 34 \n", "1990-12-24/1990-12-30 199052 7 19375 13295 25455 34 \n", "1990-12-31/1991-01-06 199101 7 15565 10271 20859 27 \n", "1991-01-07/1991-01-13 199102 7 16277 11046 21508 29 \n", "1991-01-14/1991-01-20 199103 7 15387 10484 20290 27 \n", "1991-01-21/1991-01-27 199104 7 7913 4563 11263 14 \n", "1991-01-28/1991-02-03 199105 7 10442 6544 14340 18 \n", "1991-02-04/1991-02-10 199106 7 10877 7013 14741 19 \n", "1991-02-11/1991-02-17 199107 7 12337 8077 16597 22 \n", "1991-02-18/1991-02-24 199108 7 13289 8813 17765 23 \n", "1991-02-25/1991-03-03 199109 7 13741 8780 18702 24 \n", "1991-03-04/1991-03-10 199110 7 16643 11372 21914 29 \n", "1991-03-11/1991-03-17 199111 7 15574 11184 19964 27 \n", "1991-03-18/1991-03-24 199112 7 10864 7331 14397 19 \n", "1991-03-25/1991-03-31 199113 7 9567 6041 13093 17 \n", "1991-04-01/1991-04-07 199114 7 12265 7684 16846 22 \n", "1991-04-08/1991-04-14 199115 7 13975 9781 18169 25 \n", "1991-04-15/1991-04-21 199116 7 14857 10068 19646 26 \n", "1991-04-22/1991-04-28 199117 7 13462 8877 18047 24 \n", "1991-04-29/1991-05-05 199118 7 21385 13882 28888 38 \n", "1991-05-06/1991-05-12 199119 7 16739 11246 22232 29 \n", "1991-05-13/1991-05-19 199120 7 19053 12742 25364 34 \n", "1991-05-20/1991-05-26 199121 7 14903 8975 20831 26 \n", "1991-05-27/1991-06-02 199122 7 15452 9953 20951 27 \n", "1991-06-03/1991-06-09 199123 7 11947 7671 16223 21 \n", "1991-06-10/1991-06-16 199124 7 16171 10071 22271 28 \n", "1991-06-17/1991-06-23 199125 7 16169 10700 21638 28 \n", "1991-06-24/1991-06-30 199126 7 17608 11304 23912 31 \n", "... ... ... ... ... ... ... 
\n", "2019-09-16/2019-09-22 201938 7 3078 1416 4740 5 \n", "2019-09-23/2019-09-29 201939 7 3137 1310 4964 5 \n", "2019-09-30/2019-10-06 201940 7 4211 2218 6204 6 \n", "2019-10-07/2019-10-13 201941 7 4130 2030 6230 6 \n", "2019-10-14/2019-10-20 201942 7 6279 3989 8569 10 \n", "2019-10-21/2019-10-27 201943 7 4834 2751 6917 7 \n", "2019-10-28/2019-11-03 201944 7 5728 3627 7829 9 \n", "2019-11-04/2019-11-10 201945 7 4492 2615 6369 7 \n", "2019-11-11/2019-11-17 201946 7 2638 1316 3960 4 \n", "2019-11-18/2019-11-24 201947 7 7536 5058 10014 11 \n", "2019-11-25/2019-12-01 201948 7 5542 3383 7701 8 \n", "2019-12-02/2019-12-08 201949 7 6621 4540 8702 10 \n", "2019-12-09/2019-12-15 201950 7 6424 4276 8572 10 \n", "2019-12-16/2019-12-22 201951 7 5823 3675 7971 9 \n", "2019-12-23/2019-12-29 201952 7 7941 5246 10636 12 \n", "2019-12-30/2020-01-05 202001 7 9835 7019 12651 15 \n", "2020-01-06/2020-01-12 202002 7 6534 4530 8538 10 \n", "2020-01-13/2020-01-19 202003 7 5968 4100 7836 9 \n", "2020-01-20/2020-01-26 202004 7 7991 5831 10151 12 \n", "2020-01-27/2020-02-02 202005 7 8505 6314 10696 13 \n", "2020-02-03/2020-02-09 202006 7 9264 6925 11603 14 \n", "2020-02-10/2020-02-16 202007 7 8959 6574 11344 14 \n", "2020-02-17/2020-02-23 202008 7 10424 7708 13140 16 \n", "2020-02-24/2020-03-01 202009 7 13631 10544 16718 21 \n", "2020-03-02/2020-03-08 202010 7 9011 6691 11331 14 \n", "2020-03-09/2020-03-15 202011 7 10198 7568 12828 15 \n", "2020-03-16/2020-03-22 202012 7 8123 5790 10456 12 \n", "2020-03-23/2020-03-29 202013 7 7326 5236 9416 11 \n", "2020-03-30/2020-04-05 202014 7 3879 2227 5531 6 \n", "2020-04-06/2020-04-12 202015 7 1931 682 3180 3 \n", "\n", " inc100_low inc100_up geo_insee geo_name \n", "period \n", "1990-12-03/1990-12-09 0 5 FR France \n", "1990-12-10/1990-12-16 12 28 FR France \n", "1990-12-17/1990-12-23 25 43 FR France \n", "1990-12-24/1990-12-30 23 45 FR France \n", "1990-12-31/1991-01-06 18 36 FR France \n", "1991-01-07/1991-01-13 20 38 FR France \n", 
"1991-01-14/1991-01-20 18 36 FR France \n", "1991-01-21/1991-01-27 8 20 FR France \n", "1991-01-28/1991-02-03 11 25 FR France \n", "1991-02-04/1991-02-10 12 26 FR France \n", "1991-02-11/1991-02-17 15 29 FR France \n", "1991-02-18/1991-02-24 15 31 FR France \n", "1991-02-25/1991-03-03 15 33 FR France \n", "1991-03-04/1991-03-10 20 38 FR France \n", "1991-03-11/1991-03-17 19 35 FR France \n", "1991-03-18/1991-03-24 13 25 FR France \n", "1991-03-25/1991-03-31 11 23 FR France \n", "1991-04-01/1991-04-07 14 30 FR France \n", "1991-04-08/1991-04-14 18 32 FR France \n", "1991-04-15/1991-04-21 18 34 FR France \n", "1991-04-22/1991-04-28 16 32 FR France \n", "1991-04-29/1991-05-05 25 51 FR France \n", "1991-05-06/1991-05-12 19 39 FR France \n", "1991-05-13/1991-05-19 23 45 FR France \n", "1991-05-20/1991-05-26 16 36 FR France \n", "1991-05-27/1991-06-02 17 37 FR France \n", "1991-06-03/1991-06-09 13 29 FR France \n", "1991-06-10/1991-06-16 17 39 FR France \n", "1991-06-17/1991-06-23 18 38 FR France \n", "1991-06-24/1991-06-30 20 42 FR France \n", "... ... ... ... ... 
\n", "2019-09-16/2019-09-22 2 8 FR France \n", "2019-09-23/2019-09-29 2 8 FR France \n", "2019-09-30/2019-10-06 3 9 FR France \n", "2019-10-07/2019-10-13 3 9 FR France \n", "2019-10-14/2019-10-20 7 13 FR France \n", "2019-10-21/2019-10-27 4 10 FR France \n", "2019-10-28/2019-11-03 6 12 FR France \n", "2019-11-04/2019-11-10 4 10 FR France \n", "2019-11-11/2019-11-17 2 6 FR France \n", "2019-11-18/2019-11-24 7 15 FR France \n", "2019-11-25/2019-12-01 5 11 FR France \n", "2019-12-02/2019-12-08 7 13 FR France \n", "2019-12-09/2019-12-15 7 13 FR France \n", "2019-12-16/2019-12-22 6 12 FR France \n", "2019-12-23/2019-12-29 8 16 FR France \n", "2019-12-30/2020-01-05 11 19 FR France \n", "2020-01-06/2020-01-12 7 13 FR France \n", "2020-01-13/2020-01-19 6 12 FR France \n", "2020-01-20/2020-01-26 9 15 FR France \n", "2020-01-27/2020-02-02 10 16 FR France \n", "2020-02-03/2020-02-09 10 18 FR France \n", "2020-02-10/2020-02-16 10 18 FR France \n", "2020-02-17/2020-02-23 12 20 FR France \n", "2020-02-24/2020-03-01 16 26 FR France \n", "2020-03-02/2020-03-08 10 18 FR France \n", "2020-03-09/2020-03-15 11 19 FR France \n", "2020-03-16/2020-03-22 8 16 FR France \n", "2020-03-23/2020-03-29 8 14 FR France \n", "2020-03-30/2020-04-05 3 9 FR France \n", "2020-04-06/2020-04-12 1 5 FR France \n", "\n", "[1532 rows x 10 columns]" ] }, "execution_count": 6, "metadata": {}, "output_type": "execute_result" } ], "source": [ "sorted_data = raw_data.set_index('period').sort_index()\n", "sorted_data" ] }, { "cell_type": "markdown", "metadata": {}, "source": [ "On cherche si nos données se suivent ou s'il y a des trous dans les dates:" ] }, { "cell_type": "code", "execution_count": 7, "metadata": {}, "outputs": [], "source": [ "periods = sorted_data.index\n", "for p1,p2 in zip(periods[:-1], periods[1:]):\n", " delta = p2.to_timestamp()-p1.end_time\n", " if delta > pd.Timedelta('1s'):\n", " print(p1,p2)" ] }, { "cell_type": "code", "execution_count": 8, "metadata": {}, "outputs": [ { "data": { 
"text/plain": [ "" ] }, "execution_count": 8, "metadata": {}, "output_type": "execute_result" }, { "data": { "image/png": "\n", "text/plain": [ "
" ] }, "metadata": { "needs_background": "light" }, "output_type": "display_data" } ], "source": [ "sorted_data['inc'].plot()" ] }, { "cell_type": "code", "execution_count": 9, "metadata": {}, "outputs": [ { "data": { "text/plain": [ "" ] }, "execution_count": 9, "metadata": {}, "output_type": "execute_result" }, { "data": { "image/png": "\n", "text/plain": [ "
" ] }, "metadata": { "needs_background": "light" }, "output_type": "display_data" } ], "source": [ "sorted_data['inc'][-200:].plot()" ] }, { "cell_type": "code", "execution_count": 10, "metadata": {}, "outputs": [], "source": [ "# Season boundaries: the weekly period containing September 1st of each year.\n", "# Only boundaries that fall inside the observed data are kept, so a truncated\n", "# first season (the series starts in December) is never summed as a full year.\n", "first_week, last_week = sorted_data.index[0], sorted_data.index[-1]\n", "september_candidates = (pd.Period(pd.Timestamp(y, 9, 1), 'W')\n", "                        for y in range(first_week.year, last_week.year + 1))\n", "first_september_weeks = [week for week in september_candidates\n", "                         if first_week <= week <= last_week]" ] }, { "cell_type": "code", "execution_count": 11, "metadata": {}, "outputs": [ { "data": { "text/plain": [ "[Period('1991-08-26/1991-09-01', 'W-SUN'),\n", " Period('1992-08-31/1992-09-06', 'W-SUN'),\n", " Period('1993-08-30/1993-09-05', 'W-SUN'),\n", " Period('1994-08-29/1994-09-04', 'W-SUN'),\n", " Period('1995-08-28/1995-09-03', 'W-SUN'),\n", " Period('1996-08-26/1996-09-01', 'W-SUN'),\n", " Period('1997-09-01/1997-09-07', 'W-SUN'),\n", " Period('1998-08-31/1998-09-06', 'W-SUN'),\n", " Period('1999-08-30/1999-09-05', 'W-SUN'),\n", " Period('2000-08-28/2000-09-03', 'W-SUN'),\n", " Period('2001-08-27/2001-09-02', 'W-SUN'),\n", " Period('2002-08-26/2002-09-01', 'W-SUN'),\n", " Period('2003-09-01/2003-09-07', 'W-SUN'),\n", " Period('2004-08-30/2004-09-05', 'W-SUN'),\n", " Period('2005-08-29/2005-09-04', 'W-SUN'),\n", " Period('2006-08-28/2006-09-03', 'W-SUN'),\n", " Period('2007-08-27/2007-09-02', 'W-SUN'),\n", " Period('2008-09-01/2008-09-07', 'W-SUN'),\n", " Period('2009-08-31/2009-09-06', 'W-SUN'),\n", " Period('2010-08-30/2010-09-05', 'W-SUN'),\n", " Period('2011-08-29/2011-09-04', 'W-SUN'),\n", " Period('2012-08-27/2012-09-02', 'W-SUN'),\n", " Period('2013-08-26/2013-09-01', 'W-SUN'),\n", " Period('2014-09-01/2014-09-07', 'W-SUN'),\n", " Period('2015-08-31/2015-09-06', 'W-SUN'),\n", " Period('2016-08-29/2016-09-04', 'W-SUN'),\n", " Period('2017-08-28/2017-09-03', 'W-SUN'),\n", " Period('2018-08-27/2018-09-02', 'W-SUN'),\n", " Period('2019-08-26/2019-09-01', 'W-SUN')]" ] }, "execution_count": 11, "metadata": {}, "output_type": "execute_result" } ], "source": [ 
"first_september_weeks  # weeks containing September 1st" ] }, { "cell_type": "code", "execution_count": 12, "metadata": {}, "outputs": [], "source": [ "year = []\n", "yearly_incidence = []\n", "for week1, week2 in zip(first_september_weeks[:-1], first_september_weeks[1:]):\n", "    # A season runs from one September boundary week up to and including\n", "    # the week just before the next boundary.\n", "    one_year = sorted_data['inc'][week1:week2-1]\n", "    # The season length must be within one week of 52; anything else means\n", "    # weeks are missing (or duplicated) and the yearly sum would be wrong.\n", "    assert abs(len(one_year) - 52) < 2, f'season ending in {week2.year} has {len(one_year)} weeks'\n", "    yearly_incidence.append(one_year.sum())\n", "    year.append(week2.year)" ] }, { "cell_type": "code", "execution_count": 13, "metadata": {}, "outputs": [], "source": [ "yearly_incidence = pd.Series(index=year, data=yearly_incidence)" ] }, { "cell_type": "code", "execution_count": 14, "metadata": {}, "outputs": [ { "data": { "text/plain": [ "" ] }, "execution_count": 14, "metadata": {}, "output_type": "execute_result" }, { "data": { "image/png": "\n", "text/plain": [ "
" ] }, "metadata": { "needs_background": "light" }, "output_type": "display_data" } ], "source": [ "yearly_incidence.plot(style='*')" ] }, { "cell_type": "code", "execution_count": 15, "metadata": {}, "outputs": [ { "data": { "text/plain": [ "2002 516689\n", "2018 542312\n", "2017 551041\n", "1996 564901\n", "2019 584066\n", "2015 604382\n", "2000 617597\n", "2001 619041\n", "2012 624573\n", "2005 628464\n", "2006 632833\n", "2011 642368\n", "1993 643387\n", "1995 652478\n", "1994 661409\n", "1998 677775\n", "1997 683434\n", "2014 685769\n", "2013 698332\n", "2007 717352\n", "2008 749478\n", "1999 756456\n", "2003 758363\n", "2004 777388\n", "2016 782114\n", "2010 829911\n", "1992 832939\n", "2009 842373\n", "dtype: int64" ] }, "execution_count": 15, "metadata": {}, "output_type": "execute_result" } ], "source": [ "yearly_incidence.sort_values()" ] }, { "cell_type": "markdown", "metadata": {}, "source": [ "Année avec la plus forte incidence: 2009; la plus faible : 2002" ] }, { "cell_type": "code", "execution_count": null, "metadata": {}, "outputs": [], "source": [] } ], "metadata": { "kernelspec": { "display_name": "Python 3", "language": "python", "name": "python3" }, "language_info": { "codemirror_mode": { "name": "ipython", "version": 3 }, "file_extension": ".py", "mimetype": "text/x-python", "name": "python", "nbconvert_exporter": "python", "pygments_lexer": "ipython3", "version": "3.6.4" } }, "nbformat": 4, "nbformat_minor": 2 }