chargement et vérification des données

parent 230df3bd
{
"cells": [],
"cells": [
{
"cell_type": "markdown",
"metadata": {
"hideCode": true,
"hidePrompt": true
},
"source": [
"# Analyse de la varicelle"
]
},
{
"cell_type": "code",
"execution_count": 2,
"metadata": {
"hideCode": true,
"hidePrompt": true
},
"outputs": [],
"source": [
"%matplotlib inline\n",
"import matplotlib.pyplot as plt\n",
"import pandas as pd\n",
"import isoweek"
]
},
{
"cell_type": "code",
"execution_count": 3,
"metadata": {
"hideCode": true,
"hidePrompt": true
},
"outputs": [],
"source": [
"data_url = 'http://www.sentiweb.fr/datasets/incidence-PAY-7.csv'"
]
},
{
"cell_type": "code",
"execution_count": 4,
"metadata": {
"hideCode": true,
"hidePrompt": true
},
"outputs": [
{
"data": {
"text/html": [
"<div>\n",
"<style scoped>\n",
" .dataframe tbody tr th:only-of-type {\n",
" vertical-align: middle;\n",
" }\n",
"\n",
" .dataframe tbody tr th {\n",
" vertical-align: top;\n",
" }\n",
"\n",
" .dataframe thead th {\n",
" text-align: right;\n",
" }\n",
"</style>\n",
"<table border=\"1\" class=\"dataframe\">\n",
" <thead>\n",
" <tr style=\"text-align: right;\">\n",
" <th></th>\n",
" <th>week</th>\n",
" <th>indicator</th>\n",
" <th>inc</th>\n",
" <th>inc_low</th>\n",
" <th>inc_up</th>\n",
" <th>inc100</th>\n",
" <th>inc100_low</th>\n",
" <th>inc100_up</th>\n",
" <th>geo_insee</th>\n",
" <th>geo_name</th>\n",
" </tr>\n",
" </thead>\n",
" <tbody>\n",
" <tr>\n",
" <th>0</th>\n",
" <td>202018</td>\n",
" <td>7</td>\n",
" <td>912</td>\n",
" <td>47</td>\n",
" <td>1777</td>\n",
" <td>1</td>\n",
" <td>0</td>\n",
" <td>2</td>\n",
" <td>FR</td>\n",
" <td>France</td>\n",
" </tr>\n",
" <tr>\n",
" <th>1</th>\n",
" <td>202017</td>\n",
" <td>7</td>\n",
" <td>272</td>\n",
" <td>0</td>\n",
" <td>658</td>\n",
" <td>0</td>\n",
" <td>0</td>\n",
" <td>1</td>\n",
" <td>FR</td>\n",
" <td>France</td>\n",
" </tr>\n",
" <tr>\n",
" <th>2</th>\n",
" <td>202016</td>\n",
" <td>7</td>\n",
" <td>758</td>\n",
" <td>78</td>\n",
" <td>1438</td>\n",
" <td>1</td>\n",
" <td>0</td>\n",
" <td>2</td>\n",
" <td>FR</td>\n",
" <td>France</td>\n",
" </tr>\n",
" <tr>\n",
" <th>3</th>\n",
" <td>202015</td>\n",
" <td>7</td>\n",
" <td>1918</td>\n",
" <td>675</td>\n",
" <td>3161</td>\n",
" <td>3</td>\n",
" <td>1</td>\n",
" <td>5</td>\n",
" <td>FR</td>\n",
" <td>France</td>\n",
" </tr>\n",
" <tr>\n",
" <th>4</th>\n",
" <td>202014</td>\n",
" <td>7</td>\n",
" <td>3879</td>\n",
" <td>2227</td>\n",
" <td>5531</td>\n",
" <td>6</td>\n",
" <td>3</td>\n",
" <td>9</td>\n",
" <td>FR</td>\n",
" <td>France</td>\n",
" </tr>\n",
" <tr>\n",
" <th>5</th>\n",
" <td>202013</td>\n",
" <td>7</td>\n",
" <td>7326</td>\n",
" <td>5236</td>\n",
" <td>9416</td>\n",
" <td>11</td>\n",
" <td>8</td>\n",
" <td>14</td>\n",
" <td>FR</td>\n",
" <td>France</td>\n",
" </tr>\n",
" <tr>\n",
" <th>6</th>\n",
" <td>202012</td>\n",
" <td>7</td>\n",
" <td>8123</td>\n",
" <td>5790</td>\n",
" <td>10456</td>\n",
" <td>12</td>\n",
" <td>8</td>\n",
" <td>16</td>\n",
" <td>FR</td>\n",
" <td>France</td>\n",
" </tr>\n",
" <tr>\n",
" <th>7</th>\n",
" <td>202011</td>\n",
" <td>7</td>\n",
" <td>10198</td>\n",
" <td>7568</td>\n",
" <td>12828</td>\n",
" <td>15</td>\n",
" <td>11</td>\n",
" <td>19</td>\n",
" <td>FR</td>\n",
" <td>France</td>\n",
" </tr>\n",
" <tr>\n",
" <th>8</th>\n",
" <td>202010</td>\n",
" <td>7</td>\n",
" <td>9011</td>\n",
" <td>6691</td>\n",
" <td>11331</td>\n",
" <td>14</td>\n",
" <td>10</td>\n",
" <td>18</td>\n",
" <td>FR</td>\n",
" <td>France</td>\n",
" </tr>\n",
" <tr>\n",
" <th>9</th>\n",
" <td>202009</td>\n",
" <td>7</td>\n",
" <td>13631</td>\n",
" <td>10544</td>\n",
" <td>16718</td>\n",
" <td>21</td>\n",
" <td>16</td>\n",
" <td>26</td>\n",
" <td>FR</td>\n",
" <td>France</td>\n",
" </tr>\n",
" <tr>\n",
" <th>10</th>\n",
" <td>202008</td>\n",
" <td>7</td>\n",
" <td>10424</td>\n",
" <td>7708</td>\n",
" <td>13140</td>\n",
" <td>16</td>\n",
" <td>12</td>\n",
" <td>20</td>\n",
" <td>FR</td>\n",
" <td>France</td>\n",
" </tr>\n",
" <tr>\n",
" <th>11</th>\n",
" <td>202007</td>\n",
" <td>7</td>\n",
" <td>8959</td>\n",
" <td>6574</td>\n",
" <td>11344</td>\n",
" <td>14</td>\n",
" <td>10</td>\n",
" <td>18</td>\n",
" <td>FR</td>\n",
" <td>France</td>\n",
" </tr>\n",
" <tr>\n",
" <th>12</th>\n",
" <td>202006</td>\n",
" <td>7</td>\n",
" <td>9264</td>\n",
" <td>6925</td>\n",
" <td>11603</td>\n",
" <td>14</td>\n",
" <td>10</td>\n",
" <td>18</td>\n",
" <td>FR</td>\n",
" <td>France</td>\n",
" </tr>\n",
" <tr>\n",
" <th>13</th>\n",
" <td>202005</td>\n",
" <td>7</td>\n",
" <td>8505</td>\n",
" <td>6314</td>\n",
" <td>10696</td>\n",
" <td>13</td>\n",
" <td>10</td>\n",
" <td>16</td>\n",
" <td>FR</td>\n",
" <td>France</td>\n",
" </tr>\n",
" <tr>\n",
" <th>14</th>\n",
" <td>202004</td>\n",
" <td>7</td>\n",
" <td>7991</td>\n",
" <td>5831</td>\n",
" <td>10151</td>\n",
" <td>12</td>\n",
" <td>9</td>\n",
" <td>15</td>\n",
" <td>FR</td>\n",
" <td>France</td>\n",
" </tr>\n",
" <tr>\n",
" <th>15</th>\n",
" <td>202003</td>\n",
" <td>7</td>\n",
" <td>5968</td>\n",
" <td>4100</td>\n",
" <td>7836</td>\n",
" <td>9</td>\n",
" <td>6</td>\n",
" <td>12</td>\n",
" <td>FR</td>\n",
" <td>France</td>\n",
" </tr>\n",
" <tr>\n",
" <th>16</th>\n",
" <td>202002</td>\n",
" <td>7</td>\n",
" <td>6534</td>\n",
" <td>4530</td>\n",
" <td>8538</td>\n",
" <td>10</td>\n",
" <td>7</td>\n",
" <td>13</td>\n",
" <td>FR</td>\n",
" <td>France</td>\n",
" </tr>\n",
" <tr>\n",
" <th>17</th>\n",
" <td>202001</td>\n",
" <td>7</td>\n",
" <td>9835</td>\n",
" <td>7019</td>\n",
" <td>12651</td>\n",
" <td>15</td>\n",
" <td>11</td>\n",
" <td>19</td>\n",
" <td>FR</td>\n",
" <td>France</td>\n",
" </tr>\n",
" <tr>\n",
" <th>18</th>\n",
" <td>201952</td>\n",
" <td>7</td>\n",
" <td>7941</td>\n",
" <td>5246</td>\n",
" <td>10636</td>\n",
" <td>12</td>\n",
" <td>8</td>\n",
" <td>16</td>\n",
" <td>FR</td>\n",
" <td>France</td>\n",
" </tr>\n",
" <tr>\n",
" <th>19</th>\n",
" <td>201951</td>\n",
" <td>7</td>\n",
" <td>5823</td>\n",
" <td>3675</td>\n",
" <td>7971</td>\n",
" <td>9</td>\n",
" <td>6</td>\n",
" <td>12</td>\n",
" <td>FR</td>\n",
" <td>France</td>\n",
" </tr>\n",
" <tr>\n",
" <th>20</th>\n",
" <td>201950</td>\n",
" <td>7</td>\n",
" <td>6424</td>\n",
" <td>4276</td>\n",
" <td>8572</td>\n",
" <td>10</td>\n",
" <td>7</td>\n",
" <td>13</td>\n",
" <td>FR</td>\n",
" <td>France</td>\n",
" </tr>\n",
" <tr>\n",
" <th>21</th>\n",
" <td>201949</td>\n",
" <td>7</td>\n",
" <td>6621</td>\n",
" <td>4540</td>\n",
" <td>8702</td>\n",
" <td>10</td>\n",
" <td>7</td>\n",
" <td>13</td>\n",
" <td>FR</td>\n",
" <td>France</td>\n",
" </tr>\n",
" <tr>\n",
" <th>22</th>\n",
" <td>201948</td>\n",
" <td>7</td>\n",
" <td>5542</td>\n",
" <td>3383</td>\n",
" <td>7701</td>\n",
" <td>8</td>\n",
" <td>5</td>\n",
" <td>11</td>\n",
" <td>FR</td>\n",
" <td>France</td>\n",
" </tr>\n",
" <tr>\n",
" <th>23</th>\n",
" <td>201947</td>\n",
" <td>7</td>\n",
" <td>7536</td>\n",
" <td>5058</td>\n",
" <td>10014</td>\n",
" <td>11</td>\n",
" <td>7</td>\n",
" <td>15</td>\n",
" <td>FR</td>\n",
" <td>France</td>\n",
" </tr>\n",
" <tr>\n",
" <th>24</th>\n",
" <td>201946</td>\n",
" <td>7</td>\n",
" <td>2638</td>\n",
" <td>1316</td>\n",
" <td>3960</td>\n",
" <td>4</td>\n",
" <td>2</td>\n",
" <td>6</td>\n",
" <td>FR</td>\n",
" <td>France</td>\n",
" </tr>\n",
" <tr>\n",
" <th>25</th>\n",
" <td>201945</td>\n",
" <td>7</td>\n",
" <td>4492</td>\n",
" <td>2615</td>\n",
" <td>6369</td>\n",
" <td>7</td>\n",
" <td>4</td>\n",
" <td>10</td>\n",
" <td>FR</td>\n",
" <td>France</td>\n",
" </tr>\n",
" <tr>\n",
" <th>26</th>\n",
" <td>201944</td>\n",
" <td>7</td>\n",
" <td>5728</td>\n",
" <td>3627</td>\n",
" <td>7829</td>\n",
" <td>9</td>\n",
" <td>6</td>\n",
" <td>12</td>\n",
" <td>FR</td>\n",
" <td>France</td>\n",
" </tr>\n",
" <tr>\n",
" <th>27</th>\n",
" <td>201943</td>\n",
" <td>7</td>\n",
" <td>4834</td>\n",
" <td>2751</td>\n",
" <td>6917</td>\n",
" <td>7</td>\n",
" <td>4</td>\n",
" <td>10</td>\n",
" <td>FR</td>\n",
" <td>France</td>\n",
" </tr>\n",
" <tr>\n",
" <th>28</th>\n",
" <td>201942</td>\n",
" <td>7</td>\n",
" <td>6279</td>\n",
" <td>3989</td>\n",
" <td>8569</td>\n",
" <td>10</td>\n",
" <td>7</td>\n",
" <td>13</td>\n",
" <td>FR</td>\n",
" <td>France</td>\n",
" </tr>\n",
" <tr>\n",
" <th>29</th>\n",
" <td>201941</td>\n",
" <td>7</td>\n",
" <td>4130</td>\n",
" <td>2030</td>\n",
" <td>6230</td>\n",
" <td>6</td>\n",
" <td>3</td>\n",
" <td>9</td>\n",
" <td>FR</td>\n",
" <td>France</td>\n",
" </tr>\n",
" <tr>\n",
" <th>...</th>\n",
" <td>...</td>\n",
" <td>...</td>\n",
" <td>...</td>\n",
" <td>...</td>\n",
" <td>...</td>\n",
" <td>...</td>\n",
" <td>...</td>\n",
" <td>...</td>\n",
" <td>...</td>\n",
" <td>...</td>\n",
" </tr>\n",
" <tr>\n",
" <th>1505</th>\n",
" <td>199126</td>\n",
" <td>7</td>\n",
" <td>17608</td>\n",
" <td>11304</td>\n",
" <td>23912</td>\n",
" <td>31</td>\n",
" <td>20</td>\n",
" <td>42</td>\n",
" <td>FR</td>\n",
" <td>France</td>\n",
" </tr>\n",
" <tr>\n",
" <th>1506</th>\n",
" <td>199125</td>\n",
" <td>7</td>\n",
" <td>16169</td>\n",
" <td>10700</td>\n",
" <td>21638</td>\n",
" <td>28</td>\n",
" <td>18</td>\n",
" <td>38</td>\n",
" <td>FR</td>\n",
" <td>France</td>\n",
" </tr>\n",
" <tr>\n",
" <th>1507</th>\n",
" <td>199124</td>\n",
" <td>7</td>\n",
" <td>16171</td>\n",
" <td>10071</td>\n",
" <td>22271</td>\n",
" <td>28</td>\n",
" <td>17</td>\n",
" <td>39</td>\n",
" <td>FR</td>\n",
" <td>France</td>\n",
" </tr>\n",
" <tr>\n",
" <th>1508</th>\n",
" <td>199123</td>\n",
" <td>7</td>\n",
" <td>11947</td>\n",
" <td>7671</td>\n",
" <td>16223</td>\n",
" <td>21</td>\n",
" <td>13</td>\n",
" <td>29</td>\n",
" <td>FR</td>\n",
" <td>France</td>\n",
" </tr>\n",
" <tr>\n",
" <th>1509</th>\n",
" <td>199122</td>\n",
" <td>7</td>\n",
" <td>15452</td>\n",
" <td>9953</td>\n",
" <td>20951</td>\n",
" <td>27</td>\n",
" <td>17</td>\n",
" <td>37</td>\n",
" <td>FR</td>\n",
" <td>France</td>\n",
" </tr>\n",
" <tr>\n",
" <th>1510</th>\n",
" <td>199121</td>\n",
" <td>7</td>\n",
" <td>14903</td>\n",
" <td>8975</td>\n",
" <td>20831</td>\n",
" <td>26</td>\n",
" <td>16</td>\n",
" <td>36</td>\n",
" <td>FR</td>\n",
" <td>France</td>\n",
" </tr>\n",
" <tr>\n",
" <th>1511</th>\n",
" <td>199120</td>\n",
" <td>7</td>\n",
" <td>19053</td>\n",
" <td>12742</td>\n",
" <td>25364</td>\n",
" <td>34</td>\n",
" <td>23</td>\n",
" <td>45</td>\n",
" <td>FR</td>\n",
" <td>France</td>\n",
" </tr>\n",
" <tr>\n",
" <th>1512</th>\n",
" <td>199119</td>\n",
" <td>7</td>\n",
" <td>16739</td>\n",
" <td>11246</td>\n",
" <td>22232</td>\n",
" <td>29</td>\n",
" <td>19</td>\n",
" <td>39</td>\n",
" <td>FR</td>\n",
" <td>France</td>\n",
" </tr>\n",
" <tr>\n",
" <th>1513</th>\n",
" <td>199118</td>\n",
" <td>7</td>\n",
" <td>21385</td>\n",
" <td>13882</td>\n",
" <td>28888</td>\n",
" <td>38</td>\n",
" <td>25</td>\n",
" <td>51</td>\n",
" <td>FR</td>\n",
" <td>France</td>\n",
" </tr>\n",
" <tr>\n",
" <th>1514</th>\n",
" <td>199117</td>\n",
" <td>7</td>\n",
" <td>13462</td>\n",
" <td>8877</td>\n",
" <td>18047</td>\n",
" <td>24</td>\n",
" <td>16</td>\n",
" <td>32</td>\n",
" <td>FR</td>\n",
" <td>France</td>\n",
" </tr>\n",
" <tr>\n",
" <th>1515</th>\n",
" <td>199116</td>\n",
" <td>7</td>\n",
" <td>14857</td>\n",
" <td>10068</td>\n",
" <td>19646</td>\n",
" <td>26</td>\n",
" <td>18</td>\n",
" <td>34</td>\n",
" <td>FR</td>\n",
" <td>France</td>\n",
" </tr>\n",
" <tr>\n",
" <th>1516</th>\n",
" <td>199115</td>\n",
" <td>7</td>\n",
" <td>13975</td>\n",
" <td>9781</td>\n",
" <td>18169</td>\n",
" <td>25</td>\n",
" <td>18</td>\n",
" <td>32</td>\n",
" <td>FR</td>\n",
" <td>France</td>\n",
" </tr>\n",
" <tr>\n",
" <th>1517</th>\n",
" <td>199114</td>\n",
" <td>7</td>\n",
" <td>12265</td>\n",
" <td>7684</td>\n",
" <td>16846</td>\n",
" <td>22</td>\n",
" <td>14</td>\n",
" <td>30</td>\n",
" <td>FR</td>\n",
" <td>France</td>\n",
" </tr>\n",
" <tr>\n",
" <th>1518</th>\n",
" <td>199113</td>\n",
" <td>7</td>\n",
" <td>9567</td>\n",
" <td>6041</td>\n",
" <td>13093</td>\n",
" <td>17</td>\n",
" <td>11</td>\n",
" <td>23</td>\n",
" <td>FR</td>\n",
" <td>France</td>\n",
" </tr>\n",
" <tr>\n",
" <th>1519</th>\n",
" <td>199112</td>\n",
" <td>7</td>\n",
" <td>10864</td>\n",
" <td>7331</td>\n",
" <td>14397</td>\n",
" <td>19</td>\n",
" <td>13</td>\n",
" <td>25</td>\n",
" <td>FR</td>\n",
" <td>France</td>\n",
" </tr>\n",
" <tr>\n",
" <th>1520</th>\n",
" <td>199111</td>\n",
" <td>7</td>\n",
" <td>15574</td>\n",
" <td>11184</td>\n",
" <td>19964</td>\n",
" <td>27</td>\n",
" <td>19</td>\n",
" <td>35</td>\n",
" <td>FR</td>\n",
" <td>France</td>\n",
" </tr>\n",
" <tr>\n",
" <th>1521</th>\n",
" <td>199110</td>\n",
" <td>7</td>\n",
" <td>16643</td>\n",
" <td>11372</td>\n",
" <td>21914</td>\n",
" <td>29</td>\n",
" <td>20</td>\n",
" <td>38</td>\n",
" <td>FR</td>\n",
" <td>France</td>\n",
" </tr>\n",
" <tr>\n",
" <th>1522</th>\n",
" <td>199109</td>\n",
" <td>7</td>\n",
" <td>13741</td>\n",
" <td>8780</td>\n",
" <td>18702</td>\n",
" <td>24</td>\n",
" <td>15</td>\n",
" <td>33</td>\n",
" <td>FR</td>\n",
" <td>France</td>\n",
" </tr>\n",
" <tr>\n",
" <th>1523</th>\n",
" <td>199108</td>\n",
" <td>7</td>\n",
" <td>13289</td>\n",
" <td>8813</td>\n",
" <td>17765</td>\n",
" <td>23</td>\n",
" <td>15</td>\n",
" <td>31</td>\n",
" <td>FR</td>\n",
" <td>France</td>\n",
" </tr>\n",
" <tr>\n",
" <th>1524</th>\n",
" <td>199107</td>\n",
" <td>7</td>\n",
" <td>12337</td>\n",
" <td>8077</td>\n",
" <td>16597</td>\n",
" <td>22</td>\n",
" <td>15</td>\n",
" <td>29</td>\n",
" <td>FR</td>\n",
" <td>France</td>\n",
" </tr>\n",
" <tr>\n",
" <th>1525</th>\n",
" <td>199106</td>\n",
" <td>7</td>\n",
" <td>10877</td>\n",
" <td>7013</td>\n",
" <td>14741</td>\n",
" <td>19</td>\n",
" <td>12</td>\n",
" <td>26</td>\n",
" <td>FR</td>\n",
" <td>France</td>\n",
" </tr>\n",
" <tr>\n",
" <th>1526</th>\n",
" <td>199105</td>\n",
" <td>7</td>\n",
" <td>10442</td>\n",
" <td>6544</td>\n",
" <td>14340</td>\n",
" <td>18</td>\n",
" <td>11</td>\n",
" <td>25</td>\n",
" <td>FR</td>\n",
" <td>France</td>\n",
" </tr>\n",
" <tr>\n",
" <th>1527</th>\n",
" <td>199104</td>\n",
" <td>7</td>\n",
" <td>7913</td>\n",
" <td>4563</td>\n",
" <td>11263</td>\n",
" <td>14</td>\n",
" <td>8</td>\n",
" <td>20</td>\n",
" <td>FR</td>\n",
" <td>France</td>\n",
" </tr>\n",
" <tr>\n",
" <th>1528</th>\n",
" <td>199103</td>\n",
" <td>7</td>\n",
" <td>15387</td>\n",
" <td>10484</td>\n",
" <td>20290</td>\n",
" <td>27</td>\n",
" <td>18</td>\n",
" <td>36</td>\n",
" <td>FR</td>\n",
" <td>France</td>\n",
" </tr>\n",
" <tr>\n",
" <th>1529</th>\n",
" <td>199102</td>\n",
" <td>7</td>\n",
" <td>16277</td>\n",
" <td>11046</td>\n",
" <td>21508</td>\n",
" <td>29</td>\n",
" <td>20</td>\n",
" <td>38</td>\n",
" <td>FR</td>\n",
" <td>France</td>\n",
" </tr>\n",
" <tr>\n",
" <th>1530</th>\n",
" <td>199101</td>\n",
" <td>7</td>\n",
" <td>15565</td>\n",
" <td>10271</td>\n",
" <td>20859</td>\n",
" <td>27</td>\n",
" <td>18</td>\n",
" <td>36</td>\n",
" <td>FR</td>\n",
" <td>France</td>\n",
" </tr>\n",
" <tr>\n",
" <th>1531</th>\n",
" <td>199052</td>\n",
" <td>7</td>\n",
" <td>19375</td>\n",
" <td>13295</td>\n",
" <td>25455</td>\n",
" <td>34</td>\n",
" <td>23</td>\n",
" <td>45</td>\n",
" <td>FR</td>\n",
" <td>France</td>\n",
" </tr>\n",
" <tr>\n",
" <th>1532</th>\n",
" <td>199051</td>\n",
" <td>7</td>\n",
" <td>19080</td>\n",
" <td>13807</td>\n",
" <td>24353</td>\n",
" <td>34</td>\n",
" <td>25</td>\n",
" <td>43</td>\n",
" <td>FR</td>\n",
" <td>France</td>\n",
" </tr>\n",
" <tr>\n",
" <th>1533</th>\n",
" <td>199050</td>\n",
" <td>7</td>\n",
" <td>11079</td>\n",
" <td>6660</td>\n",
" <td>15498</td>\n",
" <td>20</td>\n",
" <td>12</td>\n",
" <td>28</td>\n",
" <td>FR</td>\n",
" <td>France</td>\n",
" </tr>\n",
" <tr>\n",
" <th>1534</th>\n",
" <td>199049</td>\n",
" <td>7</td>\n",
" <td>1143</td>\n",
" <td>0</td>\n",
" <td>2610</td>\n",
" <td>2</td>\n",
" <td>0</td>\n",
" <td>5</td>\n",
" <td>FR</td>\n",
" <td>France</td>\n",
" </tr>\n",
" </tbody>\n",
"</table>\n",
"<p>1535 rows × 10 columns</p>\n",
"</div>"
],
"text/plain": [
" week indicator inc inc_low inc_up inc100 inc100_low \\\n",
"0 202018 7 912 47 1777 1 0 \n",
"1 202017 7 272 0 658 0 0 \n",
"2 202016 7 758 78 1438 1 0 \n",
"3 202015 7 1918 675 3161 3 1 \n",
"4 202014 7 3879 2227 5531 6 3 \n",
"5 202013 7 7326 5236 9416 11 8 \n",
"6 202012 7 8123 5790 10456 12 8 \n",
"7 202011 7 10198 7568 12828 15 11 \n",
"8 202010 7 9011 6691 11331 14 10 \n",
"9 202009 7 13631 10544 16718 21 16 \n",
"10 202008 7 10424 7708 13140 16 12 \n",
"11 202007 7 8959 6574 11344 14 10 \n",
"12 202006 7 9264 6925 11603 14 10 \n",
"13 202005 7 8505 6314 10696 13 10 \n",
"14 202004 7 7991 5831 10151 12 9 \n",
"15 202003 7 5968 4100 7836 9 6 \n",
"16 202002 7 6534 4530 8538 10 7 \n",
"17 202001 7 9835 7019 12651 15 11 \n",
"18 201952 7 7941 5246 10636 12 8 \n",
"19 201951 7 5823 3675 7971 9 6 \n",
"20 201950 7 6424 4276 8572 10 7 \n",
"21 201949 7 6621 4540 8702 10 7 \n",
"22 201948 7 5542 3383 7701 8 5 \n",
"23 201947 7 7536 5058 10014 11 7 \n",
"24 201946 7 2638 1316 3960 4 2 \n",
"25 201945 7 4492 2615 6369 7 4 \n",
"26 201944 7 5728 3627 7829 9 6 \n",
"27 201943 7 4834 2751 6917 7 4 \n",
"28 201942 7 6279 3989 8569 10 7 \n",
"29 201941 7 4130 2030 6230 6 3 \n",
"... ... ... ... ... ... ... ... \n",
"1505 199126 7 17608 11304 23912 31 20 \n",
"1506 199125 7 16169 10700 21638 28 18 \n",
"1507 199124 7 16171 10071 22271 28 17 \n",
"1508 199123 7 11947 7671 16223 21 13 \n",
"1509 199122 7 15452 9953 20951 27 17 \n",
"1510 199121 7 14903 8975 20831 26 16 \n",
"1511 199120 7 19053 12742 25364 34 23 \n",
"1512 199119 7 16739 11246 22232 29 19 \n",
"1513 199118 7 21385 13882 28888 38 25 \n",
"1514 199117 7 13462 8877 18047 24 16 \n",
"1515 199116 7 14857 10068 19646 26 18 \n",
"1516 199115 7 13975 9781 18169 25 18 \n",
"1517 199114 7 12265 7684 16846 22 14 \n",
"1518 199113 7 9567 6041 13093 17 11 \n",
"1519 199112 7 10864 7331 14397 19 13 \n",
"1520 199111 7 15574 11184 19964 27 19 \n",
"1521 199110 7 16643 11372 21914 29 20 \n",
"1522 199109 7 13741 8780 18702 24 15 \n",
"1523 199108 7 13289 8813 17765 23 15 \n",
"1524 199107 7 12337 8077 16597 22 15 \n",
"1525 199106 7 10877 7013 14741 19 12 \n",
"1526 199105 7 10442 6544 14340 18 11 \n",
"1527 199104 7 7913 4563 11263 14 8 \n",
"1528 199103 7 15387 10484 20290 27 18 \n",
"1529 199102 7 16277 11046 21508 29 20 \n",
"1530 199101 7 15565 10271 20859 27 18 \n",
"1531 199052 7 19375 13295 25455 34 23 \n",
"1532 199051 7 19080 13807 24353 34 25 \n",
"1533 199050 7 11079 6660 15498 20 12 \n",
"1534 199049 7 1143 0 2610 2 0 \n",
"\n",
" inc100_up geo_insee geo_name \n",
"0 2 FR France \n",
"1 1 FR France \n",
"2 2 FR France \n",
"3 5 FR France \n",
"4 9 FR France \n",
"5 14 FR France \n",
"6 16 FR France \n",
"7 19 FR France \n",
"8 18 FR France \n",
"9 26 FR France \n",
"10 20 FR France \n",
"11 18 FR France \n",
"12 18 FR France \n",
"13 16 FR France \n",
"14 15 FR France \n",
"15 12 FR France \n",
"16 13 FR France \n",
"17 19 FR France \n",
"18 16 FR France \n",
"19 12 FR France \n",
"20 13 FR France \n",
"21 13 FR France \n",
"22 11 FR France \n",
"23 15 FR France \n",
"24 6 FR France \n",
"25 10 FR France \n",
"26 12 FR France \n",
"27 10 FR France \n",
"28 13 FR France \n",
"29 9 FR France \n",
"... ... ... ... \n",
"1505 42 FR France \n",
"1506 38 FR France \n",
"1507 39 FR France \n",
"1508 29 FR France \n",
"1509 37 FR France \n",
"1510 36 FR France \n",
"1511 45 FR France \n",
"1512 39 FR France \n",
"1513 51 FR France \n",
"1514 32 FR France \n",
"1515 34 FR France \n",
"1516 32 FR France \n",
"1517 30 FR France \n",
"1518 23 FR France \n",
"1519 25 FR France \n",
"1520 35 FR France \n",
"1521 38 FR France \n",
"1522 33 FR France \n",
"1523 31 FR France \n",
"1524 29 FR France \n",
"1525 26 FR France \n",
"1526 25 FR France \n",
"1527 20 FR France \n",
"1528 36 FR France \n",
"1529 38 FR France \n",
"1530 36 FR France \n",
"1531 45 FR France \n",
"1532 43 FR France \n",
"1533 28 FR France \n",
"1534 5 FR France \n",
"\n",
"[1535 rows x 10 columns]"
]
},
"execution_count": 4,
"metadata": {},
"output_type": "execute_result"
}
],
"source": [
"raw_data = pd.read_csv(data_url, skiprows=1)\n",
"raw_data"
]
},
{
"cell_type": "markdown",
"metadata": {
"hideCode": true,
"hidePrompt": true
},
"source": [
"Analyse des points manquants"
]
},
{
"cell_type": "code",
"execution_count": 5,
"metadata": {
"hideCode": true,
"hidePrompt": true
},
"outputs": [
{
"data": {
"text/html": [
"<div>\n",
"<style scoped>\n",
" .dataframe tbody tr th:only-of-type {\n",
" vertical-align: middle;\n",
" }\n",
"\n",
" .dataframe tbody tr th {\n",
" vertical-align: top;\n",
" }\n",
"\n",
" .dataframe thead th {\n",
" text-align: right;\n",
" }\n",
"</style>\n",
"<table border=\"1\" class=\"dataframe\">\n",
" <thead>\n",
" <tr style=\"text-align: right;\">\n",
" <th></th>\n",
" <th>week</th>\n",
" <th>indicator</th>\n",
" <th>inc</th>\n",
" <th>inc_low</th>\n",
" <th>inc_up</th>\n",
" <th>inc100</th>\n",
" <th>inc100_low</th>\n",
" <th>inc100_up</th>\n",
" <th>geo_insee</th>\n",
" <th>geo_name</th>\n",
" </tr>\n",
" </thead>\n",
" <tbody>\n",
" </tbody>\n",
"</table>\n",
"</div>"
],
"text/plain": [
"Empty DataFrame\n",
"Columns: [week, indicator, inc, inc_low, inc_up, inc100, inc100_low, inc100_up, geo_insee, geo_name]\n",
"Index: []"
]
},
"execution_count": 5,
"metadata": {},
"output_type": "execute_result"
}
],
"source": [
"raw_data[raw_data.isnull().any(axis=1)]"
]
},
{
"cell_type": "code",
"execution_count": null,
"metadata": {},
"outputs": [],
"source": []
},
{
"cell_type": "code",
"execution_count": null,
"metadata": {
"hideCode": true,
"hidePrompt": true
},
"outputs": [],
"source": []
},
{
"cell_type": "code",
"execution_count": 6,
"metadata": {
"hideCode": true,
"hidePrompt": true
},
"outputs": [],
"source": [
"def convert_week(year_and_week_int):\n",
"    \"\"\"Convert a yyyyww week code (e.g. 202018) into a weekly pandas Period.\n",
"\n",
"    The first four digits are read as the year and the remaining digits as\n",
"    the week number of an isoweek.Week; the result is the weekly period\n",
"    that contains day 0 of that week.\n",
"    \"\"\"\n",
"    year_and_week_str = str(year_and_week_int)\n",
"    year = int(year_and_week_str[:4])\n",
"    week = int(year_and_week_str[4:])\n",
"    w = isoweek.Week(year, week)\n",
"    return pd.Period(w.day(0), 'W')\n",
"\n",
"# `data` was never defined (NameError on a fresh kernel): derive it from raw_data.\n",
"# dropna() keeps the analysis robust if a later download contains incomplete rows;\n",
"# copy() leaves raw_data untouched so this cell can be re-run safely.\n",
"data = raw_data.dropna().copy()\n",
"data['period'] = [convert_week(yw) for yw in data['week']]"
]
},
{
"cell_type": "code",
"execution_count": null,
"metadata": {},
"outputs": [],
"source": []
}
],
"metadata": {
"hide_code_all_hidden": true,
"kernelspec": {
"display_name": "Python 3",
"language": "python",
......@@ -16,10 +1161,9 @@
"name": "python",
"nbconvert_exporter": "python",
"pygments_lexer": "ipython3",
"version": "3.6.3"
"version": "3.6.4"
}
},
"nbformat": 4,
"nbformat_minor": 2
}
Markdown is supported
0% or
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or to comment