etape conversion

parent 9ef9c961
...@@ -63,6 +63,1080 @@ ...@@ -63,6 +63,1080 @@
" urllib.request.urlretrieve(data_url, data_file)" " urllib.request.urlretrieve(data_url, data_file)"
] ]
}, },
{
"cell_type": "code",
"execution_count": 21,
"metadata": {},
"outputs": [
{
"data": {
"text/html": [
"<div>\n",
"<style scoped>\n",
" .dataframe tbody tr th:only-of-type {\n",
" vertical-align: middle;\n",
" }\n",
"\n",
" .dataframe tbody tr th {\n",
" vertical-align: top;\n",
" }\n",
"\n",
" .dataframe thead th {\n",
" text-align: right;\n",
" }\n",
"</style>\n",
"<table border=\"1\" class=\"dataframe\">\n",
" <thead>\n",
" <tr style=\"text-align: right;\">\n",
" <th></th>\n",
" <th>week</th>\n",
" <th>indicator</th>\n",
" <th>inc</th>\n",
" <th>inc_low</th>\n",
" <th>inc_up</th>\n",
" <th>inc100</th>\n",
" <th>inc100_low</th>\n",
" <th>inc100_up</th>\n",
" <th>geo_insee</th>\n",
" <th>geo_name</th>\n",
" </tr>\n",
" </thead>\n",
" <tbody>\n",
" <tr>\n",
" <th>0</th>\n",
" <td>202119</td>\n",
" <td>7</td>\n",
" <td>8060</td>\n",
" <td>4941</td>\n",
" <td>11179</td>\n",
" <td>12</td>\n",
" <td>7</td>\n",
" <td>17</td>\n",
" <td>FR</td>\n",
" <td>France</td>\n",
" </tr>\n",
" <tr>\n",
" <th>1</th>\n",
" <td>202118</td>\n",
" <td>7</td>\n",
" <td>3932</td>\n",
" <td>2093</td>\n",
" <td>5771</td>\n",
" <td>6</td>\n",
" <td>3</td>\n",
" <td>9</td>\n",
" <td>FR</td>\n",
" <td>France</td>\n",
" </tr>\n",
" <tr>\n",
" <th>2</th>\n",
" <td>202117</td>\n",
" <td>7</td>\n",
" <td>4686</td>\n",
" <td>2878</td>\n",
" <td>6494</td>\n",
" <td>7</td>\n",
" <td>4</td>\n",
" <td>10</td>\n",
" <td>FR</td>\n",
" <td>France</td>\n",
" </tr>\n",
" <tr>\n",
" <th>3</th>\n",
" <td>202116</td>\n",
" <td>7</td>\n",
" <td>4780</td>\n",
" <td>2891</td>\n",
" <td>6669</td>\n",
" <td>7</td>\n",
" <td>4</td>\n",
" <td>10</td>\n",
" <td>FR</td>\n",
" <td>France</td>\n",
" </tr>\n",
" <tr>\n",
" <th>4</th>\n",
" <td>202115</td>\n",
" <td>7</td>\n",
" <td>11215</td>\n",
" <td>7627</td>\n",
" <td>14803</td>\n",
" <td>17</td>\n",
" <td>12</td>\n",
" <td>22</td>\n",
" <td>FR</td>\n",
" <td>France</td>\n",
" </tr>\n",
" <tr>\n",
" <th>5</th>\n",
" <td>202114</td>\n",
" <td>7</td>\n",
" <td>11197</td>\n",
" <td>7994</td>\n",
" <td>14400</td>\n",
" <td>17</td>\n",
" <td>12</td>\n",
" <td>22</td>\n",
" <td>FR</td>\n",
" <td>France</td>\n",
" </tr>\n",
" <tr>\n",
" <th>6</th>\n",
" <td>202113</td>\n",
" <td>7</td>\n",
" <td>9714</td>\n",
" <td>6289</td>\n",
" <td>13139</td>\n",
" <td>15</td>\n",
" <td>10</td>\n",
" <td>20</td>\n",
" <td>FR</td>\n",
" <td>France</td>\n",
" </tr>\n",
" <tr>\n",
" <th>7</th>\n",
" <td>202112</td>\n",
" <td>7</td>\n",
" <td>11520</td>\n",
" <td>8415</td>\n",
" <td>14625</td>\n",
" <td>17</td>\n",
" <td>12</td>\n",
" <td>22</td>\n",
" <td>FR</td>\n",
" <td>France</td>\n",
" </tr>\n",
" <tr>\n",
" <th>8</th>\n",
" <td>202111</td>\n",
" <td>7</td>\n",
" <td>9386</td>\n",
" <td>6678</td>\n",
" <td>12094</td>\n",
" <td>14</td>\n",
" <td>10</td>\n",
" <td>18</td>\n",
" <td>FR</td>\n",
" <td>France</td>\n",
" </tr>\n",
" <tr>\n",
" <th>9</th>\n",
" <td>202110</td>\n",
" <td>7</td>\n",
" <td>9056</td>\n",
" <td>6452</td>\n",
" <td>11660</td>\n",
" <td>14</td>\n",
" <td>10</td>\n",
" <td>18</td>\n",
" <td>FR</td>\n",
" <td>France</td>\n",
" </tr>\n",
" <tr>\n",
" <th>10</th>\n",
" <td>202109</td>\n",
" <td>7</td>\n",
" <td>10988</td>\n",
" <td>7938</td>\n",
" <td>14038</td>\n",
" <td>17</td>\n",
" <td>12</td>\n",
" <td>22</td>\n",
" <td>FR</td>\n",
" <td>France</td>\n",
" </tr>\n",
" <tr>\n",
" <th>11</th>\n",
" <td>202108</td>\n",
" <td>7</td>\n",
" <td>11281</td>\n",
" <td>8361</td>\n",
" <td>14201</td>\n",
" <td>17</td>\n",
" <td>13</td>\n",
" <td>21</td>\n",
" <td>FR</td>\n",
" <td>France</td>\n",
" </tr>\n",
" <tr>\n",
" <th>12</th>\n",
" <td>202107</td>\n",
" <td>7</td>\n",
" <td>13561</td>\n",
" <td>10315</td>\n",
" <td>16807</td>\n",
" <td>21</td>\n",
" <td>16</td>\n",
" <td>26</td>\n",
" <td>FR</td>\n",
" <td>France</td>\n",
" </tr>\n",
" <tr>\n",
" <th>13</th>\n",
" <td>202106</td>\n",
" <td>7</td>\n",
" <td>13401</td>\n",
" <td>9810</td>\n",
" <td>16992</td>\n",
" <td>20</td>\n",
" <td>15</td>\n",
" <td>25</td>\n",
" <td>FR</td>\n",
" <td>France</td>\n",
" </tr>\n",
" <tr>\n",
" <th>14</th>\n",
" <td>202105</td>\n",
" <td>7</td>\n",
" <td>12210</td>\n",
" <td>8988</td>\n",
" <td>15432</td>\n",
" <td>18</td>\n",
" <td>13</td>\n",
" <td>23</td>\n",
" <td>FR</td>\n",
" <td>France</td>\n",
" </tr>\n",
" <tr>\n",
" <th>15</th>\n",
" <td>202104</td>\n",
" <td>7</td>\n",
" <td>12026</td>\n",
" <td>8826</td>\n",
" <td>15226</td>\n",
" <td>18</td>\n",
" <td>13</td>\n",
" <td>23</td>\n",
" <td>FR</td>\n",
" <td>France</td>\n",
" </tr>\n",
" <tr>\n",
" <th>16</th>\n",
" <td>202103</td>\n",
" <td>7</td>\n",
" <td>8913</td>\n",
" <td>6375</td>\n",
" <td>11451</td>\n",
" <td>13</td>\n",
" <td>9</td>\n",
" <td>17</td>\n",
" <td>FR</td>\n",
" <td>France</td>\n",
" </tr>\n",
" <tr>\n",
" <th>17</th>\n",
" <td>202102</td>\n",
" <td>7</td>\n",
" <td>7795</td>\n",
" <td>5430</td>\n",
" <td>10160</td>\n",
" <td>12</td>\n",
" <td>8</td>\n",
" <td>16</td>\n",
" <td>FR</td>\n",
" <td>France</td>\n",
" </tr>\n",
" <tr>\n",
" <th>18</th>\n",
" <td>202101</td>\n",
" <td>7</td>\n",
" <td>10525</td>\n",
" <td>7750</td>\n",
" <td>13300</td>\n",
" <td>16</td>\n",
" <td>12</td>\n",
" <td>20</td>\n",
" <td>FR</td>\n",
" <td>France</td>\n",
" </tr>\n",
" <tr>\n",
" <th>19</th>\n",
" <td>202053</td>\n",
" <td>7</td>\n",
" <td>11978</td>\n",
" <td>8406</td>\n",
" <td>15550</td>\n",
" <td>18</td>\n",
" <td>13</td>\n",
" <td>23</td>\n",
" <td>FR</td>\n",
" <td>France</td>\n",
" </tr>\n",
" <tr>\n",
" <th>20</th>\n",
" <td>202052</td>\n",
" <td>7</td>\n",
" <td>12012</td>\n",
" <td>8285</td>\n",
" <td>15739</td>\n",
" <td>18</td>\n",
" <td>12</td>\n",
" <td>24</td>\n",
" <td>FR</td>\n",
" <td>France</td>\n",
" </tr>\n",
" <tr>\n",
" <th>21</th>\n",
" <td>202051</td>\n",
" <td>7</td>\n",
" <td>10564</td>\n",
" <td>7574</td>\n",
" <td>13554</td>\n",
" <td>16</td>\n",
" <td>11</td>\n",
" <td>21</td>\n",
" <td>FR</td>\n",
" <td>France</td>\n",
" </tr>\n",
" <tr>\n",
" <th>22</th>\n",
" <td>202050</td>\n",
" <td>7</td>\n",
" <td>7063</td>\n",
" <td>4744</td>\n",
" <td>9382</td>\n",
" <td>11</td>\n",
" <td>7</td>\n",
" <td>15</td>\n",
" <td>FR</td>\n",
" <td>France</td>\n",
" </tr>\n",
" <tr>\n",
" <th>23</th>\n",
" <td>202049</td>\n",
" <td>7</td>\n",
" <td>5026</td>\n",
" <td>3145</td>\n",
" <td>6907</td>\n",
" <td>8</td>\n",
" <td>5</td>\n",
" <td>11</td>\n",
" <td>FR</td>\n",
" <td>France</td>\n",
" </tr>\n",
" <tr>\n",
" <th>24</th>\n",
" <td>202048</td>\n",
" <td>7</td>\n",
" <td>6683</td>\n",
" <td>4312</td>\n",
" <td>9054</td>\n",
" <td>10</td>\n",
" <td>6</td>\n",
" <td>14</td>\n",
" <td>FR</td>\n",
" <td>France</td>\n",
" </tr>\n",
" <tr>\n",
" <th>25</th>\n",
" <td>202047</td>\n",
" <td>7</td>\n",
" <td>4999</td>\n",
" <td>2963</td>\n",
" <td>7035</td>\n",
" <td>8</td>\n",
" <td>5</td>\n",
" <td>11</td>\n",
" <td>FR</td>\n",
" <td>France</td>\n",
" </tr>\n",
" <tr>\n",
" <th>26</th>\n",
" <td>202046</td>\n",
" <td>7</td>\n",
" <td>3752</td>\n",
" <td>1963</td>\n",
" <td>5541</td>\n",
" <td>6</td>\n",
" <td>3</td>\n",
" <td>9</td>\n",
" <td>FR</td>\n",
" <td>France</td>\n",
" </tr>\n",
" <tr>\n",
" <th>27</th>\n",
" <td>202045</td>\n",
" <td>7</td>\n",
" <td>3696</td>\n",
" <td>2016</td>\n",
" <td>5376</td>\n",
" <td>6</td>\n",
" <td>3</td>\n",
" <td>9</td>\n",
" <td>FR</td>\n",
" <td>France</td>\n",
" </tr>\n",
" <tr>\n",
" <th>28</th>\n",
" <td>202044</td>\n",
" <td>7</td>\n",
" <td>4391</td>\n",
" <td>2375</td>\n",
" <td>6407</td>\n",
" <td>7</td>\n",
" <td>4</td>\n",
" <td>10</td>\n",
" <td>FR</td>\n",
" <td>France</td>\n",
" </tr>\n",
" <tr>\n",
" <th>29</th>\n",
" <td>202043</td>\n",
" <td>7</td>\n",
" <td>4376</td>\n",
" <td>2505</td>\n",
" <td>6247</td>\n",
" <td>7</td>\n",
" <td>4</td>\n",
" <td>10</td>\n",
" <td>FR</td>\n",
" <td>France</td>\n",
" </tr>\n",
" <tr>\n",
" <th>...</th>\n",
" <td>...</td>\n",
" <td>...</td>\n",
" <td>...</td>\n",
" <td>...</td>\n",
" <td>...</td>\n",
" <td>...</td>\n",
" <td>...</td>\n",
" <td>...</td>\n",
" <td>...</td>\n",
" <td>...</td>\n",
" </tr>\n",
" <tr>\n",
" <th>1559</th>\n",
" <td>199126</td>\n",
" <td>7</td>\n",
" <td>17608</td>\n",
" <td>11304</td>\n",
" <td>23912</td>\n",
" <td>31</td>\n",
" <td>20</td>\n",
" <td>42</td>\n",
" <td>FR</td>\n",
" <td>France</td>\n",
" </tr>\n",
" <tr>\n",
" <th>1560</th>\n",
" <td>199125</td>\n",
" <td>7</td>\n",
" <td>16169</td>\n",
" <td>10700</td>\n",
" <td>21638</td>\n",
" <td>28</td>\n",
" <td>18</td>\n",
" <td>38</td>\n",
" <td>FR</td>\n",
" <td>France</td>\n",
" </tr>\n",
" <tr>\n",
" <th>1561</th>\n",
" <td>199124</td>\n",
" <td>7</td>\n",
" <td>16171</td>\n",
" <td>10071</td>\n",
" <td>22271</td>\n",
" <td>28</td>\n",
" <td>17</td>\n",
" <td>39</td>\n",
" <td>FR</td>\n",
" <td>France</td>\n",
" </tr>\n",
" <tr>\n",
" <th>1562</th>\n",
" <td>199123</td>\n",
" <td>7</td>\n",
" <td>11947</td>\n",
" <td>7671</td>\n",
" <td>16223</td>\n",
" <td>21</td>\n",
" <td>13</td>\n",
" <td>29</td>\n",
" <td>FR</td>\n",
" <td>France</td>\n",
" </tr>\n",
" <tr>\n",
" <th>1563</th>\n",
" <td>199122</td>\n",
" <td>7</td>\n",
" <td>15452</td>\n",
" <td>9953</td>\n",
" <td>20951</td>\n",
" <td>27</td>\n",
" <td>17</td>\n",
" <td>37</td>\n",
" <td>FR</td>\n",
" <td>France</td>\n",
" </tr>\n",
" <tr>\n",
" <th>1564</th>\n",
" <td>199121</td>\n",
" <td>7</td>\n",
" <td>14903</td>\n",
" <td>8975</td>\n",
" <td>20831</td>\n",
" <td>26</td>\n",
" <td>16</td>\n",
" <td>36</td>\n",
" <td>FR</td>\n",
" <td>France</td>\n",
" </tr>\n",
" <tr>\n",
" <th>1565</th>\n",
" <td>199120</td>\n",
" <td>7</td>\n",
" <td>19053</td>\n",
" <td>12742</td>\n",
" <td>25364</td>\n",
" <td>34</td>\n",
" <td>23</td>\n",
" <td>45</td>\n",
" <td>FR</td>\n",
" <td>France</td>\n",
" </tr>\n",
" <tr>\n",
" <th>1566</th>\n",
" <td>199119</td>\n",
" <td>7</td>\n",
" <td>16739</td>\n",
" <td>11246</td>\n",
" <td>22232</td>\n",
" <td>29</td>\n",
" <td>19</td>\n",
" <td>39</td>\n",
" <td>FR</td>\n",
" <td>France</td>\n",
" </tr>\n",
" <tr>\n",
" <th>1567</th>\n",
" <td>199118</td>\n",
" <td>7</td>\n",
" <td>21385</td>\n",
" <td>13882</td>\n",
" <td>28888</td>\n",
" <td>38</td>\n",
" <td>25</td>\n",
" <td>51</td>\n",
" <td>FR</td>\n",
" <td>France</td>\n",
" </tr>\n",
" <tr>\n",
" <th>1568</th>\n",
" <td>199117</td>\n",
" <td>7</td>\n",
" <td>13462</td>\n",
" <td>8877</td>\n",
" <td>18047</td>\n",
" <td>24</td>\n",
" <td>16</td>\n",
" <td>32</td>\n",
" <td>FR</td>\n",
" <td>France</td>\n",
" </tr>\n",
" <tr>\n",
" <th>1569</th>\n",
" <td>199116</td>\n",
" <td>7</td>\n",
" <td>14857</td>\n",
" <td>10068</td>\n",
" <td>19646</td>\n",
" <td>26</td>\n",
" <td>18</td>\n",
" <td>34</td>\n",
" <td>FR</td>\n",
" <td>France</td>\n",
" </tr>\n",
" <tr>\n",
" <th>1570</th>\n",
" <td>199115</td>\n",
" <td>7</td>\n",
" <td>13975</td>\n",
" <td>9781</td>\n",
" <td>18169</td>\n",
" <td>25</td>\n",
" <td>18</td>\n",
" <td>32</td>\n",
" <td>FR</td>\n",
" <td>France</td>\n",
" </tr>\n",
" <tr>\n",
" <th>1571</th>\n",
" <td>199114</td>\n",
" <td>7</td>\n",
" <td>12265</td>\n",
" <td>7684</td>\n",
" <td>16846</td>\n",
" <td>22</td>\n",
" <td>14</td>\n",
" <td>30</td>\n",
" <td>FR</td>\n",
" <td>France</td>\n",
" </tr>\n",
" <tr>\n",
" <th>1572</th>\n",
" <td>199113</td>\n",
" <td>7</td>\n",
" <td>9567</td>\n",
" <td>6041</td>\n",
" <td>13093</td>\n",
" <td>17</td>\n",
" <td>11</td>\n",
" <td>23</td>\n",
" <td>FR</td>\n",
" <td>France</td>\n",
" </tr>\n",
" <tr>\n",
" <th>1573</th>\n",
" <td>199112</td>\n",
" <td>7</td>\n",
" <td>10864</td>\n",
" <td>7331</td>\n",
" <td>14397</td>\n",
" <td>19</td>\n",
" <td>13</td>\n",
" <td>25</td>\n",
" <td>FR</td>\n",
" <td>France</td>\n",
" </tr>\n",
" <tr>\n",
" <th>1574</th>\n",
" <td>199111</td>\n",
" <td>7</td>\n",
" <td>15574</td>\n",
" <td>11184</td>\n",
" <td>19964</td>\n",
" <td>27</td>\n",
" <td>19</td>\n",
" <td>35</td>\n",
" <td>FR</td>\n",
" <td>France</td>\n",
" </tr>\n",
" <tr>\n",
" <th>1575</th>\n",
" <td>199110</td>\n",
" <td>7</td>\n",
" <td>16643</td>\n",
" <td>11372</td>\n",
" <td>21914</td>\n",
" <td>29</td>\n",
" <td>20</td>\n",
" <td>38</td>\n",
" <td>FR</td>\n",
" <td>France</td>\n",
" </tr>\n",
" <tr>\n",
" <th>1576</th>\n",
" <td>199109</td>\n",
" <td>7</td>\n",
" <td>13741</td>\n",
" <td>8780</td>\n",
" <td>18702</td>\n",
" <td>24</td>\n",
" <td>15</td>\n",
" <td>33</td>\n",
" <td>FR</td>\n",
" <td>France</td>\n",
" </tr>\n",
" <tr>\n",
" <th>1577</th>\n",
" <td>199108</td>\n",
" <td>7</td>\n",
" <td>13289</td>\n",
" <td>8813</td>\n",
" <td>17765</td>\n",
" <td>23</td>\n",
" <td>15</td>\n",
" <td>31</td>\n",
" <td>FR</td>\n",
" <td>France</td>\n",
" </tr>\n",
" <tr>\n",
" <th>1578</th>\n",
" <td>199107</td>\n",
" <td>7</td>\n",
" <td>12337</td>\n",
" <td>8077</td>\n",
" <td>16597</td>\n",
" <td>22</td>\n",
" <td>15</td>\n",
" <td>29</td>\n",
" <td>FR</td>\n",
" <td>France</td>\n",
" </tr>\n",
" <tr>\n",
" <th>1579</th>\n",
" <td>199106</td>\n",
" <td>7</td>\n",
" <td>10877</td>\n",
" <td>7013</td>\n",
" <td>14741</td>\n",
" <td>19</td>\n",
" <td>12</td>\n",
" <td>26</td>\n",
" <td>FR</td>\n",
" <td>France</td>\n",
" </tr>\n",
" <tr>\n",
" <th>1580</th>\n",
" <td>199105</td>\n",
" <td>7</td>\n",
" <td>10442</td>\n",
" <td>6544</td>\n",
" <td>14340</td>\n",
" <td>18</td>\n",
" <td>11</td>\n",
" <td>25</td>\n",
" <td>FR</td>\n",
" <td>France</td>\n",
" </tr>\n",
" <tr>\n",
" <th>1581</th>\n",
" <td>199104</td>\n",
" <td>7</td>\n",
" <td>7913</td>\n",
" <td>4563</td>\n",
" <td>11263</td>\n",
" <td>14</td>\n",
" <td>8</td>\n",
" <td>20</td>\n",
" <td>FR</td>\n",
" <td>France</td>\n",
" </tr>\n",
" <tr>\n",
" <th>1582</th>\n",
" <td>199103</td>\n",
" <td>7</td>\n",
" <td>15387</td>\n",
" <td>10484</td>\n",
" <td>20290</td>\n",
" <td>27</td>\n",
" <td>18</td>\n",
" <td>36</td>\n",
" <td>FR</td>\n",
" <td>France</td>\n",
" </tr>\n",
" <tr>\n",
" <th>1583</th>\n",
" <td>199102</td>\n",
" <td>7</td>\n",
" <td>16277</td>\n",
" <td>11046</td>\n",
" <td>21508</td>\n",
" <td>29</td>\n",
" <td>20</td>\n",
" <td>38</td>\n",
" <td>FR</td>\n",
" <td>France</td>\n",
" </tr>\n",
" <tr>\n",
" <th>1584</th>\n",
" <td>199101</td>\n",
" <td>7</td>\n",
" <td>15565</td>\n",
" <td>10271</td>\n",
" <td>20859</td>\n",
" <td>27</td>\n",
" <td>18</td>\n",
" <td>36</td>\n",
" <td>FR</td>\n",
" <td>France</td>\n",
" </tr>\n",
" <tr>\n",
" <th>1585</th>\n",
" <td>199052</td>\n",
" <td>7</td>\n",
" <td>19375</td>\n",
" <td>13295</td>\n",
" <td>25455</td>\n",
" <td>34</td>\n",
" <td>23</td>\n",
" <td>45</td>\n",
" <td>FR</td>\n",
" <td>France</td>\n",
" </tr>\n",
" <tr>\n",
" <th>1586</th>\n",
" <td>199051</td>\n",
" <td>7</td>\n",
" <td>19080</td>\n",
" <td>13807</td>\n",
" <td>24353</td>\n",
" <td>34</td>\n",
" <td>25</td>\n",
" <td>43</td>\n",
" <td>FR</td>\n",
" <td>France</td>\n",
" </tr>\n",
" <tr>\n",
" <th>1587</th>\n",
" <td>199050</td>\n",
" <td>7</td>\n",
" <td>11079</td>\n",
" <td>6660</td>\n",
" <td>15498</td>\n",
" <td>20</td>\n",
" <td>12</td>\n",
" <td>28</td>\n",
" <td>FR</td>\n",
" <td>France</td>\n",
" </tr>\n",
" <tr>\n",
" <th>1588</th>\n",
" <td>199049</td>\n",
" <td>7</td>\n",
" <td>1143</td>\n",
" <td>0</td>\n",
" <td>2610</td>\n",
" <td>2</td>\n",
" <td>0</td>\n",
" <td>5</td>\n",
" <td>FR</td>\n",
" <td>France</td>\n",
" </tr>\n",
" </tbody>\n",
"</table>\n",
"<p>1589 rows × 10 columns</p>\n",
"</div>"
],
"text/plain": [
" week indicator inc inc_low inc_up inc100 inc100_low \\\n",
"0 202119 7 8060 4941 11179 12 7 \n",
"1 202118 7 3932 2093 5771 6 3 \n",
"2 202117 7 4686 2878 6494 7 4 \n",
"3 202116 7 4780 2891 6669 7 4 \n",
"4 202115 7 11215 7627 14803 17 12 \n",
"5 202114 7 11197 7994 14400 17 12 \n",
"6 202113 7 9714 6289 13139 15 10 \n",
"7 202112 7 11520 8415 14625 17 12 \n",
"8 202111 7 9386 6678 12094 14 10 \n",
"9 202110 7 9056 6452 11660 14 10 \n",
"10 202109 7 10988 7938 14038 17 12 \n",
"11 202108 7 11281 8361 14201 17 13 \n",
"12 202107 7 13561 10315 16807 21 16 \n",
"13 202106 7 13401 9810 16992 20 15 \n",
"14 202105 7 12210 8988 15432 18 13 \n",
"15 202104 7 12026 8826 15226 18 13 \n",
"16 202103 7 8913 6375 11451 13 9 \n",
"17 202102 7 7795 5430 10160 12 8 \n",
"18 202101 7 10525 7750 13300 16 12 \n",
"19 202053 7 11978 8406 15550 18 13 \n",
"20 202052 7 12012 8285 15739 18 12 \n",
"21 202051 7 10564 7574 13554 16 11 \n",
"22 202050 7 7063 4744 9382 11 7 \n",
"23 202049 7 5026 3145 6907 8 5 \n",
"24 202048 7 6683 4312 9054 10 6 \n",
"25 202047 7 4999 2963 7035 8 5 \n",
"26 202046 7 3752 1963 5541 6 3 \n",
"27 202045 7 3696 2016 5376 6 3 \n",
"28 202044 7 4391 2375 6407 7 4 \n",
"29 202043 7 4376 2505 6247 7 4 \n",
"... ... ... ... ... ... ... ... \n",
"1559 199126 7 17608 11304 23912 31 20 \n",
"1560 199125 7 16169 10700 21638 28 18 \n",
"1561 199124 7 16171 10071 22271 28 17 \n",
"1562 199123 7 11947 7671 16223 21 13 \n",
"1563 199122 7 15452 9953 20951 27 17 \n",
"1564 199121 7 14903 8975 20831 26 16 \n",
"1565 199120 7 19053 12742 25364 34 23 \n",
"1566 199119 7 16739 11246 22232 29 19 \n",
"1567 199118 7 21385 13882 28888 38 25 \n",
"1568 199117 7 13462 8877 18047 24 16 \n",
"1569 199116 7 14857 10068 19646 26 18 \n",
"1570 199115 7 13975 9781 18169 25 18 \n",
"1571 199114 7 12265 7684 16846 22 14 \n",
"1572 199113 7 9567 6041 13093 17 11 \n",
"1573 199112 7 10864 7331 14397 19 13 \n",
"1574 199111 7 15574 11184 19964 27 19 \n",
"1575 199110 7 16643 11372 21914 29 20 \n",
"1576 199109 7 13741 8780 18702 24 15 \n",
"1577 199108 7 13289 8813 17765 23 15 \n",
"1578 199107 7 12337 8077 16597 22 15 \n",
"1579 199106 7 10877 7013 14741 19 12 \n",
"1580 199105 7 10442 6544 14340 18 11 \n",
"1581 199104 7 7913 4563 11263 14 8 \n",
"1582 199103 7 15387 10484 20290 27 18 \n",
"1583 199102 7 16277 11046 21508 29 20 \n",
"1584 199101 7 15565 10271 20859 27 18 \n",
"1585 199052 7 19375 13295 25455 34 23 \n",
"1586 199051 7 19080 13807 24353 34 25 \n",
"1587 199050 7 11079 6660 15498 20 12 \n",
"1588 199049 7 1143 0 2610 2 0 \n",
"\n",
" inc100_up geo_insee geo_name \n",
"0 17 FR France \n",
"1 9 FR France \n",
"2 10 FR France \n",
"3 10 FR France \n",
"4 22 FR France \n",
"5 22 FR France \n",
"6 20 FR France \n",
"7 22 FR France \n",
"8 18 FR France \n",
"9 18 FR France \n",
"10 22 FR France \n",
"11 21 FR France \n",
"12 26 FR France \n",
"13 25 FR France \n",
"14 23 FR France \n",
"15 23 FR France \n",
"16 17 FR France \n",
"17 16 FR France \n",
"18 20 FR France \n",
"19 23 FR France \n",
"20 24 FR France \n",
"21 21 FR France \n",
"22 15 FR France \n",
"23 11 FR France \n",
"24 14 FR France \n",
"25 11 FR France \n",
"26 9 FR France \n",
"27 9 FR France \n",
"28 10 FR France \n",
"29 10 FR France \n",
"... ... ... ... \n",
"1559 42 FR France \n",
"1560 38 FR France \n",
"1561 39 FR France \n",
"1562 29 FR France \n",
"1563 37 FR France \n",
"1564 36 FR France \n",
"1565 45 FR France \n",
"1566 39 FR France \n",
"1567 51 FR France \n",
"1568 32 FR France \n",
"1569 34 FR France \n",
"1570 32 FR France \n",
"1571 30 FR France \n",
"1572 23 FR France \n",
"1573 25 FR France \n",
"1574 35 FR France \n",
"1575 38 FR France \n",
"1576 33 FR France \n",
"1577 31 FR France \n",
"1578 29 FR France \n",
"1579 26 FR France \n",
"1580 25 FR France \n",
"1581 20 FR France \n",
"1582 36 FR France \n",
"1583 38 FR France \n",
"1584 36 FR France \n",
"1585 45 FR France \n",
"1586 43 FR France \n",
"1587 28 FR France \n",
"1588 5 FR France \n",
"\n",
"[1589 rows x 10 columns]"
]
},
"execution_count": 21,
"metadata": {},
"output_type": "execute_result"
}
],
"source": [
"# Read the file that the download cell saved under `data_file` instead of\n",
"# repeating its name here, so the two cells cannot drift apart.\n",
"# skiprows=1 drops the first line of the file before parsing\n",
"# (presumably a non-CSV comment line -- TODO confirm against the raw file).\n",
"raw_data = pd.read_csv(data_file, skiprows=1)\n",
"raw_data"
]
},
{
"cell_type": "markdown",
"metadata": {},
"source": [
"Y a-t-il des points manquants dans ce jeu de données ?"
]
},
{
"cell_type": "code",
"execution_count": 22,
"metadata": {},
"outputs": [
{
"data": {
"text/html": [
"<div>\n",
"<style scoped>\n",
" .dataframe tbody tr th:only-of-type {\n",
" vertical-align: middle;\n",
" }\n",
"\n",
" .dataframe tbody tr th {\n",
" vertical-align: top;\n",
" }\n",
"\n",
" .dataframe thead th {\n",
" text-align: right;\n",
" }\n",
"</style>\n",
"<table border=\"1\" class=\"dataframe\">\n",
" <thead>\n",
" <tr style=\"text-align: right;\">\n",
" <th></th>\n",
" <th>week</th>\n",
" <th>indicator</th>\n",
" <th>inc</th>\n",
" <th>inc_low</th>\n",
" <th>inc_up</th>\n",
" <th>inc100</th>\n",
" <th>inc100_low</th>\n",
" <th>inc100_up</th>\n",
" <th>geo_insee</th>\n",
" <th>geo_name</th>\n",
" </tr>\n",
" </thead>\n",
" <tbody>\n",
" </tbody>\n",
"</table>\n",
"</div>"
],
"text/plain": [
"Empty DataFrame\n",
"Columns: [week, indicator, inc, inc_low, inc_up, inc100, inc100_low, inc100_up, geo_insee, geo_name]\n",
"Index: []"
]
},
"execution_count": 22,
"metadata": {},
"output_type": "execute_result"
}
],
"source": [
"# Show only the rows in which at least one column holds a null value.\n",
"raw_data.loc[raw_data.isnull().any(axis=1)]"
]
},
{
"cell_type": "markdown",
"metadata": {},
"source": [
"Pas de points manquants."
]
},
{
"cell_type": "markdown",
"metadata": {},
"source": [
"Nos données utilisent une convention inhabituelle : le numéro de semaine est collé à l'année, donnant l'impression qu'il s'agit d'un nombre entier. C'est comme ça que Pandas les interprète.\n",
"Un deuxième problème est que Pandas ne comprend pas les numéros de semaine. Il faut lui fournir les dates de début et de fin de semaine. Nous utilisons pour cela la bibliothèque isoweek.\n",
"Comme la conversion des semaines est devenue assez complexe, nous écrivons une petite fonction Python pour cela. Ensuite, nous l'appliquons à tous les points de nos données. Les résultats vont dans une nouvelle colonne 'period'."
]
},
{
"cell_type": "code",
"execution_count": 23,
"metadata": {},
"outputs": [],
"source": [
"def convert_week(year_and_week_int):\n",
"    \"\"\"Turn a combined year/week number into a weekly pandas Period.\n",
"\n",
"    The decimal text of `year_and_week_int` is split after its fourth\n",
"    character: the first four characters are read as the year and the\n",
"    remaining ones as the week number (e.g. 202119 -> year 2021, week 19).\n",
"\n",
"    Returns `pd.Period(..., 'W')` built from day 0 of the matching\n",
"    `isoweek.Week`.\n",
"    \"\"\"\n",
"    digits = str(year_and_week_int)\n",
"    iso_week = isoweek.Week(int(digits[:4]), int(digits[4:]))\n",
"    return pd.Period(iso_week.day(0), 'W')\n",
"\n",
"# Convert every entry of the 'week' column and store the results in a new 'period' column.\n",
"raw_data['period'] = list(map(convert_week, raw_data['week']))"
]
},
{ {
"cell_type": "code", "cell_type": "code",
"execution_count": null, "execution_count": null,
......
Markdown is supported
0% or
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or to comment