#+TITLE: Module 3 - exercice 2
#+AUTHOR: Votre nom
#+DATE: La date du jour
#+LANGUAGE: fr
# #+PROPERTY: header-args :eval never-export
#+HTML_HEAD:
#+HTML_HEAD:
#+HTML_HEAD:
#+HTML_HEAD:
#+HTML_HEAD:
#+HTML_HEAD:
* Import des données, vérification, préparation
** Import et vérification rapide
Les données au format CSV sont téléchargées depuis l'adresse ci-dessous, sauf si une copie locale du fichier existe déjà :
http://www.sentiweb.fr/datasets/incidence-PAY-7.csv
#+begin_src python :results output :session :exports both
from urllib.request import urlretrieve
import os
# Reuse a previously downloaded copy when one exists, so that re-running the
# document does not fetch the file again; otherwise download it once.
if os.path.isfile("incidence-PAY-7.csv"):
    print("Chargement du fichier local")
else:
    urlretrieve("http://www.sentiweb.fr/datasets/incidence-PAY-7.csv", "incidence-PAY-7.csv")

# Read the whole file as ISO-8859-1 text. The context manager closes the
# file handle as soon as the content has been read.
with open("incidence-PAY-7.csv", encoding="iso-8859-1") as csv_file:
    data = csv_file.read()

lines = data.strip().split('\n')
# The very first line of the file is dropped; what remains begins with the
# row of column titles, followed by the data rows.
data_lines = lines[1:]
# Plain comma split: every row becomes a list of strings (no type conversion,
# no handling of quoted fields).
table = [line.split(',') for line in data_lines]
#+end_src
#+RESULTS:
: Chargement du fichier local
Vérification visuelle des premières lignes.
#+begin_src python :results value :session :exports both
# Preview the first five entries of `table`; the row of column titles comes
# first, so this shows the header followed by four data rows.
table[:5]
#+end_src
#+RESULTS:
| week | indicator | inc | inc_low | inc_up | inc100 | inc100_low | inc100_up | geo_insee | geo_name |
| 202016 | 7 | 803 | 83 | 1523 | 1 | 0 | 2 | FR | France |
| 202015 | 7 | 1918 | 675 | 3161 | 3 | 1 | 5 | FR | France |
| 202014 | 7 | 3879 | 2227 | 5531 | 6 | 3 | 9 | FR | France |
| 202013 | 7 | 7326 | 5236 | 9416 | 11 | 8 | 14 | FR | France |
** Extraction des colonnes utilisées
#+begin_src python :results output :session :exports both
# Keep only the two columns used afterwards: column 0 (`week`) and column 2
# (`inc`). The first cell of each column is its title; it is checked against
# the expected name and then discarded.
week = [record[0] for record in table]
assert week[0] == 'week'
week = week[1:]
inc = [record[2] for record in table]
assert inc[0] == 'inc'
inc = inc[1:]
# Pair each week with the `inc` value from the same row, in file order.
# Values are still strings at this point.
data = [(w, i) for w, i in zip(week, inc)]
#+end_src
#+RESULTS:
Vérification visuelle des premières et dernières lignes.
#+begin_src python :results value :session :exports both
# Show the first five and last five (week, inc) pairs under a title row.
# Each None entry appears as a horizontal rule in the Org results table.
[('week', 'inc'), None] + data[:5] + [None] + data[-5:]
#+end_src
#+RESULTS:
| week | inc |
|--------+-------|
| 202016 | 803 |
| 202015 | 1918 |
| 202014 | 3879 |
| 202013 | 7326 |
| 202012 | 8123 |
|--------+-------|
| 199101 | 15565 |
| 199052 | 19375 |
| 199051 | 19080 |
| 199050 | 11079 |
| 199049 | 1143 |
** Conversion des dates