From 65ea7df155366242393349f9043c4c0414d31fcc Mon Sep 17 00:00:00 2001 From: 67a6b213193a2d0a60e6075e4092ba12 <67a6b213193a2d0a60e6075e4092ba12@app-learninglab.inria.fr> Date: Sun, 7 Jun 2020 13:45:50 +0000 Subject: [PATCH] import du fichier depuis la source --- module3/exo3/Wheat.csv | 54 ++++ module3/exo3/exercice.ipynb | 495 +++++++++++++++++++++++++++++++++++- 2 files changed, 548 insertions(+), 1 deletion(-) create mode 100644 module3/exo3/Wheat.csv diff --git a/module3/exo3/Wheat.csv b/module3/exo3/Wheat.csv new file mode 100644 index 0000000..1a201c3 --- /dev/null +++ b/module3/exo3/Wheat.csv @@ -0,0 +1,54 @@ +"","Year","Wheat","Wages" +"1",1565,41,5 +"2",1570,45,5.05 +"3",1575,42,5.08 +"4",1580,49,5.12 +"5",1585,41.5,5.15 +"6",1590,47,5.25 +"7",1595,64,5.54 +"8",1600,27,5.61 +"9",1605,33,5.69 +"10",1610,32,5.78 +"11",1615,33,5.94 +"12",1620,35,6.01 +"13",1625,33,6.12 +"14",1630,45,6.22 +"15",1635,33,6.3 +"16",1640,39,6.37 +"17",1645,53,6.45 +"18",1650,42,6.5 +"19",1655,40.5,6.6 +"20",1660,46.5,6.75 +"21",1665,32,6.8 +"22",1670,37,6.9 +"23",1675,43,7 +"24",1680,35,7.3 +"25",1685,27,7.6 +"26",1690,40,8 +"27",1695,50,8.5 +"28",1700,30,9 +"29",1705,32,10 +"30",1710,44,11 +"31",1715,33,11.75 +"32",1720,29,12.5 +"33",1725,39,13 +"34",1730,26,13.3 +"35",1735,32,13.6 +"36",1740,27,14 +"37",1745,27.5,14.5 +"38",1750,31,15 +"39",1755,35.5,15.7 +"40",1760,31,16.5 +"41",1765,43,17.6 +"42",1770,47,18.5 +"43",1775,44,19.5 +"44",1780,46,21 +"45",1785,42,23 +"46",1790,47.5,25.5 +"47",1795,76,27.5 +"48",1800,79,28.5 +"49",1805,81,29.5 +"50",1810,99,30 +"51",1815,78,NA +"52",1820,54,NA +"53",1821,54,NA diff --git a/module3/exo3/exercice.ipynb b/module3/exo3/exercice.ipynb index 3f6f1c2..c511576 100644 --- a/module3/exo3/exercice.ipynb +++ b/module3/exo3/exercice.ipynb @@ -9,11 +9,504 @@ "Dans le cadre de cette exercice évalué par les pairs (Mooc RR, mod3) j'ai choisi le sujet n°2 intitulé :\n", "**Le pouvoir d'achat des ouvriers anglais du XVIe au XIXe siècle**\n", "\n", + 
"## Contexte de l'étude\n", + "\n", "William Playfair un des pionnier de la représentation graphique des données, a réalisé un graphique montrant l'évolution du prix du blé et du salaire moyen entre 1565 et 1821. Ce graphique a été publié en 1822 dans son livre *A Letter on our Agricultural Distresses, Their Causes and Remedies*. Ci-dessous une reproduction hébergée sur [Wikipédia][graph original].\n", "\n", "\n", "\n", - "[graph original]:https://fr.wikipedia.org/wiki/William_Playfair#/media/File:Chart_Showing_at_One_View_the_Price_of_the_Quarter_of_Wheat,_and_Wages_of_Labour_by_the_Week,_from_1565_to_1821.png" + "[graph original]:https://fr.wikipedia.org/wiki/William_Playfair#/media/File:Chart_Showing_at_One_View_the_Price_of_the_Quarter_of_Wheat,_and_Wages_of_Labour_by_the_Week,_from_1565_to_1821.png\n", + "\n", + "Le premier objectif de l'étude est de reproduire ce graphe, puis dans un second temps de corriger le graphique. En effet, W. Playfair a utilisé la même unité pour représenter deux quantités différentes sur l'axe des ordonnées. Enfin dans un troisième temps le but sera d'améliorer la représentation du pouvoir d'achat des agriculteurs anglais sur cette période.\n", + "\n", + "## Les données\n", + "\n", + "W. Playfair n'a pas publié les données numériques brutes de son étude. 
Néanmoins une version numérisée est disponible [ici][data_url], réalisée par [Vincent Arel-Bundock] et publiée sur son site [R datasets][vab r datasets].\n", + "\n", + "[data_url]: https://raw.githubusercontent.com/vincentarelbundock/Rdatasets/master/csv/HistData/Wheat.csv\n", + "[Vincent Arel-Bundock]: https://github.com/vincentarelbundock\n", + "[vab r datasets]: https://vincentarelbundock.github.io/Rdatasets/\n" + ] + }, + { + "cell_type": "code", + "execution_count": 2, + "metadata": {}, + "outputs": [ + { + "name": "stdout", + "output_type": "stream", + "text": [ + "Fichier déjà téléchargé\n" + ] + }, + { + "data": { + "text/plain": [ + "['exercice_python_en.org',\n", + " 'exercice_fr.ipynb',\n", + " 'Wheat.csv',\n", + " 'exercice.ipynb',\n", + " 'exercice_fr.Rmd',\n", + " 'playfair_ori_prixble_salaire.png',\n", + " 'exercice_python_fr.org',\n", + " 'exercice_R_en.org',\n", + " 'exercice_R_fr.org',\n", + " 'exercice_en.Rmd',\n", + " 'exercice_en.ipynb',\n", + " '.ipynb_checkpoints']" + ] + }, + "execution_count": 2, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "# import des bibliothèques\n", + "import urllib\n", + "import matplotlib.pyplot as plt\n", + "import pandas as pd\n", + "from os import listdir\n", + "\n", + "# téléchargement du fichier\n", + "data_url = 'https://raw.githubusercontent.com/vincentarelbundock/Rdatasets/master/csv/HistData/Wheat.csv'\n", + "filename = 'Wheat.csv'\n", + "\n", + "curFiles = set(listdir())\n", + "\n", + "# téléchargement automatique du fichier\n", + "# si non présent dans le répertoire\n", + "if not(filename in curFiles):\n", + " print('Téléchargement du fichier')\n", + " urllib.request.urlretrieve(data_url, filename)\n", + "else:\n", + " print('Fichier déjà téléchargé')\n", + "\n", + "listdir()" + ] + }, + { + "cell_type": "code", + "execution_count": 5, + "metadata": {}, + "outputs": [ + { + "data": { + "text/html": [ + "
\n", + " | Year | \n", + "Wheat | \n", + "Wages | \n", + "
---|---|---|---|
1 | \n", + "1565 | \n", + "41.0 | \n", + "5.00 | \n", + "
2 | \n", + "1570 | \n", + "45.0 | \n", + "5.05 | \n", + "
3 | \n", + "1575 | \n", + "42.0 | \n", + "5.08 | \n", + "
4 | \n", + "1580 | \n", + "49.0 | \n", + "5.12 | \n", + "
5 | \n", + "1585 | \n", + "41.5 | \n", + "5.15 | \n", + "
6 | \n", + "1590 | \n", + "47.0 | \n", + "5.25 | \n", + "
7 | \n", + "1595 | \n", + "64.0 | \n", + "5.54 | \n", + "
8 | \n", + "1600 | \n", + "27.0 | \n", + "5.61 | \n", + "
9 | \n", + "1605 | \n", + "33.0 | \n", + "5.69 | \n", + "
10 | \n", + "1610 | \n", + "32.0 | \n", + "5.78 | \n", + "
11 | \n", + "1615 | \n", + "33.0 | \n", + "5.94 | \n", + "
12 | \n", + "1620 | \n", + "35.0 | \n", + "6.01 | \n", + "
13 | \n", + "1625 | \n", + "33.0 | \n", + "6.12 | \n", + "
14 | \n", + "1630 | \n", + "45.0 | \n", + "6.22 | \n", + "
15 | \n", + "1635 | \n", + "33.0 | \n", + "6.30 | \n", + "
16 | \n", + "1640 | \n", + "39.0 | \n", + "6.37 | \n", + "
17 | \n", + "1645 | \n", + "53.0 | \n", + "6.45 | \n", + "
18 | \n", + "1650 | \n", + "42.0 | \n", + "6.50 | \n", + "
19 | \n", + "1655 | \n", + "40.5 | \n", + "6.60 | \n", + "
20 | \n", + "1660 | \n", + "46.5 | \n", + "6.75 | \n", + "
21 | \n", + "1665 | \n", + "32.0 | \n", + "6.80 | \n", + "
22 | \n", + "1670 | \n", + "37.0 | \n", + "6.90 | \n", + "
23 | \n", + "1675 | \n", + "43.0 | \n", + "7.00 | \n", + "
24 | \n", + "1680 | \n", + "35.0 | \n", + "7.30 | \n", + "
25 | \n", + "1685 | \n", + "27.0 | \n", + "7.60 | \n", + "
26 | \n", + "1690 | \n", + "40.0 | \n", + "8.00 | \n", + "
27 | \n", + "1695 | \n", + "50.0 | \n", + "8.50 | \n", + "
28 | \n", + "1700 | \n", + "30.0 | \n", + "9.00 | \n", + "
29 | \n", + "1705 | \n", + "32.0 | \n", + "10.00 | \n", + "
30 | \n", + "1710 | \n", + "44.0 | \n", + "11.00 | \n", + "
31 | \n", + "1715 | \n", + "33.0 | \n", + "11.75 | \n", + "
32 | \n", + "1720 | \n", + "29.0 | \n", + "12.50 | \n", + "
33 | \n", + "1725 | \n", + "39.0 | \n", + "13.00 | \n", + "
34 | \n", + "1730 | \n", + "26.0 | \n", + "13.30 | \n", + "
35 | \n", + "1735 | \n", + "32.0 | \n", + "13.60 | \n", + "
36 | \n", + "1740 | \n", + "27.0 | \n", + "14.00 | \n", + "
37 | \n", + "1745 | \n", + "27.5 | \n", + "14.50 | \n", + "
38 | \n", + "1750 | \n", + "31.0 | \n", + "15.00 | \n", + "
39 | \n", + "1755 | \n", + "35.5 | \n", + "15.70 | \n", + "
40 | \n", + "1760 | \n", + "31.0 | \n", + "16.50 | \n", + "
41 | \n", + "1765 | \n", + "43.0 | \n", + "17.60 | \n", + "
42 | \n", + "1770 | \n", + "47.0 | \n", + "18.50 | \n", + "
43 | \n", + "1775 | \n", + "44.0 | \n", + "19.50 | \n", + "
44 | \n", + "1780 | \n", + "46.0 | \n", + "21.00 | \n", + "
45 | \n", + "1785 | \n", + "42.0 | \n", + "23.00 | \n", + "
46 | \n", + "1790 | \n", + "47.5 | \n", + "25.50 | \n", + "
47 | \n", + "1795 | \n", + "76.0 | \n", + "27.50 | \n", + "
48 | \n", + "1800 | \n", + "79.0 | \n", + "28.50 | \n", + "
49 | \n", + "1805 | \n", + "81.0 | \n", + "29.50 | \n", + "
50 | \n", + "1810 | \n", + "99.0 | \n", + "30.00 | \n", + "
51 | \n", + "1815 | \n", + "78.0 | \n", + "NaN | \n", + "
52 | \n", + "1820 | \n", + "54.0 | \n", + "NaN | \n", + "
53 | \n", + "1821 | \n", + "54.0 | \n", + "NaN | \n", + "