From 65ea7df155366242393349f9043c4c0414d31fcc Mon Sep 17 00:00:00 2001 From: 67a6b213193a2d0a60e6075e4092ba12 <67a6b213193a2d0a60e6075e4092ba12@app-learninglab.inria.fr> Date: Sun, 7 Jun 2020 13:45:50 +0000 Subject: [PATCH] import du fichier depuis la source --- module3/exo3/Wheat.csv | 54 ++++ module3/exo3/exercice.ipynb | 495 +++++++++++++++++++++++++++++++++++- 2 files changed, 548 insertions(+), 1 deletion(-) create mode 100644 module3/exo3/Wheat.csv diff --git a/module3/exo3/Wheat.csv b/module3/exo3/Wheat.csv new file mode 100644 index 0000000..1a201c3 --- /dev/null +++ b/module3/exo3/Wheat.csv @@ -0,0 +1,54 @@ +"","Year","Wheat","Wages" +"1",1565,41,5 +"2",1570,45,5.05 +"3",1575,42,5.08 +"4",1580,49,5.12 +"5",1585,41.5,5.15 +"6",1590,47,5.25 +"7",1595,64,5.54 +"8",1600,27,5.61 +"9",1605,33,5.69 +"10",1610,32,5.78 +"11",1615,33,5.94 +"12",1620,35,6.01 +"13",1625,33,6.12 +"14",1630,45,6.22 +"15",1635,33,6.3 +"16",1640,39,6.37 +"17",1645,53,6.45 +"18",1650,42,6.5 +"19",1655,40.5,6.6 +"20",1660,46.5,6.75 +"21",1665,32,6.8 +"22",1670,37,6.9 +"23",1675,43,7 +"24",1680,35,7.3 +"25",1685,27,7.6 +"26",1690,40,8 +"27",1695,50,8.5 +"28",1700,30,9 +"29",1705,32,10 +"30",1710,44,11 +"31",1715,33,11.75 +"32",1720,29,12.5 +"33",1725,39,13 +"34",1730,26,13.3 +"35",1735,32,13.6 +"36",1740,27,14 +"37",1745,27.5,14.5 +"38",1750,31,15 +"39",1755,35.5,15.7 +"40",1760,31,16.5 +"41",1765,43,17.6 +"42",1770,47,18.5 +"43",1775,44,19.5 +"44",1780,46,21 +"45",1785,42,23 +"46",1790,47.5,25.5 +"47",1795,76,27.5 +"48",1800,79,28.5 +"49",1805,81,29.5 +"50",1810,99,30 +"51",1815,78,NA +"52",1820,54,NA +"53",1821,54,NA diff --git a/module3/exo3/exercice.ipynb b/module3/exo3/exercice.ipynb index 3f6f1c2..c511576 100644 --- a/module3/exo3/exercice.ipynb +++ b/module3/exo3/exercice.ipynb @@ -9,11 +9,504 @@ "Dans le cadre de cette exercice évalué par les pairs (Mooc RR, mod3) j'ai choisi le sujet n°2 intitulé :\n", "**Le pouvoir d'achat des ouvriers anglais du XVIe au XIXe siècle**\n", "\n", + 
"## Contexte de l'étude\n", + "\n", + "William Playfair, un des pionniers de la représentation graphique des données, a réalisé un graphique montrant l'évolution du prix du blé et du salaire moyen entre 1565 et 1821. Ce graphique a été publié en 1822 dans son livre *A Letter on our Agricultural Distresses, Their Causes and Remedies*. Ci-dessous une reproduction hébergée sur [Wikipédia][graph original].\n", "\n", "![Chart Showing at One View the Price of the Quarter of Wheat, and Wages of Labour by the Week, from 1565 to 1821](playfair_ori_prixble_salaire.png)\n", "\n", - "[graph original]:https://fr.wikipedia.org/wiki/William_Playfair#/media/File:Chart_Showing_at_One_View_the_Price_of_the_Quarter_of_Wheat,_and_Wages_of_Labour_by_the_Week,_from_1565_to_1821.png" + "[graph original]:https://fr.wikipedia.org/wiki/William_Playfair#/media/File:Chart_Showing_at_One_View_the_Price_of_the_Quarter_of_Wheat,_and_Wages_of_Labour_by_the_Week,_from_1565_to_1821.png\n", + "\n", + "Le premier objectif de l'étude est de reproduire ce graphe, puis dans un second temps de corriger le graphique. En effet, W. Playfair a utilisé la même unité pour représenter deux quantités différentes sur l'axe des ordonnées. Enfin, dans un troisième temps, le but sera d'améliorer la représentation du pouvoir d'achat des agriculteurs anglais sur cette période.\n", + "\n", + "## Les données\n", + "\n", + "W. Playfair n'a pas publié les données numériques brutes de son étude. 
Néanmoins une version numérisée est disponible [ici][data_url], réalisée par [Vincent Arel-Bundock] et publiée sur son site [R datasets][vab r datasets].\n", + "\n", + "[data_url]: https://raw.githubusercontent.com/vincentarelbundock/Rdatasets/master/csv/HistData/Wheat.csv\n", + "[Vincent Arel-Bundock]: https://github.com/vincentarelbundock\n", + "[vab r datasets]: https://vincentarelbundock.github.io/Rdatasets/\n" + ] + }, + { + "cell_type": "code", + "execution_count": 2, + "metadata": {}, + "outputs": [ + { + "name": "stdout", + "output_type": "stream", + "text": [ + "Fichier déjà téléchargé\n" + ] + }, + { + "data": { + "text/plain": [ + "['exercice_python_en.org',\n", + " 'exercice_fr.ipynb',\n", + " 'Wheat.csv',\n", + " 'exercice.ipynb',\n", + " 'exercice_fr.Rmd',\n", + " 'playfair_ori_prixble_salaire.png',\n", + " 'exercice_python_fr.org',\n", + " 'exercice_R_en.org',\n", + " 'exercice_R_fr.org',\n", + " 'exercice_en.Rmd',\n", + " 'exercice_en.ipynb',\n", + " '.ipynb_checkpoints']" + ] + }, + "execution_count": 2, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "# import des bibliothèques\n", + "import urllib\n", + "import matplotlib.pyplot as plt\n", + "import pandas as pd\n", + "from os import listdir\n", + "\n", + "# téléchargement du fichier\n", + "data_url = 'https://raw.githubusercontent.com/vincentarelbundock/Rdatasets/master/csv/HistData/Wheat.csv'\n", + "filename = 'Wheat.csv'\n", + "\n", + "curFiles = set(listdir())\n", + "\n", + "# téléchargement automatique du fichier\n", + "# si non présent dans le répertoire\n", + "if not(filename in curFiles):\n", + " print('Téléchargement du fichier')\n", + " urllib.request.urlretrieve(data_url, filename)\n", + "else:\n", + " print('Fichier déjà téléchargé')\n", + "\n", + "listdir()" + ] + }, + { + "cell_type": "code", + "execution_count": 5, + "metadata": {}, + "outputs": [ + { + "data": { + "text/html": [ + "
\n", + "\n", + "\n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " 
\n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + "
YearWheatWages
1156541.05.00
2157045.05.05
3157542.05.08
4158049.05.12
5158541.55.15
6159047.05.25
7159564.05.54
8160027.05.61
9160533.05.69
10161032.05.78
11161533.05.94
12162035.06.01
13162533.06.12
14163045.06.22
15163533.06.30
16164039.06.37
17164553.06.45
18165042.06.50
19165540.56.60
20166046.56.75
21166532.06.80
22167037.06.90
23167543.07.00
24168035.07.30
25168527.07.60
26169040.08.00
27169550.08.50
28170030.09.00
29170532.010.00
30171044.011.00
31171533.011.75
32172029.012.50
33172539.013.00
34173026.013.30
35173532.013.60
36174027.014.00
37174527.514.50
38175031.015.00
39175535.515.70
40176031.016.50
41176543.017.60
42177047.018.50
43177544.019.50
44178046.021.00
45178542.023.00
46179047.525.50
47179576.027.50
48180079.028.50
49180581.029.50
50181099.030.00
51181578.0NaN
52182054.0NaN
53182154.0NaN
\n", + "
" + ], + "text/plain": [ + " Year Wheat Wages\n", + "1 1565 41.0 5.00\n", + "2 1570 45.0 5.05\n", + "3 1575 42.0 5.08\n", + "4 1580 49.0 5.12\n", + "5 1585 41.5 5.15\n", + "6 1590 47.0 5.25\n", + "7 1595 64.0 5.54\n", + "8 1600 27.0 5.61\n", + "9 1605 33.0 5.69\n", + "10 1610 32.0 5.78\n", + "11 1615 33.0 5.94\n", + "12 1620 35.0 6.01\n", + "13 1625 33.0 6.12\n", + "14 1630 45.0 6.22\n", + "15 1635 33.0 6.30\n", + "16 1640 39.0 6.37\n", + "17 1645 53.0 6.45\n", + "18 1650 42.0 6.50\n", + "19 1655 40.5 6.60\n", + "20 1660 46.5 6.75\n", + "21 1665 32.0 6.80\n", + "22 1670 37.0 6.90\n", + "23 1675 43.0 7.00\n", + "24 1680 35.0 7.30\n", + "25 1685 27.0 7.60\n", + "26 1690 40.0 8.00\n", + "27 1695 50.0 8.50\n", + "28 1700 30.0 9.00\n", + "29 1705 32.0 10.00\n", + "30 1710 44.0 11.00\n", + "31 1715 33.0 11.75\n", + "32 1720 29.0 12.50\n", + "33 1725 39.0 13.00\n", + "34 1730 26.0 13.30\n", + "35 1735 32.0 13.60\n", + "36 1740 27.0 14.00\n", + "37 1745 27.5 14.50\n", + "38 1750 31.0 15.00\n", + "39 1755 35.5 15.70\n", + "40 1760 31.0 16.50\n", + "41 1765 43.0 17.60\n", + "42 1770 47.0 18.50\n", + "43 1775 44.0 19.50\n", + "44 1780 46.0 21.00\n", + "45 1785 42.0 23.00\n", + "46 1790 47.5 25.50\n", + "47 1795 76.0 27.50\n", + "48 1800 79.0 28.50\n", + "49 1805 81.0 29.50\n", + "50 1810 99.0 30.00\n", + "51 1815 78.0 NaN\n", + "52 1820 54.0 NaN\n", + "53 1821 54.0 NaN" + ] + }, + "execution_count": 5, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "# lecture du fichier\n", + "\n", + "rawdata = pd.read_csv(filename, index_col=0)\n", + "rawdata" ] }, { -- 2.18.1