diff --git a/module3/exo1/analyse-syndrome-grippal.ipynb b/module3/exo1/analyse-syndrome-grippal.ipynb index a25244124844ec2dee19a30d4b8582caa095e282..34da3f78a92faafe1a50a8f662193cad297ddc61 100644 --- a/module3/exo1/analyse-syndrome-grippal.ipynb +++ b/module3/exo1/analyse-syndrome-grippal.ipynb @@ -40,11 +40,16 @@ }, { "cell_type": "code", - "execution_count": 23, + "execution_count": 31, "metadata": {}, "outputs": [], "source": [ - "data_url =\"https://app-learninglab.inria.fr/moocrr/gitlab/ef86fb54ef695a9083dc58696a4f7e7c/mooc-rr/blob/master/module3/exo1/incidence-PAY-3.csv\"" + "data_file = \"incidence-PAY-3.csv\"\n", + "data_url = \"\"\n", + "import os\n", + "import urllib.request\n", + "if not os.path.exists(data_file):\n", + " urllib.request.urlretrieve(data_url, data_file)" ] }, { @@ -71,32 +76,978 @@ }, { "cell_type": "code", - "execution_count": 24, + "execution_count": 32, "metadata": {}, "outputs": [ { - "ename": "ParserError", - "evalue": "Error tokenizing data. C error: Expected 1 fields in line 30, saw 21\n", - "output_type": "error", - "traceback": [ - "\u001b[0;31m---------------------------------------------------------------------------\u001b[0m", - "\u001b[0;31mParserError\u001b[0m Traceback (most recent call last)", - "\u001b[0;32m\u001b[0m in \u001b[0;36m\u001b[0;34m\u001b[0m\n\u001b[0;32m----> 1\u001b[0;31m \u001b[0mraw_data\u001b[0m \u001b[0;34m=\u001b[0m \u001b[0mpd\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0mread_csv\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0mdata_url\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0mskiprows\u001b[0m\u001b[0;34m=\u001b[0m\u001b[0;36m1\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[0m\u001b[1;32m 2\u001b[0m \u001b[0mraw_data\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n", - "\u001b[0;32m/opt/conda/lib/python3.6/site-packages/pandas/io/parsers.py\u001b[0m in \u001b[0;36mparser_f\u001b[0;34m(filepath_or_buffer, sep, delimiter, header, names, index_col, usecols, squeeze, prefix, mangle_dupe_cols, dtype, engine, converters, true_values, false_values, skipinitialspace, skiprows, nrows, na_values, keep_default_na, na_filter, verbose, skip_blank_lines, parse_dates, infer_datetime_format, keep_date_col, date_parser, dayfirst, iterator, chunksize, compression, thousands, decimal, lineterminator, quotechar, quoting, escapechar, comment, encoding, dialect, tupleize_cols, error_bad_lines, warn_bad_lines, skipfooter, skip_footer, doublequote, delim_whitespace, as_recarray, compact_ints, use_unsigned, low_memory, buffer_lines, memory_map, float_precision)\u001b[0m\n\u001b[1;32m 707\u001b[0m skip_blank_lines=skip_blank_lines)\n\u001b[1;32m 708\u001b[0m \u001b[0;34m\u001b[0m\u001b[0m\n\u001b[0;32m--> 709\u001b[0;31m \u001b[0;32mreturn\u001b[0m \u001b[0m_read\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0mfilepath_or_buffer\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0mkwds\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[0m\u001b[1;32m 710\u001b[0m \u001b[0;34m\u001b[0m\u001b[0m\n\u001b[1;32m 711\u001b[0m \u001b[0mparser_f\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0m__name__\u001b[0m \u001b[0;34m=\u001b[0m \u001b[0mname\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n", - "\u001b[0;32m/opt/conda/lib/python3.6/site-packages/pandas/io/parsers.py\u001b[0m in \u001b[0;36m_read\u001b[0;34m(filepath_or_buffer, kwds)\u001b[0m\n\u001b[1;32m 453\u001b[0m \u001b[0;34m\u001b[0m\u001b[0m\n\u001b[1;32m 454\u001b[0m \u001b[0;32mtry\u001b[0m\u001b[0;34m:\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[0;32m--> 455\u001b[0;31m \u001b[0mdata\u001b[0m \u001b[0;34m=\u001b[0m \u001b[0mparser\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0mread\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0mnrows\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[0m\u001b[1;32m 456\u001b[0m \u001b[0;32mfinally\u001b[0m\u001b[0;34m:\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[1;32m 457\u001b[0m \u001b[0mparser\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0mclose\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n", - "\u001b[0;32m/opt/conda/lib/python3.6/site-packages/pandas/io/parsers.py\u001b[0m in \u001b[0;36mread\u001b[0;34m(self, nrows)\u001b[0m\n\u001b[1;32m 1067\u001b[0m \u001b[0;32mraise\u001b[0m \u001b[0mValueError\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0;34m'skipfooter not supported for iteration'\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[1;32m 1068\u001b[0m \u001b[0;34m\u001b[0m\u001b[0m\n\u001b[0;32m-> 1069\u001b[0;31m \u001b[0mret\u001b[0m \u001b[0;34m=\u001b[0m \u001b[0mself\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0m_engine\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0mread\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0mnrows\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[0m\u001b[1;32m 1070\u001b[0m \u001b[0;34m\u001b[0m\u001b[0m\n\u001b[1;32m 1071\u001b[0m \u001b[0;32mif\u001b[0m \u001b[0mself\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0moptions\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0mget\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0;34m'as_recarray'\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m:\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n", - "\u001b[0;32m/opt/conda/lib/python3.6/site-packages/pandas/io/parsers.py\u001b[0m in \u001b[0;36mread\u001b[0;34m(self, nrows)\u001b[0m\n\u001b[1;32m 1837\u001b[0m \u001b[0;32mdef\u001b[0m \u001b[0mread\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0mself\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0mnrows\u001b[0m\u001b[0;34m=\u001b[0m\u001b[0;32mNone\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m:\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[1;32m 1838\u001b[0m \u001b[0;32mtry\u001b[0m\u001b[0;34m:\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[0;32m-> 1839\u001b[0;31m \u001b[0mdata\u001b[0m \u001b[0;34m=\u001b[0m \u001b[0mself\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0m_reader\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0mread\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0mnrows\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[0m\u001b[1;32m 1840\u001b[0m \u001b[0;32mexcept\u001b[0m \u001b[0mStopIteration\u001b[0m\u001b[0;34m:\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[1;32m 1841\u001b[0m \u001b[0;32mif\u001b[0m \u001b[0mself\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0m_first_chunk\u001b[0m\u001b[0;34m:\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n", - "\u001b[0;32mpandas/_libs/parsers.pyx\u001b[0m in \u001b[0;36mpandas._libs.parsers.TextReader.read\u001b[0;34m()\u001b[0m\n", - "\u001b[0;32mpandas/_libs/parsers.pyx\u001b[0m in \u001b[0;36mpandas._libs.parsers.TextReader._read_low_memory\u001b[0;34m()\u001b[0m\n", - "\u001b[0;32mpandas/_libs/parsers.pyx\u001b[0m in \u001b[0;36mpandas._libs.parsers.TextReader._read_rows\u001b[0;34m()\u001b[0m\n", - "\u001b[0;32mpandas/_libs/parsers.pyx\u001b[0m in \u001b[0;36mpandas._libs.parsers.TextReader._tokenize_rows\u001b[0;34m()\u001b[0m\n", - "\u001b[0;32mpandas/_libs/parsers.pyx\u001b[0m in \u001b[0;36mpandas._libs.parsers.raise_parser_error\u001b[0;34m()\u001b[0m\n", - "\u001b[0;31mParserError\u001b[0m: Error tokenizing data. C error: Expected 1 fields in line 30, saw 21\n" - ] + "data": { + "text/html": [ + "
\n", + "\n", + "\n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + "
weekindicatorincinc_lowinc_upinc100inc100_lowinc100_upgeo_inseegeo_name
02021203138039830.017776.02115.027.0FRFrance
1202119397747030.012518.01511.019.0FRFrance
22021183121359165.015105.01814.022.0FRFrance
32021173120588891.015225.01813.023.0FRFrance
420211631650512735.020275.02519.031.0FRFrance
520211531930615398.023214.02923.035.0FRFrance
620211432107317099.025047.03226.038.0FRFrance
720211332641322094.030732.04033.047.0FRFrance
820211233065825919.035397.04639.053.0FRFrance
920211132498820718.029258.03832.044.0FRFrance
1020211031953915951.023127.03025.035.0FRFrance
1120210931757213926.021218.02721.033.0FRFrance
1220210832088216907.024857.03226.038.0FRFrance
1320210732239318303.026483.03428.040.0FRFrance
1420210632318319134.027232.03529.041.0FRFrance
1520210532242618445.026407.03428.040.0FRFrance
1620210432580421491.030117.03932.046.0FRFrance
1720210332181017894.025726.03327.039.0FRFrance
1820210231732013906.020734.02621.031.0FRFrance
1920210132179917778.025820.03327.039.0FRFrance
2020205332122016498.025942.03225.039.0FRFrance
2120205231642812285.020571.02519.031.0FRFrance
2220205132161917370.025868.03327.039.0FRFrance
2320205031684513220.020470.02620.032.0FRFrance
242020493129399923.015955.02015.025.0FRFrance
2520204831380410641.016967.02116.026.0FRFrance
2620204731908515285.022885.02923.035.0FRFrance
2720204632480120503.029099.03831.045.0FRFrance
2820204534251636857.048175.06556.074.0FRFrance
2920204434456738521.050613.06859.077.0FRFrance
.................................
187819852132609619621.032571.04735.059.0FRFrance
187919852032789620885.034907.05138.064.0FRFrance
188019851934315432821.053487.07859.097.0FRFrance
188119851834055529935.051175.07455.093.0FRFrance
188219851733405324366.043740.06244.080.0FRFrance
188319851635036236451.064273.09166.0116.0FRFrance
188419851536388145538.082224.011683.0149.0FRFrance
18851985143134545114400.0154690.0244207.0281.0FRFrance
18861985133197206176080.0218332.0357319.0395.0FRFrance
18871985123245240223304.0267176.0445405.0485.0FRFrance
18881985113276205252399.0300011.0501458.0544.0FRFrance
18891985103353231326279.0380183.0640591.0689.0FRFrance
18901985093369895341109.0398681.0670618.0722.0FRFrance
18911985083389886359529.0420243.0707652.0762.0FRFrance
18921985073471852432599.0511105.0855784.0926.0FRFrance
18931985063565825518011.0613639.01026939.01113.0FRFrance
18941985053637302592795.0681809.011551074.01236.0FRFrance
18951985043424937390794.0459080.0770708.0832.0FRFrance
18961985033213901174689.0253113.0388317.0459.0FRFrance
189719850239758680949.0114223.0177147.0207.0FRFrance
189819850138548965918.0105060.0155120.0190.0FRFrance
189919845238483060602.0109058.0154110.0198.0FRFrance
1900198451310172680242.0123210.0185146.0224.0FRFrance
19011984503123680101401.0145959.0225184.0266.0FRFrance
1902198449310107381684.0120462.0184149.0219.0FRFrance
190319844837862060634.096606.0143110.0176.0FRFrance
190419844737202954274.089784.013199.0163.0FRFrance
190519844638733067686.0106974.0159123.0195.0FRFrance
19061984453135223101414.0169032.0246184.0308.0FRFrance
190719844436842220056.0116788.012537.0213.0FRFrance
\n", + "

1908 rows × 10 columns

\n", + "
" + ], + "text/plain": [ + " week indicator inc inc_low inc_up inc100 inc100_low \\\n", + "0 202120 3 13803 9830.0 17776.0 21 15.0 \n", + "1 202119 3 9774 7030.0 12518.0 15 11.0 \n", + "2 202118 3 12135 9165.0 15105.0 18 14.0 \n", + "3 202117 3 12058 8891.0 15225.0 18 13.0 \n", + "4 202116 3 16505 12735.0 20275.0 25 19.0 \n", + "5 202115 3 19306 15398.0 23214.0 29 23.0 \n", + "6 202114 3 21073 17099.0 25047.0 32 26.0 \n", + "7 202113 3 26413 22094.0 30732.0 40 33.0 \n", + "8 202112 3 30658 25919.0 35397.0 46 39.0 \n", + "9 202111 3 24988 20718.0 29258.0 38 32.0 \n", + "10 202110 3 19539 15951.0 23127.0 30 25.0 \n", + "11 202109 3 17572 13926.0 21218.0 27 21.0 \n", + "12 202108 3 20882 16907.0 24857.0 32 26.0 \n", + "13 202107 3 22393 18303.0 26483.0 34 28.0 \n", + "14 202106 3 23183 19134.0 27232.0 35 29.0 \n", + "15 202105 3 22426 18445.0 26407.0 34 28.0 \n", + "16 202104 3 25804 21491.0 30117.0 39 32.0 \n", + "17 202103 3 21810 17894.0 25726.0 33 27.0 \n", + "18 202102 3 17320 13906.0 20734.0 26 21.0 \n", + "19 202101 3 21799 17778.0 25820.0 33 27.0 \n", + "20 202053 3 21220 16498.0 25942.0 32 25.0 \n", + "21 202052 3 16428 12285.0 20571.0 25 19.0 \n", + "22 202051 3 21619 17370.0 25868.0 33 27.0 \n", + "23 202050 3 16845 13220.0 20470.0 26 20.0 \n", + "24 202049 3 12939 9923.0 15955.0 20 15.0 \n", + "25 202048 3 13804 10641.0 16967.0 21 16.0 \n", + "26 202047 3 19085 15285.0 22885.0 29 23.0 \n", + "27 202046 3 24801 20503.0 29099.0 38 31.0 \n", + "28 202045 3 42516 36857.0 48175.0 65 56.0 \n", + "29 202044 3 44567 38521.0 50613.0 68 59.0 \n", + "... ... ... ... ... ... ... ... \n", + "1878 198521 3 26096 19621.0 32571.0 47 35.0 \n", + "1879 198520 3 27896 20885.0 34907.0 51 38.0 \n", + "1880 198519 3 43154 32821.0 53487.0 78 59.0 \n", + "1881 198518 3 40555 29935.0 51175.0 74 55.0 \n", + "1882 198517 3 34053 24366.0 43740.0 62 44.0 \n", + "1883 198516 3 50362 36451.0 64273.0 91 66.0 \n", + "1884 198515 3 63881 45538.0 82224.0 116 83.0 \n", + "1885 198514 3 134545 114400.0 154690.0 244 207.0 \n", + "1886 198513 3 197206 176080.0 218332.0 357 319.0 \n", + "1887 198512 3 245240 223304.0 267176.0 445 405.0 \n", + "1888 198511 3 276205 252399.0 300011.0 501 458.0 \n", + "1889 198510 3 353231 326279.0 380183.0 640 591.0 \n", + "1890 198509 3 369895 341109.0 398681.0 670 618.0 \n", + "1891 198508 3 389886 359529.0 420243.0 707 652.0 \n", + "1892 198507 3 471852 432599.0 511105.0 855 784.0 \n", + "1893 198506 3 565825 518011.0 613639.0 1026 939.0 \n", + "1894 198505 3 637302 592795.0 681809.0 1155 1074.0 \n", + "1895 198504 3 424937 390794.0 459080.0 770 708.0 \n", + "1896 198503 3 213901 174689.0 253113.0 388 317.0 \n", + "1897 198502 3 97586 80949.0 114223.0 177 147.0 \n", + "1898 198501 3 85489 65918.0 105060.0 155 120.0 \n", + "1899 198452 3 84830 60602.0 109058.0 154 110.0 \n", + "1900 198451 3 101726 80242.0 123210.0 185 146.0 \n", + "1901 198450 3 123680 101401.0 145959.0 225 184.0 \n", + "1902 198449 3 101073 81684.0 120462.0 184 149.0 \n", + "1903 198448 3 78620 60634.0 96606.0 143 110.0 \n", + "1904 198447 3 72029 54274.0 89784.0 131 99.0 \n", + "1905 198446 3 87330 67686.0 106974.0 159 123.0 \n", + "1906 198445 3 135223 101414.0 169032.0 246 184.0 \n", + "1907 198444 3 68422 20056.0 116788.0 125 37.0 \n", + "\n", + " inc100_up geo_insee geo_name \n", + "0 27.0 FR France \n", + "1 19.0 FR France \n", + "2 22.0 FR France \n", + "3 23.0 FR France \n", + "4 31.0 FR France \n", + "5 35.0 FR France \n", + "6 38.0 FR France \n", + "7 47.0 FR France \n", + "8 53.0 FR France \n", + "9 44.0 FR France \n", + "10 35.0 FR France \n", + "11 33.0 FR France \n", + "12 38.0 FR France \n", + "13 40.0 FR France \n", + "14 41.0 FR France \n", + "15 40.0 FR France \n", + "16 46.0 FR France \n", + "17 39.0 FR France \n", + "18 31.0 FR France \n", + "19 39.0 FR France \n", + "20 39.0 FR France \n", + "21 31.0 FR France \n", + "22 39.0 FR France \n", + "23 32.0 FR France \n", + "24 25.0 FR France \n", + "25 26.0 FR France \n", + "26 35.0 FR France \n", + "27 45.0 FR France \n", + "28 74.0 FR France \n", + "29 77.0 FR France \n", + "... ... ... ... \n", + "1878 59.0 FR France \n", + "1879 64.0 FR France \n", + "1880 97.0 FR France \n", + "1881 93.0 FR France \n", + "1882 80.0 FR France \n", + "1883 116.0 FR France \n", + "1884 149.0 FR France \n", + "1885 281.0 FR France \n", + "1886 395.0 FR France \n", + "1887 485.0 FR France \n", + "1888 544.0 FR France \n", + "1889 689.0 FR France \n", + "1890 722.0 FR France \n", + "1891 762.0 FR France \n", + "1892 926.0 FR France \n", + "1893 1113.0 FR France \n", + "1894 1236.0 FR France \n", + "1895 832.0 FR France \n", + "1896 459.0 FR France \n", + "1897 207.0 FR France \n", + "1898 190.0 FR France \n", + "1899 198.0 FR France \n", + "1900 224.0 FR France \n", + "1901 266.0 FR France \n", + "1902 219.0 FR France \n", + "1903 176.0 FR France \n", + "1904 163.0 FR France \n", + "1905 195.0 FR France \n", + "1906 308.0 FR France \n", + "1907 213.0 FR France \n", + "\n", + "[1908 rows x 10 columns]" + ] + }, + "execution_count": 32, + "metadata": {}, + "output_type": "execute_result" } ], "source": [ - "raw_data = pd.read_csv(data_url, skiprows=1)\n", + "raw_data = pd.read_csv(data_file, skiprows=1)\n", "raw_data" ] },