Added a pandas part

parent d47e4e23
......@@ -10,13 +10,14 @@
},
{
"cell_type": "code",
"execution_count": 1,
"execution_count": 2,
"metadata": {},
"outputs": [],
"source": [
"%matplotlib inline\n",
"import numpy as np\n",
"import matplotlib.pyplot as plt"
"import matplotlib.pyplot as plt\n",
"import pandas as pd"
]
},
{
......@@ -28,21 +29,21 @@
},
{
"cell_type": "code",
"execution_count": 2,
"execution_count": 4,
"metadata": {},
"outputs": [
{
"name": "stdout",
"output_type": "stream",
"text": [
"['Year', 'Month', 'Day', 'Number of emails', 'Number that require answers']\n",
"['2023', '8', '2', '3', '0']\n",
"['2023', '8', '3', '2', '0']\n",
"['2023', '8', '4', '2', '0']\n",
"['2023', '8', '5', '0', '0']\n",
"['2023', '8', '6', '1', '0']\n",
"['2023', '8', '7', '3', '2']\n",
"['2023', '8', '8', '2', '0']\n"
"['Date', 'Number of emails', 'Number that require answers']\n",
"['2023-08-02', '3', '0']\n",
"['2023-08-03', '2', '0']\n",
"['2023-08-04', '2', '0']\n",
"['2023-08-05', '0', '0']\n",
"['2023-08-06', '1', '0']\n",
"['2023-08-07', '3', '2']\n",
"['2023-08-08', '5', '3']\n"
]
}
],
......@@ -213,6 +214,243 @@
"np.median(Nemail)"
]
},
{
"cell_type": "markdown",
"metadata": {},
"source": [
"## Traitement des données avec pandas"
]
},
{
"cell_type": "code",
"execution_count": 9,
"metadata": {},
"outputs": [
{
"data": {
"text/html": [
"<div>\n",
"<style scoped>\n",
" .dataframe tbody tr th:only-of-type {\n",
" vertical-align: middle;\n",
" }\n",
"\n",
" .dataframe tbody tr th {\n",
" vertical-align: top;\n",
" }\n",
"\n",
" .dataframe thead th {\n",
" text-align: right;\n",
" }\n",
"</style>\n",
"<table border=\"1\" class=\"dataframe\">\n",
" <thead>\n",
" <tr style=\"text-align: right;\">\n",
" <th></th>\n",
" <th>Date</th>\n",
" <th>Number of emails</th>\n",
" <th>Number that require answers</th>\n",
" </tr>\n",
" </thead>\n",
" <tbody>\n",
" <tr>\n",
" <th>0</th>\n",
" <td>2023-08-02</td>\n",
" <td>3</td>\n",
" <td>0</td>\n",
" </tr>\n",
" <tr>\n",
" <th>1</th>\n",
" <td>2023-08-03</td>\n",
" <td>2</td>\n",
" <td>0</td>\n",
" </tr>\n",
" <tr>\n",
" <th>2</th>\n",
" <td>2023-08-04</td>\n",
" <td>2</td>\n",
" <td>0</td>\n",
" </tr>\n",
" <tr>\n",
" <th>3</th>\n",
" <td>2023-08-05</td>\n",
" <td>0</td>\n",
" <td>0</td>\n",
" </tr>\n",
" <tr>\n",
" <th>4</th>\n",
" <td>2023-08-06</td>\n",
" <td>1</td>\n",
" <td>0</td>\n",
" </tr>\n",
" <tr>\n",
" <th>5</th>\n",
" <td>2023-08-07</td>\n",
" <td>3</td>\n",
" <td>2</td>\n",
" </tr>\n",
" <tr>\n",
" <th>6</th>\n",
" <td>2023-08-08</td>\n",
" <td>5</td>\n",
" <td>3</td>\n",
" </tr>\n",
" </tbody>\n",
"</table>\n",
"</div>"
],
"text/plain": [
" Date Number of emails Number that require answers\n",
"0 2023-08-02 3 0\n",
"1 2023-08-03 2 0\n",
"2 2023-08-04 2 0\n",
"3 2023-08-05 0 0\n",
"4 2023-08-06 1 0\n",
"5 2023-08-07 3 2\n",
"6 2023-08-08 5 3"
]
},
"execution_count": 9,
"metadata": {},
"output_type": "execute_result"
}
],
"source": [
"raw_data = pd.read_csv(filename)\n",
"raw_data"
]
},
{
"cell_type": "code",
"execution_count": 13,
"metadata": {},
"outputs": [
{
"data": {
"text/html": [
"<div>\n",
"<style scoped>\n",
" .dataframe tbody tr th:only-of-type {\n",
" vertical-align: middle;\n",
" }\n",
"\n",
" .dataframe tbody tr th {\n",
" vertical-align: top;\n",
" }\n",
"\n",
" .dataframe thead th {\n",
" text-align: right;\n",
" }\n",
"</style>\n",
"<table border=\"1\" class=\"dataframe\">\n",
" <thead>\n",
" <tr style=\"text-align: right;\">\n",
" <th></th>\n",
" <th>Number of emails</th>\n",
" <th>Number that require answers</th>\n",
" </tr>\n",
" <tr>\n",
" <th>Date</th>\n",
" <th></th>\n",
" <th></th>\n",
" </tr>\n",
" </thead>\n",
" <tbody>\n",
" <tr>\n",
" <th>2023-08-02</th>\n",
" <td>3</td>\n",
" <td>0</td>\n",
" </tr>\n",
" <tr>\n",
" <th>2023-08-03</th>\n",
" <td>2</td>\n",
" <td>0</td>\n",
" </tr>\n",
" <tr>\n",
" <th>2023-08-04</th>\n",
" <td>2</td>\n",
" <td>0</td>\n",
" </tr>\n",
" <tr>\n",
" <th>2023-08-05</th>\n",
" <td>0</td>\n",
" <td>0</td>\n",
" </tr>\n",
" <tr>\n",
" <th>2023-08-06</th>\n",
" <td>1</td>\n",
" <td>0</td>\n",
" </tr>\n",
" <tr>\n",
" <th>2023-08-07</th>\n",
" <td>3</td>\n",
" <td>2</td>\n",
" </tr>\n",
" <tr>\n",
" <th>2023-08-08</th>\n",
" <td>5</td>\n",
" <td>3</td>\n",
" </tr>\n",
" </tbody>\n",
"</table>\n",
"</div>"
],
"text/plain": [
" Number of emails Number that require answers\n",
"Date \n",
"2023-08-02 3 0\n",
"2023-08-03 2 0\n",
"2023-08-04 2 0\n",
"2023-08-05 0 0\n",
"2023-08-06 1 0\n",
"2023-08-07 3 2\n",
"2023-08-08 5 3"
]
},
"execution_count": 13,
"metadata": {},
"output_type": "execute_result"
}
],
"source": [
"date = pd.to_datetime(raw_data['Date'],format='%Y-%m-%d')\n",
"raw_data['Date'] = date\n",
"data = raw_data.set_index('Date')\n",
"data"
]
},
{
"cell_type": "code",
"execution_count": 14,
"metadata": {},
"outputs": [
{
"data": {
"text/plain": [
"<matplotlib.axes._subplots.AxesSubplot at 0x7f6799aa65f8>"
]
},
"execution_count": 14,
"metadata": {},
"output_type": "execute_result"
},
{
"data": {
"image/png": "\n",
"text/plain": [
"<Figure size 432x288 with 1 Axes>"
]
},
"metadata": {
"needs_background": "light"
},
"output_type": "display_data"
}
],
"source": [
"data['Number of emails'].plot()"
]
},
{
"cell_type": "code",
"execution_count": null,
......
Markdown is supported
0% or
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment