V1

parent cc155406
This source diff could not be displayed because it is too large. You can view the blob instead.
This source diff could not be displayed because it is too large. You can view the blob instead.
{
"cells": [
{
"cell_type": "code",
"execution_count": 149,
"metadata": {},
"outputs": [],
"source": [
"## Mom's project (\"Projet Maman\")\n",
"# Builds `donnees`: one row per respondent ID found in both Initial.csv and Final.csv.\n",
"\n",
"import numpy as np\n",
"import pandas as pd\n",
"import matplotlib.pyplot as plt\n",
"\n",
"# Header of the respondent-ID column; the trailing \\xa0 is a non-breaking space.\n",
"COLONNE_ID = \"Question cachée pour enregistrer l'ID anonymisé des apprenants.\\xa0\"\n",
"# Rows whose submission date is missing are discarded before matching.\n",
"COLONNE_DATE = \"Date de soumission\"\n",
"\n",
"\n",
"def charger_reponses(chemin):\n",
"    \"\"\"Load one CSV export indexed by respondent ID.\n",
"\n",
"    Rows without a submission date are dropped, then only the first row of\n",
"    each ID is kept so that the returned index is unique.\n",
"\n",
"    Parameters\n",
"    ----------\n",
"    chemin : str\n",
"        Path of the CSV file to read.\n",
"\n",
"    Returns\n",
"    -------\n",
"    pandas.DataFrame\n",
"        The cleaned rows, indexed by the respondent-ID column.\n",
"    \"\"\"\n",
"    reponses = pd.read_csv(chemin).set_index(COLONNE_ID)\n",
"    reponses = reponses.dropna(subset=[COLONNE_DATE])\n",
"    return reponses[~reponses.index.duplicated()]\n",
"\n",
"\n",
"donnees_init = charger_reponses('Initial.csv')\n",
"# Final.csv is de-duplicated as well: a repeated ID there would make `.loc`\n",
"# return extra rows and leave a non-unique index for the axis=1 concat below.\n",
"donnees_fin = charger_reponses('Final.csv')\n",
"\n",
"# Respondent IDs present in both files.\n",
"donnees_index = donnees_fin.index.intersection(donnees_init.index)\n",
"# Columns that exist only in the initial file, kept in their original order.\n",
"donnees_columns = [col for col in donnees_init.columns if col not in donnees_fin.columns]\n",
"\n",
"# Initial-only columns first, then every column of the final file.\n",
"donnees = pd.concat(\n",
"    [donnees_init.loc[list(donnees_index), donnees_columns], donnees_fin.loc[list(donnees_index), :]],\n",
"    axis=1,\n",
")"
]
},
{
"cell_type": "code",
"execution_count": 155,
"metadata": {},
"outputs": [
{
"data": {
"image/png": "\n",
"text/plain": [
"<Figure size 1224x504 with 1 Axes>"
]
},
"metadata": {
"needs_background": "light"
},
"output_type": "display_data"
},
{
"data": {
"text/html": [
"<div>\n",
"<style scoped>\n",
" .dataframe tbody tr th:only-of-type {\n",
" vertical-align: middle;\n",
" }\n",
"\n",
" .dataframe tbody tr th {\n",
" vertical-align: top;\n",
" }\n",
"\n",
" .dataframe thead th {\n",
" text-align: right;\n",
" }\n",
"</style>\n",
"<table border=\"1\" class=\"dataframe\">\n",
" <thead>\n",
" <tr style=\"text-align: right;\">\n",
" <th></th>\n",
" <th>Féminin</th>\n",
" <th>Masculin</th>\n",
" </tr>\n",
" </thead>\n",
" <tbody>\n",
" <tr>\n",
" <th>Retraité</th>\n",
" <td>0</td>\n",
" <td>1</td>\n",
" </tr>\n",
" <tr>\n",
" <th>Autre</th>\n",
" <td>2</td>\n",
" <td>4</td>\n",
" </tr>\n",
" <tr>\n",
" <th>En recherche d'emploi</th>\n",
" <td>1</td>\n",
" <td>0</td>\n",
" </tr>\n",
" <tr>\n",
" <th>Étudiant</th>\n",
" <td>3</td>\n",
" <td>8</td>\n",
" </tr>\n",
" <tr>\n",
" <th>Salarié en activité</th>\n",
" <td>2</td>\n",
" <td>2</td>\n",
" </tr>\n",
" </tbody>\n",
"</table>\n",
"</div>"
],
"text/plain": [
" Féminin Masculin\n",
"Retraité 0 1\n",
"Autre 2 4\n",
"En recherche d'emploi 1 0\n",
"Étudiant 3 8\n",
"Salarié en activité 2 2"
]
},
"execution_count": 155,
"metadata": {},
"output_type": "execute_result"
}
],
"source": [
"def hist_double_situation_professionnelle(colonne):\n",
"    \"\"\"Plot and return the counts of `colonne` values per professional situation.\n",
"\n",
"    Rows of the module-level `donnees` frame are grouped by the\n",
"    \"Quelle est votre situation professionnelle ?\" column; within each group\n",
"    the occurrences of every distinct value of `colonne` are counted. Missing\n",
"    values in either column are ignored.\n",
"\n",
"    Parameters\n",
"    ----------\n",
"    colonne : str\n",
"        Name of the `donnees` column to break down.\n",
"\n",
"    Returns\n",
"    -------\n",
"    pandas.DataFrame\n",
"        One row per situation and one column per value of `colonne`, both in\n",
"        order of first appearance in `donnees`.\n",
"    \"\"\"\n",
"    # NOTE(review): near-duplicate of hist_double_fonction; a shared helper\n",
"    # taking the grouping column as a parameter would remove the copy.\n",
"    question = \"Quelle est votre situation professionnelle ?\"\n",
"    situations = donnees.loc[:, question]\n",
"    reponses = donnees.loc[:, colonne]\n",
"\n",
"    # dropna().unique() keeps first-appearance order, so the table no longer\n",
"    # depends on set iteration order, nor on every NaN being the same object.\n",
"    liste_situation = list(situations.dropna().unique())\n",
"    liste_colonne = list(reponses.dropna().unique())\n",
"\n",
"    liste_dico = [\n",
"        {\n",
"            item_colonne: int(((situations == situation) & (reponses == item_colonne)).sum())\n",
"            for item_colonne in liste_colonne\n",
"        }\n",
"        for situation in liste_situation\n",
"    ]\n",
"    # Built once and reused for both the figure and the return value.\n",
"    tableau = pd.DataFrame(liste_dico, index=liste_situation, columns=liste_colonne)\n",
"\n",
"    # Skip the figure when there is nothing to draw.\n",
"    if not tableau.empty:\n",
"        fig, ax = plt.subplots(figsize=(17, 7))\n",
"        tableau.plot(kind='bar', ax=ax)\n",
"        ax.set_xlabel(question)\n",
"        ax.set_ylabel(\"Nombre de réponses\")\n",
"        ax.legend(title=colonne)\n",
"        plt.show()\n",
"    return tableau\n",
"\n",
"\n",
"hist_double_situation_professionnelle(\"Indiquez votre genre :\")"
]
},
{
"cell_type": "code",
"execution_count": 156,
"metadata": {},
"outputs": [
{
"data": {
"image/png": "\n",
"text/plain": [
"<Figure size 1224x504 with 1 Axes>"
]
},
"metadata": {
"needs_background": "light"
},
"output_type": "display_data"
},
{
"data": {
"text/html": [
"<div>\n",
"<style scoped>\n",
" .dataframe tbody tr th:only-of-type {\n",
" vertical-align: middle;\n",
" }\n",
"\n",
" .dataframe tbody tr th {\n",
" vertical-align: top;\n",
" }\n",
"\n",
" .dataframe thead th {\n",
" text-align: right;\n",
" }\n",
"</style>\n",
"<table border=\"1\" class=\"dataframe\">\n",
" <thead>\n",
" <tr style=\"text-align: right;\">\n",
" <th></th>\n",
" <th>Féminin</th>\n",
" <th>Masculin</th>\n",
" </tr>\n",
" </thead>\n",
" <tbody>\n",
" <tr>\n",
" <th>Ingénieur / Cadre</th>\n",
" <td>1</td>\n",
" <td>1</td>\n",
" </tr>\n",
" </tbody>\n",
"</table>\n",
"</div>"
],
"text/plain": [
" Féminin Masculin\n",
"Ingénieur / Cadre 1 1"
]
},
"execution_count": 156,
"metadata": {},
"output_type": "execute_result"
}
],
"source": [
"def hist_double_fonction(colonne):\n",
"    \"\"\"Plot and return the counts of `colonne` values per job function.\n",
"\n",
"    Rows of the module-level `donnees` frame are grouped by the\n",
"    \"Quelle est votre fonction ?\" column; within each group the occurrences\n",
"    of every distinct value of `colonne` are counted. Missing values in\n",
"    either column are ignored.\n",
"\n",
"    Parameters\n",
"    ----------\n",
"    colonne : str\n",
"        Name of the `donnees` column to break down.\n",
"\n",
"    Returns\n",
"    -------\n",
"    pandas.DataFrame\n",
"        One row per function and one column per value of `colonne`, both in\n",
"        order of first appearance in `donnees`.\n",
"    \"\"\"\n",
"    # NOTE(review): near-duplicate of hist_double_situation_professionnelle; a\n",
"    # shared helper taking the grouping column would remove the copy.\n",
"    question = \"Quelle est votre fonction ?\"\n",
"    fonctions = donnees.loc[:, question]\n",
"    reponses = donnees.loc[:, colonne]\n",
"\n",
"    # dropna().unique() keeps first-appearance order, so the table no longer\n",
"    # depends on set iteration order, nor on every NaN being the same object.\n",
"    liste_fonction = list(fonctions.dropna().unique())\n",
"    liste_colonne = list(reponses.dropna().unique())\n",
"\n",
"    liste_dico = [\n",
"        {\n",
"            item_colonne: int(((fonctions == fonction) & (reponses == item_colonne)).sum())\n",
"            for item_colonne in liste_colonne\n",
"        }\n",
"        for fonction in liste_fonction\n",
"    ]\n",
"    # Built once and reused for both the figure and the return value.\n",
"    tableau = pd.DataFrame(liste_dico, index=liste_fonction, columns=liste_colonne)\n",
"\n",
"    # Skip the figure when there is nothing to draw.\n",
"    if not tableau.empty:\n",
"        fig, ax = plt.subplots(figsize=(17, 7))\n",
"        tableau.plot(kind='bar', ax=ax)\n",
"        ax.set_xlabel(question)\n",
"        ax.set_ylabel(\"Nombre de réponses\")\n",
"        ax.legend(title=colonne)\n",
"        plt.show()\n",
"    return tableau\n",
"\n",
"\n",
"hist_double_fonction(\"Indiquez votre genre :\")"
]
}
],
"metadata": {
"kernelspec": {
"display_name": "Python 3",
"language": "python",
"name": "python3"
},
"language_info": {
"codemirror_mode": {
"name": "ipython",
"version": 3
},
"file_extension": ".py",
"mimetype": "text/x-python",
"name": "python",
"nbconvert_exporter": "python",
"pygments_lexer": "ipython3",
"version": "3.6.4"
}
},
"nbformat": 4,
"nbformat_minor": 4
}
Markdown is supported
0% or
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment