diff --git a/module3/exo3/exercice.ipynb b/module3/exo3/exercice.ipynb index 4c11d8f6b483dc7c0b0daa6772e1326d47899183..deadaf0a7105a4b1ea3c6dcec2d1e37c720e1838 100644 --- a/module3/exo3/exercice.ipynb +++ b/module3/exo3/exercice.ipynb @@ -726,29 +726,42 @@ "## Taux de mortalité (question 1)" ] }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "Nous allons calculer le taux de mortalité sur la période pour les deux groupes de femmes : fumeuses et non-fumeuses, et représenter les résultats sous forme d'un tableau." + ] + }, { "cell_type": "code", - "execution_count": 32, + "execution_count": 36, "metadata": {}, "outputs": [ { - "ename": "SyntaxError", - "evalue": "invalid syntax (, line 8)", - "output_type": "error", - "traceback": [ - "\u001b[0;36m File \u001b[0;32m\"\"\u001b[0;36m, line \u001b[0;32m8\u001b[0m\n\u001b[0;31m print form.format(*val)\u001b[0m\n\u001b[0m ^\u001b[0m\n\u001b[0;31mSyntaxError\u001b[0m\u001b[0;31m:\u001b[0m invalid syntax\n" + "name": "stdout", + "output_type": "stream", + "text": [ + " Smokers Non-Smokers\n", + "Vivantes 443.000000 502.000000\n", + "Mortes 139.000000 230.000000\n", + "Taux mortalité 0.238832 0.314208\n" ] } ], "source": [ - "alive = [\"nb vivantes\", len(data[(data['Smoker'] == \"Yes\") & (data['Status'] == \"Alive\")].index), len(data[(data['Smoker'] == \"No\") & (data['Status'] == \"Alive\")].index)]\n", - "dead = [\"nb mortes\", len(data[(data['Smoker'] == \"Yes\") & (data['Status'] == \"Dead\")].index), len(data[(data['Smoker'] == \"No\") & (data['Status'] == \"Dead\")].index)]\n", - "deathrate = [\"taux mortalite\", dead[1]/(alive[1] + dead[1]), dead[2]/(alive[2] + dead[2])]\n", + "alive = [len(data[(data['Smoker'] == \"Yes\") & (data['Status'] == \"Alive\")].index), len(data[(data['Smoker'] == \"No\") & (data['Status'] == \"Alive\")].index)]\n", + "dead = [len(data[(data['Smoker'] == \"Yes\") & (data['Status'] == \"Dead\")].index), len(data[(data['Smoker'] == \"No\") & (data['Status'] == 
\"Dead\")].index)]\n", + "deathrate = [dead[0]/(alive[0] + dead[0]), dead[1]/(alive[1] + dead[1])]\n", "\n", - "tab = [[\"\", \"Smokers\", \"Non Smokers\"], alive, dead, deathrate]\n", - "form=\"{0:10}{1:10}{2:10}\"\n", - "for val in tab:\n", - " print form.format(*val)" + "print(pd.DataFrame([alive, dead, deathrate], [\"Vivantes\", \"Mortes\", \"Taux mortalité\"], [\"Smokers\", \"Non-Smokers\"]))" + ] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "On remarque que le taux de mortalité est - nettement - plus élevé dans le groupe des non fumeuses, ce qui constitue le paradoxe de Simpson" ] }, {