979 lines
51 KiB
Plaintext
979 lines
51 KiB
Plaintext
|
{
|
||
|
"cells": [
|
||
|
{
|
||
|
"cell_type": "code",
|
||
|
"execution_count": 1,
|
||
|
"id": "935dd393-0cdb-470f-b5e7-cf2af42855fd",
|
||
|
"metadata": {
|
||
|
"tags": []
|
||
|
},
|
||
|
"outputs": [],
|
||
|
"source": [
|
||
|
"url = \"https://pixees.fr/informatiquelycee/n_site/asset/titanic.csv\""
|
||
|
]
|
||
|
},
|
||
|
{
|
||
|
"cell_type": "code",
|
||
|
"execution_count": 2,
|
||
|
"id": "a4ff45d8-079a-4a2e-a220-87760831d4ba",
|
||
|
"metadata": {
|
||
|
"tags": []
|
||
|
},
|
||
|
"outputs": [],
|
||
|
"source": [
|
||
|
"# Load the Titanic passenger data from the CSV at `url` (defined in the previous cell).\n",
"import pandas as pd\n",
"\n",
"# pd.read_csv is the public entry point; pandas.io.parsers is an internal module path.\n",
"data = pd.read_csv(url)"
|
||
|
]
|
||
|
},
|
||
|
{
|
||
|
"cell_type": "code",
|
||
|
"execution_count": 3,
|
||
|
"id": "3f9f39d2-aced-4bba-acf7-b00505f93a21",
|
||
|
"metadata": {
|
||
|
"tags": []
|
||
|
},
|
||
|
"outputs": [
|
||
|
{
|
||
|
"data": {
|
||
|
"text/html": [
|
||
|
"<div>\n",
|
||
|
"<style scoped>\n",
|
||
|
" .dataframe tbody tr th:only-of-type {\n",
|
||
|
" vertical-align: middle;\n",
|
||
|
" }\n",
|
||
|
"\n",
|
||
|
" .dataframe tbody tr th {\n",
|
||
|
" vertical-align: top;\n",
|
||
|
" }\n",
|
||
|
"\n",
|
||
|
" .dataframe thead th {\n",
|
||
|
" text-align: right;\n",
|
||
|
" }\n",
|
||
|
"</style>\n",
|
||
|
"<table border=\"1\" class=\"dataframe\">\n",
|
||
|
" <thead>\n",
|
||
|
" <tr style=\"text-align: right;\">\n",
|
||
|
" <th></th>\n",
|
||
|
" <th>PassengerId</th>\n",
|
||
|
" <th>Survived</th>\n",
|
||
|
" <th>Pclass</th>\n",
|
||
|
" <th>Name</th>\n",
|
||
|
" <th>Sex</th>\n",
|
||
|
" <th>Age</th>\n",
|
||
|
" <th>SibSp</th>\n",
|
||
|
" <th>Parch</th>\n",
|
||
|
" <th>Ticket</th>\n",
|
||
|
" <th>Fare</th>\n",
|
||
|
" <th>Cabin</th>\n",
|
||
|
" <th>Embarked</th>\n",
|
||
|
" </tr>\n",
|
||
|
" </thead>\n",
|
||
|
" <tbody>\n",
|
||
|
" <tr>\n",
|
||
|
" <th>0</th>\n",
|
||
|
" <td>1</td>\n",
|
||
|
" <td>0</td>\n",
|
||
|
" <td>3</td>\n",
|
||
|
" <td>Braund, Mr. Owen Harris</td>\n",
|
||
|
" <td>male</td>\n",
|
||
|
" <td>22.0</td>\n",
|
||
|
" <td>1</td>\n",
|
||
|
" <td>0</td>\n",
|
||
|
" <td>A/5 21171</td>\n",
|
||
|
" <td>7.2500</td>\n",
|
||
|
" <td>NaN</td>\n",
|
||
|
" <td>S</td>\n",
|
||
|
" </tr>\n",
|
||
|
" <tr>\n",
|
||
|
" <th>1</th>\n",
|
||
|
" <td>2</td>\n",
|
||
|
" <td>1</td>\n",
|
||
|
" <td>1</td>\n",
|
||
|
" <td>Cumings, Mrs. John Bradley (Florence Briggs Th...</td>\n",
|
||
|
" <td>female</td>\n",
|
||
|
" <td>38.0</td>\n",
|
||
|
" <td>1</td>\n",
|
||
|
" <td>0</td>\n",
|
||
|
" <td>PC 17599</td>\n",
|
||
|
" <td>71.2833</td>\n",
|
||
|
" <td>C85</td>\n",
|
||
|
" <td>C</td>\n",
|
||
|
" </tr>\n",
|
||
|
" <tr>\n",
|
||
|
" <th>2</th>\n",
|
||
|
" <td>3</td>\n",
|
||
|
" <td>1</td>\n",
|
||
|
" <td>3</td>\n",
|
||
|
" <td>Heikkinen, Miss. Laina</td>\n",
|
||
|
" <td>female</td>\n",
|
||
|
" <td>26.0</td>\n",
|
||
|
" <td>0</td>\n",
|
||
|
" <td>0</td>\n",
|
||
|
" <td>STON/O2. 3101282</td>\n",
|
||
|
" <td>7.9250</td>\n",
|
||
|
" <td>NaN</td>\n",
|
||
|
" <td>S</td>\n",
|
||
|
" </tr>\n",
|
||
|
" <tr>\n",
|
||
|
" <th>3</th>\n",
|
||
|
" <td>4</td>\n",
|
||
|
" <td>1</td>\n",
|
||
|
" <td>1</td>\n",
|
||
|
" <td>Futrelle, Mrs. Jacques Heath (Lily May Peel)</td>\n",
|
||
|
" <td>female</td>\n",
|
||
|
" <td>35.0</td>\n",
|
||
|
" <td>1</td>\n",
|
||
|
" <td>0</td>\n",
|
||
|
" <td>113803</td>\n",
|
||
|
" <td>53.1000</td>\n",
|
||
|
" <td>C123</td>\n",
|
||
|
" <td>S</td>\n",
|
||
|
" </tr>\n",
|
||
|
" <tr>\n",
|
||
|
" <th>4</th>\n",
|
||
|
" <td>5</td>\n",
|
||
|
" <td>0</td>\n",
|
||
|
" <td>3</td>\n",
|
||
|
" <td>Allen, Mr. William Henry</td>\n",
|
||
|
" <td>male</td>\n",
|
||
|
" <td>35.0</td>\n",
|
||
|
" <td>0</td>\n",
|
||
|
" <td>0</td>\n",
|
||
|
" <td>373450</td>\n",
|
||
|
" <td>8.0500</td>\n",
|
||
|
" <td>NaN</td>\n",
|
||
|
" <td>S</td>\n",
|
||
|
" </tr>\n",
|
||
|
" </tbody>\n",
|
||
|
"</table>\n",
|
||
|
"</div>"
|
||
|
],
|
||
|
"text/plain": [
|
||
|
" PassengerId Survived Pclass \\\n",
|
||
|
"0 1 0 3 \n",
|
||
|
"1 2 1 1 \n",
|
||
|
"2 3 1 3 \n",
|
||
|
"3 4 1 1 \n",
|
||
|
"4 5 0 3 \n",
|
||
|
"\n",
|
||
|
" Name Sex Age SibSp \\\n",
|
||
|
"0 Braund, Mr. Owen Harris male 22.0 1 \n",
|
||
|
"1 Cumings, Mrs. John Bradley (Florence Briggs Th... female 38.0 1 \n",
|
||
|
"2 Heikkinen, Miss. Laina female 26.0 0 \n",
|
||
|
"3 Futrelle, Mrs. Jacques Heath (Lily May Peel) female 35.0 1 \n",
|
||
|
"4 Allen, Mr. William Henry male 35.0 0 \n",
|
||
|
"\n",
|
||
|
" Parch Ticket Fare Cabin Embarked \n",
|
||
|
"0 0 A/5 21171 7.2500 NaN S \n",
|
||
|
"1 0 PC 17599 71.2833 C85 C \n",
|
||
|
"2 0 STON/O2. 3101282 7.9250 NaN S \n",
|
||
|
"3 0 113803 53.1000 C123 S \n",
|
||
|
"4 0 373450 8.0500 NaN S "
|
||
|
]
|
||
|
},
|
||
|
"execution_count": 3,
|
||
|
"metadata": {},
|
||
|
"output_type": "execute_result"
|
||
|
}
|
||
|
],
|
||
|
"source": [
|
||
|
"data.head()"
|
||
|
]
|
||
|
},
|
||
|
{
|
||
|
"cell_type": "code",
|
||
|
"execution_count": 4,
|
||
|
"id": "f4b6f349-e8d5-406b-84f0-ee876df95e1f",
|
||
|
"metadata": {
|
||
|
"tags": []
|
||
|
},
|
||
|
"outputs": [
|
||
|
{
|
||
|
"data": {
|
||
|
"text/html": [
|
||
|
"<div>\n",
|
||
|
"<style scoped>\n",
|
||
|
" .dataframe tbody tr th:only-of-type {\n",
|
||
|
" vertical-align: middle;\n",
|
||
|
" }\n",
|
||
|
"\n",
|
||
|
" .dataframe tbody tr th {\n",
|
||
|
" vertical-align: top;\n",
|
||
|
" }\n",
|
||
|
"\n",
|
||
|
" .dataframe thead th {\n",
|
||
|
" text-align: right;\n",
|
||
|
" }\n",
|
||
|
"</style>\n",
|
||
|
"<table border=\"1\" class=\"dataframe\">\n",
|
||
|
" <thead>\n",
|
||
|
" <tr style=\"text-align: right;\">\n",
|
||
|
" <th></th>\n",
|
||
|
" <th>PassengerId</th>\n",
|
||
|
" <th>Survived</th>\n",
|
||
|
" <th>Pclass</th>\n",
|
||
|
" <th>Name</th>\n",
|
||
|
" <th>Sex</th>\n",
|
||
|
" <th>Age</th>\n",
|
||
|
" <th>SibSp</th>\n",
|
||
|
" <th>Parch</th>\n",
|
||
|
" <th>Ticket</th>\n",
|
||
|
" <th>Fare</th>\n",
|
||
|
" <th>Cabin</th>\n",
|
||
|
" <th>Embarked</th>\n",
|
||
|
" </tr>\n",
|
||
|
" </thead>\n",
|
||
|
" <tbody>\n",
|
||
|
" <tr>\n",
|
||
|
" <th>886</th>\n",
|
||
|
" <td>887</td>\n",
|
||
|
" <td>0</td>\n",
|
||
|
" <td>2</td>\n",
|
||
|
" <td>Montvila, Rev. Juozas</td>\n",
|
||
|
" <td>male</td>\n",
|
||
|
" <td>27.0</td>\n",
|
||
|
" <td>0</td>\n",
|
||
|
" <td>0</td>\n",
|
||
|
" <td>211536</td>\n",
|
||
|
" <td>13.00</td>\n",
|
||
|
" <td>NaN</td>\n",
|
||
|
" <td>S</td>\n",
|
||
|
" </tr>\n",
|
||
|
" <tr>\n",
|
||
|
" <th>887</th>\n",
|
||
|
" <td>888</td>\n",
|
||
|
" <td>1</td>\n",
|
||
|
" <td>1</td>\n",
|
||
|
" <td>Graham, Miss. Margaret Edith</td>\n",
|
||
|
" <td>female</td>\n",
|
||
|
" <td>19.0</td>\n",
|
||
|
" <td>0</td>\n",
|
||
|
" <td>0</td>\n",
|
||
|
" <td>112053</td>\n",
|
||
|
" <td>30.00</td>\n",
|
||
|
" <td>B42</td>\n",
|
||
|
" <td>S</td>\n",
|
||
|
" </tr>\n",
|
||
|
" <tr>\n",
|
||
|
" <th>888</th>\n",
|
||
|
" <td>889</td>\n",
|
||
|
" <td>0</td>\n",
|
||
|
" <td>3</td>\n",
|
||
|
" <td>Johnston, Miss. Catherine Helen \"Carrie\"</td>\n",
|
||
|
" <td>female</td>\n",
|
||
|
" <td>NaN</td>\n",
|
||
|
" <td>1</td>\n",
|
||
|
" <td>2</td>\n",
|
||
|
" <td>W./C. 6607</td>\n",
|
||
|
" <td>23.45</td>\n",
|
||
|
" <td>NaN</td>\n",
|
||
|
" <td>S</td>\n",
|
||
|
" </tr>\n",
|
||
|
" <tr>\n",
|
||
|
" <th>889</th>\n",
|
||
|
" <td>890</td>\n",
|
||
|
" <td>1</td>\n",
|
||
|
" <td>1</td>\n",
|
||
|
" <td>Behr, Mr. Karl Howell</td>\n",
|
||
|
" <td>male</td>\n",
|
||
|
" <td>26.0</td>\n",
|
||
|
" <td>0</td>\n",
|
||
|
" <td>0</td>\n",
|
||
|
" <td>111369</td>\n",
|
||
|
" <td>30.00</td>\n",
|
||
|
" <td>C148</td>\n",
|
||
|
" <td>C</td>\n",
|
||
|
" </tr>\n",
|
||
|
" <tr>\n",
|
||
|
" <th>890</th>\n",
|
||
|
" <td>891</td>\n",
|
||
|
" <td>0</td>\n",
|
||
|
" <td>3</td>\n",
|
||
|
" <td>Dooley, Mr. Patrick</td>\n",
|
||
|
" <td>male</td>\n",
|
||
|
" <td>32.0</td>\n",
|
||
|
" <td>0</td>\n",
|
||
|
" <td>0</td>\n",
|
||
|
" <td>370376</td>\n",
|
||
|
" <td>7.75</td>\n",
|
||
|
" <td>NaN</td>\n",
|
||
|
" <td>Q</td>\n",
|
||
|
" </tr>\n",
|
||
|
" </tbody>\n",
|
||
|
"</table>\n",
|
||
|
"</div>"
|
||
|
],
|
||
|
"text/plain": [
|
||
|
" PassengerId Survived Pclass Name \\\n",
|
||
|
"886 887 0 2 Montvila, Rev. Juozas \n",
|
||
|
"887 888 1 1 Graham, Miss. Margaret Edith \n",
|
||
|
"888 889 0 3 Johnston, Miss. Catherine Helen \"Carrie\" \n",
|
||
|
"889 890 1 1 Behr, Mr. Karl Howell \n",
|
||
|
"890 891 0 3 Dooley, Mr. Patrick \n",
|
||
|
"\n",
|
||
|
" Sex Age SibSp Parch Ticket Fare Cabin Embarked \n",
|
||
|
"886 male 27.0 0 0 211536 13.00 NaN S \n",
|
||
|
"887 female 19.0 0 0 112053 30.00 B42 S \n",
|
||
|
"888 female NaN 1 2 W./C. 6607 23.45 NaN S \n",
|
||
|
"889 male 26.0 0 0 111369 30.00 C148 C \n",
|
||
|
"890 male 32.0 0 0 370376 7.75 NaN Q "
|
||
|
]
|
||
|
},
|
||
|
"execution_count": 4,
|
||
|
"metadata": {},
|
||
|
"output_type": "execute_result"
|
||
|
}
|
||
|
],
|
||
|
"source": [
|
||
|
"data.tail()"
|
||
|
]
|
||
|
},
|
||
|
{
|
||
|
"cell_type": "code",
|
||
|
"execution_count": 5,
|
||
|
"id": "86cc0139-bc42-49eb-9261-946db3ce517e",
|
||
|
"metadata": {
|
||
|
"tags": []
|
||
|
},
|
||
|
"outputs": [],
|
||
|
"source": [
|
||
|
"# Keep only Survived, Pclass, Sex and Age for the analysis that follows.\n",
"# `data` is rebound here, so errors='ignore' lets the cell be re-run without a\n",
"# KeyError once the listed columns have already been removed.\n",
"data = data.drop(columns=['Name', 'PassengerId', 'SibSp', 'Parch', 'Ticket', 'Fare', 'Cabin', 'Embarked'], errors='ignore')"
|
||
|
]
|
||
|
},
|
||
|
{
|
||
|
"cell_type": "code",
|
||
|
"execution_count": 6,
|
||
|
"id": "84dcd03a-9f74-467d-92f8-720fd5dc57a2",
|
||
|
"metadata": {
|
||
|
"tags": []
|
||
|
},
|
||
|
"outputs": [
|
||
|
{
|
||
|
"data": {
|
||
|
"text/html": [
|
||
|
"<div>\n",
|
||
|
"<style scoped>\n",
|
||
|
" .dataframe tbody tr th:only-of-type {\n",
|
||
|
" vertical-align: middle;\n",
|
||
|
" }\n",
|
||
|
"\n",
|
||
|
" .dataframe tbody tr th {\n",
|
||
|
" vertical-align: top;\n",
|
||
|
" }\n",
|
||
|
"\n",
|
||
|
" .dataframe thead th {\n",
|
||
|
" text-align: right;\n",
|
||
|
" }\n",
|
||
|
"</style>\n",
|
||
|
"<table border=\"1\" class=\"dataframe\">\n",
|
||
|
" <thead>\n",
|
||
|
" <tr style=\"text-align: right;\">\n",
|
||
|
" <th></th>\n",
|
||
|
" <th>Survived</th>\n",
|
||
|
" <th>Pclass</th>\n",
|
||
|
" <th>Sex</th>\n",
|
||
|
" <th>Age</th>\n",
|
||
|
" </tr>\n",
|
||
|
" </thead>\n",
|
||
|
" <tbody>\n",
|
||
|
" <tr>\n",
|
||
|
" <th>0</th>\n",
|
||
|
" <td>0</td>\n",
|
||
|
" <td>3</td>\n",
|
||
|
" <td>male</td>\n",
|
||
|
" <td>22.0</td>\n",
|
||
|
" </tr>\n",
|
||
|
" <tr>\n",
|
||
|
" <th>1</th>\n",
|
||
|
" <td>1</td>\n",
|
||
|
" <td>1</td>\n",
|
||
|
" <td>female</td>\n",
|
||
|
" <td>38.0</td>\n",
|
||
|
" </tr>\n",
|
||
|
" <tr>\n",
|
||
|
" <th>2</th>\n",
|
||
|
" <td>1</td>\n",
|
||
|
" <td>3</td>\n",
|
||
|
" <td>female</td>\n",
|
||
|
" <td>26.0</td>\n",
|
||
|
" </tr>\n",
|
||
|
" <tr>\n",
|
||
|
" <th>3</th>\n",
|
||
|
" <td>1</td>\n",
|
||
|
" <td>1</td>\n",
|
||
|
" <td>female</td>\n",
|
||
|
" <td>35.0</td>\n",
|
||
|
" </tr>\n",
|
||
|
" <tr>\n",
|
||
|
" <th>4</th>\n",
|
||
|
" <td>0</td>\n",
|
||
|
" <td>3</td>\n",
|
||
|
" <td>male</td>\n",
|
||
|
" <td>35.0</td>\n",
|
||
|
" </tr>\n",
|
||
|
" </tbody>\n",
|
||
|
"</table>\n",
|
||
|
"</div>"
|
||
|
],
|
||
|
"text/plain": [
|
||
|
" Survived Pclass Sex Age\n",
|
||
|
"0 0 3 male 22.0\n",
|
||
|
"1 1 1 female 38.0\n",
|
||
|
"2 1 3 female 26.0\n",
|
||
|
"3 1 1 female 35.0\n",
|
||
|
"4 0 3 male 35.0"
|
||
|
]
|
||
|
},
|
||
|
"execution_count": 6,
|
||
|
"metadata": {},
|
||
|
"output_type": "execute_result"
|
||
|
}
|
||
|
],
|
||
|
"source": [
|
||
|
"data.head()"
|
||
|
]
|
||
|
},
|
||
|
{
|
||
|
"cell_type": "code",
|
||
|
"execution_count": 7,
|
||
|
"id": "8fa36ab8-f947-46b2-9b26-5c608058fd48",
|
||
|
"metadata": {
|
||
|
"tags": []
|
||
|
},
|
||
|
"outputs": [],
|
||
|
"source": [
|
||
|
"data = data.dropna(axis=0)"
|
||
|
]
|
||
|
},
|
||
|
{
|
||
|
"cell_type": "code",
|
||
|
"execution_count": 8,
|
||
|
"id": "b4eeb852-30d2-43b6-82f6-23d1c5db4139",
|
||
|
"metadata": {
|
||
|
"tags": []
|
||
|
},
|
||
|
"outputs": [
|
||
|
{
|
||
|
"name": "stdout",
|
||
|
"output_type": "stream",
|
||
|
"text": [
|
||
|
"(714, 4)\n"
|
||
|
]
|
||
|
}
|
||
|
],
|
||
|
"source": [
|
||
|
"print(data.shape)"
|
||
|
]
|
||
|
},
|
||
|
{
|
||
|
"cell_type": "code",
|
||
|
"execution_count": 9,
|
||
|
"id": "3a91513f-f8e5-4ef3-b0d8-967f98539a50",
|
||
|
"metadata": {
|
||
|
"tags": []
|
||
|
},
|
||
|
"outputs": [
|
||
|
{
|
||
|
"data": {
|
||
|
"text/html": [
|
||
|
"<div>\n",
|
||
|
"<style scoped>\n",
|
||
|
" .dataframe tbody tr th:only-of-type {\n",
|
||
|
" vertical-align: middle;\n",
|
||
|
" }\n",
|
||
|
"\n",
|
||
|
" .dataframe tbody tr th {\n",
|
||
|
" vertical-align: top;\n",
|
||
|
" }\n",
|
||
|
"\n",
|
||
|
" .dataframe thead th {\n",
|
||
|
" text-align: right;\n",
|
||
|
" }\n",
|
||
|
"</style>\n",
|
||
|
"<table border=\"1\" class=\"dataframe\">\n",
|
||
|
" <thead>\n",
|
||
|
" <tr style=\"text-align: right;\">\n",
|
||
|
" <th></th>\n",
|
||
|
" <th>Survived</th>\n",
|
||
|
" <th>Pclass</th>\n",
|
||
|
" <th>Age</th>\n",
|
||
|
" </tr>\n",
|
||
|
" </thead>\n",
|
||
|
" <tbody>\n",
|
||
|
" <tr>\n",
|
||
|
" <th>count</th>\n",
|
||
|
" <td>714.000000</td>\n",
|
||
|
" <td>714.000000</td>\n",
|
||
|
" <td>714.000000</td>\n",
|
||
|
" </tr>\n",
|
||
|
" <tr>\n",
|
||
|
" <th>mean</th>\n",
|
||
|
" <td>0.406162</td>\n",
|
||
|
" <td>2.236695</td>\n",
|
||
|
" <td>29.699118</td>\n",
|
||
|
" </tr>\n",
|
||
|
" <tr>\n",
|
||
|
" <th>std</th>\n",
|
||
|
" <td>0.491460</td>\n",
|
||
|
" <td>0.838250</td>\n",
|
||
|
" <td>14.526497</td>\n",
|
||
|
" </tr>\n",
|
||
|
" <tr>\n",
|
||
|
" <th>min</th>\n",
|
||
|
" <td>0.000000</td>\n",
|
||
|
" <td>1.000000</td>\n",
|
||
|
" <td>0.420000</td>\n",
|
||
|
" </tr>\n",
|
||
|
" <tr>\n",
|
||
|
" <th>25%</th>\n",
|
||
|
" <td>0.000000</td>\n",
|
||
|
" <td>1.000000</td>\n",
|
||
|
" <td>20.125000</td>\n",
|
||
|
" </tr>\n",
|
||
|
" <tr>\n",
|
||
|
" <th>50%</th>\n",
|
||
|
" <td>0.000000</td>\n",
|
||
|
" <td>2.000000</td>\n",
|
||
|
" <td>28.000000</td>\n",
|
||
|
" </tr>\n",
|
||
|
" <tr>\n",
|
||
|
" <th>75%</th>\n",
|
||
|
" <td>1.000000</td>\n",
|
||
|
" <td>3.000000</td>\n",
|
||
|
" <td>38.000000</td>\n",
|
||
|
" </tr>\n",
|
||
|
" <tr>\n",
|
||
|
" <th>max</th>\n",
|
||
|
" <td>1.000000</td>\n",
|
||
|
" <td>3.000000</td>\n",
|
||
|
" <td>80.000000</td>\n",
|
||
|
" </tr>\n",
|
||
|
" </tbody>\n",
|
||
|
"</table>\n",
|
||
|
"</div>"
|
||
|
],
|
||
|
"text/plain": [
|
||
|
" Survived Pclass Age\n",
|
||
|
"count 714.000000 714.000000 714.000000\n",
|
||
|
"mean 0.406162 2.236695 29.699118\n",
|
||
|
"std 0.491460 0.838250 14.526497\n",
|
||
|
"min 0.000000 1.000000 0.420000\n",
|
||
|
"25% 0.000000 1.000000 20.125000\n",
|
||
|
"50% 0.000000 2.000000 28.000000\n",
|
||
|
"75% 1.000000 3.000000 38.000000\n",
|
||
|
"max 1.000000 3.000000 80.000000"
|
||
|
]
|
||
|
},
|
||
|
"execution_count": 9,
|
||
|
"metadata": {},
|
||
|
"output_type": "execute_result"
|
||
|
}
|
||
|
],
|
||
|
"source": [
|
||
|
"data.describe()"
|
||
|
]
|
||
|
},
|
||
|
{
|
||
|
"cell_type": "code",
|
||
|
"execution_count": 10,
|
||
|
"id": "5e52ca0e-69fe-47eb-b4f9-0ae4f1d38a27",
|
||
|
"metadata": {
|
||
|
"tags": []
|
||
|
},
|
||
|
"outputs": [
|
||
|
{
|
||
|
"data": {
|
||
|
"text/plain": [
|
||
|
"3 355\n",
|
||
|
"1 186\n",
|
||
|
"2 173\n",
|
||
|
"Name: Pclass, dtype: int64"
|
||
|
]
|
||
|
},
|
||
|
"execution_count": 10,
|
||
|
"metadata": {},
|
||
|
"output_type": "execute_result"
|
||
|
}
|
||
|
],
|
||
|
"source": [
|
||
|
"data['Pclass'].value_counts()"
|
||
|
]
|
||
|
},
|
||
|
{
|
||
|
"cell_type": "code",
|
||
|
"execution_count": 11,
|
||
|
"id": "61a70d41-bea2-4872-8372-7a999a8e73ac",
|
||
|
"metadata": {
|
||
|
"tags": []
|
||
|
},
|
||
|
"outputs": [
|
||
|
{
|
||
|
"data": {
|
||
|
"text/plain": [
|
||
|
"<Axes: >"
|
||
|
]
|
||
|
},
|
||
|
"execution_count": 11,
|
||
|
"metadata": {},
|
||
|
"output_type": "execute_result"
|
||
|
},
|
||
|
{
|
||
|
"data": {
|
||
|
"image/png": "iVBORw0KGgoAAAANSUhEUgAAAigAAAGYCAYAAABoLxltAAAAOXRFWHRTb2Z0d2FyZQBNYXRwbG90bGliIHZlcnNpb24zLjcuMSwgaHR0cHM6Ly9tYXRwbG90bGliLm9yZy/bCgiHAAAACXBIWXMAAA9hAAAPYQGoP6dpAAAf9klEQVR4nO3df2zU9eHH8dfZ0gNq76QU7kc4ahOqm7aQWAzQqBQoxWZQBCJMEgeRGeVHk6YwtBCzumirLF/QwEa2hYDAsPyhVTMQKQHqmo4FujEp/sJYYgk9O1m5a7G7Yvl8/1j2yY4CetBy77bPR/JJvM/7fZ97f+K5Pve5Xw7LsiwBAAAY5I54LwAAAOBqBAoAADAOgQIAAIxDoAAAAOMQKAAAwDgECgAAMA6BAgAAjEOgAAAA4yTGewE348qVKzp//rxSUlLkcDjivRwAAPADWJal9vZ2+f1+3XHHja+R9MtAOX/+vAKBQLyXAQAAbkJzc7PGjBlzwzn9MlBSUlIk/ecEXS5XnFcDAAB+iHA4rEAgYP8dv5F+GSj/fVnH5XIRKAAA9DM/5O0ZvEkWAAAYh0ABAADGIVAAAIBxCBQAAGAcAgUAABiHQAEAAMYhUAAAgHEIFAAAYBwCBQAAGIdAAQAAxiFQAACAcQgUAABgHAIFAAAYh0ABAADGSYz3Aga6u5/fF+8lDAhnX/lJvJcAALiNYrqCsnXrVo0fP14ul0sul0tTpkzR+++/b48vXbpUDocjaps8eXLUMSKRiIqLi5WWlqbk5GQVFRXp3LlzvXM2AABgQIgpUMaMGaNXXnlFJ06c0IkTJzR9+nTNnTtXp0+ftuc8+uijamlpsbf9+/dHHaOkpETV1dWqqqpSXV2dOjo6NHv2bHV3d/fOGQEAgH4vppd45syZE3X75Zdf1tatW3Xs2DHdf//9kiSn0ymv13vN+4dCIW3btk27du1Sfn6+JGn37t0KBAI6dOiQZs2adTPnAAAABpibfpNsd3e3qqqqdOnSJU2ZMsXef/ToUY0ePVr33HOPnn76abW2ttpjDQ0Nunz5sgoKCux9fr9fWVlZqq+vv+5jRSIRhcPhqA0AAAxcMQfKqVOndOedd8rpdOrZZ59VdXW17rvvPklSYWGh/vjHP+rw4cP6v//7Px0/flzTp09XJBKRJAWDQSUlJWnEiBFRx/R4PAoGg9d9zMrKSrndbnsLBAKxLhsAAPQjMX+K595779XJkyd18eJFvfXWW1qyZIlqa2t13333adGiRfa8rKwsTZw4Uenp6dq3b5/mz59/3WNaliWHw3Hd8bKyMpWWltq3w+EwkQIAwAAWc6AkJSVp3LhxkqSJEyfq+PHjev311/W73/2ux1yfz6f09HSdOXNGkuT1etXV1aW2traoqyitra3Kzc297mM6nU45nc5YlwoAAPqpW/6iNsuy7JdwrnbhwgU1NzfL5/NJknJycjRkyBDV1NTYc1paWtTY2HjDQAEAAINLTFdQ1q1bp8LCQgUCAbW3t6uqqkpHjx7VgQMH1NHRofLyci1YsEA+n09nz57VunXrlJaWpnnz5kmS3G63li1bptWrV2vkyJFKTU3VmjVrlJ2dbX+qBwAAIKZA+frrr/Xkk0+qpaVFbrdb48eP14EDBzRz5kx1dnbq1KlT2rlzpy5evCifz6dp06Zp7969SklJsY+xadMmJSYmauHChers7NSMGTO0Y8cOJSQk9PrJAQCA/slhWZYV70XEKhwOy+12KxQKyeVyxXs5N8RX3fcOvuoeAPq/WP5+82OBAADAOAQKAAAwDoECAACMQ6AAAADjECgAAMA4BAoAADAOgQIAAIxDoAAAAOMQKAAAwDgECgAAMA6BAgAAjEOgAAAA4xAoAADAOAQKAAAwDoECAACMQ6AAAADjECgAAMA4BAoAADAOgQIAAIxDoAAAAOMQKAAAwDgECgAAMA6BAgAAjEOgAAAA4xAoAADAOAQKAAAwDoECAA
CMQ6AAAADjECgAAMA4BAoAADAOgQIAAIxDoAAAAOMQKAAAwDgECgAAMA6BAgAAjEOgAAAA4xAoAADAOAQKAAAwDoECAACME1OgbN26VePHj5fL5ZLL5dKUKVP0/vvv2+OWZam8vFx+v1/Dhg1TXl6eTp8+HXWMSCSi4uJipaWlKTk5WUVFRTp37lzvnA0AABgQYgqUMWPG6JVXXtGJEyd04sQJTZ8+XXPnzrUjZMOGDdq4caO2bNmi48ePy+v1aubMmWpvb7ePUVJSourqalVVVamurk4dHR2aPXu2uru7e/fMAABAv+WwLMu6lQOkpqbq17/+tZ566in5/X6VlJToueeek/SfqyUej0evvvqqnnnmGYVCIY0aNUq7du3SokWLJEnnz59XIBDQ/v37NWvWrB/0mOFwWG63W6FQSC6X61aW3+fufn5fvJcwIJx95SfxXgIA4BbF8vf7pt+D0t3draqqKl26dElTpkxRU1OTgsGgCgoK7DlOp1NTp05VfX29JKmhoUGXL1+OmuP3+5WVlWXPuZZIJKJwOBy1AQCAgSvmQDl16pTuvPNOOZ1OPfvss6qurtZ9992nYDAoSfJ4PFHzPR6PPRYMBpWUlKQRI0Zcd861VFZWyu1221sgEIh12QAAoB+JOVDuvfdenTx5UseOHdPy5cu1ZMkSffzxx/a4w+GImm9ZVo99V/u+OWVlZQqFQvbW3Nwc67IBAEA/EnOgJCUlady4cZo4caIqKys1YcIEvf766/J6vZLU40pIa2urfVXF6/Wqq6tLbW1t151zLU6n0/7k0H83AAAwcN3y96BYlqVIJKKMjAx5vV7V1NTYY11dXaqtrVVubq4kKScnR0OGDIma09LSosbGRnsOAABAYiyT161bp8LCQgUCAbW3t6uqqkpHjx7VgQMH5HA4VFJSooqKCmVmZiozM1MVFRUaPny4Fi9eLElyu91atmyZVq9erZEjRyo1NVVr1qxRdna28vPz++QEAQBA/xNToHz99dd68skn1dLSIrfbrfHjx+vAgQOaOXOmJGnt2rXq7OzUihUr1NbWpkmTJungwYNKSUmxj7Fp0yYlJiZq4cKF6uzs1IwZM7Rjxw4lJCT07pkBAIB+65a/ByUe+B6UwYfvQQGA/u+2fA8KAABAXyFQAACAcQgUAABgHAIFAAAYh0ABAADGIVAAAIBxCBQAAGAcAgUAABiHQAEAAMYhUAAAgHEIFAAAYBwCBQAAGIdAAQAAxiFQAACAcQgUAABgHAIFAAAYh0ABAADGIVAAAIBxCBQAAGAcAgUAABiHQAEAAMYhUAAAgHEIFAAAYBwCBQAAGIdAAQAAxiFQAACAcQgUAABgHAIFAAAYh0ABAADGIVAAAIBxCBQAAGAcAgUAABiHQAEAAMYhUAAAgHEIFAAAYBwCBQAAGIdAAQAAxiFQAACAcWIKlMrKSj344INKSUnR6NGj9dhjj+mzzz6LmrN06VI5HI6obfLkyVFzIpGIiouLlZaWpuTkZBUVFencuXO3fjYAAGBAiClQamtrtXLlSh07dkw1NTX67rvvVFBQoEuXLkXNe/TRR9XS0mJv+/fvjxovKSlRdXW1qqqqVFdXp46ODs2ePVvd3d23fkYAAKDfS4xl8oEDB6Jub9++XaNHj1ZDQ4MeeeQRe7/T6ZTX673mMUKhkLZt26Zdu3YpPz9fkrR7924FAgEdOnRIs2bNivUcAADAAHNL70EJhUKSpNTU1Kj9R48e1ejRo3XPPffo6aefVmtrqz3W0NCgy5cvq6CgwN7n9/uVlZWl+vr6W1kOAAAYIGK6gvK/LMtSaWmpHnroIWVlZdn7CwsL9fjjjys9PV1NTU164YUXNH36dDU0NMjpdCoYDCopKUkjRoyIOp7H41EwGLzmY0UiEUUiEft2OBy+2WUDAIB+4KYDZdWqVfroo49UV1cXtX/RokX2P2dlZWnixIlKT0/Xvn37NH/+/Osez7IsORyOa45VVlbqxRdfvN
mlAgCAfuamXuIpLi7We++9pyNHjmjMmDE3nOvz+ZSenq4zZ85Ikrxer7q6utTW1hY1r7W1VR6P55rHKCsrUygUsrf
|
||
|
"text/plain": [
|
||
|
"<Figure size 640x480 with 1 Axes>"
|
||
|
]
|
||
|
},
|
||
|
"metadata": {},
|
||
|
"output_type": "display_data"
|
||
|
}
|
||
|
],
|
||
|
"source": [
|
||
|
"data['Pclass'].value_counts().plot.bar()"
|
||
|
]
|
||
|
},
|
||
|
{
|
||
|
"cell_type": "code",
|
||
|
"execution_count": 12,
|
||
|
"id": "f77de794-b854-4697-811a-c404b14eb680",
|
||
|
"metadata": {
|
||
|
"tags": []
|
||
|
},
|
||
|
"outputs": [
|
||
|
{
|
||
|
"data": {
|
||
|
"text/plain": [
|
||
|
"<Axes: >"
|
||
|
]
|
||
|
},
|
||
|
"execution_count": 12,
|
||
|
"metadata": {},
|
||
|
"output_type": "execute_result"
|
||
|
},
|
||
|
{
|
||
|
"data": {
|
||
|
"image/png": "iVBORw0KGgoAAAANSUhEUgAAAigAAAGdCAYAAAA44ojeAAAAOXRFWHRTb2Z0d2FyZQBNYXRwbG90bGliIHZlcnNpb24zLjcuMSwgaHR0cHM6Ly9tYXRwbG90bGliLm9yZy/bCgiHAAAACXBIWXMAAA9hAAAPYQGoP6dpAAApbElEQVR4nO3de3SU5YHH8d8kmQwEEzTEMMkaQlBcWkMpkCq3llBNMCIepOuNbQ3rtVvKwgYqIMthqHI59KzFhS1rXRa1ISdsj8DaYgtBuZSlbiXKFrCLoYaLEswBJSEEhzF59g8PU8cESMI7zjMv3885c8K87zNPnl/mTfidd24eY4wRAACARRJivQAAAIAvoqAAAADrUFAAAIB1KCgAAMA6FBQAAGAdCgoAALAOBQUAAFiHggIAAKyTFOsFdEVra6uOHTum1NRUeTyeWC8HAAB0gDFGp0+fVnZ2thISLn6OJC4LyrFjx5STkxPrZQAAgC44evSorrvuuouOicuCkpqaKumzgGlpaY7MGQqFtHnzZhUXF8vr9Toyp03cnk9yf0a355PI6AZuzyeR8XI0NjYqJycn/P/4xcRlQTn/sE5aWpqjBSUlJUVpaWmuPODcnk9yf0a355PI6AZuzyeR0QkdeXoGT5IFAADWoaAAAADrUFAAAIB1KCgAAMA6FBQAAGAdCgoAALAOBQUAAFiHggIAAKxDQQEAANahoAAAAOtQUAAAgHUoKAAAwDoUFAAAYB0KCgAAsE5SZ2+wY8cO/eQnP1F1dbXq6uq0fv16TZgwIbz/Qh+hvHTpUv3oRz+SJBUWFmr79u0R+++77z5VVlZ2djmIY31nb3R0Pl+i0dKbpfzAJgVbLv1R3l1xaMm4qMwLAIjU6TMoZ86c0aBBg7RixYp299fV1UVc/uM//kMej0ff+c53IsY9+uijEeOee+65riUAAACu0+kzKCUlJSopKbngfr/fH3H9v/7rvzRmzBj169cvYntKSkqbsQAAAFIXCkpnfPjhh9q4caNefPHFNvvWrFmj8vJy9e7dWyUlJZo/f75SU1PbnScYDCoYDIavNzY2SpJCoZBCoZAjaz0/j1Pz2cbGfL5E4+x8CSbiazTE8udn433oNDLGP7fnk8joxLwd4THGdPmvucfjafMclM9bunSplixZomPHjqlbt27h7c8//7zy8vLk9/u1b98+zZkzRzfccIOqqqranScQCGjBggVttldUVCglJaWrywcAAF+i5uZmTZo0SQ0NDUpLS7vo2KgWlAEDBqioqEjLly+/6DzV1dUqKChQdXW1hgwZ0mZ/e2dQcnJydOLEiUsG7KhQKKSqqioVFRXJ6/U6MqdNbMyXH9jk6Hy+BKOnClo1b3eCgq3ReZLsvsDYqMzbETbeh04jY/xzez6JjJejsbFRGRkZHSooUXuI53e/+50OHDigtWvXXnLskCFD5PV6VVNT025B8fl88vl8bbZ7vV7HD45ozGkTm/JF65U2wVZP1Oa24Wdn030YLWSMf27PJ5Gxq/N1VNTeB2XVqlUaOnSoBg0adMmx+/fvVygUUlZWVrSWAwAA4kinz6A0NTXp4MGD4eu1tbXas2eP0tPT1adPH0mfncL55S9/qX/+539uc/s///nPWrNmje644w5lZGTonXfe0YwZMzR48GCNHDnyMqIAAAC36HRB2b17t8aMGRO+XlZWJkkqLS3VCy+8IEmqrKyUMUYPPPBAm9snJyfrtdde07PPPqumpibl5ORo3Lhxmj9/vhITE7sYAwAAuEmnC0phYaEu9bzaxx57TI899li7+3Jyctq8iywAAMDn8Vk8AADAOhQUAABgHQoKAACwDgUFAABYh4ICAACsE9UPCwTcpu/sjTH73r5Eo6U3f/YRAZ15p9xDS8ZFcVUAEB2cQQEAANahoAAAAOtQUAAAgHUoKAAAwDoUFAAAYB0KCgAAsA4FBQAAWIeCAgAArENBAQAA1qGgAAAA61BQAA
CAdSgoAADAOhQUAABgHQoKAACwDgUFAABYh4ICAACsQ0EBAADWoaAAAADrUFAAAIB1KCgAAMA6FBQAAGAdCgoAALAOBQUAAFiHggIAAKxDQQEAANahoAAAAOtQUAAAgHUoKAAAwDoUFAAAYB0KCgAAsA4FBQAAWIeCAgAArENBAQAA1ul0QdmxY4fGjx+v7OxseTwebdiwIWL/5MmT5fF4Ii7Dhg2LGBMMBjV16lRlZGSoR48euuuuu/T+++9fVhAAAOAenS4oZ86c0aBBg7RixYoLjrn99ttVV1cXvrz66qsR+6dPn67169ersrJSO3fuVFNTk+688061tLR0PgEAAHCdpM7eoKSkRCUlJRcd4/P55Pf7293X0NCgVatW6Re/+IVuu+02SVJ5eblycnK0ZcsWjR07trNLAgAALtPpgtIR27ZtU2Zmpq6++mqNHj1aCxcuVGZmpiSpurpaoVBIxcXF4fHZ2dnKz8/Xrl272i0owWBQwWAwfL2xsVGSFAqFFAqFHFnz+Xmcms82NubzJRpn50swEV/dpqv5bLrPL8XG49Rpbs/o9nwSGZ2YtyM8xpgu/zX3eDxav369JkyYEN62du1aXXXVVcrNzVVtba3mzZunTz/9VNXV1fL5fKqoqNDf/d3fRRQOSSouLlZeXp6ee+65Nt8nEAhowYIFbbZXVFQoJSWlq8sHAABfoubmZk2aNEkNDQ1KS0u76FjHz6Dcd9994X/n5+eroKBAubm52rhxoyZOnHjB2xlj5PF42t03Z84clZWVha83NjYqJydHxcXFlwzYUaFQSFVVVSoqKpLX63VkTpvYmC8/sMnR+XwJRk8VtGre7gQFW9s/luJZV/PtC8TPw6Y2HqdOc3tGt+eTyHg5zj8C0hFReYjn87KyspSbm6uamhpJkt/v17lz5/Txxx/rmmuuCY+rr6/XiBEj2p3D5/PJ5/O12e71eh0/OKIxp01syhdsiU6JCLZ6oja3DTqbz5b7uzNsOk6jxe0Z3Z5PImNX5+uoqL8PysmTJ3X06FFlZWVJkoYOHSqv16uqqqrwmLq6Ou3bt++CBQUAAFxZOn0GpampSQcPHgxfr62t1Z49e5Senq709HQFAgF95zvfUVZWlg4dOqQnn3xSGRkZuvvuuyVJPXv21MMPP6wZM2aoV69eSk9P18yZMzVw4MDwq3oAAMCVrdMFZffu3RozZkz4+vnnhpSWlmrlypXau3evXnrpJZ06dUpZWVkaM2aM1q5dq9TU1PBtfvrTnyopKUn33nuvzp49q1tvvVUvvPCCEhMTHYgEAADiXacLSmFhoS72wp9Nmy79xMdu3bpp+fLlWr58eWe/PQAAuALwWTwAAMA6FBQAAGAdCgoAALAOBQUAAFiHggIAAKxDQQEAANahoAAAAOtQUAAAgHUoKAAAwDoUFAAAYB0KCgAAsA4FBQAAWIeCAgAArENBAQAA1qGgAAAA61BQAACAdSgoAADAOhQUAABgHQoKAACwDgUFAABYh4ICAACsQ0EBAADWoaAAAADrUFAAAIB1KCgAAMA6FBQAAGAdCgoAALAOBQUAAFiHggIAAKxDQQEAANahoAAAAOtQUAAAgHUoKAAAwDoUFAAAYB0KCgAAsA4FBQAAWIeCAgAArENBAQAA1qGgAAAA63S6oOzYsUPjx49Xdna2PB6PNmzYEN4XCoU0a9YsDRw4UD169FB2drYefPBBHTt2LGKOwsJCeTyeiMv9999/2WEAAIA7dLqgnDlzRoMGDdKKFSva7GtubtZbb72lefPm6a233tK6dev07rvv6q677moz9tFHH1VdXV348txzz3UtAQAAcJ2kzt6gpKREJSUl7e7r2bOnqqqqIrYtX75cN998s44cOaI+ffqEt6ekpMjv93f22wMAgCtApwtKZzU0NMjj8ejqq6+O2L5mzRqVl5erd+/eKikp0fz585WamtruHMFgUMFgMHy9sbFR0mcPKYVCIUfWeX4ep+azjY35fI
nG2fkSTMRXt+lqPpvu80ux8Th1mtszuj2fREYn5u0IjzGmy3/NPR6P1q9frwkTJrS7/5NPPtGoUaM0YMAAlZeXh7c
|
||
|
"text/plain": [
|
||
|
"<Figure size 640x480 with 1 Axes>"
|
||
|
]
|
||
|
},
|
||
|
"metadata": {},
|
||
|
"output_type": "display_data"
|
||
|
}
|
||
|
],
|
||
|
"source": [
|
||
|
"data['Age'].hist()"
|
||
|
]
|
||
|
},
|
||
|
{
|
||
|
"cell_type": "code",
|
||
|
"execution_count": 13,
|
||
|
"id": "124a3f8b-2884-40b9-ab56-3a3366c499ee",
|
||
|
"metadata": {
|
||
|
"tags": []
|
||
|
},
|
||
|
"outputs": [
|
||
|
{
|
||
|
"data": {
|
||
|
"text/html": [
|
||
|
"<div>\n",
|
||
|
"<style scoped>\n",
|
||
|
" .dataframe tbody tr th:only-of-type {\n",
|
||
|
" vertical-align: middle;\n",
|
||
|
" }\n",
|
||
|
"\n",
|
||
|
" .dataframe tbody tr th {\n",
|
||
|
" vertical-align: top;\n",
|
||
|
" }\n",
|
||
|
"\n",
|
||
|
" .dataframe thead th {\n",
|
||
|
" text-align: right;\n",
|
||
|
" }\n",
|
||
|
"</style>\n",
|
||
|
"<table border=\"1\" class=\"dataframe\">\n",
|
||
|
" <thead>\n",
|
||
|
" <tr style=\"text-align: right;\">\n",
|
||
|
" <th></th>\n",
|
||
|
" <th>Survived</th>\n",
|
||
|
" <th>Pclass</th>\n",
|
||
|
" <th>Age</th>\n",
|
||
|
" </tr>\n",
|
||
|
" <tr>\n",
|
||
|
" <th>Sex</th>\n",
|
||
|
" <th></th>\n",
|
||
|
" <th></th>\n",
|
||
|
" <th></th>\n",
|
||
|
" </tr>\n",
|
||
|
" </thead>\n",
|
||
|
" <tbody>\n",
|
||
|
" <tr>\n",
|
||
|
" <th>female</th>\n",
|
||
|
" <td>0.754789</td>\n",
|
||
|
" <td>2.065134</td>\n",
|
||
|
" <td>27.915709</td>\n",
|
||
|
" </tr>\n",
|
||
|
" <tr>\n",
|
||
|
" <th>male</th>\n",
|
||
|
" <td>0.205298</td>\n",
|
||
|
" <td>2.335541</td>\n",
|
||
|
" <td>30.726645</td>\n",
|
||
|
" </tr>\n",
|
||
|
" </tbody>\n",
|
||
|
"</table>\n",
|
||
|
"</div>"
|
||
|
],
|
||
|
"text/plain": [
|
||
|
" Survived Pclass Age\n",
|
||
|
"Sex \n",
|
||
|
"female 0.754789 2.065134 27.915709\n",
|
||
|
"male 0.205298 2.335541 30.726645"
|
||
|
]
|
||
|
},
|
||
|
"execution_count": 13,
|
||
|
"metadata": {},
|
||
|
"output_type": "execute_result"
|
||
|
}
|
||
|
],
|
||
|
"source": [
|
||
|
"data.groupby(['Sex']).mean()"
|
||
|
]
|
||
|
},
|
||
|
{
|
||
|
"cell_type": "code",
|
||
|
"execution_count": 14,
|
||
|
"id": "895a8e68-0e8d-4580-bfd0-be8f287d6342",
|
||
|
"metadata": {
|
||
|
"tags": []
|
||
|
},
|
||
|
"outputs": [
|
||
|
{
|
||
|
"data": {
|
||
|
"text/html": [
|
||
|
"<div>\n",
|
||
|
"<style scoped>\n",
|
||
|
" .dataframe tbody tr th:only-of-type {\n",
|
||
|
" vertical-align: middle;\n",
|
||
|
" }\n",
|
||
|
"\n",
|
||
|
" .dataframe tbody tr th {\n",
|
||
|
" vertical-align: top;\n",
|
||
|
" }\n",
|
||
|
"\n",
|
||
|
" .dataframe thead th {\n",
|
||
|
" text-align: right;\n",
|
||
|
" }\n",
|
||
|
"</style>\n",
|
||
|
"<table border=\"1\" class=\"dataframe\">\n",
|
||
|
" <thead>\n",
|
||
|
" <tr style=\"text-align: right;\">\n",
|
||
|
" <th></th>\n",
|
||
|
" <th></th>\n",
|
||
|
" <th>Survived</th>\n",
|
||
|
" <th>Age</th>\n",
|
||
|
" </tr>\n",
|
||
|
" <tr>\n",
|
||
|
" <th>Sex</th>\n",
|
||
|
" <th>Pclass</th>\n",
|
||
|
" <th></th>\n",
|
||
|
" <th></th>\n",
|
||
|
" </tr>\n",
|
||
|
" </thead>\n",
|
||
|
" <tbody>\n",
|
||
|
" <tr>\n",
|
||
|
" <th rowspan=\"3\" valign=\"top\">female</th>\n",
|
||
|
" <th>1</th>\n",
|
||
|
" <td>0.964706</td>\n",
|
||
|
" <td>34.611765</td>\n",
|
||
|
" </tr>\n",
|
||
|
" <tr>\n",
|
||
|
" <th>2</th>\n",
|
||
|
" <td>0.918919</td>\n",
|
||
|
" <td>28.722973</td>\n",
|
||
|
" </tr>\n",
|
||
|
" <tr>\n",
|
||
|
" <th>3</th>\n",
|
||
|
" <td>0.460784</td>\n",
|
||
|
" <td>21.750000</td>\n",
|
||
|
" </tr>\n",
|
||
|
" <tr>\n",
|
||
|
" <th rowspan=\"3\" valign=\"top\">male</th>\n",
|
||
|
" <th>1</th>\n",
|
||
|
" <td>0.396040</td>\n",
|
||
|
" <td>41.281386</td>\n",
|
||
|
" </tr>\n",
|
||
|
" <tr>\n",
|
||
|
" <th>2</th>\n",
|
||
|
" <td>0.151515</td>\n",
|
||
|
" <td>30.740707</td>\n",
|
||
|
" </tr>\n",
|
||
|
" <tr>\n",
|
||
|
" <th>3</th>\n",
|
||
|
" <td>0.150198</td>\n",
|
||
|
" <td>26.507589</td>\n",
|
||
|
" </tr>\n",
|
||
|
" </tbody>\n",
|
||
|
"</table>\n",
|
||
|
"</div>"
|
||
|
],
|
||
|
"text/plain": [
|
||
|
" Survived Age\n",
|
||
|
"Sex Pclass \n",
|
||
|
"female 1 0.964706 34.611765\n",
|
||
|
" 2 0.918919 28.722973\n",
|
||
|
" 3 0.460784 21.750000\n",
|
||
|
"male 1 0.396040 41.281386\n",
|
||
|
" 2 0.151515 30.740707\n",
|
||
|
" 3 0.150198 26.507589"
|
||
|
]
|
||
|
},
|
||
|
"execution_count": 14,
|
||
|
"metadata": {},
|
||
|
"output_type": "execute_result"
|
||
|
}
|
||
|
],
|
||
|
"source": [
|
||
|
"data.groupby(['Sex', 'Pclass']).mean()"
|
||
|
]
|
||
|
},
|
||
|
{
|
||
|
"cell_type": "code",
|
||
|
"execution_count": 15,
|
||
|
"id": "af916e1f-1acc-419d-bb9c-aae85976e218",
|
||
|
"metadata": {
|
||
|
"tags": []
|
||
|
},
|
||
|
"outputs": [
|
||
|
{
|
||
|
"data": {
|
||
|
"text/html": [
|
||
|
"<div>\n",
|
||
|
"<style scoped>\n",
|
||
|
" .dataframe tbody tr th:only-of-type {\n",
|
||
|
" vertical-align: middle;\n",
|
||
|
" }\n",
|
||
|
"\n",
|
||
|
" .dataframe tbody tr th {\n",
|
||
|
" vertical-align: top;\n",
|
||
|
" }\n",
|
||
|
"\n",
|
||
|
" .dataframe thead th {\n",
|
||
|
" text-align: right;\n",
|
||
|
" }\n",
|
||
|
"</style>\n",
|
||
|
"<table border=\"1\" class=\"dataframe\">\n",
|
||
|
" <thead>\n",
|
||
|
" <tr style=\"text-align: right;\">\n",
|
||
|
" <th></th>\n",
|
||
|
" <th></th>\n",
|
||
|
" <th>Survived</th>\n",
|
||
|
" <th>Age</th>\n",
|
||
|
" </tr>\n",
|
||
|
" <tr>\n",
|
||
|
" <th>Sex</th>\n",
|
||
|
" <th>Pclass</th>\n",
|
||
|
" <th></th>\n",
|
||
|
" <th></th>\n",
|
||
|
" </tr>\n",
|
||
|
" </thead>\n",
|
||
|
" <tbody>\n",
|
||
|
" <tr>\n",
|
||
|
" <th rowspan=\"3\" valign=\"top\">female</th>\n",
|
||
|
" <th>1</th>\n",
|
||
|
" <td>0.034454</td>\n",
|
||
|
" <td>185.287955</td>\n",
|
||
|
" </tr>\n",
|
||
|
" <tr>\n",
|
||
|
" <th>2</th>\n",
|
||
|
" <td>0.075528</td>\n",
|
||
|
" <td>165.706451</td>\n",
|
||
|
" </tr>\n",
|
||
|
" <tr>\n",
|
||
|
" <th>3</th>\n",
|
||
|
" <td>0.250922</td>\n",
|
||
|
" <td>162.051980</td>\n",
|
||
|
" </tr>\n",
|
||
|
" <tr>\n",
|
||
|
" <th rowspan=\"3\" valign=\"top\">male</th>\n",
|
||
|
" <th>1</th>\n",
|
||
|
" <td>0.241584</td>\n",
|
||
|
" <td>229.206594</td>\n",
|
||
|
" </tr>\n",
|
||
|
" <tr>\n",
|
||
|
" <th>2</th>\n",
|
||
|
" <td>0.129870</td>\n",
|
||
|
" <td>218.859292</td>\n",
|
||
|
" </tr>\n",
|
||
|
" <tr>\n",
|
||
|
" <th>3</th>\n",
|
||
|
" <td>0.128145</td>\n",
|
||
|
" <td>147.853777</td>\n",
|
||
|
" </tr>\n",
|
||
|
" </tbody>\n",
|
||
|
"</table>\n",
|
||
|
"</div>"
|
||
|
],
|
||
|
"text/plain": [
|
||
|
" Survived Age\n",
|
||
|
"Sex Pclass \n",
|
||
|
"female 1 0.034454 185.287955\n",
|
||
|
" 2 0.075528 165.706451\n",
|
||
|
" 3 0.250922 162.051980\n",
|
||
|
"male 1 0.241584 229.206594\n",
|
||
|
" 2 0.129870 218.859292\n",
|
||
|
" 3 0.128145 147.853777"
|
||
|
]
|
||
|
},
|
||
|
"execution_count": 15,
|
||
|
"metadata": {},
|
||
|
"output_type": "execute_result"
|
||
|
}
|
||
|
],
|
||
|
"source": [
|
||
|
"data.groupby(['Sex', 'Pclass']).var()"
|
||
|
]
|
||
|
},
|
||
|
{
|
||
|
"cell_type": "code",
|
||
|
"execution_count": 16,
|
||
|
"id": "42a4b1ae-7a0f-4f43-9ebb-df2f6929e241",
|
||
|
"metadata": {
|
||
|
"tags": []
|
||
|
},
|
||
|
"outputs": [
|
||
|
{
|
||
|
"name": "stdout",
|
||
|
"output_type": "stream",
|
||
|
"text": [
|
||
|
"/home/onyxia\n"
|
||
|
]
|
||
|
}
|
||
|
],
|
||
|
"source": [
|
||
|
"cd"
|
||
|
]
|
||
|
}
|
||
|
],
|
||
|
"metadata": {
|
||
|
"kernelspec": {
|
||
|
"display_name": "Python 3 (ipykernel)",
|
||
|
"language": "python",
|
||
|
"name": "python3"
|
||
|
},
|
||
|
"language_info": {
|
||
|
"codemirror_mode": {
|
||
|
"name": "ipython",
|
||
|
"version": 3
|
||
|
},
|
||
|
"file_extension": ".py",
|
||
|
"mimetype": "text/x-python",
|
||
|
"name": "python",
|
||
|
"nbconvert_exporter": "python",
|
||
|
"pygments_lexer": "ipython3",
|
||
|
"version": "3.10.9"
|
||
|
}
|
||
|
},
|
||
|
"nbformat": 4,
|
||
|
"nbformat_minor": 5
|
||
|
}
|