anova
This commit is contained in:
parent
29ac99df14
commit
eaf1884bb6
|
@ -4168,355 +4168,7 @@
|
|||
},
|
||||
{
|
||||
"cell_type": "code",
|
||||
"execution_count": 13,
|
||||
"id": "58cbe8a5-3899-4aa3-91ab-48bed9124fbd",
|
||||
"metadata": {},
|
||||
"outputs": [],
|
||||
"source": [
|
||||
"#creation des base servant au test d'anova\n",
|
||||
"\n",
|
||||
"time_between_purchase_10 = products_purchased_reduced_spectacle.loc[products_purchased_reduced_spectacle['number_compagny'] == 10]\n"
|
||||
]
|
||||
},
|
||||
{
|
||||
"cell_type": "code",
|
||||
"execution_count": 25,
|
||||
"id": "f563009c-e9a8-4e09-a345-87c49cbd4485",
|
||||
"metadata": {},
|
||||
"outputs": [
|
||||
{
|
||||
"name": "stdout",
|
||||
"output_type": "stream",
|
||||
"text": [
|
||||
"0 581.065880\n",
|
||||
"1 0.000023\n",
|
||||
"2 1032.951030\n",
|
||||
"3 2502.966319\n",
|
||||
"4 1728.097037\n",
|
||||
" ... \n",
|
||||
"35217 0.000000\n",
|
||||
"35218 0.000000\n",
|
||||
"35219 0.000000\n",
|
||||
"35220 0.000000\n",
|
||||
"35221 0.000000\n",
|
||||
"Name: time_between_purchase, Length: 35222, dtype: float64\n",
|
||||
"0 753.75116\n",
|
||||
"1 0.00000\n",
|
||||
"2 0.00000\n",
|
||||
"3 0.00000\n",
|
||||
"4 0.00000\n",
|
||||
" ... \n",
|
||||
"213494 0.00000\n",
|
||||
"213495 0.00000\n",
|
||||
"213496 0.00000\n",
|
||||
"213497 0.00000\n",
|
||||
"213498 0.00000\n",
|
||||
"Name: time_between_purchase, Length: 213499, dtype: float64\n"
|
||||
]
|
||||
}
|
||||
],
|
||||
"source": [
|
||||
"import pandas as pd\n",
|
||||
"\n",
|
||||
"# Supposons que vous avez un DataFrame appelé products_purchased_reduced_spectacle\n",
|
||||
"# qui contient les données de vos produits achetés avec la colonne 'number_compagny'\n",
|
||||
"\n",
|
||||
"# Créez une liste des identifiants d'entreprise pour lesquels vous voulez effectuer la sélection\n",
|
||||
"entreprises = [11, 12, 13, 14]\n",
|
||||
"\n",
|
||||
"# Parcourez chaque entreprise et effectuez la sélection\n",
|
||||
"for entreprise in entreprises:\n",
|
||||
" nom_variable = f\"time_between_purchase_{entreprise}\"\n",
|
||||
" globals()[nom_variable] = products_purchased_reduced_spectacle.loc[products_purchased_reduced_spectacle['number_compagny'] == entreprise,\"time_between_purchase\"]\n",
|
||||
"\n",
|
||||
"# Maintenant, les résultats pour chaque entreprise sont stockés dans des variables distinctes\n",
|
||||
"# Vous pouvez y accéder directement\n",
|
||||
"print(time_between_purchase_11)\n",
|
||||
"print(time_between_purchase_12)\n",
|
||||
"# et ainsi de suite pour les autres entreprises\n"
|
||||
]
|
||||
},
|
||||
{
|
||||
"cell_type": "code",
|
||||
"execution_count": 76,
|
||||
"id": "58f49748-e55f-4d1b-b58b-102d02a9e0eb",
|
||||
"metadata": {},
|
||||
"outputs": [
|
||||
{
|
||||
"name": "stdout",
|
||||
"output_type": "stream",
|
||||
"text": [
|
||||
" sum_sq df F PR(>F)\n",
|
||||
"number_compagny 4.108441e+09 1.0 23548.336165 0.0\n",
|
||||
"Residual 1.334471e+11 764878.0 NaN NaN la p-value associé à la stat de fisher est inferieure à 5% donc il y a un lien entre les entreprise et le temps écoulés entre le premier et le dernier achat\n"
|
||||
]
|
||||
}
|
||||
],
|
||||
"source": [
|
||||
"#test anova entre les entreprise de spectacle et time_between_purchase\n",
|
||||
"import statsmodels.api as sm\n",
|
||||
"from statsmodels.formula.api import ols\n",
|
||||
"model = ols('time_between_purchase ~ number_compagny', data=products_purchased_reduced_spectacle).fit()\n",
|
||||
"anova_table = sm.stats.anova_lm(model, typ=2)\n",
|
||||
"anova_table\n",
|
||||
"print(anova_table,\"la p-value associé à la stat de fisher est inferieure à 5% donc il y a un lien entre les entreprise et le temps écoulés entre le premier et le dernier achat\" )\n"
|
||||
]
|
||||
},
|
||||
{
|
||||
"cell_type": "code",
|
||||
"execution_count": 23,
|
||||
"id": "aa000e3e-a44d-4cb4-b44b-9794f4b711ca",
|
||||
"metadata": {},
|
||||
"outputs": [
|
||||
{
|
||||
"data": {
|
||||
"text/html": [
|
||||
"<div>\n",
|
||||
"<style scoped>\n",
|
||||
" .dataframe tbody tr th:only-of-type {\n",
|
||||
" vertical-align: middle;\n",
|
||||
" }\n",
|
||||
"\n",
|
||||
" .dataframe tbody tr th {\n",
|
||||
" vertical-align: top;\n",
|
||||
" }\n",
|
||||
"\n",
|
||||
" .dataframe thead th {\n",
|
||||
" text-align: right;\n",
|
||||
" }\n",
|
||||
"</style>\n",
|
||||
"<table border=\"1\" class=\"dataframe\">\n",
|
||||
" <thead>\n",
|
||||
" <tr style=\"text-align: right;\">\n",
|
||||
" <th></th>\n",
|
||||
" <th>customer_id</th>\n",
|
||||
" <th>nb_tickets</th>\n",
|
||||
" <th>nb_purchases</th>\n",
|
||||
" <th>total_amount</th>\n",
|
||||
" <th>nb_suppliers</th>\n",
|
||||
" <th>vente_internet_max</th>\n",
|
||||
" <th>purchase_date_min</th>\n",
|
||||
" <th>purchase_date_max</th>\n",
|
||||
" <th>time_between_purchase</th>\n",
|
||||
" <th>nb_tickets_internet</th>\n",
|
||||
" <th>number_compagny</th>\n",
|
||||
" </tr>\n",
|
||||
" </thead>\n",
|
||||
" <tbody>\n",
|
||||
" <tr>\n",
|
||||
" <th>0</th>\n",
|
||||
" <td>1</td>\n",
|
||||
" <td>12</td>\n",
|
||||
" <td>11</td>\n",
|
||||
" <td>271.60</td>\n",
|
||||
" <td>2</td>\n",
|
||||
" <td>0</td>\n",
|
||||
" <td>1778.407639</td>\n",
|
||||
" <td>1197.341759</td>\n",
|
||||
" <td>581.065880</td>\n",
|
||||
" <td>0.0</td>\n",
|
||||
" <td>11</td>\n",
|
||||
" </tr>\n",
|
||||
" <tr>\n",
|
||||
" <th>1</th>\n",
|
||||
" <td>2</td>\n",
|
||||
" <td>2</td>\n",
|
||||
" <td>2</td>\n",
|
||||
" <td>46.00</td>\n",
|
||||
" <td>1</td>\n",
|
||||
" <td>0</td>\n",
|
||||
" <td>1407.365937</td>\n",
|
||||
" <td>1407.365914</td>\n",
|
||||
" <td>0.000023</td>\n",
|
||||
" <td>0.0</td>\n",
|
||||
" <td>11</td>\n",
|
||||
" </tr>\n",
|
||||
" <tr>\n",
|
||||
" <th>2</th>\n",
|
||||
" <td>3</td>\n",
|
||||
" <td>9</td>\n",
|
||||
" <td>8</td>\n",
|
||||
" <td>261.25</td>\n",
|
||||
" <td>2</td>\n",
|
||||
" <td>0</td>\n",
|
||||
" <td>1461.382106</td>\n",
|
||||
" <td>428.431076</td>\n",
|
||||
" <td>1032.951030</td>\n",
|
||||
" <td>0.0</td>\n",
|
||||
" <td>11</td>\n",
|
||||
" </tr>\n",
|
||||
" <tr>\n",
|
||||
" <th>3</th>\n",
|
||||
" <td>4</td>\n",
|
||||
" <td>50</td>\n",
|
||||
" <td>48</td>\n",
|
||||
" <td>646.00</td>\n",
|
||||
" <td>1</td>\n",
|
||||
" <td>0</td>\n",
|
||||
" <td>2846.403148</td>\n",
|
||||
" <td>343.436829</td>\n",
|
||||
" <td>2502.966319</td>\n",
|
||||
" <td>0.0</td>\n",
|
||||
" <td>11</td>\n",
|
||||
" </tr>\n",
|
||||
" <tr>\n",
|
||||
" <th>4</th>\n",
|
||||
" <td>5</td>\n",
|
||||
" <td>5956</td>\n",
|
||||
" <td>5758</td>\n",
|
||||
" <td>8442.20</td>\n",
|
||||
" <td>2</td>\n",
|
||||
" <td>0</td>\n",
|
||||
" <td>1732.338241</td>\n",
|
||||
" <td>4.241204</td>\n",
|
||||
" <td>1728.097037</td>\n",
|
||||
" <td>0.0</td>\n",
|
||||
" <td>11</td>\n",
|
||||
" </tr>\n",
|
||||
" <tr>\n",
|
||||
" <th>...</th>\n",
|
||||
" <td>...</td>\n",
|
||||
" <td>...</td>\n",
|
||||
" <td>...</td>\n",
|
||||
" <td>...</td>\n",
|
||||
" <td>...</td>\n",
|
||||
" <td>...</td>\n",
|
||||
" <td>...</td>\n",
|
||||
" <td>...</td>\n",
|
||||
" <td>...</td>\n",
|
||||
" <td>...</td>\n",
|
||||
" <td>...</td>\n",
|
||||
" </tr>\n",
|
||||
" <tr>\n",
|
||||
" <th>35217</th>\n",
|
||||
" <td>520144</td>\n",
|
||||
" <td>2</td>\n",
|
||||
" <td>1</td>\n",
|
||||
" <td>20.00</td>\n",
|
||||
" <td>1</td>\n",
|
||||
" <td>0</td>\n",
|
||||
" <td>0.227512</td>\n",
|
||||
" <td>0.227512</td>\n",
|
||||
" <td>0.000000</td>\n",
|
||||
" <td>0.0</td>\n",
|
||||
" <td>11</td>\n",
|
||||
" </tr>\n",
|
||||
" <tr>\n",
|
||||
" <th>35218</th>\n",
|
||||
" <td>520148</td>\n",
|
||||
" <td>2</td>\n",
|
||||
" <td>1</td>\n",
|
||||
" <td>92.00</td>\n",
|
||||
" <td>1</td>\n",
|
||||
" <td>0</td>\n",
|
||||
" <td>0.111319</td>\n",
|
||||
" <td>0.111319</td>\n",
|
||||
" <td>0.000000</td>\n",
|
||||
" <td>0.0</td>\n",
|
||||
" <td>11</td>\n",
|
||||
" </tr>\n",
|
||||
" <tr>\n",
|
||||
" <th>35219</th>\n",
|
||||
" <td>520150</td>\n",
|
||||
" <td>3</td>\n",
|
||||
" <td>1</td>\n",
|
||||
" <td>20.00</td>\n",
|
||||
" <td>1</td>\n",
|
||||
" <td>0</td>\n",
|
||||
" <td>0.088669</td>\n",
|
||||
" <td>0.088669</td>\n",
|
||||
" <td>0.000000</td>\n",
|
||||
" <td>0.0</td>\n",
|
||||
" <td>11</td>\n",
|
||||
" </tr>\n",
|
||||
" <tr>\n",
|
||||
" <th>35220</th>\n",
|
||||
" <td>520151</td>\n",
|
||||
" <td>2</td>\n",
|
||||
" <td>1</td>\n",
|
||||
" <td>126.00</td>\n",
|
||||
" <td>1</td>\n",
|
||||
" <td>0</td>\n",
|
||||
" <td>0.044988</td>\n",
|
||||
" <td>0.044988</td>\n",
|
||||
" <td>0.000000</td>\n",
|
||||
" <td>0.0</td>\n",
|
||||
" <td>11</td>\n",
|
||||
" </tr>\n",
|
||||
" <tr>\n",
|
||||
" <th>35221</th>\n",
|
||||
" <td>520152</td>\n",
|
||||
" <td>2</td>\n",
|
||||
" <td>1</td>\n",
|
||||
" <td>126.00</td>\n",
|
||||
" <td>1</td>\n",
|
||||
" <td>0</td>\n",
|
||||
" <td>0.000000</td>\n",
|
||||
" <td>0.000000</td>\n",
|
||||
" <td>0.000000</td>\n",
|
||||
" <td>0.0</td>\n",
|
||||
" <td>11</td>\n",
|
||||
" </tr>\n",
|
||||
" </tbody>\n",
|
||||
"</table>\n",
|
||||
"<p>35222 rows × 11 columns</p>\n",
|
||||
"</div>"
|
||||
],
|
||||
"text/plain": [
|
||||
" customer_id nb_tickets nb_purchases total_amount nb_suppliers \\\n",
|
||||
"0 1 12 11 271.60 2 \n",
|
||||
"1 2 2 2 46.00 1 \n",
|
||||
"2 3 9 8 261.25 2 \n",
|
||||
"3 4 50 48 646.00 1 \n",
|
||||
"4 5 5956 5758 8442.20 2 \n",
|
||||
"... ... ... ... ... ... \n",
|
||||
"35217 520144 2 1 20.00 1 \n",
|
||||
"35218 520148 2 1 92.00 1 \n",
|
||||
"35219 520150 3 1 20.00 1 \n",
|
||||
"35220 520151 2 1 126.00 1 \n",
|
||||
"35221 520152 2 1 126.00 1 \n",
|
||||
"\n",
|
||||
" vente_internet_max purchase_date_min purchase_date_max \\\n",
|
||||
"0 0 1778.407639 1197.341759 \n",
|
||||
"1 0 1407.365937 1407.365914 \n",
|
||||
"2 0 1461.382106 428.431076 \n",
|
||||
"3 0 2846.403148 343.436829 \n",
|
||||
"4 0 1732.338241 4.241204 \n",
|
||||
"... ... ... ... \n",
|
||||
"35217 0 0.227512 0.227512 \n",
|
||||
"35218 0 0.111319 0.111319 \n",
|
||||
"35219 0 0.088669 0.088669 \n",
|
||||
"35220 0 0.044988 0.044988 \n",
|
||||
"35221 0 0.000000 0.000000 \n",
|
||||
"\n",
|
||||
" time_between_purchase nb_tickets_internet number_compagny \n",
|
||||
"0 581.065880 0.0 11 \n",
|
||||
"1 0.000023 0.0 11 \n",
|
||||
"2 1032.951030 0.0 11 \n",
|
||||
"3 2502.966319 0.0 11 \n",
|
||||
"4 1728.097037 0.0 11 \n",
|
||||
"... ... ... ... \n",
|
||||
"35217 0.000000 0.0 11 \n",
|
||||
"35218 0.000000 0.0 11 \n",
|
||||
"35219 0.000000 0.0 11 \n",
|
||||
"35220 0.000000 0.0 11 \n",
|
||||
"35221 0.000000 0.0 11 \n",
|
||||
"\n",
|
||||
"[35222 rows x 11 columns]"
|
||||
]
|
||||
},
|
||||
"execution_count": 23,
|
||||
"metadata": {},
|
||||
"output_type": "execute_result"
|
||||
}
|
||||
],
|
||||
"source": [
|
||||
"time_between_purchase_11"
|
||||
]
|
||||
},
|
||||
{
|
||||
"cell_type": "code",
|
||||
"execution_count": 28,
|
||||
"execution_count": 29,
|
||||
"id": "e2c51e28-6197-48f0-ab6d-9fc7b3b0de74",
|
||||
"metadata": {},
|
||||
"outputs": [
|
||||
|
@ -4528,7 +4180,7 @@
|
|||
"Valeur de p : 0.0\n",
|
||||
"Nombre de degrés de liberté entre les groupes : 4\n",
|
||||
"Nombre de degrés de liberté à l'intérieur des groupes : 764875\n",
|
||||
"Il y a des différences significatives entre au moins une paire de catégories.\n"
|
||||
"Il y a des différences significatives entre au moins une des entrepries .\n"
|
||||
]
|
||||
}
|
||||
],
|
||||
|
|
Loading…
Reference in New Issue
Block a user