"""Target KPI helpers from the code cells added to Exploration_billet_AJ.ipynb."""

import pandas as pd

# Default list of company directories handed to load_files().
nb_compagnie = ['1', '2']

# Company directories grouped by activity type.
companies = {'musee': ['1', '2', '3', '4'],  # , '101'
             'sport': ['5', '6', '7', '8', '9'],
             'musique': ['10', '11', '12', '13', '14']}

# Target flag columns summarised by target_proportions(), in output order.
TARGET_FLAGS = (
    'target_jeune',
    'target_optin',
    'target_optout',
    'target_scolaire',
    'target_entreprise',
    'target_famille',
    'target_newsletter',
)

# Subset of the proportion columns drawn by target_description().
PLOTTED_PROPORTIONS = [
    'prop_target_jeune',
    'prop_target_scolaire',
    'prop_target_entreprise',
    'prop_target_famille',
]


def load_files(nb_compagnie):
    """Build one target-KPI table covering every company in *nb_compagnie*.

    For each company directory the function reads the "customerplus_cleaned"
    and "target_information" inputs through ``display_input_databases``,
    computes the KPIs with ``targets_KPI`` and left-joins them onto the
    customer list, so customers without any KPI row are kept with zeros.

    Args:
        nb_compagnie: iterable of company identifiers as strings; each one
            must be convertible with ``int()``.

    Returns:
        A DataFrame with one row per customer and per company, a
        ``number_company`` column, and ``customer_id`` values prefixed with
        ``"<company>_"``. An empty DataFrame when *nb_compagnie* is empty.
    """
    frames = []

    # One aggregated KPI frame is produced per company directory.
    for directory_path in nb_compagnie:
        df_customerplus_clean_0 = display_input_databases(
            directory_path, file_name="customerplus_cleaned")
        df_target_information = display_input_databases(
            directory_path, file_name="target_information")

        df_target_KPI = targets_KPI(df_target=df_target_information)
        df_target_KPI = pd.merge(
            df_customerplus_clean_0[['customer_id']], df_target_KPI,
            how='left', on='customer_id')

        # Customers absent from the KPI table get 0 instead of NaN.
        targets_columns = [
            column for column in df_target_KPI.columns
            if column != 'customer_id'
        ]
        df_target_KPI[targets_columns] = (
            df_target_KPI[targets_columns].fillna(0))

        # Company number, used later as the grouping key.
        df_target_KPI["number_company"] = int(directory_path)

        # Prefix the id with the company so it stays unique after stacking.
        df_target_KPI["customer_id"] = (
            directory_path + '_' + df_target_KPI['customer_id'].astype('str'))

        frames.append(df_target_KPI)

    # pd.concat raises on an empty list; keep returning an empty frame then.
    if not frames:
        return pd.DataFrame()

    # A single concatenation avoids re-copying the accumulated rows each turn.
    return pd.concat(frames, ignore_index=True)


def _percentage(flags):
    """Return the sum of *flags* over its non-null count, times 100."""
    return (flags.sum() / flags.count()) * 100


def target_proportions(targets):
    """Return, per ``number_company``, the percentage of each target flag.

    Args:
        targets: DataFrame holding ``number_company`` and every column
            listed in ``TARGET_FLAGS``.

    Returns:
        A DataFrame indexed by ``number_company`` with one
        ``prop_<flag>`` column per entry of ``TARGET_FLAGS``.
    """
    named_aggregations = {
        f'prop_{flag}': (flag, _percentage) for flag in TARGET_FLAGS
    }
    return targets.groupby('number_company').agg(**named_aggregations)


def target_description(targets):
    """Draw a bar chart of the main target proportions per company.

    Args:
        targets: DataFrame accepted by ``target_proportions``.

    Returns:
        The object returned by ``DataFrame.plot.bar()`` for the columns in
        ``PLOTTED_PROPORTIONS``.
    """
    describe_target = target_proportions(targets)
    plot = describe_target[PLOTTED_PROPORTIONS].plot.bar()

    return plot


if __name__ == "__main__":
    # NOTE(review): the notebook cell calls target_description(targets) with a
    # `targets` frame assigned in a cell that is not visible here; building it
    # from load_files(nb_compagnie) is an assumption - confirm.
    targets = load_files(nb_compagnie)
    target_description(targets)