{ "cells": [ { "cell_type": "markdown", "id": "08977396-ae9a-4c48-9890-e2d3f9bf5c0e", "metadata": {}, "source": [ "# TP : graphique barplot - nombre d'achats par mois" ] }, { "cell_type": "code", "execution_count": 5, "id": "225af1ed-6dcd-4116-99d1-f649dfa8f96f", "metadata": {}, "outputs": [], "source": [ "import pandas as pd\n", "import numpy as np\n", "import os\n", "import s3fs\n", "import re\n", "import matplotlib.pyplot as plt\n", "\n", "import matplotlib.dates as mdates\n", "from datetime import datetime" ] }, { "cell_type": "code", "execution_count": 2, "id": "7fe35156-ea0b-4f9b-b981-1231e26b1baf", "metadata": {}, "outputs": [], "source": [ "# Build the S3 filesystem client.\n", "# The endpoint host is read from the AWS_S3_ENDPOINT environment variable\n", "# (a KeyError is raised here if that variable is not set).\n", "S3_ENDPOINT_URL = f\"https://{os.environ['AWS_S3_ENDPOINT']}\"\n", "fs = s3fs.S3FileSystem(client_kwargs=dict(endpoint_url=S3_ENDPOINT_URL))" ] }, { "cell_type": "code", "execution_count": 3, "id": "e0a09bf5-5a96-40c2-93be-ba0a6a130266", "metadata": {}, "outputs": [], "source": [ "## Sales over time\n", "\n", "# Import: load the temporary purchases data\n", "# Location of the CSV: bucket name + object key, joined with a slash\n", "BUCKET = \"projet-bdc2324-team1\"\n", "FILE_KEY_S3 = \"0_Temp/Company 1 - Purchases.csv\"\n", "FILE_PATH_S3 = f\"{BUCKET}/{FILE_KEY_S3}\"\n", "\n", "# Open the object in binary mode and parse it as a comma-separated file\n", "with fs.open(FILE_PATH_S3, mode=\"rb\") as file_in:\n", "    purchases = pd.read_csv(file_in, sep=\",\")" ] }, { "cell_type": "code", "execution_count": 27, "id": "0c686793-b760-4013-9f79-f2eeee86cafb", "metadata": {}, "outputs": [ { "data": { "text/html": [ "
| \n", " | ticket_id | \n", "customer_id | \n", "purchase_id | \n", "event_type_id | \n", "supplier_name | \n", "purchase_date | \n", "type_of_ticket_name | \n", "amount | \n", "children | \n", "is_full_price | \n", "name_event_types | \n", "name_facilities | \n", "name_categories | \n", "name_events | \n", "name_seasons | \n", "
|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
| 0 | \n", "13070859 | \n", "48187 | \n", "5107462 | \n", "4 | \n", "vente en ligne | \n", "2018-12-28 14:47:50+00:00 | \n", "Atelier | \n", "8.0 | \n", "pricing_formula | \n", "False | \n", "spectacle vivant | \n", "mucem | \n", "indiv prog enfant | \n", "l'école des magiciens | \n", "2018 | \n", "
| 1 | \n", "13070860 | \n", "48187 | \n", "5107462 | \n", "4 | \n", "vente en ligne | \n", "2018-12-28 14:47:50+00:00 | \n", "Atelier | \n", "4.0 | \n", "pricing_formula | \n", "False | \n", "spectacle vivant | \n", "mucem | \n", "indiv prog enfant | \n", "l'école des magiciens | \n", "2018 | \n", "
| 2 | \n", "13070861 | \n", "48187 | \n", "5107462 | \n", "4 | \n", "vente en ligne | \n", "2018-12-28 14:47:50+00:00 | \n", "Atelier | \n", "4.0 | \n", "pricing_formula | \n", "False | \n", "spectacle vivant | \n", "mucem | \n", "indiv prog enfant | \n", "l'école des magiciens | \n", "2018 | \n", "
| 3 | \n", "13070862 | \n", "48187 | \n", "5107462 | \n", "4 | \n", "vente en ligne | \n", "2018-12-28 14:47:50+00:00 | \n", "Atelier | \n", "4.0 | \n", "pricing_formula | \n", "False | \n", "spectacle vivant | \n", "mucem | \n", "indiv prog enfant | \n", "l'école des magiciens | \n", "2018 | \n", "
| 4 | \n", "13070863 | \n", "48187 | \n", "5107462 | \n", "4 | \n", "vente en ligne | \n", "2018-12-28 14:47:50+00:00 | \n", "Atelier | \n", "4.0 | \n", "pricing_formula | \n", "False | \n", "spectacle vivant | \n", "mucem | \n", "indiv prog enfant | \n", "l'école des magiciens | \n", "2018 | \n", "
| ... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "
| 1826667 | \n", "20662815 | \n", "1256135 | \n", "8007697 | \n", "5 | \n", "vente en ligne | \n", "2023-11-08 17:23:54+00:00 | \n", "Atelier | \n", "11.0 | \n", "pricing_formula | \n", "False | \n", "offre muséale groupe | \n", "mucem | \n", "indiv entrées tp | \n", "NaN | \n", "2023 | \n", "
| 1826668 | \n", "20662816 | \n", "1256136 | \n", "8007698 | \n", "5 | \n", "vente en ligne | \n", "2023-11-08 18:32:18+00:00 | \n", "Atelier | \n", "11.0 | \n", "pricing_formula | \n", "False | \n", "offre muséale groupe | \n", "mucem | \n", "indiv entrées tp | \n", "NaN | \n", "2023 | \n", "
| 1826669 | \n", "20662817 | \n", "1256136 | \n", "8007698 | \n", "5 | \n", "vente en ligne | \n", "2023-11-08 18:32:18+00:00 | \n", "Atelier | \n", "11.0 | \n", "pricing_formula | \n", "False | \n", "offre muséale groupe | \n", "mucem | \n", "indiv entrées tp | \n", "NaN | \n", "2023 | \n", "
| 1826670 | \n", "20662818 | \n", "1256137 | \n", "8007699 | \n", "5 | \n", "vente en ligne | \n", "2023-11-08 19:30:28+00:00 | \n", "Atelier | \n", "11.0 | \n", "pricing_formula | \n", "False | \n", "offre muséale groupe | \n", "mucem | \n", "indiv entrées tp | \n", "NaN | \n", "2023 | \n", "
| 1826671 | \n", "20662819 | \n", "1256137 | \n", "8007699 | \n", "5 | \n", "vente en ligne | \n", "2023-11-08 19:30:28+00:00 | \n", "Atelier | \n", "11.0 | \n", "pricing_formula | \n", "False | \n", "offre muséale groupe | \n", "mucem | \n", "indiv entrées tp | \n", "NaN | \n", "2023 | \n", "
1826672 rows × 15 columns
\n", "| \n", " | month | \n", "fake_category | \n", "purchase_id | \n", "
|---|---|---|---|
| 0 | \n", "2013-06-01 | \n", "1 | \n", "1 | \n", "
| 1 | \n", "2013-07-01 | \n", "1 | \n", "1 | \n", "
| 2 | \n", "2013-09-01 | \n", "0 | \n", "2 | \n", "
| 3 | \n", "2013-10-01 | \n", "1 | \n", "1 | \n", "
| 4 | \n", "2013-11-01 | \n", "0 | \n", "2 | \n", "
| ... | \n", "... | \n", "... | \n", "... | \n", "
| 196 | \n", "2023-09-01 | \n", "1 | \n", "6900 | \n", "
| 197 | \n", "2023-10-01 | \n", "0 | \n", "3621 | \n", "
| 198 | \n", "2023-10-01 | \n", "1 | \n", "8313 | \n", "
| 199 | \n", "2023-11-01 | \n", "0 | \n", "945 | \n", "
| 200 | \n", "2023-11-01 | \n", "1 | \n", "2268 | \n", "
201 rows × 3 columns
\n", "| \n", " | month | \n", "fake_category | \n", "purchase_id | \n", "
|---|---|---|---|
| 96 | \n", "2019-03-01 | \n", "1 | \n", "102 | \n", "
| 100 | \n", "2019-05-01 | \n", "1 | \n", "140 | \n", "
| 102 | \n", "2019-06-01 | \n", "1 | \n", "131 | \n", "
| 142 | \n", "2021-06-01 | \n", "1 | \n", "157 | \n", "
| 144 | \n", "2021-07-01 | \n", "1 | \n", "145 | \n", "
| 148 | \n", "2021-09-01 | \n", "1 | \n", "123 | \n", "
| 150 | \n", "2021-10-01 | \n", "1 | \n", "220 | \n", "
| 160 | \n", "2022-03-01 | \n", "1 | \n", "112 | \n", "
| 162 | \n", "2022-04-01 | \n", "1 | \n", "107 | \n", "
| 164 | \n", "2022-05-01 | \n", "1 | \n", "164 | \n", "
| 166 | \n", "2022-06-01 | \n", "1 | \n", "158 | \n", "
| 172 | \n", "2022-09-01 | \n", "1 | \n", "178 | \n", "
| 174 | \n", "2022-10-01 | \n", "1 | \n", "218 | \n", "
| 176 | \n", "2022-11-01 | \n", "1 | \n", "137 | \n", "
| 178 | \n", "2022-12-01 | \n", "1 | \n", "107 | \n", "
| 179 | \n", "2023-01-01 | \n", "0 | \n", "2052 | \n", "
| 180 | \n", "2023-01-01 | \n", "1 | \n", "5079 | \n", "
| 181 | \n", "2023-02-01 | \n", "0 | \n", "2684 | \n", "
| 182 | \n", "2023-02-01 | \n", "1 | \n", "6350 | \n", "
| 183 | \n", "2023-03-01 | \n", "0 | \n", "2196 | \n", "
| 184 | \n", "2023-03-01 | \n", "1 | \n", "5304 | \n", "
| 185 | \n", "2023-04-01 | \n", "0 | \n", "3595 | \n", "
| 186 | \n", "2023-04-01 | \n", "1 | \n", "8563 | \n", "
| 187 | \n", "2023-05-01 | \n", "0 | \n", "3727 | \n", "
| 188 | \n", "2023-05-01 | \n", "1 | \n", "8653 | \n", "
| 189 | \n", "2023-06-01 | \n", "0 | \n", "2904 | \n", "
| 190 | \n", "2023-06-01 | \n", "1 | \n", "6641 | \n", "
| 191 | \n", "2023-07-01 | \n", "0 | \n", "4247 | \n", "
| 192 | \n", "2023-07-01 | \n", "1 | \n", "10022 | \n", "
| 193 | \n", "2023-08-01 | \n", "0 | \n", "6146 | \n", "
| 194 | \n", "2023-08-01 | \n", "1 | \n", "14593 | \n", "
| 195 | \n", "2023-09-01 | \n", "0 | \n", "2954 | \n", "
| 196 | \n", "2023-09-01 | \n", "1 | \n", "6900 | \n", "
| 197 | \n", "2023-10-01 | \n", "0 | \n", "3621 | \n", "
| 198 | \n", "2023-10-01 | \n", "1 | \n", "8313 | \n", "
| 199 | \n", "2023-11-01 | \n", "0 | \n", "945 | \n", "
| 200 | \n", "2023-11-01 | \n", "1 | \n", "2268 | \n", "