{ "cells": [ { "cell_type": "markdown", "id": "08977396-ae9a-4c48-9890-e2d3f9bf5c0e", "metadata": {}, "source": [ "# TP : graphique barplot - nombre d'achats par mois" ] }, { "cell_type": "code", "execution_count": 5, "id": "225af1ed-6dcd-4116-99d1-f649dfa8f96f", "metadata": {}, "outputs": [], "source": [ "import pandas as pd\n", "import numpy as np\n", "import os\n", "import s3fs\n", "import re\n", "import matplotlib.pyplot as plt\n", "\n", "import matplotlib.dates as mdates\n", "from datetime import datetime" ] }, { "cell_type": "code", "execution_count": 2, "id": "7fe35156-ea0b-4f9b-b981-1231e26b1baf", "metadata": {}, "outputs": [], "source": [ "# S3 filesystem client; the endpoint host is read from the AWS_S3_ENDPOINT environment variable\n", "S3_ENDPOINT_URL = \"https://\" + os.environ[\"AWS_S3_ENDPOINT\"]\n", "fs = s3fs.S3FileSystem(client_kwargs=dict(endpoint_url=S3_ENDPOINT_URL))" ] }, { "cell_type": "code", "execution_count": 3, "id": "e0a09bf5-5a96-40c2-93be-ba0a6a130266", "metadata": {}, "outputs": [], "source": [ "## Sales evolution\n", "\n", "# Import: load the temporary purchases data (CSV object stored in the S3 bucket)\n", "BUCKET = \"projet-bdc2324-team1\"\n", "FILE_KEY_S3 = \"0_Temp/Company 1 - Purchases.csv\"\n", "# Full object path is <bucket>/<key>\n", "FILE_PATH_S3 = \"/\".join((BUCKET, FILE_KEY_S3))\n", "\n", "# Read the object as a binary stream and parse it as comma-separated values\n", "with fs.open(FILE_PATH_S3, mode=\"rb\") as file_in:\n", "    purchases = pd.read_csv(file_in, sep=\",\")" ] }, { "cell_type": "code", "execution_count": 27, "id": "0c686793-b760-4013-9f79-f2eeee86cafb", "metadata": {}, "outputs": [ { "data": { "text/html": [ "
\n", " | ticket_id | \n", "customer_id | \n", "purchase_id | \n", "event_type_id | \n", "supplier_name | \n", "purchase_date | \n", "type_of_ticket_name | \n", "amount | \n", "children | \n", "is_full_price | \n", "name_event_types | \n", "name_facilities | \n", "name_categories | \n", "name_events | \n", "name_seasons | \n", "
---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
0 | \n", "13070859 | \n", "48187 | \n", "5107462 | \n", "4 | \n", "vente en ligne | \n", "2018-12-28 14:47:50+00:00 | \n", "Atelier | \n", "8.0 | \n", "pricing_formula | \n", "False | \n", "spectacle vivant | \n", "mucem | \n", "indiv prog enfant | \n", "l'école des magiciens | \n", "2018 | \n", "
1 | \n", "13070860 | \n", "48187 | \n", "5107462 | \n", "4 | \n", "vente en ligne | \n", "2018-12-28 14:47:50+00:00 | \n", "Atelier | \n", "4.0 | \n", "pricing_formula | \n", "False | \n", "spectacle vivant | \n", "mucem | \n", "indiv prog enfant | \n", "l'école des magiciens | \n", "2018 | \n", "
2 | \n", "13070861 | \n", "48187 | \n", "5107462 | \n", "4 | \n", "vente en ligne | \n", "2018-12-28 14:47:50+00:00 | \n", "Atelier | \n", "4.0 | \n", "pricing_formula | \n", "False | \n", "spectacle vivant | \n", "mucem | \n", "indiv prog enfant | \n", "l'école des magiciens | \n", "2018 | \n", "
3 | \n", "13070862 | \n", "48187 | \n", "5107462 | \n", "4 | \n", "vente en ligne | \n", "2018-12-28 14:47:50+00:00 | \n", "Atelier | \n", "4.0 | \n", "pricing_formula | \n", "False | \n", "spectacle vivant | \n", "mucem | \n", "indiv prog enfant | \n", "l'école des magiciens | \n", "2018 | \n", "
4 | \n", "13070863 | \n", "48187 | \n", "5107462 | \n", "4 | \n", "vente en ligne | \n", "2018-12-28 14:47:50+00:00 | \n", "Atelier | \n", "4.0 | \n", "pricing_formula | \n", "False | \n", "spectacle vivant | \n", "mucem | \n", "indiv prog enfant | \n", "l'école des magiciens | \n", "2018 | \n", "
... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "
1826667 | \n", "20662815 | \n", "1256135 | \n", "8007697 | \n", "5 | \n", "vente en ligne | \n", "2023-11-08 17:23:54+00:00 | \n", "Atelier | \n", "11.0 | \n", "pricing_formula | \n", "False | \n", "offre muséale groupe | \n", "mucem | \n", "indiv entrées tp | \n", "NaN | \n", "2023 | \n", "
1826668 | \n", "20662816 | \n", "1256136 | \n", "8007698 | \n", "5 | \n", "vente en ligne | \n", "2023-11-08 18:32:18+00:00 | \n", "Atelier | \n", "11.0 | \n", "pricing_formula | \n", "False | \n", "offre muséale groupe | \n", "mucem | \n", "indiv entrées tp | \n", "NaN | \n", "2023 | \n", "
1826669 | \n", "20662817 | \n", "1256136 | \n", "8007698 | \n", "5 | \n", "vente en ligne | \n", "2023-11-08 18:32:18+00:00 | \n", "Atelier | \n", "11.0 | \n", "pricing_formula | \n", "False | \n", "offre muséale groupe | \n", "mucem | \n", "indiv entrées tp | \n", "NaN | \n", "2023 | \n", "
1826670 | \n", "20662818 | \n", "1256137 | \n", "8007699 | \n", "5 | \n", "vente en ligne | \n", "2023-11-08 19:30:28+00:00 | \n", "Atelier | \n", "11.0 | \n", "pricing_formula | \n", "False | \n", "offre muséale groupe | \n", "mucem | \n", "indiv entrées tp | \n", "NaN | \n", "2023 | \n", "
1826671 | \n", "20662819 | \n", "1256137 | \n", "8007699 | \n", "5 | \n", "vente en ligne | \n", "2023-11-08 19:30:28+00:00 | \n", "Atelier | \n", "11.0 | \n", "pricing_formula | \n", "False | \n", "offre muséale groupe | \n", "mucem | \n", "indiv entrées tp | \n", "NaN | \n", "2023 | \n", "
1826672 rows × 15 columns
\n", "\n", " | month | \n", "fake_category | \n", "purchase_id | \n", "
---|---|---|---|
0 | \n", "2013-06-01 | \n", "1 | \n", "1 | \n", "
1 | \n", "2013-07-01 | \n", "1 | \n", "1 | \n", "
2 | \n", "2013-09-01 | \n", "0 | \n", "2 | \n", "
3 | \n", "2013-10-01 | \n", "1 | \n", "1 | \n", "
4 | \n", "2013-11-01 | \n", "0 | \n", "2 | \n", "
... | \n", "... | \n", "... | \n", "... | \n", "
196 | \n", "2023-09-01 | \n", "1 | \n", "6900 | \n", "
197 | \n", "2023-10-01 | \n", "0 | \n", "3621 | \n", "
198 | \n", "2023-10-01 | \n", "1 | \n", "8313 | \n", "
199 | \n", "2023-11-01 | \n", "0 | \n", "945 | \n", "
200 | \n", "2023-11-01 | \n", "1 | \n", "2268 | \n", "
201 rows × 3 columns
\n", "\n", " | month | \n", "fake_category | \n", "purchase_id | \n", "
---|---|---|---|
96 | \n", "2019-03-01 | \n", "1 | \n", "102 | \n", "
100 | \n", "2019-05-01 | \n", "1 | \n", "140 | \n", "
102 | \n", "2019-06-01 | \n", "1 | \n", "131 | \n", "
142 | \n", "2021-06-01 | \n", "1 | \n", "157 | \n", "
144 | \n", "2021-07-01 | \n", "1 | \n", "145 | \n", "
148 | \n", "2021-09-01 | \n", "1 | \n", "123 | \n", "
150 | \n", "2021-10-01 | \n", "1 | \n", "220 | \n", "
160 | \n", "2022-03-01 | \n", "1 | \n", "112 | \n", "
162 | \n", "2022-04-01 | \n", "1 | \n", "107 | \n", "
164 | \n", "2022-05-01 | \n", "1 | \n", "164 | \n", "
166 | \n", "2022-06-01 | \n", "1 | \n", "158 | \n", "
172 | \n", "2022-09-01 | \n", "1 | \n", "178 | \n", "
174 | \n", "2022-10-01 | \n", "1 | \n", "218 | \n", "
176 | \n", "2022-11-01 | \n", "1 | \n", "137 | \n", "
178 | \n", "2022-12-01 | \n", "1 | \n", "107 | \n", "
179 | \n", "2023-01-01 | \n", "0 | \n", "2052 | \n", "
180 | \n", "2023-01-01 | \n", "1 | \n", "5079 | \n", "
181 | \n", "2023-02-01 | \n", "0 | \n", "2684 | \n", "
182 | \n", "2023-02-01 | \n", "1 | \n", "6350 | \n", "
183 | \n", "2023-03-01 | \n", "0 | \n", "2196 | \n", "
184 | \n", "2023-03-01 | \n", "1 | \n", "5304 | \n", "
185 | \n", "2023-04-01 | \n", "0 | \n", "3595 | \n", "
186 | \n", "2023-04-01 | \n", "1 | \n", "8563 | \n", "
187 | \n", "2023-05-01 | \n", "0 | \n", "3727 | \n", "
188 | \n", "2023-05-01 | \n", "1 | \n", "8653 | \n", "
189 | \n", "2023-06-01 | \n", "0 | \n", "2904 | \n", "
190 | \n", "2023-06-01 | \n", "1 | \n", "6641 | \n", "
191 | \n", "2023-07-01 | \n", "0 | \n", "4247 | \n", "
192 | \n", "2023-07-01 | \n", "1 | \n", "10022 | \n", "
193 | \n", "2023-08-01 | \n", "0 | \n", "6146 | \n", "
194 | \n", "2023-08-01 | \n", "1 | \n", "14593 | \n", "
195 | \n", "2023-09-01 | \n", "0 | \n", "2954 | \n", "
196 | \n", "2023-09-01 | \n", "1 | \n", "6900 | \n", "
197 | \n", "2023-10-01 | \n", "0 | \n", "3621 | \n", "
198 | \n", "2023-10-01 | \n", "1 | \n", "8313 | \n", "
199 | \n", "2023-11-01 | \n", "0 | \n", "945 | \n", "
200 | \n", "2023-11-01 | \n", "1 | \n", "2268 | \n", "