Project_Carmignac/clustering/data_loader.py

23 lines
718 B
Python
Raw Normal View History

2026-02-02 11:37:16 +01:00
import pandas as pd
def load_and_clean_data(flows_path, aum_path, rates_path, gov_path):
    """
    Load the four raw CSVs and parse their date columns to datetimes.

    Args:
        flows_path: Location of the flows CSV; must contain a
            'Centralisation Date' column.
        aum_path: Location of the AUM CSV; must contain a
            'Centralisation Date' column.
        rates_path: Location of the rates CSV; must contain a 'Date' column.
        gov_path: Location of the gov CSV; must contain a 'Date' column.

    Returns:
        A tuple ``(flows, aum, rates, gov)`` of DataFrames whose date column
        has been converted with ``pd.to_datetime``.

    Raises:
        KeyError: If an expected date column is missing from a file.
        ValueError: If a date column cannot be parsed (for rates, only
            after both the day-first and the default attempts fail).
    """
    flows = pd.read_csv(flows_path)
    flows['Centralisation Date'] = pd.to_datetime(flows['Centralisation Date'])

    aum = pd.read_csv(aum_path)
    aum['Centralisation Date'] = pd.to_datetime(aum['Centralisation Date'])

    rates = pd.read_csv(rates_path)
    try:
        # Try a day-first interpretation (e.g. 03/02/2024 -> 3 Feb) first.
        rates['Date'] = pd.to_datetime(rates['Date'], dayfirst=True)
    except (ValueError, TypeError):
        # Only parsing failures trigger the fallback to pandas' default
        # inference; anything else (missing column, interrupts) propagates.
        rates['Date'] = pd.to_datetime(rates['Date'])

    gov = pd.read_csv(gov_path)
    gov['Date'] = pd.to_datetime(gov['Date'])

    return flows, aum, rates, gov