33 lines
996 B
Python
33 lines
996 B
Python
# scripts/make_minutely_dataset.py
|
|
from __future__ import annotations
|
|
|
|
from pathlib import Path
|
|
|
|
from meteo.dataset import load_raw_csv, resample_to_minutes
|
|
|
|
|
|
# Input CSV that main() loads; when it is missing, main() tells the user to
# run `python -m scripts.format_raw_csv` first (presumably the step that
# creates this file — confirm against that script).
FORMATTED_CSV_PATH = Path("data/weather_filled_1s.csv")
|
|
# Destination CSV that main() writes the resampled (per-minute) frame to.
OUTPUT_CSV_PATH = Path("data/weather_minutely.csv")
|
|
|
|
|
|
def main() -> None:
    """Build the minutely dataset CSV from the formatted input CSV.

    The file at ``FORMATTED_CSV_PATH`` is loaded with ``load_raw_csv``, the
    resulting frame is passed through ``resample_to_minutes``, and the output
    is written to ``OUTPUT_CSV_PATH`` with the index column labelled
    ``"time"``. The output's parent directory is created when absent.
    Progress messages are printed to stdout.

    If the input file does not exist, a warning and a hint about the
    formatting script are printed and the function returns without
    writing anything.
    """
    input_missing = not FORMATTED_CSV_PATH.exists()
    if input_missing:
        # Nothing to resample: point the user at the prerequisite step.
        print(f"⚠ Fichier formaté introuvable : {FORMATTED_CSV_PATH}")
        print(" Lancez d'abord : python -m scripts.format_raw_csv")
        return

    # Load the input and report its size and columns.
    per_second_frame = load_raw_csv(FORMATTED_CSV_PATH)
    print(f"Fichier 1s chargé : {FORMATTED_CSV_PATH}")
    print(
        f" Lignes : {len(per_second_frame)}, "
        f"colonnes : {list(per_second_frame.columns)}"
    )

    # Resample and report the resulting row count.
    per_minute_frame = resample_to_minutes(per_second_frame)
    print(f"Après resampling 60s : {len(per_minute_frame)} lignes")

    # Make sure the destination directory exists before writing.
    output_dir = OUTPUT_CSV_PATH.parent
    output_dir.mkdir(parents=True, exist_ok=True)
    per_minute_frame.to_csv(OUTPUT_CSV_PATH, index_label="time")
    print(f"✔ Dataset minuté écrit dans : {OUTPUT_CSV_PATH.resolve()}")
|
|
|
|
|
|
if __name__ == "__main__":
    # Only run the conversion when this file is executed as a script,
    # not when it is imported.
    main()
|