You've already forked etude_lego_jurassic_world
Ajoute la heatmap annuelle des personnages
This commit is contained in:
@@ -14,6 +14,11 @@ def load_counts(path: Path) -> List[dict]:
|
||||
return read_rows(path)
|
||||
|
||||
|
||||
def load_presence(path: Path) -> List[dict]:
    """Load the per-year, per-character presence CSV.

    Delegates the actual reading to ``read_rows`` and returns its result
    unchanged.
    """
    presence_rows = read_rows(path)
    return presence_rows
|
||||
|
||||
|
||||
def plot_minifigs_per_character(counts_path: Path, destination_path: Path) -> None:
|
||||
"""Trace un diagramme en barres horizontales du nombre de minifigs par personnage."""
|
||||
rows = load_counts(counts_path)
|
||||
@@ -40,3 +45,49 @@ def plot_minifigs_per_character(counts_path: Path, destination_path: Path) -> No
|
||||
fig.tight_layout()
|
||||
fig.savefig(destination_path, dpi=160)
|
||||
plt.close(fig)
|
||||
|
||||
|
||||
def plot_character_year_presence(presence_path: Path, destination_path: Path) -> None:
    """Draw a binary heatmap showing in which years each character is present.

    Rows are read with ``load_presence``; each row is accessed through the
    keys ``known_character``, ``year`` and ``present`` (``"1"`` marks a
    presence). Characters are ordered by decreasing number of rows marked
    present, then alphabetically. Years are laid out in ascending order.
    Nothing is drawn or written when there are no rows.

    Args:
        presence_path: CSV file holding the presence rows.
        destination_path: Image file the figure is saved to.
    """
    rows = load_presence(presence_path)
    if not rows:
        return

    # Index the rows in a single pass instead of rescanning the whole list
    # for every (character, year) cell and for every sort key.
    presence_by_cell = {}
    present_counts = {}
    for row in rows:
        character = row["known_character"]
        # setdefault keeps the first row seen for a given cell.
        presence_by_cell.setdefault((character, int(row["year"])), row["present"])
        present_counts[character] = present_counts.get(character, 0) + (row["present"] == "1")

    years = sorted({year for _, year in presence_by_cell})
    characters = sorted(present_counts, key=lambda name: (-present_counts[name], name))
    # Cells with no matching row count as absent ("0").
    matrix = [
        [int(presence_by_cell.get((character, year), "0")) for year in years]
        for character in characters
    ]

    # Grow the figure with the number of characters, with a minimum height.
    height = max(5, len(characters) * 0.35)
    fig, ax = plt.subplots(figsize=(12, height))
    try:
        cax = ax.imshow(matrix, aspect="auto", cmap="Greens", interpolation="nearest")
        ax.set_xticks(range(len(years)))
        ax.set_xticklabels(years, rotation=45, ha="right")
        ax.set_yticks(range(len(characters)))
        ax.set_yticklabels(characters)
        ax.set_xlabel("Année")
        ax.set_ylabel("Personnage")
        ax.set_title("Présence des personnages par année (hors figurants)")
        # Overlay a dot on every cell where the character is present.
        for i, row_values in enumerate(matrix):
            for j, value in enumerate(row_values):
                if value == 1:
                    ax.text(j, i, "●", ha="center", va="center", color="#0d0d0d", fontsize=7)
        fig.colorbar(cax, ax=ax, fraction=0.046, pad=0.04, label="Présence (1 si minifig)")
        ensure_parent_dir(destination_path)
        fig.tight_layout()
        fig.savefig(destination_path, dpi=160)
    finally:
        # Always release the figure, even when drawing or saving fails.
        plt.close(fig)
|
||||
|
||||
@@ -39,3 +39,59 @@ def write_character_counts(path: Path, rows: Sequence[dict]) -> None:
|
||||
writer.writeheader()
|
||||
for row in rows:
|
||||
writer.writerow(row)
|
||||
|
||||
|
||||
def load_sets_enriched(path: Path) -> Dict[str, str]:
    """Build a lookup from ``set_num`` to ``year`` out of the sets CSV.

    Args:
        path: CSV file whose header row contains at least the columns
            ``set_num`` and ``year``.

    Returns:
        Mapping of set number to year, both kept as the raw strings read
        from the file. When a set number appears on several rows, the last
        row wins.

    Raises:
        KeyError: If a row lacks the ``set_num`` or ``year`` column.
    """
    # newline="" leaves line-ending handling to the csv module, as its
    # documentation requires; otherwise newlines embedded in quoted fields
    # are silently rewritten.
    with path.open(newline="") as sets_file:
        return {row["set_num"]: row["year"] for row in csv.DictReader(sets_file)}
|
||||
|
||||
|
||||
def aggregate_presence_by_year(
|
||||
minifigs_rows: Iterable[dict],
|
||||
sets_years: Dict[str, str],
|
||||
excluded_characters: Sequence[str] | None = None,
|
||||
) -> List[dict]:
|
||||
"""Construit la présence binaire des personnages par année (hors figurants)."""
|
||||
excluded = set(excluded_characters or [])
|
||||
presence: set[tuple[str, int]] = set()
|
||||
years_all = {int(year) for year in sets_years.values()}
|
||||
for row in minifigs_rows:
|
||||
character = row["known_character"].strip()
|
||||
fig_num = row["fig_num"].strip()
|
||||
if character == "" or fig_num == "":
|
||||
continue
|
||||
if character in excluded:
|
||||
continue
|
||||
year = sets_years.get(row["set_num"])
|
||||
if year is None:
|
||||
continue
|
||||
presence.add((character, int(year)))
|
||||
years = sorted(years_all)
|
||||
characters = sorted({character for character, _ in presence})
|
||||
results: List[dict] = []
|
||||
for character in characters:
|
||||
for year in years:
|
||||
results.append(
|
||||
{
|
||||
"known_character": character,
|
||||
"year": str(year),
|
||||
"present": "1" if (character, year) in presence else "0",
|
||||
}
|
||||
)
|
||||
return results
|
||||
|
||||
|
||||
def write_presence_by_year(path: Path, rows: Sequence[dict]) -> None:
    """Write the binary year/character presence matrix to a CSV file.

    The file gets a header row followed by one line per entry of ``rows``,
    with the columns ``known_character``, ``year`` and ``present``.
    ``ensure_parent_dir`` is called on ``path`` before the file is opened.
    """
    columns = ["known_character", "year", "present"]
    ensure_parent_dir(path)
    with path.open("w", newline="") as output:
        presence_writer = csv.DictWriter(output, fieldnames=columns)
        presence_writer.writeheader()
        presence_writer.writerows(rows)
|
||||
|
||||
Reference in New Issue
Block a user