from pathlib import Path
import json

import matplotlib.pyplot as plt
import pandas as pd
from IPython.display import Image, display

# Locate the project root: the nearest directory, starting at the current
# working directory and moving up through its parents, that contains both an
# 'artifacts' entry and a 'README.md'.
PROJECT_ROOT = None
start_dir = Path.cwd().resolve()
for candidate in (start_dir, *start_dir.parents):
    if not (candidate / 'artifacts').exists():
        continue
    if not (candidate / 'README.md').exists():
        continue
    PROJECT_ROOT = candidate
    break
else:
    # The loop ran out of parents without hitting `break`: no match anywhere.
    raise RuntimeError('Could not locate the project root from the current working directory.')

# Both artifact folders share the <project root>/artifacts/modern prefix.
modern_artifacts = PROJECT_ROOT / 'artifacts' / 'modern'
benchmark_root = modern_artifacts / 'benchmark'
final_root = modern_artifacts / 'final_model'

# Benchmark tables written as CSV files in the benchmark folder.
leaderboard = pd.read_csv(benchmark_root / 'leaderboard.csv')
runs = pd.read_csv(benchmark_root / 'benchmark_runs.csv')

# JSON summary; its 'winner' entry carries the name of the selected model.
with open(benchmark_root / 'metrics_summary.json', encoding='utf-8') as summary_file:
    summary = json.load(summary_file)
winner_name = summary['winner']['model']

# Bare expression: renders the leaderboard when this is the last statement of
# a notebook cell.
leaderboard

# Wrap the winner entry in a list so pandas lays it out as a one-row table.
winner_record = summary['winner']
pd.DataFrame([winner_record])

# Two side-by-side bar charts built from the leaderboard: mean image AUROC on
# the left, mean latency on the right, one bar per leaderboard row.
fig, axes = plt.subplots(nrows=1, ncols=2, figsize=(12, 4))
auroc_ax, latency_ax = axes
model_names = leaderboard['model']

# Left panel: the y-axis is pinned to 0-1.05 so bars near 1.0 keep some headroom.
auroc_ax.bar(
    model_names,
    leaderboard['mean_image_AUROC'],
    color=['#d97706', '#2563eb'],
)
auroc_ax.set_title('Mean image AUROC')
auroc_ax.set_ylabel('score')
auroc_ax.set_ylim(0, 1.05)

# Right panel: latency keeps matplotlib's automatic y-range.
latency_ax.bar(
    model_names,
    leaderboard['mean_latency_ms'],
    color=['#b45309', '#1d4ed8'],
)
latency_ax.set_title('Latency per image (ms)')
latency_ax.set_ylabel('ms')

fig.tight_layout()
# Bare expression: renders the figure when this is the last statement of a
# notebook cell.
fig

# Bare expression: shows the `runs` table (read from benchmark_runs.csv) when
# it is the last statement of a notebook cell.
runs

# Folder with the example images of the final model, split into 'good' and
# 'bad' sub-folders.
# NOTE(review): the model folder is hard-coded to 'Patchcore' (and run 'v0')
# rather than derived from `winner_name` -- confirm this is intended.
gallery_root = final_root / 'Patchcore' / 'mandarine_cropped_modern' / 'v0' / 'images'


def _first_examples(folder, limit=3):
    """Return up to *limit* regular files found directly in *folder*, sorted by path.

    Sub-directories are skipped so they are never handed to ``Image``.
    A missing folder yields an empty list.
    """
    return sorted(entry for entry in folder.glob('*') if entry.is_file())[:limit]


def _show_examples(heading, paths, source_dir):
    """Print *heading*, then each file name followed by its inline image.

    When *paths* is empty, print a note naming *source_dir* instead of leaving
    a bare heading, so a wrong or missing gallery path is visible to the reader.
    """
    print(heading)
    if not paths:
        print(f'(no example files found in {source_dir})')
        return
    for path in paths:
        print(path.name)
        display(Image(filename=str(path), width=420))


good_examples = _first_examples(gallery_root / 'good')
bad_examples = _first_examples(gallery_root / 'bad')

_show_examples('Good examples:', good_examples, gallery_root / 'good')
_show_examples('Bad examples:', bad_examples, gallery_root / 'bad')

Good examples:
cropped_normal_0002.jpg

cropped_normal_0008.jpg

cropped_normal_0009.jpg

Bad examples:
cropped_abnormal_0001.jpg

cropped_abnormal_0003.jpg

cropped_abnormal_0004.jpg

	model	mean_image_AUROC	std_image_AUROC	mean_image_AUPR	std_image_AUPR	mean_image_F1	std_image_F1	mean_latency_ms	std_latency_ms	completed_runs
0	patchcore	0.933333	0.049889	0.939841	0.050396	0.840741	0.036665	173.664240	2.374339	3
1	anomalydino	0.786667	0.018856	0.811111	0.015713	0.551587	0.170681	106.279883	1.855926	3

	seed	model	status	error_message	image_AUROC	image_F1Score	image_AUPR	latency_ms
0	13	patchcore	ok	NaN	1.00	0.888889	1.000000	176.98990
1	13	anomalydino	ok	NaN	0.80	0.571429	0.800000	107.14405
2	23	patchcore	ok	NaN	0.88	0.800000	0.876667	171.59989
3	23	anomalydino	ok	NaN	0.80	0.333333	0.800000	107.99410
4	42	patchcore	ok	NaN	0.92	0.833333	0.942857	172.40293
5	42	anomalydino	ok	NaN	0.76	0.750000	0.833333	103.70150

Modern Benchmark Report

Contexto

Ganador del benchmark

Gráficas rápidas

Resultados por seed

Ejemplos visuales del conjunto final