vikingowl cf5408ab66 feat(discovery): eval harness for the AI similarity classifier
Ship 2 MR 5. Adds a CLI that measures MistralSimilarityClassifier
against a labelled fixture: precision, recall, F1, accuracy, plus a
confidence calibration table so we can tell whether "90% confident"
verdicts are actually right 90% of the time.

Usage: go run ./backend/cmd/discovery-eval -fixture ... -cache ...
-threshold 0.8 -report eval-report.json.

Structure
- main.go: arg parsing + wiring (ai.Client, classifier, cache,
  metrics). The work happens in realMain(), which returns an exit code
  so main can os.Exit without skipping defers on error paths.
- fixture.go: parses labelled pairs JSON. Fixture authors only need to
  fill in name/stadt/year; name_normalized falls back to name when
  omitted.
- cache.go: file-backed map keyed by SimilarityPairKey + model string.
  Symmetric (a,b) == (b,a). Atomic writes (temp file + rename) so a
  crashed run cannot corrupt the cache. Corrupt-file load returns an
  empty usable cache and reports the parse error.
- run.go: executes each pair through the classifier, populating the
  cache. Individual classify errors are downgraded to "not correct"
  and logged — the run always finishes so the operator sees whatever
  data is available.
- metrics.go: confusion matrix, P/R/F1/accuracy, per-confidence-
  bucket calibration ([0-0.5), [0.5-0.75), [0.75-0.9), [0.9-1.0]).
  Prints human summary + surfaces highest-confidence mismatches
  first (most actionable for prompt iteration). Optional JSON report.
- Threshold gate: -threshold N exits non-zero when F1<N. Default 0
  (gating disabled until we have a baseline F1).

Fixture: seeds 15 hand-crafted DACH-market pairs covering the edge
cases we actually care about — umlaut drift (Straßburg/Strassburg),
year difference on a recurring series, word-reordering, distinct
events at the same venue, historical proper names (Striezelmarkt),
same city with multiple distinct Christmas markets. Operator extends
over time; each pair carries a `note` explaining the case it locks.
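One such pair, expressed in Go for illustration. The struct shapes below are a self-contained sketch: field names are taken from run.go (A, B, Same, Name, Stadt, Year, NameNormalized) and the prose above (note), but the real definitions and JSON tags live in fixture.go, and the year is an illustrative value.

```go
package main

import "fmt"

// Sketch of the fixture shapes; real definitions live in fixture.go.
type PairRow struct {
	Name           string
	Stadt          string
	Year           int
	NameNormalized string
}

type LabelledPair struct {
	A, B PairRow
	Same bool
	Note string
}

// The umlaut-drift case: one market, two spellings (ß vs ss).
var umlautDrift = LabelledPair{
	A:    PairRow{Name: "Straßburger Weihnachtsmarkt", Stadt: "Straßburg", Year: 2025},
	B:    PairRow{Name: "Strassburger Weihnachtsmarkt", Stadt: "Strassburg", Year: 2025},
	Same: true,
	Note: "ß/ss spelling drift must not split one market into two",
}

func main() {
	fmt.Println(umlautDrift.Note)
}
```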

.gitignore adds .eval-cache.json and eval-report.json — neither
should land in the repo.

Tests cover metrics edge cases (all correct, imbalanced,
no-positive-predictions-no-NaN, calibration bucket assignment,
cache accounting, empty input) and cache behaviour (round-trip,
symmetric lookup, model-scoped invalidation, missing/corrupt file
handling, atomic-write leaves no temp files).
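The no-NaN case is worth spelling out: with zero positive predictions the precision denominator is 0, and float64 division would yield NaN. A sketch of the guard the tests lock down (function names are illustrative, not the real metrics.go API):

```go
package main

// precision guards tp+fp == 0 (no positive predictions): return 0, not NaN.
func precision(tp, fp int) float64 {
	if tp+fp == 0 {
		return 0
	}
	return float64(tp) / float64(tp+fp)
}

// recall guards tp+fn == 0 (no positive labels in the fixture).
func recall(tp, fn int) float64 {
	if tp+fn == 0 {
		return 0
	}
	return float64(tp) / float64(tp+fn)
}

// f1 guards p+r == 0 so the harmonic mean stays defined.
func f1(p, r float64) float64 {
	if p+r == 0 {
		return 0
	}
	return 2 * p * r / (p + r)
}
```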

Out of scope for MR 5: enrichment field accuracy (fuzzy text
scoring is its own problem — tracked for a follow-up), CI wiring
(needs a baseline F1 first).
2026-04-24 12:26:18 +02:00


package main

import (
	"context"
	"fmt"
	"log/slog"

	"marktvogt.de/backend/internal/domain/discovery/enrich"
)

// Result is one pair's eval outcome: the label, the verdict, and cache hit
// status (so the summary can report how much was actually paid for).
type Result struct {
	Pair      LabelledPair
	Verdict   CachedVerdict
	Correct   bool
	FromCache bool
}

// run executes the classifier against every pair in the fixture, populating
// the cache along the way. Never fails on individual classifier errors —
// those are reported as "not correct" with a prominent log line so the
// eval always finishes and reports whatever it has.
func run(ctx context.Context, classifier enrich.SimilarityClassifier, cache *Cache, fixture *Fixture, model string) ([]Result, error) {
	results := make([]Result, 0, len(fixture.Pairs))
	for i, p := range fixture.Pairs {
		if err := ctx.Err(); err != nil {
			return results, err
		}
		a := toSimRow(p.A)
		b := toSimRow(p.B)
		if v, ok := cache.Get(a, b, model); ok {
			results = append(results, Result{
				Pair:      p,
				Verdict:   v,
				Correct:   v.Same == p.Same,
				FromCache: true,
			})
			continue
		}
		verdict, err := classifier.Classify(ctx, a, b)
		if err != nil {
			slog.Warn("classify failed; counting as incorrect",
				"pair_index", i, "a_name", p.A.Name, "b_name", p.B.Name, "error", err)
			results = append(results, Result{
				Pair:    p,
				Verdict: CachedVerdict{Reason: fmt.Sprintf("error: %v", err)},
				Correct: false,
			})
			continue
		}
		cached := CachedVerdict{
			Same:       verdict.Same,
			Confidence: verdict.Confidence,
			Reason:     verdict.Reason,
			Model:      verdict.Model,
		}
		cache.Put(a, b, model, cached)
		results = append(results, Result{
			Pair:    p,
			Verdict: cached,
			Correct: cached.Same == p.Same,
		})
	}
	return results, nil
}

// toSimRow maps the fixture shape to the classifier input. NameNormalized
// defaults to Name when the fixture author didn't bother — eval pairs are
// typically written with display names only.
func toSimRow(r PairRow) enrich.SimilarityRow {
	nn := r.NameNormalized
	if nn == "" {
		nn = r.Name
	}
	return enrich.SimilarityRow{
		Name:           r.Name,
		Stadt:          r.Stadt,
		Year:           r.Year,
		NameNormalized: nn,
	}
}