feat(discovery): AI tiebreak for ambiguous similarity matches

Ship 2 MR 4. Adds per-pair AI-backed classification for operator use
inside the existing Similar panel: an "AI?" button next to each
candidate asks Mistral whether the two queue rows refer to the same
underlying market. Result shown inline as a green "✓ same N%" or
grey "✗ diff N%" chip with the LLM's reason on hover.

No scraping — the classifier works from (name, city, year) alone,
which is enough for the common cases (same venue on two calendars,
typos, cross-year recurrence). The call is short (usually <3s), so the
handler is synchronous with a 15s deadline.

Caching
- Migration 000020 adds similarity_ai_cache keyed on a content hash
  over (normalized_name|stadt|year) for both rows, sorted for
  symmetry. Survives queue row accept/reject because the hash is
  about markt-content, not queue-row lifecycle.
- enrich.SimilarityPairKey computes the key. Classify(a,b) and
  Classify(b,a) hit the same entry. Stadt casing drift doesn't
  invalidate.
- Repo methods GetSimilarityCache / SetSimilarityCache + corresponding
  mock hooks. DefaultSimilarityCacheTTL=30d.

Mistral integration
- enrich.MistralSimilarityClassifier reuses the same aiPass2
  interface as the enricher. English system prompt asks for
  JSON-only output with {same_market, confidence 0..1, reason}.
  Confidence clamped to [0,1] because models occasionally return
  1.2 or -0.1. Reason is short German justification.
- NoopSimilarityClassifier returns an error — callers must check
  ai.Enabled() before deciding which binding to pass.

Service.ClassifySimilarPair loads both rows, computes pair key,
cache-first, calls classifier on miss, writes cache, returns
verdict. Rejects self-comparison (pair-key collapses). Handler
POST /admin/discovery/queue/:aid/similar/:bid/classify.

UI: new AI? column inside the Similar panel. Per-candidate pending
state via Set<string>, disabled button while in-flight, inline
verdict chip after response. Tooltip shows the LLM's reason.

Tests: pair-key symmetry + differentiation + casing tolerance;
Mistral classifier happy path, clamping edge cases, error
propagation, bad-JSON handling, Noop rejection. Service tests:
happy path writes cache, cache-hit skips LLM, self-comparison
rejected, classifier errors don't poison the cache.

NewService signature grows by one param (sim enrich.SimilarityClassifier).
All 14 existing callers (routes.go + tests) updated; tests pass nil.
2026-04-24 11:04:15 +02:00
parent ce32f76731
commit e0b73acfd6
13 changed files with 703 additions and 22 deletions


@@ -0,0 +1,181 @@
package enrich
import (
"context"
"crypto/sha256"
"encoding/hex"
"encoding/json"
"errors"
"fmt"
"strings"
"time"
)
// SimilarityRow carries the minimal identifying fields the classifier reads.
// Callers adapt their domain row into this shape — the enrich package stays
// free of a reverse import on discovery.
type SimilarityRow struct {
NameNormalized string
Stadt string
// Year is StartDatum.Year() (or 0 when unknown). Two rows differing only
// in year are almost always the same series in different editions —
// useful signal but not identity.
Year int
// Display fields — shown to the LLM verbatim so it can reason about
// casing / diacritics that NameNormalized strips.
Name string
// Quellen are passed in but not scraped — the classifier works from
// name/city/date alone. Included in the prompt only as metadata.
Quellen []string
}
// Verdict is the classifier's answer about one pair.
type Verdict struct {
Same bool `json:"same"`
Confidence float64 `json:"confidence"` // 0..1
Reason string `json:"reason"`
Model string `json:"model,omitempty"`
ClassifiedAt time.Time `json:"classified_at,omitempty"`
}
// SimilarityClassifier decides whether two queue rows refer to the same
// underlying market. Implementations should be deterministic across calls
// on the same input — callers cache the result.
type SimilarityClassifier interface {
Classify(ctx context.Context, a, b SimilarityRow) (Verdict, error)
}
// NoopSimilarityClassifier returns an error without calling anything. Used
// as a fallback when AI is disabled; callers should check ai.Enabled() and
// fall back to this type rather than passing nil.
type NoopSimilarityClassifier struct{}
func (NoopSimilarityClassifier) Classify(_ context.Context, _, _ SimilarityRow) (Verdict, error) {
return Verdict{}, errors.New("similarity classifier not configured")
}
// SimilarityPairKey derives a content-hash cache key over the two rows'
// identifying tuples. Ordering-independent: Classify(a,b) and Classify(b,a)
// must hit the same cache entry.
//
// Uses NameNormalized + lowered Stadt + Year so the key survives casing
// drift, whitespace, and umlaut normalisation (NameNormalized already did
// the heavy lifting).
func SimilarityPairKey(a, b SimilarityRow) string {
keyA := fmt.Sprintf("%s|%s|%d", a.NameNormalized, lowerASCII(a.Stadt), a.Year)
keyB := fmt.Sprintf("%s|%s|%d", b.NameNormalized, lowerASCII(b.Stadt), b.Year)
// Sort lexicographically for symmetry.
var raw string
if keyA <= keyB {
raw = keyA + "||" + keyB
} else {
raw = keyB + "||" + keyA
}
sum := sha256.Sum256([]byte(raw))
return hex.EncodeToString(sum[:])
}
// DefaultSimilarityCacheTTL: 30 days matches the enrichment cache TTL —
// same reasoning (amortise cost across re-crawls, source edits eventually
// propagate).
const DefaultSimilarityCacheTTL = 30 * 24 * time.Hour
// MistralSimilarityClassifier implements SimilarityClassifier by sending a
// JSON-formatted comparison prompt to Mistral's chat endpoint.
type MistralSimilarityClassifier struct {
Client aiPass2
}
// NewMistralSimilarityClassifier binds a Mistral ai.Client. client must be
// non-nil; routes.go falls back to NoopSimilarityClassifier when AI is off.
func NewMistralSimilarityClassifier(client aiPass2) *MistralSimilarityClassifier {
return &MistralSimilarityClassifier{Client: client}
}
// simResponse is the JSON shape we instruct Mistral to return. Confidence
// must be parseable as a float 0..1; anything outside that range is clamped.
type simResponse struct {
SameMarket bool `json:"same_market"`
Confidence float64 `json:"confidence"`
Reason string `json:"reason"`
}
// Classify sends the paired metadata to Mistral and parses the JSON response.
// No web scraping — the classifier works from name/city/year alone, which is
// enough for the common cases (same venue listed on two different calendars,
// editing typos, cross-year recurrence).
func (m *MistralSimilarityClassifier) Classify(ctx context.Context, a, b SimilarityRow) (Verdict, error) {
if m.Client == nil {
return Verdict{}, errors.New("mistral similarity classifier not configured")
}
systemPrompt := simSystemPrompt()
userPrompt := simUserPrompt(a, b)
result, err := m.Client.Pass2(ctx, systemPrompt, userPrompt)
if err != nil {
return Verdict{}, fmt.Errorf("pass2: %w", err)
}
var parsed simResponse
if err := json.Unmarshal([]byte(result.Content), &parsed); err != nil {
return Verdict{}, fmt.Errorf("parse response: %w (content=%q)", err, result.Content)
}
// Clamp confidence to [0,1]; the model occasionally returns 1.2 or -0.1.
conf := parsed.Confidence
if conf < 0 {
conf = 0
}
if conf > 1 {
conf = 1
}
return Verdict{
Same: parsed.SameMarket,
Confidence: conf,
Reason: strings.TrimSpace(parsed.Reason),
Model: result.Model,
ClassifiedAt: time.Now().UTC(),
}, nil
}
func simSystemPrompt() string {
return strings.TrimSpace(`
You decide whether two candidate entries refer to the same medieval market
(Mittelaltermarkt) in the DACH region. Input: two objects each with a name,
city, and year. Output a single JSON object:
{
"same_market": true|false,
"confidence": 0.0-1.0, // how sure you are
"reason": "..." // short German justification (<= 140 chars)
}
Rules:
- Return ONLY the JSON object. No prose, no code fences.
- "Same market" means same recurring event — same venue, same organiser,
same audience. A market and its anniversary edition in a later year ARE
the same market (just different editions).
- Different cities = different markets, even if the name matches.
- Rephrasings, typos, and umlaut differences (Straßburg vs Strassburg)
  are the same market if the underlying identifiers align.
- If the evidence is weak, return same_market=false with low confidence
rather than guessing. Low confidence is more useful than a wrong guess.
`)
}
func simUserPrompt(a, b SimilarityRow) string {
// Keep the JSON compact; the model handles inline JSON better than
// pretty-printed when the task is "read two records".
ja, _ := json.Marshal(map[string]any{
"name": a.Name,
"city": a.Stadt,
"year": a.Year,
})
jb, _ := json.Marshal(map[string]any{
"name": b.Name,
"city": b.Stadt,
"year": b.Year,
})
return fmt.Sprintf("A: %s\nB: %s", ja, jb)
}


@@ -0,0 +1,118 @@
package enrich
import (
"context"
"errors"
"strings"
"testing"
"marktvogt.de/backend/internal/pkg/ai"
)
func TestSimilarityPairKey_Symmetric(t *testing.T) {
a := SimilarityRow{NameNormalized: "ritterfest dresden", Stadt: "Dresden", Year: 2026}
b := SimilarityRow{NameNormalized: "ritterfest leipzig", Stadt: "Leipzig", Year: 2026}
if SimilarityPairKey(a, b) != SimilarityPairKey(b, a) {
t.Error("pair key must be symmetric: (a,b) and (b,a) should produce identical keys")
}
}
func TestSimilarityPairKey_DifferentInputsDifferentKeys(t *testing.T) {
a := SimilarityRow{NameNormalized: "ritterfest dresden", Stadt: "Dresden", Year: 2026}
b := SimilarityRow{NameNormalized: "ritterfest leipzig", Stadt: "Leipzig", Year: 2026}
c := SimilarityRow{NameNormalized: "ritterfest dresden", Stadt: "Dresden", Year: 2027}
if SimilarityPairKey(a, b) == SimilarityPairKey(a, c) {
t.Error("different pairs must produce different keys")
}
// Stadt casing must not change the key.
d := SimilarityRow{NameNormalized: "ritterfest dresden", Stadt: "DRESDEN", Year: 2026}
if SimilarityPairKey(a, b) != SimilarityPairKey(d, b) {
t.Error("stadt casing drift must not change the key")
}
}
func TestMistralSimilarity_HappyPath(t *testing.T) {
client := &stubPass2{
result: ai.PassResult{
Content: `{"same_market":true,"confidence":0.82,"reason":"Gleicher Name, gleiche Stadt, gleiches Jahr."}`,
Model: "mistral-large-latest",
},
}
c := NewMistralSimilarityClassifier(client)
got, err := c.Classify(context.Background(),
SimilarityRow{Name: "Mittelaltermarkt Dresden", Stadt: "Dresden", Year: 2026},
SimilarityRow{Name: "Mittelaltermarkt Dresden 2026", Stadt: "Dresden", Year: 2026},
)
if err != nil {
t.Fatalf("unexpected error: %v", err)
}
if !got.Same {
t.Errorf("same = false; want true")
}
if got.Confidence < 0.8 || got.Confidence > 0.85 {
t.Errorf("confidence = %v; want ~0.82", got.Confidence)
}
if got.Reason == "" {
t.Error("reason missing")
}
if got.Model != "mistral-large-latest" {
t.Errorf("model = %q", got.Model)
}
// Prompt must carry both rows' identifying fields for the LLM to reason on.
if !strings.Contains(client.lastUser, "Mittelaltermarkt Dresden") {
t.Error("user prompt missing A.name")
}
if !strings.Contains(client.lastSystem, "same_market") {
t.Error("system prompt should describe the JSON schema (same_market key)")
}
}
func TestMistralSimilarity_ClampsConfidence(t *testing.T) {
tests := []struct {
name string
raw string
wantConf float64
}{
{"above 1 clamps to 1", `{"same_market":true,"confidence":1.4,"reason":"x"}`, 1.0},
{"below 0 clamps to 0", `{"same_market":false,"confidence":-0.3,"reason":"x"}`, 0.0},
{"in range passes through", `{"same_market":true,"confidence":0.5,"reason":"x"}`, 0.5},
}
for _, tc := range tests {
t.Run(tc.name, func(t *testing.T) {
c := NewMistralSimilarityClassifier(&stubPass2{result: ai.PassResult{Content: tc.raw}})
got, err := c.Classify(context.Background(), SimilarityRow{}, SimilarityRow{})
if err != nil {
t.Fatalf("unexpected error: %v", err)
}
if got.Confidence != tc.wantConf {
t.Errorf("confidence = %v; want %v", got.Confidence, tc.wantConf)
}
})
}
}
func TestMistralSimilarity_PropagatesPass2Error(t *testing.T) {
c := NewMistralSimilarityClassifier(&stubPass2{err: errors.New("mistral down")})
_, err := c.Classify(context.Background(), SimilarityRow{}, SimilarityRow{})
if err == nil {
t.Fatal("expected error; got nil")
}
}
func TestMistralSimilarity_RejectsBadJSON(t *testing.T) {
c := NewMistralSimilarityClassifier(&stubPass2{result: ai.PassResult{Content: "not json at all"}})
_, err := c.Classify(context.Background(), SimilarityRow{}, SimilarityRow{})
if err == nil {
t.Fatal("expected parse error; got nil")
}
}
func TestNoopSimilarityClassifier_Errors(t *testing.T) {
_, err := NoopSimilarityClassifier{}.Classify(context.Background(), SimilarityRow{}, SimilarityRow{})
if err == nil {
t.Error("NoopSimilarityClassifier should return error — it's the fallback when AI is disabled")
}
}


@@ -386,6 +386,36 @@ func (h *Handler) EnrichLLM(c *gin.Context) {
c.JSON(http.StatusOK, gin.H{"data": payload})
}
// ClassifySimilarPair runs the LLM duplicate-tiebreaker on the two queue
// rows identified by URL params :aid and :bid. Synchronous, 15s deadline —
// the call is short (no scraping) so the operator can click and immediately
// see the verdict.
func (h *Handler) ClassifySimilarPair(c *gin.Context) {
aID, err := uuid.Parse(c.Param("aid"))
if err != nil {
apiErr := apierror.BadRequest("invalid_id", "invalid queue id A")
c.JSON(apiErr.Status, apierror.NewResponse(apiErr))
return
}
bID, err := uuid.Parse(c.Param("bid"))
if err != nil {
apiErr := apierror.BadRequest("invalid_id", "invalid queue id B")
c.JSON(apiErr.Status, apierror.NewResponse(apiErr))
return
}
ctx, cancel := context.WithTimeout(c.Request.Context(), 15*time.Second)
defer cancel()
verdict, err := h.service.ClassifySimilarPair(ctx, aID, bID)
if err != nil {
slog.WarnContext(ctx, "classify similar failed", "a", aID, "b", bID, "error", err)
apiErr := apierror.Internal("classify failed: " + err.Error())
c.JSON(apiErr.Status, apierror.NewResponse(apiErr))
return
}
c.JSON(http.StatusOK, gin.H{"data": verdict})
}
func currentUserID(c *gin.Context) (uuid.UUID, bool) {
raw, exists := c.Get("user_id")
if !exists {


@@ -57,6 +57,7 @@ func TestCrawlHandlerReturns202AndStartsCrawl(t *testing.T) {
noopMarketCreator{},
nil,
nil,
nil,
)
h := NewHandler(svc, 0) // rate limit disabled
@@ -91,7 +92,7 @@ func TestCrawlHandlerReturns202AndStartsCrawl(t *testing.T) {
// TestCrawlStatusInitialState verifies the zero state of a freshly constructed Handler.
func TestCrawlStatusInitialState(t *testing.T) {
-svc := NewService(newMockRepo(), &stubCrawlerRunner{}, noopLinkVerifier{}, noopMarketCreator{}, nil, nil)
+svc := NewService(newMockRepo(), &stubCrawlerRunner{}, noopLinkVerifier{}, noopMarketCreator{}, nil, nil, nil)
h := NewHandler(svc, 0)
w := httptest.NewRecorder()
@@ -141,7 +142,7 @@ func TestCrawlHandlerConcurrentReturnsTooManyRequests(t *testing.T) {
started: make(chan struct{}),
release: make(chan struct{}),
}
-svc := NewService(newMockRepo(), bc, noopLinkVerifier{}, noopMarketCreator{}, nil, nil)
+svc := NewService(newMockRepo(), bc, noopLinkVerifier{}, noopMarketCreator{}, nil, nil, nil)
h := NewHandler(svc, 0) // rate limit disabled
// First request — returns 202 and spawns goroutine.
@@ -184,6 +185,7 @@ func TestCrawlHandlerRateLimit(t *testing.T) {
noopMarketCreator{},
nil,
nil,
nil,
)
// 1 per hour window.
h := NewHandler(svc, 1)


@@ -36,6 +36,10 @@ type mockRepo struct {
getCacheFn func(key string) (enrich.Enrichment, bool, error)
setCacheFn func(key string, payload enrich.Enrichment, ttl time.Duration) error
listPendingEnrichFn func(limit int) ([]DiscoveredMarket, error)
// Similarity AI cache hooks.
getSimCacheFn func(pairKey string) (enrich.Verdict, bool, error)
setSimCacheFn func(pairKey string, v enrich.Verdict, ttl time.Duration) error
}
func (m *mockRepo) ListSeriesByCity(ctx context.Context, c string) ([]SeriesCandidate, error) {
@@ -122,6 +126,18 @@ func (m *mockRepo) ListPendingEnrichment(_ context.Context, limit int) ([]Discov
}
return nil, nil
}
func (m *mockRepo) GetSimilarityCache(_ context.Context, pairKey string) (enrich.Verdict, bool, error) {
if m.getSimCacheFn != nil {
return m.getSimCacheFn(pairKey)
}
return enrich.Verdict{}, false, nil
}
func (m *mockRepo) SetSimilarityCache(_ context.Context, pairKey string, v enrich.Verdict, ttl time.Duration) error {
if m.setSimCacheFn != nil {
return m.setSimCacheFn(pairKey, v, ttl)
}
return nil
}
// noopLinkVerifier passes every URL — used by tests to isolate from network.
type noopLinkVerifier struct{}


@@ -40,6 +40,10 @@ type Repository interface {
// Cache operations keyed on sha256(name_normalized|stadt|year).
GetEnrichmentCache(ctx context.Context, key string) (enrich.Enrichment, bool, error)
SetEnrichmentCache(ctx context.Context, key string, payload enrich.Enrichment, ttl time.Duration) error
// Similarity AI cache — keyed on enrich.SimilarityPairKey.
GetSimilarityCache(ctx context.Context, pairKey string) (enrich.Verdict, bool, error)
SetSimilarityCache(ctx context.Context, pairKey string, v enrich.Verdict, ttl time.Duration) error
}
// SeriesCandidate is a minimal projection used for name-normalization comparison in Go.
@@ -426,3 +430,43 @@ ON CONFLICT (cache_key) DO UPDATE
}
return nil
}
// GetSimilarityCache returns a cached AI verdict for a (pairKey) or
// (zero, false, nil) on miss/expiry. Expired entries are treated as misses.
func (r *pgRepository) GetSimilarityCache(ctx context.Context, pairKey string) (enrich.Verdict, bool, error) {
var v enrich.Verdict
err := r.pool.QueryRow(ctx, `
SELECT same, confidence, reason, model FROM similarity_ai_cache
WHERE pair_key = $1
AND (expires_at IS NULL OR expires_at > now())`, pairKey).Scan(&v.Same, &v.Confidence, &v.Reason, &v.Model)
if errors.Is(err, pgx.ErrNoRows) {
return enrich.Verdict{}, false, nil
}
if err != nil {
return enrich.Verdict{}, false, fmt.Errorf("similarity cache get: %w", err)
}
return v, true, nil
}
// SetSimilarityCache upserts a verdict. ttl=0 means "no expiry" (nullable).
func (r *pgRepository) SetSimilarityCache(ctx context.Context, pairKey string, v enrich.Verdict, ttl time.Duration) error {
var expiresAt *time.Time
if ttl > 0 {
t := time.Now().Add(ttl)
expiresAt = &t
}
_, err := r.pool.Exec(ctx, `
INSERT INTO similarity_ai_cache (pair_key, same, confidence, reason, model, expires_at)
VALUES ($1, $2, $3, $4, $5, $6)
ON CONFLICT (pair_key) DO UPDATE
SET same = EXCLUDED.same,
confidence = EXCLUDED.confidence,
reason = EXCLUDED.reason,
model = EXCLUDED.model,
created_at = now(),
expires_at = EXCLUDED.expires_at`, pairKey, v.Same, v.Confidence, v.Reason, v.Model, expiresAt)
if err != nil {
return fmt.Errorf("similarity cache set: %w", err)
}
return nil
}


@@ -26,6 +26,8 @@ func RegisterRoutes(
admin.GET("/queue/:id/similar", h.Similar)
// Per-row LLM enrichment (MR 3b). Synchronous — operator waits.
admin.POST("/queue/:id/enrich", h.EnrichLLM)
// Per-pair AI similarity tiebreak (MR 4). Synchronous; short call.
admin.POST("/queue/:aid/similar/:bid/classify", h.ClassifySimilarPair)
// Manual crawl trigger — subject to hourly rate limit.
admin.POST("/crawl-manual", h.Crawl)
// Async crawl status polling.


@@ -57,13 +57,17 @@ type Service struct {
// llmEnricher is the AI-backed fallback pass. Nil-safe via NoopLLMEnricher
// in test wiring; production code passes a real MistralLLMEnricher.
llmEnricher enrich.LLMEnricher
// simClassifier is the AI-backed duplicate tiebreaker. Nil-safe via
// NoopSimilarityClassifier.
simClassifier enrich.SimilarityClassifier
}
// NewService constructs a Service wired for the crawler-driven Crawl path.
// geocoder may be nil; in that case crawl-enrich runs consolidation only and
// skips the lat/lng step. llm may be nil; per-row LLM enrichment then
-// returns an error instead of attempting a call.
-func NewService(repo Repository, cr crawlerRunner, lc linkVerifier, mc marketCreator, gc Geocoder, llm enrich.LLMEnricher) *Service {
+// returns an error instead of attempting a call. simClassifier may be nil;
+// ClassifySimilarPair returns an error rather than a zero-confidence answer.
+func NewService(repo Repository, cr crawlerRunner, lc linkVerifier, mc marketCreator, gc Geocoder, llm enrich.LLMEnricher, sim enrich.SimilarityClassifier) *Service {
return &Service{
repo: repo,
crawler: cr,
@@ -71,6 +75,7 @@ func NewService(repo Repository, cr crawlerRunner, lc linkVerifier, mc marketCre
linkChecker: lc,
geocoder: gc,
llmEnricher: llm,
simClassifier: sim,
}
}
@@ -595,6 +600,68 @@ func (s *Service) RunLLMEnrichOne(ctx context.Context, queueID uuid.UUID) (enric
return merged, nil
}
// ClassifySimilarPair runs the AI classifier on the two queue rows identified
// by aID and bID, returning a verdict about whether they're the same market.
// Cache-first: a content-keyed entry (enrich.SimilarityPairKey) shortcuts the
// LLM call when the same pair has been classified before.
//
// Intended for operator-triggered "AI tiebreak" on ambiguous similarity
// matches. The crawl-time auto-merge in MR 7 will call this on its own.
func (s *Service) ClassifySimilarPair(ctx context.Context, aID, bID uuid.UUID) (enrich.Verdict, error) {
if s.simClassifier == nil {
return enrich.Verdict{}, errors.New("similarity classifier not configured")
}
if aID == bID {
return enrich.Verdict{}, errors.New("cannot classify a row against itself")
}
a, err := s.repo.GetDiscovered(ctx, aID)
if err != nil {
return enrich.Verdict{}, fmt.Errorf("load row A: %w", err)
}
b, err := s.repo.GetDiscovered(ctx, bID)
if err != nil {
return enrich.Verdict{}, fmt.Errorf("load row B: %w", err)
}
rowA := rowToSimilarity(a)
rowB := rowToSimilarity(b)
pairKey := enrich.SimilarityPairKey(rowA, rowB)
if cached, hit, err := s.repo.GetSimilarityCache(ctx, pairKey); err != nil {
slog.WarnContext(ctx, "similarity cache get failed; continuing",
"pair_key", pairKey, "error", err)
} else if hit {
return cached, nil
}
verdict, err := s.simClassifier.Classify(ctx, rowA, rowB)
if err != nil {
return enrich.Verdict{}, fmt.Errorf("classify: %w", err)
}
if err := s.repo.SetSimilarityCache(ctx, pairKey, verdict, enrich.DefaultSimilarityCacheTTL); err != nil {
slog.WarnContext(ctx, "similarity cache set failed; continuing",
"pair_key", pairKey, "error", err)
}
return verdict, nil
}
// rowToSimilarity adapts a DiscoveredMarket to the narrow SimilarityRow the
// enrich package consumes. Year comes from StartDatum (0 when unknown).
func rowToSimilarity(r DiscoveredMarket) enrich.SimilarityRow {
year := 0
if r.StartDatum != nil {
year = r.StartDatum.Year()
}
return enrich.SimilarityRow{
NameNormalized: r.NameNormalized,
Stadt: r.Stadt,
Year: year,
Name: r.MarktName,
Quellen: r.Quellen,
}
}
// CrawlEnrichSummary reports the outcome of one RunCrawlEnrichAll pass.
// Mirrors CrawlSummary's shape so the admin UI can reuse its render path.
type CrawlEnrichSummary struct {


@@ -147,7 +147,7 @@ func TestAccept_NewSeries_CallsCreate(t *testing.T) {
markAcceptedFn: func(_ context.Context, _ pgx.Tx, _, _, _ uuid.UUID) error { return nil },
}
mc := &stubCreator{}
-svc := NewService(m, nil, noopLinkVerifier{}, mc, nil, nil)
+svc := NewService(m, nil, noopLinkVerifier{}, mc, nil, nil, nil)
_, _, err := svc.Accept(context.Background(), qID, uuid.New())
if err != nil {
t.Fatalf("accept err: %v", err)
@@ -169,7 +169,7 @@ func TestAccept_ExistingSeries_CallsCreateEditionForSeries(t *testing.T) {
markAcceptedFn: func(_ context.Context, _ pgx.Tx, _, _, _ uuid.UUID) error { return nil },
}
mc := &stubCreator{}
-svc := NewService(m, nil, noopLinkVerifier{}, mc, nil, nil)
+svc := NewService(m, nil, noopLinkVerifier{}, mc, nil, nil, nil)
_, _, err := svc.Accept(context.Background(), uuid.New(), uuid.New())
if err != nil {
t.Fatalf("accept err: %v", err)
@@ -200,7 +200,7 @@ func TestServiceCrawlHappyPath(t *testing.T) {
PerSourceMS: map[string]int64{"marktkalendarium": 1},
},
}
-svc := NewService(repo, sc, lc, noopMarketCreator{}, nil, nil)
+svc := NewService(repo, sc, lc, noopMarketCreator{}, nil, nil, nil)
summary, err := svc.Crawl(context.Background())
if err != nil {
@@ -241,7 +241,7 @@ func TestServiceCrawlDedupQueue(t *testing.T) {
},
},
}
-svc := NewService(repo, sc, noopLinkVerifier{}, noopMarketCreator{}, nil, nil)
+svc := NewService(repo, sc, noopLinkVerifier{}, noopMarketCreator{}, nil, nil, nil)
summary, err := svc.Crawl(context.Background())
if err != nil {
@@ -272,7 +272,7 @@ func TestServiceCrawlDefaultsEndDate(t *testing.T) {
},
},
}
-svc := NewService(repo, sc, noopLinkVerifier{}, noopMarketCreator{}, nil, nil)
+svc := NewService(repo, sc, noopLinkVerifier{}, noopMarketCreator{}, nil, nil, nil)
if _, err := svc.Crawl(context.Background()); err != nil {
t.Fatal(err)
@@ -318,7 +318,7 @@ func TestServiceCrawlDetachesInsertContextFromRequestCtx(t *testing.T) {
},
},
}
-svc := NewService(repo, sc, ctxAwareLinkVerifier{}, noopMarketCreator{}, nil, nil)
+svc := NewService(repo, sc, ctxAwareLinkVerifier{}, noopMarketCreator{}, nil, nil, nil)
// Cancel the context BEFORE Crawl runs — simulates gateway timeout
// that fires while the handler is still mid-run.
@@ -343,7 +343,7 @@ func TestListPendingQueuePaged_ReturnsBothRowsAndTotal(t *testing.T) {
m := &mockRepo{
countQueueFn: func(_ context.Context, _ string) (int, error) { return 42, nil },
}
-svc := NewService(m, nil, noopLinkVerifier{}, noopMarketCreator{}, nil, nil)
+svc := NewService(m, nil, noopLinkVerifier{}, noopMarketCreator{}, nil, nil, nil)
rows, total, err := svc.ListPendingQueuePaged(context.Background(), 50, 0)
if err != nil {
t.Fatalf("unexpected error: %v", err)
@@ -375,7 +375,7 @@ func TestServiceCrawlPersistsSourcesAndContributions(t *testing.T) {
},
},
}
-svc := NewService(repo, sc, noopLinkVerifier{}, noopMarketCreator{}, nil, nil)
+svc := NewService(repo, sc, noopLinkVerifier{}, noopMarketCreator{}, nil, nil, nil)
if _, err := svc.Crawl(context.Background()); err != nil {
t.Fatal(err)
@@ -424,7 +424,7 @@ func TestServiceCrawlMultiSourceHighKonfidenz(t *testing.T) {
},
},
}
-svc := NewService(repo, sc, noopLinkVerifier{}, noopMarketCreator{}, nil, nil)
+svc := NewService(repo, sc, noopLinkVerifier{}, noopMarketCreator{}, nil, nil, nil)
summary, err := svc.Crawl(context.Background())
if err != nil {
@@ -486,7 +486,7 @@ func TestRunCrawlEnrichAll_HappyPath(t *testing.T) {
},
}
gc := stubGeocoder{lat: ptrFloat(51.05), lng: ptrFloat(13.74)}
-svc := NewService(repo, nil, noopLinkVerifier{}, noopMarketCreator{}, gc, nil)
+svc := NewService(repo, nil, noopLinkVerifier{}, noopMarketCreator{}, gc, nil, nil)
summary, err := svc.RunCrawlEnrichAll(context.Background())
if err != nil {
@@ -547,7 +547,7 @@ func TestRunCrawlEnrichAll_SetEnrichmentFailure(t *testing.T) {
return nil
},
}
-svc := NewService(repo, nil, noopLinkVerifier{}, noopMarketCreator{}, nil, nil)
+svc := NewService(repo, nil, noopLinkVerifier{}, noopMarketCreator{}, nil, nil, nil)
summary, err := svc.RunCrawlEnrichAll(context.Background())
if err != nil {
@@ -639,7 +639,7 @@ func TestRunLLMEnrichOne_HappyPath(t *testing.T) {
},
}
llm := &stubLLMEnricher{result: llmResult}
-svc := NewService(repo, nil, noopLinkVerifier{}, noopMarketCreator{}, nil, llm)
+svc := NewService(repo, nil, noopLinkVerifier{}, noopMarketCreator{}, nil, llm, nil)
got, err := svc.RunLLMEnrichOne(context.Background(), rowID)
if err != nil {
@@ -709,7 +709,7 @@ func TestRunLLMEnrichOne_CacheHitSkipsLLM(t *testing.T) {
},
}
llm := &stubLLMEnricher{}
-svc := NewService(repo, nil, noopLinkVerifier{}, noopMarketCreator{}, nil, llm)
+svc := NewService(repo, nil, noopLinkVerifier{}, noopMarketCreator{}, nil, llm, nil)
got, err := svc.RunLLMEnrichOne(context.Background(), rowID)
if err != nil {
@@ -738,7 +738,7 @@ func TestRunLLMEnrichOne_LLMErrorMarksFailed(t *testing.T) {
},
}
llm := &stubLLMEnricher{err: errors.New("mistral down")}
-svc := NewService(repo, nil, noopLinkVerifier{}, noopMarketCreator{}, nil, llm)
+svc := NewService(repo, nil, noopLinkVerifier{}, noopMarketCreator{}, nil, llm, nil)
_, err := svc.RunLLMEnrichOne(context.Background(), rowID)
if err == nil {
@@ -761,7 +761,7 @@ func TestRunCrawlEnrichAll_EmptyQueueNoOp(t *testing.T) {
			return nil
		},
	}
-	svc := NewService(repo, nil, noopLinkVerifier{}, noopMarketCreator{}, nil, nil)
+	svc := NewService(repo, nil, noopLinkVerifier{}, noopMarketCreator{}, nil, nil, nil)
	summary, err := svc.RunCrawlEnrichAll(context.Background())
	if err != nil {
@@ -774,3 +774,129 @@ func TestRunCrawlEnrichAll_EmptyQueueNoOp(t *testing.T) {
		t.Errorf("SetEnrichment called %d times on empty queue", writes)
	}
}
// stubSimilarityClassifier returns canned verdicts or errors.
type stubSimilarityClassifier struct {
	result enrich.Verdict
	err    error
	calls  int
}

func (s *stubSimilarityClassifier) Classify(_ context.Context, _, _ enrich.SimilarityRow) (enrich.Verdict, error) {
	s.calls++
	return s.result, s.err
}
// TestClassifySimilarPair_HappyPath: cache miss → LLM → cache write → return.
func TestClassifySimilarPair_HappyPath(t *testing.T) {
	aID, bID := uuid.New(), uuid.New()
	start := time.Date(2026, 5, 1, 0, 0, 0, 0, time.UTC)
	rowA := DiscoveredMarket{ID: aID, MarktName: "Ritterfest Dresden", Stadt: "Dresden", NameNormalized: "ritterfest dresden", StartDatum: &start}
	rowB := DiscoveredMarket{ID: bID, MarktName: "Mittelaltermarkt Dresden 2026", Stadt: "Dresden", NameNormalized: "mittelaltermarkt dresden", StartDatum: &start}
	var cacheSet struct {
		called  bool
		verdict enrich.Verdict
	}
	repo := &mockRepo{
		getDiscoveredFn: func(_ context.Context, id uuid.UUID) (DiscoveredMarket, error) {
			if id == aID {
				return rowA, nil
			}
			return rowB, nil
		},
		setSimCacheFn: func(_ string, v enrich.Verdict, _ time.Duration) error {
			cacheSet.called = true
			cacheSet.verdict = v
			return nil
		},
	}
	sim := &stubSimilarityClassifier{
		result: enrich.Verdict{Same: false, Confidence: 0.6, Reason: "Unterschiedliche Namen."},
	}
	svc := NewService(repo, nil, noopLinkVerifier{}, noopMarketCreator{}, nil, nil, sim)
	got, err := svc.ClassifySimilarPair(context.Background(), aID, bID)
	if err != nil {
		t.Fatalf("unexpected error: %v", err)
	}
	if sim.calls != 1 {
		t.Errorf("classifier called %d times; want 1", sim.calls)
	}
	if got.Same || got.Confidence != 0.6 {
		t.Errorf("verdict = %+v; want same=false, confidence=0.6", got)
	}
	if !cacheSet.called {
		t.Error("expected SetSimilarityCache to be called on a cache miss")
	}
	if cacheSet.verdict.Confidence != 0.6 {
		t.Errorf("cached verdict lost confidence: %+v", cacheSet.verdict)
	}
}
// TestClassifySimilarPair_CacheHitSkipsLLM: cache hit returns directly,
// no classifier call.
func TestClassifySimilarPair_CacheHitSkipsLLM(t *testing.T) {
	aID, bID := uuid.New(), uuid.New()
	cached := enrich.Verdict{Same: true, Confidence: 0.9, Reason: "same venue"}
	repo := &mockRepo{
		getDiscoveredFn: func(context.Context, uuid.UUID) (DiscoveredMarket, error) {
			return DiscoveredMarket{}, nil
		},
		getSimCacheFn: func(string) (enrich.Verdict, bool, error) {
			return cached, true, nil
		},
	}
	sim := &stubSimilarityClassifier{}
	svc := NewService(repo, nil, noopLinkVerifier{}, noopMarketCreator{}, nil, nil, sim)
	got, err := svc.ClassifySimilarPair(context.Background(), aID, bID)
	if err != nil {
		t.Fatalf("unexpected error: %v", err)
	}
	if sim.calls != 0 {
		t.Errorf("classifier called %d times on cache hit; want 0", sim.calls)
	}
	if !got.Same || got.Confidence != 0.9 {
		t.Errorf("cached verdict not returned: %+v", got)
	}
}
// TestClassifySimilarPair_RejectsSelfComparison: the pair-key scheme would
// collapse (a,a) to a single key which never tells you anything useful.
func TestClassifySimilarPair_RejectsSelfComparison(t *testing.T) {
	id := uuid.New()
	svc := NewService(&mockRepo{}, nil, noopLinkVerifier{}, noopMarketCreator{}, nil, nil, &stubSimilarityClassifier{})
	_, err := svc.ClassifySimilarPair(context.Background(), id, id)
	if err == nil {
		t.Error("expected error on self-comparison; got nil")
	}
}
// TestClassifySimilarPair_LLMErrorPropagates: classifier errors surface;
// cache is not written.
func TestClassifySimilarPair_LLMErrorPropagates(t *testing.T) {
	aID, bID := uuid.New(), uuid.New()
	cacheWritten := false
	repo := &mockRepo{
		getDiscoveredFn: func(context.Context, uuid.UUID) (DiscoveredMarket, error) {
			return DiscoveredMarket{}, nil
		},
		setSimCacheFn: func(string, enrich.Verdict, time.Duration) error {
			cacheWritten = true
			return nil
		},
	}
	sim := &stubSimilarityClassifier{err: errors.New("mistral 500")}
	svc := NewService(repo, nil, noopLinkVerifier{}, noopMarketCreator{}, nil, nil, sim)
	_, err := svc.ClassifySimilarPair(context.Background(), aID, bID)
	if err == nil {
		t.Fatal("expected error; got nil")
	}
	if cacheWritten {
		t.Error("cache should not be written when classifier errors")
	}
}
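The flow these tests pin down (self-comparison guard → symmetric key → cache-first → classifier on miss → cache write, never on error) can be sketched in isolation. Everything below — the `pairService` type, the string keys, the map-backed cache — is a stand-in for illustration, not the real `Service.ClassifySimilarPair` or its repo types:

```go
package main

import (
	"errors"
	"fmt"
)

// verdict is a stand-in for enrich.Verdict.
type verdict struct {
	Same       bool
	Confidence float64
	Reason     string
}

// pairService is a toy model: a map-backed cache plus a pluggable classifier.
type pairService struct {
	cache    map[string]verdict
	classify func(a, b string) (verdict, error)
}

// classifyPair mirrors the cache-first flow under test: reject self-comparison,
// build a symmetric key, return a cached verdict if present, otherwise classify
// and cache — but never cache on classifier error.
func (s *pairService) classifyPair(a, b string) (verdict, error) {
	if a == b {
		return verdict{}, errors.New("self-comparison: pair key would collapse")
	}
	key := a + "|" + b
	if b < a { // sort the pair so (a,b) and (b,a) share one cache entry
		key = b + "|" + a
	}
	if v, ok := s.cache[key]; ok {
		return v, nil // cache hit: classifier never runs
	}
	v, err := s.classify(a, b)
	if err != nil {
		return verdict{}, err // error propagates; cache stays unwritten
	}
	s.cache[key] = v
	return v, nil
}

func main() {
	calls := 0
	svc := &pairService{
		cache: map[string]verdict{},
		classify: func(a, b string) (verdict, error) {
			calls++
			return verdict{Same: false, Confidence: 0.6, Reason: "different names"}, nil
		},
	}
	svc.classifyPair("a", "b")
	svc.classifyPair("b", "a") // symmetric: served from cache
	fmt.Println(calls)         // prints 1
}
```

The happy-path and cache-hit tests above assert exactly these two properties: one classifier call per distinct pair, and zero calls when the cache already holds a verdict.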


@@ -79,11 +79,13 @@ func (s *Server) registerRoutes() {
	// Per-row LLM enrichment (MR 3b). Operator-triggered only; disabled rows
	// fall through via NoopLLMEnricher when AI isn't configured.
	var llmEnricher enrich.LLMEnricher = enrich.NoopLLMEnricher{}
	var simClassifier enrich.SimilarityClassifier = enrich.NoopSimilarityClassifier{}
	if aiClient.Enabled() {
		scraper := scrape.New(s.cfg.Discovery.CrawlerUserAgent)
		llmEnricher = enrich.NewMistralLLMEnricher(aiClient, scraper)
		simClassifier = enrich.NewMistralSimilarityClassifier(aiClient)
	}
-	discoveryService := discovery.NewService(discoveryRepo, crawlerInstance, discovery.NewLinkChecker(), marketSvc, geocoder, llmEnricher)
+	discoveryService := discovery.NewService(discoveryRepo, crawlerInstance, discovery.NewLinkChecker(), marketSvc, geocoder, llmEnricher, simClassifier)
	discoveryHandler := discovery.NewHandler(discoveryService, s.cfg.Discovery.CrawlerManualRateLimitPerHour)
	requireTickToken := middleware.RequireBearerToken(s.cfg.Discovery.Token)
	discovery.RegisterRoutes(v1, discoveryHandler, requireAuth, requireAdmin, requireTickToken)


@@ -0,0 +1,2 @@
DROP INDEX IF EXISTS idx_similarity_ai_cache_expires_at;
DROP TABLE IF EXISTS similarity_ai_cache;


@@ -0,0 +1,18 @@
-- Cache for LLM-based similarity verdicts. Pair key is a sha256 over the
-- content tuple (normalized_name|stadt|year for both rows, sorted) — NOT
-- over queue UUIDs, so the cache survives queue row deletion (accept/reject)
-- while still invalidating correctly when a row's identifying fields change.
CREATE TABLE similarity_ai_cache (
    pair_key   text PRIMARY KEY,
    same       bool NOT NULL,
    confidence real NOT NULL,
    reason     text NOT NULL DEFAULT '',
    model      text NOT NULL DEFAULT '',
    created_at timestamptz NOT NULL DEFAULT now(),
    expires_at timestamptz
);
-- Opportunistic pruning; workers or manual jobs DELETE rows WHERE expires_at < now().
CREATE INDEX idx_similarity_ai_cache_expires_at
ON similarity_ai_cache (expires_at)
WHERE expires_at IS NOT NULL;
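The pair key the table comment describes can be sketched as follows. The `pairKey` helper below is hypothetical — not the real `enrich.SimilarityPairKey` — and assumes names arrive pre-normalized, stadt is lower-cased, and the two content tuples are sorted before hashing for symmetry:

```go
package main

import (
	"crypto/sha256"
	"encoding/hex"
	"fmt"
	"sort"
	"strings"
)

// pairKey hashes the content tuple "normalized_name|stadt|year" of both rows.
// Sorting the two tuples first makes the key symmetric, and lower-casing stadt
// keeps casing drift from invalidating entries. Illustrative only.
func pairKey(nameA, stadtA string, yearA int, nameB, stadtB string, yearB int) string {
	tuples := []string{
		fmt.Sprintf("%s|%s|%d", nameA, strings.ToLower(stadtA), yearA),
		fmt.Sprintf("%s|%s|%d", nameB, strings.ToLower(stadtB), yearB),
	}
	sort.Strings(tuples)
	sum := sha256.Sum256([]byte(strings.Join(tuples, "\x1f")))
	return hex.EncodeToString(sum[:])
}

func main() {
	k1 := pairKey("ritterfest dresden", "Dresden", 2026, "mittelaltermarkt dresden", "dresden", 2026)
	k2 := pairKey("mittelaltermarkt dresden", "dresden", 2026, "ritterfest dresden", "DRESDEN", 2026)
	fmt.Println(k1 == k2) // prints true: argument order and casing don't change the key
}
```

Because the key is derived from markt content rather than queue-row UUIDs, a cache entry survives accept/reject of the queue rows themselves, matching the migration comment above.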


@@ -99,6 +99,7 @@
		similarOpenId = id;
		similarLoading = true;
		similarEntries = [];
		similarVerdicts = {};
		try {
			const res = await fetch(`/admin/discovery/queue/${id}/similar`);
			if (!res.ok) {
@@ -114,6 +115,53 @@
		}
	}
	// Per-pair AI similarity verdict. Keyed on the candidate's queue id since
	// the "anchor" row (similarOpenId) is already known from context.
	type SimilarityVerdict = {
		same: boolean;
		confidence: number;
		reason: string;
		model?: string;
		classified_at?: string;
	};

	let similarVerdicts = $state<Record<string, SimilarityVerdict>>({});
	let similarClassifying = $state(new Set<string>());

	async function classifySimilar(anchorId: string, candidateId: string) {
		if (similarClassifying.has(candidateId)) return;
		const next = new Set(similarClassifying);
		next.add(candidateId);
		similarClassifying = next;
		try {
			const res = await fetch(
				`/admin/discovery/queue/${anchorId}/similar/${candidateId}/classify`,
				{ method: 'POST' }
			);
			if (!res.ok) {
				similarVerdicts = {
					...similarVerdicts,
					[candidateId]: { same: false, confidence: 0, reason: `HTTP ${res.status}` }
				};
				return;
			}
			const body = await res.json();
			similarVerdicts = { ...similarVerdicts, [candidateId]: body.data };
		} catch (err) {
			similarVerdicts = {
				...similarVerdicts,
				[candidateId]: {
					same: false,
					confidence: 0,
					reason: err instanceof Error ? err.message : 'Fehler'
				}
			};
		} finally {
			const afterNext = new Set(similarClassifying);
			afterNext.delete(candidateId);
			similarClassifying = afterNext;
		}
	}
	// Pagination helpers.
	const totalPages = $derived(Math.ceil((data.total ?? 0) / data.limit));
@@ -777,7 +825,8 @@
	<th class="pr-4 pb-1 font-medium">Markt</th>
	<th class="pr-4 pb-1 font-medium">Stadt</th>
	<th class="pr-4 pb-1 font-medium">Datum</th>
-	<th class="pb-1 font-medium">Konfidenz</th>
+	<th class="pr-4 pb-1 font-medium">Konfidenz</th>
	<th class="pb-1 font-medium">AI-Verdict</th>
</tr>
</thead>
<tbody>
@@ -791,7 +840,7 @@
	<td class="py-1 pr-4 whitespace-nowrap"
		>{fmtDate(m.entry.start_datum)}</td
	>
-	<td class="py-1">
+	<td class="py-1 pr-4">
		<span
			class="inline-block rounded px-1.5 py-0.5 {konfidenzClass(
				m.entry.konfidenz
@@ -800,6 +849,30 @@
			{m.entry.konfidenz || '—'}
		</span>
	</td>
	<td class="py-1">
		{#if similarVerdicts[m.entry.id]}
			{@const v = similarVerdicts[m.entry.id]}
			<span
				class="inline-block rounded px-1.5 py-0.5 text-[10px] {v.same
					? 'bg-emerald-100 text-emerald-700 dark:bg-emerald-900/50 dark:text-emerald-300'
					: 'bg-stone-200 text-stone-700 dark:bg-stone-700 dark:text-stone-200'}"
				title={v.reason}
			>
				{v.same ? '✓ same' : '✗ diff'}
				{(v.confidence * 100).toFixed(0)}%
			</span>
		{:else}
			<button
				type="button"
				disabled={similarClassifying.has(m.entry.id)}
				onclick={() => classifySimilar(row.id, m.entry.id)}
				class="rounded bg-purple-100 px-1.5 py-0.5 text-[10px] text-purple-700 hover:bg-purple-200 disabled:cursor-not-allowed disabled:opacity-60 dark:bg-purple-900/50 dark:text-purple-300 dark:hover:bg-purple-900"
				title="LLM-Tiebreak: sind das derselbe Markt?"
			>
				{similarClassifying.has(m.entry.id) ? 'AI…' : 'AI?'}
			</button>
		{/if}
	</td>
	</tr>
{/each}
</tbody>