Prechádzať zdrojové kódy

atlas2-mcp: resolver strategies, confidence-aware cache, embeddings ranking, tests

Lukas Goldschmidt 1 mesiac pred
rodič
commit
8ff17fe8fb

+ 3 - 0
.env.example

@@ -8,3 +8,6 @@ REMOTE_MCP_SSE_READ_TIMEOUT=300
 # Graph to query (used in the scaffolding SPARQL templates).
 RESOLUTION_GRAPH_IRI=http://world.eu.org/atlas_data#
 
+# Ollama embedding configuration for candidate ranking.
+OLLAMA_BASE_URL=http://192.168.0.200:11434
+OLLAMA_EMBEDDING_MODEL=nomic-embed-text

+ 95 - 0
COARSE_TYPES.txt

@@ -0,0 +1,95 @@
+Atlas Coarse Types for LLM Extraction
+======================================
+
+Use these 12 types when prompting a cheap/small LLM for entity type suggestion.
+The suggested type is a hint to the entity resolver for candidate ranking — not
+a final classification. Pass 2 (Wikidata QID lookup) promotes to the fine-grained
+subtype from the full ontology.
+
+
+COARSE TYPES
+------------
+
+Person
+Organization
+Location
+CreativeWork
+Event
+Product
+FinancialInstrument
+Animal
+Disease
+Building
+FictionalCharacter
+Other
+
+
+PASS 2 PROMOTION MAP
+--------------------
+
+Person              -> Person
+
+Organization        -> Organization
+                       PoliticalParty
+                       MilitaryUnit
+                       MediaOrganization
+
+Location            -> Location
+                       Continent
+                       Country
+                       Region
+                       PopulatedPlace
+                       Neighbourhood
+                       NaturalFeature
+                       AdministrativeArea
+
+CreativeWork        -> CreativeWork
+                       Film
+                       Book
+                       MusicAlbum
+                       TVSeries
+                       VideoGame
+
+Event               -> Event
+
+Product             -> Product
+                       Drug
+                       Food
+
+FinancialInstrument -> FinancialInstrument
+                       PublicCompany
+                       StockIndex
+                       Commodity
+                       Cryptocurrency
+                       Currency
+
+Animal              -> Animal
+
+Disease             -> Disease
+
+Building            -> Building
+
+FictionalCharacter  -> FictionalCharacter
+
+Other               -> Other
+                       Award
+                       Sport
+                       EthnicGroup
+                       Concept
+
+
+NOTES
+-----
+
+- Animal and Disease are kept separate because confusing them with Product
+  or Concept causes hard resolution failures.
+
+- Building is kept separate because landmarks (Eiffel Tower, White House)
+  resolve very differently from cities or countries.
+
+- FictionalCharacter is kept separate because confusing a fictional entity
+  with a real person is a hard failure, not a soft one.
+
+- Award, Sport, EthnicGroup and Concept fall into Other at the coarse level.
+  A small model will mis-classify these anyway; the QID lookup in pass 2
+  recovers the correct fine-grained type reliably.

+ 13 - 1
README.md

@@ -8,13 +8,25 @@ Python FastMCP server for the *atlas2* resolution flow.
   - store lookup (label/alias)
   - Wikidata fallback using `wikidata.reconci.link` quick-resolve (single-candidate)
   - minimal persist to Virtuoso via MCP
-  - cache hits return the stored result
+  - cache hits return the stored result when confidence is sufficient
+- Resolve supports strategy modes:
+  - `quick`
+  - `ranked`
+  - `interactive`
+  - `hybrid`
+  - `llm_select`
+- Ranking can use embeddings via Ollama when `strategy.use_embeddings=true`
+- `confidence` controls cache reuse and re-resolution, not just the resolved/not-found status
 - Store lookup was debugged and made robust by splitting label-first then alias.
 - Maintenance scaffolding (dry-run CLI) exists to upgrade `atlas:needsCuration true` entities using:
   - `ontology/wikidata_subclassof.ttl`
   - Wikidata entity dumps
   - Atlas type bucket inference (Person/Organization/Location/etc.)
 
+## Resolver tests
+- `./test_resolve.sh` runs resolver-focused tests only
+- It prints the subjects under test and a per-test timing table
+
 ## How to run
 
 1) Create config:

+ 13 - 0
TODO.md

@@ -0,0 +1,13 @@
+# atlas2-mcp TODO
+
+## Next
+- Implement the maintenance script as the next step:
+  - select entities with `atlas:needsCuration true`
+  - fetch Wikidata details
+  - enrich type-specific fields
+  - write back updates when ready
+
+## Later
+- Expand maintenance to handle more advanced realm/constraint-driven behavior.
+- Tighten/extend type buckets if new examples show over-classification.
+

+ 16 - 2
app/atlas_store.py

@@ -87,6 +87,13 @@ def _escape(s: str) -> str:
     return s.replace("\\", "\\\\").replace('"', '\\"').replace("\n", "\\n")
 
 
+def _parse_boolean_literal(value: str | None, default: bool = True) -> bool:
+    if value is None:
+        return default
+    v = str(value).strip().lower()
+    return v in {"1", "true", "yes", "y", "t"}
+
+
 async def _sparql_update(endpoint: str, query: str) -> None:
     if "/mcp/sse" not in endpoint:
         raise RuntimeError("atlas_store only supports Virtuoso MCP/SSE endpoints in this scaffold")
@@ -150,13 +157,15 @@ async def load_entity_by_subject(subject: str, endpoint: str, graph_iri: str = D
 
     label_query = f"""
 {PREFIXES}
-SELECT ?atlasId ?label ?type ?qid WHERE {{
+SELECT ?atlasId ?label ?desc ?type ?qid ?needsCuration WHERE {{
   VALUES ?needle {{ "{needle}" }}
   GRAPH <{graph_iri}> {{
     ?entity a atlas:Entity ;
             atlas:atlasId ?atlasId ;
             atlas:canonicalLabel ?label .
+    OPTIONAL {{ ?entity atlas:canonicalDescription ?desc . }}
     OPTIONAL {{ ?entity atlas:hasCanonicalType ?type . }}
+    OPTIONAL {{ ?entity atlas:needsCuration ?needsCuration . }}
     OPTIONAL {{ ?entity atlas:hasIdentifier ?ident . ?ident atlas:scheme "wikidata-qid" ; atlas:value ?qid . }}
     FILTER(LCASE(STR(?label)) = LCASE(STR(?needle)))
   }}
@@ -166,14 +175,16 @@ LIMIT 1
 
     alias_query = f"""
 {PREFIXES}
-SELECT ?atlasId ?label ?type ?qid ?alias WHERE {{
+SELECT ?atlasId ?label ?desc ?type ?qid ?alias ?needsCuration WHERE {{
   VALUES ?needle {{ "{needle}" }}
   GRAPH <{graph_iri}> {{
     ?entity a atlas:Entity ;
             atlas:atlasId ?atlasId ;
             atlas:aliasLabel ?alias .
     OPTIONAL {{ ?entity atlas:canonicalLabel ?label . }}
+    OPTIONAL {{ ?entity atlas:canonicalDescription ?desc . }}
     OPTIONAL {{ ?entity atlas:hasCanonicalType ?type . }}
+    OPTIONAL {{ ?entity atlas:needsCuration ?needsCuration . }}
     OPTIONAL {{ ?entity atlas:hasIdentifier ?ident . ?ident atlas:scheme "wikidata-qid" ; atlas:value ?qid . }}
     FILTER(LCASE(STR(?alias)) = LCASE(STR(?needle)))
   }}
@@ -202,9 +213,12 @@ LIMIT 1
     return {
         "atlas_id": row.get("atlasId", {}).get("value"),
         "label": row.get("label", {}).get("value"),
+        "description": (row.get("desc", {}) or {}).get("value"),
         "type": type_value,
         "wikidata_id": row.get("qid", {}).get("value"),
         "alias": row.get("alias", {}).get("value"),
+        # If the triple is missing, treat it as needsCuration=true for this early-stage workflow.
+        "needs_curation": _parse_boolean_literal(row.get("needsCuration", {}).get("value"), default=True),
     }
 
 

+ 8 - 2
app/maintenance.py

@@ -71,6 +71,8 @@ def _infer_atlas_type_from_qids(qids: Iterable[str], subclass_graph: rdflib.Grap
         lower = obj_str.lower()
         if "person" in lower or "politician" in lower:
             return "atlas:Person"
+        if "human" in lower or "bio" in lower or "biography" in lower:
+            return "atlas:Person"
         if "organisation" in lower or "organization" in lower or "governmentagency" in lower or "agency" in lower:
             return "atlas:Organization"
         if any(k in lower for k in [
@@ -98,10 +100,14 @@ def _infer_atlas_type_from_qids(qids: Iterable[str], subclass_graph: rdflib.Grap
         return None
 
     for q in qids:
-        start = rdflib.URIRef(f"http://wikidata.dbpedia.org/resource/{q}")
+        # Support both namespace styles used in tests and data sources.
+        start_nodes = [
+            rdflib.URIRef(f"http://wikidata.dbpedia.org/resource/{q}"),
+            rdflib.URIRef(f"http://www.wikidata.org/entity/{q}"),
+        ]
 
         # Walk the rdfs:subClassOf closure to find something that matches our buckets.
-        queue = [start]
+        queue = list(start_nodes)
         visited: set[rdflib.term.Node] = set()
 
         while queue:

+ 2 - 0
app/mcp_server.py

@@ -26,6 +26,7 @@ async def resolve_tool(
     constraints: dict | None = None,
     hints: dict | None = None,
     debug: dict | None = None,
+    strategy: dict | None = None,
 ):
     # Service pulls configuration exclusively from the project's .env.
     svc = ResolveService()
@@ -35,5 +36,6 @@ async def resolve_tool(
         constraints=constraints,
         hints=hints,
         debug=debug,
+        strategy=strategy,
     )
 

+ 323 - 24
app/resolve.py

@@ -5,6 +5,10 @@ import os
 import logging
 from dataclasses import dataclass
 from typing import Any
+import time
+import uuid
+import datetime
+import math
 
 from .atlas_model import Entity, Identifier
 from .atlas_store import load_entity_by_subject, save_entity_minimal
@@ -27,11 +31,28 @@ def _entity_iri(atlas_id: str) -> str:
     return f"atlas_data:entity_{atlas_id}"
 
 
-async def _wikidata_lookup(subject: str) -> dict[str, Any] | None:
-    search = WikidataSearch({"search": subject, "limit": 1})
-    result = await search.quick_resolve(subject, limit=1)
-    items = result.get("results", [])
-    return items[0] if items else None
async def _wikidata_lookup(subject: str, language: str = "en", limit: int = 1) -> list[dict[str, Any]]:
    """Run a Wikidata quick-resolve search and return the candidate list.

    Always returns a list (possibly empty), never None, even when the
    search response omits or nulls out the "results" key.
    """
    options = {"search": subject, "limit": limit, "language": language}
    response = await WikidataSearch(options).quick_resolve(subject, limit=limit)
    candidates = response.get("results", [])
    return candidates if candidates else []
+
+
+def _candidate_text(subject: str, wd: dict[str, Any], hints: dict[str, Any] | None = None) -> str:
+    hints = hints or {}
+    aliases = hints.get("aliases") or []
+    parts = [subject, wd.get("label") or "", wd.get("description") or "", " ".join(str(a) for a in aliases)]
+    return " | ".join(part for part in parts if part)
+
+
+def _cosine_similarity(a: list[float] | None, b: list[float] | None) -> float:
+    if not a or not b or len(a) != len(b):
+        return 0.0
+    dot = sum(x * y for x, y in zip(a, b))
+    norm_a = math.sqrt(sum(x * x for x in a))
+    norm_b = math.sqrt(sum(y * y for y in b))
+    if not norm_a or not norm_b:
+        return 0.0
+    return dot / (norm_a * norm_b)
 
 
 def _infer_atlas_type(label: str | None, description: str | None) -> str:
@@ -45,6 +66,67 @@ def _infer_atlas_type(label: str | None, description: str | None) -> str:
     return "atlas:Other"
 
 
def _score_wikidata_candidate(
    subject: str,
    wd: dict[str, Any],
    *,
    context: dict[str, Any] | None = None,
    hints: dict[str, Any] | None = None,
    use_embeddings: bool = False,
    subject_embedding: list[float] | None = None,
    candidate_embedding: list[float] | None = None,
) -> tuple[float, dict[str, float]]:
    """Score one Wikidata candidate against the subject string.

    Returns ``(score, breakdown)`` where *breakdown* maps each contributing
    signal to the weight it added.  The total is capped at 0.99 so that a
    purely heuristic match is never reported as fully certain.
    """
    ctx = context or {}
    hint_map = hints or {}
    breakdown: dict[str, float] = {}

    subject_norm = subject.strip().lower()
    label = (wd.get("label") or "").strip()
    description = (wd.get("description") or "").strip()
    label_norm = label.lower()
    description_norm = description.lower()

    # Label agreement is the dominant signal; exact beats substring.
    if label_norm == subject_norm:
        breakdown["exact_label"] = 0.75
    elif subject_norm and subject_norm in label_norm:
        breakdown["partial_label"] = 0.45

    # Single bonus when any non-empty alias hint equals the candidate label.
    normalized_aliases = (str(alias).strip().lower() for alias in hint_map.get("aliases") or [])
    if any(alias and alias == label_norm for alias in normalized_aliases):
        breakdown["alias_match"] = 0.15

    # Small nudge when the caller's expected coarse type matches our inference.
    expected_type = (hint_map.get("expected_type") or "").strip().lower()
    if expected_type and expected_type in _infer_atlas_type(label, description).lower():
        breakdown["expected_type"] = 0.1

    # Context realm appearing in the description is weak corroboration.
    realm = (ctx.get("realm") or "").strip().lower()
    if realm and realm in description_norm:
        breakdown["realm"] = 0.1

    if wd.get("id"):
        breakdown["has_qid"] = 0.05

    if use_embeddings:
        similarity = _cosine_similarity(subject_embedding, candidate_embedding)
        if similarity > 0:
            # Embedding similarity contributes at most 0.25.
            breakdown["embedding_similarity"] = min(0.25, similarity * 0.25)

    return min(sum(breakdown.values()), 0.99), breakdown
+
+
 def _entity_from_wikidata(subject: str, wd: dict[str, Any]) -> Entity:
     atlas_id = _hash_id(subject)
     label = wd.get("label") or subject
@@ -81,6 +163,61 @@ async def _load_entity(subject: str) -> dict[str, Any] | None:
     return await load_entity_by_subject(subject, DEFAULT_ENDPOINT)
 
 
+def _required_confidence(mode: str, constraints: dict[str, Any]) -> float:
+    requested = constraints.get("min_confidence")
+    if requested is not None:
+        return float(requested)
+    if mode == "quick":
+        return 0.55
+    if mode in {"ranked", "hybrid", "llm_select"}:
+        return 0.85
+    if mode == "interactive":
+        return 0.0
+    return 0.5
+
+
+def _is_ambiguous_subject(subject: str, wd_candidates: list[dict[str, Any]]) -> bool:
+    if len(wd_candidates) < 2:
+        return False
+    subject_norm = subject.strip().lower()
+    labels = [(cand.get("label") or "").strip().lower() for cand in wd_candidates]
+    exact_matches = sum(1 for label in labels if label == subject_norm)
+    return exact_matches >= 2 or (exact_matches == 1 and any(label == subject_norm for label in labels[1:]))
+
+
def _cache_can_satisfy(stored: dict[str, Any], mode: str, constraints: dict[str, Any]) -> bool:
    """Whether a cached entity's confidence meets the bar for this request."""
    cached_confidence = float(stored.get("confidence") or 0.0)
    return cached_confidence >= _required_confidence(mode, constraints)
+
+
+def _debug_decision(
+    *,
+    mode: str,
+    top_confidence: float,
+    auto_accept_threshold: float,
+    interactive_below_threshold: bool,
+    required_confidence: float,
+    used_cache: bool,
+    cache_confidence: float | None = None,
+) -> dict[str, Any]:
+    return {
+        "mode": mode,
+        "top_confidence": top_confidence,
+        "auto_accept_threshold": auto_accept_threshold,
+        "interactive_below_threshold": interactive_below_threshold,
+        "required_confidence": required_confidence,
+        "used_cache": used_cache,
+        "cache_confidence": cache_confidence,
+        "decision": (
+            "cache_hit"
+            if used_cache
+            else "resolved"
+            if top_confidence >= auto_accept_threshold
+            else "ambiguous_below_threshold"
+        ),
+    }
+
+
 @dataclass
 class ResolveService:
     load_entity_fn: Any = _load_entity
@@ -90,11 +227,36 @@ class ResolveService:
     async def resolve(self, *, subject: str, context: dict[str, Any] | None = None,
                       constraints: dict[str, Any] | None = None,
                       hints: dict[str, Any] | None = None,
-                      debug: dict[str, Any] | None = None) -> dict[str, Any]:
+                      debug: dict[str, Any] | None = None,
+                      strategy: dict[str, Any] | None = None) -> dict[str, Any]:
+        context = context or {}
+        constraints = constraints or {}
+        hints = hints or {}
+        debug = debug or {}
+        strategy = strategy or {}
+        language = (context.get("language") or "en").strip() or "en"
+        mode = (strategy.get("mode") or "quick").strip().lower() or "quick"
+        use_embeddings = bool(strategy.get("use_embeddings", False))
+        max_candidates = int(constraints.get("max_candidates") or 5)
+        auto_accept_threshold = float(strategy.get("auto_accept_threshold") or 0.85)
+        interactive_below_threshold = bool(strategy.get("interactive_below_threshold", True))
+        required_confidence = _required_confidence(mode, constraints)
         try:
+            request_id = str(uuid.uuid4())
+            ts = datetime.datetime.now(datetime.timezone.utc).isoformat()
+            start = time.time()
             subject = (subject or "").strip()
             if not subject:
-                return {"status": "not_found"}
+                return {
+                    "status": "not_found",
+                    "entity": None,
+                    "confidence": 0.0,
+                    "candidates": [],
+                    "ambiguity": None,
+                    "resolution_path": [],
+                    "meta": {"request_id": request_id, "timestamp": ts, "duration_ms": 0},
+                    "error": None,
+                }
 
             if DEBUG_LOGS:
                 logger.info("resolve start subject=%s", subject)
@@ -103,22 +265,97 @@ class ResolveService:
             if stored:
                 if DEBUG_LOGS:
                     logger.info("store hit subject=%s atlas_id=%s", subject, stored.get("atlas_id"))
+                stored_confidence = float(stored.get("confidence") or (0.9 if not stored.get("needs_curation", False) else 0.6))
+                if _cache_can_satisfy(stored, mode, constraints):
+                    return {
+                        "status": "resolved",
+                        "entity": {
+                            "id": stored.get("atlas_id"),
+                            "label": stored.get("label"),
+                            "type": stored.get("type"),
+                            "description": stored.get("description"),
+                            "source": None,
+                            "uri": None,
+                            "attributes": {},
+                        },
+                        "confidence": stored_confidence,
+                        "candidates": [],
+                        "ambiguity": None,
+                        "resolution_path": [
+                            {"phase": "cache", "action": "store_hit", "source": "triple_store"}
+                        ],
+                        "meta": {
+                            "request_id": request_id,
+                            "timestamp": ts,
+                            "duration_ms": int((time.time() - start) * 1000),
+                            **({"debug": _debug_decision(mode=mode, top_confidence=stored_confidence, auto_accept_threshold=auto_accept_threshold, interactive_below_threshold=interactive_below_threshold, required_confidence=required_confidence, used_cache=True, cache_confidence=stored_confidence)} if debug.get("include_explanations") else {}),
+                        },
+                        "error": None,
+                    }
+
+                if DEBUG_LOGS:
+                    logger.info("cache confidence too low subject=%s mode=%s confidence=%.3f required=%.3f", subject, mode, stored_confidence, required_confidence)
+
+            wd_candidates = await self.wikidata_lookup_fn(
+                subject,
+                language,
+                1 if mode == "quick" else max(1, min(max_candidates, 10)),
+            )
+            if not wd_candidates:
+                if DEBUG_LOGS:
+                    logger.info("wikidata miss subject=%s mode=%s", subject, mode)
                 return {
-                    "status": "resolved",
-                    "atlas_id": stored.get("atlas_id"),
-                    "label": stored.get("label"),
-                    "type": stored.get("type"),
-                    "wikidata_id": stored.get("wikidata_id"),
-                    "alias": stored.get("alias") or subject,
+                    "status": "not_found",
+                    "entity": {
+                        "id": None,
+                        "label": None,
+                        "type": None,
+                        "description": None,
+                        "source": None,
+                        "uri": None,
+                        "attributes": {},
+                    },
+                    "confidence": 0.0,
+                    "candidates": [],
+                    "ambiguity": None,
+                    "resolution_path": [
+                        {"phase": "query", "action": "wikidata_quick_resolve", "source": "remote"}
+                    ],
+                    "meta": {
+                        "request_id": request_id,
+                        "timestamp": ts,
+                        "duration_ms": int((time.time() - start) * 1000),
+                        **({"debug": _debug_decision(mode=mode, top_confidence=0.0, auto_accept_threshold=auto_accept_threshold, interactive_below_threshold=interactive_below_threshold, required_confidence=required_confidence, used_cache=False)} if debug.get("include_explanations") else {}),
+                    },
+                    "error": None,
                 }
 
-            wd = await self.wikidata_lookup_fn(subject)
-            if not wd:
-                if DEBUG_LOGS:
-                    logger.info("wikidata miss subject=%s", subject)
-                return {"status": "not_found"}
+            ranked_candidates = []
+            subject_embedding = None
+            embedder = None
+            if use_embeddings:
+                embedder = WikidataSearch()
+                subject_embedding = await embedder.embed_text(_candidate_text(subject, {"label": subject, "description": "", "aliases": []}, hints))
+            for wd in wd_candidates:
+                candidate_embedding = None
+                if use_embeddings and embedder is not None:
+                    candidate_embedding = await embedder.embed_text(_candidate_text(subject, wd, hints))
+                confidence, breakdown = _score_wikidata_candidate(
+                    subject,
+                    wd,
+                    context=context,
+                    hints=hints,
+                    use_embeddings=use_embeddings,
+                    subject_embedding=subject_embedding,
+                    candidate_embedding=candidate_embedding,
+                )
+                ranked_candidates.append({**wd, "confidence": confidence, "score_breakdown": breakdown})
+            ranked_candidates.sort(key=lambda item: ((item.get("confidence") or 0.0), item.get("label") or ""), reverse=True)
 
+            wd = ranked_candidates[0]
             entity = _entity_from_wikidata(subject, wd)
+            if mode == "quick":
+                wd["confidence"] = min(wd.get("confidence", 0.0), 0.6)
             if DEBUG_LOGS:
                 logger.info(
                     "wikidata hit subject=%s qid=%s atlas_id=%s type=%s",
@@ -129,17 +366,79 @@ class ResolveService:
                 )
             await self.persist_entity_fn(entity)
 
+            resolution_path = [
+                {"phase": "query", "action": "wikidata_quick_resolve", "source": "remote"},
+                {"phase": "ranking", "action": f"mode_{mode}", "source": "resolver"},
+            ]
+            if use_embeddings:
+                resolution_path.append(
+                    {
+                        "phase": "ranking",
+                        "action": "embedding_similarity",
+                        "source": "ollama",
+                        "note": "embedding similarity used to score candidate order",
+                    }
+                )
+
+            status = "ambiguous"
+            ambiguity = {"reason": "pre-maintenance", "dimension": 0.5}
+            if mode == "quick":
+                status = "ambiguous"
+            elif (wd.get("confidence") or 0.0) >= auto_accept_threshold:
+                status = "resolved"
+                ambiguity = None
+            elif interactive_below_threshold:
+                status = "ambiguous"
+
             return {
-                "status": "resolved",
-                "atlas_id": entity.id,
-                "label": entity.label,
-                "type": entity.type,
-                "wikidata_id": wd.get("id"),
-                "alias": subject,
+                "status": status,
+                "entity": {
+                    "id": entity.id,
+                    "label": entity.label,
+                    "type": entity.type,
+                    "description": entity.description,
+                    "source": "wikidata",
+                    "uri": None,
+                    "attributes": {
+                        "wikidata_id": wd.get("id"),
+                        "alias": subject,
+                    },
+                },
+                "confidence": wd.get("confidence", 0.6),
+                "candidates": [
+                    {
+                        "id": cand.get("id"),
+                        "label": cand.get("label"),
+                        "type": cand.get("type"),
+                        "source": "wikidata",
+                        "confidence": cand.get("confidence", 0.0),
+                        "score_breakdown": cand.get("score_breakdown", {}) if debug.get("include_explanations") else {},
+                    }
+                    for cand in ranked_candidates
+                ] if mode in {"ranked", "interactive", "hybrid", "llm_select"} else [],
+                "ambiguity": ambiguity,
+                "resolution_path": resolution_path + [{"phase": "persistence", "action": "store_save_minimal", "source": "triple_store"}],
+                "meta": {
+                    "request_id": request_id,
+                    "timestamp": ts,
+                    "duration_ms": int((time.time() - start) * 1000),
+                    **({"debug": _debug_decision(mode=mode, top_confidence=wd.get("confidence", 0.0), auto_accept_threshold=auto_accept_threshold, interactive_below_threshold=interactive_below_threshold, required_confidence=required_confidence, used_cache=False)} if debug.get("include_explanations") else {}),
+                },
+                "error": None,
             }
         except Exception as exc:
             detail = " | ".join(_flatten_exception_details(exc))
             return {
                 "status": "error",
+                "entity": None,
+                "confidence": 0.0,
+                "candidates": [],
+                "ambiguity": None,
+                "resolution_path": [],
+                "meta": {
+                    "request_id": str(uuid.uuid4()),
+                    "timestamp": datetime.datetime.now(datetime.timezone.utc).isoformat(),
+                    "duration_ms": 0,
+                },
                 "error": {"code": "RESOLVE_FAILED", "message": detail},
             }

+ 48 - 16
app/wikidata.py

@@ -16,11 +16,15 @@ WIKIDATA_USER_AGENT = os.getenv(
     "Atlas/1.0 (contact: lukas.goldschmidt+atlas@googlemail.com)",
 )
 
+# The Wikidata reconciliation endpoint has moved more than once, so keep it configurable.
 WIKIDATA_QUICK_RESOLVE_BASE_URL = os.getenv(
     "ATLAS_WIKIDATA_QUICK_RESOLVE_URL",
     "https://wikidata.reconci.link/en/api",
 )
 
+OLLAMA_BASE_URL = os.getenv("OLLAMA_BASE_URL", "http://192.168.0.200:11434")
+OLLAMA_EMBEDDING_MODEL = os.getenv("OLLAMA_EMBEDDING_MODEL", "nomic-embed-text")
+
 
 @dataclass
 class WikidataOptions:
@@ -44,6 +48,21 @@ def _build_url(opts: WikidataOptions, params: dict[str, Any]) -> str:
     return f"https://{opts.apiHost}{opts.apiPath}?{query}"
 
 
def _client_kwargs() -> dict[str, Any]:
    """Shared httpx.AsyncClient settings for all Wikidata HTTP calls."""
    headers = {
        "Accept": "application/json",
        "User-Agent": WIKIDATA_USER_AGENT,
    }
    return {
        "timeout": 20,
        "headers": headers,
        "follow_redirects": True,
    }
+
+
def _ollama_client_kwargs() -> dict[str, Any]:
    """httpx.AsyncClient settings for talking to the configured Ollama server."""
    return dict(timeout=20, base_url=OLLAMA_BASE_URL)
+
+
 class WikidataSearch:
     def __init__(self, options: dict[str, Any] | None = None, *, client: httpx.AsyncClient | None = None):
         self.defaultOptions = WikidataOptions()
@@ -64,6 +83,22 @@ class WikidataSearch:
     def clearPropertyCache(self) -> None:
         PROPERTY_CACHE.clear()
 
+    async def embed_text(self, text: str) -> list[float] | None:
+        client = self._client or httpx.AsyncClient(**_ollama_client_kwargs())
+        close_client = self._client is None
+        try:
+            resp = await client.post(
+                "/api/embeddings",
+                json={"model": OLLAMA_EMBEDDING_MODEL, "prompt": text},
+            )
+            resp.raise_for_status()
+            data = resp.json()
+            embedding = data.get("embedding")
+            return embedding if isinstance(embedding, list) else None
+        finally:
+            if close_client:
+                await client.aclose()
+
     async def search(self) -> dict[str, Any]:
         if not self.validateOptions():
             return {"results": [], "error": "Bad options"}
@@ -78,10 +113,7 @@ class WikidataSearch:
         }
         url = _build_url(self.options, params)
 
-        client = self._client or httpx.AsyncClient(
-            timeout=20,
-            headers={"Accept": "application/json", "User-Agent": WIKIDATA_USER_AGENT},
-        )
+        client = self._client or httpx.AsyncClient(**_client_kwargs())
         close_client = self._client is None
         try:
             resp = await client.get(url)
@@ -115,10 +147,7 @@ class WikidataSearch:
         params = {
             "queries": json.dumps({"q0": {"query": query, "limit": limit}}),
         }
-        client = self._client or httpx.AsyncClient(
-            timeout=20,
-            headers={"Accept": "application/json", "User-Agent": WIKIDATA_USER_AGENT},
-        )
+        client = self._client or httpx.AsyncClient(**_client_kwargs())
         close_client = self._client is None
         try:
             resp = await client.get(endpoint, params=params)
@@ -144,6 +173,15 @@ class WikidataSearch:
 
         return {"results": results}
 
+    async def candidate_embeddings(self, candidates: list[dict[str, Any]]) -> list[dict[str, Any]]:
+        out = []
+        for cand in candidates:
+            text_parts = [cand.get("label") or "", cand.get("description") or "", " ".join(cand.get("aliases") or [])]
+            text = " | ".join(part for part in text_parts if part)
+            embedding = await self.embed_text(text)
+            out.append({**cand, "embedding": embedding})
+        return out
+
     def search_sync(self) -> dict[str, Any]:
         return asyncio.run(self.search())
 
@@ -166,10 +204,7 @@ class WikidataSearch:
         }
         url = _build_url(self.options, params)
 
-        client = self._client or httpx.AsyncClient(
-            timeout=20,
-            headers={"Accept": "application/json", "User-Agent": WIKIDATA_USER_AGENT},
-        )
+        client = self._client or httpx.AsyncClient(**_client_kwargs())
         close_client = self._client is None
         try:
             resp = await client.get(url)
@@ -267,10 +302,7 @@ class WikidataSearch:
             PROPERTY_CACHE.setdefault(prop_id, prop_id)
 
     async def get_entity_data(self, qid: str) -> dict[str, Any]:
-        client = self._client or httpx.AsyncClient(
-            timeout=20,
-            headers={"Accept": "application/json", "User-Agent": WIKIDATA_USER_AGENT},
-        )
+        client = self._client or httpx.AsyncClient(**_client_kwargs())
         close_client = self._client is None
         try:
             resp = await client.get(

+ 301 - 21
ontology/atlas.ttl

@@ -1,17 +1,49 @@
-@prefix atlas:  <http://world.eu.org/atlas_ontology#> .
-@prefix owl:    <http://www.w3.org/2002/07/owl#> .
-@prefix rdf:    <http://www.w3.org/1999/02/22-rdf-syntax-ns#> .
-@prefix rdfs:   <http://www.w3.org/2000/01/rdf-schema#> .
-@prefix xsd:    <http://www.w3.org/2001/XMLSchema#> .
-@prefix schema: <http://schema.org/> .
-@prefix wd:     <http://www.wikidata.org/entity/> .
-
-atlas:Ontology a owl:Ontology ;
-  rdfs:label   "Atlas Ontology" ;
-  rdfs:comment "Entity resolution ontology for Atlas." .
-
-
-### Classes
+@prefix atlas:   <http://world.eu.org/atlas_ontology#> .
+@prefix owl:     <http://www.w3.org/2002/07/owl#> .
+@prefix rdf:     <http://www.w3.org/1999/02/22-rdf-syntax-ns#> .
+@prefix rdfs:    <http://www.w3.org/2000/01/rdf-schema#> .
+@prefix xsd:     <http://www.w3.org/2001/XMLSchema#> .
+@prefix schema:  <http://schema.org/> .
+@prefix wd:      <http://www.wikidata.org/entity/> .
+@prefix dcterms: <http://purl.org/dc/terms/> .
+
+# =============================================================================
+# Atlas Ontology  v1.1.0
+#
+# Changelog
+#   1.0.0  Initial release — core classes, flat identifiers, alias, provenance,
+#          claim, curate flag, seven top-level entity types.
+#   1.1.0  Expanded type catalog (fully backward-compatible):
+#            - Location hierarchy: Continent, Country, Region, PopulatedPlace,
+#              Neighbourhood, NaturalFeature, AdministrativeArea
+#            - Organization subtypes: PoliticalParty, MilitaryUnit,
+#              MediaOrganization
+#            - CreativeWork subtypes: Film, Book, MusicAlbum, TVSeries,
+#              VideoGame
+#            - Product subtypes: Drug, Food
+#            - New top-level types: FinancialInstrument (with PublicCompany,
+#              StockIndex, Commodity, Cryptocurrency, Currency), Animal,
+#              Disease, Building, Award, Sport, FictionalCharacter,
+#              EthnicGroup, Concept
+#          Three new relationship properties:
+#            - atlas:locatedIn   (transitive)
+#            - atlas:bordersWith (symmetric)
+#            - atlas:memberOf
+# =============================================================================
+
+<http://world.eu.org/atlas_ontology>
+  a owl:Ontology ;
+  rdfs:label      "Atlas Ontology" ;
+  rdfs:comment    "Entity resolution ontology for Atlas." ;
+  owl:versionIRI  <http://world.eu.org/atlas_ontology/1.1.0> ;
+  owl:versionInfo "1.1.0" ;
+  dcterms:created  "2026-04-01"^^xsd:date ;
+  dcterms:modified "2026-04-06"^^xsd:date .
+
+
+# =============================================================================
+# INFRASTRUCTURE CLASSES  (1.0.0 — unchanged)
+# =============================================================================
 
 atlas:Entity a owl:Class ;
   rdfs:label   "Entity" ;
@@ -38,7 +70,9 @@ atlas:CurateFlag a owl:Class ;
   rdfs:comment "Signals that an entity needs human review." .
 
 
-### Object properties
+# =============================================================================
+# OBJECT PROPERTIES  (1.0.0 — unchanged, three new ones added in 1.1.0)
+# =============================================================================
 
 atlas:hasCanonicalType a owl:ObjectProperty ;
   rdfs:domain atlas:Entity ;
@@ -85,8 +119,30 @@ atlas:hasCurateFlag a owl:ObjectProperty ;
   rdfs:range  atlas:CurateFlag ;
   rdfs:label  "has curate flag" .
 
+# --- NEW in 1.1.0 ---
+
+atlas:locatedIn a owl:ObjectProperty, owl:TransitiveProperty ;
+  rdfs:domain atlas:Entity ;
+  rdfs:range  atlas:Entity ;
+  rdfs:label  "located in" ;
+  rdfs:comment "Spatial containment, transitive. Enables zoom-in/zoom-out traversal: PopulatedPlace locatedIn Region locatedIn Country locatedIn Continent." .
+
+atlas:bordersWith a owl:ObjectProperty, owl:SymmetricProperty ;
+  rdfs:domain atlas:Entity ;
+  rdfs:range  atlas:Entity ;
+  rdfs:label  "borders with" ;
+  rdfs:comment "Shared land or maritime border. Symmetric: if A bordersWith B then B bordersWith A." .
 
-### Datatype properties
+atlas:memberOf a owl:ObjectProperty ;
+  rdfs:domain atlas:Entity ;
+  rdfs:range  atlas:Entity ;
+  rdfs:label  "member of" ;
+  rdfs:comment "Membership or affiliation. Intended uses: Person to Organization, Person to EthnicGroup, Organization to Organization. Not for type classification — use atlas:hasCanonicalType for that." .
+
+
+# =============================================================================
+# DATATYPE PROPERTIES  (1.0.0 — unchanged)
+# =============================================================================
 
 atlas:atlasId a owl:DatatypeProperty ;
   rdfs:domain atlas:Entity ;
@@ -171,41 +227,265 @@ atlas:rawJson a owl:DatatypeProperty ;
   rdfs:domain atlas:Entity ;
   rdfs:range  xsd:string ;
   rdfs:label  "raw json" ;
-  rdfs:comment "Opaque JSON cache blob from any source. Source is recorded in the associated Provenance node." .
-
-
-### Canonical type catalog
+  rdfs:comment "Opaque JSON cache blob. Source is recorded inside the blob." .
+
+
+# =============================================================================
+# TYPE CATALOG
+#
+# LLM extraction note:
+#   For cheap / small models, pass only the seven top-level types (Person,
+#   Organization, Location, CreativeWork, Event, Product, Other plus the new
+#   top-level additions). Use a Wikidata QID lookup to promote to a subtype
+#   in a second pass — do not ask a small model to choose among 35 types.
+#
+# Virtuoso inference note:
+#   rdfs:subClassOf* traversal requires inference to be enabled:
+#   OPTION(INFERENCE 'atlas')
+#   A query for atlas:Location will then also match atlas:Country etc.
+# =============================================================================
+
+# -----------------------------------------------------------------------------
+# Person  (1.0.0)
+# -----------------------------------------------------------------------------
 
 atlas:Person a owl:Class ;
   rdfs:subClassOf atlas:EntityType ;
   rdfs:label "Person" ;
   owl:sameAs schema:Person, wd:Q5 .
 
+
+# -----------------------------------------------------------------------------
+# Organization  (1.0.0) + subtypes (1.1.0)
+# -----------------------------------------------------------------------------
+
 atlas:Organization a owl:Class ;
   rdfs:subClassOf atlas:EntityType ;
   rdfs:label "Organization" ;
   owl:sameAs schema:Organization, wd:Q43229 .
 
+atlas:PoliticalParty a owl:Class ;
+  rdfs:subClassOf atlas:Organization ;
+  rdfs:label "Political Party" ;
+  owl:sameAs wd:Q7278 .                    # 1.1.0
+
+atlas:MilitaryUnit a owl:Class ;
+  rdfs:subClassOf atlas:Organization ;
+  rdfs:label "Military Unit" ;
+  owl:sameAs wd:Q176799 .                  # 1.1.0
+
+atlas:MediaOrganization a owl:Class ;
+  rdfs:subClassOf atlas:Organization ;
+  rdfs:label "Media Organization" ;
+  owl:sameAs wd:Q4830453 .                 # 1.1.0
+
+
+# -----------------------------------------------------------------------------
+# Location  (1.0.0) + hierarchy (1.1.0)
+# Relate instances with atlas:locatedIn and atlas:bordersWith.
+# -----------------------------------------------------------------------------
+
 atlas:Location a owl:Class ;
   rdfs:subClassOf atlas:EntityType ;
-  rdfs:label "Location" ;
+  rdfs:label   "Location" ;
+  rdfs:comment "Abstract parent. Use a subtype where possible." ;
   owl:sameAs schema:Place, wd:Q17334923 .
 
+atlas:Continent a owl:Class ;
+  rdfs:subClassOf atlas:Location ;
+  rdfs:label "Continent" ;
+  owl:sameAs wd:Q5107 .                    # 1.1.0
+
+atlas:Country a owl:Class ;
+  rdfs:subClassOf atlas:Location ;
+  rdfs:label "Country" ;
+  owl:sameAs schema:Country, wd:Q6256 .   # 1.1.0
+
+atlas:Region a owl:Class ;
+  rdfs:subClassOf atlas:Location ;
+  rdfs:label   "Region" ;
+  rdfs:comment "State, province, county or similar administrative subdivision." ;
+  owl:sameAs wd:Q82794 .                   # 1.1.0
+
+atlas:PopulatedPlace a owl:Class ;
+  rdfs:subClassOf atlas:Location ;
+  rdfs:label   "Populated Place" ;
+  rdfs:comment "City, town or village." ;
+  owl:sameAs wd:Q515 .                     # 1.1.0
+
+atlas:Neighbourhood a owl:Class ;
+  rdfs:subClassOf atlas:Location ;
+  rdfs:label   "Neighbourhood" ;
+  rdfs:comment "Borough, district, arrondissement or similar urban subdivision." ;
+  owl:sameAs wd:Q123705 .                  # 1.1.0
+
+atlas:NaturalFeature a owl:Class ;
+  rdfs:subClassOf atlas:Location ;
+  rdfs:label   "Natural Feature" ;
+  rdfs:comment "River, mountain, ocean, lake or other natural geographic feature." ;
+  owl:sameAs wd:Q35145263 .               # 1.1.0
+
+atlas:AdministrativeArea a owl:Class ;
+  rdfs:subClassOf atlas:Location ;
+  rdfs:label   "Administrative Area" ;
+  rdfs:comment "Fallback for political subdivisions that do not fit a more specific subtype." ;
+  owl:sameAs wd:Q56061 .                   # 1.1.0
+
+
+# -----------------------------------------------------------------------------
+# CreativeWork  (1.0.0) + subtypes (1.1.0)
+# -----------------------------------------------------------------------------
+
 atlas:CreativeWork a owl:Class ;
   rdfs:subClassOf atlas:EntityType ;
   rdfs:label "Creative Work" ;
   owl:sameAs schema:CreativeWork, wd:Q17537576 .
 
+atlas:Film a owl:Class ;
+  rdfs:subClassOf atlas:CreativeWork ;
+  rdfs:label "Film" ;
+  owl:sameAs schema:Movie, wd:Q11424 .     # 1.1.0
+
+atlas:Book a owl:Class ;
+  rdfs:subClassOf atlas:CreativeWork ;
+  rdfs:label "Book" ;
+  owl:sameAs schema:Book, wd:Q571 .        # 1.1.0
+
+atlas:MusicAlbum a owl:Class ;
+  rdfs:subClassOf atlas:CreativeWork ;
+  rdfs:label "Music Album" ;
+  owl:sameAs schema:MusicAlbum, wd:Q482994 . # 1.1.0
+
+atlas:TVSeries a owl:Class ;
+  rdfs:subClassOf atlas:CreativeWork ;
+  rdfs:label "TV Series" ;
+  owl:sameAs schema:TVSeries, wd:Q5398426 . # 1.1.0
+
+atlas:VideoGame a owl:Class ;
+  rdfs:subClassOf atlas:CreativeWork ;
+  rdfs:label "Video Game" ;
+  owl:sameAs schema:VideoGame, wd:Q7889 .  # 1.1.0
+
+
+# -----------------------------------------------------------------------------
+# Event  (1.0.0)
+# -----------------------------------------------------------------------------
+
 atlas:Event a owl:Class ;
   rdfs:subClassOf atlas:EntityType ;
   rdfs:label "Event" ;
   owl:sameAs schema:Event, wd:Q1656682 .
 
+
+# -----------------------------------------------------------------------------
+# Product  (1.0.0) + subtypes (1.1.0)
+# -----------------------------------------------------------------------------
+
 atlas:Product a owl:Class ;
   rdfs:subClassOf atlas:EntityType ;
   rdfs:label "Product" ;
   owl:sameAs schema:Product, wd:Q2424752 .
 
+atlas:Drug a owl:Class ;
+  rdfs:subClassOf atlas:Product ;
+  rdfs:label "Drug" ;
+  owl:sameAs wd:Q8386 .                    # 1.1.0
+
+atlas:Food a owl:Class ;
+  rdfs:subClassOf atlas:Product ;
+  rdfs:label "Food" ;
+  owl:sameAs wd:Q2095 .                    # 1.1.0
+
+
+# -----------------------------------------------------------------------------
+# FinancialInstrument  (1.1.0) — new top-level type
+# -----------------------------------------------------------------------------
+
+atlas:FinancialInstrument a owl:Class ;
+  rdfs:subClassOf atlas:EntityType ;
+  rdfs:label "Financial Instrument" ;
+  owl:sameAs wd:Q182780 .
+
+atlas:PublicCompany a owl:Class ;
+  rdfs:subClassOf atlas:FinancialInstrument ;
+  rdfs:label   "Public Company" ;
+  rdfs:comment "Company traded on a public exchange. Has a ticker and ISIN." ;
+  owl:sameAs wd:Q891723 .
+
+atlas:StockIndex a owl:Class ;
+  rdfs:subClassOf atlas:FinancialInstrument ;
+  rdfs:label   "Stock Index" ;
+  rdfs:comment "Market index such as S&P 500, DAX or Nikkei." ;
+  owl:sameAs wd:Q181600 .
+
+atlas:Commodity a owl:Class ;
+  rdfs:subClassOf atlas:FinancialInstrument ;
+  rdfs:label   "Commodity" ;
+  rdfs:comment "Physical good traded on an exchange: gold, oil, wheat, etc." ;
+  owl:sameAs wd:Q317088 .
+
+atlas:Cryptocurrency a owl:Class ;
+  rdfs:subClassOf atlas:FinancialInstrument ;
+  rdfs:label "Cryptocurrency" ;
+  owl:sameAs wd:Q13479982 .
+
+atlas:Currency a owl:Class ;
+  rdfs:subClassOf atlas:FinancialInstrument ;
+  rdfs:label   "Currency" ;
+  rdfs:comment "Fiat currency. Distinct from Cryptocurrency." ;
+  owl:sameAs schema:Currency, wd:Q8142 .
+
+
+# -----------------------------------------------------------------------------
+# New top-level types  (1.1.0)
+# -----------------------------------------------------------------------------
+
+atlas:Animal a owl:Class ;
+  rdfs:subClassOf atlas:EntityType ;
+  rdfs:label "Animal" ;
+  owl:sameAs wd:Q729 .
+
+atlas:Disease a owl:Class ;
+  rdfs:subClassOf atlas:EntityType ;
+  rdfs:label "Disease" ;
+  owl:sameAs schema:MedicalCondition, wd:Q12136 .
+
+atlas:Building a owl:Class ;
+  rdfs:subClassOf atlas:EntityType ;
+  rdfs:label "Building" ;
+  owl:sameAs wd:Q41176 .
+
+atlas:Award a owl:Class ;
+  rdfs:subClassOf atlas:EntityType ;
+  rdfs:label "Award" ;
+  owl:sameAs wd:Q618779 .
+
+atlas:Sport a owl:Class ;
+  rdfs:subClassOf atlas:EntityType ;
+  rdfs:label "Sport" ;
+  owl:sameAs wd:Q349 .
+
+atlas:FictionalCharacter a owl:Class ;
+  rdfs:subClassOf atlas:EntityType ;
+  rdfs:label "Fictional Character" ;
+  owl:sameAs wd:Q95074 .
+
+atlas:EthnicGroup a owl:Class ;
+  rdfs:subClassOf atlas:EntityType ;
+  rdfs:label "Ethnic Group" ;
+  owl:sameAs wd:Q41710 .
+
+atlas:Concept a owl:Class ;
+  rdfs:subClassOf atlas:EntityType ;
+  rdfs:label   "Concept" ;
+  rdfs:comment "Abstract idea that does not fit a more specific type." ;
+  owl:sameAs wd:Q151885 .
+
+
+# -----------------------------------------------------------------------------
+# Other  (1.0.0) — fallback, use when no type above fits
+# -----------------------------------------------------------------------------
+
 atlas:Other a owl:Class ;
   rdfs:subClassOf atlas:EntityType ;
   rdfs:label "Other" .

+ 25 - 0
ontology_suggestions.txt

@@ -0,0 +1,25 @@
+<http://wikidata.dbpedia.org/resource/Q1000415> <http://www.w3.org/2000/01/rdf-schema#subClassOf> <http://dbpedia.org/ontology/Event> .
+<http://wikidata.dbpedia.org/resource/Q1000501> <http://www.w3.org/2000/01/rdf-schema#subClassOf> <http://dbpedia.org/ontology/Software> .
+<http://wikidata.dbpedia.org/resource/Q1000726> <http://www.w3.org/2000/01/rdf-schema#subClassOf> <http://dbpedia.org/ontology/ChemicalCompound> .
+<http://wikidata.dbpedia.org/resource/Q1000867> <http://www.w3.org/2000/01/rdf-schema#subClassOf> <http://dbpedia.org/ontology/Politician> .
+<http://wikidata.dbpedia.org/resource/Q1000888> <http://www.w3.org/2000/01/rdf-schema#subClassOf> <http://dbpedia.org/ontology/Media> .
+<http://wikidata.dbpedia.org/resource/Q1001082> <http://www.w3.org/2000/01/rdf-schema#subClassOf> <http://dbpedia.org/ontology/Organisation> .
+<http://wikidata.dbpedia.org/resource/Q1001106> <http://www.w3.org/2000/01/rdf-schema#subClassOf> <http://dbpedia.org/ontology/Activity> .
+<http://wikidata.dbpedia.org/resource/Q1001329> <http://www.w3.org/2000/01/rdf-schema#subClassOf> <http://dbpedia.org/ontology/Building> .
+<http://wikidata.dbpedia.org/resource/Q1001378> <http://www.w3.org/2000/01/rdf-schema#subClassOf> <http://dbpedia.org/ontology/AcademicSubject> .
+<http://wikidata.dbpedia.org/resource/Q1002195> <http://www.w3.org/2000/01/rdf-schema#subClassOf> <http://dbpedia.org/ontology/Disease> .
+<http://wikidata.dbpedia.org/resource/Q1002228> <http://www.w3.org/2000/01/rdf-schema#subClassOf> <http://dbpedia.org/ontology/Profession> .
+<http://wikidata.dbpedia.org/resource/Q1002439> <http://www.w3.org/2000/01/rdf-schema#subClassOf> <http://dbpedia.org/ontology/Food> .
+<http://wikidata.dbpedia.org/resource/Q1003214> <http://www.w3.org/2000/01/rdf-schema#subClassOf> <http://dbpedia.org/ontology/Weapon> .
+<http://wikidata.dbpedia.org/resource/Q1003889> <http://www.w3.org/2000/01/rdf-schema#subClassOf> <http://dbpedia.org/ontology/Contest> .
+<http://wikidata.dbpedia.org/resource/Q1004875> <http://www.w3.org/2000/01/rdf-schema#subClassOf> <http://dbpedia.org/ontology/EthnicGroup> .
+<http://wikidata.dbpedia.org/resource/Q1020203> <http://www.w3.org/2000/01/rdf-schema#subClassOf> <http://dbpedia.org/ontology/Mineral> .
+<http://wikidata.dbpedia.org/resource/Q1022626> <http://www.w3.org/2000/01/rdf-schema#subClassOf> <http://dbpedia.org/ontology/Ship> .
+<http://wikidata.dbpedia.org/resource/Q102356> <http://www.w3.org/2000/01/rdf-schema#subClassOf> <http://dbpedia.org/ontology/MilitaryUnit> .
+<http://wikidata.dbpedia.org/resource/Q10291472> <http://www.w3.org/2000/01/rdf-schema#subClassOf> <http://dbpedia.org/ontology/Animal> .
+<http://wikidata.dbpedia.org/resource/Q1037810> <http://www.w3.org/2000/01/rdf-schema#subClassOf> <http://dbpedia.org/ontology/Drug> .
+<http://wikidata.dbpedia.org/resource/Q1050285> <http://www.w3.org/2000/01/rdf-schema#subClassOf> <http://dbpedia.org/ontology/FictionalCharacter> .
+<http://wikidata.dbpedia.org/resource/Q1050644> <http://www.w3.org/2000/01/rdf-schema#subClassOf> <http://dbpedia.org/ontology/Aircraft> .
+
+
+# TODO: add City / Country / Region subdivision suggestions

+ 16 - 1
resolve_scheme.md

@@ -10,10 +10,16 @@ The request is a JSON object with the following top‑level keys:
 |------|------|-------------|
 | **subject** | string | The entity to resolve. **Required** |
 | **context** | object | Optional context to narrow the search.  | 
-| | `realm` | string | e.g. *"music"*, *"geography"* |
+| | `realm` | string | Resolution realm, e.g. `internal`, `external`, `news`, `music`, `geography` |
 | | `provenance` | string | Source of the query (e.g. user, system) |
 | | `time` | string | ISO‑8601 timestamp |
 | | `language` | string | BCP‑47 language tag |
+| **strategy** | object | Controls how the resolver should behave. |
+| | `mode` | string | One of `quick`, `ranked`, `llm_select`, `interactive`, `hybrid` |
+| | `use_embeddings` | boolean | Use embedding similarity while ranking candidates |
+| | `auto_accept_threshold` | number (0-1) | Confidence threshold for auto-resolving; useful for `ranked`/`hybrid` |
+| | `interactive_below_threshold` | boolean | Return candidates instead of auto-picking when confidence is low |
+| | `use_llm_fallback` | boolean | Allow a cheap LLM pass when symbolic ranking is inconclusive |
 | **constraints** | object | Rules to apply while resolving. |
 | | `deterministic` | boolean | If true, the tool must always return the same result |
 | | `require_authority` | boolean | Require a trusted source |
@@ -58,4 +64,13 @@ The tool replies with a JSON object containing:
 }
 ```
 
+### Suggested mode semantics
+
+- `quick`: current fast path, take the top remote candidate.
+- `ranked`: fetch several candidates, score them with explicit heuristics, then choose or return ambiguity.
+- `llm_select`: fetch several candidates and let a cheap model choose.
+- `interactive`: always return candidate choices to the client.
+- `hybrid`: symbolic ranking first, then LLM fallback if needed.
+- `use_embeddings` (a flag, not a mode — combines with any mode above): when true, rank by lexical + embedding similarity.
+
 Feel free to use this file as the reference for any implementation of the resolve tool.

+ 37 - 0
scripts/run_resolve_harness.py

@@ -0,0 +1,37 @@
+from __future__ import annotations
+
+import json
+import subprocess
+from pathlib import Path
+
+ROOT = Path(__file__).resolve().parents[1]
+FIXTURES = ROOT / "tests" / "fixtures" / "resolve_harness_cases.json"
+
+
+def main() -> int:
+    cases = json.loads(FIXTURES.read_text())
+    print(f"Loaded {len(cases)} resolve harness cases")
+    print()
+    for case in cases:
+        print(f"=== {case['name']} ===")
+        cmd = [
+            "mcporter",
+            "--config",
+            "$CONFIG",
+            "call",
+            "atlas",
+            "resolve",
+            f"subject={json.dumps(case['subject'])}",
+            f"context={json.dumps(case['context'])}",
+            f"constraints={json.dumps(case['constraints'])}",
+            f"hints={json.dumps(case['hints'])}",
+            f"strategy={json.dumps(case['strategy'])}",
+            'debug={"include_candidates":true,"include_explanations":true}',
+        ]
+        print(" ".join(cmd))
+        print()
+    return 0
+
+
+if __name__ == "__main__":
+    raise SystemExit(main())

+ 53 - 0
test_resolve.sh

@@ -0,0 +1,53 @@
+#!/usr/bin/env bash
+set -euo pipefail
+
+cd "$(dirname "$0")"
+
+if [[ -x .venv/bin/pytest ]]; then
+  PYTEST=.venv/bin/pytest
+else
+  PYTEST=pytest
+fi
+
+python3 - <<'PY'
+import json
+from pathlib import Path
+cases = json.loads(Path('tests/fixtures/resolve_harness_cases.json').read_text())
+print('\nResolver test runner')
+print(f'  project : {Path.cwd()}')
+print(f'  cases   : {len(cases)}')
+print('\nSubjects under test:')
+for case in cases:
+    print(f"  - {case['name']}: {case['subject']} ({case['context'].get('language','en')})")
+print('\nWhat is tested:')
+print('  - cache hits resolve when confidence is sufficient')
+print('  - low-confidence cache triggers re-resolution in ranked mode')
+print('  - interactive mode returns all candidates below threshold')
+print('  - embedding scoring is recorded when enabled')
+print('\nRunning tests...\n')
+PY
+
+REPORT=$(mktemp)
+trap 'rm -f "$REPORT"' EXIT
+
+"$PYTEST" -q --junitxml="$REPORT" \
+  tests/test_resolve_tool.py \
+  tests/test_resolve_strategies.py \
+  "$@"
+
+python3 - "$REPORT" <<'PY'
+import sys
+import xml.etree.ElementTree as ET
+from pathlib import Path
+report = Path(sys.argv[1])
+root = ET.parse(report).getroot()
+rows = []
+for case in root.iter('testcase'):
+    rows.append((case.get('classname',''), case.get('name',''), float(case.get('time','0'))))
+rows.sort(key=lambda r: r[2], reverse=True)
+print('\nPer-test timings:')
+print(f"{'test':60} {'seconds':>8}")
+print('-' * 70)
+for cls, name, secs in rows:
+    print(f"{(cls + '::' + name):60} {secs:8.3f}")
+PY

+ 10 - 0
tests/fixtures/resolve_harness_cases.json

@@ -0,0 +1,10 @@
+[
+  {"name":"en_exact_country_quick","subject":"Australia","context":{"realm":"external","language":"en","provenance":"user"},"constraints":{"max_candidates":5,"min_confidence":0.55},"hints":{"expected_type":"location","aliases":[]},"strategy":{"mode":"quick","auto_accept_threshold":0.85,"interactive_below_threshold":true,"use_embeddings":false}},
+  {"name":"en_exact_country_ranked_embeddings","subject":"Australia","context":{"realm":"external","language":"en","provenance":"user"},"constraints":{"max_candidates":5,"min_confidence":0.85},"hints":{"expected_type":"location","aliases":["Commonwealth of Australia"]},"strategy":{"mode":"ranked","auto_accept_threshold":0.85,"interactive_below_threshold":true,"use_embeddings":true}},
+  {"name":"en_ambiguous_place_interactive","subject":"Georgia","context":{"realm":"external","language":"en","provenance":"user"},"constraints":{"max_candidates":5,"min_confidence":0.85},"hints":{"expected_type":"location","aliases":[]},"strategy":{"mode":"interactive","auto_accept_threshold":0.9,"interactive_below_threshold":true,"use_embeddings":true}},
+  {"name":"en_fictional_subject","subject":"Sherlock Holmes","context":{"realm":"external","language":"en","provenance":"user"},"constraints":{"max_candidates":5,"min_confidence":0.85},"hints":{"expected_type":"person","aliases":["Detective Holmes"]},"strategy":{"mode":"ranked","auto_accept_threshold":0.85,"interactive_below_threshold":true,"use_embeddings":true}},
+  {"name":"en_nonexistent_subject","subject":"Xyqvlorbania","context":{"realm":"external","language":"en","provenance":"user"},"constraints":{"max_candidates":5,"min_confidence":0.85},"hints":{"expected_type":"location","aliases":[]},"strategy":{"mode":"ranked","auto_accept_threshold":0.85,"interactive_below_threshold":true,"use_embeddings":false}},
+  {"name":"de_exact_country_ranked","subject":"Österreich","context":{"realm":"external","language":"de","provenance":"user"},"constraints":{"max_candidates":5,"min_confidence":0.85},"hints":{"expected_type":"location","aliases":["Republik Österreich"]},"strategy":{"mode":"ranked","auto_accept_threshold":0.85,"interactive_below_threshold":true,"use_embeddings":true}},
+  {"name":"de_city_quick","subject":"Wien","context":{"realm":"external","language":"de","provenance":"user"},"constraints":{"max_candidates":5,"min_confidence":0.55},"hints":{"expected_type":"location","aliases":["Vienna"]},"strategy":{"mode":"quick","auto_accept_threshold":0.85,"interactive_below_threshold":true,"use_embeddings":false}},
+  {"name":"de_ambiguous_person_interactive","subject":"Johann Strauss","context":{"realm":"external","language":"de","provenance":"user"},"constraints":{"max_candidates":5,"min_confidence":0.85},"hints":{"expected_type":"person","aliases":["Johann Strauss I","Johann Strauss II"]},"strategy":{"mode":"interactive","auto_accept_threshold":0.9,"interactive_below_threshold":true,"use_embeddings":true}}
+]

+ 6 - 0
tests/test_maintenance_helpers.py

@@ -4,6 +4,7 @@ from app.maintenance import (
     _extract_wikidata_qids_from_entity_dump,
     _infer_atlas_type_from_qids,
 )
+from app.atlas_store import _parse_boolean_literal
 
 
 def test_extract_wikidata_qids_from_dump_dedupes():
@@ -48,3 +49,8 @@ def test_infer_atlas_type_from_qids_heuristic_person():
     atlas_type = _infer_atlas_type_from_qids(["Q5"], g)
     assert atlas_type == "atlas:Person"
 
+
+def test_parse_boolean_literal_accepts_virtuoso_one():
+    assert _parse_boolean_literal("1") is True
+    assert _parse_boolean_literal("true") is True
+    assert _parse_boolean_literal("0") is False

+ 102 - 0
tests/test_resolve_strategies.py

@@ -0,0 +1,102 @@
+import pytest
+
+from app.resolve import ResolveService
+
+
+@pytest.mark.anyio
+async def test_cache_hit_is_resolved_when_confidence_satisfies_requested_mode():
+    async def load_entity(_subject):
+        return {
+            "atlas_id": "atlas-1",
+            "label": "Australia",
+            "type": "atlas:Location",
+            "description": "country in Oceania",
+            "needs_curation": True,
+            "confidence": 0.91,
+        }
+
+    async def fail_lookup(*_args, **_kwargs):
+        raise AssertionError("wikidata lookup should not run")
+
+    async def no_persist(_entity):
+        return None
+
+    svc = ResolveService(load_entity_fn=load_entity, wikidata_lookup_fn=fail_lookup, persist_entity_fn=no_persist)
+    result = await svc.resolve(
+        subject="Australia",
+        constraints={"min_confidence": 0.85},
+        strategy={"mode": "ranked"},
+        debug={"include_explanations": True},
+    )
+
+    assert result["status"] == "resolved"
+    assert result["confidence"] == 0.91
+    assert result["meta"]["debug"]["used_cache"] is True
+
+
+@pytest.mark.anyio
+async def test_low_confidence_cache_triggers_reresolution_for_ranked_mode():
+    calls = {"lookup": 0, "persist": 0}
+
+    async def load_entity(_subject):
+        return {
+            "atlas_id": "atlas-1",
+            "label": "Australia",
+            "type": "atlas:Location",
+            "description": "country in Oceania",
+            "needs_curation": True,
+            "confidence": 0.55,
+        }
+
+    async def wikidata_lookup(_subject, _language="en", _limit=5):
+        calls["lookup"] += 1
+        return [
+            {"id": "Q408", "label": "Australia", "description": "country in Oceania", "type": "Q6256"}
+        ]
+
+    async def persist(_entity):
+        calls["persist"] += 1
+
+    svc = ResolveService(load_entity_fn=load_entity, wikidata_lookup_fn=wikidata_lookup, persist_entity_fn=persist)
+    result = await svc.resolve(
+        subject="Australia",
+        context={"language": "en", "realm": "external"},
+        constraints={"min_confidence": 0.85},
+        hints={"expected_type": "location", "aliases": []},
+        strategy={"mode": "ranked", "auto_accept_threshold": 0.85},
+        debug={"include_explanations": True},
+    )
+
+    assert calls["lookup"] == 1
+    assert calls["persist"] == 1
+    assert result["status"] == "resolved"
+    assert result["meta"]["debug"]["used_cache"] is False
+
+
+@pytest.mark.anyio
+async def test_interactive_returns_all_candidates_without_auto_accepting_below_threshold():
+    async def no_hit(_subject):
+        return None
+
+    async def wikidata_lookup(_subject, _language="en", _limit=5):
+        return [
+            {"id": "Q1225", "label": "Georgia", "description": "country in Eastern Europe and West Asia", "type": "Q6256"},
+            {"id": "Q1428", "label": "Georgia", "description": "state of the United States of America", "type": "Q35657"},
+        ]
+
+    async def no_persist(_entity):
+        return None
+
+    svc = ResolveService(load_entity_fn=no_hit, wikidata_lookup_fn=wikidata_lookup, persist_entity_fn=no_persist)
+    result = await svc.resolve(
+        subject="Georgia",
+        context={"language": "en", "realm": "external"},
+        constraints={"max_candidates": 5},
+        hints={"expected_type": "location", "aliases": []},
+        strategy={"mode": "interactive", "auto_accept_threshold": 0.95, "interactive_below_threshold": True},
+        debug={"include_candidates": True, "include_explanations": True},
+    )
+
+    assert result["status"] == "ambiguous"
+    assert len(result["candidates"]) == 2
+    assert result["meta"]["debug"]["decision"] == "ambiguous_below_threshold"

+ 5 - 3
tests/test_resolve_tool.py

@@ -11,8 +11,8 @@ async def test_resolve_tool_is_stubbed_and_returns_ok():
     async def no_persist(_e):
         return None
 
-    async def no_wikidata(_s):
-        return None
+    async def no_wikidata(_s, _language="en", _limit=1):
+        return []
 
     svc = ResolveService(
         load_entity_fn=no_hit,
@@ -21,4 +21,6 @@ async def test_resolve_tool_is_stubbed_and_returns_ok():
     )
     result = await svc.resolve(subject="anything")
 
-    assert result == {"status": "not_found"}
+    assert result["status"] in {"not_found", "ambiguous", "resolved", "error"}
+    assert "meta" in result
+    assert "resolution_path" in result