test_claims.py 1.7 KB

123456789101112131415161718192021222324252627282930313233
  1. from app.claims import build_claim_sets
  2. from app.models import AtlasAlias, AtlasEntity, AtlasIdentifier, AtlasProvenance
  3. def test_build_claim_sets_attaches_provenance_per_claim():
  4. entity = AtlasEntity(
  5. atlas_id="atlas:mid:/m/0cqt90",
  6. canonical_label="Donald Trump",
  7. canonical_description="45th and 47th U.S. President",
  8. entity_type="Person",
  9. aliases=[AtlasAlias(label="Donald Trump")],
  10. identifiers=[
  11. AtlasIdentifier(value="/m/0cqt90", source="google", identifier_type="mid"),
  12. AtlasIdentifier(value="Q22686", source="wikidata", identifier_type="qid"),
  13. ],
  14. provenance=[
  15. AtlasProvenance(source="google", retrieval_method="trends-resolution", confidence=0.9, retrieved_at="2026-04-03T00:00:00Z"),
  16. AtlasProvenance(source="wikidata", retrieval_method="wbsearchentities + entitydata", confidence=0.99, retrieved_at="2026-04-03T00:00:01Z"),
  17. AtlasProvenance(source="openai-llm", retrieval_method="type-classification", confidence=1.0, retrieved_at="2026-04-03T00:00:02Z"),
  18. ],
  19. raw_payload={"wikidata": {"status": "ok", "qid": "Q22686", "retrieved_at": "2026-04-03T00:00:01Z"}},
  20. needs_curation=False,
  21. )
  22. raw_claims, derived_claims = build_claim_sets(entity)
  23. mid_claim = next(c for c in raw_claims if c["object"].get("value") == "/m/0cqt90")
  24. qid_claim = next(c for c in raw_claims if c["object"].get("value") == "Q22686")
  25. canonical_type = next(c for c in derived_claims if c["predicate"] == "atlas:hasCanonicalType")
  26. assert mid_claim["provenance"]["source"] == "google"
  27. assert qid_claim["provenance"]["source"] == "wikidata"
  28. assert canonical_type["provenance"]["method"] == "type-classification"