glam/data/custodian.backup.20251230/CZ-10-DOM-A-ANK.yaml
2025-12-30 23:07:03 +01:00

267 lines
9.5 KiB
YAML
Raw Blame History

This file contains ambiguous Unicode characters

This file contains Unicode characters that might be confused with other characters. If you think that this is intentional, you can safely ignore this warning. Use the Escape button to reveal them.

original_entry:
name: Archiv Národní knihovny
institution_type: ARCHIVE
source: CH-Annotator (czech_unified_ch_annotator.yaml)
identifiers:
- &id001
identifier_scheme: ARON_UUID
identifier_value: e262b2e2-5213-4e1e-b4ac-32843aa1c36c
identifier_url: https://portal.nacr.cz/aron/apu/e262b2e2-5213-4e1e-b4ac-32843aa1c36c
- &id002
identifier_scheme: INSTITUTION_CODE
identifier_value: '630000050'
- &id003
identifier_scheme: Wikidata
identifier_value: Q64869380
identifier_url: https://www.wikidata.org/wiki/Q64869380
- &id004
identifier_scheme: VIAF
identifier_value: '136515365'
identifier_url: https://viaf.org/viaf/136515365
locations: []
processing_timestamp: '2025-12-06T23:37:44.792710+00:00'
ghcid:
ghcid_current: CZ-10-DOM-A-ANK
ghcid_original: XX-XX-XXX-A-ANK
ghcid_uuid: 9db9d6d2-f0f3-5c2c-ac8a-6fa6c2f55c02
ghcid_uuid_sha256: f5481d53-2b5b-8134-07da-b14e74501678
ghcid_numeric: 17674408980662444340
record_id: 1aa0af71-24f3-410a-9405-4ca431f7ab2a
generation_timestamp: '2025-12-06T23:37:44.792710+00:00'
location_resolution:
country_code: CZ
region_code: '10'
city_code: DOM
method: WIKIDATA_COORDS_REVERSE_GEOCODE
resolution_timestamp: '2025-12-07T00:25:56.478232+00:00'
region_name: CZ-10
iso_code_source: CZ-10
city_label: Dolni Mecholupy
geonames_id: 3076771
ghcid_history:
- previous_ghcid_component: "DM"
new_ghcid_component: "DOM"
change_date: "2025-12-20T19:55:24Z"
reason: "Fixed 2-letter city code to proper 3-letter code per AGENTS.md. City: Dolni Mecholupy"
- ghcid: XX-XX-XXX-A-ANK
ghcid_numeric: 17674408980662444340
valid_from: '2025-12-06T23:37:44.792710+00:00'
reason: Initial GHCID from CH-Annotator (czech_unified_ch_annotator.yaml)
- ghcid: CZ-XX-XXX-A-ANK
valid_from: '2025-12-06T23:54:40.648223+00:00'
reason: 'Country resolved via Wikidata P17: XX→CZ'
- ghcid: CZ-10-XXX-A-ANK
valid_from: '2025-12-07T00:01:29.808795+00:00'
reason: 'Region resolved via Wikidata P131: XX->10 (CZ-10)'
- ghcid: CZ-10-DM-A-ANK
valid_from: '2025-12-07T00:25:56.478255+00:00'
reason: 'City resolved via Wikidata Q64869380 coordinates: XXX->DM (Dolni Mecholupy)'
custodian_name:
claim_type: custodian_name
claim_value: Archiv Národní knihovny
source_type: ch_annotator
identifiers:
- identifier_scheme: GHCID
identifier_value: XX-XX-XXX-A-ANK
- identifier_scheme: GHCID_UUID
identifier_value: 9db9d6d2-f0f3-5c2c-ac8a-6fa6c2f55c02
- identifier_scheme: GHCID_UUID_SHA256
identifier_value: f5481d53-2b5b-8134-07da-b14e74501678
- identifier_scheme: GHCID_NUMERIC
identifier_value: '17674408980662444340'
- identifier_scheme: RECORD_ID
identifier_value: 1aa0af71-24f3-410a-9405-4ca431f7ab2a
- *id001
- *id002
- *id003
- *id004
provenance:
data_source: API_SCRAPING
data_tier: TIER_1_AUTHORITATIVE
extraction_date: '2025-11-19T11:35:45.745453+00:00'
extraction_method: 'Created from CH-Annotator file: czech_unified_ch_annotator.yaml'
confidence_score: 0.85
notes:
- 'Country resolved 2025-12-06T23:54:40Z: XX→CZ via Wikidata P17'
- 'Region resolved 2025-12-07T00:01:29Z: XX->10 via Wikidata P131 (CZ-10)'
- 'City resolved 2025-12-07T00:25:56Z: XXX->DM via Wikidata Q64869380 coords (50.0467,14.5567) -> Dolni Mecholupy (GeoNames:3076771)'
- 'YouTube/Google Maps enrichment 2025-12-08T19:45:12Z: Maps: rejected by LLM; YouTube: not found'
- Canonical location added via normalize_custodian_files.py on 2025-12-08T23:48:03Z
- Canonical location added via normalize_custodian_files.py on 2025-12-09T06:49:27Z
schema_version: 2.0.0
enrichment_provenance:
wikidata_enrichment:
content_hash: sha256-lWbaXQExFjOYWdHnD7QBvO/AspEx6zsrXjooMMIA5Pg=
verified_at: '2025-12-28T19:58:20.765235+00:00'
wasDerivedFrom: https://www.wikidata.org/wiki/Q64869380
provenance_schema_version: '2.0'
standards_compliance:
- W3C PROV-O
- W3C SRI (content hashes)
generated_at: '2025-12-28T19:58:20.765250+00:00'
ch_annotator:
convention_id: ch_annotator-v1_7_0
convention_version: 1.7.0
entity_classification:
hypernym: GRP
hypernym_label: GROUP
subtype: GRP.HER.ARC
subtype_label: ARCHIVE
ontology_class: schema:ArchiveOrganization
alternative_classes:
- org:FormalOrganization
- rov:RegisteredOrganization
- glam:HeritageCustodian
extraction_provenance:
namespace: glam
path: /files/czech_unified.yaml
timestamp: '2025-11-19T11:35:45.745453+00:00'
agent: claude-conversation
context_convention: ch_annotator-v1_7_0
annotation_provenance:
annotation_agent: opencode-claude-sonnet-4
annotation_date: '2025-12-06T21:12:32.389491+00:00'
annotation_method: retroactive CH-Annotator application via batch script
source_file: czech_unified.yaml
annotation_metadata:
confidence_score: 0.85
verified: false
verification_date:
verified_by:
entity_claims:
- claim_type: full_name
claim_value: Archiv Národní knihovny
property_uri: skos:prefLabel
provenance:
namespace: glam
path: /files/czech_unified.yaml
timestamp: '2025-11-19T11:35:45.745453+00:00'
agent: claude-conversation
context_convention: ch_annotator-v1_7_0
confidence: 0.85
- claim_type: institution_type
claim_value: ARCHIVE
property_uri: rdf:type
provenance:
namespace: glam
path: /files/czech_unified.yaml
timestamp: '2025-11-19T11:35:45.745453+00:00'
agent: claude-conversation
context_convention: ch_annotator-v1_7_0
confidence: 0.95
- claim_type: wikidata_id
claim_value: Q64869380
property_uri: owl:sameAs
provenance:
namespace: wikidata
path: /entity/Q64869380
timestamp: '2025-11-19T11:35:45.745453+00:00'
agent: claude-conversation
context_convention: ch_annotator-v1_7_0
confidence: 0.98
integration_note:
created_from: czech_unified_ch_annotator.yaml
creation_date: '2025-12-06T23:37:44.792710+00:00'
creation_method: create_custodian_from_ch_annotator.py
wikidata_enrichment:
wikidata_entity_id: Q64869380
api_metadata:
api_endpoint: https://www.wikidata.org/w/rest.php/wikibase/v1
fetch_timestamp: '2025-12-08T23:41:07.388472+00:00'
user_agent: GLAMDataExtractor/1.1 (glam-data@example.com) Python/httpx
enrichment_version: 2.0_full
properties_found:
- P31
- P17
- P214
- P18
- P131
- P571
- P159
- P968
- P361
- P2671
wikidata_labels:
cs: Archiv Národní knihovny ČR
en: Archives of the National Library of the Czech Republic
wikidata_label_en: Archives of the National Library of the Czech Republic
wikidata_descriptions:
cs: český specializovaný archiv
wikidata_aliases:
cs:
- Archiv Národní knihovny
- ANK
wikidata_sitelinks:
cswiki: Archiv Národní knihovny České republiky
wikidata_temporal:
inception: '1990-00-00'
wikidata_inception: '1990-00-00'
wikidata_classification:
instance_of: &id005
- id: Q101470010
label: specialized archives
description: type of archives in Czechia
wikidata_instance_of: *id005
wikidata_location:
country: &id006
id: Q213
label: Czech Republic
description: country in Central Europe
located_in_admin_entity: &id007
id: Q1085
label: Prague
description: capital city of the Czech Republic
headquarters_location:
id: Q3490834
label: Prague 15
description: municipal part of Prague
wikidata_country: *id006
wikidata_located_in: *id007
wikidata_organization:
part_of:
id: Q1967876
label: National Library of the Czech Republic
description: central library of the Czech Republic
wikidata_media:
image: Národní knihovna ČR Centrální depozitář Hostivař 4.jpg
wikidata_image: Národní knihovna ČR Centrální depozitář Hostivař 4.jpg
wikidata_contact:
email: mailto:Katerina.Hekrdlova@nkp.cz
_provenance:
content_hash:
algorithm: sha256
value: sha256-lWbaXQExFjOYWdHnD7QBvO/AspEx6zsrXjooMMIA5Pg=
scope: enrichment_section
computed_at: '2025-12-28T19:58:20.765235+00:00'
prov:
wasGeneratedBy:
'@type': prov:Activity
name: wikidata_api_fetch
used: https://www.wikidata.org/w/rest.php/wikibase/v1
wasDerivedFrom: https://www.wikidata.org/wiki/Q64869380
verification:
status: verified
last_verified: '2025-12-28T19:58:20.765242+00:00'
google_maps_status: NO_MATCH
google_maps_rejected:
candidate_name: National Archives of the Czech Republic
rejection_reason: The candidate 'National Archives of the Czech Republic' is a different institution from the source 'Archiv Národní knihovny'. The source is the archive of the National Library of the Czech Republic, while the candidate is the main National Archives. Although both are archives in Prague, they are separate organizations, which is a critical mismatch.
timestamp: '2025-12-08T19:45:12.427546+00:00'
youtube_status: NOT_FOUND
youtube_search_query: Archiv Národní knihovny official
youtube_search_timestamp: '2025-12-08T19:45:12.757543+00:00'
location:
region: CZ-10
region_code: '10'
country: CZ
geonames_id: 3076771
normalization_timestamp: '2025-12-09T15:34:38.593418+00:00'
latitude: 50.06037
longitude: 14.55733
coordinate_provenance:
source_type: GEONAMES_LOCAL
source_path: data/reference/geonames.db
entity_id: 3076771
original_timestamp: '2025-12-09T15:34:38.593047+00:00'
geonames_name: Dolní Měcholupy
feature_code: PPL