glam/data/custodian/CZ-10-PRA-A-MCPUMCOSA.yaml
2025-12-30 23:01:01 +01:00

165 lines
6.8 KiB
YAML

custodian_name:
claim_type: custodian_name
claim_value: Městská část Praha 8, Úřad městské části, oddělení správní archiv
source_type: ch_annotator
original_entry:
name: Městská část Praha 8, Úřad městské části, oddělení správní archiv
institution_type: ARCHIVE
source: CH-Annotator (czech_unified_ch_annotator.yaml)
identifiers:
- &id001
identifier_scheme: ARON_UUID
identifier_value: 8eb1af65-589b-4387-b275-ded623e45958
identifier_url: https://portal.nacr.cz/aron/apu/8eb1af65-589b-4387-b275-ded623e45958
- &id002
identifier_scheme: INSTITUTION_CODE
identifier_value: '430000020'
locations: []
processing_timestamp: '2025-12-06T23:37:44.412611+00:00'
ghcid:
ghcid_current: CZ-10-PRA-A-MCPUMCOSA
ghcid_original: XX-XX-XXX-A-MČPÚMČOSA
ghcid_uuid: ebd1d928-73a4-55f7-a8f8-808f820926f1
ghcid_uuid_sha256: 7d3a0ff6-400b-8b03-81b9-afb39b88b4ef
ghcid_numeric: 9023542353701055235
record_id: d840e672-9808-44eb-af86-5302867f472f
generation_timestamp: '2025-12-06T23:37:44.412611+00:00'
location_resolution:
country_code: CZ
region_code: '10'
city_code: PRA
method: NAME_EXTRACTION
resolution_timestamp: '2025-12-07T12:33:44.242569+00:00'
region_name: Praha
city_label: Prague
reason: 'City extracted from institution name: "praha" → Prague'
ghcid_history:
- ghcid: CZ-10-PRA-A-MCPUMCOSA
ghcid_numeric: 9023542353701055235
valid_from: '2025-12-08T11:21:38.203600+00:00'
reason: 'Normalized diacritics to ASCII per ABBREV-DIACRITICS rule (was: CZ-10-PRA-A-MČPÚMČOSA)'
- ghcid: XX-XX-XXX-A-MČPÚMČOSA
ghcid_numeric: 17749544531385161246
valid_from: '2025-12-06T23:37:44.412611+00:00'
reason: Initial GHCID from CH-Annotator (czech_unified_ch_annotator.yaml)
valid_to: '2025-12-08T11:21:38.203600+00:00'
- ghcid: CZ-XX-XXX-A-MČPÚMČOSA
valid_from: '2025-12-06T23:56:12.338911+00:00'
reason: 'Country resolved via Wikidata P17: XX→CZ'
- ghcid: CZ-10-PRA-A-MČPÚMČOSA
valid_from: '2025-12-07T12:33:44.242578+00:00'
reason: 'Location resolved from name: XX→10, XXX→PRA (Prague)'
identifiers:
- identifier_scheme: GHCID
identifier_value: CZ-10-PRA-A-MCPUMCOSA
- identifier_scheme: GHCID_UUID
identifier_value: ebd1d928-73a4-55f7-a8f8-808f820926f1
- identifier_scheme: GHCID_UUID_SHA256
identifier_value: 7d3a0ff6-400b-8b03-81b9-afb39b88b4ef
- identifier_scheme: GHCID_NUMERIC
identifier_value: '9023542353701055235'
- identifier_scheme: RECORD_ID
identifier_value: d840e672-9808-44eb-af86-5302867f472f
- *id001
- *id002
provenance:
data_source: API_SCRAPING
data_tier: TIER_1_AUTHORITATIVE
extraction_date: '2025-11-19T11:35:45.744674+00:00'
extraction_method: 'Created from CH-Annotator file: czech_unified_ch_annotator.yaml'
confidence_score: 0.85
notes:
- 'Country resolved 2025-12-06T23:56:12Z: XX→CZ via Wikidata P17'
- 'YouTube/Google Maps enrichment 2025-12-08T19:47:23Z: Maps: rejected by LLM; YouTube: not found'
- Canonical location added via normalize_custodian_files.py on 2025-12-08T23:11:19Z
- Canonical location added via normalize_custodian_files.py on 2025-12-08T23:48:04Z
- Canonical location added via normalize_custodian_files.py on 2025-12-09T06:49:28Z
ch_annotator:
convention_id: ch_annotator-v1_7_0
convention_version: 1.7.0
entity_classification:
hypernym: GRP
hypernym_label: GROUP
subtype: GRP.HER.ARC
subtype_label: ARCHIVE
ontology_class: schema:ArchiveOrganization
alternative_classes:
- org:FormalOrganization
- rov:RegisteredOrganization
- glam:HeritageCustodian
extraction_provenance:
namespace: glam
path: /files/czech_unified.yaml
agent: batch-script-create-custodian-from-ch-annotator
context_convention: ch_annotator-v1_7_0
source_archived_at: '2025-11-19T11:35:45.744674+00:00'
statement_created_at: '2025-12-06T21:12:32.389491+00:00'
source_type: library_registry_api
migration_note: Migrated from agent:claude-conversation on 2025-12-30
annotation_provenance:
annotation_agent: opencode-claude-sonnet-4
annotation_date: '2025-12-06T21:12:32.389491+00:00'
annotation_method: retroactive CH-Annotator application via batch script
source_file: czech_unified.yaml
annotation_metadata:
confidence_score: 0.85
verified: false
verification_date: null
verified_by: null
entity_claims:
- claim_type: full_name
claim_value: Městská část Praha 8, Úřad městské části, oddělení správní archiv
property_uri: skos:prefLabel
provenance:
namespace: glam
path: /files/czech_unified.yaml
agent: batch-script-create-custodian-from-ch-annotator
context_convention: ch_annotator-v1_7_0
source_archived_at: '2025-11-19T11:35:45.744674+00:00'
statement_created_at: '2025-12-06T21:12:32.389491+00:00'
source_type: library_registry_api
migration_note: Migrated from agent:claude-conversation on 2025-12-30
confidence: 0.85
- claim_type: institution_type
claim_value: ARCHIVE
property_uri: rdf:type
provenance:
namespace: glam
path: /files/czech_unified.yaml
agent: batch-script-create-custodian-from-ch-annotator
context_convention: ch_annotator-v1_7_0
source_archived_at: '2025-11-19T11:35:45.744674+00:00'
statement_created_at: '2025-12-06T21:12:32.389491+00:00'
source_type: library_registry_api
migration_note: Migrated from agent:claude-conversation on 2025-12-30
confidence: 0.95
integration_note:
created_from: czech_unified_ch_annotator.yaml
creation_date: '2025-12-06T23:37:44.412611+00:00'
creation_method: create_custodian_from_ch_annotator.py
google_maps_status: NO_MATCH
google_maps_rejected:
candidate_name: Municipal District Office of Prague 8
rejection_reason: 'TYPE_MISMATCH: The source name indicates an administrative archive (''oddělení správní archiv''), but
the Google Place entry is for the broader municipal district office (''Městská část Praha 8, Úřad městské části''). The
Google Place types confirm this mismatch, listing ''local_government_office'' instead of a heritage-related type like
a library or archive. This is a government office, not a heritage institution.'
timestamp: '2025-12-08T19:47:22.840017+00:00'
youtube_status: NOT_FOUND
youtube_search_query: Městská část Praha 8, Úřad městské části, oddělení správní archiv official
youtube_search_timestamp: '2025-12-08T19:47:23.180787+00:00'
location:
region: Praha
region_code: '10'
country: CZ
normalization_timestamp: '2025-12-09T15:34:39.747246+00:00'
latitude: 50.08804
longitude: 14.42076
coordinate_provenance:
source_type: GEONAMES_LOCAL
source_path: data/reference/geonames.db
entity_id: 3067696
original_timestamp: '2025-12-09T15:34:39.747214+00:00'
geonames_id: 3067696
geonames_name: Prague
feature_code: PPLC