glam/data/custodian/CZ-10-PRK-A-SOAPVSSVP.yaml
2025-12-30 23:01:01 +01:00

185 lines
7.5 KiB
YAML

original_entry:
name: Státní okresní archiv Praha-východ se sídlem v Přemyšlení
institution_type: ARCHIVE
source: CH-Annotator (czech_unified_ch_annotator.yaml)
identifiers:
- &id001
identifier_scheme: ARON_UUID
identifier_value: 8b97e6fe-0615-4adb-9b4f-09c0b00c4edf
identifier_url: https://portal.nacr.cz/aron/apu/8b97e6fe-0615-4adb-9b4f-09c0b00c4edf
- &id002
identifier_scheme: INSTITUTION_CODE
identifier_value: '221209010'
locations: []
processing_timestamp: '2025-12-06T23:37:44.401323+00:00'
ghcid:
ghcid_current: CZ-10-PRK-A-SOAPVSSVP
ghcid_original: XX-XX-XXX-A-SOAPVSSVP
ghcid_uuid: c38ffa04-944b-5c0e-8781-b774f749a527
ghcid_uuid_sha256: c7e3cfa8-9aff-8da6-f016-601e01448ceb
ghcid_numeric: 14403584356322880934
record_id: 144317eb-9e65-45a6-b8c7-21a7694cf444
generation_timestamp: '2025-12-06T23:37:44.401323+00:00'
location_resolution:
country_code: CZ
region_code: '10'
city_code: PRK
method: CH_ANNOTATOR_TOP_SET
resolution_timestamp: '2025-12-07T00:19:29.810682+00:00'
city_name: Praha Klanovice
geonames_id: 8629195
feature_code: PPL
extracted_toponym: Praha
latitude: 50.0974
longitude: 14.66915
ghcid_history:
- previous_ghcid_component: PK
new_ghcid_component: PRK
change_date: '2025-12-20T19:55:24Z'
reason: 'Fixed 2-letter city code to proper 3-letter code per AGENTS.md. City: Praha Klanovice'
- ghcid: XX-XX-XXX-A-SOAPVSSVP
ghcid_numeric: 14403584356322880934
valid_from: '2025-12-06T23:37:44.401323+00:00'
reason: Initial GHCID from CH-Annotator (czech_unified_ch_annotator.yaml)
- ghcid: CZ-XX-XXX-A-SOAPVSSVP
valid_from: '2025-12-06T23:56:11.991897+00:00'
reason: 'Country resolved via Wikidata P17: XX→CZ'
- ghcid: CZ-10-PK-A-SOAPVSSVP
valid_from: '2025-12-07T00:19:29.810692+00:00'
reason: 'Location resolved via CH-Annotator TOP.SET extraction: Praha -> Praha Klanovice (GeoNames:8629195)'
custodian_name:
claim_type: custodian_name
claim_value: Státní okresní archiv Praha-východ se sídlem v Přemyšlení
source_type: ch_annotator
identifiers:
- identifier_scheme: GHCID
identifier_value: XX-XX-XXX-A-SOAPVSSVP
- identifier_scheme: GHCID_UUID
identifier_value: c38ffa04-944b-5c0e-8781-b774f749a527
- identifier_scheme: GHCID_UUID_SHA256
identifier_value: c7e3cfa8-9aff-8da6-f016-601e01448ceb
- identifier_scheme: GHCID_NUMERIC
identifier_value: '14403584356322880934'
- identifier_scheme: RECORD_ID
identifier_value: 144317eb-9e65-45a6-b8c7-21a7694cf444
- *id001
- *id002
provenance:
data_source: API_SCRAPING
data_tier: TIER_1_AUTHORITATIVE
extraction_date: '2025-11-19T11:35:45.744650+00:00'
extraction_method: 'Created from CH-Annotator file: czech_unified_ch_annotator.yaml'
confidence_score: 0.85
notes:
- 'Country resolved 2025-12-06T23:56:11Z: XX→CZ via Wikidata P17'
- 'Location resolved 2025-12-07T00:19:29Z: CH-Annotator TOP.SET extraction ''Praha'' -> Praha Klanovice (GeoNames:8629195,
Region:10)'
- 'YouTube/Google Maps enrichment 2025-12-08T19:45:30Z: Maps: rejected by LLM; YouTube: not found'
- Canonical location added via normalize_custodian_files.py on 2025-12-08T23:11:18Z
- Canonical location added via normalize_custodian_files.py on 2025-12-08T23:48:03Z
- Canonical location added via normalize_custodian_files.py on 2025-12-09T06:49:27Z
ch_annotator:
convention_id: ch_annotator-v1_7_0
convention_version: 1.7.0
entity_classification:
hypernym: GRP
hypernym_label: GROUP
subtype: GRP.HER.ARC
subtype_label: ARCHIVE
ontology_class: schema:ArchiveOrganization
alternative_classes:
- org:FormalOrganization
- rov:RegisteredOrganization
- glam:HeritageCustodian
extraction_provenance:
namespace: glam
path: /files/czech_unified.yaml
agent: batch-script-create-custodian-from-ch-annotator
context_convention: ch_annotator-v1_7_0
source_archived_at: '2025-11-19T11:35:45.744650+00:00'
statement_created_at: '2025-12-06T21:12:32.389491+00:00'
source_type: library_registry_api
migration_note: Migrated from agent:claude-conversation on 2025-12-30
annotation_provenance:
annotation_agent: opencode-claude-sonnet-4
annotation_date: '2025-12-06T21:12:32.389491+00:00'
annotation_method: retroactive CH-Annotator application via batch script
source_file: czech_unified.yaml
annotation_metadata:
confidence_score: 0.85
verified: false
verification_date: null
verified_by: null
entity_claims:
- claim_type: full_name
claim_value: Státní okresní archiv Praha-východ se sídlem v Přemyšlení
property_uri: skos:prefLabel
provenance:
namespace: glam
path: /files/czech_unified.yaml
agent: batch-script-create-custodian-from-ch-annotator
context_convention: ch_annotator-v1_7_0
source_archived_at: '2025-11-19T11:35:45.744650+00:00'
statement_created_at: '2025-12-06T21:12:32.389491+00:00'
source_type: library_registry_api
migration_note: Migrated from agent:claude-conversation on 2025-12-30
confidence: 0.85
- claim_type: institution_type
claim_value: ARCHIVE
property_uri: rdf:type
provenance:
namespace: glam
path: /files/czech_unified.yaml
agent: batch-script-create-custodian-from-ch-annotator
context_convention: ch_annotator-v1_7_0
source_archived_at: '2025-11-19T11:35:45.744650+00:00'
statement_created_at: '2025-12-06T21:12:32.389491+00:00'
source_type: library_registry_api
migration_note: Migrated from agent:claude-conversation on 2025-12-30
confidence: 0.95
- claim_type: location_settlement
claim_value: Praha Klanovice
property_uri: schema:location
hypernym_code: TOP.SET
hypernym_label: SETTLEMENT
provenance:
namespace: geonames
path: /geonames/8629195
timestamp: '2025-12-07T00:19:29.810696+00:00'
agent: extract_locations_ch_annotator.py
context_convention: ch_annotator-v1_7_0
confidence: 0.85
extraction_source:
field: institution_name
extracted_text: Praha
method: pattern_matching
integration_note:
created_from: czech_unified_ch_annotator.yaml
creation_date: '2025-12-06T23:37:44.401323+00:00'
creation_method: create_custodian_from_ch_annotator.py
google_maps_status: NO_MATCH
google_maps_rejected:
candidate_name: Státní Okresní Archiv Praha-východ
rejection_reason: The names are a strong match for the same institution. The location mismatch is minor (Zdiby vs. Praha
Klanovice) and likely indicates that the institution moved from its listed location. However, the Google Place types ('point_of_interest',
'establishment') are too generic and do not confirm its function as an archive. The 'CLOSED_PERMANENTLY' status further
weakens the case for a current match. REJECT due to incorrect and generic Google Place Types.
timestamp: '2025-12-08T19:45:30.189507+00:00'
youtube_status: NOT_FOUND
youtube_search_query: Státní okresní archiv Praha-východ se sídlem v Přemyšlení official
youtube_search_timestamp: '2025-12-08T19:45:30.522902+00:00'
location:
latitude: 50.0974
longitude: 14.66915
coordinate_provenance:
source_type: GHCID_RESOLUTION_DIRECT
source_path: ghcid.location_resolution
original_timestamp: '2025-12-07T00:19:29.810682+00:00'
entity_id: 8629195
resolution_method: CH_ANNOTATOR_TOP_SET
city: Praha Klanovice
region_code: '10'
country: CZ
geonames_id: 8629195
feature_code: PPL
normalization_timestamp: '2025-12-09T06:49:27.679546+00:00'