glam/data/custodian.backup.20251230/CZ-10-PRA-A-AUMAVESPZ.yaml
2025-12-30 23:07:03 +01:00

264 lines
12 KiB
YAML
Raw Permalink Blame History

This file contains invisible Unicode characters

This file contains invisible Unicode characters that are indistinguishable to humans but may be processed differently by a computer. If you think that this is intentional, you can safely ignore this warning. Use the Escape button to reveal them.

This file contains Unicode characters that might be confused with other characters. If you think that this is intentional, you can safely ignore this warning. Use the Escape button to reveal them.

original_entry:
name: Archiválie uložené mimo archivy v evidenci SOkA Praha-západ
institution_type: ARCHIVE
source: CH-Annotator (czech_unified_ch_annotator.yaml)
identifiers:
- &id001
identifier_scheme: ARON_UUID
identifier_value: 1443b0ae-a411-4adc-8700-18241bbe1200
identifier_url: https://portal.nacr.cz/aron/apu/1443b0ae-a411-4adc-8700-18241bbe1200
- &id002
identifier_scheme: INSTITUTION_CODE
identifier_value: '801210010'
locations: []
processing_timestamp: '2025-12-06T23:37:43.832878+00:00'
ghcid:
ghcid_current: CZ-10-PRA-A-AUMAVESPZ
ghcid_original: XX-XX-XXX-A-AUMAVESPZ
ghcid_uuid: 2fa8dd54-2c9c-56b8-86c7-663f0822c17a
ghcid_uuid_sha256: e8055cba-a0f9-8a1c-df59-75f406483f4b
ghcid_numeric: 16718871148317219356
record_id: 5fbd91cb-6f5e-49ec-8763-3b10226a0886
generation_timestamp: '2025-12-06T23:37:43.832878+00:00'
location_resolution:
country_code: CZ
region_code: '10'
city_code: PRA
method: NAME_EXTRACTION
resolution_timestamp: '2025-12-07T12:33:44.011667+00:00'
region_name: Praha
city_label: Prague
reason: 'City extracted from institution name: "praha" → Prague'
ghcid_history:
- ghcid: XX-XX-XXX-A-AUMAVESPZ
ghcid_numeric: 16718871148317219356
valid_from: '2025-12-06T23:37:43.832878+00:00'
reason: Initial GHCID from CH-Annotator (czech_unified_ch_annotator.yaml)
- ghcid: CZ-XX-XXX-A-AUMAVESPZ
valid_from: '2025-12-06T23:56:12.760155+00:00'
reason: 'Country resolved via Wikidata P17: XX→CZ'
- ghcid: CZ-10-PRA-A-AUMAVESPZ
valid_from: '2025-12-07T12:33:44.011685+00:00'
reason: 'Location resolved from name: XX→10, XXX→PRA (Prague)'
custodian_name:
claim_type: custodian_name
claim_value: Archiválie uložené mimo archivy v evidenci SOkA Praha-západ
source_type: ch_annotator
identifiers:
- identifier_scheme: GHCID
identifier_value: XX-XX-XXX-A-AUMAVESPZ
- identifier_scheme: GHCID_UUID
identifier_value: 2fa8dd54-2c9c-56b8-86c7-663f0822c17a
- identifier_scheme: GHCID_UUID_SHA256
identifier_value: e8055cba-a0f9-8a1c-df59-75f406483f4b
- identifier_scheme: GHCID_NUMERIC
identifier_value: '16718871148317219356'
- identifier_scheme: RECORD_ID
identifier_value: 5fbd91cb-6f5e-49ec-8763-3b10226a0886
- *id001
- *id002
provenance:
data_source: API_SCRAPING
data_tier: TIER_1_AUTHORITATIVE
extraction_date: '2025-11-19T11:35:45.743469+00:00'
extraction_method: 'Created from CH-Annotator file: czech_unified_ch_annotator.yaml'
confidence_score: 0.85
notes:
- 'Country resolved 2025-12-06T23:56:12Z: XX→CZ via Wikidata P17'
- 'YouTube/Google Maps enrichment 2025-12-08T19:46:55Z: Maps: State Regional Archives in Prague (conf: 0.90); YouTube:
not found'
- Canonical location added via normalize_custodian_files.py on 2025-12-08T23:11:19Z
- Canonical location added via normalize_custodian_files.py on 2025-12-08T23:48:04Z
- Canonical location added via normalize_custodian_files.py on 2025-12-09T06:49:28Z
schema_version: 2.0.0
enrichment_provenance:
google_maps_enrichment:
content_hash: sha256-yEo7rRSuFitnH3Z6qYiLiOhTj0sO+NtzAhTr3Fp61j0=
verified_at: '2025-12-28T19:58:21.316662+00:00'
provenance_schema_version: '2.0'
standards_compliance:
- W3C PROV-O
- W3C SRI (content hashes)
generated_at: '2025-12-28T19:58:21.316682+00:00'
ch_annotator:
convention_id: ch_annotator-v1_7_0
convention_version: 1.7.0
entity_classification:
hypernym: GRP
hypernym_label: GROUP
subtype: GRP.HER.ARC
subtype_label: ARCHIVE
ontology_class: schema:ArchiveOrganization
alternative_classes:
- org:FormalOrganization
- rov:RegisteredOrganization
- glam:HeritageCustodian
extraction_provenance:
namespace: glam
path: /files/czech_unified.yaml
timestamp: '2025-11-19T11:35:45.743469+00:00'
agent: claude-conversation
context_convention: ch_annotator-v1_7_0
annotation_provenance:
annotation_agent: opencode-claude-sonnet-4
annotation_date: '2025-12-06T21:12:32.389491+00:00'
annotation_method: retroactive CH-Annotator application via batch script
source_file: czech_unified.yaml
annotation_metadata:
confidence_score: 0.85
verified: false
verification_date:
verified_by:
entity_claims:
- claim_type: full_name
claim_value: Archiválie uložené mimo archivy v evidenci SOkA Praha-západ
property_uri: skos:prefLabel
provenance:
namespace: glam
path: /files/czech_unified.yaml
timestamp: '2025-11-19T11:35:45.743469+00:00'
agent: claude-conversation
context_convention: ch_annotator-v1_7_0
confidence: 0.85
- claim_type: institution_type
claim_value: ARCHIVE
property_uri: rdf:type
provenance:
namespace: glam
path: /files/czech_unified.yaml
timestamp: '2025-11-19T11:35:45.743469+00:00'
agent: claude-conversation
context_convention: ch_annotator-v1_7_0
confidence: 0.95
integration_note:
created_from: czech_unified_ch_annotator.yaml
creation_date: '2025-12-06T23:37:43.832878+00:00'
creation_method: create_custodian_from_ch_annotator.py
google_maps_enrichment:
place_id: ChIJpeVeWjWSC0cReyWDSRX37SM
name: State Regional Archives in Prague
fetch_timestamp: '2025-12-08T19:46:50.601512+00:00'
api_status: OK
coordinates:
latitude: 50.0386519
longitude: 14.492900899999999
formatted_address: Archivní 2257/4, 149 00 Praha 4-Chodov, Czechia
short_address: Archivní 2257/4, Praha 4-Chodov
phone_local: 974 847 358
phone_international: +420 974 847 358
website: http://www.soapraha.cz/
google_place_types:
- library
- point_of_interest
- establishment
business_status: OPERATIONAL
rating: 5
total_ratings: 21
reviews:
- author_name: Milan Vyhlídal
author_uri: https://www.google.com/maps/contrib/111835299486855944674/reviews
rating: 5
relative_time_description: a year ago
text: Experts in their field. They are always willing and professional to help or provide further guidance. Thank you
for your work!
publish_time: '2024-01-17T19:00:55.036123Z'
- author_name: Petra Kincl Braunová
author_uri: https://www.google.com/maps/contrib/116976865976878167071/reviews
rating: 5
relative_time_description: 2 years ago
text: Friendly and helpful staff. Pleasant environment.
publish_time: '2023-04-28T10:23:39.415867Z'
- author_name: Jaroslav Mašek
author_uri: https://www.google.com/maps/contrib/101001995239972380058/reviews
rating: 5
relative_time_description: 3 years ago
text: A very interesting visit with expert explanations from knowledgeable employees, for the uninitiated an amazing
experience, thank you very much
publish_time: '2022-11-03T12:04:46.976780Z'
- author_name: Jan Wójcicki
author_uri: https://www.google.com/maps/contrib/115803697556900327251/reviews
rating: 5
relative_time_description: 3 years ago
text:
publish_time: '2022-08-13T09:04:21.743042Z'
- author_name: Tereza Kosnarová
author_uri: https://www.google.com/maps/contrib/105482423779246590586/reviews
rating: 5
relative_time_description: 7 months ago
text:
publish_time: '2025-05-10T12:42:37.398757Z'
opening_hours:
open_now: false
weekday_text:
- 'Monday: 9:00AM6:00PM'
- 'Tuesday: 9:00AM4:00PM'
- 'Wednesday: 9:00AM6:00PM'
- 'Thursday: 9:00AM4:00PM'
- 'Friday: 9:00AM2:00PM'
- 'Saturday: Closed'
- 'Sunday: Closed'
photo_count: 5
photos_metadata:
- name: places/ChIJpeVeWjWSC0cReyWDSRX37SM/photos/AZLasHom1LZGFkFPP3k1FXYCvMagtv61BPtsTSzXPBNLa3w7ixQeulO9sn65lClUHLXjINmhBpNbn4h-DWQ2pQmjKR8oNaz0Xl2yFWXW9lmK7C7iN46RCtM7aYJAMUfGOWoKxdQslDz9sO2Nu9JXQDBib77sn7uApy9wO4hOqyJe119p0hju4WzGTX5Kzedqxix73YNQfDMcZ7RPnP4H6sPdyW-TVgHrdVybyZkWNUNgneUHxiBpvDlMgYyTiV5UF2UB-imcRLBI4sIgdeq5ndTefU2Sljn_LTydDP_Ckk29c2gRsd28IB5FYxU4L4sn2wsEq_xfpL7Dm2-UoWKauKmb8R08gFu-yrOfmqTzZo2OdOC0kZVujfo-PayRtAQFNIfOta2LJ1XbQwzBfr6A_dQhqfbsrhygW3M0OixQxSk6kkBtqg
height: 850
width: 1275
- name: places/ChIJpeVeWjWSC0cReyWDSRX37SM/photos/AZLasHoofZy3zYXohxWcbl_YsMEq0eGBVdSRII2JKmCS12WFx_PJaISX-1Jc0MGasqYKGmZvm2NLXJXxcEZ7-vhLvxz8JHU9X8A-sRFeuW4MErdIbsZmKlN5we1MNpJ2nmj3ujR_XG6wy4BjER8q3_46bRLYvYqJaZc69VQaHZigu1amPpwn-_XZd1EObHkLn_Wmz3EgFO_OdUyYPItBPrqh0YfEYfVnrZ3LUI_LFWM5rnJ_z5pzZFf58AKTQeyWr0N2PKkF58V5XeZTAD5_sIDIBj0ES48Z8thI3F-QvHdH_9NUiHya1O2nDEbA_ARF3xHbrkNmCv_l5QvNYyv68RBfrfY9KN1beC3kd53qLnD9BazlwgiUUKA-g68GXGfolvmnivhpHwoROwwvchdKS_Jonf5gUh408Bp-8usSDDJEse0
height: 4080
width: 2294
- name: places/ChIJpeVeWjWSC0cReyWDSRX37SM/photos/AZLasHqBXXqlKeyt8jzcBvVYDxzMOWOfZ2bFGc_5NzcsuqOdQyxJ9MisyuXbM42Et_bIW83fGw9rtziXTwssz59QC6LmNwgyVcwc5vGrcgHgFv0ArPU_KiFVKhatwX69f7UpMUWMYTgx5KqE2O78tU3PPrbp1SVxWskZVlICWp5s6AaAKplpKe29JkvBJ1pKuudr-Khnu1zRq8l7xck8DF5OW4-BYCsFTpT-d8GlBZB9qWCzBgX0VKFdnylvBr6dCPIo--W_kNusrOI_YnsGBdxfcrUkYh9oR1Gd6PY8hYPYgjsW1-k0sz-mmMCJMuAo-Kt1KF3y9v16OxI8bVukuSV5WkgHs8a2EB6xHMURXh-PKvZ_cDonA26sNxiMasW3wuzJ_Jd4Vh2673Es_Jt7oMrMabYZQwi2fckhMXlp_h5ZpSXBigQe
height: 3072
width: 4096
- name: places/ChIJpeVeWjWSC0cReyWDSRX37SM/photos/AZLasHr9mjMzK7sQzISoLVUvkPHfReECPnXr-LH5RCiHglKhELNOMWEoFg5xhcHHWcy6cli9dhPBbcD5We6lN1AUxF2fyqSEm_lVWn8BAU4SzqJETWXdUG2_O-Z8VHCJ0cVI-BEwdr3TgunX094ZnI9I76CbamOAarqbFm7bu1uAKWT6t0OgObGX8PPsWjv_DmRfZgqx83A_nfP-0JdLnY5U7K38Ma6jHbK5GyVPCmjsLx-0IKZjXvqc8L6iBwlFDubLpdGOLlszcU5LsYb7YxfFy3ktsQVUjfCNAssYcK0OQ8bpFd199OvL4GAxQ1AqOdfpDo-fJc-_b_Wni8StmAlRZLqZ6E_aFgAgM4rx5LQu3HYiEEPe9hYbmlzXXsE0hqiQNwyQBLmJ8KuxwgFqfJFXfF1y9iac511YM_W23qCZaY2zxA
height: 3024
width: 4032
- name: places/ChIJpeVeWjWSC0cReyWDSRX37SM/photos/AZLasHp9h9HvgzBCzaA8jbksoQgbQO169zSnvCnD8URiS1QQgDMJb1S7bo7jHkkcCLFt033XYJ2Rseq4y-GrhiMMXoh3U13V-bjeBKV0HE91n4tLLjrbJAPvbSVt0W1bubmQ0vbKkltxSyr57zbNZjp3COLBAUrZRlgqAU0INFkNXLX_Rf1Ncq_tCnxDGebxcXaocF69duvZ2UflaC7ePGfnGhKvcY9cmDkWfiVFWl-fMtD43rLlLXqm1v7XBaCXKQ3HhHFoaOcYXye46ERAHlU-lQhGsq9hPaVuRXlsfYo9OWt01Tnahjgm_CvrsOp5i6DYRR74T7OUSDEp-JCBvi1flJuEzhezeT4VH5UqQY8eWOW3DJWDm2SnO4uZzTJWheztu_Kec1d8ctIcczJgW5OUUzRANxWDp7q0zjRtrwbDYd0
height: 4032
width: 3024
google_maps_url: https://maps.google.com/?cid=2588997031607608699&g_mp=Cidnb29nbGUubWFwcy5wbGFjZXMudjEuUGxhY2VzLlNlYXJjaFRleHQQAhgEIAA
llm_verification:
is_match: true
confidence: 0.9
entity_type: GRP.HER
reasoning: 'NAME MATCH: The source name ''Archiválie uložené mimo archivy v evidenci SOkA Praha-západ'' describes a collection
managed by an institution. The candidate ''State Regional Archives in Prague'' corresponds to ''Státní oblastní archiv
v Praze'' (SOA Praha), which is a regional archive for Prague. The source name specifies the ''západ'' (west) district,
which is a part of the Prague region. Therefore, the institution is a match. LOCATION MATCH: The address is in Prague,
Czechia, matching the source country (CZ). TYPE MATCH: The Google Place type ''library'' is an acceptable proxy for
an archive. ENTITY TYPE: An archive is a heritage institution (GRP.HER).'
agent: glm-4.6
verified: true
ch_annotator_version: ch_annotator-v1_7_0
_provenance:
content_hash:
algorithm: sha256
value: sha256-yEo7rRSuFitnH3Z6qYiLiOhTj0sO+NtzAhTr3Fp61j0=
scope: enrichment_section
computed_at: '2025-12-28T19:58:21.316662+00:00'
prov:
wasDerivedFrom: https://maps.googleapis.com/maps/api/place/details/json?place_id=ChIJpeVeWjWSC0cReyWDSRX37SM
generatedAtTime: '2025-12-08T19:46:50.601512+00:00'
wasGeneratedBy:
'@type': prov:Activity
name: google_maps_api_fetch
used: https://maps.googleapis.com/maps/api/place
verification:
status: verified
last_verified: '2025-12-28T19:58:21.316672+00:00'
google_maps_status: SUCCESS
youtube_status: NOT_FOUND
youtube_search_query: Archiválie uložené mimo archivy v evidenci SOkA Praha-západ official
youtube_search_timestamp: '2025-12-08T19:46:55.414685+00:00'
location:
latitude: 50.0386519
longitude: 14.492900899999999
coordinate_provenance:
source_type: GOOGLE_MAPS
source_path: google_maps_enrichment.coordinates
original_timestamp: '2025-12-08T19:46:50.601512+00:00'
entity_id: ChIJpeVeWjWSC0cReyWDSRX37SM
region: Praha
region_code: '10'
country: CZ
street_address: Archivní 2257/4, Praha 4-Chodov
formatted_address: Archivní 2257/4, 149 00 Praha 4-Chodov, Czechia
normalization_timestamp: '2025-12-09T06:49:28.290311+00:00'