glam/data/custodian/CZ-10-PRA-A-SAMCP.yaml
2025-12-30 23:01:01 +01:00

304 lines
15 KiB
YAML
Raw Blame History

This file contains invisible Unicode characters

This file contains invisible Unicode characters that are indistinguishable to humans but may be processed differently by a computer. If you think that this is intentional, you can safely ignore this warning. Use the Escape button to reveal them.

This file contains Unicode characters that might be confused with other characters. If you think that this is intentional, you can safely ignore this warning. Use the Escape button to reveal them.

original_entry:
name: Správní archiv Městské části Praha 4
institution_type: ARCHIVE
source: CH-Annotator (czech_unified_ch_annotator.yaml)
identifiers:
- &id001
identifier_scheme: ARON_UUID
identifier_value: 02616f31-b430-4f20-9a25-c1cc5f776a39
identifier_url: https://portal.nacr.cz/aron/apu/02616f31-b430-4f20-9a25-c1cc5f776a39
- &id002
identifier_scheme: INSTITUTION_CODE
identifier_value: '430000010'
locations: []
processing_timestamp: '2025-12-06T23:37:43.709674+00:00'
ghcid:
ghcid_current: CZ-10-PRA-A-SAMCP
ghcid_original: XX-XX-XXX-A-SAMČP
ghcid_uuid: 6089db39-510d-5207-980f-1d2f158862fd
ghcid_uuid_sha256: 05c51c29-c9d5-8227-bd83-778e97c40ee4
ghcid_numeric: 415769506407080487
record_id: d2ecb3af-99a7-4b15-9d17-e667e832bbfb
generation_timestamp: '2025-12-06T23:37:43.709674+00:00'
location_resolution:
country_code: CZ
region_code: '10'
city_code: PRA
method: NAME_EXTRACTION
resolution_timestamp: '2025-12-07T12:33:44.360604+00:00'
region_name: Praha
city_label: Prague
reason: 'City extracted from institution name: "praha" → Prague'
ghcid_history:
- ghcid: CZ-10-PRA-A-SAMCP
ghcid_numeric: 415769506407080487
valid_from: '2025-12-08T11:21:24.305222+00:00'
reason: 'Normalized diacritics to ASCII per ABBREV-DIACRITICS rule (was: CZ-10-PRA-A-SAMČP)'
- ghcid: XX-XX-XXX-A-SAMČP
ghcid_numeric: 4076524634618873589
valid_from: '2025-12-06T23:37:43.709674+00:00'
reason: Initial GHCID from CH-Annotator (czech_unified_ch_annotator.yaml)
valid_to: '2025-12-08T11:21:24.305222+00:00'
- ghcid: CZ-XX-XXX-A-SAMČP
valid_from: '2025-12-06T23:56:12.096620+00:00'
reason: 'Country resolved via Wikidata P17: XX→CZ'
- ghcid: CZ-10-PRA-A-SAMČP
valid_from: '2025-12-07T12:33:44.360613+00:00'
reason: 'Location resolved from name: XX→10, XXX→PRA (Prague)'
custodian_name:
claim_type: custodian_name
claim_value: Správní archiv Městské části Praha 4
source_type: ch_annotator
identifiers:
- identifier_scheme: GHCID
identifier_value: CZ-10-PRA-A-SAMCP
- identifier_scheme: GHCID_UUID
identifier_value: 6089db39-510d-5207-980f-1d2f158862fd
- identifier_scheme: GHCID_UUID_SHA256
identifier_value: 05c51c29-c9d5-8227-bd83-778e97c40ee4
- identifier_scheme: GHCID_NUMERIC
identifier_value: '415769506407080487'
- identifier_scheme: RECORD_ID
identifier_value: d2ecb3af-99a7-4b15-9d17-e667e832bbfb
- *id001
- *id002
provenance:
data_source: API_SCRAPING
data_tier: TIER_1_AUTHORITATIVE
extraction_date: '2025-11-19T11:35:45.743241+00:00'
extraction_method: 'Created from CH-Annotator file: czech_unified_ch_annotator.yaml'
confidence_score: 0.85
notes:
- 'Country resolved 2025-12-06T23:56:12Z: XX→CZ via Wikidata P17'
- 'YouTube/Google Maps enrichment 2025-12-08T19:48:15Z: Maps: Prague City Archives (conf: 0.85); YouTube: not found'
- Canonical location added via normalize_custodian_files.py on 2025-12-08T23:11:19Z
- Canonical location added via normalize_custodian_files.py on 2025-12-08T23:48:05Z
- Canonical location added via normalize_custodian_files.py on 2025-12-09T06:49:28Z
schema_version: 2.0.0
enrichment_provenance:
google_maps_enrichment:
content_hash: sha256-12DORqox/OLI9TR/moXst5vxManWzhscpip7RfeMMBY=
verified_at: '2025-12-28T19:58:21.689247+00:00'
provenance_schema_version: '2.0'
standards_compliance:
- W3C PROV-O
- W3C SRI (content hashes)
generated_at: '2025-12-28T19:58:21.689284+00:00'
ch_annotator:
convention_id: ch_annotator-v1_7_0
convention_version: 1.7.0
entity_classification:
hypernym: GRP
hypernym_label: GROUP
subtype: GRP.HER.ARC
subtype_label: ARCHIVE
ontology_class: schema:ArchiveOrganization
alternative_classes:
- org:FormalOrganization
- rov:RegisteredOrganization
- glam:HeritageCustodian
extraction_provenance:
namespace: glam
path: /files/czech_unified.yaml
agent: batch-script-create-custodian-from-ch-annotator
context_convention: ch_annotator-v1_7_0
source_archived_at: '2025-11-19T11:35:45.743241+00:00'
statement_created_at: '2025-12-06T21:12:32.389491+00:00'
source_type: library_registry_api
migration_note: Migrated from agent:claude-conversation on 2025-12-30
annotation_provenance:
annotation_agent: opencode-claude-sonnet-4
annotation_date: '2025-12-06T21:12:32.389491+00:00'
annotation_method: retroactive CH-Annotator application via batch script
source_file: czech_unified.yaml
annotation_metadata:
confidence_score: 0.85
verified: false
verification_date: null
verified_by: null
entity_claims:
- claim_type: full_name
claim_value: Správní archiv Městské části Praha 4
property_uri: skos:prefLabel
provenance:
namespace: glam
path: /files/czech_unified.yaml
agent: batch-script-create-custodian-from-ch-annotator
context_convention: ch_annotator-v1_7_0
source_archived_at: '2025-11-19T11:35:45.743241+00:00'
statement_created_at: '2025-12-06T21:12:32.389491+00:00'
source_type: library_registry_api
migration_note: Migrated from agent:claude-conversation on 2025-12-30
confidence: 0.85
- claim_type: institution_type
claim_value: ARCHIVE
property_uri: rdf:type
provenance:
namespace: glam
path: /files/czech_unified.yaml
agent: batch-script-create-custodian-from-ch-annotator
context_convention: ch_annotator-v1_7_0
source_archived_at: '2025-11-19T11:35:45.743241+00:00'
statement_created_at: '2025-12-06T21:12:32.389491+00:00'
source_type: library_registry_api
migration_note: Migrated from agent:claude-conversation on 2025-12-30
confidence: 0.95
integration_note:
created_from: czech_unified_ch_annotator.yaml
creation_date: '2025-12-06T23:37:43.709674+00:00'
creation_method: create_custodian_from_ch_annotator.py
google_maps_enrichment:
place_id: ChIJs25iXjWSC0cRUrL7RFH6_yU
name: Prague City Archives
fetch_timestamp: '2025-12-08T19:48:11.254379+00:00'
api_status: OK
coordinates:
latitude: 50.039733999999996
longitude: 14.4943593
formatted_address: Archivní 1280/6, 149 00 Praha 4-Chodov, Czechia
short_address: Archivní 1280/6, Praha 4-Chodov
phone_local: 236 004 017
phone_international: +420 236 004 017
website: http://www.ahmp.cz/
google_place_types:
- point_of_interest
- establishment
business_status: OPERATIONAL
rating: 4.5
total_ratings: 94
reviews:
- author_name: Miroslav Pek
author_uri: https://www.google.com/maps/contrib/110035999753123270153/reviews
rating: 5
relative_time_description: 6 years ago
text: Ok
publish_time: '2019-04-12T12:59:49.720715Z'
- author_name: Karel Pojsl
author_uri: https://www.google.com/maps/contrib/109561705096115465097/reviews
rating: 5
relative_time_description: a year ago
text: The building dates back to 1995, it's nice and very interesting. I recommend visiting the archive.
publish_time: '2024-04-21T15:15:20.793882Z'
- author_name: Libor Šedivý
author_uri: https://www.google.com/maps/contrib/112581391891260052369/reviews
rating: 5
relative_time_description: 9 months ago
text: There are interesting things here but they didn't find what I needed.
publish_time: '2025-03-13T16:33:51.147142Z'
- author_name: Martin Martin
author_uri: https://www.google.com/maps/contrib/102671748185462032746/reviews
rating: 3
relative_time_description: 6 years ago
text: You need to communicate at least two weeks before the planned visit so that you don't lose out unnecessarily. You
won't get anything at first... In addition, you need to take into account that they will present you with 5 archival
units in one day, i.e. not 5 cartons, but only 5 folders, regardless of whether it is a bookmark with one sheet or a
package with hundreds of documents... The ambition to complete more extensive research requires much more time than
we are used to in other archives. So much luck, patience and research happiness! 🍀
publish_time: '2019-12-01T07:46:56.111948Z'
- author_name: Miroslav Havel
author_uri: https://www.google.com/maps/contrib/109030248799737237070/reviews
rating: 5
relative_time_description: 7 years ago
text: A modern archive building built in the 1990s, I was lucky enough to see the facilities. Willing and quirky workers,
the profession of archivist probably requires a certain amount of perspective, a sense of humor and self-irony. If you
come to a professional course, you can look forward not only to insightful information, but also to great comments and
glosses on current events. It's worth it. 😉
publish_time: '2018-03-17T09:34:30.117Z'
opening_hours:
open_now: false
weekday_text:
- 'Monday: 9:00AM4:00PM'
- 'Tuesday: 9:00AM4:00PM'
- 'Wednesday: 9:00AM4:00PM'
- 'Thursday: 9:00AM4:00PM'
- 'Friday: Closed'
- 'Saturday: Closed'
- 'Sunday: Closed'
photo_count: 10
photos_metadata:
- name: places/ChIJs25iXjWSC0cRUrL7RFH6_yU/photos/AZLasHrfhaRKmgDVTlg1hZ782_7QHA_vJmWr7JBaHb9v57U2FI_7k4xjKrL_iaw7wBm1clM4Efd7mKD6k_Rufmr4bUnVvsyobsRiRfHema4Gcs2aDug0I9OvMivDoTk_aZMSE9P15sN5wCNs3IMtcnQn_3ZWBdDV9N2qNR1q1jdleAGM73YloLCwwz2RBz8OGI0UnsI2K8zUDA3aq2_kve3CS9Of47-H52hjMV7sShps3elFdMHsZDJtZZ4AJ6o9LMY-rTAjN3vZsyPDqsg9KKaLbl8zoFWvG2ecqELd_-k2uVDxsHvqNfAEIWw_yDJJNA6NIbcF26OY52CQLlnp5dsV5abk9uGjTPoVWZMgSAhWf-6QXctnHm_4FQYNJ-Jrv9aqYgbj2KgdG7INrVJjQpJkkHHCq24kywZagqVWAHwxwtcbxlaQ
height: 2827
width: 3769
- name: places/ChIJs25iXjWSC0cRUrL7RFH6_yU/photos/AZLasHoi_2nP2TT3K5T63V6dlEnYfUl5Vgh5-hIqkUtBJo0UhI7X_x7UU5V52V9uRoNTo79e2ZDkzUCksy_LDWdRnSeb4QRALNfSe53Cr3k6-uPWBNPgg32owLMCRwubyyKTM60-MSucNkg7ghHRq8UKjZjRYjqMD5IFSWndVNcxLh6Is8RW6xbUooRNfh8rqNTYiyOQa7uS-PUuZ0mFvk90-GSxJidtkKPG_SLdR8SQwmVfGQQgCy9r7ZHxKAKutNWdfATz9dFGV4zurU_u5vgfRGq0p5qEQIsO8jXObG0LTYRTecVS8_hPvcFF9nI_qxgHLVw7Es1HLJ-lh7nGW89EP5agnozK4fZZVlM04jrR7sJAV7xxACpceivs5SekMWkS6BLq3yAHuaTEtj_iwTbfhCOnc0uuXv_63L2AHuBq8B57mA
height: 4000
width: 3000
- name: places/ChIJs25iXjWSC0cRUrL7RFH6_yU/photos/AZLasHpMXXvLREFY3BPeZEp8pqiIMiBFWJjfSne3AnAHfwxTA5lFYszEjwzWomTUqRxdzChd9Xzf_EWk8YafPUCppjVlRRsFGvwlOHRdypyZP3BNTh3YAbHKoY8T_QK04wwm5qHMPTAD6T3B0F4aEjdqnyHgGqiamD-FtzeLZrRK9xoLWqe7st0l0vLK-YutEQdDEBsuHLPcA51uhJjzQdGlGZ6Hu3eJx2XymlSy8IXOAYFGERn6g-_LOfdCV8X16fN3hkYnP6sCrVt5b1h-OCc_1Rt9NQYW7DkDUuj_ORAk-NdhlEaycNcYk_ycDE8Pa8LyReJsfqvpStGtIPjv6voRdtS_0ul9u-yZ-av4GhdnjNV0T-eOj_manGfdtGKkxOI1XwPec93hr7BEGNKELygVFsPFvh0FojmmCDTesQSd8_Y
height: 3024
width: 4032
- name: places/ChIJs25iXjWSC0cRUrL7RFH6_yU/photos/AZLasHrgCf16YfQXELcW2M3BUBCC9fg54w97LAowC-dRypNd_vAhQA45n8NJXv8NEut5gro6W07URoMx_JbIU3wgpsL4PVrSCRQWEcDHNSjCz_4-jFjGc4rCL0ZmuVjflRgI6MJon2BuCzGg_kInBSHHsLruXM4jlZajYd4hL88sydOdmruK9KJRfBTSICxUKkz8KZ5muhK9DgMDMwDKT1JO8Bmpo-XwEdbWT-ZPv0MECetOAvZp0AcsyE-Fq3sf5ExReW4kTSyZTDQWFizTzTSAsN4yj16IxHeWYnTqaWnd7WmStV8UaHUWqs-ChcCY32tm0cZWAsmD1LnhexEBhnVyj-5IwnpOiI9tEPBKk0BPiCB2HliDbGz0bTP6fY7Jh_Z7vxIF7ZNsiabR3oI_GoJ6EFx8D-u0wlCvKOKiao1feTA3Uo98
height: 4080
width: 3060
- name: places/ChIJs25iXjWSC0cRUrL7RFH6_yU/photos/AZLasHoIManYHyV5JbaDNSH-Px8QpUIiDPTkckstr0xRGS4f9_SdN7-U_xdZzvp74BXBvfuWpk4KgC1gunxqCS_YyHFtD8rKS2Wea0bdkxnxGurN__K1KbnreF1YUbjQDgp5cGWDU9zizSJLsFBJVZyb4prZvKR41l38ma3MDcNmUVCfXVpb7-nQXBVBpZJU8BTRF9d8zVE8V-qpcWGftS8iYUMYeC_GPfATxGia6QUSnZmwDjcf1MwRfngpwCJXgIFbUqvTcY1fPR1yLlXiTe_nveC0m2lkBbwdVA6uLV68RelIsu-91Rc5Yfuo0l84-BRUZZOhx-nMCI4hpL4Xm55EXFoANf_rwIJ-FrNdTO7_5uKyljJmy_tjv99n16U9B4kurxnZ-yXuYleUKAZGfMHesGPItAPE5tzWIfDpZP2b43s
height: 4000
width: 3000
google_maps_url: https://maps.google.com/?cid=2738182325421191762&g_mp=Cidnb29nbGUubWFwcy5wbGFjZXMudjEuUGxhY2VzLlNlYXJjaFRleHQQAhgEIAA
llm_verification:
is_match: true
confidence: 0.85
entity_type: GRP.HER
reasoning: 'The source institution ''Správní archiv Městské části Praha 4'' (Administrative Archive of the Prague 4 City
District) is a clear match for the Google Maps candidate ''Prague City Archives''. The reasoning is as follows: 1) NAME
MATCH: The Google name is a translation and a more general description of the specific Czech name. The source name indicates
it is the administrative archive for a specific district of Prague, while the Google name refers to the main city archives,
but their identities can be confirmed via the shared website domain ''ahmp.cz'', which stands for Archiv Hlavního města
Prahy (Archives of the Capital City of Prague). This confirms the candidate is the correct parent institution. 2) LOCATION
MATCH: The source name specifies ''Praha 4'' and the Google Maps address is in ''Praha 4-Chodov'', a perfect location
match. 3) TYPE MATCH: Although the Google Place types (''point_of_interest'', ''establishment'') are generic, the institution
is unambiguously an ''archiv'', which is a heritage institution type. 4) ENTITY TYPE: An administrative archive is a
definitive example of a Heritage Institution (GRP.HER).'
agent: glm-4.6
verified: true
ch_annotator_version: ch_annotator-v1_7_0
_provenance:
content_hash:
algorithm: sha256
value: sha256-12DORqox/OLI9TR/moXst5vxManWzhscpip7RfeMMBY=
scope: enrichment_section
computed_at: '2025-12-28T19:58:21.689247+00:00'
prov:
wasDerivedFrom: https://maps.googleapis.com/maps/api/place/details/json?place_id=ChIJs25iXjWSC0cRUrL7RFH6_yU
generatedAtTime: '2025-12-08T19:48:11.254379+00:00'
wasGeneratedBy:
'@type': prov:Activity
name: google_maps_api_fetch
used: https://maps.googleapis.com/maps/api/place
verification:
status: verified
last_verified: '2025-12-28T19:58:21.689267+00:00'
google_maps_status: SUCCESS
youtube_status: NOT_FOUND
youtube_search_query: Správní archiv Městské části Praha 4 official
youtube_search_timestamp: '2025-12-08T19:48:15.462090+00:00'
location:
latitude: 50.039733999999996
longitude: 14.4943593
coordinate_provenance:
source_type: GOOGLE_MAPS
source_path: google_maps_enrichment.coordinates
original_timestamp: '2025-12-08T19:48:11.254379+00:00'
entity_id: ChIJs25iXjWSC0cRUrL7RFH6_yU
region: Praha
region_code: '10'
country: CZ
street_address: Archivní 1280/6, Praha 4-Chodov
formatted_address: Archivní 1280/6, 149 00 Praha 4-Chodov, Czechia
normalization_timestamp: '2025-12-09T06:49:28.915410+00:00'
logo_enrichment:
enrichment_timestamp: '2025-12-23T20:58:23.615923+00:00'
source_url: http://www.ahmp.cz
extraction_method: crawl4ai
claims:
- claim_type: favicon_url
claim_value: http://www.ahmp.cz/img/ahmp_favicon.ico
source_url: http://www.ahmp.cz
css_selector: '[document] > html > head > link'
retrieved_on: '2025-12-23T20:58:23.615923+00:00'
extraction_method: crawl4ai_link_rel
favicon_type: ''
favicon_sizes: ''
summary:
total_claims: 1
has_primary_logo: false
has_favicon: true
has_og_image: false
favicon_count: 1