379 lines
16 KiB
YAML
379 lines
16 KiB
YAML
original_entry:
|
||
name: Archiv České strany sociálně demokratické
|
||
institution_type: ARCHIVE
|
||
source: CH-Annotator (czech_unified_ch_annotator.yaml)
|
||
identifiers:
|
||
- &id001
|
||
identifier_scheme: ARON_UUID
|
||
identifier_value: 16f1a5e4-4a04-4ae3-9a14-6a7945d62650
|
||
identifier_url: https://portal.nacr.cz/aron/apu/16f1a5e4-4a04-4ae3-9a14-6a7945d62650
|
||
- &id002
|
||
identifier_scheme: INSTITUTION_CODE
|
||
identifier_value: '521100020'
|
||
- &id003
|
||
identifier_scheme: Wikidata
|
||
identifier_value: Q101493931
|
||
identifier_url: https://www.wikidata.org/wiki/Q101493931
|
||
locations: []
|
||
processing_timestamp: '2025-12-06T23:37:43.862249+00:00'
|
||
ghcid:
|
||
ghcid_current: CZ-10-CES-A-ACSSD
|
||
ghcid_original: XX-XX-XXX-A-AČSSD
|
||
ghcid_uuid: 6e774869-8589-55d4-8219-f4906a1614c1
|
||
ghcid_uuid_sha256: d0dabba8-0494-892e-86eb-c6e2c62fc7cd
|
||
ghcid_numeric: 15049547435117701422
|
||
record_id: ad94c806-09bc-4635-af2e-805c3b77408b
|
||
generation_timestamp: '2025-12-06T23:37:43.862249+00:00'
|
||
location_resolution:
|
||
country_code: CZ
|
||
region_code: '10'
|
||
city_code: CES
|
||
method: CH_ANNOTATOR_TOP_SET
|
||
resolution_timestamp: '2025-12-07T00:19:32.601188+00:00'
|
||
region_name: CZ-10
|
||
iso_code_source: CZ-10
|
||
city_name: Ceske Budejovice
|
||
geonames_id: 3077916
|
||
feature_code: PPLA
|
||
extracted_toponym: České
|
||
latitude: 48.97447
|
||
longitude: 14.47434
|
||
ghcid_history:
|
||
- previous_ghcid_component: "CB"
|
||
new_ghcid_component: "CES"
|
||
change_date: "2025-12-20T19:57:18Z"
|
||
reason: "Fixed 2-letter city code to proper 3-letter code per AGENTS.md. City: Ceske Budejovice"
|
||
- ghcid: CZ-10-CB-A-ACSSD
|
||
ghcid_numeric: 15049547435117701422
|
||
valid_from: '2025-12-08T11:21:23.213378+00:00'
|
||
reason: 'Normalized diacritics to ASCII per ABBREV-DIACRITICS rule (was: CZ-10-CB-A-AČSSD)'
|
||
- ghcid: XX-XX-XXX-A-AČSSD
|
||
ghcid_numeric: 7823242705250668629
|
||
valid_from: '2025-12-06T23:37:43.862249+00:00'
|
||
reason: Initial GHCID from CH-Annotator (czech_unified_ch_annotator.yaml)
|
||
valid_to: '2025-12-08T11:21:23.213378+00:00'
|
||
- ghcid: CZ-XX-XXX-A-AČSSD
|
||
valid_from: '2025-12-06T23:54:39.919772+00:00'
|
||
reason: 'Country resolved via Wikidata P17: XX→CZ'
|
||
- ghcid: CZ-10-XXX-A-AČSSD
|
||
valid_from: '2025-12-07T00:00:57.993551+00:00'
|
||
reason: 'Region resolved via Wikidata P131: XX->10 (CZ-10)'
|
||
- ghcid: CZ-10-CB-A-AČSSD
|
||
valid_from: '2025-12-07T00:19:32.601195+00:00'
|
||
reason: 'Location resolved via CH-Annotator TOP.SET extraction: České -> Ceske Budejovice (GeoNames:3077916)'
|
||
custodian_name:
|
||
claim_type: custodian_name
|
||
claim_value: Archiv České strany sociálně demokratické
|
||
source_type: ch_annotator
|
||
identifiers:
|
||
- identifier_scheme: GHCID
|
||
identifier_value: CZ-10-CB-A-ACSSD
|
||
- identifier_scheme: GHCID_UUID
|
||
identifier_value: 6e774869-8589-55d4-8219-f4906a1614c1
|
||
- identifier_scheme: GHCID_UUID_SHA256
|
||
identifier_value: d0dabba8-0494-892e-86eb-c6e2c62fc7cd
|
||
- identifier_scheme: GHCID_NUMERIC
|
||
identifier_value: '15049547435117701422'
|
||
- identifier_scheme: RECORD_ID
|
||
identifier_value: ad94c806-09bc-4635-af2e-805c3b77408b
|
||
- *id001
|
||
- *id002
|
||
- *id003
|
||
provenance:
|
||
data_source: API_SCRAPING
|
||
data_tier: TIER_1_AUTHORITATIVE
|
||
extraction_date: '2025-11-19T11:35:45.743609+00:00'
|
||
extraction_method: 'Created from CH-Annotator file: czech_unified_ch_annotator.yaml'
|
||
confidence_score: 0.85
|
||
notes:
|
||
- 'Country resolved 2025-12-06T23:54:39Z: XX→CZ via Wikidata P17'
|
||
- 'Region resolved 2025-12-07T00:00:57Z: XX->10 via Wikidata P131 (CZ-10)'
|
||
- 'Location resolved 2025-12-07T00:19:32Z: CH-Annotator TOP.SET extraction ''České'' -> Ceske Budejovice (GeoNames:3077916, Region:31)'
|
||
- 'YouTube/Google Maps enrichment 2025-12-08T19:45:02Z: Maps: State Regional Archive Ceske Budejovice (conf: 0.85); YouTube: not found'
|
||
- Canonical location added via normalize_custodian_files.py on 2025-12-08T23:48:03Z
|
||
- Canonical location added via normalize_custodian_files.py on 2025-12-09T06:49:27Z
|
||
schema_version: 2.0.0
|
||
enrichment_provenance:
|
||
wikidata_enrichment:
|
||
content_hash: sha256-cTtiK9TKHQTb2+NG4JfFMAwpkSwqEhwii4YlWV3QwOI=
|
||
verified_at: '2025-12-28T19:58:20.701195+00:00'
|
||
wasDerivedFrom: https://www.wikidata.org/wiki/Q101493931
|
||
google_maps_enrichment:
|
||
content_hash: sha256-VB2AGVtI2HWVJBzOs5qbJZsHWpN941oCWHxhm5+wz1E=
|
||
verified_at: '2025-12-28T19:58:20.701289+00:00'
|
||
provenance_schema_version: '2.0'
|
||
standards_compliance:
|
||
- W3C PROV-O
|
||
- W3C SRI (content hashes)
|
||
generated_at: '2025-12-28T19:58:20.701300+00:00'
|
||
ch_annotator:
|
||
convention_id: ch_annotator-v1_7_0
|
||
convention_version: 1.7.0
|
||
entity_classification:
|
||
hypernym: GRP
|
||
hypernym_label: GROUP
|
||
subtype: GRP.HER.ARC
|
||
subtype_label: ARCHIVE
|
||
ontology_class: schema:ArchiveOrganization
|
||
alternative_classes:
|
||
- org:FormalOrganization
|
||
- rov:RegisteredOrganization
|
||
- glam:HeritageCustodian
|
||
extraction_provenance:
|
||
namespace: glam
|
||
path: /files/czech_unified.yaml
|
||
timestamp: '2025-11-19T11:35:45.743609+00:00'
|
||
agent: claude-conversation
|
||
context_convention: ch_annotator-v1_7_0
|
||
annotation_provenance:
|
||
annotation_agent: opencode-claude-sonnet-4
|
||
annotation_date: '2025-12-06T21:12:32.389491+00:00'
|
||
annotation_method: retroactive CH-Annotator application via batch script
|
||
source_file: czech_unified.yaml
|
||
annotation_metadata:
|
||
confidence_score: 0.85
|
||
verified: false
|
||
verification_date:
|
||
verified_by:
|
||
entity_claims:
|
||
- claim_type: full_name
|
||
claim_value: Archiv České strany sociálně demokratické
|
||
property_uri: skos:prefLabel
|
||
provenance:
|
||
namespace: glam
|
||
path: /files/czech_unified.yaml
|
||
timestamp: '2025-11-19T11:35:45.743609+00:00'
|
||
agent: claude-conversation
|
||
context_convention: ch_annotator-v1_7_0
|
||
confidence: 0.85
|
||
- claim_type: institution_type
|
||
claim_value: ARCHIVE
|
||
property_uri: rdf:type
|
||
provenance:
|
||
namespace: glam
|
||
path: /files/czech_unified.yaml
|
||
timestamp: '2025-11-19T11:35:45.743609+00:00'
|
||
agent: claude-conversation
|
||
context_convention: ch_annotator-v1_7_0
|
||
confidence: 0.95
|
||
- claim_type: wikidata_id
|
||
claim_value: Q101493931
|
||
property_uri: owl:sameAs
|
||
provenance:
|
||
namespace: wikidata
|
||
path: /entity/Q101493931
|
||
timestamp: '2025-11-19T11:35:45.743609+00:00'
|
||
agent: claude-conversation
|
||
context_convention: ch_annotator-v1_7_0
|
||
confidence: 0.98
|
||
- claim_type: location_settlement
|
||
claim_value: Ceske Budejovice
|
||
property_uri: schema:location
|
||
hypernym_code: TOP.SET
|
||
hypernym_label: SETTLEMENT
|
||
provenance:
|
||
namespace: geonames
|
||
path: /geonames/3077916
|
||
timestamp: '2025-12-07T00:19:32.601198+00:00'
|
||
agent: extract_locations_ch_annotator.py
|
||
context_convention: ch_annotator-v1_7_0
|
||
confidence: 0.85
|
||
extraction_source:
|
||
field: institution_name
|
||
extracted_text: České
|
||
method: pattern_matching
|
||
integration_note:
|
||
created_from: czech_unified_ch_annotator.yaml
|
||
creation_date: '2025-12-06T23:37:43.862249+00:00'
|
||
creation_method: create_custodian_from_ch_annotator.py
|
||
wikidata_enrichment:
|
||
wikidata_entity_id: Q101493931
|
||
api_metadata:
|
||
api_endpoint: https://www.wikidata.org/w/rest.php/wikibase/v1
|
||
fetch_timestamp: '2025-12-08T23:41:04.690503+00:00'
|
||
user_agent: GLAMDataExtractor/1.1 (glam-data@example.com) Python/httpx
|
||
enrichment_version: 2.0_full
|
||
properties_found:
|
||
- P31
|
||
- P968
|
||
- P159
|
||
- P17
|
||
- P361
|
||
- P18
|
||
- P856
|
||
wikidata_labels:
|
||
cs: Archiv České strany sociálně demokratické
|
||
wikidata_descriptions:
|
||
cs: český soukromý archiv
|
||
wikidata_aliases:
|
||
cs:
|
||
- Archiv ČSSD
|
||
wikidata_classification:
|
||
instance_of: &id004
|
||
- id: Q12161242
|
||
label: private archive
|
||
description: archival collection or institution that is not accessible to the public
|
||
- id: Q53252161
|
||
label: party archive
|
||
description: subclass of political archive
|
||
wikidata_instance_of: *id004
|
||
wikidata_location:
|
||
headquarters_location:
|
||
id: Q1085
|
||
label: Prague
|
||
description: capital city of the Czech Republic
|
||
country: &id005
|
||
id: Q213
|
||
label: Czech Republic
|
||
description: country in Central Europe
|
||
wikidata_country: *id005
|
||
wikidata_organization:
|
||
part_of:
|
||
id: Q341148
|
||
label: Social Democracy
|
||
description: centre-left Czech political party
|
||
wikidata_web:
|
||
official_website: https://www.cssd.cz/aktualne/aktuality/archiv-cssd/
|
||
wikidata_official_website: https://www.cssd.cz/aktualne/aktuality/archiv-cssd/
|
||
wikidata_media:
|
||
image: Hybernská Losyovský palác 2.jpg
|
||
wikidata_image: Hybernská Losyovský palác 2.jpg
|
||
wikidata_contact:
|
||
email: mailto:archiv@socdem.cz
|
||
_provenance:
|
||
content_hash:
|
||
algorithm: sha256
|
||
value: sha256-cTtiK9TKHQTb2+NG4JfFMAwpkSwqEhwii4YlWV3QwOI=
|
||
scope: enrichment_section
|
||
computed_at: '2025-12-28T19:58:20.701195+00:00'
|
||
prov:
|
||
wasGeneratedBy:
|
||
'@type': prov:Activity
|
||
name: wikidata_api_fetch
|
||
used: https://www.wikidata.org/w/rest.php/wikibase/v1
|
||
wasDerivedFrom: https://www.wikidata.org/wiki/Q101493931
|
||
verification:
|
||
status: verified
|
||
last_verified: '2025-12-28T19:58:20.701201+00:00'
|
||
google_maps_enrichment:
|
||
place_id: ChIJa7L6-clPc0cR-V_8UYGa4KE
|
||
name: State Regional Archive Ceske Budejovice
|
||
fetch_timestamp: '2025-12-08T19:44:57.371405+00:00'
|
||
api_status: OK
|
||
coordinates:
|
||
latitude: 48.9764677
|
||
longitude: 14.4845555
|
||
formatted_address: 40, Rudolfovská tř. 70, 370 01 České Budějovice-České Budějovice 1, Czechia
|
||
short_address: Rudolfovská tř. 70, České Budějovice 1
|
||
phone_local: 386 701 214
|
||
phone_international: +420 386 701 214
|
||
website: https://www.ceskearchivy.cz/statni-okresni-archivy/ceske-budejovice/soka-cb-uvod
|
||
google_place_types:
|
||
- point_of_interest
|
||
- establishment
|
||
business_status: OPERATIONAL
|
||
rating: 4.9
|
||
total_ratings: 15
|
||
reviews:
|
||
- author_name: Hana Dvořáková
|
||
author_uri: https://www.google.com/maps/contrib/106223614438373881734/reviews
|
||
rating: 5
|
||
relative_time_description: 9 months ago
|
||
text: Hello, we attended Eleonore's lecture yesterday and it was great. Beautiful. I have never experienced such a beautiful lecture.
|
||
publish_time: '2025-02-26T09:05:14.246458Z'
|
||
- author_name: Jakub Bouček (Opravdové příběhy)
|
||
author_uri: https://www.google.com/maps/contrib/109262906392895391758/reviews
|
||
rating: 5
|
||
relative_time_description: 7 years ago
|
||
text: 'State archives are one of the places where you can find real information about the history of a particular region, and the České Budějovice archive is a good example of this.
|
||
|
||
So if you want to find out details about the history of the city and its surroundings, the archive is the right place.'
|
||
publish_time: '2018-03-31T13:23:16.449Z'
|
||
- author_name: Hana Havlova
|
||
author_uri: https://www.google.com/maps/contrib/109085353083285723508/reviews
|
||
rating: 4
|
||
relative_time_description: 9 months ago
|
||
text:
|
||
publish_time: '2025-03-02T13:55:04.823721Z'
|
||
- author_name: Tomáš Bína
|
||
author_uri: https://www.google.com/maps/contrib/103342603459226127712/reviews
|
||
rating: 5
|
||
relative_time_description: a year ago
|
||
text:
|
||
publish_time: '2024-11-27T04:07:39.599965Z'
|
||
- author_name: Karel Halla
|
||
author_uri: https://www.google.com/maps/contrib/107629645487979595240/reviews
|
||
rating: 5
|
||
relative_time_description: a year ago
|
||
text:
|
||
publish_time: '2024-11-10T19:38:06.688202Z'
|
||
opening_hours:
|
||
open_now: false
|
||
weekday_text:
|
||
- 'Monday: 8:00 AM – 4:00 PM'
|
||
- 'Tuesday: Closed'
|
||
- 'Wednesday: 8:00 AM – 4:00 PM'
|
||
- 'Thursday: Closed'
|
||
- 'Friday: Closed'
|
||
- 'Saturday: Closed'
|
||
- 'Sunday: Closed'
|
||
photo_count: 4
|
||
photos_metadata:
|
||
- name: places/ChIJa7L6-clPc0cR-V_8UYGa4KE/photos/AZLasHr-vtwhO8_7QYyCotFkZZpx2jNDBwsl3moqXbVuyunrqWO4-x2uN08JmTmMw5rGB_vLvMXA5OoS5iMxgl7D_N5ssN3IXNMZ3wa5jkHHYrQeqVrbm8OJn2C_0Qv0dau9Wx_DpVPIzqECac7ho50EtIqeJY5FcI-TqasWDuGgR2LfP9UOAoBQ5z8Af9aVTZm1NY0_frlhL-5qzu3Sncbg7OZzYBbvTGQQFCHSBlbeRhjodLExfJzRDxxBBakIcazLziO_fnMWsgLrs0wLmcfFQ914H2Uf0Z-PZlqW0CkSYrFvHYnBbWEWmLdddghLfFsWrGttD6B3ujEYjNcCZxrGentMOIpcvvaHGKVeghSar615y_fJKJIAxF9p3HQkjJcjdN5k7T4Bs849897w_7KOKXXOm4iZxDEra-GCOVvxQRSApDHL
|
||
height: 3264
|
||
width: 2448
|
||
- name: places/ChIJa7L6-clPc0cR-V_8UYGa4KE/photos/AZLasHrsdTVIuuYKx1c9f0BYd39B2ga5Efd34DScNj4npLV5cyig2V7eOykZWSE03Y3jWoF-XwryvDDX-Vk4qBx9AtwQFxBDgXOvaaUAbNnvam-EwRL6hh4h7sRwr0s4htKLESjWeqwWvLrMh_usyeCvH6RIaB3Qt5SV48iCzWd6t7mmksRdWwNt8vURYdIdLAcZQWXqny6J0MYtIXqGtRuVc3N_TS1W_Nct2qfXTd-d9Uavx1G8eGX0zWvfTtTFelSI_Jsbrp8GkhrqTQ7rLtA_7FWRjD_7SjXxK0q2TROKuskPESxwowlB7cYQN9Ypl7DFElEA_kISEdVou7HaSFbOkeBnro79Qp_xtExcb8hLq5_BJGlITWf-oVIbf5GmJi9r1hL0Y_vGaLocWgXOPrtHoUXDozuzbTLl2k_1wYQ2-AI8GQ
|
||
height: 4128
|
||
width: 3096
|
||
- name: places/ChIJa7L6-clPc0cR-V_8UYGa4KE/photos/AZLasHo1afv732mZ1uob8-ZbfTlN2v2vrjtJKDzScSVTsGcMfuH38V3URm4_S1znrlDm_AAw98opmCgsBd7m8zvIfXyIGUPp76EvMOufOrouNA3932in56YQxjwPRKYwjmXr708E-t_z172oOf3TKLhIJ0UZD2eoNFwMMK6QDUxZ7ahzuX8tYJ5H7QrMzT6lWLOMO9WcnqrnmVAuF4Kl1rWmDPAjZXWwRhA_y03EkwiVpRM-Fm7EX0XpBtTSjfvaoDBS10HRfjleNTjO0YOXAWl-Lhxn8TLv5vNyATgxRkdvZb6330jMflqqL2bWI5C8xyOSbvWoQ1-ew9ue09zkrSIQ9Yt2Rs3hzbbOqNVBS6DPGWTifmvE_LJD1xWW1IKZYlhauid2rTFUpXU5MxoQ-h-6HighbK4vN8NpJLBKWBEGCTWjHQ
|
||
height: 2448
|
||
width: 3264
|
||
- name: places/ChIJa7L6-clPc0cR-V_8UYGa4KE/photos/AZLasHqG2tLij0i5XHlfn0LaZ6eVy52cI6NyYxd8lALteov7SSQxdgJJdfSE3FRT1AetiXQ_A8zfg5r2BIPyPCvQQ1OIACa4cosh_kbRZ5S6XvNaqpYJpL-C1l5Uf5JUTLR2TiDTDGzn5tOFkMkTg9KqgG6E3MT8mAjJgDY_d093lCwyT81IXRIcV_-RK6Eatn15UA3i-verMBa-42SD5wAy2E3j1Du_4zgSYZeUtOsbSGYAf9sUn4oQPJBNdfOG91uwn0UUCjo9sDFPhq4GGHCULptEu_z7IbQwRXNUE66OQNMiz0yZYuSxQ3OADS-GaYyI8gCkuqopDFETKVt7pPL234ELolwsQlKrdEsqElSixFOdu4yCfN0tqXb0Qfu41_iY9UpAS-QO-aEN8jSUHP-PeiRpXeSVaodorG20pn5y16lpKQ
|
||
height: 4032
|
||
width: 3024
|
||
google_maps_url: https://maps.google.com/?cid=11664492915106537465&g_mp=Cidnb29nbGUubWFwcy5wbGFjZXMudjEuUGxhY2VzLlNlYXJjaFRleHQQAhgEIAA
|
||
llm_verification:
|
||
is_match: true
|
||
confidence: 0.85
|
||
entity_type: GRP.HER
|
||
reasoning: The Google Maps candidate is a very strong match. The names refer to the same institution, with 'Archiv České strany sociálně demokratické' being a specific collection within the 'State Regional Archive Ceske Budejovice'. The location in České Budějovice is a perfect match. The website confirms it is an archive, and while the generic Google Place types ('point_of_interest', 'establishment') are not a specific match, the website and name context override this to confirm it is a heritage institution (GRP.HER).
|
||
agent: glm-4.6
|
||
verified: true
|
||
ch_annotator_version: ch_annotator-v1_7_0
|
||
_provenance:
|
||
content_hash:
|
||
algorithm: sha256
|
||
value: sha256-VB2AGVtI2HWVJBzOs5qbJZsHWpN941oCWHxhm5+wz1E=
|
||
scope: enrichment_section
|
||
computed_at: '2025-12-28T19:58:20.701289+00:00'
|
||
prov:
|
||
wasDerivedFrom: https://maps.googleapis.com/maps/api/place/details/json?place_id=ChIJa7L6-clPc0cR-V_8UYGa4KE
|
||
generatedAtTime: '2025-12-08T19:44:57.371405+00:00'
|
||
wasGeneratedBy:
|
||
'@type': prov:Activity
|
||
name: google_maps_api_fetch
|
||
used: https://maps.googleapis.com/maps/api/place
|
||
verification:
|
||
status: verified
|
||
last_verified: '2025-12-28T19:58:20.701293+00:00'
|
||
google_maps_status: SUCCESS
|
||
youtube_status: NOT_FOUND
|
||
youtube_search_query: Archiv České strany sociálně demokratické official
|
||
youtube_search_timestamp: '2025-12-08T19:45:02.813274+00:00'
|
||
location:
|
||
latitude: 48.9764677
|
||
longitude: 14.4845555
|
||
coordinate_provenance:
|
||
source_type: GOOGLE_MAPS
|
||
source_path: google_maps_enrichment.coordinates
|
||
original_timestamp: '2025-12-08T19:44:57.371405+00:00'
|
||
entity_id: ChIJa7L6-clPc0cR-V_8UYGa4KE
|
||
city: Ceske Budejovice
|
||
region: CZ-10
|
||
region_code: '10'
|
||
country: CZ
|
||
street_address: Rudolfovská tř. 70, České Budějovice 1
|
||
formatted_address: 40, Rudolfovská tř. 70, 370 01 České Budějovice-České Budějovice 1, Czechia
|
||
geonames_id: 3077916
|
||
feature_code: PPLA
|
||
normalization_timestamp: '2025-12-09T06:49:27.447581+00:00'
|