glam/data/custodian/CZ-10-CES-A-ACSSD.yaml
2025-12-30 23:01:01 +01:00

398 lines
17 KiB
YAML
Raw Blame History

This file contains invisible Unicode characters

This file contains invisible Unicode characters that are indistinguishable to humans but may be processed differently by a computer. If you think that this is intentional, you can safely ignore this warning. Use the Escape button to reveal them.

This file contains Unicode characters that might be confused with other characters. If you think that this is intentional, you can safely ignore this warning. Use the Escape button to reveal them.

original_entry:
name: Archiv České strany sociálně demokratické
institution_type: ARCHIVE
source: CH-Annotator (czech_unified_ch_annotator.yaml)
identifiers:
- &id001
identifier_scheme: ARON_UUID
identifier_value: 16f1a5e4-4a04-4ae3-9a14-6a7945d62650
identifier_url: https://portal.nacr.cz/aron/apu/16f1a5e4-4a04-4ae3-9a14-6a7945d62650
- &id002
identifier_scheme: INSTITUTION_CODE
identifier_value: '521100020'
- &id003
identifier_scheme: Wikidata
identifier_value: Q101493931
identifier_url: https://www.wikidata.org/wiki/Q101493931
locations: []
processing_timestamp: '2025-12-06T23:37:43.862249+00:00'
ghcid:
ghcid_current: CZ-10-CES-A-ACSSD
ghcid_original: XX-XX-XXX-A-AČSSD
ghcid_uuid: 6e774869-8589-55d4-8219-f4906a1614c1
ghcid_uuid_sha256: d0dabba8-0494-892e-86eb-c6e2c62fc7cd
ghcid_numeric: 15049547435117701422
record_id: ad94c806-09bc-4635-af2e-805c3b77408b
generation_timestamp: '2025-12-06T23:37:43.862249+00:00'
location_resolution:
country_code: CZ
region_code: '10'
city_code: CES
method: CH_ANNOTATOR_TOP_SET
resolution_timestamp: '2025-12-07T00:19:32.601188+00:00'
region_name: CZ-10
iso_code_source: CZ-10
city_name: Ceske Budejovice
geonames_id: 3077916
feature_code: PPLA
extracted_toponym: České
latitude: 48.97447
longitude: 14.47434
ghcid_history:
- previous_ghcid_component: CB
new_ghcid_component: CES
change_date: '2025-12-20T19:57:18Z'
reason: 'Fixed 2-letter city code to proper 3-letter code per AGENTS.md. City: Ceske Budejovice'
- ghcid: CZ-10-CB-A-ACSSD
ghcid_numeric: 15049547435117701422
valid_from: '2025-12-08T11:21:23.213378+00:00'
reason: 'Normalized diacritics to ASCII per ABBREV-DIACRITICS rule (was: CZ-10-CB-A-AČSSD)'
- ghcid: XX-XX-XXX-A-AČSSD
ghcid_numeric: 7823242705250668629
valid_from: '2025-12-06T23:37:43.862249+00:00'
reason: Initial GHCID from CH-Annotator (czech_unified_ch_annotator.yaml)
valid_to: '2025-12-08T11:21:23.213378+00:00'
- ghcid: CZ-XX-XXX-A-AČSSD
valid_from: '2025-12-06T23:54:39.919772+00:00'
reason: 'Country resolved via Wikidata P17: XX→CZ'
- ghcid: CZ-10-XXX-A-AČSSD
valid_from: '2025-12-07T00:00:57.993551+00:00'
reason: 'Region resolved via Wikidata P131: XX->10 (CZ-10)'
- ghcid: CZ-10-CB-A-AČSSD
valid_from: '2025-12-07T00:19:32.601195+00:00'
reason: 'Location resolved via CH-Annotator TOP.SET extraction: České -> Ceske Budejovice (GeoNames:3077916)'
custodian_name:
claim_type: custodian_name
claim_value: Archiv České strany sociálně demokratické
source_type: ch_annotator
identifiers:
- identifier_scheme: GHCID
identifier_value: CZ-10-CES-A-ACSSD
- identifier_scheme: GHCID_UUID
identifier_value: 6e774869-8589-55d4-8219-f4906a1614c1
- identifier_scheme: GHCID_UUID_SHA256
identifier_value: d0dabba8-0494-892e-86eb-c6e2c62fc7cd
- identifier_scheme: GHCID_NUMERIC
identifier_value: '15049547435117701422'
- identifier_scheme: RECORD_ID
identifier_value: ad94c806-09bc-4635-af2e-805c3b77408b
- *id001
- *id002
- *id003
provenance:
data_source: API_SCRAPING
data_tier: TIER_1_AUTHORITATIVE
extraction_date: '2025-11-19T11:35:45.743609+00:00'
extraction_method: 'Created from CH-Annotator file: czech_unified_ch_annotator.yaml'
confidence_score: 0.85
notes:
- 'Country resolved 2025-12-06T23:54:39Z: XX→CZ via Wikidata P17'
- 'Region resolved 2025-12-07T00:00:57Z: XX->10 via Wikidata P131 (CZ-10)'
- 'Location resolved 2025-12-07T00:19:32Z: CH-Annotator TOP.SET extraction ''České'' -> Ceske Budejovice (GeoNames:3077916,
Region:31)'
- 'YouTube/Google Maps enrichment 2025-12-08T19:45:02Z: Maps: State Regional Archive Ceske Budejovice (conf: 0.85); YouTube:
not found'
- Canonical location added via normalize_custodian_files.py on 2025-12-08T23:48:03Z
- Canonical location added via normalize_custodian_files.py on 2025-12-09T06:49:27Z
schema_version: 2.0.0
enrichment_provenance:
wikidata_enrichment:
content_hash: sha256-cTtiK9TKHQTb2+NG4JfFMAwpkSwqEhwii4YlWV3QwOI=
verified_at: '2025-12-28T19:58:20.701195+00:00'
wasDerivedFrom: https://www.wikidata.org/wiki/Q101493931
google_maps_enrichment:
content_hash: sha256-VB2AGVtI2HWVJBzOs5qbJZsHWpN941oCWHxhm5+wz1E=
verified_at: '2025-12-28T19:58:20.701289+00:00'
provenance_schema_version: '2.0'
standards_compliance:
- W3C PROV-O
- W3C SRI (content hashes)
generated_at: '2025-12-28T19:58:20.701300+00:00'
ch_annotator:
convention_id: ch_annotator-v1_7_0
convention_version: 1.7.0
entity_classification:
hypernym: GRP
hypernym_label: GROUP
subtype: GRP.HER.ARC
subtype_label: ARCHIVE
ontology_class: schema:ArchiveOrganization
alternative_classes:
- org:FormalOrganization
- rov:RegisteredOrganization
- glam:HeritageCustodian
extraction_provenance:
namespace: glam
path: /files/czech_unified.yaml
agent: batch-script-create-custodian-from-ch-annotator
context_convention: ch_annotator-v1_7_0
source_archived_at: '2025-11-19T11:35:45.743609+00:00'
statement_created_at: '2025-12-06T21:12:32.389491+00:00'
source_type: library_registry_api
migration_note: Migrated from agent:claude-conversation on 2025-12-30
annotation_provenance:
annotation_agent: opencode-claude-sonnet-4
annotation_date: '2025-12-06T21:12:32.389491+00:00'
annotation_method: retroactive CH-Annotator application via batch script
source_file: czech_unified.yaml
annotation_metadata:
confidence_score: 0.85
verified: false
verification_date: null
verified_by: null
entity_claims:
- claim_type: full_name
claim_value: Archiv České strany sociálně demokratické
property_uri: skos:prefLabel
provenance:
namespace: glam
path: /files/czech_unified.yaml
agent: batch-script-create-custodian-from-ch-annotator
context_convention: ch_annotator-v1_7_0
source_archived_at: '2025-11-19T11:35:45.743609+00:00'
statement_created_at: '2025-12-06T21:12:32.389491+00:00'
source_type: library_registry_api
migration_note: Migrated from agent:claude-conversation on 2025-12-30
confidence: 0.85
- claim_type: institution_type
claim_value: ARCHIVE
property_uri: rdf:type
provenance:
namespace: glam
path: /files/czech_unified.yaml
agent: batch-script-create-custodian-from-ch-annotator
context_convention: ch_annotator-v1_7_0
source_archived_at: '2025-11-19T11:35:45.743609+00:00'
statement_created_at: '2025-12-06T21:12:32.389491+00:00'
source_type: library_registry_api
migration_note: Migrated from agent:claude-conversation on 2025-12-30
confidence: 0.95
- claim_type: wikidata_id
claim_value: Q101493931
property_uri: owl:sameAs
provenance:
namespace: wikidata
path: /entity/Q101493931
agent: batch-script-create-custodian-from-ch-annotator
context_convention: ch_annotator-v1_7_0
source_archived_at: '2025-11-19T11:35:45.743609+00:00'
statement_created_at: '2025-12-06T21:12:32.389491+00:00'
source_type: library_registry_api
migration_note: Migrated from agent:claude-conversation on 2025-12-30
confidence: 0.98
- claim_type: location_settlement
claim_value: Ceske Budejovice
property_uri: schema:location
hypernym_code: TOP.SET
hypernym_label: SETTLEMENT
provenance:
namespace: geonames
path: /geonames/3077916
timestamp: '2025-12-07T00:19:32.601198+00:00'
agent: extract_locations_ch_annotator.py
context_convention: ch_annotator-v1_7_0
confidence: 0.85
extraction_source:
field: institution_name
extracted_text: České
method: pattern_matching
integration_note:
created_from: czech_unified_ch_annotator.yaml
creation_date: '2025-12-06T23:37:43.862249+00:00'
creation_method: create_custodian_from_ch_annotator.py
wikidata_enrichment:
wikidata_entity_id: Q101493931
api_metadata:
api_endpoint: https://www.wikidata.org/w/rest.php/wikibase/v1
fetch_timestamp: '2025-12-08T23:41:04.690503+00:00'
user_agent: GLAMDataExtractor/1.1 (glam-data@example.com) Python/httpx
enrichment_version: 2.0_full
properties_found:
- P31
- P968
- P159
- P17
- P361
- P18
- P856
wikidata_labels:
cs: Archiv České strany sociálně demokratické
wikidata_descriptions:
cs: český soukromý archiv
wikidata_aliases:
cs:
- Archiv ČSSD
wikidata_classification:
instance_of: &id004
- id: Q12161242
label: private archive
description: archival collection or institution that is not accessible to the public
- id: Q53252161
label: party archive
description: subclass of political archive
wikidata_instance_of: *id004
wikidata_location:
headquarters_location:
id: Q1085
label: Prague
description: capital city of the Czech Republic
country: &id005
id: Q213
label: Czech Republic
description: country in Central Europe
wikidata_country: *id005
wikidata_organization:
part_of:
id: Q341148
label: Social Democracy
description: centre-left Czech political party
wikidata_web:
official_website: https://www.cssd.cz/aktualne/aktuality/archiv-cssd/
wikidata_official_website: https://www.cssd.cz/aktualne/aktuality/archiv-cssd/
wikidata_media:
image: Hybernská Losyovský palác 2.jpg
wikidata_image: Hybernská Losyovský palác 2.jpg
wikidata_contact:
email: mailto:archiv@socdem.cz
_provenance:
content_hash:
algorithm: sha256
value: sha256-cTtiK9TKHQTb2+NG4JfFMAwpkSwqEhwii4YlWV3QwOI=
scope: enrichment_section
computed_at: '2025-12-28T19:58:20.701195+00:00'
prov:
wasGeneratedBy:
'@type': prov:Activity
name: wikidata_api_fetch
used: https://www.wikidata.org/w/rest.php/wikibase/v1
wasDerivedFrom: https://www.wikidata.org/wiki/Q101493931
verification:
status: verified
last_verified: '2025-12-28T19:58:20.701201+00:00'
google_maps_enrichment:
place_id: ChIJa7L6-clPc0cR-V_8UYGa4KE
name: State Regional Archive Ceske Budejovice
fetch_timestamp: '2025-12-08T19:44:57.371405+00:00'
api_status: OK
coordinates:
latitude: 48.9764677
longitude: 14.4845555
formatted_address: 40, Rudolfovská tř. 70, 370 01 České Budějovice-České Budějovice 1, Czechia
short_address: Rudolfovská tř. 70, České Budějovice 1
phone_local: 386 701 214
phone_international: +420 386 701 214
website: https://www.ceskearchivy.cz/statni-okresni-archivy/ceske-budejovice/soka-cb-uvod
google_place_types:
- point_of_interest
- establishment
business_status: OPERATIONAL
rating: 4.9
total_ratings: 15
reviews:
- author_name: Hana Dvořáková
author_uri: https://www.google.com/maps/contrib/106223614438373881734/reviews
rating: 5
relative_time_description: 9 months ago
text: Hello, we attended Eleonore's lecture yesterday and it was great. Beautiful. I have never experienced such a beautiful
lecture.
publish_time: '2025-02-26T09:05:14.246458Z'
- author_name: Jakub Bouček (Opravdové příběhy)
author_uri: https://www.google.com/maps/contrib/109262906392895391758/reviews
rating: 5
relative_time_description: 7 years ago
text: |-
State archives are one of the places where you can find real information about the history of a particular region, and the České Budějovice archive is a good example of this.
So if you want to find out details about the history of the city and its surroundings, the archive is the right place.
publish_time: '2018-03-31T13:23:16.449Z'
- author_name: Hana Havlova
author_uri: https://www.google.com/maps/contrib/109085353083285723508/reviews
rating: 4
relative_time_description: 9 months ago
text: null
publish_time: '2025-03-02T13:55:04.823721Z'
- author_name: Tomáš Bína
author_uri: https://www.google.com/maps/contrib/103342603459226127712/reviews
rating: 5
relative_time_description: a year ago
text: null
publish_time: '2024-11-27T04:07:39.599965Z'
- author_name: Karel Halla
author_uri: https://www.google.com/maps/contrib/107629645487979595240/reviews
rating: 5
relative_time_description: a year ago
text: null
publish_time: '2024-11-10T19:38:06.688202Z'
opening_hours:
open_now: false
weekday_text:
- 'Monday: 8:00 AM – 4:00 PM'
- 'Tuesday: Closed'
- 'Wednesday: 8:00 AM – 4:00 PM'
- 'Thursday: Closed'
- 'Friday: Closed'
- 'Saturday: Closed'
- 'Sunday: Closed'
photo_count: 4
photos_metadata:
- name: places/ChIJa7L6-clPc0cR-V_8UYGa4KE/photos/AZLasHr-vtwhO8_7QYyCotFkZZpx2jNDBwsl3moqXbVuyunrqWO4-x2uN08JmTmMw5rGB_vLvMXA5OoS5iMxgl7D_N5ssN3IXNMZ3wa5jkHHYrQeqVrbm8OJn2C_0Qv0dau9Wx_DpVPIzqECac7ho50EtIqeJY5FcI-TqasWDuGgR2LfP9UOAoBQ5z8Af9aVTZm1NY0_frlhL-5qzu3Sncbg7OZzYBbvTGQQFCHSBlbeRhjodLExfJzRDxxBBakIcazLziO_fnMWsgLrs0wLmcfFQ914H2Uf0Z-PZlqW0CkSYrFvHYnBbWEWmLdddghLfFsWrGttD6B3ujEYjNcCZxrGentMOIpcvvaHGKVeghSar615y_fJKJIAxF9p3HQkjJcjdN5k7T4Bs849897w_7KOKXXOm4iZxDEra-GCOVvxQRSApDHL
height: 3264
width: 2448
- name: places/ChIJa7L6-clPc0cR-V_8UYGa4KE/photos/AZLasHrsdTVIuuYKx1c9f0BYd39B2ga5Efd34DScNj4npLV5cyig2V7eOykZWSE03Y3jWoF-XwryvDDX-Vk4qBx9AtwQFxBDgXOvaaUAbNnvam-EwRL6hh4h7sRwr0s4htKLESjWeqwWvLrMh_usyeCvH6RIaB3Qt5SV48iCzWd6t7mmksRdWwNt8vURYdIdLAcZQWXqny6J0MYtIXqGtRuVc3N_TS1W_Nct2qfXTd-d9Uavx1G8eGX0zWvfTtTFelSI_Jsbrp8GkhrqTQ7rLtA_7FWRjD_7SjXxK0q2TROKuskPESxwowlB7cYQN9Ypl7DFElEA_kISEdVou7HaSFbOkeBnro79Qp_xtExcb8hLq5_BJGlITWf-oVIbf5GmJi9r1hL0Y_vGaLocWgXOPrtHoUXDozuzbTLl2k_1wYQ2-AI8GQ
height: 4128
width: 3096
- name: places/ChIJa7L6-clPc0cR-V_8UYGa4KE/photos/AZLasHo1afv732mZ1uob8-ZbfTlN2v2vrjtJKDzScSVTsGcMfuH38V3URm4_S1znrlDm_AAw98opmCgsBd7m8zvIfXyIGUPp76EvMOufOrouNA3932in56YQxjwPRKYwjmXr708E-t_z172oOf3TKLhIJ0UZD2eoNFwMMK6QDUxZ7ahzuX8tYJ5H7QrMzT6lWLOMO9WcnqrnmVAuF4Kl1rWmDPAjZXWwRhA_y03EkwiVpRM-Fm7EX0XpBtTSjfvaoDBS10HRfjleNTjO0YOXAWl-Lhxn8TLv5vNyATgxRkdvZb6330jMflqqL2bWI5C8xyOSbvWoQ1-ew9ue09zkrSIQ9Yt2Rs3hzbbOqNVBS6DPGWTifmvE_LJD1xWW1IKZYlhauid2rTFUpXU5MxoQ-h-6HighbK4vN8NpJLBKWBEGCTWjHQ
height: 2448
width: 3264
- name: places/ChIJa7L6-clPc0cR-V_8UYGa4KE/photos/AZLasHqG2tLij0i5XHlfn0LaZ6eVy52cI6NyYxd8lALteov7SSQxdgJJdfSE3FRT1AetiXQ_A8zfg5r2BIPyPCvQQ1OIACa4cosh_kbRZ5S6XvNaqpYJpL-C1l5Uf5JUTLR2TiDTDGzn5tOFkMkTg9KqgG6E3MT8mAjJgDY_d093lCwyT81IXRIcV_-RK6Eatn15UA3i-verMBa-42SD5wAy2E3j1Du_4zgSYZeUtOsbSGYAf9sUn4oQPJBNdfOG91uwn0UUCjo9sDFPhq4GGHCULptEu_z7IbQwRXNUE66OQNMiz0yZYuSxQ3OADS-GaYyI8gCkuqopDFETKVt7pPL234ELolwsQlKrdEsqElSixFOdu4yCfN0tqXb0Qfu41_iY9UpAS-QO-aEN8jSUHP-PeiRpXeSVaodorG20pn5y16lpKQ
height: 4032
width: 3024
google_maps_url: https://maps.google.com/?cid=11664492915106537465&g_mp=Cidnb29nbGUubWFwcy5wbGFjZXMudjEuUGxhY2VzLlNlYXJjaFRleHQQAhgEIAA
llm_verification:
is_match: true
confidence: 0.85
entity_type: GRP.HER
reasoning: The Google Maps candidate is a very strong match. The names refer to the same institution, with 'Archiv České
strany sociálně demokratické' being a specific collection within the 'State Regional Archive Ceske Budejovice'. The
location in České Budějovice is a perfect match. The website confirms it is an archive, and while the generic Google
Place types ('point_of_interest', 'establishment') are not a specific match, the website and name context override this
to confirm it is a heritage institution (GRP.HER).
agent: glm-4.6
verified: true
ch_annotator_version: ch_annotator-v1_7_0
_provenance:
content_hash:
algorithm: sha256
value: sha256-VB2AGVtI2HWVJBzOs5qbJZsHWpN941oCWHxhm5+wz1E=
scope: enrichment_section
computed_at: '2025-12-28T19:58:20.701289+00:00'
prov:
wasDerivedFrom: https://maps.googleapis.com/maps/api/place/details/json?place_id=ChIJa7L6-clPc0cR-V_8UYGa4KE
generatedAtTime: '2025-12-08T19:44:57.371405+00:00'
wasGeneratedBy:
'@type': prov:Activity
name: google_maps_api_fetch
used: https://maps.googleapis.com/maps/api/place
verification:
status: verified
last_verified: '2025-12-28T19:58:20.701293+00:00'
google_maps_status: SUCCESS
youtube_status: NOT_FOUND
youtube_search_query: Archiv České strany sociálně demokratické official
youtube_search_timestamp: '2025-12-08T19:45:02.813274+00:00'
location:
latitude: 48.9764677
longitude: 14.4845555
coordinate_provenance:
source_type: GOOGLE_MAPS
source_path: google_maps_enrichment.coordinates
original_timestamp: '2025-12-08T19:44:57.371405+00:00'
entity_id: ChIJa7L6-clPc0cR-V_8UYGa4KE
city: Ceske Budejovice
region: CZ-10
region_code: '10'
country: CZ
street_address: Rudolfovská tř. 70, České Budějovice 1
formatted_address: 40, Rudolfovská tř. 70, 370 01 České Budějovice-České Budějovice 1, Czechia
geonames_id: 3077916
feature_code: PPLA
normalization_timestamp: '2025-12-09T06:49:27.447581+00:00'