glam/data/custodian/CZ-64-TRE-O-CSOAVT.yaml
2025-12-30 23:01:01 +01:00

352 lines
12 KiB
YAML
Raw Blame History

This file contains ambiguous Unicode characters

This file contains Unicode characters that might be confused with other characters. If you think that this is intentional, you can safely ignore this warning. Use the Escape button to reveal them.

original_entry:
name: ČR Státní oblastní archiv v Třeboni
institution_type: OFFICIAL_INSTITUTION
source: CH-Annotator (czech_unified_ch_annotator.yaml)
identifiers:
- &id001
identifier_scheme: Sigla
identifier_value: JHE501
- &id002
identifier_scheme: IČO
identifier_value: '70978956'
- &id003
identifier_scheme: DIČ
identifier_value: CZ-70978956
- &id004
identifier_scheme: Website
identifier_value: https://www.ceskearchivy.cz/
identifier_url: https://www.ceskearchivy.cz/
- &id005
identifier_scheme: Wikidata
identifier_value: Q12056841
identifier_url: https://www.wikidata.org/wiki/Q12056841
- &id006
identifier_scheme: VIAF
identifier_value: '264257947'
identifier_url: https://viaf.org/viaf/264257947
locations:
- street_address: Husova 143
postal_code: 379 01
city: Třeboň
region: Jihočeský
country: CZ
latitude: 49.005466
longitude: 14.769143
processing_timestamp: '2025-12-06T23:37:17.923978+00:00'
ghcid:
ghcid_current: CZ-64-TRE-O-CSOAVT
ghcid_original: CZ-JI-TRE-O-ČSOAVT
ghcid_uuid: a74af54d-22e7-5728-88db-6d671ab7b998
ghcid_uuid_sha256: 736e3791-0b20-8148-a785-184fad09a629
ghcid_numeric: 8317646657896350024
record_id: a2eff982-c339-495b-ab54-f633b09d7f12
generation_timestamp: '2025-12-06T23:37:17.923978+00:00'
location_resolution:
country_code: CZ
region_code: 64
city_code: TRE
method: CH_ANNOTATOR_SOURCE
ghcid_history:
- ghcid: CZ-64-TRE-O-CSOAVT
valid_from: '2025-12-10T09:47:02Z'
valid_to: null
reason: Corrected region code from CZ-JI to CZ-64 (South Moravian (Jihomoravský)) per ISO 3166-2:CZ
- ghcid: CZ-JI-TRE-O-CSOAVT
valid_from: null
valid_to: '2025-12-10T09:47:02Z'
reason: Previous GHCID with incorrect region code
- ghcid: CZ-JI-TRE-O-CSOAVT
ghcid_numeric: 8317646657896350024
valid_from: '2025-12-08T11:21:25.763612+00:00'
reason: 'Normalized diacritics to ASCII per ABBREV-DIACRITICS rule (was: CZ-JI-TRE-O-ČSOAVT)'
- ghcid: CZ-JI-TRE-O-ČSOAVT
ghcid_numeric: 10960043114461633251
valid_from: '2025-12-06T23:37:17.923978+00:00'
reason: Initial GHCID from CH-Annotator (czech_unified_ch_annotator.yaml)
valid_to: '2025-12-08T11:21:25.763612+00:00'
custodian_name:
claim_type: custodian_name
claim_value: ČR Státní oblastní archiv v Třeboni
source_type: ch_annotator
identifiers:
- identifier_scheme: GHCID
identifier_value: CZ-64-TRE-O-CSOAVT
- identifier_scheme: GHCID_UUID
identifier_value: a74af54d-22e7-5728-88db-6d671ab7b998
- identifier_scheme: GHCID_UUID_SHA256
identifier_value: 736e3791-0b20-8148-a785-184fad09a629
- identifier_scheme: GHCID_NUMERIC
identifier_value: '8317646657896350024'
- identifier_scheme: RECORD_ID
identifier_value: a2eff982-c339-495b-ab54-f633b09d7f12
- *id001
- *id002
- *id003
- *id004
- *id005
- *id006
provenance:
data_source: API_SCRAPING
data_tier: TIER_1_AUTHORITATIVE
extraction_date: '2025-11-19T10:14:29.942075+00:00'
extraction_method: 'Created from CH-Annotator file: czech_unified_ch_annotator.yaml'
confidence_score: 0.95
notes: Removed incorrect wikidata_enrichment on 2025-12-08T08:18:24.222278+00:00. Re-enrichment required with proper matching.
schema_version: 2.0.0
enrichment_provenance:
wikidata_enrichment:
content_hash: sha256-tydmQk2HUVdznIullwhY8icmdu5Ai+6PS4Y+dfph0Gc=
verified_at: '2025-12-28T19:59:58.919359+00:00'
wasDerivedFrom: https://www.wikidata.org/wiki/Q12056841
provenance_schema_version: '2.0'
standards_compliance:
- W3C PROV-O
- W3C SRI (content hashes)
generated_at: '2025-12-28T19:59:58.919382+00:00'
ch_annotator:
convention_id: ch_annotator-v1_7_0
convention_version: 1.7.0
entity_classification:
hypernym: GRP
hypernym_label: GROUP
subtype: GRP.HER.OFF
subtype_label: OFFICIAL_INSTITUTION
ontology_class: schema:GovernmentOrganization
alternative_classes:
- org:FormalOrganization
- rov:RegisteredOrganization
- glam:HeritageCustodian
extraction_provenance:
namespace: glam
path: /files/czech_unified.yaml
agent: batch-script-create-custodian-from-ch-annotator
context_convention: ch_annotator-v1_7_0
source_archived_at: '2025-11-19T10:14:29.942075+00:00'
statement_created_at: '2025-12-06T21:12:32.389491+00:00'
source_type: library_registry_api
migration_note: Migrated from agent:claude-conversation on 2025-12-30
annotation_provenance:
annotation_agent: opencode-claude-sonnet-4
annotation_date: '2025-12-06T21:12:32.389491+00:00'
annotation_method: retroactive CH-Annotator application via batch script
source_file: czech_unified.yaml
annotation_metadata:
confidence_score: 0.95
verified: false
verification_date: null
verified_by: null
entity_claims:
- claim_type: full_name
claim_value: ČR Státní oblastní archiv v Třeboni
property_uri: skos:prefLabel
provenance:
namespace: glam
path: /files/czech_unified.yaml
agent: batch-script-create-custodian-from-ch-annotator
context_convention: ch_annotator-v1_7_0
source_archived_at: '2025-11-19T10:14:29.942075+00:00'
statement_created_at: '2025-12-06T21:12:32.389491+00:00'
source_type: library_registry_api
migration_note: Migrated from agent:claude-conversation on 2025-12-30
confidence: 0.95
- claim_type: institution_type
claim_value: OFFICIAL_INSTITUTION
property_uri: rdf:type
provenance:
namespace: glam
path: /files/czech_unified.yaml
agent: batch-script-create-custodian-from-ch-annotator
context_convention: ch_annotator-v1_7_0
source_archived_at: '2025-11-19T10:14:29.942075+00:00'
statement_created_at: '2025-12-06T21:12:32.389491+00:00'
source_type: library_registry_api
migration_note: Migrated from agent:claude-conversation on 2025-12-30
confidence: 0.95
- claim_type: located_in_city
claim_value: Třeboň
property_uri: schema:addressLocality
provenance:
namespace: glam
path: /files/czech_unified.yaml
agent: batch-script-create-custodian-from-ch-annotator
context_convention: ch_annotator-v1_7_0
source_archived_at: '2025-11-19T10:14:29.942075+00:00'
statement_created_at: '2025-12-06T21:12:32.389491+00:00'
source_type: library_registry_api
migration_note: Migrated from agent:claude-conversation on 2025-12-30
confidence: 0.9
- claim_type: wikidata_id
claim_value: Q12056841
property_uri: owl:sameAs
provenance:
namespace: wikidata
path: /entity/Q12056841
agent: batch-script-create-custodian-from-ch-annotator
context_convention: ch_annotator-v1_7_0
source_archived_at: '2025-11-19T10:14:29.942075+00:00'
statement_created_at: '2025-12-06T21:12:32.389491+00:00'
source_type: library_registry_api
migration_note: Migrated from agent:claude-conversation on 2025-12-30
confidence: 0.98
- claim_type: ghcid
claim_value: CZ-JHE501
property_uri: glam:ghcid
provenance:
namespace: glam
path: /files/czech_unified.yaml
agent: batch-script-create-custodian-from-ch-annotator
context_convention: ch_annotator-v1_7_0
source_archived_at: '2025-11-19T10:14:29.942075+00:00'
statement_created_at: '2025-12-06T21:12:32.389491+00:00'
source_type: library_registry_api
migration_note: Migrated from agent:claude-conversation on 2025-12-30
confidence: 1.0
integration_note:
created_from: czech_unified_ch_annotator.yaml
creation_date: '2025-12-06T23:37:17.923978+00:00'
creation_method: create_custodian_from_ch_annotator.py
wikidata_enrichment:
wikidata_entity_id: Q12056841
api_metadata:
api_endpoint: https://www.wikidata.org/w/rest.php/wikibase/v1
fetch_timestamp: '2025-12-09T08:40:13.812457+00:00'
user_agent: GLAMDataExtractor/1.1 (glam-data@example.com) Python/httpx
enrichment_version: 2.0_full
properties_found:
- P31
- P214
- P373
- P17
- P856
- P2427
- P18
- P159
- P527
- P213
- P571
- P6782
- P968
- P1329
- P2671
- P244
wikidata_labels:
cs: Státní oblastní archiv v Třeboni
en: Regional State Archives in Třeboň
sv: Třeboňs regionala statliga arkiv
wikidata_label_en: Regional State Archives in Třeboň
wikidata_descriptions:
en: archives in the Czech Republic
cs: archiv v Česku
wikidata_description_en: archives in the Czech Republic
wikidata_aliases:
cs:
- SOA Třeboň
wikidata_sitelinks:
cswiki: Státní oblastní archiv v Třeboni
wikidata_temporal:
inception: '2002-08-01'
wikidata_inception: '2002-08-01'
wikidata_classification:
instance_of: &id007
- id: Q53130134
label: state regional archive (Czechia)
description: ''
wikidata_instance_of: *id007
wikidata_location:
country: &id008
id: Q213
label: Czech Republic
description: country in Central Europe
headquarters_location:
id: Q773312
label: Třeboň
description: town in Czechia
wikidata_country: *id008
wikidata_organization:
has_parts:
- id: Q54684376
label: Státní okresní archiv Písek
description: ''
- id: Q54685096
label: Q54685096
description: ''
- id: Q54762394
label: Státní okresní archiv Prachatice
description: ''
- id: Q54763218
label: Státní okresní archiv v Českém Krumlově
description: ''
- id: Q54763949
label: State Disctrict Archives České Budějovice
description: organization in České Budějovice, Czechia
- id: Q54764489
label: State District Archives Jindřichův Hradec
description: ''
- id: Q54764947
label: State District Archives Tábor
description: ''
wikidata_web:
official_website: http://www.ceskearchivy.cz/
wikidata_official_website: http://www.ceskearchivy.cz/
wikidata_media:
commons_category: Státní oblastní archiv v Třeboni
image: Klášter augustiniánů (Třeboň) - výřez.jpg
wikidata_image: Klášter augustiniánů (Třeboň) - výřez.jpg
wikidata_contact:
email: mailto:posta@tb.ceskearchivy.cz
phone_number: +420-384-721-128
_provenance:
content_hash:
algorithm: sha256
value: sha256-tydmQk2HUVdznIullwhY8icmdu5Ai+6PS4Y+dfph0Gc=
scope: enrichment_section
computed_at: '2025-12-28T19:59:58.919359+00:00'
prov:
wasGeneratedBy:
'@type': prov:Activity
name: wikidata_api_fetch
used: https://www.wikidata.org/w/rest.php/wikibase/v1
wasDerivedFrom: https://www.wikidata.org/wiki/Q12056841
verification:
status: verified
last_verified: '2025-12-28T19:59:58.919372+00:00'
location:
latitude: 49.005466
longitude: 14.769143
coordinate_provenance:
source_type: ORIGINAL_ENTRY
source_path: original_entry.locations[0]
city: Třeboň
region: Jihočeský
region_code: 64
country: *id008
postal_code: 379 01
street_address: Husova 143
normalization_timestamp: '2025-12-09T10:52:50.073754+00:00'
logo_enrichment:
enrichment_timestamp: '2025-12-27T21:07:41.875418+00:00'
source_url: https://www.ceskearchivy.cz
extraction_method: crawl4ai
claims:
- claim_type: logo_url
claim_value: https://www.ceskearchivy.cz/images/INST_logo.png
source_url: https://www.ceskearchivy.cz
css_selector: '#mod-custom206 > p > a > img'
retrieved_on: '2025-12-27T21:07:41.875418+00:00'
extraction_method: crawl4ai_header_logo
detection_confidence: high
alt_text: ''
- claim_type: favicon_url
claim_value: https://www.ceskearchivy.cz/favicon.ico
source_url: https://www.ceskearchivy.cz
css_selector: '[document] > html > head > link:nth-of-type(3)'
retrieved_on: '2025-12-27T21:07:41.875418+00:00'
extraction_method: crawl4ai_link_rel
favicon_type: image/vnd.microsoft.icon
favicon_sizes: ''
summary:
total_claims: 2
has_primary_logo: true
has_favicon: true
has_og_image: false
favicon_count: 1