glam/data/custodian.backup.20251230/AT-2-GUR-A-DGADG-diozese_gurk_archiv_der_diozese_gurk.yaml
2025-12-30 23:07:03 +01:00

197 lines
7.6 KiB
YAML

original_entry:
name: Diözese Gurk | Archiv der Diözese Gurk
institution_type: ARCHIVE
source: CH-Annotator (austria_complete_ch_annotator.yaml)
identifiers:
- &id001
identifier_scheme: ISIL
identifier_value: AT-ARCHDZSGURK
identifier_url: https://permalink.obvsg.at/ais/AT-ARCHDZSGURK
locations:
- country: AT
processing_timestamp: '2025-12-06T23:36:14.160828+00:00'
ghcid:
ghcid_current: AT-2-GUR-A-DGADG-diozese_gurk_archiv_der_diozese_gurk
ghcid_original: AT-XX-XXX-A-DGADG-diozese_gurk_archiv_der_diozese_gurk
ghcid_uuid: b5d5020e-ee76-50c0-a13c-185eb4c804ed
ghcid_uuid_sha256: 66b50851-52d6-89c5-9f67-d14227d48705
ghcid_numeric: 7400830708028414405
record_id: 8b54d29e-640d-47d1-b919-b266883e6132
generation_timestamp: '2025-12-06T23:36:14.160828+00:00'
location_resolution:
country_code: AT
region_code: '2'
city_code: GUR
method: CH_ANNOTATOR_TOP_SET
city_name: Gurk
geonames_id: 2777237
feature_code: PPLA3
resolution_timestamp: '2025-12-07T00:18:33.093698+00:00'
extracted_toponym: Gurk
latitude: 46.87389
longitude: 14.29167
ghcid_history:
- ghcid: AT-XX-XXX-A-DGADG-diozese_gurk_archiv_der_diozese_gurk
ghcid_numeric: 7400830708028414405
valid_from: '2025-12-06T23:36:14.160828+00:00'
reason: Initial GHCID from CH-Annotator (austria_complete_ch_annotator.yaml)
- ghcid: AT-2-GUR-A-DGADG-diozese_gurk_archiv_der_diozese_gurk
valid_from: '2025-12-07T00:18:33.093708+00:00'
reason: 'Location resolved via CH-Annotator TOP.SET extraction: Gurk -> Gurk (GeoNames:2777237)'
custodian_name:
claim_type: custodian_name
claim_value: Diözese Gurk | Archiv der Diözese Gurk
source_type: ch_annotator
identifiers:
- identifier_scheme: GHCID
identifier_value: AT-XX-XXX-A-DGADG-diozese_gurk_archiv_der_diozese_gurk
- identifier_scheme: GHCID_UUID
identifier_value: b5d5020e-ee76-50c0-a13c-185eb4c804ed
- identifier_scheme: GHCID_UUID_SHA256
identifier_value: 66b50851-52d6-89c5-9f67-d14227d48705
- identifier_scheme: GHCID_NUMERIC
identifier_value: '7400830708028414405'
- identifier_scheme: RECORD_ID
identifier_value: 8b54d29e-640d-47d1-b919-b266883e6132
- *id001
provenance:
data_source: CSV_REGISTRY
data_tier: TIER_1_AUTHORITATIVE
extraction_date: '2025-11-18T12:43:45.600495+00:00'
extraction_method: 'Created from CH-Annotator file: austria_complete_ch_annotator.yaml'
confidence_score: 0.95
notes:
- 'Location resolved 2025-12-07T00:18:33Z: CH-Annotator TOP.SET extraction ''Gurk'' -> Gurk (GeoNames:2777237, Region:2)'
- 'YouTube/Google Maps enrichment 2025-12-08T18:42:17Z: Maps: rejected by LLM; YouTube: not found'
- Canonical location added via normalize_custodian_files.py on 2025-12-08T23:10:40Z
- Canonical location added via normalize_custodian_files.py on 2025-12-08T23:46:32Z
- Canonical location added via normalize_custodian_files.py on 2025-12-09T06:47:55Z
schema_version: 2.0.0
enrichment_provenance:
wikidata_enrichment:
content_hash: sha256-0PBmATyXd9rkEnXPYx6UfGvarP6+tlokqHUdrfffKQg=
verified_at: '2025-12-28T19:57:15.159473+00:00'
wasDerivedFrom: https://www.wikidata.org/wiki/Q254887
provenance_schema_version: '2.0'
standards_compliance:
- W3C PROV-O
- W3C SRI (content hashes)
generated_at: '2025-12-28T19:57:15.159489+00:00'
ch_annotator:
convention_id: ch_annotator-v1_7_0
convention_version: 1.7.0
entity_classification:
hypernym: GRP
hypernym_label: GROUP
subtype: GRP.HER.ARC
subtype_label: ARCHIVE
ontology_class: schema:ArchiveOrganization
alternative_classes:
- org:FormalOrganization
- rov:RegisteredOrganization
- glam:HeritageCustodian
extraction_provenance:
namespace: glam
path: /files/austria_complete.yaml
timestamp: '2025-11-18T12:43:45.600495+00:00'
agent: claude-conversation
context_convention: ch_annotator-v1_7_0
annotation_provenance:
annotation_agent: opencode-claude-sonnet-4
annotation_date: '2025-12-06T21:12:07.943197+00:00'
annotation_method: retroactive CH-Annotator application via batch script
source_file: austria_complete.yaml
annotation_metadata:
confidence_score: 0.95
verified: false
verification_date:
verified_by:
entity_claims:
- claim_type: full_name
claim_value: Diözese Gurk | Archiv der Diözese Gurk
property_uri: skos:prefLabel
provenance:
namespace: glam
path: /files/austria_complete.yaml
timestamp: '2025-11-18T12:43:45.600495+00:00'
agent: claude-conversation
context_convention: ch_annotator-v1_7_0
confidence: 0.95
- claim_type: institution_type
claim_value: ARCHIVE
property_uri: rdf:type
provenance:
namespace: glam
path: /files/austria_complete.yaml
timestamp: '2025-11-18T12:43:45.600495+00:00'
agent: claude-conversation
context_convention: ch_annotator-v1_7_0
confidence: 0.95
- claim_type: location_settlement
claim_value: Gurk
property_uri: schema:location
hypernym_code: TOP.SET
hypernym_label: SETTLEMENT
provenance:
namespace: geonames
path: /geonames/2777237
timestamp: '2025-12-07T00:18:33.093712+00:00'
agent: extract_locations_ch_annotator.py
context_convention: ch_annotator-v1_7_0
confidence: 0.85
extraction_source:
field: institution_name
extracted_text: Gurk
method: pattern_matching
integration_note:
created_from: austria_complete_ch_annotator.yaml
creation_date: '2025-12-06T23:36:14.160828+00:00'
creation_method: create_custodian_from_ch_annotator.py
wikidata_enrichment:
wikidata_id: Q254887
wikidata_url: https://www.wikidata.org/wiki/Q254887
label: Diözese Gurk
description: römisch-katholische Diözese in Österreich
enrichment_timestamp: '2025-12-23T00:00:00Z'
enrichment_method: manual_wikidata_lookup
notes: Wikidata entry is for parent diocese (Diözese Gurk), not specifically for the diocesan archive (Archiv der Diözese Gurk)
_provenance:
content_hash:
algorithm: sha256
value: sha256-0PBmATyXd9rkEnXPYx6UfGvarP6+tlokqHUdrfffKQg=
scope: enrichment_section
computed_at: '2025-12-28T19:57:15.159473+00:00'
prov:
wasGeneratedBy:
'@type': prov:Activity
name: wikidata_api_fetch
used: https://www.wikidata.org/w/rest.php/wikibase/v1
wasDerivedFrom: https://www.wikidata.org/wiki/Q254887
generatedAtTime: '2025-12-23T00:00:00Z'
verification:
status: verified
last_verified: '2025-12-28T19:57:15.159480+00:00'
wikidata_entity_id: Q254887
google_maps_status: NO_MATCH
google_maps_rejected:
candidate_name: Kirchenarchive
rejection_reason: The candidate is not a match for the source institution. The source is located in 'Gurk', while the candidate is in 'Klagenfurt am Wörthersee'. Although the name 'Kirchenarchive' (Church Archives) is semantically similar to 'Archiv der Diözese Gurk' (Archive of the Diocese of Gurk) and points to the correct institution type (an archive), the mismatch in location makes it a different entity.
timestamp: '2025-12-08T18:42:17.479257+00:00'
youtube_status: NOT_FOUND
youtube_search_query: Diözese Gurk | Archiv der Diözese Gurk official
youtube_search_timestamp: '2025-12-08T18:42:17.847423+00:00'
location:
latitude: 46.87389
longitude: 14.29167
coordinate_provenance:
source_type: GHCID_RESOLUTION_DIRECT
source_path: ghcid.location_resolution
original_timestamp: '2025-12-07T00:18:33.093698+00:00'
entity_id: 2777237
resolution_method: CH_ANNOTATOR_TOP_SET
city: Gurk
region_code: '2'
country: AT
geonames_id: 2777237
feature_code: PPLA3
normalization_timestamp: '2025-12-09T06:47:55.801969+00:00'