197 lines
7.6 KiB
YAML
197 lines
7.6 KiB
YAML
original_entry:
|
|
name: Diözese Gurk | Archiv der Diözese Gurk
|
|
institution_type: ARCHIVE
|
|
source: CH-Annotator (austria_complete_ch_annotator.yaml)
|
|
identifiers:
|
|
- &id001
|
|
identifier_scheme: ISIL
|
|
identifier_value: AT-ARCHDZSGURK
|
|
identifier_url: https://permalink.obvsg.at/ais/AT-ARCHDZSGURK
|
|
locations:
|
|
- country: AT
|
|
processing_timestamp: '2025-12-06T23:36:14.160828+00:00'
|
|
ghcid:
|
|
ghcid_current: AT-2-GUR-A-DGADG-diozese_gurk_archiv_der_diozese_gurk
|
|
ghcid_original: AT-XX-XXX-A-DGADG-diozese_gurk_archiv_der_diozese_gurk
|
|
ghcid_uuid: b5d5020e-ee76-50c0-a13c-185eb4c804ed
|
|
ghcid_uuid_sha256: 66b50851-52d6-89c5-9f67-d14227d48705
|
|
ghcid_numeric: 7400830708028414405
|
|
record_id: 8b54d29e-640d-47d1-b919-b266883e6132
|
|
generation_timestamp: '2025-12-06T23:36:14.160828+00:00'
|
|
location_resolution:
|
|
country_code: AT
|
|
region_code: '2'
|
|
city_code: GUR
|
|
method: CH_ANNOTATOR_TOP_SET
|
|
city_name: Gurk
|
|
geonames_id: 2777237
|
|
feature_code: PPLA3
|
|
resolution_timestamp: '2025-12-07T00:18:33.093698+00:00'
|
|
extracted_toponym: Gurk
|
|
latitude: 46.87389
|
|
longitude: 14.29167
|
|
ghcid_history:
|
|
- ghcid: AT-XX-XXX-A-DGADG-diozese_gurk_archiv_der_diozese_gurk
|
|
ghcid_numeric: 7400830708028414405
|
|
valid_from: '2025-12-06T23:36:14.160828+00:00'
|
|
reason: Initial GHCID from CH-Annotator (austria_complete_ch_annotator.yaml)
|
|
- ghcid: AT-2-GUR-A-DGADG-diozese_gurk_archiv_der_diozese_gurk
|
|
valid_from: '2025-12-07T00:18:33.093708+00:00'
|
|
reason: 'Location resolved via CH-Annotator TOP.SET extraction: Gurk -> Gurk (GeoNames:2777237)'
|
|
custodian_name:
|
|
claim_type: custodian_name
|
|
claim_value: Diözese Gurk | Archiv der Diözese Gurk
|
|
source_type: ch_annotator
|
|
identifiers:
|
|
- identifier_scheme: GHCID
|
|
identifier_value: AT-XX-XXX-A-DGADG-diozese_gurk_archiv_der_diozese_gurk
|
|
- identifier_scheme: GHCID_UUID
|
|
identifier_value: b5d5020e-ee76-50c0-a13c-185eb4c804ed
|
|
- identifier_scheme: GHCID_UUID_SHA256
|
|
identifier_value: 66b50851-52d6-89c5-9f67-d14227d48705
|
|
- identifier_scheme: GHCID_NUMERIC
|
|
identifier_value: '7400830708028414405'
|
|
- identifier_scheme: RECORD_ID
|
|
identifier_value: 8b54d29e-640d-47d1-b919-b266883e6132
|
|
- *id001
|
|
provenance:
|
|
data_source: CSV_REGISTRY
|
|
data_tier: TIER_1_AUTHORITATIVE
|
|
extraction_date: '2025-11-18T12:43:45.600495+00:00'
|
|
extraction_method: 'Created from CH-Annotator file: austria_complete_ch_annotator.yaml'
|
|
confidence_score: 0.95
|
|
notes:
|
|
- 'Location resolved 2025-12-07T00:18:33Z: CH-Annotator TOP.SET extraction ''Gurk'' -> Gurk (GeoNames:2777237, Region:2)'
|
|
- 'YouTube/Google Maps enrichment 2025-12-08T18:42:17Z: Maps: rejected by LLM; YouTube: not found'
|
|
- Canonical location added via normalize_custodian_files.py on 2025-12-08T23:10:40Z
|
|
- Canonical location added via normalize_custodian_files.py on 2025-12-08T23:46:32Z
|
|
- Canonical location added via normalize_custodian_files.py on 2025-12-09T06:47:55Z
|
|
schema_version: 2.0.0
|
|
enrichment_provenance:
|
|
wikidata_enrichment:
|
|
content_hash: sha256-0PBmATyXd9rkEnXPYx6UfGvarP6+tlokqHUdrfffKQg=
|
|
verified_at: '2025-12-28T19:57:15.159473+00:00'
|
|
wasDerivedFrom: https://www.wikidata.org/wiki/Q254887
|
|
provenance_schema_version: '2.0'
|
|
standards_compliance:
|
|
- W3C PROV-O
|
|
- W3C SRI (content hashes)
|
|
generated_at: '2025-12-28T19:57:15.159489+00:00'
|
|
ch_annotator:
|
|
convention_id: ch_annotator-v1_7_0
|
|
convention_version: 1.7.0
|
|
entity_classification:
|
|
hypernym: GRP
|
|
hypernym_label: GROUP
|
|
subtype: GRP.HER.ARC
|
|
subtype_label: ARCHIVE
|
|
ontology_class: schema:ArchiveOrganization
|
|
alternative_classes:
|
|
- org:FormalOrganization
|
|
- rov:RegisteredOrganization
|
|
- glam:HeritageCustodian
|
|
extraction_provenance:
|
|
namespace: glam
|
|
path: /files/austria_complete.yaml
|
|
timestamp: '2025-11-18T12:43:45.600495+00:00'
|
|
agent: claude-conversation
|
|
context_convention: ch_annotator-v1_7_0
|
|
annotation_provenance:
|
|
annotation_agent: opencode-claude-sonnet-4
|
|
annotation_date: '2025-12-06T21:12:07.943197+00:00'
|
|
annotation_method: retroactive CH-Annotator application via batch script
|
|
source_file: austria_complete.yaml
|
|
annotation_metadata:
|
|
confidence_score: 0.95
|
|
verified: false
|
|
verification_date:
|
|
verified_by:
|
|
entity_claims:
|
|
- claim_type: full_name
|
|
claim_value: Diözese Gurk | Archiv der Diözese Gurk
|
|
property_uri: skos:prefLabel
|
|
provenance:
|
|
namespace: glam
|
|
path: /files/austria_complete.yaml
|
|
timestamp: '2025-11-18T12:43:45.600495+00:00'
|
|
agent: claude-conversation
|
|
context_convention: ch_annotator-v1_7_0
|
|
confidence: 0.95
|
|
- claim_type: institution_type
|
|
claim_value: ARCHIVE
|
|
property_uri: rdf:type
|
|
provenance:
|
|
namespace: glam
|
|
path: /files/austria_complete.yaml
|
|
timestamp: '2025-11-18T12:43:45.600495+00:00'
|
|
agent: claude-conversation
|
|
context_convention: ch_annotator-v1_7_0
|
|
confidence: 0.95
|
|
- claim_type: location_settlement
|
|
claim_value: Gurk
|
|
property_uri: schema:location
|
|
hypernym_code: TOP.SET
|
|
hypernym_label: SETTLEMENT
|
|
provenance:
|
|
namespace: geonames
|
|
path: /geonames/2777237
|
|
timestamp: '2025-12-07T00:18:33.093712+00:00'
|
|
agent: extract_locations_ch_annotator.py
|
|
context_convention: ch_annotator-v1_7_0
|
|
confidence: 0.85
|
|
extraction_source:
|
|
field: institution_name
|
|
extracted_text: Gurk
|
|
method: pattern_matching
|
|
integration_note:
|
|
created_from: austria_complete_ch_annotator.yaml
|
|
creation_date: '2025-12-06T23:36:14.160828+00:00'
|
|
creation_method: create_custodian_from_ch_annotator.py
|
|
wikidata_enrichment:
|
|
wikidata_id: Q254887
|
|
wikidata_url: https://www.wikidata.org/wiki/Q254887
|
|
label: Diözese Gurk
|
|
description: römisch-katholische Diözese in Österreich
|
|
enrichment_timestamp: '2025-12-23T00:00:00Z'
|
|
enrichment_method: manual_wikidata_lookup
|
|
notes: Wikidata entry is for parent diocese (Diözese Gurk), not specifically for the diocesan archive (Archiv der Diözese Gurk)
|
|
_provenance:
|
|
content_hash:
|
|
algorithm: sha256
|
|
value: sha256-0PBmATyXd9rkEnXPYx6UfGvarP6+tlokqHUdrfffKQg=
|
|
scope: enrichment_section
|
|
computed_at: '2025-12-28T19:57:15.159473+00:00'
|
|
prov:
|
|
wasGeneratedBy:
|
|
'@type': prov:Activity
|
|
name: wikidata_api_fetch
|
|
used: https://www.wikidata.org/w/rest.php/wikibase/v1
|
|
wasDerivedFrom: https://www.wikidata.org/wiki/Q254887
|
|
generatedAtTime: '2025-12-23T00:00:00Z'
|
|
verification:
|
|
status: verified
|
|
last_verified: '2025-12-28T19:57:15.159480+00:00'
|
|
wikidata_entity_id: Q254887
|
|
google_maps_status: NO_MATCH
|
|
google_maps_rejected:
|
|
candidate_name: Kirchenarchive
|
|
rejection_reason: The candidate is not a match for the source institution. The source is located in 'Gurk', while the candidate is in 'Klagenfurt am Wörthersee'. Although the name 'Kirchenarchive' (Church Archives) is semantically similar to 'Archiv der Diözese Gurk' (Archive of the Diocese of Gurk) and points to the correct institution type (an archive), the mismatch in location makes it a different entity.
|
|
timestamp: '2025-12-08T18:42:17.479257+00:00'
|
|
youtube_status: NOT_FOUND
|
|
youtube_search_query: Diözese Gurk | Archiv der Diözese Gurk official
|
|
youtube_search_timestamp: '2025-12-08T18:42:17.847423+00:00'
|
|
location:
|
|
latitude: 46.87389
|
|
longitude: 14.29167
|
|
coordinate_provenance:
|
|
source_type: GHCID_RESOLUTION_DIRECT
|
|
source_path: ghcid.location_resolution
|
|
original_timestamp: '2025-12-07T00:18:33.093698+00:00'
|
|
entity_id: 2777237
|
|
resolution_method: CH_ANNOTATOR_TOP_SET
|
|
city: Gurk
|
|
region_code: '2'
|
|
country: AT
|
|
geonames_id: 2777237
|
|
feature_code: PPLA3
|
|
normalization_timestamp: '2025-12-09T06:47:55.801969+00:00'
|