glam/data/custodian.backup.20251230/AT-2-GUR-A-DGADG.yaml
2025-12-30 23:07:03 +01:00

315 lines
14 KiB
YAML
Raw Permalink Blame History

This file contains invisible Unicode characters

This file contains invisible Unicode characters that are indistinguishable to humans but may be processed differently by a computer. If you think that this is intentional, you can safely ignore this warning. Use the Escape button to reveal them.

This file contains Unicode characters that might be confused with other characters. If you think that this is intentional, you can safely ignore this warning. Use the Escape button to reveal them.

original_entry:
name: Diözese Gurk | Archiv der Diözese Gurk
institution_type: ARCHIVE
source: CH-Annotator (austria_complete_ch_annotator.yaml)
identifiers:
- &id001
identifier_scheme: ISIL
identifier_value: AT-ARCHDZSGURK
identifier_url: https://permalink.obvsg.at/ais/AT-ARCHDZSGURK
locations:
- country: AT
processing_timestamp: '2025-12-06T23:34:14.067262+00:00'
ghcid:
ghcid_current: AT-2-GUR-A-DGADG
ghcid_original: AT-XX-XXX-A-DGADG
ghcid_uuid: f2937282-de68-5873-8441-0988412e1fd4
ghcid_uuid_sha256: fe144588-b87e-8a6e-d065-193f004e4823
ghcid_numeric: 18308334838681061998
record_id: ca523e4b-229d-4822-979e-07d11674c3df
generation_timestamp: '2025-12-06T23:34:14.067262+00:00'
location_resolution:
country_code: AT
region_code: '2'
city_code: GUR
method: CH_ANNOTATOR_TOP_SET
city_name: Gurk
geonames_id: 2777237
feature_code: PPLA3
resolution_timestamp: '2025-12-07T00:18:32.843256+00:00'
extracted_toponym: Gurk
latitude: 46.87389
longitude: 14.29167
ghcid_history:
- ghcid: AT-XX-XXX-A-DGADG
ghcid_numeric: 18308334838681061998
valid_from: '2025-12-06T23:34:14.067262+00:00'
reason: Initial GHCID from CH-Annotator (austria_complete_ch_annotator.yaml)
- ghcid: AT-2-GUR-A-DGADG
valid_from: '2025-12-07T00:18:32.843263+00:00'
reason: 'Location resolved via CH-Annotator TOP.SET extraction: Gurk -> Gurk (GeoNames:2777237)'
custodian_name:
claim_type: custodian_name
claim_value: Diözese Gurk | Archiv der Diözese Gurk
source_type: ch_annotator
identifiers:
- identifier_scheme: GHCID
identifier_value: AT-XX-XXX-A-DGADG
- identifier_scheme: GHCID_UUID
identifier_value: f2937282-de68-5873-8441-0988412e1fd4
- identifier_scheme: GHCID_UUID_SHA256
identifier_value: fe144588-b87e-8a6e-d065-193f004e4823
- identifier_scheme: GHCID_NUMERIC
identifier_value: '18308334838681061998'
- identifier_scheme: RECORD_ID
identifier_value: ca523e4b-229d-4822-979e-07d11674c3df
- *id001
provenance:
data_source: CSV_REGISTRY
data_tier: TIER_1_AUTHORITATIVE
extraction_date: '2025-11-18T12:43:45.600495+00:00'
extraction_method: 'Created from CH-Annotator file: austria_complete_ch_annotator.yaml'
confidence_score: 0.95
notes:
- 'Location resolved 2025-12-07T00:18:32Z: CH-Annotator TOP.SET extraction ''Gurk'' -> Gurk (GeoNames:2777237, Region:2)'
- 'YouTube/Google Maps enrichment 2025-12-08T18:42:23Z: Maps: Kirchenarchive (conf: 0.85); YouTube: not found'
- Canonical location added via normalize_custodian_files.py on 2025-12-08T23:10:40Z
- Canonical location added via normalize_custodian_files.py on 2025-12-08T23:46:32Z
- Canonical location added via normalize_custodian_files.py on 2025-12-09T06:47:55Z
schema_version: 2.0.0
enrichment_provenance:
wikidata_enrichment:
content_hash: sha256-0PBmATyXd9rkEnXPYx6UfGvarP6+tlokqHUdrfffKQg=
verified_at: '2025-12-28T19:57:15.182028+00:00'
wasDerivedFrom: https://www.wikidata.org/wiki/Q254887
google_maps_enrichment:
content_hash: sha256-ouanBAhtvVxoG/QLQTRRLiVcb7BUAG3+RnexRO4C5xw=
verified_at: '2025-12-28T19:57:15.182126+00:00'
provenance_schema_version: '2.0'
standards_compliance:
- W3C PROV-O
- W3C SRI (content hashes)
generated_at: '2025-12-28T19:57:15.182139+00:00'
ch_annotator:
convention_id: ch_annotator-v1_7_0
convention_version: 1.7.0
entity_classification:
hypernym: GRP
hypernym_label: GROUP
subtype: GRP.HER.ARC
subtype_label: ARCHIVE
ontology_class: schema:ArchiveOrganization
alternative_classes:
- org:FormalOrganization
- rov:RegisteredOrganization
- glam:HeritageCustodian
extraction_provenance:
namespace: glam
path: /files/austria_complete.yaml
timestamp: '2025-11-18T12:43:45.600495+00:00'
agent: claude-conversation
context_convention: ch_annotator-v1_7_0
annotation_provenance:
annotation_agent: opencode-claude-sonnet-4
annotation_date: '2025-12-06T21:12:07.943197+00:00'
annotation_method: retroactive CH-Annotator application via batch script
source_file: austria_complete.yaml
annotation_metadata:
confidence_score: 0.95
verified: false
verification_date:
verified_by:
entity_claims:
- claim_type: full_name
claim_value: Diözese Gurk | Archiv der Diözese Gurk
property_uri: skos:prefLabel
provenance:
namespace: glam
path: /files/austria_complete.yaml
timestamp: '2025-11-18T12:43:45.600495+00:00'
agent: claude-conversation
context_convention: ch_annotator-v1_7_0
confidence: 0.95
- claim_type: institution_type
claim_value: ARCHIVE
property_uri: rdf:type
provenance:
namespace: glam
path: /files/austria_complete.yaml
timestamp: '2025-11-18T12:43:45.600495+00:00'
agent: claude-conversation
context_convention: ch_annotator-v1_7_0
confidence: 0.95
- claim_type: location_settlement
claim_value: Gurk
property_uri: schema:location
hypernym_code: TOP.SET
hypernym_label: SETTLEMENT
provenance:
namespace: geonames
path: /geonames/2777237
timestamp: '2025-12-07T00:18:32.843265+00:00'
agent: extract_locations_ch_annotator.py
context_convention: ch_annotator-v1_7_0
confidence: 0.85
extraction_source:
field: institution_name
extracted_text: Gurk
method: pattern_matching
integration_note:
created_from: austria_complete_ch_annotator.yaml
creation_date: '2025-12-06T23:34:14.067262+00:00'
creation_method: create_custodian_from_ch_annotator.py
wikidata_enrichment:
wikidata_id: Q254887
wikidata_url: https://www.wikidata.org/wiki/Q254887
label: Diözese Gurk
description: römisch-katholische Diözese in Österreich
enrichment_timestamp: '2025-12-23T00:00:00Z'
enrichment_method: manual_wikidata_lookup
notes: Wikidata entry is for parent diocese (Diözese Gurk), not specifically for the diocesan archive (Archiv der Diözese Gurk)
_provenance:
content_hash:
algorithm: sha256
value: sha256-0PBmATyXd9rkEnXPYx6UfGvarP6+tlokqHUdrfffKQg=
scope: enrichment_section
computed_at: '2025-12-28T19:57:15.182028+00:00'
prov:
wasGeneratedBy:
'@type': prov:Activity
name: wikidata_api_fetch
used: https://www.wikidata.org/w/rest.php/wikibase/v1
wasDerivedFrom: https://www.wikidata.org/wiki/Q254887
generatedAtTime: '2025-12-23T00:00:00Z'
verification:
status: verified
last_verified: '2025-12-28T19:57:15.182036+00:00'
wikidata_entity_id: Q254887
google_maps_enrichment:
place_id: ChIJa4rJN2BzcEcRKf52DVnyZO4
name: Kirchenarchive
fetch_timestamp: '2025-12-08T18:42:18.981475+00:00'
api_status: OK
coordinates:
latitude: 46.6274327
longitude: 14.3157137
formatted_address: Mariannengasse 6, 9020 Klagenfurt am Wörthersee, Austria
short_address: Mariannengasse 6, Klagenfurt am Wörthersee
phone_local: 0463 577701981
phone_international: +43 463 577701981
website: https://www.kath-kirche-kaernten.at/dioezese/organisation/C2524
google_place_types:
- point_of_interest
- establishment
business_status: OPERATIONAL
rating: 4.3
total_ratings: 4
reviews:
- author_name: Iv Ana
author_uri: https://www.google.com/maps/contrib/105976934704956809571/reviews
rating: 5
relative_time_description: a month ago
text:
publish_time: '2025-10-11T22:35:57.427499291Z'
- author_name: Peter Mikl
author_uri: https://www.google.com/maps/contrib/104001392301032951353/reviews
rating: 5
relative_time_description: 5 months ago
text:
publish_time: '2025-06-23T17:07:31.946044190Z'
- author_name: Josef Pippan
author_uri: https://www.google.com/maps/contrib/107513916937613670097/reviews
rating: 2
relative_time_description: a year ago
text:
publish_time: '2024-02-22T15:12:36.074871Z'
- author_name: Matthias
author_uri: https://www.google.com/maps/contrib/102369725921451457379/reviews
rating: 5
relative_time_description: 2 years ago
text:
publish_time: '2022-12-30T16:33:10.327674Z'
opening_hours:
open_now: false
weekday_text:
- 'Monday: 8:00AM12:00PM, 1:304:00PM'
- 'Tuesday: 8:00AM12:00PM, 1:304:00PM'
- 'Wednesday: 8:00AM12:00PM'
- 'Thursday: 8:00AM12:00PM'
- 'Friday: Closed'
- 'Saturday: Closed'
- 'Sunday: Closed'
photo_count: 4
photos_metadata:
- name: places/ChIJa4rJN2BzcEcRKf52DVnyZO4/photos/AZLasHp8dcZ7BRM_BzDYZh7prTG-WB7j2zhQRMjm38d8cSi7pRmL3IH1muQAwRAyhoL0TGwRYtI64sagdn5sl4Oo5boUDvzjV1nwCKw_A6aleqWXlx5plBGbz_-eLwg7CR9wmiSvnuGOvFgJwY7bFA-je3WRUXf1-UM_6hJocGnDSB9LFy8Z1SSqP1yDyiPyqd-V06mprS_747wkhPDfL_IJJUthwORsWDfx1eawKHcIJrFbrIjKIB5VEzsI5XZQy0cSxPuzpQER5_I5LFKouCpM5e6rG1gCIUSpS9Dgnlt5bHrwpQ
height: 1633
width: 2011
- name: places/ChIJa4rJN2BzcEcRKf52DVnyZO4/photos/AZLasHpMgiu45NUdQnYuC34A__GLRAIM0gX3RJJcb6n_eZvEXYHAGk6pwME3rVbHhyCxqd64sf80-MyGjScZx7JwtpD9ox8V0C2E4G2TcCgQ6jpj3ih7aaFevkiiRgIFRDbDinO2781bO247NyzKH5ArHcLiUkkXMXKp2V76HJqdGwBQSOVoj1pflphoNBEY0xro69h-0FOAwkb95L9pnyq_0VK8SXgkDLC-uuvQt0__OYQML29VjRruNVzRDTE9OzBU--XcA5MFIxihAyHJMLiQFcO2xOW5UIjnwUA3s2xWPhSkh6cuBS_C5_hgn96qCSJlo0EWtmiXmZDuDaPMClg9CxvtM69Fr-O1ScHXuwRfI7iaEOlgSeC2maXxBeXVCLk8YesRb18BB0dlVCtTC1cY5KnPVKKEzsuv5zqV2DciX-8jlB0kgwgevq_WjTQ-EVOa
height: 2296
width: 4080
- name: places/ChIJa4rJN2BzcEcRKf52DVnyZO4/photos/AZLasHoF5NqtakmC8K8qWk1BT5v1HvbncW4sDiU_3LDEuE9IJ5mpAHxvs0RVijMCnljAnfrhuEQa8XhcY3v0q3aSjAOfwiBOs4VI7Inh3Z7w6UQbiBcisEt4_98lRFMpAgk7Dyi4PM-9jklTxO3yw1vUZe6ZNyoPRAvz_iYhzOjzDTK1Z5lUY1hbJobHGhCKzSEOY29-djU46pQGJy7N9aLEEGgZVpYTcSy2YWi-UAOGYNB3MtMrpGJqpGqCRfHn_MRZjYcVYDlcS-h-EnG1YslmJqWLoYC2qxmvJcW2IpBKT5VtAqRAPzbEzky_Bj-7cFBt3DiTPE8qsBChtGWnVg10-x8pGkBpMa2mHbkZxHicUe8zTgQL5u8jUOyO9CHtPaYRiwSQhtCH-PSRfZvLC23upL6ZTc19K5eXRODkStc7pFdVbWhCFn6_dUso-cEKO4jW
height: 2296
width: 4080
- name: places/ChIJa4rJN2BzcEcRKf52DVnyZO4/photos/AZLasHoRXPoaV7tyFeVAgGIopp87c_z3L0J7JWQa2jIHCgooIprRdYpaDvMGbTqGGlVj1hPwT5f1HstF-vbLcbBWDzB9iasIFQl9EwPuwZgrQEntQg2AA5huUZrGcbI01CwnX1DexnNDjKUeky4ZsVxlg8kyrstbmKCCDaZ3mvCnCEBt9CX7DNa4yX0mgOf1gdW2pQOVkd0KD_4Zui1C6vN0yNhsutmqccwRSxaLOhgfjFz1k-3fg0y1ZtO6g4kFds5vavoa9fXtPjb00v83GUQd3uoRkNLxWU51sSYITSazNApowQ
height: 721
width: 1024
google_maps_url: https://maps.google.com/?cid=17178121342989827625&g_mp=Cidnb29nbGUubWFwcy5wbGFjZXMudjEuUGxhY2VzLlNlYXJjaFRleHQQAhgEIAA
llm_verification:
is_match: true
confidence: 0.85
entity_type: GRP.HER
reasoning: 'NAME MATCH: The Google name ''Kirchenarchive'' is a generic plural for ''church archives''. The source name ''Archiv der Diözese Gurk'' is a specific diocesan archive. The website for the Google candidate (kath-kirche-kaernten.at) is the official site for the Catholic Church in Carinthia. The diocesan seat for Gurk is co-located with the bishop''s seat in Klagenfurt. The specific page listed for the Google place confirms it is the Archiv der Diözese Gurk, making this a strong match despite the generic Google Maps name. LOCATION MATCH: The source city is Gurk, the seat of the diocese, but the archive''s physical address is in Klagenfurt, which is a common situation. Both are in Austria, so the country matches. The website confirms the Klagenfurt location is correct for this institution. TYPE MATCH: The name ''Archiv'' and the website confirm it is an archive, a type of heritage custodian. Although Google''s types (''point_of_interest'', ''establishment'') are generic, they are not incorrect. ENTITY TYPE: The institution is a diocesan archive, which is a type of heritage institution (GRP.HER).'
agent: glm-4.6
verified: true
ch_annotator_version: ch_annotator-v1_7_0
_provenance:
content_hash:
algorithm: sha256
value: sha256-ouanBAhtvVxoG/QLQTRRLiVcb7BUAG3+RnexRO4C5xw=
scope: enrichment_section
computed_at: '2025-12-28T19:57:15.182126+00:00'
prov:
wasDerivedFrom: https://maps.googleapis.com/maps/api/place/details/json?place_id=ChIJa4rJN2BzcEcRKf52DVnyZO4
generatedAtTime: '2025-12-08T18:42:18.981475+00:00'
wasGeneratedBy:
'@type': prov:Activity
name: google_maps_api_fetch
used: https://maps.googleapis.com/maps/api/place
verification:
status: verified
last_verified: '2025-12-28T19:57:15.182131+00:00'
google_maps_status: SUCCESS
youtube_status: NOT_FOUND
youtube_search_query: Diözese Gurk | Archiv der Diözese Gurk official
youtube_search_timestamp: '2025-12-08T18:42:23.027579+00:00'
location:
latitude: 46.6274327
longitude: 14.3157137
coordinate_provenance:
source_type: GOOGLE_MAPS
source_path: google_maps_enrichment.coordinates
original_timestamp: '2025-12-08T18:42:18.981475+00:00'
entity_id: ChIJa4rJN2BzcEcRKf52DVnyZO4
city: Gurk
region_code: '2'
country: AT
street_address: Mariannengasse 6, Klagenfurt am Wörthersee
formatted_address: Mariannengasse 6, 9020 Klagenfurt am Wörthersee, Austria
geonames_id: 2777237
feature_code: PPLA3
normalization_timestamp: '2025-12-09T06:47:55.829860+00:00'
logo_enrichment:
enrichment_timestamp: '2025-12-22T14:58:22.420419+00:00'
source_url: https://www.kath-kirche-kaernten.at/dioezese/organisation/C2524
extraction_method: crawl4ai
claims:
- claim_type: favicon_url
claim_value: https://www.kath-kirche-kaernten.at/images/icons/safari-pinned-tab.svg
source_url: https://www.kath-kirche-kaernten.at/dioezese/organisation/C2524
css_selector: '[document] > html > head > link:nth-of-type(5)'
retrieved_on: '2025-12-22T14:58:22.420419+00:00'
extraction_method: crawl4ai_link_rel
favicon_type: ''
favicon_sizes: ''
- claim_type: og_image_url
claim_value: https://www.kath-kirche-kaernten.at/images/kath-kirche-kaernten_sharing.jpg
source_url: https://www.kath-kirche-kaernten.at/dioezese/organisation/C2524
css_selector: '[document] > html > head > meta:nth-of-type(10)'
retrieved_on: '2025-12-22T14:58:22.420419+00:00'
extraction_method: crawl4ai_meta_og
summary:
total_claims: 2
has_primary_logo: false
has_favicon: true
has_og_image: true
favicon_count: 5