From 82e58f6d401d4ffe26092d485155008416c1431b Mon Sep 17 00:00:00 2001 From: kempersc Date: Wed, 10 Dec 2025 01:04:29 +0100 Subject: [PATCH] geocode: add coordinates to 29 custodian files via Wikidata P131/P159 lookups --- data/custodian/AU-NSW-NSW-A-SRANSW.yaml | 32 +++++++---- data/custodian/BE-BRU-BRU-L-SDO.yaml | 16 ++++-- data/custodian/BO-L-LP-A-CBB.yaml | 44 ++++++++------ data/custodian/CH-GE-GEN-A-IKVRK.yaml | 57 ++++++++++++------- data/custodian/CH-GE-GEN-A-SJJR.yaml | 15 +++-- data/custodian/DK-84-CM-L-KU.yaml | 34 +++++++---- data/custodian/DO-01-LJ-A-RCASD.yaml | 22 ++++--- data/custodian/DO-19-HMP-M-CMHM.yaml | 25 +++++--- data/custodian/EE-37-TAL-A-SAT.yaml | 29 ++++++---- data/custodian/EE-79-TAR-A-R.yaml | 32 +++++++---- data/custodian/HR-21-ZAG-A-ZF.yaml | 24 +++++--- data/custodian/IR-09-MAS-L-INST.yaml | 34 +++++++---- data/custodian/IR-23-TEH-A-INST.yaml | 38 ++++++++----- data/custodian/KR-11-YEO-C-K.yaml | 43 +++++++++----- data/custodian/KR-41-GP-A-INST.yaml | 39 ++++++++----- data/custodian/MM-18-KYE-A-MRAC.yaml | 19 +++++-- data/custodian/MX-CMX-CHU-A-SCJN.yaml | 39 ++++++++----- data/custodian/MZ-MPM-B2D-A-AHM.yaml | 32 +++++++---- data/custodian/NL-00-ARN-U-NVP.yaml | 2 + .../NL-NH-AMS-U-EFM-eye_filmmuseum.yaml | 6 ++ data/custodian/NL-ZH-TH-O-NGIS.yaml | 24 +++++--- data/custodian/OM-MA-MAS-A-MHC.yaml | 19 +++++-- data/custodian/PH-00-SJ-A-SP.yaml | 22 ++++--- data/custodian/TH-10-DUS-A-NAT.yaml | 19 +++++-- data/custodian/TH-10-PBM-A-STH.yaml | 20 +++++-- data/custodian/TH-10-WAT-A-SS.yaml | 27 +++++---- data/custodian/TH-73-PHU-A-TFA.yaml | 24 +++++--- data/custodian/TR-06-ANK-A-MCT.yaml | 32 +++++++---- data/custodian/UZ-TK-AYR-A-MBU.yaml | 22 ++++--- 29 files changed, 530 insertions(+), 261 deletions(-) diff --git a/data/custodian/AU-NSW-NSW-A-SRANSW.yaml b/data/custodian/AU-NSW-NSW-A-SRANSW.yaml index d94761bb2c..b0e7cd794a 100644 --- a/data/custodian/AU-NSW-NSW-A-SRANSW.yaml +++ b/data/custodian/AU-NSW-NSW-A-SRANSW.yaml @@ -6,6 +6,9 @@ original_entry: - wikidata_id: Q28028325 name: Convict Records of Australia country: Australia + locations: + - latitude: -32.0 + longitude: 147.0 processing_timestamp: '2025-12-06T20:58:52.252406+00:00' wikidata_enrichment: wikidata_entity_id: Q7603489 @@ -49,12 +52,13 @@ wikidata_enrichment: instance_of: &id001 - id: Q166118 label: archive - description: agency or institution responsible for the preservation and communication of records selected for permanent - preservation + description: agency or institution responsible for the preservation and communication + of records selected for permanent preservation - id: Q327333 label: government agency - description: organisational part of a government responsible for specific public services, such as health, judiciary, - education, transportation, foreign affairs, etc + description: organisational part of a government responsible for specific public + services, such as health, judiciary, education, transportation, foreign affairs, + etc wikidata_instance_of: *id001 wikidata_location: country: &id002 @@ -117,20 +121,26 @@ unesco_mow_enrichment: provenance: notes: - 'Region resolved 2025-12-06T23:34:36Z: XX->NSW via Wikidata P131 (AU-NSW)' - - 'YouTube/Google Maps enrichment 2025-12-08T20:13:38Z: Maps: rejected by LLM; YouTube: not found' + - 'YouTube/Google Maps enrichment 2025-12-08T20:13:38Z: Maps: rejected by LLM; YouTube: + not found' - Canonical location added via normalize_custodian_files.py on 2025-12-08T23:46:39Z - Canonical location added via normalize_custodian_files.py on 2025-12-09T06:48:04Z google_maps_status: NO_MATCH google_maps_rejected: candidate_name: State Records Authority of NSW, O'Connell St - rejection_reason: The Google Maps candidate 'State Records Authority of NSW, O'Connell St' is a bus stop (transit_station), - not the heritage institution itself. The Google Place Types do not match the expected heritage institution types. + rejection_reason: The Google Maps candidate 'State Records Authority of NSW, O'Connell + St' is a bus stop (transit_station), not the heritage institution itself. The + Google Place Types do not match the expected heritage institution types. timestamp: '2025-12-08T20:13:38.622115+00:00' youtube_status: NOT_FOUND youtube_search_query: State Records Authority of New South Wales official youtube_search_timestamp: '2025-12-08T20:13:38.951852+00:00' location: - region: AU-NSW - region_code: NSW - country: AU - normalization_timestamp: '2025-12-09T13:20:27.315203+00:00' + latitude: -32.0 + longitude: 147.0 +geocoding: + method: WIKIDATA_LOCATION + source: Wikidata P131 (New South Wales) + wikidata_id: Q7603489 + property: P131 + timestamp: '2025-12-10T00:02:39.412187+00:00' diff --git a/data/custodian/BE-BRU-BRU-L-SDO.yaml b/data/custodian/BE-BRU-BRU-L-SDO.yaml index f5158b41d9..4926619dc1 100644 --- a/data/custodian/BE-BRU-BRU-L-SDO.yaml +++ b/data/custodian/BE-BRU-BRU-L-SDO.yaml @@ -11,6 +11,8 @@ original_entry: identifier_url: https://www.wikidata.org/wiki/Q50497977 locations: - country: BE + latitude: 50.983333333 + longitude: 3.527222222 processing_timestamp: '2025-12-06T23:36:17.377730+00:00' ghcid: ghcid_current: BE-BRU-BRU-L-SDO @@ -72,10 +74,16 @@ youtube_search_query: Studie-en Documentatiecentrum OFO official youtube_search_timestamp: '2025-12-08T22:34:27.216844+00:00' provenance: notes: - - 'YouTube/Google Maps enrichment 2025-12-08T22:34:27Z: Maps: not found; YouTube: not found' + - 'YouTube/Google Maps enrichment 2025-12-08T22:34:27Z: Maps: not found; YouTube: + not found' - Canonical location added via normalize_custodian_files.py on 2025-12-08T23:46:40Z - Canonical location added via normalize_custodian_files.py on 2025-12-09T06:48:04Z location: - region_code: BRU - country: BE - normalization_timestamp: '2025-12-09T13:20:28.862333+00:00' + latitude: 50.983333333 + longitude: 3.527222222 +geocoding: + method: WIKIDATA_LOCATION + source: Wikidata P131 (Deinze) + wikidata_id: Q50497977 + property: P131 + timestamp: '2025-12-10T00:02:42.542654+00:00' diff --git a/data/custodian/BO-L-LP-A-CBB.yaml b/data/custodian/BO-L-LP-A-CBB.yaml index 7480642220..7335dbc7c7 100644 --- a/data/custodian/BO-L-LP-A-CBB.yaml +++ b/data/custodian/BO-L-LP-A-CBB.yaml @@ -4,9 +4,13 @@ original_entry: wikidata_id: Q806180 mow_inscriptions: - wikidata_id: Q28028172 - name: 'Documentary Collection “Life and Works of Ernesto Che Guevara: from the originals manuscripts of its adolescence - and youth to the campaign Diary in Bolivia”' + name: 'Documentary Collection “Life and Works of Ernesto Che Guevara: from the + originals manuscripts of its adolescence and youth to the campaign Diary in + Bolivia”' country: Cuba + locations: + - latitude: -16.495833333 + longitude: -68.133333333 processing_timestamp: '2025-12-06T20:58:19.390024+00:00' wikidata_enrichment: wikidata_entity_id: Q806180 @@ -120,7 +124,8 @@ wikidata_enrichment: instance_of: &id001 - id: Q66344 label: central bank - description: public institution that manages a state's currency, money supply, and interest rates + description: public institution that manages a state's currency, money supply, + and interest rates wikidata_instance_of: *id001 wikidata_location: country: &id002 @@ -183,32 +188,39 @@ unesco_mow_enrichment: inscription_count: 1 inscriptions: - wikidata_id: Q28028172 - name: 'Documentary Collection “Life and Works of Ernesto Che Guevara: from the originals manuscripts of its adolescence - and youth to the campaign Diary in Bolivia”' + name: 'Documentary Collection “Life and Works of Ernesto Che Guevara: from the + originals manuscripts of its adolescence and youth to the campaign Diary in + Bolivia”' inscription_country: Cuba enrichment_timestamp: '2025-12-06T20:58:19.390024+00:00' data_source: Wikidata SPARQL (UNESCO has no MoW API) provenance: notes: - 'Region resolved 2025-12-06T23:33:53Z: XX->L via Wikidata P131 (BO-L)' - - 'City resolved 2025-12-07T00:25:48Z: XXX->LP via Wikidata Q806180 coords (-16.4958,-68.1333) -> La Paz (GeoNames:3911925)' - - 'YouTube/Google Maps enrichment 2025-12-08T20:26:24Z: Maps: rejected by LLM; YouTube: not found' + - 'City resolved 2025-12-07T00:25:48Z: XXX->LP via Wikidata Q806180 coords (-16.4958,-68.1333) + -> La Paz (GeoNames:3911925)' + - 'YouTube/Google Maps enrichment 2025-12-08T20:26:24Z: Maps: rejected by LLM; YouTube: + not found' - Canonical location added via normalize_custodian_files.py on 2025-12-08T23:46:53Z - Canonical location added via normalize_custodian_files.py on 2025-12-09T06:48:18Z google_maps_status: NO_MATCH google_maps_rejected: candidate_name: Central Bank of Bolivia - rejection_reason: The Google Maps candidate is confirmed to be the correct institution based on name and location, but it - is a central bank, not a heritage institution. The Google Place types ['finance', 'point_of_interest', 'establishment'] - confirm its function as a financial institution, not a museum, library, archive, or gallery. Therefore, it does not match - the expected GRP.HER entity type. + rejection_reason: The Google Maps candidate is confirmed to be the correct institution + based on name and location, but it is a central bank, not a heritage institution. + The Google Place types ['finance', 'point_of_interest', 'establishment'] confirm + its function as a financial institution, not a museum, library, archive, or gallery. + Therefore, it does not match the expected GRP.HER entity type. timestamp: '2025-12-08T20:26:23.713351+00:00' youtube_status: NOT_FOUND youtube_search_query: Central Bank of Bolivia official youtube_search_timestamp: '2025-12-08T20:26:24.048911+00:00' location: - region: BO-L - region_code: L - country: BO - geonames_id: 3911925 - normalization_timestamp: '2025-12-09T13:20:53.167532+00:00' + latitude: -16.495833333 + longitude: -68.133333333 +geocoding: + method: WIKIDATA_LOCATION + source: Wikidata P159 (La Paz) + wikidata_id: Q806180 + property: P159 + timestamp: '2025-12-10T00:02:39.833879+00:00' diff --git a/data/custodian/CH-GE-GEN-A-IKVRK.yaml b/data/custodian/CH-GE-GEN-A-IKVRK.yaml index 4f1f0e9c06..895ab10fe9 100644 --- a/data/custodian/CH-GE-GEN-A-IKVRK.yaml +++ b/data/custodian/CH-GE-GEN-A-IKVRK.yaml @@ -6,6 +6,9 @@ original_entry: - wikidata_id: Q28028117 name: Archives of the International Prisoners of War Agency, 1914-1923 country: Switzerland + locations: + - latitude: 46.21972 + longitude: 6.15078 processing_timestamp: '2025-12-06T20:58:49.070298+00:00' wikidata_enrichment: wikidata_entity_id: Q5987345 @@ -152,7 +155,8 @@ wikidata_enrichment: wikidata_label_fr: Comité international de la Croix-Rouge wikidata_label_es: Comité Internacional de la Cruz Roja wikidata_descriptions: - en: humanitarian institution based in Geneva, Switzerland, and a three-time Nobel Prize Laureate + en: humanitarian institution based in Geneva, Switzerland, and a three-time Nobel + Prize Laureate de: humanitäre Organisation cs: humanitární organizace pl: międzynarodowa organizacja humanitarna @@ -170,17 +174,20 @@ wikidata_enrichment: fr: institution d'aide humanitaire suisse it: associazione umanitaria privata id: lembaga kemanusiaan yang berbasis di Jenewa, Swiss - cy: Sefydliad dyngarod ar gyfer clefion,ffoaduriaid, a dioddefwyr trychunebau a'i phencadlys yng Ngenefa, Swistir, enillwyr - Gwobr Nobel tair gwaith. + cy: Sefydliad dyngarod ar gyfer clefion,ffoaduriaid, a dioddefwyr trychunebau + a'i phencadlys yng Ngenefa, Swistir, enillwyr Gwobr Nobel tair gwaith. es: institución humanitaria con sede en Ginebra, Suiza ko: 스위스의 민간 기구 - en-us: humanitarian institution based in Geneva, Switzerland, and a three-time Nobel Prize Laureate + en-us: humanitarian institution based in Geneva, Switzerland, and a three-time + Nobel Prize Laureate uk: міжнародна гуманітарна організація sq: institucion humanitar me seli në Gjenevë, Zvicër vi: tổ chức viện trợ nhân đạo có trụ sở tại Genève, Thuỵ Sĩ - ca: organització dedicada al protegir la vida i la dignitat de les víctimes de la guerra + ca: organització dedicada al protegir la vida i la dignitat de les víctimes de + la guerra as: চুইজাৰলেণ্ডৰ জেনেভাত থকা প্ৰতিষ্ঠান আৰু তিনিবাৰৰ নোবেল বঁটা বিজয়ী - wikidata_description_en: humanitarian institution based in Geneva, Switzerland, and a three-time Nobel Prize Laureate + wikidata_description_en: humanitarian institution based in Geneva, Switzerland, + and a three-time Nobel Prize Laureate wikidata_aliases: en: - ICRC @@ -367,19 +374,22 @@ wikidata_enrichment: description: Swiss army officer, bridge engineer and topographer (1787-1875) - id: Q124535 label: Gustave Moynier - description: Swiss jurist, co-founder and president of the International Committee of the Red Cross (ICRC) + description: Swiss jurist, co-founder and president of the International Committee + of the Red Cross (ICRC) - id: Q116822 label: Louis Appia - description: Swiss-German surgeon, expert in military medicine, co-founder of the International Committee of the Red - Cross (ICRC) 1818–1898 + description: Swiss-German surgeon, expert in military medicine, co-founder of + the International Committee of the Red Cross (ICRC) 1818–1898 - id: Q115827 label: Théodore Maunoir - description: Swiss surgeon and co-founder of the International Committee of the Red Cross - ICRC (1806-1869) + description: Swiss surgeon and co-founder of the International Committee of + the Red Cross - ICRC (1806-1869) parent_organization: *id005 member_of: - id: Q1365781 label: Memoriav - description: Swiss association for the preservation of the audiovisual heritage of Switzerland + description: Swiss association for the preservation of the audiovisual heritage + of Switzerland - id: Q5205559 label: DLM Forum description: European membership community of public archives @@ -418,8 +428,8 @@ wikidata_enrichment: description: human rights award (1968–) - id: Q628457 label: Balzan Prize - description: annual monetary prizes to people or organizations who have made outstanding achievements in the fields - of humanities, natural sciences, culture + description: annual monetary prizes to people or organizations who have made + outstanding achievements in the fields of humanities, natural sciences, culture - id: Q66401029 label: Honorary Member of the Order of Merit (Portugal) description: rank of the Order of Merit (Portugal) @@ -441,8 +451,8 @@ ghcid: reason: Region code resolved from XX to GE via Wikidata P131 - ghcid: CH-GE-GEN-A-IKVRK valid_from: '2025-12-08T17:18:06.909144+00:00' - reason: GHCID abbreviation regenerated from emic_name "Internationales Komitee vom Roten Kreuz" (was "International Committee - of the Red Cross", abbrev ICRC→IKVRK) + reason: GHCID abbreviation regenerated from emic_name "Internationales Komitee + vom Roten Kreuz" (was "International Committee of the Red Cross", abbrev ICRC→IKVRK) location_resolution: method: WIKIDATA_LOCATION country_code: CH @@ -476,15 +486,22 @@ unesco_mow_enrichment: data_source: Wikidata SPARQL (UNESCO has no MoW API) provenance: notes: - - 'Region code resolved 2025-12-06T22:13:05Z: XX → GE (Canton of Geneva) via Wikidata P131 chain' - - 'GHCID regenerated 2025-12-08T17:18:06.909144+00:00: abbreviation ICRC→IKVRK from emic_name' + - 'Region code resolved 2025-12-06T22:13:05Z: XX → GE (Canton of Geneva) via Wikidata + P131 chain' + - 'GHCID regenerated 2025-12-08T17:18:06.909144+00:00: abbreviation ICRC→IKVRK from + emic_name' - Canonical location added via normalize_custodian_files.py on 2025-12-08T23:47:22Z - Canonical location added via normalize_custodian_files.py on 2025-12-09T06:48:47Z - 'YouTube/Google Maps enrichment 2025-12-09T09:09:59Z: YouTube: not found' location: - region_code: GE - country: CH - normalization_timestamp: '2025-12-09T13:21:47.736323+00:00' + latitude: 46.21972 + longitude: 6.15078 youtube_status: NOT_FOUND youtube_search_query: International Committee of the Red Cross official youtube_search_timestamp: '2025-12-09T09:09:59.114725+00:00' +geocoding: + method: WIKIDATA_LOCATION + source: Wikidata P159 (Villa Moynier, Geneva) + wikidata_id: Q5987345 + property: P159 + timestamp: '2025-12-10T00:02:41.593298+00:00' diff --git a/data/custodian/CH-GE-GEN-A-SJJR.yaml b/data/custodian/CH-GE-GEN-A-SJJR.yaml index 8d997a5031..0307eedafa 100644 --- a/data/custodian/CH-GE-GEN-A-SJJR.yaml +++ b/data/custodian/CH-GE-GEN-A-SJJR.yaml @@ -6,6 +6,9 @@ original_entry: - wikidata_id: Q28028211 name: Jean-Jacques Rousseau, Geneva and Neuchâtel Collections country: Switzerland + locations: + - latitude: 46.2 + longitude: 6.15 processing_timestamp: '2025-12-06T20:58:53.455278+00:00' wikidata_enrichment: wikidata_entity_id: Q125567548 @@ -113,10 +116,14 @@ provenance: - Canonical location added via normalize_custodian_files.py on 2025-12-09T06:48:47Z - 'YouTube/Google Maps enrichment 2025-12-09T09:10:00Z: YouTube: not found' location: - region: CH-GE - region_code: GE - country: CH - normalization_timestamp: '2025-12-09T13:21:47.822610+00:00' + latitude: 46.2 + longitude: 6.15 youtube_status: NOT_FOUND youtube_search_query: Société Jean-Jacques Rousseau official youtube_search_timestamp: '2025-12-09T09:10:00.441192+00:00' +geocoding: + method: WIKIDATA_LOCATION + source: Wikidata P131 (Geneva) + wikidata_id: Q125567548 + property: P131 + timestamp: '2025-12-10T00:02:42.788264+00:00' diff --git a/data/custodian/DK-84-CM-L-KU.yaml b/data/custodian/DK-84-CM-L-KU.yaml index febf5b3c99..45c03159c5 100644 --- a/data/custodian/DK-84-CM-L-KU.yaml +++ b/data/custodian/DK-84-CM-L-KU.yaml @@ -6,6 +6,9 @@ original_entry: - wikidata_id: Q28028341 name: The Linné Collection country: Denmark + locations: + - latitude: 55.676111111 + longitude: 12.568888888 processing_timestamp: '2025-12-06T20:58:01.048410+00:00' wikidata_enrichment: wikidata_entity_id: Q621273 @@ -124,8 +127,8 @@ ghcid: reason: Region code resolved from XX to 84 via Wikidata P131 - ghcid: DK-84-CM-L-KU valid_from: '2025-12-08T17:19:52.242746+00:00' - reason: GHCID abbreviation regenerated from emic_name "Københavns Universitetsbibliotek" (was "Copenhagen University Library", - abbrev CUL→KU) + reason: GHCID abbreviation regenerated from emic_name "Københavns Universitetsbibliotek" + (was "Copenhagen University Library", abbrev CUL→KU) location_resolution: method: WIKIDATA_LOCATION country_code: DK @@ -159,21 +162,30 @@ unesco_mow_enrichment: data_source: Wikidata SPARQL (UNESCO has no MoW API) provenance: notes: - - 'Region code resolved 2025-12-06T22:15:11Z: XX → 84 (Capital Region of Denmark) via Wikidata P131 chain' - - 'GHCID regenerated 2025-12-08T17:19:52.242746+00:00: abbreviation CUL→KU from emic_name' - - 'YouTube/Google Maps enrichment 2025-12-08T20:18:47Z: Maps: rejected by LLM; YouTube: not found' + - 'Region code resolved 2025-12-06T22:15:11Z: XX → 84 (Capital Region of Denmark) + via Wikidata P131 chain' + - 'GHCID regenerated 2025-12-08T17:19:52.242746+00:00: abbreviation CUL→KU from + emic_name' + - 'YouTube/Google Maps enrichment 2025-12-08T20:18:47Z: Maps: rejected by LLM; YouTube: + not found' - Canonical location normalized on 2025-12-09T12:10:55Z google_maps_status: NO_MATCH google_maps_rejected: candidate_name: University of Copenhagen Student Centre - rejection_reason: The Google Maps candidate 'University of Copenhagen Student Centre' is a different entity from the source - 'Copenhagen University Library'. The names do not match. The Google Place types 'point_of_interest' and 'establishment' - are too generic and do not specify a library or other heritage institution. + rejection_reason: The Google Maps candidate 'University of Copenhagen Student Centre' + is a different entity from the source 'Copenhagen University Library'. The names + do not match. The Google Place types 'point_of_interest' and 'establishment' are + too generic and do not specify a library or other heritage institution. timestamp: '2025-12-08T20:18:46.858008+00:00' youtube_status: NOT_FOUND youtube_search_query: Copenhagen University Library official youtube_search_timestamp: '2025-12-08T20:18:47.200624+00:00' location: - region_code: '84' - country: DK - normalization_timestamp: '2025-12-09T13:32:14.762562+00:00' + latitude: 55.676111111 + longitude: 12.568888888 +geocoding: + method: WIKIDATA_LOCATION + source: Wikidata P159 (Copenhagen) + wikidata_id: Q621273 + property: P159 + timestamp: '2025-12-10T00:02:45.166854+00:00' diff --git a/data/custodian/DO-01-LJ-A-RCASD.yaml b/data/custodian/DO-01-LJ-A-RCASD.yaml index 88694183a4..b1fbf22cca 100644 --- a/data/custodian/DO-01-LJ-A-RCASD.yaml +++ b/data/custodian/DO-01-LJ-A-RCASD.yaml @@ -6,6 +6,9 @@ original_entry: - wikidata_id: Q28028133 name: Book for the Baptism of Slaves (1636-1670) country: Dominican Republic + locations: + - latitude: 18.4625 + longitude: -69.936111111 processing_timestamp: '2025-12-06T20:58:05.106896+00:00' wikidata_enrichment: wikidata_entity_id: Q1365531 @@ -119,7 +122,8 @@ wikidata_enrichment: instance_of: &id001 - id: Q105390172 label: Roman Catholic metropolitan archdiocese - description: archdiocese of the Roman Catholic Church that has a suffragan diocese under its jurisdiction + description: archdiocese of the Roman Catholic Church that has a suffragan diocese + under its jurisdiction wikidata_instance_of: *id001 wikidata_location: country: &id002 @@ -200,11 +204,15 @@ unesco_mow_enrichment: provenance: notes: - 'Region resolved 2025-12-06T23:32:44Z: XX->01 via Wikidata P131 (DO-01)' - - 'City resolved 2025-12-07T00:32:24Z: XXX->LJ via Wikidata Q1365531 coords (18.4625,-69.9361) -> La Julia (GeoNames:3502052)' + - 'City resolved 2025-12-07T00:32:24Z: XXX->LJ via Wikidata Q1365531 coords (18.4625,-69.9361) + -> La Julia (GeoNames:3502052)' - Canonical location normalized on 2025-12-09T12:10:55Z location: - region: DO-01 - region_code: '01' - country: DO - geonames_id: 3502052 - normalization_timestamp: '2025-12-09T13:32:14.821104+00:00' + latitude: 18.4625 + longitude: -69.936111111 +geocoding: + method: WIKIDATA_LOCATION + source: Wikidata P159 (Santo Domingo) + wikidata_id: Q1365531 + property: P159 + timestamp: '2025-12-10T00:02:39.196818+00:00' diff --git a/data/custodian/DO-19-HMP-M-CMHM.yaml b/data/custodian/DO-19-HMP-M-CMHM.yaml index 3d3500788f..2d1a5979e6 100644 --- a/data/custodian/DO-19-HMP-M-CMHM.yaml +++ b/data/custodian/DO-19-HMP-M-CMHM.yaml @@ -4,8 +4,12 @@ original_entry: wikidata_id: Q119794896 mow_inscriptions: - wikidata_id: Q28028176 - name: Documentary Heritage on the Resistance and Struggle for Human Rights in the Dominican Republic, 1930-1961 + name: Documentary Heritage on the Resistance and Struggle for Human Rights in + the Dominican Republic, 1930-1961 country: Dominican Republic + locations: + - latitude: 19.42 + longitude: -70.39 processing_timestamp: '2025-12-06T20:59:01.716015+00:00' wikidata_enrichment: wikidata_entity_id: Q119794896 @@ -42,8 +46,8 @@ wikidata_enrichment: instance_of: &id001 - id: Q33506 label: museum - description: institution that holds artifacts and other objects of scientific, artistic, cultural, historical, or other - importance + description: institution that holds artifacts and other objects of scientific, + artistic, cultural, historical, or other importance wikidata_instance_of: *id001 wikidata_location: country: &id002 @@ -94,7 +98,8 @@ unesco_mow_enrichment: inscription_count: 1 inscriptions: - wikidata_id: Q28028176 - name: Documentary Heritage on the Resistance and Struggle for Human Rights in the Dominican Republic, 1930-1961 + name: Documentary Heritage on the Resistance and Struggle for Human Rights in + the Dominican Republic, 1930-1961 inscription_country: Dominican Republic enrichment_timestamp: '2025-12-06T20:59:01.716015+00:00' data_source: Wikidata SPARQL (UNESCO has no MoW API) @@ -103,7 +108,11 @@ provenance: - 'Region resolved 2025-12-06T23:34:43Z: XX->19 via Wikidata P131 (DO-19)' - Canonical location normalized on 2025-12-09T12:10:55Z location: - region: DO-19 - region_code: '19' - country: DO - normalization_timestamp: '2025-12-09T13:32:14.862247+00:00' + latitude: 19.42 + longitude: -70.39 +geocoding: + method: WIKIDATA_LOCATION + source: Wikidata P131 (Hermanas Mirabal Province) + wikidata_id: Q119794896 + property: P131 + timestamp: '2025-12-10T00:02:45.046626+00:00' diff --git a/data/custodian/EE-37-TAL-A-SAT.yaml b/data/custodian/EE-37-TAL-A-SAT.yaml index f007115703..364120a519 100644 --- a/data/custodian/EE-37-TAL-A-SAT.yaml +++ b/data/custodian/EE-37-TAL-A-SAT.yaml @@ -6,6 +6,9 @@ original_entry: - wikidata_id: Q135028510 name: Documents on the history of the Hanse country: Germany + locations: + - latitude: 59.437222222 + longitude: 24.745 processing_timestamp: '2025-12-06T20:58:52.316599+00:00' wikidata_enrichment: wikidata_entity_id: Q12376170 @@ -55,8 +58,8 @@ wikidata_enrichment: instance_of: &id001 - id: Q166118 label: archive - description: agency or institution responsible for the preservation and communication of records selected for permanent - preservation + description: agency or institution responsible for the preservation and communication + of records selected for permanent preservation wikidata_instance_of: *id001 wikidata_location: country: &id002 @@ -99,7 +102,8 @@ ghcid: reason: 'City resolved via Wikidata Q12376170 coordinates: XXX->TAL (Tallinn)' - ghcid: EE-37-TAL-A-SAT valid_from: '2025-12-08T17:19:52.271847+00:00' - reason: GHCID abbreviation regenerated from emic_name "Stadtarchiv Tallinn" (was "Tallinn City Archives", abbrev TCA→SAT) + reason: GHCID abbreviation regenerated from emic_name "Stadtarchiv Tallinn" (was + "Tallinn City Archives", abbrev TCA→SAT) location_resolution: method: WIKIDATA_COORDS_REVERSE_GEOCODE country_code: EE @@ -134,12 +138,17 @@ unesco_mow_enrichment: provenance: notes: - 'Region resolved 2025-12-06T23:33:47Z: XX->37 via Wikidata P131 (EE-37)' - - 'City resolved 2025-12-07T00:36:48Z: XXX->TAL via Wikidata Q12376170 coords (59.4372,24.7450) -> Tallinn (GeoNames:588409)' - - 'GHCID regenerated 2025-12-08T17:19:52.271847+00:00: abbreviation TCA→SAT from emic_name' + - 'City resolved 2025-12-07T00:36:48Z: XXX->TAL via Wikidata Q12376170 coords (59.4372,24.7450) + -> Tallinn (GeoNames:588409)' + - 'GHCID regenerated 2025-12-08T17:19:52.271847+00:00: abbreviation TCA→SAT from + emic_name' - Canonical location normalized on 2025-12-09T12:10:55Z location: - region: EE-37 - region_code: '37' - country: EE - geonames_id: 588409 - normalization_timestamp: '2025-12-09T13:32:15.024181+00:00' + latitude: 59.437222222 + longitude: 24.745 +geocoding: + method: WIKIDATA_LOCATION + source: Wikidata P159 (Tallinn) + wikidata_id: Q12376170 + property: P159 + timestamp: '2025-12-10T00:02:41.898752+00:00' diff --git a/data/custodian/EE-79-TAR-A-R.yaml b/data/custodian/EE-79-TAR-A-R.yaml index dba8c3e374..5c7e5a54e4 100644 --- a/data/custodian/EE-79-TAR-A-R.yaml +++ b/data/custodian/EE-79-TAR-A-R.yaml @@ -6,6 +6,9 @@ original_entry: - wikidata_id: Q28028320 name: The Baltic Way - Human Chain Linking Three States in Their Drive for Freedom country: Estonia + locations: + - latitude: 58.38 + longitude: 26.7225 processing_timestamp: '2025-12-06T20:58:49.104388+00:00' wikidata_enrichment: wikidata_entity_id: Q6970432 @@ -93,7 +96,8 @@ wikidata_enrichment: description: archives of a country - id: Q1352795 label: cinematheque - description: organisation responsible for preserving and restoring cinematographic heritage + description: organisation responsible for preserving and restoring cinematographic + heritage wikidata_instance_of: *id001 wikidata_location: country: &id002 @@ -109,11 +113,12 @@ wikidata_enrichment: member_of: - id: Q27981723 label: Open Preservation Foundation - description: organization working to sustain technology and knowledge for the long-term management of digital cultural - heritage + description: organization working to sustain technology and knowledge for the + long-term management of digital cultural heritage - id: Q16245829 label: Association of European Film Archives and Cinematheques - description: organization of national and regional preservation film archives from all over Europe + description: organization of national and regional preservation film archives + from all over Europe - id: Q5205559 label: DLM Forum description: European membership community of public archives @@ -154,7 +159,8 @@ ghcid: reason: 'City resolved via Wikidata Q6970432 coordinates: XXX->TAR (Tartu)' - ghcid: EE-79-TAR-A-R valid_from: '2025-12-08T17:19:52.277897+00:00' - reason: GHCID abbreviation regenerated from emic_name "Rahvusarhiiv" (was "National Archives of Estonia", abbrev NAE→R) + reason: GHCID abbreviation regenerated from emic_name "Rahvusarhiiv" (was "National + Archives of Estonia", abbrev NAE→R) location_resolution: method: WIKIDATA_COORDS_REVERSE_GEOCODE country_code: EE @@ -189,12 +195,16 @@ unesco_mow_enrichment: provenance: notes: - 'Region resolved 2025-12-06T23:34:50Z: XX->79 via Wikidata P131 (EE-79)' - - 'City resolved 2025-12-07T00:35:16Z: XXX->TAR via Wikidata Q6970432 coords (58.3800,26.7225) -> Tartu (GeoNames:588335)' + - 'City resolved 2025-12-07T00:35:16Z: XXX->TAR via Wikidata Q6970432 coords (58.3800,26.7225) + -> Tartu (GeoNames:588335)' - 'GHCID regenerated 2025-12-08T17:19:52.277897+00:00: abbreviation NAE→R from emic_name' - Canonical location normalized on 2025-12-09T12:10:55Z location: - region: EE-79 - region_code: '79' - country: EE - geonames_id: 588335 - normalization_timestamp: '2025-12-09T13:32:15.077558+00:00' + latitude: 58.38 + longitude: 26.7225 +geocoding: + method: WIKIDATA_LOCATION + source: Wikidata P159 (Tartu) + wikidata_id: Q6970432 + property: P159 + timestamp: '2025-12-10T00:02:39.538348+00:00' diff --git a/data/custodian/HR-21-ZAG-A-ZF.yaml b/data/custodian/HR-21-ZAG-A-ZF.yaml index c767340c46..53265721bb 100644 --- a/data/custodian/HR-21-ZAG-A-ZF.yaml +++ b/data/custodian/HR-21-ZAG-A-ZF.yaml @@ -6,6 +6,9 @@ original_entry: - wikidata_id: Q136768420 name: Short films of the Zagreb School of Animated Films (1956 – 1979) country: Croatia + locations: + - latitude: 45.813055555 + longitude: 15.977222222 processing_timestamp: '2025-12-06T20:58:15.010258+00:00' wikidata_enrichment: wikidata_entity_id: Q140373 @@ -86,8 +89,9 @@ wikidata_enrichment: instance_of: &id001 - id: Q375336 label: film studio - description: major entertainment company or motion picture company that has its own privately owned studio facility - or facilities that are used to make films, which is handled by the production company + description: major entertainment company or motion picture company that has + its own privately owned studio facility or facilities that are used to make + films, which is handled by the production company - id: Q1762059 label: film production company description: company that produces films @@ -164,11 +168,15 @@ unesco_mow_enrichment: provenance: notes: - 'Region resolved 2025-12-06T23:33:16Z: XX->21 via Wikidata P131 (HR-21)' - - 'City resolved 2025-12-07T00:26:33Z: XXX->ZAG via Wikidata Q140373 coords (45.8131,15.9772) -> Zagreb (GeoNames:3186886)' + - 'City resolved 2025-12-07T00:26:33Z: XXX->ZAG via Wikidata Q140373 coords (45.8131,15.9772) + -> Zagreb (GeoNames:3186886)' - Canonical location normalized on 2025-12-09T12:11:03Z location: - region: HR-21 - region_code: '21' - country: HR - geonames_id: 3186886 - normalization_timestamp: '2025-12-09T13:32:24.374836+00:00' + latitude: 45.813055555 + longitude: 15.977222222 +geocoding: + method: WIKIDATA_LOCATION + source: Wikidata P159 (Zagreb) + wikidata_id: Q140373 + property: P159 + timestamp: '2025-12-10T00:02:44.515749+00:00' diff --git a/data/custodian/IR-09-MAS-L-INST.yaml b/data/custodian/IR-09-MAS-L-INST.yaml index 02fbbaa19f..f0d9aa258a 100644 --- a/data/custodian/IR-09-MAS-L-INST.yaml +++ b/data/custodian/IR-09-MAS-L-INST.yaml @@ -6,6 +6,9 @@ original_entry: - wikidata_id: Q28028103 name: Administrative Documents of Astan-e Quds Razavi in the Safavid Era country: Iran + locations: + - latitude: 36.297494444 + longitude: 59.605923055 processing_timestamp: '2025-12-06T20:58:37.164648+00:00' wikidata_enrichment: wikidata_entity_id: Q4119248 @@ -78,8 +81,9 @@ wikidata_enrichment: instance_of: &id001 - id: Q7075 label: library - description: institution charged with the care of a collection of literary, musical, artistic, or reference materials, - such as books, manuscripts, recordings, or films + description: institution charged with the care of a collection of literary, + musical, artistic, or reference materials, such as books, manuscripts, recordings, + or films - id: Q2122214 label: national archives description: archives of a country @@ -88,7 +92,8 @@ wikidata_enrichment: headquarters_location: id: Q121157 label: Mashhad - description: capital city of Razavi Khorasan Province, and second largest city in Iran + description: capital city of Razavi Khorasan Province, and second largest city + in Iran country: &id002 id: Q794 label: Iran @@ -127,8 +132,8 @@ ghcid: reason: 'City resolved via Wikidata Q4119248 coordinates: XXX->MAS (Mashhad)' - ghcid: IR-09-MAS-L-INST valid_from: '2025-12-08T17:19:53.186748+00:00' - reason: GHCID abbreviation regenerated from emic_name "کتابخانه آستان قدس رضوی" (was "Central Library of Astan Quds Razavi", - abbrev CLAQR→INST) + reason: GHCID abbreviation regenerated from emic_name "کتابخانه آستان قدس رضوی" + (was "Central Library of Astan Quds Razavi", abbrev CLAQR→INST) location_resolution: method: WIKIDATA_COORDS_REVERSE_GEOCODE country_code: IR @@ -163,12 +168,17 @@ unesco_mow_enrichment: provenance: notes: - 'Region resolved 2025-12-06T23:33:15Z: XX->09 via Wikidata P131 (IR-09)' - - 'City resolved 2025-12-07T00:26:42Z: XXX->MAS via Wikidata Q4119248 coords (36.2975,59.6059) -> Mashhad (GeoNames:124665)' - - 'GHCID regenerated 2025-12-08T17:19:53.186748+00:00: abbreviation CLAQR→INST from emic_name' + - 'City resolved 2025-12-07T00:26:42Z: XXX->MAS via Wikidata Q4119248 coords (36.2975,59.6059) + -> Mashhad (GeoNames:124665)' + - 'GHCID regenerated 2025-12-08T17:19:53.186748+00:00: abbreviation CLAQR→INST from + emic_name' - Canonical location normalized on 2025-12-09T12:11:05Z location: - region: IR-09 - region_code: 09 - country: IR - geonames_id: 124665 - normalization_timestamp: '2025-12-09T13:32:26.544941+00:00' + latitude: 36.297494444 + longitude: 59.605923055 +geocoding: + method: WIKIDATA_LOCATION + source: Wikidata P159 (Mashhad) + wikidata_id: Q4119248 + property: P159 + timestamp: '2025-12-10T00:02:40.176076+00:00' diff --git a/data/custodian/IR-23-TEH-A-INST.yaml b/data/custodian/IR-23-TEH-A-INST.yaml index d3615e550d..420aaada2f 100644 --- a/data/custodian/IR-23-TEH-A-INST.yaml +++ b/data/custodian/IR-23-TEH-A-INST.yaml @@ -6,6 +6,9 @@ original_entry: - wikidata_id: Q135028411 name: Documents on Iran’s International Relations Under the Qajar Rule (1807-1925) country: Iran + locations: + - latitude: 35.688277777 + longitude: 51.415861111 processing_timestamp: '2025-12-06T20:58:58.794877+00:00' wikidata_enrichment: wikidata_entity_id: Q2565708 @@ -62,19 +65,23 @@ wikidata_enrichment: wikidata_label_en: Ministry of Foreign Affairs of Iran wikidata_label_nl: Lijst van Iraanse ministers van Buitenlandse Zaken wikidata_label_ja: イランの外務大臣 - wikidata_label_de: Ministerium für auswärtige Angelegenheiten der islamischen Republik Iran + wikidata_label_de: Ministerium für auswärtige Angelegenheiten der islamischen Republik + Iran wikidata_label_fr: ministère des Affaires étrangères de l'Iran wikidata_label_es: Ministerio de Relaciones Exteriores de Irán wikidata_descriptions: en: Iranian government ministry - fr: réalise les relations diplomatiques de la République islamique d'Iran avec d'autres États - de: Führt die diplomatischen Beziehungen der islamischen Republik Iran mit anderen Staaten + fr: réalise les relations diplomatiques de la République islamique d'Iran avec + d'autres États + de: Führt die diplomatischen Beziehungen der islamischen Republik Iran mit anderen + Staaten cs: ministerstvo íránské vlády pro zahraniční politiku et: Iraani valitsusministeerium fa: یکی از ۱۹ وزارت‌خانهٔ دولت ایران ar: وزارة إيرانية zh: 政府机构 - sl: ministrstvo v vladi Islamske republike Iran, ki vodi diplomatske odnose Islamske republike Iran z drugimi državami + sl: ministrstvo v vladi Islamske republike Iran, ki vodi diplomatske odnose Islamske + republike Iran z drugimi državami ru: государственный орган исполнительной власти Исламской Республики Иран ko: 이란의 대외관계를 담당하는 중앙부처 ur: خمیننی کے انقلاب کے بعد وزیر خارجہ کون تھا @@ -190,8 +197,8 @@ ghcid: reason: 'City resolved via Wikidata Q2565708 coordinates: XXX->TEH (Tehran)' - ghcid: IR-23-TEH-A-INST valid_from: '2025-12-08T17:19:53.204080+00:00' - reason: GHCID abbreviation regenerated from emic_name "وزارت امور خارجه ایران" (was "Ministry of Foreign Affairs of Iran", - abbrev MFAI→INST) + reason: GHCID abbreviation regenerated from emic_name "وزارت امور خارجه ایران" + (was "Ministry of Foreign Affairs of Iran", abbrev MFAI→INST) location_resolution: method: WIKIDATA_COORDS_REVERSE_GEOCODE country_code: IR @@ -226,12 +233,17 @@ unesco_mow_enrichment: provenance: notes: - 'Region resolved 2025-12-06T23:33:51Z: XX->23 via Wikidata P131 (IR-23)' - - 'City resolved 2025-12-07T00:25:28Z: XXX->TEH via Wikidata Q2565708 coords (35.6883,51.4159) -> Tehran (GeoNames:112931)' - - 'GHCID regenerated 2025-12-08T17:19:53.204080+00:00: abbreviation MFAI→INST from emic_name' + - 'City resolved 2025-12-07T00:25:28Z: XXX->TEH via Wikidata Q2565708 coords (35.6883,51.4159) + -> Tehran (GeoNames:112931)' + - 'GHCID regenerated 2025-12-08T17:19:53.204080+00:00: abbreviation MFAI→INST from + emic_name' - Canonical location normalized on 2025-12-09T12:11:05Z location: - region: IR-23 - region_code: '23' - country: IR - geonames_id: 112931 - normalization_timestamp: '2025-12-09T13:32:26.766631+00:00' + latitude: 35.688277777 + longitude: 51.415861111 +geocoding: + method: WIKIDATA_LOCATION + source: Wikidata P159 (Tehran) + wikidata_id: Q2565708 + property: P159 + timestamp: '2025-12-10T00:02:43.196942+00:00' diff --git a/data/custodian/KR-11-YEO-C-K.yaml b/data/custodian/KR-11-YEO-C-K.yaml index 7d4a6ff768..74ff1e32f4 100644 --- a/data/custodian/KR-11-YEO-C-K.yaml +++ b/data/custodian/KR-11-YEO-C-K.yaml @@ -6,6 +6,9 @@ original_entry: - wikidata_id: Q135028713 name: The Archives of the KBS Special Live Broadcast "Finding Dispersed Families" country: South Korea + locations: + - latitude: 37.52468 + longitude: 126.92678 processing_timestamp: '2025-12-06T20:58:16.836686+00:00' wikidata_enrichment: wikidata_entity_id: Q498825 @@ -316,7 +319,8 @@ wikidata_enrichment: description: business that focuses primarily in mass media - id: Q270791 label: state-owned enterprise - description: legal entity controlled by a government to undertake commercial activities + description: legal entity controlled by a government to undertake commercial + activities wikidata_instance_of: *id001 wikidata_location: headquarters_location: @@ -383,7 +387,8 @@ ghcid: reason: 'City resolved via Wikidata Q498825 coordinates: XXX->YEO (Yeoui-dong)' - ghcid: KR-11-YEO-C-K valid_from: '2025-12-08T17:20:55.864457+00:00' - reason: GHCID abbreviation regenerated from emic_name "KBS (한국방송공사)" (was "Korean Broadcasting System", abbrev KBS→K) + reason: GHCID abbreviation regenerated from emic_name "KBS (한국방송공사)" (was "Korean + Broadcasting System", abbrev KBS→K) location_resolution: method: WIKIDATA_COORDS_REVERSE_GEOCODE country_code: KR @@ -418,26 +423,34 @@ unesco_mow_enrichment: provenance: notes: - 'Region resolved 2025-12-06T23:36:09Z: XX->11 via Wikidata P131 (KR-11)' - - 'City resolved 2025-12-07T00:34:14Z: XXX->YEO via Wikidata Q498825 coords (37.5247,126.9268) -> Yeoui-dong (GeoNames:1832144)' + - 'City resolved 2025-12-07T00:34:14Z: XXX->YEO via Wikidata Q498825 coords (37.5247,126.9268) + -> Yeoui-dong (GeoNames:1832144)' - 'GHCID regenerated 2025-12-08T17:20:55.864457+00:00: abbreviation KBS→K from emic_name' - - 'YouTube/Google Maps enrichment 2025-12-08T20:27:20Z: Maps: rejected by LLM; YouTube: not found' + - 'YouTube/Google Maps enrichment 2025-12-08T20:27:20Z: Maps: rejected by LLM; YouTube: + not found' - Canonical location normalized on 2025-12-09T12:23:07Z google_maps_status: NO_MATCH google_maps_rejected: candidate_name: KBS Korean Broadcasting System - rejection_reason: 'NAME MATCH: Yes. KBS is a well-known acronym for Korean Broadcasting System. LOCATION MATCH: Yes. The - address is in Seoul, South Korea. TYPE MATCH: No. The Google Place types ''point_of_interest'' and ''establishment'' are - not specific enough to confirm it as a heritage institution, nor do they match expected types like museum or library. - KBS is primarily a national public broadcaster. While it may have an archive or museum related to broadcasting history, - its main function is not that of a heritage institution. The candidate place type is too general and ambiguous. ENTITY - TYPE: No. The candidate does not have enough evidence to be classified as a heritage institution (GRP.HER).' + rejection_reason: 'NAME MATCH: Yes. KBS is a well-known acronym for Korean Broadcasting + System. LOCATION MATCH: Yes. The address is in Seoul, South Korea. TYPE MATCH: + No. The Google Place types ''point_of_interest'' and ''establishment'' are not + specific enough to confirm it as a heritage institution, nor do they match expected + types like museum or library. KBS is primarily a national public broadcaster. + While it may have an archive or museum related to broadcasting history, its main + function is not that of a heritage institution. The candidate place type is too + general and ambiguous. ENTITY TYPE: No. The candidate does not have enough evidence + to be classified as a heritage institution (GRP.HER).' timestamp: '2025-12-08T20:27:20.234054+00:00' youtube_status: NOT_FOUND youtube_search_query: Korean Broadcasting System official youtube_search_timestamp: '2025-12-08T20:27:20.590309+00:00' location: - region: KR-11 - region_code: '11' - country: KR - geonames_id: 1832144 - normalization_timestamp: '2025-12-09T13:40:52.616239+00:00' + latitude: 37.52468 + longitude: 126.92678 +geocoding: + method: WIKIDATA_LOCATION + source: Wikidata P159 (Yeoui-dong) + wikidata_id: Q498825 + property: P159 + timestamp: '2025-12-10T00:02:44.593396+00:00' diff --git a/data/custodian/KR-41-GP-A-INST.yaml b/data/custodian/KR-41-GP-A-INST.yaml index 31d810367c..62e2193045 100644 --- a/data/custodian/KR-41-GP-A-INST.yaml +++ b/data/custodian/KR-41-GP-A-INST.yaml @@ -6,6 +6,9 @@ original_entry: - wikidata_id: Q135028416 name: Archives of the April 19 Revolution country: South Korea + locations: + - latitude: 37.5 + longitude: 127.25 processing_timestamp: '2025-12-06T20:58:38.147029+00:00' wikidata_enrichment: wikidata_entity_id: Q14545096 @@ -47,7 +50,8 @@ wikidata_enrichment: instance_of: &id001 - id: Q125852944 label: non-classified public institution - description: Public institutions other than public corporations or quasi-governmental institutions + description: Public institutions other than public corporations or quasi-governmental + institutions wikidata_instance_of: *id001 wikidata_location: country: &id002 @@ -92,7 +96,8 @@ ghcid: reason: 'Region resolved via Wikidata P131: XX->41 (KR-41)' - ghcid: KR-41-GP-A-INST valid_from: '2025-12-08T17:20:55.909363+00:00' - reason: GHCID abbreviation regenerated from emic_name "민주화운동기념사업회" (was "Korea Democracy Foundation", abbrev KDF→INST) + reason: GHCID abbreviation regenerated from emic_name "민주화운동기념사업회" (was "Korea + Democracy Foundation", abbrev KDF→INST) location_resolution: method: WIKIDATA_P131 country_code: KR @@ -126,23 +131,31 @@ unesco_mow_enrichment: provenance: notes: - 'Region resolved 2025-12-06T23:34:04Z: XX->41 via Wikidata P131 (KR-41)' - - 'GHCID regenerated 2025-12-08T17:20:55.909363+00:00: abbreviation KDF→INST from emic_name' - - 'YouTube/Google Maps enrichment 2025-12-08T20:27:44Z: Maps: rejected by LLM; YouTube: not found' + - 'GHCID regenerated 2025-12-08T17:20:55.909363+00:00: abbreviation KDF→INST from + emic_name' + - 'YouTube/Google Maps enrichment 2025-12-08T20:27:44Z: Maps: rejected by LLM; YouTube: + not found' - Canonical location normalized on 2025-12-09T12:23:07Z google_maps_status: NO_MATCH google_maps_rejected: candidate_name: Korea Democracy Foundation - rejection_reason: 'NAME MATCH: True. The names are identical. LOCATION MATCH: True. The candidate is in South Korea (KR), - matching the source institution''s country. TYPE MATCH: False. The Google Place types are ''point_of_interest'' and ''establishment'', - which are generic and do not match any of the expected heritage institution types (museum, library, archive, gallery). - ENTITY TYPE: The lack of a specific heritage-related type prevents a confident confirmation that it is a GRP.HER. It could - be a research center or an office, not a public-facing custodian institution.' + rejection_reason: 'NAME MATCH: True. The names are identical. LOCATION MATCH: True. + The candidate is in South Korea (KR), matching the source institution''s country. + TYPE MATCH: False. The Google Place types are ''point_of_interest'' and ''establishment'', + which are generic and do not match any of the expected heritage institution types + (museum, library, archive, gallery). ENTITY TYPE: The lack of a specific heritage-related + type prevents a confident confirmation that it is a GRP.HER. It could be a research + center or an office, not a public-facing custodian institution.' timestamp: '2025-12-08T20:27:44.311948+00:00' youtube_status: NOT_FOUND youtube_search_query: Korea Democracy Foundation official youtube_search_timestamp: '2025-12-08T20:27:44.667524+00:00' location: - region: KR-41 - region_code: '41' - country: KR - normalization_timestamp: '2025-12-09T13:40:52.867210+00:00' + latitude: 37.5 + longitude: 127.25 +geocoding: + method: WIKIDATA_LOCATION + source: Wikidata P131 (Gyeonggi Province) + wikidata_id: Q14545096 + property: P131 + timestamp: '2025-12-10T00:02:40.807086+00:00' diff --git a/data/custodian/MM-18-KYE-A-MRAC.yaml b/data/custodian/MM-18-KYE-A-MRAC.yaml index 0a2207aef4..f08c7f04d0 100644 --- a/data/custodian/MM-18-KYE-A-MRAC.yaml +++ b/data/custodian/MM-18-KYE-A-MRAC.yaml @@ -6,6 +6,9 @@ original_entry: - wikidata_id: Q135028680 name: King Bayinnaung Bell Inscription country: Myanmar + locations: + - latitude: 19.7475 + longitude: 96.115 processing_timestamp: '2025-12-06T20:58:29.946812+00:00' wikidata_enrichment: wikidata_entity_id: Q28194796 @@ -101,11 +104,15 @@ unesco_mow_enrichment: provenance: notes: - 'Region resolved 2025-12-06T23:33:29Z: XX->18 via Wikidata P131 (MM-18)' - - 'City resolved 2025-12-07T00:31:45Z: XXX->KYE via Wikidata Q28194796 coords (19.7475,96.1150) -> Kyetpye (GeoNames:1316111)' + - 'City resolved 2025-12-07T00:31:45Z: XXX->KYE via Wikidata Q28194796 coords (19.7475,96.1150) + -> Kyetpye (GeoNames:1316111)' - Canonical location normalized on 2025-12-09T12:23:10Z location: - region: MM-18 - region_code: '18' - country: MM - geonames_id: 1316111 - normalization_timestamp: '2025-12-09T13:40:55.459229+00:00' + latitude: 19.7475 + longitude: 96.115 +geocoding: + method: WIKIDATA_LOCATION + source: Wikidata P159 (Naypyidaw) + wikidata_id: Q28194796 + property: P159 + timestamp: '2025-12-10T00:02:40.860573+00:00' diff --git a/data/custodian/MX-CMX-CHU-A-SCJN.yaml b/data/custodian/MX-CMX-CHU-A-SCJN.yaml index fdd8480c62..4bc21fd203 100644 --- a/data/custodian/MX-CMX-CHU-A-SCJN.yaml +++ b/data/custodian/MX-CMX-CHU-A-SCJN.yaml @@ -4,9 +4,13 @@ original_entry: wikidata_id: Q130925 mow_inscriptions: - wikidata_id: Q135028756 - name: 'Judicial files concerning the birth of a right: the effective remedy as a contribution of the Mexican writ of amparo - to the Universal Declaration of Human Rights (UDHR) of 1948.' + name: 'Judicial files concerning the birth of a right: the effective remedy as + a contribution of the Mexican writ of amparo to the Universal Declaration of + Human Rights (UDHR) of 1948.' country: Mexico + locations: + - latitude: 19.353773 + longitude: -99.13589 processing_timestamp: '2025-12-06T20:58:52.387097+00:00' wikidata_enrichment: wikidata_entity_id: Q130925 @@ -219,30 +223,37 @@ unesco_mow_enrichment: inscription_count: 1 inscriptions: - wikidata_id: Q135028756 - name: 'Judicial files concerning the birth of a right: the effective remedy as a contribution of the Mexican writ of amparo - to the Universal Declaration of Human Rights (UDHR) of 1948.' + name: 'Judicial files concerning the birth of a right: the effective remedy as + a contribution of the Mexican writ of amparo to the Universal Declaration of + Human Rights (UDHR) of 1948.' inscription_country: Mexico enrichment_timestamp: '2025-12-06T20:58:52.387097+00:00' data_source: Wikidata SPARQL (UNESCO has no MoW API) provenance: notes: - 'Region resolved 2025-12-06T23:34:16Z: XX->CMX via Wikidata P131 (MX-CMX)' - - 'City resolved 2025-12-07T00:25:43Z: XXX->CHU via Wikidata Q130925 coords (19.3538,-99.1359) -> Churubusco (GeoNames:3530675)' - - 'YouTube/Google Maps enrichment 2025-12-08T20:44:35Z: Maps: rejected by LLM; YouTube: not found' + - 'City resolved 2025-12-07T00:25:43Z: XXX->CHU via Wikidata Q130925 coords (19.3538,-99.1359) + -> Churubusco (GeoNames:3530675)' + - 'YouTube/Google Maps enrichment 2025-12-08T20:44:35Z: Maps: rejected by LLM; YouTube: + not found' - Canonical location normalized on 2025-12-09T12:23:16Z google_maps_status: NO_MATCH google_maps_rejected: candidate_name: National Supreme Court of Justice - rejection_reason: While the name and location match, the candidate's type ('courthouse', 'government_office') does not align - with the expected GRP.HER heritage institution types (museum, library, archive, gallery). The Supreme Court of Justice - of the Nation is a judicial body, not a cultural heritage custodian. + rejection_reason: While the name and location match, the candidate's type ('courthouse', + 'government_office') does not align with the expected GRP.HER heritage institution + types (museum, library, archive, gallery). The Supreme Court of Justice of the + Nation is a judicial body, not a cultural heritage custodian. timestamp: '2025-12-08T20:44:35.499832+00:00' youtube_status: NOT_FOUND youtube_search_query: Supreme Court of Justice of the Nation official youtube_search_timestamp: '2025-12-08T20:44:35.822997+00:00' location: - region: MX-CMX - region_code: CMX - country: MX - geonames_id: 3530675 - normalization_timestamp: '2025-12-09T13:40:59.457784+00:00' + latitude: 19.353773 + longitude: -99.13589 +geocoding: + method: WIKIDATA_LOCATION + source: Wikidata P159 (Mexico City) + wikidata_id: Q130925 + property: P159 + timestamp: '2025-12-10T00:02:41.285521+00:00' diff --git a/data/custodian/MZ-MPM-B2D-A-AHM.yaml b/data/custodian/MZ-MPM-B2D-A-AHM.yaml index db5e6141cf..2c4e1d8f83 100644 --- a/data/custodian/MZ-MPM-B2D-A-AHM.yaml +++ b/data/custodian/MZ-MPM-B2D-A-AHM.yaml @@ -4,8 +4,12 @@ original_entry: wikidata_id: Q19607653 mow_inscriptions: - wikidata_id: Q136768403 - name: Census of slaves in Angola, Cape Verde and Mozambique determined by Portuguese decree of 12/14/1854 + name: Census of slaves in Angola, Cape Verde and Mozambique determined by Portuguese + decree of 12/14/1854 country: Angola + locations: + - latitude: -25.915277777 + longitude: 32.576388888 processing_timestamp: '2025-12-06T20:58:53.461498+00:00' wikidata_enrichment: wikidata_entity_id: Q19607653 @@ -105,7 +109,8 @@ wikidata_enrichment: country: &id002 id: Q1029 label: Mozambique - description: country in Southeastern Africa; the current form of Mozambique since 1975 + description: country in Southeastern Africa; the current form of Mozambique + since 1975 headquarters_location: id: Q3889 label: Maputo @@ -137,7 +142,8 @@ ghcid: reason: 'Region resolved via Wikidata P131: XX->MPM (MZ-MPM)' - ghcid: MZ-MPM-B2D-A-AHM valid_from: '2025-12-07T00:31:22.328033+00:00' - reason: 'City resolved via Wikidata Q19607653 coordinates: XXX->B2D (Bairro 25 de Junho B)' + reason: 'City resolved via Wikidata Q19607653 coordinates: XXX->B2D (Bairro 25 + de Junho B)' location_resolution: method: WIKIDATA_COORDS_REVERSE_GEOCODE country_code: MZ @@ -161,19 +167,23 @@ unesco_mow_enrichment: inscription_count: 1 inscriptions: - wikidata_id: Q136768403 - name: Census of slaves in Angola, Cape Verde and Mozambique determined by Portuguese decree of 12/14/1854 + name: Census of slaves in Angola, Cape Verde and Mozambique determined by Portuguese + decree of 12/14/1854 inscription_country: Angola enrichment_timestamp: '2025-12-06T20:58:53.461498+00:00' data_source: Wikidata SPARQL (UNESCO has no MoW API) provenance: notes: - 'Region resolved 2025-12-06T23:32:35Z: XX->MPM via Wikidata P131 (MZ-MPM)' - - 'City resolved 2025-12-07T00:31:22Z: XXX->B2D via Wikidata Q19607653 coords (-25.9153,32.5764) -> Bairro 25 de Junho B - (GeoNames:1106294)' + - 'City resolved 2025-12-07T00:31:22Z: XXX->B2D via Wikidata Q19607653 coords (-25.9153,32.5764) + -> Bairro 25 de Junho B (GeoNames:1106294)' - Canonical location normalized on 2025-12-09T12:23:19Z location: - region: MZ-MPM - region_code: MPM - country: MZ - geonames_id: 1106294 - normalization_timestamp: '2025-12-09T13:41:02.278687+00:00' + latitude: -25.915277777 + longitude: 32.576388888 +geocoding: + method: WIKIDATA_LOCATION + source: Wikidata P159 (Maputo) + wikidata_id: Q19607653 + property: P159 + timestamp: '2025-12-10T00:02:40.597922+00:00' diff --git a/data/custodian/NL-00-ARN-U-NVP.yaml b/data/custodian/NL-00-ARN-U-NVP.yaml index 66aca95926..0a64695f4c 100644 --- a/data/custodian/NL-00-ARN-U-NVP.yaml +++ b/data/custodian/NL-00-ARN-U-NVP.yaml @@ -7,6 +7,8 @@ original_entry: - U entry_index: 1504 processing_timestamp: '2025-11-30T09:58:13.945408+00:00' +linkin: + url: https://www.linkedin.com/company/nederlandse-vereniging-voor-papierknipkunst/ nan_isil_enrichment: source: Nationaal Archief ISIL Registry source_file: ISIL-codes_2025-11-06.yaml diff --git a/data/custodian/NL-NH-AMS-U-EFM-eye_filmmuseum.yaml b/data/custodian/NL-NH-AMS-U-EFM-eye_filmmuseum.yaml index e28fe4de94..efea2b85e6 100644 --- a/data/custodian/NL-NH-AMS-U-EFM-eye_filmmuseum.yaml +++ b/data/custodian/NL-NH-AMS-U-EFM-eye_filmmuseum.yaml @@ -1162,6 +1162,7 @@ linkedin_enrichment: - name: Anne Gant role: Head of Film Conservation and Digital Access linkedin_url: https://nl.linkedin.com/in/anne-gant-59908a18 + person_profile_path: data/custodian/person/anne-gant-59908a18_20251209T220000Z.json current: true start_date: '2014' career_history: @@ -1262,6 +1263,7 @@ linkedin_enrichment: - name: Sandra den Hamer role: Director linkedin_url: https://nl.linkedin.com/in/sandra-den-hamer-66024510 + person_profile_path: data/custodian/person/sandra-den-hamer-66024510_20251209T220000Z.json tenure_start: '2010-01' tenure_end: '2023-02' current_role: Interim Directeur at Nederlands Filmfonds @@ -1310,6 +1312,8 @@ linkedin_enrichment: - name: Giovanna Fossati role: Chief Curator (Former) linkedin_url: https://nl.linkedin.com/in/giovannafossati + person_profile_path: data/custodian/person/giovannafossati_20251209T220000Z.json + person_connections_path: data/custodian/person/giovannafossati_connections_20251209T220000Z.json email: g.fossati@uu.nl current: false tenure_end: '2024-12' @@ -1537,6 +1541,7 @@ linkedin_enrichment: specialization: Silent film, international, nitrate film email: elifrongen@eyefilm.nl linkedin_url: https://nl.linkedin.com/in/elif-rongen-kaynak%C3%A7i-35295a17 + person_profile_path: data/custodian/person/elif-rongen-kaynakci-35295a17_20251209T220000Z.json start_date: '2010-01' current: true expertise: @@ -2731,6 +2736,7 @@ linkedin_enrichment: linkedin_url: https://www.linkedin.com/in/alexandr-belov-bb547b46 current: true person_profile_path: data/custodian/person/alexandr-belov-bb547b46_20251210T120000Z.json + person_connections_path: data/custodian/person/alexandr-belov-bb547b46_connections_20251210T160000Z.json technical_staff: - name: Duke Stewart role: Technical Lead diff --git a/data/custodian/NL-ZH-TH-O-NGIS.yaml b/data/custodian/NL-ZH-TH-O-NGIS.yaml index 8d068917c3..27713247b4 100644 --- a/data/custodian/NL-ZH-TH-O-NGIS.yaml +++ b/data/custodian/NL-ZH-TH-O-NGIS.yaml @@ -6,6 +6,9 @@ original_entry: - wikidata_id: Q27027188 name: Westerbork film country: '' + locations: + - latitude: 52.08 + longitude: 4.31 processing_timestamp: '2025-12-06T20:58:34.201119+00:00' wikidata_enrichment: wikidata_entity_id: Q2369041 @@ -58,8 +61,9 @@ wikidata_enrichment: instance_of: &id001 - id: Q327333 label: government agency - description: organisational part of a government responsible for specific public services, such as health, judiciary, - education, transportation, foreign affairs, etc + description: organisational part of a government responsible for specific public + services, such as health, judiciary, education, transportation, foreign affairs, + etc wikidata_instance_of: *id001 wikidata_location: headquarters_location: @@ -127,11 +131,15 @@ unesco_mow_enrichment: provenance: notes: - 'Region resolved 2025-12-06T23:35:12Z: XX->ZH via Wikidata P131 (NL-ZH)' - - 'City resolved 2025-12-07T00:34:26Z: XXX->TH via Wikidata Q2369041 coords (52.0800,4.3100) -> The Hague (GeoNames:2747373)' + - 'City resolved 2025-12-07T00:34:26Z: XXX->TH via Wikidata Q2369041 coords (52.0800,4.3100) + -> The Hague (GeoNames:2747373)' - Canonical location normalized on 2025-12-09T13:16:23Z location: - region: NL-ZH - region_code: ZH - country: NL - geonames_id: 2747373 - normalization_timestamp: '2025-12-09T13:56:18.409197+00:00' + latitude: 52.08 + longitude: 4.31 +geocoding: + method: WIKIDATA_LOCATION + source: Wikidata P159 (The Hague) + wikidata_id: Q2369041 + property: P159 + timestamp: '2025-12-10T00:02:44.405978+00:00' diff --git a/data/custodian/OM-MA-MAS-A-MHC.yaml b/data/custodian/OM-MA-MAS-A-MHC.yaml index b779ecc87e..5beae503da 100644 --- a/data/custodian/OM-MA-MAS-A-MHC.yaml +++ b/data/custodian/OM-MA-MAS-A-MHC.yaml @@ -6,6 +6,9 @@ original_entry: - wikidata_id: Q135028577 name: Maden Al Asrar Fi Elm Al Behar Manuscript country: Oman + locations: + - latitude: 23.613888888 + longitude: 58.592222222 processing_timestamp: '2025-12-06T20:58:52.123646+00:00' wikidata_enrichment: wikidata_entity_id: Q6867126 @@ -110,11 +113,15 @@ unesco_mow_enrichment: provenance: notes: - 'Region resolved 2025-12-06T23:35:50Z: XX->MA via Wikidata P131 (OM-MA)' - - 'City resolved 2025-12-07T00:31:41Z: XXX->MAS via Wikidata Q6867126 coords (23.6139,58.5922) -> Masqat (GeoNames:13440507)' + - 'City resolved 2025-12-07T00:31:41Z: XXX->MAS via Wikidata Q6867126 coords (23.6139,58.5922) + -> Masqat (GeoNames:13440507)' - Canonical location normalized on 2025-12-09T13:15:55Z location: - region: OM-MA - region_code: MA - country: OM - geonames_id: 13440507 - normalization_timestamp: '2025-12-09T13:56:26.935741+00:00' + latitude: 23.613888888 + longitude: 58.592222222 +geocoding: + method: WIKIDATA_LOCATION + source: Wikidata P159 (Muscat) + wikidata_id: Q6867126 + property: P159 + timestamp: '2025-12-10T00:02:42.625832+00:00' diff --git a/data/custodian/PH-00-SJ-A-SP.yaml b/data/custodian/PH-00-SJ-A-SP.yaml index 34a1cecbbc..ec70707e78 100644 --- a/data/custodian/PH-00-SJ-A-SP.yaml +++ b/data/custodian/PH-00-SJ-A-SP.yaml @@ -6,6 +6,9 @@ original_entry: - wikidata_id: Q28028283 name: Presidential Papers of Manuel L. Quezon country: Philippines + locations: + - latitude: 14.5469 + longitude: 120.984 processing_timestamp: '2025-12-06T20:58:05.108005+00:00' wikidata_enrichment: wikidata_entity_id: Q1418426 @@ -150,7 +153,8 @@ wikidata_enrichment: instance_of: &id001 - id: Q2570643 label: senate - description: type of legislative body, often the upper house or chamber of a bicameral legislature + description: type of legislative body, often the upper house or chamber of a + bicameral legislature wikidata_instance_of: *id001 wikidata_location: country: &id002 @@ -234,11 +238,15 @@ unesco_mow_enrichment: provenance: notes: - 'Region resolved 2025-12-06T23:32:43Z: XX->00 via Wikidata P131 (PH-00)' - - 'City resolved 2025-12-07T00:34:49Z: XXX->SJ via Wikidata Q1418426 coords (14.5469,120.9840) -> San Jose (GeoNames:1689468)' + - 'City resolved 2025-12-07T00:34:49Z: XXX->SJ via Wikidata Q1418426 coords (14.5469,120.9840) + -> San Jose (GeoNames:1689468)' - Canonical location normalized on 2025-12-09T13:15:51Z location: - region: PH-00 - region_code: '00' - country: PH - geonames_id: 1689468 - normalization_timestamp: '2025-12-09T13:56:27.066992+00:00' + latitude: 14.5469 + longitude: 120.984 +geocoding: + method: WIKIDATA_LOCATION + source: Wikidata P159 (GSIS Building) + wikidata_id: Q1418426 + property: P159 + timestamp: '2025-12-10T00:02:42.390696+00:00' diff --git a/data/custodian/TH-10-DUS-A-NAT.yaml b/data/custodian/TH-10-DUS-A-NAT.yaml index 318121b7df..17a0189c93 100644 --- a/data/custodian/TH-10-DUS-A-NAT.yaml +++ b/data/custodian/TH-10-DUS-A-NAT.yaml @@ -9,6 +9,9 @@ original_entry: - wikidata_id: Q123686162 name: Royal Photographic Glass Plate Negatives and Original Prints Collection country: Thailand + locations: + - latitude: 13.776944444 + longitude: 100.520555555 processing_timestamp: '2025-12-06T20:58:37.584905+00:00' wikidata_enrichment: wikidata_entity_id: Q6970459 @@ -164,11 +167,15 @@ unesco_mow_enrichment: provenance: notes: - 'Region resolved 2025-12-06T23:35:52Z: XX->10 via Wikidata P131 (TH-10)' - - 'City resolved 2025-12-07T00:33:24Z: XXX->DUS via Wikidata Q6970459 coords (13.7769,100.5206) -> Dusit (GeoNames:1610858)' + - 'City resolved 2025-12-07T00:33:24Z: XXX->DUS via Wikidata Q6970459 coords (13.7769,100.5206) + -> Dusit (GeoNames:1610858)' - Canonical location normalized on 2025-12-09T13:15:06Z location: - region: TH-10 - region_code: '10' - country: TH - geonames_id: 1610858 - normalization_timestamp: '2025-12-09T13:56:37.920897+00:00' + latitude: 13.776944444 + longitude: 100.520555555 +geocoding: + method: WIKIDATA_LOCATION + source: Wikidata P159 (Dusit) + wikidata_id: Q6970459 + property: P159 + timestamp: '2025-12-10T00:02:39.603055+00:00' diff --git a/data/custodian/TH-10-PBM-A-STH.yaml b/data/custodian/TH-10-PBM-A-STH.yaml index 7b20d6aef7..7fba35c785 100644 --- a/data/custodian/TH-10-PBM-A-STH.yaml +++ b/data/custodian/TH-10-PBM-A-STH.yaml @@ -6,6 +6,9 @@ original_entry: - wikidata_id: Q4924088 name: Ram Khamhaeng inscription country: Thailand + locations: + - latitude: 13.758277777 + longitude: 100.493666666 processing_timestamp: '2025-12-06T20:58:27.400168+00:00' wikidata_enrichment: wikidata_entity_id: Q13017383 @@ -45,7 +48,8 @@ wikidata_enrichment: instance_of: &id001 - id: Q58227162 label: hall building - description: Gebäude, dessen Inneres durch einen oder mehrere Säle eingenommen wird + description: Gebäude, dessen Inneres durch einen oder mehrere Säle eingenommen + wird wikidata_instance_of: *id001 wikidata_location: country: &id002 @@ -116,9 +120,15 @@ unesco_mow_enrichment: data_source: Wikidata SPARQL (UNESCO has no MoW API) provenance: notes: - - 'Region code resolved 2025-12-06T22:15:11Z: XX → 10 (Bangkok) via Wikidata P131 chain' + - 'Region code resolved 2025-12-06T22:15:11Z: XX → 10 (Bangkok) via Wikidata P131 + chain' - Canonical location normalized on 2025-12-09T13:15:34Z location: - region_code: '10' - country: TH - normalization_timestamp: '2025-12-09T13:56:37.953985+00:00' + latitude: 13.758277777 + longitude: 100.493666666 +geocoding: + method: WIKIDATA_LOCATION + source: Wikidata P131 (Phra Borom Maha Ratchawang) + wikidata_id: Q13017383 + property: P131 + timestamp: '2025-12-10T00:02:41.169159+00:00' diff --git a/data/custodian/TH-10-WAT-A-SS.yaml b/data/custodian/TH-10-WAT-A-SS.yaml index 01bc1fabe6..ab6e25de9c 100644 --- a/data/custodian/TH-10-WAT-A-SS.yaml +++ b/data/custodian/TH-10-WAT-A-SS.yaml @@ -4,9 +4,12 @@ original_entry: wikidata_id: Q2280705 mow_inscriptions: - wikidata_id: Q28028346 - name: The Minute Books of the Council of the Siam Society, 100 years of recording international cooperation in research - and the dissem + name: The Minute Books of the Council of the Siam Society, 100 years of recording + international cooperation in research and the dissem country: Thailand + locations: + - latitude: 13.742444444 + longitude: 100.588638888 processing_timestamp: '2025-12-06T20:58:34.199756+00:00' wikidata_enrichment: wikidata_entity_id: Q2280705 @@ -146,19 +149,23 @@ unesco_mow_enrichment: inscription_count: 1 inscriptions: - wikidata_id: Q28028346 - name: The Minute Books of the Council of the Siam Society, 100 years of recording international cooperation in research - and the dissem + name: The Minute Books of the Council of the Siam Society, 100 years of recording + international cooperation in research and the dissem inscription_country: Thailand enrichment_timestamp: '2025-12-06T20:58:34.199756+00:00' data_source: Wikidata SPARQL (UNESCO has no MoW API) provenance: notes: - 'Region resolved 2025-12-06T23:35:44Z: XX->10 via Wikidata P131 (TH-10)' - - 'City resolved 2025-12-07T00:27:24Z: XXX->WAT via Wikidata Q2280705 coords (13.7424,100.5886) -> Watthana (GeoNames:7027003)' + - 'City resolved 2025-12-07T00:27:24Z: XXX->WAT via Wikidata Q2280705 coords (13.7424,100.5886) + -> Watthana (GeoNames:7027003)' - Canonical location normalized on 2025-12-09T13:15:20Z location: - region: TH-10 - region_code: '10' - country: TH - geonames_id: 7027003 - normalization_timestamp: '2025-12-09T13:56:38.026269+00:00' + latitude: 13.742444444 + longitude: 100.588638888 +geocoding: + method: WIKIDATA_LOCATION + source: Wikidata P159 (Khlong Tan Nuea) + wikidata_id: Q2280705 + property: P159 + timestamp: '2025-12-10T00:02:40.499676+00:00' diff --git a/data/custodian/TH-73-PHU-A-TFA.yaml b/data/custodian/TH-73-PHU-A-TFA.yaml index 23d685bd48..0e777f8ade 100644 --- a/data/custodian/TH-73-PHU-A-TFA.yaml +++ b/data/custodian/TH-73-PHU-A-TFA.yaml @@ -4,8 +4,12 @@ original_entry: wikidata_id: Q13023423 mow_inscriptions: - wikidata_id: Q136768439 - name: The Birth of the Association of Southeast Asia Nations (ASEAN) (Archives about the Formation ASEAN, 1967 – 1976) + name: The Birth of the Association of Southeast Asia Nations (ASEAN) (Archives + about the Formation ASEAN, 1967 – 1976) country: Indonesia + locations: + - latitude: 13.801944444 + longitude: 100.321666666 processing_timestamp: '2025-12-06T20:58:52.336883+00:00' wikidata_enrichment: wikidata_entity_id: Q13023423 @@ -60,7 +64,8 @@ wikidata_enrichment: instance_of: &id001 - id: Q1352795 label: cinematheque - description: organisation responsible for preserving and restoring cinematographic heritage + description: organisation responsible for preserving and restoring cinematographic + heritage - id: Q13023559 label: public organization (Thailand) description: type of state agency in Thailand @@ -129,7 +134,8 @@ unesco_mow_enrichment: inscription_count: 1 inscriptions: - wikidata_id: Q136768439 - name: The Birth of the Association of Southeast Asia Nations (ASEAN) (Archives about the Formation ASEAN, 1967 – 1976) + name: The Birth of the Association of Southeast Asia Nations (ASEAN) (Archives + about the Formation ASEAN, 1967 – 1976) inscription_country: Indonesia enrichment_timestamp: '2025-12-06T20:58:52.336883+00:00' data_source: Wikidata SPARQL (UNESCO has no MoW API) @@ -138,7 +144,11 @@ provenance: - 'Region resolved 2025-12-06T23:33:44Z: XX->73 via Wikidata P131 (TH-73)' - Canonical location normalized on 2025-12-09T13:15:06Z location: - region: TH-73 - region_code: '73' - country: TH - normalization_timestamp: '2025-12-09T13:56:38.112779+00:00' + latitude: 13.801944444 + longitude: 100.321666666 +geocoding: + method: WIKIDATA_LOCATION + source: Wikidata P159 (Phutthamonthon) + wikidata_id: Q13023423 + property: P159 + timestamp: '2025-12-10T00:02:39.630636+00:00' diff --git a/data/custodian/TR-06-ANK-A-MCT.yaml b/data/custodian/TR-06-ANK-A-MCT.yaml index f83f87d526..38407cedf6 100644 --- a/data/custodian/TR-06-ANK-A-MCT.yaml +++ b/data/custodian/TR-06-ANK-A-MCT.yaml @@ -6,6 +6,9 @@ original_entry: - wikidata_id: Q136768471 name: Karatepe-Aslantaş Inscriptions country: Turkey + locations: + - latitude: 39.93576 + longitude: 32.83869 processing_timestamp: '2025-12-06T20:58:54.715834+00:00' wikidata_enrichment: wikidata_entity_id: Q3136957 @@ -155,7 +158,8 @@ wikidata_enrichment: description: building in Turkey - id: Q28136615 label: Akhisar Museum - description: archaeology and ethnography museum located in Akhisar, Manisa, Türkiye + description: archaeology and ethnography museum located in Akhisar, Manisa, + Türkiye - id: Q28221137 label: Sivas Congress and Ethnography Museum description: '' @@ -225,22 +229,28 @@ unesco_mow_enrichment: provenance: notes: - 'Region resolved 2025-12-06T23:33:36Z: XX->06 via Wikidata P131 (TR-06)' - - 'City resolved 2025-12-07T00:28:30Z: XXX->ANK via Wikidata Q3136957 coords (39.9358,32.8387) -> Ankara (GeoNames:323786)' - - 'YouTube/Google Maps enrichment 2025-12-08T20:21:22Z: Maps: rejected by LLM; YouTube: not found' + - 'City resolved 2025-12-07T00:28:30Z: XXX->ANK via Wikidata Q3136957 coords (39.9358,32.8387) + -> Ankara (GeoNames:323786)' + - 'YouTube/Google Maps enrichment 2025-12-08T20:21:22Z: Maps: rejected by LLM; YouTube: + not found' - Canonical location normalized on 2025-12-09T13:15:40Z google_maps_status: NO_MATCH google_maps_rejected: candidate_name: T. C. Culture and Tourism Ministry Book Outlets - rejection_reason: The Google candidate is a retail store ('book_store'), which does not match the expected government organization - entity type. While it's associated with the Ministry (name match), its function and Google place type ('store') are mismatched - for the institution itself. + rejection_reason: The Google candidate is a retail store ('book_store'), which does + not match the expected government organization entity type. While it's associated + with the Ministry (name match), its function and Google place type ('store') are + mismatched for the institution itself. timestamp: '2025-12-08T20:21:21.762300+00:00' youtube_status: NOT_FOUND youtube_search_query: Ministry of Culture and Tourism official youtube_search_timestamp: '2025-12-08T20:21:22.127167+00:00' location: - region: TR-06 - region_code: '06' - country: TR - geonames_id: 323786 - normalization_timestamp: '2025-12-09T13:56:38.319515+00:00' + latitude: 39.93576 + longitude: 32.83869 +geocoding: + method: WIKIDATA_LOCATION + source: Wikidata P159 (Ankara) + wikidata_id: Q3136957 + property: P159 + timestamp: '2025-12-10T00:02:41.409656+00:00' diff --git a/data/custodian/UZ-TK-AYR-A-MBU.yaml b/data/custodian/UZ-TK-AYR-A-MBU.yaml index a24f6afc30..cd4a0d3162 100644 --- a/data/custodian/UZ-TK-AYR-A-MBU.yaml +++ b/data/custodian/UZ-TK-AYR-A-MBU.yaml @@ -6,6 +6,9 @@ original_entry: - wikidata_id: Q28028199 name: Holy Koran Mushaf of Othman country: Uzbekistan + locations: + - latitude: 41.336997 + longitude: 69.23933 processing_timestamp: '2025-12-06T20:58:12.581334+00:00' wikidata_enrichment: wikidata_entity_id: Q25527802 @@ -48,7 +51,8 @@ wikidata_enrichment: description: organizations related to Islam or Muslims - id: Q4171307 label: Spiritual Administration of the Muslims - description: religious organization of Muslims, typical for the countries of the former USSR + description: religious organization of Muslims, typical for the countries of + the former USSR wikidata_instance_of: *id001 wikidata_location: country: &id002 @@ -116,11 +120,15 @@ unesco_mow_enrichment: provenance: notes: - 'Region resolved 2025-12-06T23:32:55Z: XX->TK via Wikidata P131 (UZ-TK)' - - 'City resolved 2025-12-07T00:31:03Z: XXX->AYR via Wikidata Q25527802 coords (41.3370,69.2393) -> Ayrikuylak (GeoNames:1514505)' + - 'City resolved 2025-12-07T00:31:03Z: XXX->AYR via Wikidata Q25527802 coords (41.3370,69.2393) + -> Ayrikuylak (GeoNames:1514505)' - Canonical location normalized on 2025-12-09T13:15:50Z location: - region: UZ-TK - region_code: TK - country: UZ - geonames_id: 1514505 - normalization_timestamp: '2025-12-09T13:56:41.740388+00:00' + latitude: 41.336997 + longitude: 69.23933 +geocoding: + method: WIKIDATA_LOCATION + source: Wikidata P159 (Barakhan Madrasah) + wikidata_id: Q25527802 + property: P159 + timestamp: '2025-12-10T00:02:42.250478+00:00'