- Improved city name normalization to handle: - St. Gallen / St.Gallen -> Sankt Gallen - Canton suffixes (Buchs SG, Brugg AG) - Hyphenated districts (Bernex - Genève) - Postal codes with slashes (Ecublens/VD) - German prepositions (Hausen b. Brugg) - Created scripts/geocode_from_city_name.py for unified geocoding
146 lines
5.2 KiB
YAML
146 lines
5.2 KiB
YAML
original_entry:
|
|
name: Bibliothèque de l'Université de Genève. Uni Mail. PEB
|
|
institution_type: LIBRARY
|
|
source: CH-Annotator (switzerland_isil_ch_annotator.yaml)
|
|
identifiers:
|
|
- &id001
|
|
identifier_scheme: ISIL
|
|
identifier_value: CH-001810-2
|
|
identifier_url: https://www.isil.nb.admin.ch/en/?isil=CH-001810-2
|
|
- &id002
|
|
identifier_scheme: Website
|
|
identifier_value: https://www.unige.ch/biblio/fr/services/peb/
|
|
identifier_url: https://www.unige.ch/biblio/fr/services/peb/
|
|
locations:
|
|
- region: GE
|
|
country: CH
|
|
city: Genève 4
|
|
postal_code: '1211'
|
|
street_address: Bd du Pont d'Arve 40
|
|
processing_timestamp: '2025-12-06T23:39:09.973972+00:00'
|
|
ghcid:
|
|
ghcid_current: CH-GE-G4-L-BLUGUMP
|
|
ghcid_original: CH-GE-XXX-L-BLUGUMP
|
|
ghcid_uuid: 4984612a-0382-5119-a511-d50ca71cf35b
|
|
ghcid_uuid_sha256: cee8accf-3d8e-842e-b096-0bb537af04ef
|
|
ghcid_numeric: 14909356572501001262
|
|
record_id: 48b79326-9200-4192-a9ea-2fe148a103db
|
|
generation_timestamp: '2025-12-06T23:39:09.973972+00:00'
|
|
location_resolution:
|
|
method: SWISS_ISIL_ENRICHMENT
|
|
city_name: Genève 4
|
|
city_code: G4
|
|
region_code: GE
|
|
country_code: CH
|
|
enrichment_date: '2025-12-07T01:11:36.206676+00:00'
|
|
source_url: https://www.isil.nb.admin.ch/en/institutions/bibliotheque-de-luniversite-de-geneve-uni-mail-peb-ch-001810-2/?page=20
|
|
ghcid_history:
|
|
- ghcid: CH-GE-G4-L-BLUGUMP
|
|
ghcid_numeric: 14909356572501001262
|
|
valid_from: '2025-12-07T01:11:36.206676+00:00'
|
|
valid_to:
|
|
reason: 'City code updated from Swiss ISIL enrichment: Genève 4 -> G4'
|
|
- ghcid: CH-GE-XXX-L-BLUGUMP
|
|
ghcid_numeric: 10848667176016888002
|
|
valid_from: '2025-12-06T23:39:09.973972+00:00'
|
|
reason: Initial GHCID from CH-Annotator (switzerland_isil_ch_annotator.yaml)
|
|
valid_to: '2025-12-07T01:11:36.206676+00:00'
|
|
custodian_name:
|
|
claim_type: custodian_name
|
|
claim_value: Bibliothèque de l'Université de Genève. Uni Mail. PEB
|
|
source_type: ch_annotator
|
|
identifiers:
|
|
- identifier_scheme: GHCID
|
|
identifier_value: CH-GE-G4-L-BLUGUMP
|
|
- identifier_scheme: GHCID_UUID
|
|
identifier_value: 07dc4d64-920c-570a-be6f-c2c590e1de5d
|
|
- identifier_scheme: GHCID_UUID_SHA256
|
|
identifier_value: 968e3551-60ed-80c2-dcbc-c84bc758b94e
|
|
- identifier_scheme: GHCID_NUMERIC
|
|
identifier_value: '10848667176016888002'
|
|
- identifier_scheme: RECORD_ID
|
|
identifier_value: 48b79326-9200-4192-a9ea-2fe148a103db
|
|
- *id001
|
|
- *id002
|
|
provenance:
|
|
data_source: CSV_REGISTRY
|
|
data_tier: TIER_1_AUTHORITATIVE
|
|
extraction_date: '2025-11-19T09:22:31.448266'
|
|
extraction_method: 'Created from CH-Annotator file: switzerland_isil_ch_annotator.yaml'
|
|
confidence_score: 0.95
|
|
notes:
|
|
- Canonical location added via normalize_custodian_files.py on 2025-12-08T23:11:03Z
|
|
- Canonical location added via normalize_custodian_files.py on 2025-12-08T23:47:22Z
|
|
- Canonical location added via normalize_custodian_files.py on 2025-12-09T06:48:46Z
|
|
- 'YouTube/Google Maps enrichment 2025-12-09T09:09:40Z: YouTube: not found'
|
|
ch_annotator:
|
|
convention_id: ch_annotator-v1_7_0
|
|
convention_version: 1.7.0
|
|
entity_classification:
|
|
hypernym: GRP
|
|
hypernym_label: GROUP
|
|
subtype: GRP.HER.LIB
|
|
subtype_label: LIBRARY
|
|
ontology_class: schema:Library
|
|
alternative_classes:
|
|
- org:FormalOrganization
|
|
- rov:RegisteredOrganization
|
|
- glam:HeritageCustodian
|
|
extraction_provenance:
|
|
namespace: glam
|
|
path: /files/switzerland_isil.yaml
|
|
timestamp: '2025-11-19T09:22:31.448266'
|
|
agent: claude-conversation
|
|
context_convention: ch_annotator-v1_7_0
|
|
annotation_provenance:
|
|
annotation_agent: opencode-claude-sonnet-4
|
|
annotation_date: '2025-12-06T21:13:14.508879+00:00'
|
|
annotation_method: retroactive CH-Annotator application via batch script
|
|
source_file: switzerland_isil.yaml
|
|
annotation_metadata:
|
|
confidence_score: 0.95
|
|
verified: false
|
|
verification_date:
|
|
verified_by:
|
|
entity_claims:
|
|
- claim_type: full_name
|
|
claim_value: Bibliothèque de l'Université de Genève. Uni Mail. PEB
|
|
property_uri: skos:prefLabel
|
|
provenance:
|
|
namespace: glam
|
|
path: /files/switzerland_isil.yaml
|
|
timestamp: '2025-11-19T09:22:31.448266'
|
|
agent: claude-conversation
|
|
context_convention: ch_annotator-v1_7_0
|
|
confidence: 0.95
|
|
- claim_type: institution_type
|
|
claim_value: LIBRARY
|
|
property_uri: rdf:type
|
|
provenance:
|
|
namespace: glam
|
|
path: /files/switzerland_isil.yaml
|
|
timestamp: '2025-11-19T09:22:31.448266'
|
|
agent: claude-conversation
|
|
context_convention: ch_annotator-v1_7_0
|
|
confidence: 0.95
|
|
integration_note:
|
|
created_from: switzerland_isil_ch_annotator.yaml
|
|
creation_date: '2025-12-06T23:39:09.973972+00:00'
|
|
creation_method: create_custodian_from_ch_annotator.py
|
|
location:
|
|
city: Genève 4
|
|
region: GE
|
|
region_code: GE
|
|
country: CH
|
|
postal_code: '1211'
|
|
street_address: Bd du Pont d'Arve 40
|
|
normalization_timestamp: '2025-12-09T13:21:46.788090+00:00'
|
|
latitude: 46.20222
|
|
longitude: 6.14569
|
|
geonames_id: 2660646
|
|
geocoding_timestamp: '2025-12-09T21:28:44.467592+00:00'
|
|
geocoding_method: CITY_NAME_LOOKUP
|
|
geonames_matched_name: Genève
|
|
youtube_status: NOT_FOUND
|
|
youtube_search_query: Bibliothèque de l'Université de Genève. Uni Mail. PEB official
|
|
youtube_search_timestamp: '2025-12-09T09:09:40.482571+00:00'
|