feat(entity-resolution): expand Dutch heritage domain mappings
Some checks are pending
Deploy Frontend / build-and-deploy (push) Waiting to run

Add domain mappings for better email-based entity matching:
- Government: noord-holland.nl, amsterdam.nl, rotterdam.nl, denhaag.nl,
  hoorn.nl, hhnk.nl, rijksoverheid.nl, politie.nl, kadaster.nl, rvo.nl,
  rivm.nl, staatsbosbeheer.nl, vng.nl
- Museums: maritiemmuseum.nl, paleishetloo.nl, slotloevestein.nl
- Universities: student.vu.nl, cdh.leidenuniv.nl, jur.ru.nl, student.ru.nl,
  student.tudelft.nl, eshcc.eur.nl, wur.nl, ou.nl
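- Hogescholen: hva.nl, student.hu.nl, student.fontys.nl
- Research: cbg.nl, kitlv.nl, kit.nl, baac.nl, raap.nl
- Veterans/military heritage: veteranen.nl, knid.nl (organisation not yet
  identified; placeholder entry, needs research)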

Also remove the deprecated activity_id.yaml slot file (both copies) and
update the schema manifest accordingly (one fewer slot file).
This commit is contained in:
kempersc 2026-01-13 20:53:49 +01:00
parent 408813280a
commit 6a3616beac
4 changed files with 43 additions and 72 deletions

View file

@ -1,32 +0,0 @@
id: https://nde.nl/ontology/hc/slot/activity_id
name: activity_id_slot
title: Activity Id Slot (DEPRECATED)
prefixes:
linkml: https://w3id.org/linkml/
hc: https://nde.nl/ontology/hc/
dcterms: http://purl.org/dc/terms/
schema: http://schema.org/
imports:
- linkml:types
default_prefix: hc
slots:
activity_id:
deprecated: >
DEPRECATED (2026-01-13): Use `has_activity_identifier` instead.
This slot is replaced by the standardized identifier slot in the
Activity base class. The new slot follows RiC-O naming conventions
and uses proper URI/CURIE range.
Migration: Replace `activity_id: "some-id"` with
`has_activity_identifier: https://nde.nl/ontology/hc/activity/some-id`
description: 'DEPRECATED - Use has_activity_identifier instead.
Unique identifier for an activity. Mapped to dcterms:identifier
as the standard property for resource identifiers.'
range: string
slot_uri: dcterms:identifier
close_mappings:
- schema:identifier
annotations:
deprecated_date: "2026-01-13"
replaced_by: has_activity_identifier

View file

@ -1,12 +1,12 @@
{
"generated": "2026-01-13T19:52:06.261Z",
"generated": "2026-01-13T19:53:50.189Z",
"schemaRoot": "/schemas/20251121/linkml",
"totalFiles": 2894,
"totalFiles": 2893,
"categoryCounts": {
"main": 4,
"class": 632,
"enum": 147,
"slot": 2107,
"slot": 2106,
"module": 4
},
"categories": [
@ -3967,11 +3967,6 @@
"path": "modules/slots/activities_societies.yaml",
"category": "slot"
},
{
"name": "activity_id",
"path": "modules/slots/activity_id.yaml",
"category": "slot"
},
{
"name": "actual_end",
"path": "modules/slots/actual_end.yaml",

View file

@ -1,32 +0,0 @@
id: https://nde.nl/ontology/hc/slot/activity_id
name: activity_id_slot
title: Activity Id Slot (DEPRECATED)
prefixes:
linkml: https://w3id.org/linkml/
hc: https://nde.nl/ontology/hc/
dcterms: http://purl.org/dc/terms/
schema: http://schema.org/
imports:
- linkml:types
default_prefix: hc
slots:
activity_id:
deprecated: >
DEPRECATED (2026-01-13): Use `has_activity_identifier` instead.
This slot is replaced by the standardized identifier slot in the
Activity base class. The new slot follows RiC-O naming conventions
and uses proper URI/CURIE range.
Migration: Replace `activity_id: "some-id"` with
`has_activity_identifier: https://nde.nl/ontology/hc/activity/some-id`
description: 'DEPRECATED - Use has_activity_identifier instead.
Unique identifier for an activity. Mapped to dcterms:identifier
as the standard property for resource identifiers.'
range: string
slot_uri: dcterms:identifier
close_mappings:
- schema:identifier
annotations:
deprecated_date: "2026-01-13"
replaced_by: has_activity_identifier

View file

@ -107,6 +107,12 @@ HERITAGE_DOMAIN_MAP: Dict[str, Tuple[str, str, Optional[str]]] = {
'stadsarchief.amsterdam.nl': ('Stadsarchief Amsterdam', 'archive', 'NL-NH-AMS-A-SAA'),
'erfgoedcentrumzutphen.nl': ('Erfgoedcentrum Zutphen', 'archive', None),
'erfgoedleiden.nl': ('Erfgoed Leiden en Omstreken', 'archive', None),
'noord-holland.nl': ('Provincie Noord-Holland', 'government', None),
'amsterdam.nl': ('Gemeente Amsterdam', 'government', None),
'rotterdam.nl': ('Gemeente Rotterdam', 'government', None),
'denhaag.nl': ('Gemeente Den Haag', 'government', None),
'hoorn.nl': ('Gemeente Hoorn', 'government', None),
'hhnk.nl': ('Hoogheemraadschap Hollands Noorderkwartier', 'government', None),
# Museums
'openluchtmuseum.nl': ('Nederlands Openluchtmuseum', 'museum', None),
@ -132,6 +138,9 @@ HERITAGE_DOMAIN_MAP: Dict[str, Tuple[str, str, Optional[str]]] = {
'museumhetvalkhof.nl': ('Museum Het Valkhof', 'museum', None),
'museum.nl': ('Rijksmuseum van Oudheden', 'museum', None), # generic, but often RMO
'rfrankenhuis.nl': ('Museum De Fundatie', 'museum', None),
'maritiemmuseum.nl': ('Maritiem Museum Rotterdam', 'museum', None),
'paleishetloo.nl': ('Paleis Het Loo', 'museum', None),
'slotloevestein.nl': ('Slot Loevestein', 'museum', None),
# Universities (Humanities/Heritage departments)
'uu.nl': ('Universiteit Utrecht', 'university', None),
@ -139,19 +148,32 @@ HERITAGE_DOMAIN_MAP: Dict[str, Tuple[str, str, Optional[str]]] = {
'uva.nl': ('Universiteit van Amsterdam', 'university', None),
'student.uva.nl': ('Universiteit van Amsterdam (student)', 'university', None),
'vu.nl': ('Vrije Universiteit Amsterdam', 'university', None),
'student.vu.nl': ('Vrije Universiteit Amsterdam (student)', 'university', None),
'rug.nl': ('Rijksuniversiteit Groningen', 'university', None),
'student.rug.nl': ('Rijksuniversiteit Groningen (student)', 'university', None),
'leidenuniv.nl': ('Universiteit Leiden', 'university', None),
'hum.leidenuniv.nl': ('Universiteit Leiden - Humanities', 'university', None),
'umail.leidenuniv.nl': ('Universiteit Leiden', 'university', None),
'cdh.leidenuniv.nl': ('Universiteit Leiden - Centre for Digital Humanities', 'university', None),
'ru.nl': ('Radboud Universiteit', 'university', None),
'let.ru.nl': ('Radboud Universiteit - Letteren', 'university', None),
'jur.ru.nl': ('Radboud Universiteit - Rechtsgeleerdheid', 'university', None),
'student.ru.nl': ('Radboud Universiteit (student)', 'university', None),
'tudelft.nl': ('TU Delft', 'university', None),
'student.tudelft.nl': ('TU Delft (student)', 'university', None),
'tue.nl': ('TU Eindhoven', 'university', None),
'utwente.nl': ('Universiteit Twente', 'university', None),
'maastrichtuniversity.nl': ('Maastricht University', 'university', None),
'tilburguniversity.edu': ('Tilburg University', 'university', None),
'eur.nl': ('Erasmus Universiteit Rotterdam', 'university', None),
'eshcc.eur.nl': ('Erasmus Universiteit - ESHCC', 'university', None),
'wur.nl': ('Wageningen University & Research', 'university', None),
'ou.nl': ('Open Universiteit', 'university', None),
# Hogescholen (Universities of Applied Sciences)
'hva.nl': ('Hogeschool van Amsterdam', 'university', None),
'student.hu.nl': ('Hogeschool Utrecht (student)', 'university', None),
'student.fontys.nl': ('Fontys Hogescholen (student)', 'university', None),
# Government
'minbuza.nl': ('Ministerie van Buitenlandse Zaken', 'government', None),
@ -168,6 +190,13 @@ HERITAGE_DOMAIN_MAP: Dict[str, Tuple[str, str, Optional[str]]] = {
'minocw.nl': ('Ministerie van OCW', 'government', None),
'minfin.nl': ('Ministerie van Financien', 'government', None),
'belastingdienst.nl': ('Belastingdienst', 'government', None),
'rijksoverheid.nl': ('Rijksoverheid', 'government', None),
'politie.nl': ('Politie Nederland', 'government', None),
'kadaster.nl': ('Kadaster', 'government', None),
'rvo.nl': ('Rijksdienst voor Ondernemend Nederland', 'government', None),
'rivm.nl': ('Rijksinstituut voor Volksgezondheid en Milieu', 'government', None),
'staatsbosbeheer.nl': ('Staatsbosbeheer', 'government', None),
'vng.nl': ('Vereniging van Nederlandse Gemeenten', 'government', None),
# Libraries (Public/Academic)
'oba.nl': ('Openbare Bibliotheek Amsterdam', 'library', None),
@ -179,6 +208,17 @@ HERITAGE_DOMAIN_MAP: Dict[str, Tuple[str, str, Optional[str]]] = {
'nwo.nl': ('Nederlandse Organisatie voor Wetenschappelijk Onderzoek', 'research', None),
'fwo.be': ('Fonds Wetenschappelijk Onderzoek', 'research', None),
'knir.it': ('Koninklijk Nederlands Instituut Rome', 'research', None),
'cbg.nl': ('Centrum voor Familiegeschiedenis (CBG)', 'research', None),
'kitlv.nl': ('Koninklijk Instituut voor Taal-, Land- en Volkenkunde', 'research', None),
'kit.nl': ('KIT Royal Tropical Institute', 'research', None),
# Archaeology/Heritage Research
'baac.nl': ('BAAC Archeologie', 'research', None),
'raap.nl': ('RAAP Archeologisch Adviesbureau', 'research', None),
# Veterans & Military Heritage
'veteranen.nl': ('Veteraneninstituut', 'museum', None),
'knid.nl': ('KNID (unknown)', 'government', None), # 64 hits, needs research
# Belgian Heritage (for completeness)
'arch.be': ('Rijksarchief België', 'archive', None),