glam/data/custodian/NL-OV-DEV-M-MW.yaml
kempersc bd06e4f864 data(custodian): merge 135 PENDING files into existing enriched records
Merge data from PENDING files (with XX-XXX placeholders) into their
corresponding enriched custodian records with proper GHCIDs.

Countries affected:
- DE: 4 institutions (Deutsche Stiftung, Jewish Museum Berlin, etc.)
- ES: 1 institution (Biblioteca Nacional de España)
- FR: 1 institution (NMO)
- ID: 18 Indonesian museums and archives
- NL: 111 Dutch institutions across all provinces
- US: 1 institution (ARCA)

The PENDING files are deleted after merge; originals archived in
data/custodian/archive/pending_merged_20250109/
2026-01-09 18:25:56 +01:00

106 lines
3.8 KiB
YAML

custodian_name:
emic_name: Museum De Waag
emic_name_source: linkedin
institution_type:
- M
linkedin_enrichment:
linkedin_url: https://www.linkedin.com/company/museum-de-waag
linkedin_slug: museum-de-waag
industry: Museums, Historical Sites, and Zoos
website: https://museumstevensweert.nl/nl
follower_count: null
staff_count: 2
heritage_staff_count: 2
heritage_staff:
- name: Henkjan Sprokholt
headline: 'Historisch onderzoeker: onderzoekt en visualiseert geschiedenis voor tentoonstellingen en publicaties'
linkedin_url: https://www.linkedin.com/in/henkjan-sprokholt-33195122
heritage_type: R
- name: Simon Kemper
headline: 'Historisch onderzoeker: onderzoekt en visualiseert geschiedenis voor tentoonstellingen en publicaties'
linkedin_url: https://www.linkedin.com/in/rebeccascholten
heritage_type: R
enrichment_timestamp: '2025-12-16T21:06:39.584400+00:00'
provenance:
source: linkedin_company_scrape
original_file: data/custodian/linkedin/museum-de-waag.yaml
schema_version: 1.0.0
location:
city: Deventer
region: OV
country: NL
coordinates:
latitude: 52.2514472
longitude: 6.159973
ghcid:
ghcid_current: NL-OV-DEV-M-MW
ghcid_original: NL-OV-XXX-M-MW
location_resolution:
method: WIKIDATA_GEONAMES_LOOKUP
wikidata_id: Q40304752
geonames_id: 2756987
city_name: Deventer
city_code: DEV
region_code: OV
country_code: NL
resolution_date: '2025-12-19T12:18:36.061356+00:00'
ghcid_history:
- ghcid: NL-OV-DEV-M-MW
valid_from: '2025-12-19T12:18:36.061356+00:00'
valid_to: null
reason: Location resolved via Wikidata (Q40304752) + GeoNames reverse geocoding
- ghcid: NL-OV-XXX-M-MW
ghcid_numeric: 570291831435702087
valid_from: '2025-12-16T21:06:39.584400+00:00'
valid_to: null
reason: Initial GHCID assignment from LinkedIn batch import
provenance:
schema_version: 1.0.0
generated_at: '2025-12-16T21:06:39.584400+00:00'
sources:
linkedin:
- source_type: linkedin_company_profile
data_tier: TIER_4_INFERRED
source_file: data/custodian/linkedin/museum-de-waag.yaml
extraction_timestamp: '2025-12-16T21:06:39.584400+00:00'
claims_extracted:
- name
- industry
- location
- website
- staff_count
- heritage_staff
data_tier_summary:
TIER_4_INFERRED:
- linkedin_company_profile
notes:
- Created from unmatched LinkedIn company profile
- 'Location resolution method: PROVINCE_FROM_CITY_FIELD'
- Staff data merged from NL-XX-XXX-PENDING-MUSEUM-DE-WAAG.yaml on 2026-01-09T15:45:37.094991+00:00
identifiers:
- identifier_scheme: Wikidata
identifier_value: Q40304752
identifier_url: https://www.wikidata.org/wiki/Q40304752
staff:
provenance:
source_type: linkedin_company_people_page_html
registered_timestamp: '2025-12-30T09:57:02Z'
registration_method: html_parsing_with_full_staff_data
total_staff_extracted: 2
staff_list:
- staff_id: museum-de-waag_staff_0000_henkjan_sprokholt
person_name: Henkjan Sprokholt
person_profile_path: data/custodian/person/entity/henkjan-sprokholt-33195122_*.json
role_title: 'Historisch onderzoeker: onderzoekt en visualiseert geschiedenis voor tentoonstellingen en publicaties'
heritage_relevant: true
heritage_type: R
linkedin_profile_url: https://www.linkedin.com/in/henkjan-sprokholt-33195122
linkedin_slug: henkjan-sprokholt-33195122
- staff_id: museum-de-waag_staff_0001_simon_kemper
person_name: Simon Kemper
person_profile_path: data/custodian/person/entity/rebeccascholten_*.json
role_title: 'Historisch onderzoeker: onderzoekt en visualiseert geschiedenis voor tentoonstellingen en publicaties'
heritage_relevant: true
heritage_type: R
linkedin_profile_url: https://www.linkedin.com/in/rebeccascholten
linkedin_slug: rebeccascholten