glam/data/custodian_sample/NL-NB-MIL-S-M.yaml
2025-12-11 22:32:09 +01:00

521 lines
21 KiB
YAML

original_entry:
organisatie: Stichting Myllesheem
samenwerkingsverband_platform: Brabant Cloud
systeem: Vitec Maior
linked_data: nee
wikidata_id: Q110907479
type:
- S
entry_index: 589
processing_timestamp: '2025-11-27T15:28:02.931703+00:00'
wikidata_enrichment:
wikidata_entity_id: Q110907479
api_metadata:
api_endpoint: https://www.wikidata.org/w/rest.php/wikibase/v1
fetch_timestamp: '2025-12-09T12:11:33.357078+00:00'
user_agent: GLAMDataExtractor/1.1 (glam-data@example.com) Python/httpx
enrichment_version: 2.0_full
properties_found:
- P973
- P159
- P17
- P856
- P31
wikidata_labels:
en: Stichting Myllesheem (Heemkamer)
nl: Stichting Myllesheem (Heemkamer)
wikidata_label_en: Stichting Myllesheem (Heemkamer)
wikidata_label_nl: Stichting Myllesheem (Heemkamer)
wikidata_classification:
instance_of: &id001
- id: Q5774403
label: historical society
description: organization that collects, researches, interprets and preserves information or items of historical interest
wikidata_instance_of: *id001
wikidata_location:
headquarters_location:
id: Q2745122
label: Mill, North Brabant
description: village in Land van Cuijk, the Netherlands
country: &id002
id: Q55
label: Netherlands
description: country in Northwestern Europe with territories in the Caribbean
wikidata_country: *id002
wikidata_web:
described_at_url: https://www.brabantserfgoed.nl/page/4488/stichting-myllesheem-heemkamer
official_website: https://www.myllesweerd.nl/huisgenoten/5/stichting-myllesheem
wikidata_official_website: https://www.myllesweerd.nl/huisgenoten/5/stichting-myllesheem
enrichment_status: success
provenance:
schema_version: 1.0.0
generated_at: '2025-11-28T23:26:54.818740+00:00'
sources:
original_entry:
- source_type: nde_csv_registry
data_tier: TIER_1_AUTHORITATIVE
claims_extracted:
- organisatie
- samenwerkingsverband_platform
- systeem
- linked_data
- wikidata_id
- type
wikidata:
- source_type: wikidata_api
fetch_timestamp: '2025-11-27T15:28:02.778377+00:00'
api_endpoint: https://www.wikidata.org/w/rest.php/wikibase/v1
entity_id: Q110907479
claims_extracted:
- labels
- instance_of
- country
- official_website
- claim_described_at_url
- claim_headquarters
- claim_P1343_described_by_source
- claim_P1454_legal_form
google_maps:
- source_type: google_maps_api
fetch_timestamp: '2025-11-28T09:54:35.681768+00:00'
api_endpoint: https://maps.googleapis.com/maps/api/place/textsearch
place_id: ChIJ4cemtJAax0cRyXLF0Er_zc0
claims_extracted:
- coordinates
- formatted_address
- address_components
- business_status
- website
- rating
- reviews
genealogiewerkbalk:
- source_type: genealogiewerkbalk_registry
fetch_timestamp: '2025-12-03T13:50:28.544149+00:00'
data_url: https://docs.google.com/spreadsheets/d/1rS_Z5L6L2vvfGLS6eHI8wfyiwB-KUfHEr7W1VNY3rpg/export?format=csv
match_method: google_maps_admin2
claims_extracted:
- municipality_name
- municipality_code
- municipal_archive_name
- municipal_archive_website
- municipal_archive_isil
- province_name
- province_code
- provincial_archive_name
- provincial_archive_website
data_tier_summary:
TIER_1_AUTHORITATIVE:
- original_entry (NDE CSV)
TIER_2_VERIFIED:
- wikidata_api
- google_maps_api
- genealogiewerkbalk_registry
TIER_3_CROWD_SOURCED: []
TIER_4_INFERRED:
- website_scrape
- exa_web_search
notes:
- Provenance tracking added retroactively
- claim_level_provenance available in sources section
- Canonical location normalized on 2025-12-09T12:50:50Z
qp_resolution_timestamp: '2025-11-27T20:16:10.027954+00:00'
google_maps_enrichment:
place_id: ChIJ4cemtJAax0cRyXLF0Er_zc0
name: Stichting Myllesheem
fetch_timestamp: '2025-11-28T09:54:35.681768+00:00'
api_status: OK
coordinates:
latitude: 51.6871812
longitude: 5.783085
formatted_address: Kerkstraat, 5451 BM Mill
short_address: Kerkstraat, Mill
address_components:
- long_name: Kerkstraat
short_name: Kerkstraat
types:
- route
- long_name: Mill
short_name: Mill
types:
- locality
- political
- long_name: Land van Cuijk
short_name: Land van Cuijk
types:
- administrative_area_level_2
- political
- long_name: Noord-Brabant
short_name: NB
types:
- administrative_area_level_1
- political
- long_name: Nederland
short_name: NL
types:
- country
- political
- long_name: 5451 BM
short_name: 5451 BM
types:
- postal_code
website: https://myllesheem.nl/
google_place_types:
- point_of_interest
- establishment
business_status: OPERATIONAL
rating: 4
total_ratings: 2
reviews:
- author_name: Theo Cornelissen
author_uri: https://www.google.com/maps/contrib/113827380484105315296/reviews
rating: 3
relative_time_description: 8 jaar geleden
text: Weet er weinig van
publish_time: '2017-01-16T17:32:40.940Z'
- author_name: Christ'l van der Burgt
author_uri: https://www.google.com/maps/contrib/108638365899942476076/reviews
rating: 5
relative_time_description: 3 jaar geleden
text:
publish_time: '2021-12-03T14:41:45.961459Z'
google_maps_url: https://maps.google.com/?cid=14829789844796175049&g_mp=Cidnb29nbGUubWFwcy5wbGFjZXMudjEuUGxhY2VzLlNlYXJjaFRleHQQAhgEIAA
street_view_url: https://maps.googleapis.com/maps/api/streetview?size=600x400&location=51.6871812,5.783085&key=AIzaSyAHuazNth9ZvfRFYk5-v49CwXwhABH8Ri0
icon_mask_uri: https://maps.gstatic.com/mapfiles/place_api/icons/v2/generic_pinlet
icon_background_color: '#7B9EB0'
utc_offset_minutes: 60
google_maps_status: SUCCESS
google_maps_search_query: Stichting Myllesheem, Netherlands
web_enrichment:
web_archives:
- url: https://www.myllesweerd.nl/huisgenoten/5/stichting-myllesheem
directory: web/0589/myllesweerd.nl
pages_archived: 1
archive_method: wget_warc_deep
warc_file: archive.warc.gz
warc_size_bytes: 16353
warc_format: ISO 28500
full_site_archive_timestamp: '2025-11-29T16:43:27.118602+00:00'
ghcid:
ghcid_current: NL-NB-MIL-S-M
ghcid_original: NL-NB-MIL-S-M
ghcid_uuid: a639c418-678e-5585-a85a-8d1ab9b95d5e
ghcid_uuid_sha256: 7793e402-57d5-87d4-ad5f-051bc3cb9d0c
ghcid_numeric: 8616481210804582356
record_id: 019adf94-6851-769f-b475-e043bd2c3d76
generation_timestamp: '2025-12-02T14:56:45.615377+00:00'
ghcid_history:
- ghcid: NL-NB-MIL-S-M
ghcid_numeric: 8616481210804582356
valid_from: '2025-12-02T14:56:45.615377+00:00'
valid_to:
reason: GHCID regenerated with Google Maps locality fix (Dec 2025)
location_resolution:
method: GOOGLE_MAPS_LOCALITY
google_maps_locality: Mill
geonames_id: 2750802
geonames_name: Mill
feature_code: PPL
population: 6289
admin1_code: '06'
region_code: NB
country_code: NL
source_coordinates:
latitude: 51.6871812
longitude: 5.783085
source: google_maps
geonames_id: 2750802
identifiers:
- identifier_scheme: GHCID
identifier_value: NL-NB-MIL-S-M
- identifier_scheme: GHCID_UUID
identifier_value: a639c418-678e-5585-a85a-8d1ab9b95d5e
identifier_url: urn:uuid:a639c418-678e-5585-a85a-8d1ab9b95d5e
- identifier_scheme: GHCID_UUID_SHA256
identifier_value: 7793e402-57d5-87d4-ad5f-051bc3cb9d0c
identifier_url: urn:uuid:7793e402-57d5-87d4-ad5f-051bc3cb9d0c
- identifier_scheme: GHCID_NUMERIC
identifier_value: '8616481210804582356'
- identifier_scheme: RECORD_ID
identifier_value: 019adf94-6851-769f-b475-e043bd2c3d76
identifier_url: urn:uuid:019adf94-6851-769f-b475-e043bd2c3d76
web_claims:
extraction_timestamp: '2025-12-02T08:43:47.240339+00:00'
source_archive: web/0589/myllesweerd.nl
claims_count: 14
claims:
- claim_type: org_name
claim_value: Huisgenoten
raw_value: Huisgenoten - Myllesweerd
source_url: https://www.myllesweerd.nl/huisgenoten/5/stichting-myllesheem
retrieved_on: '2025-11-29T16:43:27.086961+00:00'
xpath: /html/head/title
html_file: web/0589/myllesweerd.nl/pages/huisgenoten_5_stichting-myllesheem.tmp.html
xpath_match_score: 1.0
extraction_method: title_tag
extraction_timestamp: '2025-12-02T08:43:47.226252+00:00'
- claim_type: org_name
claim_value: Myllesweerd
raw_value: Myllesweerd
source_url: https://www.myllesweerd.nl/huisgenoten/5/stichting-myllesheem
retrieved_on: '2025-11-29T16:43:27.086961+00:00'
xpath: /html/head/meta[9]
html_file: web/0589/myllesweerd.nl/pages/huisgenoten_5_stichting-myllesheem.tmp.html
xpath_match_score: 1.0
extraction_method: og_site_name
extraction_timestamp: '2025-12-02T08:43:47.226620+00:00'
- claim_type: email
claim_value: verhuur@myllesweerd.nl
raw_value: verhuur@myllesweerd.nl
source_url: https://www.myllesweerd.nl/huisgenoten/5/stichting-myllesheem
retrieved_on: '2025-11-29T16:43:27.086961+00:00'
xpath: /html/body/div/footer/div[1]/div/div[4]/div[1]/a[2]
html_file: web/0589/myllesweerd.nl/pages/huisgenoten_5_stichting-myllesheem.tmp.html
xpath_match_score: 1.0
extraction_method: mailto_link
extraction_timestamp: '2025-12-02T08:43:47.226745+00:00'
- claim_type: social_facebook
claim_value: https://www.facebook.com/myllesweerd/
raw_value: https://www.facebook.com/myllesweerd/
source_url: https://www.myllesweerd.nl/huisgenoten/5/stichting-myllesheem
retrieved_on: '2025-11-29T16:43:27.086961+00:00'
xpath: /html/body/div/footer/div[1]/div/div[4]/div[2]/div/a[1]
html_file: web/0589/myllesweerd.nl/pages/huisgenoten_5_stichting-myllesheem.tmp.html
xpath_match_score: 1.0
extraction_method: social_link
extraction_timestamp: '2025-12-02T08:43:47.226874+00:00'
- claim_type: social_instagram
claim_value: https://www.instagram.com/myllesweerd/
raw_value: https://www.instagram.com/myllesweerd/
source_url: https://www.myllesweerd.nl/huisgenoten/5/stichting-myllesheem
retrieved_on: '2025-11-29T16:43:27.086961+00:00'
xpath: /html/body/div/footer/div[1]/div/div[4]/div[2]/div/a[2]
html_file: web/0589/myllesweerd.nl/pages/huisgenoten_5_stichting-myllesheem.tmp.html
xpath_match_score: 1.0
extraction_method: social_link
extraction_timestamp: '2025-12-02T08:43:47.226881+00:00'
- claim_type: org_name
claim_value: Onze huisgenoten en partners
raw_value: Onze huisgenoten en partners
source_url: https://www.myllesweerd.nl/huisgenoten/5/stichting-myllesheem
retrieved_on: '2025-11-29T16:43:27.086961+00:00'
xpath: /html/body/div/section[1]/div/div/h1
html_file: web/0589/myllesweerd.nl/pages/huisgenoten_5_stichting-myllesheem.tmp.html
xpath_match_score: 0.9
extraction_method: h1_tag
extraction_timestamp: '2025-12-02T08:43:47.226919+00:00'
- claim_type: collection_page
claim_value: structured_data_collection
raw_value: JSON-LD contains collection-related schema
source_url: https://www.myllesweerd.nl/huisgenoten/5/stichting-myllesheem
retrieved_on: '2025-11-29T16:43:27.086961+00:00'
xpath: /html/head/script[5]
html_file: web/0589/myllesweerd.nl/pages/huisgenoten_5_stichting-myllesheem.tmp.html
xpath_match_score: 0.85
extraction_method: schema_org_collection
extraction_timestamp: '2025-12-02T08:43:47.229699+00:00'
- claim_type: page_title
claim_value: Huisgenoten - Myllesweerd
raw_value: Huisgenoten - Myllesweerd
source_url: https://www.myllesweerd.nl/huisgenoten/5/stichting-myllesheem
retrieved_on: '2025-11-29T16:43:27.086961+00:00'
xpath: /html/head/title
html_file: web/0589/myllesweerd.nl/pages/huisgenoten_5_stichting-myllesheem.tmp.html
xpath_match_score: 1.0
extraction_method: title_tag_full
extraction_timestamp: '2025-12-02T08:43:47.229758+00:00'
- claim_type: favicon
claim_value: https://myllesweerd.nl/wp-content/uploads/2024/01/cropped-favicon-32x32.png
raw_value: sizes=32x32
source_url: https://www.myllesweerd.nl/huisgenoten/5/stichting-myllesheem
retrieved_on: '2025-11-29T16:43:27.086961+00:00'
xpath: /html/head/link[8]
html_file: web/0589/myllesweerd.nl/pages/huisgenoten_5_stichting-myllesheem.tmp.html
xpath_match_score: 1.0
extraction_method: favicon_link
extraction_timestamp: '2025-12-02T08:43:47.229791+00:00'
- claim_type: favicon
claim_value: https://myllesweerd.nl/wp-content/uploads/2024/01/cropped-favicon-192x192.png
raw_value: sizes=192x192
source_url: https://www.myllesweerd.nl/huisgenoten/5/stichting-myllesheem
retrieved_on: '2025-11-29T16:43:27.086961+00:00'
xpath: /html/head/link[9]
html_file: web/0589/myllesweerd.nl/pages/huisgenoten_5_stichting-myllesheem.tmp.html
xpath_match_score: 1.0
extraction_method: favicon_link
extraction_timestamp: '2025-12-02T08:43:47.229795+00:00'
- claim_type: favicon
claim_value: https://myllesweerd.nl/wp-content/uploads/2024/01/cropped-favicon-180x180.png
raw_value: https://myllesweerd.nl/wp-content/uploads/2024/01/cropped-favicon-180x180.png
source_url: https://www.myllesweerd.nl/huisgenoten/5/stichting-myllesheem
retrieved_on: '2025-11-29T16:43:27.086961+00:00'
xpath: /html/head/link[10]
html_file: web/0589/myllesweerd.nl/pages/huisgenoten_5_stichting-myllesheem.tmp.html
xpath_match_score: 1.0
extraction_method: favicon_link
extraction_timestamp: '2025-12-02T08:43:47.229848+00:00'
- claim_type: logo
claim_value: data:image/png;base64,iVBORw0KGgoAAAANSUhEUgAAAQ4AAAAoAQAAAAAnSCmXAAAAAnRSTlMAAHaTzTgAAAAUSURBVDjLY2AYBaNgFIyCUUBPAAAFeAABKXG5/AAAAABJRU5ErkJggg==
raw_value: 'alt=Logo '
source_url: https://www.myllesweerd.nl/huisgenoten/5/stichting-myllesheem
retrieved_on: '2025-11-29T16:43:27.086961+00:00'
xpath: /html/body/div/header/div/div/a/img
html_file: web/0589/myllesweerd.nl/pages/huisgenoten_5_stichting-myllesheem.tmp.html
xpath_match_score: 1.0
extraction_method: logo_img_attr
extraction_timestamp: '2025-12-02T08:43:47.229947+00:00'
- claim_type: logo
claim_value: https://myllesweerd.nl/wp-content/uploads/2023/10/Myllesweerd.svg
raw_value: 'alt=Logo '
source_url: https://www.myllesweerd.nl/huisgenoten/5/stichting-myllesheem
retrieved_on: '2025-11-29T16:43:27.086961+00:00'
xpath: /html/body/div/header/div/div/a/noscript/img
html_file: web/0589/myllesweerd.nl/pages/huisgenoten_5_stichting-myllesheem.tmp.html
xpath_match_score: 1.0
extraction_method: logo_img_attr
extraction_timestamp: '2025-12-02T08:43:47.229955+00:00'
- claim_type: ui_login
claim_value: https://www.myllesweerd.nl/vrijwilligers/login
raw_value: text=vrijwilligers systeem, pattern=login
source_url: https://www.myllesweerd.nl/huisgenoten/5/stichting-myllesheem
retrieved_on: '2025-11-29T16:43:27.086961+00:00'
xpath: /html/body/div/footer/div[2]/div/ul/li[3]/a
html_file: web/0589/myllesweerd.nl/pages/huisgenoten_5_stichting-myllesheem.tmp.html
xpath_match_score: 1.0
extraction_method: login_button
extraction_timestamp: '2025-12-02T08:43:47.231345+00:00'
custodian_name:
claim_type: custodian_name
claim_value: Myllesheem
source: google_maps
confidence: 0.715
consensus_method: true
sources_checked: 6
sources_matched: 4
extraction_timestamp: '2025-12-02T13:07:52.808982+00:00'
matching_sources:
- source: wikidata
name: Myllesheem (Heemkamer)
score: 1.0
- source: original_entry
name: Myllesheem
score: 1.0
- source: web_og_site_name
name: Myllesweerd
score: 0.78
previous_value: Stichting Myllesheem (Heemkamer)
previous_source: wikidata
custodian_legal_name:
claim_type: legal_name
claim_value: Stichting Myllesheem (Heemkamer)
extraction_timestamp: '2025-12-02T13:07:52.808991+00:00'
note: Legal form detected in source name (e.g., Stichting, Vereniging, B.V.)
genealogiewerkbalk_enrichment:
source: Genealogiewerkbalk.nl Municipality Archives Registry
source_url: https://www.genealogiewerkbalk.nl/archieven.html
data_url: https://docs.google.com/spreadsheets/d/1rS_Z5L6L2vvfGLS6eHI8wfyiwB-KUfHEr7W1VNY3rpg/export?format=csv
data_tier: TIER_2_VERIFIED
enrichment_timestamp: '2025-12-03T13:50:28.544136+00:00'
match_method: google_maps_admin2
match_confidence: 0.95
municipality:
name: Land van Cuijk
code: '1982'
municipal_archive:
name: Brabants Historisch Informatie Centrum
website: https://www.bhic.nl/het-geheugen-van-brabant
isil: NL-HtBHIC
province:
name: Noord-Brabant
code: '30'
provincial_archive:
name: Brabants Historisch Informatie Centrum
website: https://www.bhic.nl/
digital_platforms:
- platform_name: Stichting Myllesheem Website
platform_url: https://www.myllesweerd.nl/huisgenoten/5/stichting-myllesheem
platform_type: WEBSITE
platform_category:
- Organizational website
digital_collections: Organizational website
technology_stack: Vitec Maior
data_standards:
- HTML5
user_services: General information, Contact
sustainability_model: Institutional funding
enrichment_timestamp: '2025-12-05T11:18:54.864707+00:00'
source_method: automated_extraction
unesco_ich_enrichment:
country_code: NL
total_elements_in_country: 5
enrichment_timestamp: '2025-12-06T20:20:03.944111+00:00'
elements:
- unesco_ich_id: '1870'
name: Rotterdam Summer Carnival
list_type: RL
list_name: Representative List of the Intangible Cultural Heritage of Humanity
inscription_year: 2023
multinational: false
url: https://ich.unesco.org/en/RL/rotterdam-summer-carnival-01870
description: The Rotterdam Summer Carnival is a multicultural celebration that unites participants from the Caribbean
and European Netherlands, as well as ethnic minority groups from Central and South America and Africa living in the
Netherlands. The event includes a street parade, a brass band competition and a...
- unesco_ich_id: '1979'
name: 'Traditional irrigation: knowledge, technique, and organization'
list_type: RL
list_name: Representative List of the Intangible Cultural Heritage of Humanity
inscription_year: 2023
multinational: true
url: https://ich.unesco.org/en/RL/traditional-irrigation-knowledge-technique-and-organization-01979
description: Traditional irrigation uses gravity and hand-made constructions such as channels and ditches to distribute
water from naturally-occurring water catchment points (such as springs, streams and glaciers) to the fields. Practitioners
choose specific days and periods to manually divert the water, and the...
- unesco_ich_id: '1707'
name: Corso culture, flower and fruit parades in the Netherlands
list_type: RL
list_name: Representative List of the Intangible Cultural Heritage of Humanity
inscription_year: 2021
multinational: false
url: https://ich.unesco.org/en/RL/corso-culture-flower-and-fruit-parades-in-the-netherlands-01707
description: Dating back to the late nineteenth century, a corso is an annual parade of floats or boats decorated with
flowers, fruit, vegetables and, in some cases, people in costumes. Originating in the south of France and Italy, the
practice spread to the Netherlands in the nineteenth century. The parade take...
- unesco_ich_id: '1708'
name: Falconry, a living human heritage
list_type: RL
list_name: Representative List of the Intangible Cultural Heritage of Humanity
inscription_year: 2021
multinational: true
url: https://ich.unesco.org/en/RL/falconry-a-living-human-heritage-01708
description: Falconry is the traditional art and practice of training and flying falcons (and sometimes eagles, hawks,
buzzards and other birds of prey). It has been practised for over 4000 years. The practice of falconry in early and
medieval periods of history is documented in many parts of the world. Original...
- unesco_ich_id: '1265'
name: Craft of the miller operating windmills and watermills
list_type: RL
list_name: Representative List of the Intangible Cultural Heritage of Humanity
inscription_year: 2017
multinational: false
url: https://ich.unesco.org/en/RL/craft-of-the-miller-operating-windmills-and-watermills-01265
description: The craft of the miller operating windmills and watermills involves the knowledge and skills necessary to
operate a mill and maintain it in a good state of repair. With a declining number of people earning their livelihood
from the craft, millers today also play a key role in transmitting the cultur...
location:
latitude: 51.6871812
longitude: 5.783085
coordinate_provenance:
source_type: GOOGLE_MAPS
source_path: google_maps_enrichment.coordinates
original_timestamp: '2025-11-28T09:54:35.681768+00:00'
entity_id: ChIJ4cemtJAax0cRyXLF0Er_zc0
api_endpoint: https://maps.googleapis.com/maps/api/place/textsearch
city: Mill
region: Noord-Brabant
region_code: NB
country: NL
postal_code: 5451 BM
street_address: Kerkstraat, Mill
formatted_address: Kerkstraat, 5451 BM Mill
geonames_id: 2750802
geonames_name: Mill
feature_code: PPL
normalization_timestamp: '2025-12-09T12:50:50.636056+00:00'