glam/data/custodian/NL-NH-SPA-S-HWS.yaml
2026-01-18 01:23:32 +01:00

452 lines
16 KiB
YAML
Raw Blame History

This file contains ambiguous Unicode characters

This file contains Unicode characters that might be confused with other characters. If you think that this is intentional, you can safely ignore this warning. Use the Escape button to reveal them.

original_entry:
plaatsnaam_bezoekadres: Spaarndam
organisatie: Historische Werkgroep Spaarndam
systeem: ZCBS
reference:
- label: https://historischewerkgroepspaarndam.nl/
type:
- S
entry_index: 693
processing_timestamp: '2025-11-27T16:34:40.639535+00:00'
enrichment_status: skipped
provenance:
schema_version: 1.0.0
generated_at: '2025-11-28T23:47:22.638639+00:00'
sources:
original_entry:
- source_type: nde_csv_registry
data_tier: TIER_1_AUTHORITATIVE
claims_extracted:
- plaatsnaam_bezoekadres
- organisatie
- systeem
- reference
- type
google_maps:
- source_type: google_maps_api
fetch_timestamp: '2025-11-28T09:55:39.784931+00:00'
api_endpoint: https://maps.googleapis.com/maps/api/place/textsearch
place_id: ChIJSSAiq2vlxUcRuAshVtl5z3g
claims_extracted:
- coordinates
- formatted_address
- address_components
- business_status
- website
- phone
- rating
- reviews
genealogiewerkbalk:
- source_type: genealogiewerkbalk_registry
fetch_timestamp: '2025-12-03T13:50:49.459020+00:00'
data_url: https://docs.google.com/spreadsheets/d/1rS_Z5L6L2vvfGLS6eHI8wfyiwB-KUfHEr7W1VNY3rpg/export?format=csv
match_method: google_maps_admin2
claims_extracted:
- municipality_name
- municipality_code
- municipal_archive_name
- municipal_archive_website
- municipal_archive_isil
- province_name
- province_code
- provincial_archive_name
- provincial_archive_website
linkup_timespan:
- source_type: linkup_web_search
fetch_timestamp: '2025-12-15T20:05:00.535823+00:00'
search_query: '"Historische Werkgroep Spaarndam" Spaarndam opgericht OR gesticht
OR sinds'
source_urls:
- https://historischewerkgroepspaarndam.nl/historie/1950-de-strijd-tegen-het-water/
- https://historischewerkgroepspaarndam.nl/historie/1851-de-post-wordt-bezorgd/
- http://peter-perger.blogspot.com/2013/02/geen-blakwannes.html
- https://dorpsraadspaarndam.nl/category/verkeer/
- https://www.historisch-zaandam.nl/category/historie/
claims_extracted:
- timespan_begin
data_tier: TIER_4_INFERRED
archive_path: data/custodian/web/0693/linkup/linkup_founding_20251215T200500Z.json
data_tier_summary:
TIER_1_AUTHORITATIVE:
- original_entry (NDE CSV)
TIER_2_VERIFIED:
- wikidata_api
- google_maps_api
- genealogiewerkbalk_registry
TIER_3_CROWD_SOURCED: []
TIER_4_INFERRED:
- website_scrape
- exa_web_search
notes:
- Provenance tracking added retroactively
- claim_level_provenance available in sources section
- Canonical location added via normalize_custodian_files.py on 2025-12-08T23:18:35Z
- Canonical location added via normalize_custodian_files.py on 2025-12-09T07:07:17Z
skip_reason: no_wikidata_id
google_maps_enrichment:
place_id: ChIJSSAiq2vlxUcRuAshVtl5z3g
name: Historische Werkgroep Spaarndam
fetch_timestamp: '2025-11-28T09:55:39.784931+00:00'
api_status: OK
coordinates:
latitude: 52.41322100000001
longitude: 4.6939003999999995
formatted_address: Van der Burchstraat 20, 2064 WK Spaarndam
short_address: Van der Burchstraat 20, Spaarndam
address_components:
- long_name: '20'
short_name: '20'
types:
- street_number
- long_name: Van der Burchstraat
short_name: Van der Burchstraat
types:
- route
- long_name: Spaarndam
short_name: Spaarndam
types:
- locality
- political
- long_name: Haarlemmermeer
short_name: Haarlemmermeer
types:
- administrative_area_level_2
- political
- long_name: Noord-Holland
short_name: NH
types:
- administrative_area_level_1
- political
- long_name: Nederland
short_name: NL
types:
- country
- political
- long_name: 2064 WK
short_name: 2064 WK
types:
- postal_code
phone_local: 06 54225208
phone_international: +31 6 54225208
website: http://historischewerkgroepspaarndam.nl/
google_place_types:
- point_of_interest
- establishment
business_status: OPERATIONAL
rating: 5
total_ratings: 2
reviews:
- author_name: Timo Baas
author_uri: https://www.google.com/maps/contrib/105205936237706223595/reviews
rating: 5
relative_time_description: 6 jaar geleden
text: null
publish_time: '2019-08-20T21:28:29.360221Z'
- author_name: Erwin Beijer
author_uri: https://www.google.com/maps/contrib/117278778601415753999/reviews
rating: 5
relative_time_description: 6 jaar geleden
text: null
publish_time: '2019-08-02T19:03:37.386268Z'
google_maps_url: https://maps.google.com/?cid=8705310579090328504&g_mp=Cidnb29nbGUubWFwcy5wbGFjZXMudjEuUGxhY2VzLlNlYXJjaFRleHQQAhgEIAA
street_view_url: https://maps.googleapis.com/maps/api/streetview?size=600x400&location=52.41322100000001,4.6939003999999995&key=AIzaSyAHuazNth9ZvfRFYk5-v49CwXwhABH8Ri0
icon_mask_uri: https://maps.gstatic.com/mapfiles/place_api/icons/v2/generic_pinlet
icon_background_color: '#7B9EB0'
utc_offset_minutes: 60
google_maps_status: SUCCESS
google_maps_search_query: Historische Werkgroep Spaarndam, Spaarndam, Netherlands
web_enrichment:
web_archives:
- url: https://historischewerkgroepspaarndam.nl/
directory: web/0693/historischewerkgroepspaarndam.nl
pages_archived: 20
archive_method: wget_warc_deep
warc_file: archive.warc.gz
warc_size_bytes: 426390
warc_format: ISO 28500
full_site_archive_timestamp: '2025-11-29T17:02:46.243143+00:00'
zcbs_enrichment:
zcbs_id: 8
zcbs_name: Stichting Werkgroep Oud-Castricum
platform_urls:
objects: http://www.oud-castricum.nl/cgi-bin/objecten.pl
photos: http://www.oud-castricum.nl/cgi-bin/beeldbank.pl
enrichment_timestamp: '2025-11-30T19:09:04.722616+00:00'
source: https://www.dezijpe.nl/cgi-bin/boerderij.pl?misc=90
match_score: 0.719
ghcid:
ghcid_current: NL-NH-SPA-S-HWS
ghcid_original: NL-NH-SPA-S-HWS
ghcid_uuid: 58cf3a83-3691-5bc3-a4a9-27d7f51f1b88
ghcid_uuid_sha256: 1cf62ae1-e22d-8fd4-bb2a-34492335f62a
ghcid_numeric: 2086902626983419860
record_id: 019adf94-7af8-7db5-9b38-755bbd9df5aa
generation_timestamp: '2025-12-02T14:56:45.615377+00:00'
ghcid_history:
- ghcid: NL-NH-SPA-S-HWS
ghcid_numeric: 2086902626983419860
valid_from: '2025-12-02T14:56:45.615377+00:00'
valid_to: null
reason: GHCID regenerated with Google Maps locality fix (Dec 2025)
location_resolution:
method: GOOGLE_MAPS_LOCALITY
google_maps_locality: Spaarndam
geonames_id: 2746986
geonames_name: Spaarndam
feature_code: PPL
population: 0
admin1_code: '07'
region_code: NH
country_code: NL
source_coordinates:
latitude: 52.41322100000001
longitude: 4.6939003999999995
source: google_maps
geonames_id: 2746986
identifiers:
- identifier_scheme: GHCID
identifier_value: NL-NH-SPA-S-HWS
- identifier_scheme: GHCID_UUID
identifier_value: 58cf3a83-3691-5bc3-a4a9-27d7f51f1b88
identifier_url: urn:uuid:58cf3a83-3691-5bc3-a4a9-27d7f51f1b88
- identifier_scheme: GHCID_UUID_SHA256
identifier_value: 1cf62ae1-e22d-8fd4-bb2a-34492335f62a
identifier_url: urn:uuid:1cf62ae1-e22d-8fd4-bb2a-34492335f62a
- identifier_scheme: GHCID_NUMERIC
identifier_value: '2086902626983419860'
- identifier_scheme: RECORD_ID
identifier_value: 019adf94-7af8-7db5-9b38-755bbd9df5aa
identifier_url: urn:uuid:019adf94-7af8-7db5-9b38-755bbd9df5aa
custodian_name:
claim_type: custodian_name
claim_value: Historische Werkgroep Spaarndam
source: google_maps
confidence: 0.508
consensus_method: true
sources_checked: 20
sources_matched: 7
extraction_timestamp: '2025-12-02T13:08:05.970528+00:00'
matching_sources:
- source: original_entry
name: Historische Werkgroep Spaarndam
score: 1.0
- source: web_h1_tag
name: STEUN de Historische werkgroep DOOR BOODSCHAPPEN TE DOEN BIJ VOMAR
score: 0.81
- source: web_title_tag
name: Wachtwoord kwijt Historische Werkgroep Spaarndam
score: 1.0
- source: web_title_tag
name: Login Historische Werkgroep Spaarndam
score: 1.0
- source: web_title_tag
name: Historische Werkgroep Spaarndam
score: 1.0
- source: web_title_tag
name: Historie Spaarndam
score: 0.74
genealogiewerkbalk_enrichment:
source: Genealogiewerkbalk.nl Municipality Archives Registry
source_url: https://www.genealogiewerkbalk.nl/archieven.html
data_url: https://docs.google.com/spreadsheets/d/1rS_Z5L6L2vvfGLS6eHI8wfyiwB-KUfHEr7W1VNY3rpg/export?format=csv
data_tier: TIER_2_VERIFIED
enrichment_timestamp: '2025-12-03T13:50:49.459008+00:00'
match_method: google_maps_admin2
match_confidence: 0.95
municipality:
name: Haarlemmermeer
code: '394'
municipal_archive:
name: Noord-Hollands Archief
website: https://noord-hollandsarchief.nl/
isil: NL-HlmNHA
province:
name: Noord-Holland
code: '27'
provincial_archive:
name: Noord-Hollands Archief
website: https://noord-hollandsarchief.nl/
digital_platforms:
- platform_name: Historische Werkgroep Spaarndam Website
platform_url: http://historischewerkgroepspaarndam.nl/
platform_type: WEBSITE
platform_category:
- Organizational website
digital_collections: Organizational website
technology_stack: ZCBS
data_standards:
- HTML5
user_services: General information, Contact
sustainability_model: Institutional funding
enrichment_timestamp: '2025-12-05T11:19:32.223731+00:00'
source_method: automated_extraction
wikidata_enrichment:
status: NOT_FOUND
fetch_timestamp: '2025-12-06T19:39:14.488898+00:00'
search_query: Historische Werkgroep Spaarndam
location:
latitude: 52.41322100000001
longitude: 4.6939003999999995
coordinate_provenance:
source_type: GOOGLE_MAPS
source_path: google_maps_enrichment.coordinates
original_timestamp: '2025-11-28T09:55:39.784931+00:00'
entity_id: ChIJSSAiq2vlxUcRuAshVtl5z3g
api_endpoint: https://maps.googleapis.com/maps/api/place/textsearch
city: Spaarndam
region: Noord-Holland
region_code: NH
country: NL
postal_code: 2064 WK
street_address: Van der Burchstraat 20, Spaarndam
formatted_address: Van der Burchstraat 20, 2064 WK Spaarndam
geonames_id: 2746986
geonames_name: Spaarndam
feature_code: PPL
normalization_timestamp: '2025-12-09T07:07:17.040442+00:00'
crawl4ai_enrichment:
retrieval_timestamp: '2025-12-14T18:08:44.741202+00:00'
retrieval_agent: crawl4ai
source_url: http://historischewerkgroepspaarndam.nl/
status_code: null
error: Crawl failed with status None
digital_platform_v2:
transformation_metadata:
transformed_from: httpx_beautifulsoup
transformation_date: '2025-12-14T23:13:26.097739+00:00'
transformation_version: '2.1'
source_status_code: 200
primary_platform:
platform_id: primary_website_historischewerkgroepspaarndam_nl
platform_name: Historische Werkgroep Spaarndam Planet Earth Generic Website
Template
platform_url: https://historischewerkgroepspaarndam.nl/
platform_type: DISCOVERY_PORTAL
description: ''
language: nl
og_image: null
favicon: https://historischewerkgroepspaarndam.nl/wp-content/uploads/2023/04/logo-150x150-1.gif
collection_urls:
- https://historischewerkgroepspaarndam.nl/index.php/beeldbank/
- https://historischewerkgroepspaarndam.nl/index.php/beeldbank-2/
- https://collectie.historischewerkgroepspaarndam.nl/cgi-bin/ansichten.pl
- https://collectie.historischewerkgroepspaarndam.nl/cgi-bin/bidprent.pl
navigation_links:
- https://historischewerkgroepspaarndam.nl/
- https://historischewerkgroepspaarndam.nl/index.php/beeldbank/
- https://historischewerkgroepspaarndam.nl/index.php/bevolkingsregister/
- https://historischewerkgroepspaarndam.nl/?page_id=15
- https://historischewerkgroepspaarndam.nl/index.php/historie-spaarndam/
- https://historischewerkgroepspaarndam.nl/index.php/bibliotheek/
- https://historischewerkgroepspaarndam.nl/index.php/uitgaven-prijslijst-van-andere-organisaties/
- https://historischewerkgroepspaarndam.nl/index.php/uitgave-van-hws/
- https://historischewerkgroepspaarndam.nl/index.php/contact-2/
- https://historischewerkgroepspaarndam.nl/index.php/over-ons/
- https://historischewerkgroepspaarndam.nl/index.php/contact/
- https://historischewerkgroepspaarndam.nl/index.php/privacy-policy/
- https://historischewerkgroepspaarndam.nl/index.php/publicaties-2/
- https://historischewerkgroepspaarndam.nl/index.php/beeldbank-2/
- https://historischewerkgroepspaarndam.nl/index.php/rijnlandshuis/
- https://historischewerkgroepspaarndam.nl/index.php/open-monumenten-dagen/
- https://historischewerkgroepspaarndam.nl/index.php/contact-2-2/
- https://historischewerkgroepspaarndam.nl/wp-admin/post.php?post=3372&action=elementor
- https://collectie.historischewerkgroepspaarndam.nl/cgi-bin/ansichten.pl
- https://collectie.historischewerkgroepspaarndam.nl/cgi-bin/bidprent.pl
timespan:
begin_of_the_begin: '2011-11-15T00:00:00Z'
end_of_the_begin: '2011-11-15T00:00:00Z'
begin_of_the_end: null
end_of_the_end: null
sources:
- 'Linkup web search: https://dcspaarndam.nl/activiiteiten/geschiedenis-hws/'
notes: 'Found via pattern: full_date_nl'
events:
- date: '1986'
type: founding
description: opgericht in 1986, na de viering van het 700-jarig bestaan van Spaarndam
in 1985
timeline_enrichment:
timeline_events:
- event_type: FOUNDING
event_date: '1986'
date_precision: year
approximate: false
description: opgericht in 1986, na de viering van het 700-jarig bestaan van Spaarndam
in 1985
source_urls:
- https://dcspaarndam.nl/activiiteiten/geschiedenis-hws/
- https://historischewerkgroepspaarndam.nl/index.php/uitgave-van-hws/
- https://historischewerkgroepspaarndam.nl/historie/1950-de-strijd-tegen-het-water/
- https://historischewerkgroepspaarndam.nl/historie/1851-de-post-wordt-bezorgd/
- https://historischewerkgroepspaarndam.nl/publicaties/prijslijst-uitgaven-van-anderen/
linkup_query: '"Historische Werkgroep Spaarndam" Spaarndam opgericht OR gesticht
OR sinds'
linkup_answer: De Historische Werkgroep Spaarndam is opgericht in 1986, na de
viering van het 700-jarig bestaan van Spaarndam in 1985.
fetch_timestamp: '2025-12-15T20:05:00.526820+00:00'
archive_path: web/0693/linkup/linkup_founding_20251215T200500Z.json
extraction_method: linkup_answer_regex
extraction_timestamp: '2025-12-16T20:17:53.366534+00:00'
data_tier: TIER_4_INFERRED
web_enrichments:
extraction_timestamp: '2025-12-13T19:46:01.653167+00:00'
extraction_method: hybrid_llm_pattern_layout_v1
confidence_threshold: 0.6
entities_count: 5
cleanup_applied: '2025-12-13T19:49:32.242945+00:00'
claims:
- entity: Historische Werkgroep Spaarndam
entity_type: GRP.ASS
xpath: /html/head/title
base_confidence: 0.95
layout_score: 0.15
pattern_score: 0.15
final_confidence: 1.0
layout_match: high_conf:head/title
- entity: Spaarndam
entity_type: TOP.SET
xpath: /html/head/title
base_confidence: 0.9
layout_score: 0.0
pattern_score: 0.15
final_confidence: 1.0
- entity: https://historischewerkgroepspaarndam.nl/index.php/feed/
entity_type: APP.URL
xpath: /html/head/link[3]
base_confidence: 1.0
layout_score: 0.0
pattern_score: 0.0
final_confidence: 1.0
- entity: https://historischewerkgroepspaarndam.nl/index.php/comments/feed/
entity_type: APP.URL
xpath: /html/head/link[4]
base_confidence: 1.0
layout_score: 0.0
pattern_score: 0.0
final_confidence: 1.0
- entity: https://historischewerkgroepspaarndam.nl/wp-content/themes/astra/assets/css/minified/main.min.css?ver=4.8.8
entity_type: APP.URL
xpath: /html/head/link[5]
base_confidence: 1.0
layout_score: 0.0
pattern_score: 0.0
final_confidence: 1.0
logo_enrichment:
enrichment_timestamp: '2025-12-22T09:59:55.327221+00:00'
source_url: http://historischewerkgroepspaarndam.nl
extraction_method: crawl4ai
claims:
- claim_type: favicon_url
claim_value: https://historischewerkgroepspaarndam.nl/wp-content/uploads/2023/04/logo-150x150-1.gif
source_url: http://historischewerkgroepspaarndam.nl
css_selector: '[document] > html > head > link:nth-of-type(29)'
retrieved_on: '2025-12-22T09:59:55.327221+00:00'
extraction_method: crawl4ai_link_rel
favicon_type: ''
favicon_sizes: 32x32
summary:
total_claims: 1
has_primary_logo: false
has_favicon: true
has_og_image: false
favicon_count: 1