glam/data/custodian/NL-NH-SIJ-S-HVSB.yaml
2026-01-18 01:23:32 +01:00

422 lines
15 KiB
YAML
Raw Permalink Blame History

This file contains ambiguous Unicode characters

This file contains Unicode characters that might be confused with other characters. If you think that this is intentional, you can safely ignore this warning. Use the Escape button to reveal them.

original_entry:
plaatsnaam_bezoekadres: Sijbekarspel
organisatie: Historische Vereniging van Sijbekarspel/Benningbroek 'Lijnen Door De
Tijd'
systeem: ZCBS
reference:
- label: https://www.lijnendoordetijd.nl/
type:
- S
entry_index: 691
processing_timestamp: '2025-11-27T16:34:40.635990+00:00'
enrichment_status: skipped
provenance:
schema_version: 1.0.0
generated_at: '2025-11-28T23:47:22.624709+00:00'
sources:
original_entry:
- source_type: nde_csv_registry
data_tier: TIER_1_AUTHORITATIVE
claims_extracted:
- plaatsnaam_bezoekadres
- organisatie
- systeem
- reference
- type
google_maps:
- source_type: google_maps_api
fetch_timestamp: '2025-11-28T09:55:38.711020+00:00'
api_endpoint: https://maps.googleapis.com/maps/api/place/textsearch
place_id: ChIJ6f47WsStyEcRar6N9sz81jA
claims_extracted:
- coordinates
- formatted_address
- address_components
- business_status
- website
- phone
genealogiewerkbalk:
- source_type: genealogiewerkbalk_registry
fetch_timestamp: '2025-12-03T13:50:49.180955+00:00'
data_url: https://docs.google.com/spreadsheets/d/1rS_Z5L6L2vvfGLS6eHI8wfyiwB-KUfHEr7W1VNY3rpg/export?format=csv
match_method: google_maps_admin2
claims_extracted:
- municipality_name
- municipality_code
- municipal_archive_name
- municipal_archive_website
- municipal_archive_isil
- province_name
- province_code
- provincial_archive_name
- provincial_archive_website
linkup_timespan:
- source_type: linkup_web_search
fetch_timestamp: '2025-12-15T20:04:38.327426+00:00'
search_query: '"Historische Vereniging Sijbekarspel & Benningbroek" Sijbekarspel
opgericht OR gesticht OR sinds'
source_urls:
- https://adoc.pub/kroniek-2007-historische-vereniging-sijbekarspel-benningbroe.html
- https://moestuin-in-sij-be.nl/
- https://www.medemblik.nl/projecten/projecten-in-uw-straat-of-wijk/sijbekarspel-benningbroek-herinrichting
- https://jokessterrenkruid.blogspot.com/2025/03/sijbekarspel-de-kerk-maria-en-een-oud.html?m=1
- https://geheugenvandrenthe.nl/encyclopedie-drenthe/historische-verenigingen
claims_extracted:
- timespan_begin
data_tier: TIER_4_INFERRED
archive_path: data/custodian/web/0691/linkup/linkup_founding_20251215T200438Z.json
data_tier_summary:
TIER_1_AUTHORITATIVE:
- original_entry (NDE CSV)
TIER_2_VERIFIED:
- wikidata_api
- google_maps_api
- genealogiewerkbalk_registry
TIER_3_CROWD_SOURCED: []
TIER_4_INFERRED:
- website_scrape
- exa_web_search
notes:
- Provenance tracking added retroactively
- claim_level_provenance available in sources section
- Canonical location added via normalize_custodian_files.py on 2025-12-08T23:18:35Z
- Canonical location added via normalize_custodian_files.py on 2025-12-09T07:07:16Z
skip_reason: no_wikidata_id
google_maps_enrichment:
place_id: ChIJ6f47WsStyEcRar6N9sz81jA
name: Lijnen door de Tijd
fetch_timestamp: '2025-11-28T09:55:38.711020+00:00'
api_status: OK
coordinates:
latitude: 52.7071353
longitude: 4.9988946
formatted_address: Westerstraat 92, 1655 LE Sijbekarspel
short_address: Westerstraat 92, Sijbekarspel
address_components:
- long_name: '92'
short_name: '92'
types:
- street_number
- long_name: Westerstraat
short_name: Westerstraat
types:
- route
- long_name: Sijbekarspel
short_name: Sijbekarspel
types:
- locality
- political
- long_name: Medemblik
short_name: Medemblik
types:
- administrative_area_level_2
- political
- long_name: Noord-Holland
short_name: NH
types:
- administrative_area_level_1
- political
- long_name: Nederland
short_name: NL
types:
- country
- political
- long_name: 1655 LE
short_name: 1655 LE
types:
- postal_code
phone_local: 0229 591 829
phone_international: +31 229 591 829
website: http://lijnendoordetijd.nl/activiteiten
google_place_types:
- point_of_interest
- establishment
business_status: OPERATIONAL
google_maps_url: https://maps.google.com/?cid=3519278116076633706&g_mp=Cidnb29nbGUubWFwcy5wbGFjZXMudjEuUGxhY2VzLlNlYXJjaFRleHQQAhgEIAA
street_view_url: https://maps.googleapis.com/maps/api/streetview?size=600x400&location=52.7071353,4.9988946&key=AIzaSyAHuazNth9ZvfRFYk5-v49CwXwhABH8Ri0
icon_mask_uri: https://maps.gstatic.com/mapfiles/place_api/icons/v2/generic_pinlet
icon_background_color: '#7B9EB0'
utc_offset_minutes: 60
google_maps_status: SUCCESS
google_maps_search_query: Historische Vereniging van Sijbekarspel/Benningbroek 'Lijnen
Door De Tijd', Sijbekarspel, Netherlands
web_enrichment:
web_archives:
- url: https://www.lijnendoordetijd.nl/
directory: web/0691/lijnendoordetijd.nl
pages_archived: 200
archive_method: wget_warc_deep
warc_file: archive.warc.gz
warc_size_bytes: 2001610
warc_format: ISO 28500
full_site_archive_timestamp: '2025-11-29T17:03:52.470790+00:00'
zcbs_enrichment:
zcbs_id: 68
zcbs_name: Historische Vereniging Sijbekarspel-Benningbroek
platform_urls:
photos: http://www.beeldbanksijbekarspelbenningbroek.nl/cgi-bin/beeldbank.pl
enrichment_timestamp: '2025-11-30T19:09:04.402756+00:00'
source: https://www.dezijpe.nl/cgi-bin/boerderij.pl?misc=90
match_score: 0.876
ghcid:
ghcid_current: NL-NH-SIJ-S-HVSB
ghcid_original: NL-NH-SIJ-S-LT
ghcid_uuid: null
ghcid_uuid_sha256: null
ghcid_numeric: null
record_id: 019adf94-7abc-73f0-bacc-9484a19632d8
generation_timestamp: '2025-12-02T17:30:00.000000+00:00'
ghcid_history:
- ghcid: NL-NH-SIJ-S-HVSB
ghcid_numeric: null
valid_from: '2025-12-02T17:30:00.000000+00:00'
valid_to: null
reason: GHCID corrected after identifying that "Lijnen door de Tijd" is the website/platform
name, not the organization name. Using abbreviation from "Historische Vereniging
Sijbekarspel & Benningbroek" (HVSB).
- ghcid: NL-NH-SIJ-S-LT
ghcid_numeric: 3429604925991527790
valid_from: '2025-12-02T14:56:45.615377+00:00'
valid_to: '2025-12-02T17:30:00.000000+00:00'
reason: Incorrect abbreviation from website/platform name instead of organization
name
location_resolution:
method: GOOGLE_MAPS_LOCALITY
google_maps_locality: Sijbekarspel
geonames_id: 2747332
geonames_name: Sijbekarspel
feature_code: PPL
population: 345
admin1_code: '07'
region_code: NH
country_code: NL
source_coordinates:
latitude: 52.7071353
longitude: 4.9988946
source: google_maps
geonames_id: 2747332
identifiers:
- identifier_scheme: GHCID
identifier_value: NL-NH-SIJ-S-HVSB
note: Corrected from LT to HVSB after distinguishing platform name from organization
- identifier_scheme: GHCID_UUID
identifier_value: null
identifier_url: null
- identifier_scheme: GHCID_UUID_SHA256
identifier_value: null
identifier_url: null
- identifier_scheme: GHCID_NUMERIC
identifier_value: null
- identifier_scheme: RECORD_ID
identifier_value: 019adf94-7abc-73f0-bacc-9484a19632d8
identifier_url: urn:uuid:019adf94-7abc-73f0-bacc-9484a19632d8
custodian_name:
claim_type: custodian_name
claim_value: Historische Vereniging Sijbekarspel & Benningbroek
source: manual_correction
confidence: 0.95
consensus_method: false
sources_checked: 127
sources_matched: 4
extraction_timestamp: '2025-12-02T17:30:00.000000+00:00'
previous_value: Lijnen door de Tijd
previous_source: google_maps
correction_note: '"Lijnen door de Tijd" is the name of the organization''s WEBSITE,
not the organization itself. The actual heritage custodian is "Historische Vereniging Sijbekarspel
& Benningbroek" which operates the "Lijnen door de Tijd" website as their digital
platform for historical research about these two villages.'
digital_platform:
platform_name: Lijnen door de Tijd
platform_url: https://www.lijnendoordetijd.nl/
platform_type: WEBSITE
description: Historical research portal operated by Historische Vereniging Sijbekarspel
& Benningbroek, containing genealogical data, historical photos, and local history
of the Sijbekarspel and Benningbroek villages.
note: Previously incorrectly used as custodian_name
genealogiewerkbalk_enrichment:
source: Genealogiewerkbalk.nl Municipality Archives Registry
source_url: https://www.genealogiewerkbalk.nl/archieven.html
data_url: https://docs.google.com/spreadsheets/d/1rS_Z5L6L2vvfGLS6eHI8wfyiwB-KUfHEr7W1VNY3rpg/export?format=csv
data_tier: TIER_2_VERIFIED
enrichment_timestamp: '2025-12-03T13:50:49.180936+00:00'
match_method: google_maps_admin2
match_confidence: 0.95
municipality:
name: Medemblik
code: '420'
municipal_archive:
name: Westfries Archief
website: https://www.westfriesarchief.nl/
isil: NL-HnWFA
province:
name: Noord-Holland
code: '27'
provincial_archive:
name: Noord-Hollands Archief
website: https://noord-hollandsarchief.nl/
digital_platforms:
- platform_name: Historische Vereniging van Sijbekarspel/Benningbroek 'Lijnen Door
De Tijd' Website
platform_url: http://lijnendoordetijd.nl/activiteiten
platform_type: WEBSITE
platform_category:
- Organizational website
digital_collections: Organizational website
technology_stack: ZCBS
data_standards:
- HTML5
user_services: General information, Contact
sustainability_model: Institutional funding
enrichment_timestamp: '2025-12-05T11:19:31.472989+00:00'
source_method: automated_extraction
wikidata_enrichment:
status: NOT_FOUND
fetch_timestamp: '2025-12-06T19:39:12.481809+00:00'
search_query: Historische Vereniging Sijbekarspel & Benningbroek
location:
latitude: 52.7071353
longitude: 4.9988946
coordinate_provenance:
source_type: GOOGLE_MAPS
source_path: google_maps_enrichment.coordinates
original_timestamp: '2025-11-28T09:55:38.711020+00:00'
entity_id: ChIJ6f47WsStyEcRar6N9sz81jA
api_endpoint: https://maps.googleapis.com/maps/api/place/textsearch
city: Sijbekarspel
region: Noord-Holland
region_code: NH
country: NL
postal_code: 1655 LE
street_address: Westerstraat 92, Sijbekarspel
formatted_address: Westerstraat 92, 1655 LE Sijbekarspel
geonames_id: 2747332
geonames_name: Sijbekarspel
feature_code: PPL
normalization_timestamp: '2025-12-09T07:07:16.679587+00:00'
web_contact_data:
extraction_date: '2025-12-12T22:53:57.170829+00:00'
extraction_method: contact_page_pattern_matching
source_files:
- web/0691/lijnendoordetijd.nl/pages/contact_index.html
persons: []
cleanup_date: '2025-12-13T10:46:08.573266+00:00'
cleanup_v2_removed: 1
crawl4ai_enrichment:
retrieval_timestamp: '2025-12-14T18:08:40.448953+00:00'
retrieval_agent: crawl4ai
source_url: http://lijnendoordetijd.nl/activiteiten
status_code: null
error: Crawl failed with status None
digital_platform_v2:
transformation_metadata:
transformed_from: httpx_beautifulsoup
transformation_date: '2025-12-14T23:13:18.669147+00:00'
transformation_version: '2.1'
source_status_code: 200
primary_platform:
platform_id: primary_website_lijnendoordetijd_nl
platform_name: Activiteiten Lijnen door de Tijd Website
platform_url: https://www.lijnendoordetijd.nl/activiteiten/
platform_type: INSTITUTIONAL_WEBSITE
description: ''
language: nl
og_image: null
favicon: https://www.lijnendoordetijd.nl/wp-content/uploads/2016/10/cropped-logo-32x32.jpg
navigation_links:
- https://www.lijnendoordetijd.nl/
- https://www.lijnendoordetijd.nl
- https://www.lijnendoordetijd.nl/nieuws/
- https://www.lijnendoordetijd.nl/vereniging/
- https://www.lijnendoordetijd.nl/vereniging/commissies/
- https://www.lijnendoordetijd.nl/vereniging/bestuur/
- https://www.lijnendoordetijd.nl/jaarverslagen/
- https://www.lijnendoordetijd.nl/wp-content/uploads/2019/05/Privacyreglement-LddT.pdf
- https://www.lijnendoordetijd.nl/wp-login.php
- https://www.lijnendoordetijd.nl/geschiedenis/
- https://www.lijnendoordetijd.nl/activiteiten/
- https://www.lijnendoordetijd.nl/downloads/
- https://www.lijnendoordetijd.nl/kronieken/
- https://www.lijnendoordetijd.nl/dorpsfilm/
- https://www.lijnendoordetijd.nl/dorpsdruppie/
- https://www.lijnendoordetijd.nl/links/
- https://www.lijnendoordetijd.nl/contact/
- https://www.lijnendoordetijd.nl/activiteiten/page/2/
- https://www.lijnendoordetijd.nl/author/tjomme/
timespan:
begin_of_the_begin: '1930-02-06T00:00:00Z'
end_of_the_begin: '1930-02-06T00:00:00Z'
begin_of_the_end: null
end_of_the_end: null
sources:
- 'Linkup web search: https://docplayer.nl/2622232-Historische-vereniging-sijbekarspel-benningbroek-kroniek-2010-kroniek-2010-lijnen-door-de-tijd-historische-vereniging-sijbekarspel-benningbroek.html'
notes: 'Found via pattern: full_date_nl'
web_enrichments:
extraction_timestamp: '2025-12-13T19:46:01.479928+00:00'
extraction_method: hybrid_llm_pattern_layout_v1
confidence_threshold: 0.6
entities_count: 6
claims:
- entity: Historische Vereniging Sijbekarspel & Benningbroek 'Lijnen Door De Tijd'
entity_type: GRP.ASS
xpath: /html/head/title
base_confidence: 0.95
layout_score: 0.15
pattern_score: 0.15
final_confidence: 1.0
layout_match: high_conf:head/title
pattern_match: \b(vereniging|stichting|genootschap|kring)\b
- entity: Historische Vereniging van Sijbekarspel/Benningbroek 'Lijnen Door De Tijd'
entity_type: GRP.ASS
xpath: /html/body/div[2]/div[2]/main/article/div[2]/p/center[1]
base_confidence: 0.95
layout_score: 0.0
pattern_score: 0.15
final_confidence: 1.0
pattern_match: \b(vereniging|stichting|genootschap|kring)\b
- entity: https://www.lijnendoordetijd.nl/feed/
entity_type: APP.URL
xpath: /html/head/link[4]
base_confidence: 1.0
layout_score: 0.0
pattern_score: 0.0
final_confidence: 1.0
- entity: https://www.lijnendoordetijd.nl/
entity_type: APP.URL
xpath: /html/head/link[28]
base_confidence: 1.0
layout_score: 0.0
pattern_score: 0.0
final_confidence: 1.0
- entity: Lijnen door de Tijd
entity_type: APP.EXH
xpath: /html/head/title
base_confidence: 0.95
layout_score: 0.0
pattern_score: 0.0
final_confidence: 0.95
- entity: logo.jpg
entity_type: THG.OBJ
xpath: /html/body/div[2]/div[2]/main/article/div[2]/p/center[4]/img
base_confidence: 0.9
layout_score: 0.0
pattern_score: 0.0
final_confidence: 0.9
logo_enrichment:
enrichment_timestamp: '2025-12-22T09:59:32.461104+00:00'
source_url: http://lijnendoordetijd.nl/activiteiten
extraction_method: crawl4ai
claims:
- claim_type: favicon_url
claim_value: https://www.lijnendoordetijd.nl/wp-content/uploads/2016/10/cropped-logo-180x180.jpg
source_url: http://lijnendoordetijd.nl/activiteiten
css_selector: '[document] > html > body > link:nth-of-type(23)'
retrieved_on: '2025-12-22T09:59:32.461104+00:00'
extraction_method: crawl4ai_link_rel
favicon_type: ''
favicon_sizes: ''
summary:
total_claims: 1
has_primary_logo: false
has_favicon: true
has_og_image: false
favicon_count: 3