422 lines
15 KiB
YAML
422 lines
15 KiB
YAML
original_entry:
|
||
plaatsnaam_bezoekadres: Sijbekarspel
|
||
organisatie: Historische Vereniging van Sijbekarspel/Benningbroek 'Lijnen Door De
|
||
Tijd'
|
||
systeem: ZCBS
|
||
reference:
|
||
- label: https://www.lijnendoordetijd.nl/
|
||
type:
|
||
- S
|
||
entry_index: 691
|
||
processing_timestamp: '2025-11-27T16:34:40.635990+00:00'
|
||
enrichment_status: skipped
|
||
provenance:
|
||
schema_version: 1.0.0
|
||
generated_at: '2025-11-28T23:47:22.624709+00:00'
|
||
sources:
|
||
original_entry:
|
||
- source_type: nde_csv_registry
|
||
data_tier: TIER_1_AUTHORITATIVE
|
||
claims_extracted:
|
||
- plaatsnaam_bezoekadres
|
||
- organisatie
|
||
- systeem
|
||
- reference
|
||
- type
|
||
google_maps:
|
||
- source_type: google_maps_api
|
||
fetch_timestamp: '2025-11-28T09:55:38.711020+00:00'
|
||
api_endpoint: https://maps.googleapis.com/maps/api/place/textsearch
|
||
place_id: ChIJ6f47WsStyEcRar6N9sz81jA
|
||
claims_extracted:
|
||
- coordinates
|
||
- formatted_address
|
||
- address_components
|
||
- business_status
|
||
- website
|
||
- phone
|
||
genealogiewerkbalk:
|
||
- source_type: genealogiewerkbalk_registry
|
||
fetch_timestamp: '2025-12-03T13:50:49.180955+00:00'
|
||
data_url: https://docs.google.com/spreadsheets/d/1rS_Z5L6L2vvfGLS6eHI8wfyiwB-KUfHEr7W1VNY3rpg/export?format=csv
|
||
match_method: google_maps_admin2
|
||
claims_extracted:
|
||
- municipality_name
|
||
- municipality_code
|
||
- municipal_archive_name
|
||
- municipal_archive_website
|
||
- municipal_archive_isil
|
||
- province_name
|
||
- province_code
|
||
- provincial_archive_name
|
||
- provincial_archive_website
|
||
linkup_timespan:
|
||
- source_type: linkup_web_search
|
||
fetch_timestamp: '2025-12-15T20:04:38.327426+00:00'
|
||
search_query: '"Historische Vereniging Sijbekarspel & Benningbroek" Sijbekarspel
|
||
opgericht OR gesticht OR sinds'
|
||
source_urls:
|
||
- https://adoc.pub/kroniek-2007-historische-vereniging-sijbekarspel-benningbroe.html
|
||
- https://moestuin-in-sij-be.nl/
|
||
- https://www.medemblik.nl/projecten/projecten-in-uw-straat-of-wijk/sijbekarspel-benningbroek-herinrichting
|
||
- https://jokessterrenkruid.blogspot.com/2025/03/sijbekarspel-de-kerk-maria-en-een-oud.html?m=1
|
||
- https://geheugenvandrenthe.nl/encyclopedie-drenthe/historische-verenigingen
|
||
claims_extracted:
|
||
- timespan_begin
|
||
data_tier: TIER_4_INFERRED
|
||
archive_path: data/custodian/web/0691/linkup/linkup_founding_20251215T200438Z.json
|
||
data_tier_summary:
|
||
TIER_1_AUTHORITATIVE:
|
||
- original_entry (NDE CSV)
|
||
TIER_2_VERIFIED:
|
||
- wikidata_api
|
||
- google_maps_api
|
||
- genealogiewerkbalk_registry
|
||
TIER_3_CROWD_SOURCED: []
|
||
TIER_4_INFERRED:
|
||
- website_scrape
|
||
- exa_web_search
|
||
notes:
|
||
- Provenance tracking added retroactively
|
||
- claim_level_provenance available in sources section
|
||
- Canonical location added via normalize_custodian_files.py on 2025-12-08T23:18:35Z
|
||
- Canonical location added via normalize_custodian_files.py on 2025-12-09T07:07:16Z
|
||
skip_reason: no_wikidata_id
|
||
google_maps_enrichment:
|
||
place_id: ChIJ6f47WsStyEcRar6N9sz81jA
|
||
name: Lijnen door de Tijd
|
||
fetch_timestamp: '2025-11-28T09:55:38.711020+00:00'
|
||
api_status: OK
|
||
coordinates:
|
||
latitude: 52.7071353
|
||
longitude: 4.9988946
|
||
formatted_address: Westerstraat 92, 1655 LE Sijbekarspel
|
||
short_address: Westerstraat 92, Sijbekarspel
|
||
address_components:
|
||
- long_name: '92'
|
||
short_name: '92'
|
||
types:
|
||
- street_number
|
||
- long_name: Westerstraat
|
||
short_name: Westerstraat
|
||
types:
|
||
- route
|
||
- long_name: Sijbekarspel
|
||
short_name: Sijbekarspel
|
||
types:
|
||
- locality
|
||
- political
|
||
- long_name: Medemblik
|
||
short_name: Medemblik
|
||
types:
|
||
- administrative_area_level_2
|
||
- political
|
||
- long_name: Noord-Holland
|
||
short_name: NH
|
||
types:
|
||
- administrative_area_level_1
|
||
- political
|
||
- long_name: Nederland
|
||
short_name: NL
|
||
types:
|
||
- country
|
||
- political
|
||
- long_name: 1655 LE
|
||
short_name: 1655 LE
|
||
types:
|
||
- postal_code
|
||
phone_local: 0229 591 829
|
||
phone_international: +31 229 591 829
|
||
website: http://lijnendoordetijd.nl/activiteiten
|
||
google_place_types:
|
||
- point_of_interest
|
||
- establishment
|
||
business_status: OPERATIONAL
|
||
google_maps_url: https://maps.google.com/?cid=3519278116076633706&g_mp=Cidnb29nbGUubWFwcy5wbGFjZXMudjEuUGxhY2VzLlNlYXJjaFRleHQQAhgEIAA
|
||
street_view_url: https://maps.googleapis.com/maps/api/streetview?size=600x400&location=52.7071353,4.9988946&key=AIzaSyAHuazNth9ZvfRFYk5-v49CwXwhABH8Ri0
|
||
icon_mask_uri: https://maps.gstatic.com/mapfiles/place_api/icons/v2/generic_pinlet
|
||
icon_background_color: '#7B9EB0'
|
||
utc_offset_minutes: 60
|
||
google_maps_status: SUCCESS
|
||
google_maps_search_query: Historische Vereniging van Sijbekarspel/Benningbroek 'Lijnen
|
||
Door De Tijd', Sijbekarspel, Netherlands
|
||
web_enrichment:
|
||
web_archives:
|
||
- url: https://www.lijnendoordetijd.nl/
|
||
directory: web/0691/lijnendoordetijd.nl
|
||
pages_archived: 200
|
||
archive_method: wget_warc_deep
|
||
warc_file: archive.warc.gz
|
||
warc_size_bytes: 2001610
|
||
warc_format: ISO 28500
|
||
full_site_archive_timestamp: '2025-11-29T17:03:52.470790+00:00'
|
||
zcbs_enrichment:
|
||
zcbs_id: 68
|
||
zcbs_name: Historische Vereniging Sijbekarspel-Benningbroek
|
||
platform_urls:
|
||
photos: http://www.beeldbanksijbekarspelbenningbroek.nl/cgi-bin/beeldbank.pl
|
||
enrichment_timestamp: '2025-11-30T19:09:04.402756+00:00'
|
||
source: https://www.dezijpe.nl/cgi-bin/boerderij.pl?misc=90
|
||
match_score: 0.876
|
||
ghcid:
|
||
ghcid_current: NL-NH-SIJ-S-HVSB
|
||
ghcid_original: NL-NH-SIJ-S-LT
|
||
ghcid_uuid: null
|
||
ghcid_uuid_sha256: null
|
||
ghcid_numeric: null
|
||
record_id: 019adf94-7abc-73f0-bacc-9484a19632d8
|
||
generation_timestamp: '2025-12-02T17:30:00.000000+00:00'
|
||
ghcid_history:
|
||
- ghcid: NL-NH-SIJ-S-HVSB
|
||
ghcid_numeric: null
|
||
valid_from: '2025-12-02T17:30:00.000000+00:00'
|
||
valid_to: null
|
||
reason: GHCID corrected after identifying that "Lijnen door de Tijd" is the website/platform
|
||
name, not the organization name. Using abbreviation from "Historische Vereniging
|
||
Sijbekarspel & Benningbroek" (HVSB).
|
||
- ghcid: NL-NH-SIJ-S-LT
|
||
ghcid_numeric: 3429604925991527790
|
||
valid_from: '2025-12-02T14:56:45.615377+00:00'
|
||
valid_to: '2025-12-02T17:30:00.000000+00:00'
|
||
reason: Incorrect abbreviation from website/platform name instead of organization
|
||
name
|
||
location_resolution:
|
||
method: GOOGLE_MAPS_LOCALITY
|
||
google_maps_locality: Sijbekarspel
|
||
geonames_id: 2747332
|
||
geonames_name: Sijbekarspel
|
||
feature_code: PPL
|
||
population: 345
|
||
admin1_code: '07'
|
||
region_code: NH
|
||
country_code: NL
|
||
source_coordinates:
|
||
latitude: 52.7071353
|
||
longitude: 4.9988946
|
||
source: google_maps
|
||
geonames_id: 2747332
|
||
identifiers:
|
||
- identifier_scheme: GHCID
|
||
identifier_value: NL-NH-SIJ-S-HVSB
|
||
note: Corrected from LT to HVSB after distinguishing platform name from organization
|
||
- identifier_scheme: GHCID_UUID
|
||
identifier_value: null
|
||
identifier_url: null
|
||
- identifier_scheme: GHCID_UUID_SHA256
|
||
identifier_value: null
|
||
identifier_url: null
|
||
- identifier_scheme: GHCID_NUMERIC
|
||
identifier_value: null
|
||
- identifier_scheme: RECORD_ID
|
||
identifier_value: 019adf94-7abc-73f0-bacc-9484a19632d8
|
||
identifier_url: urn:uuid:019adf94-7abc-73f0-bacc-9484a19632d8
|
||
custodian_name:
|
||
claim_type: custodian_name
|
||
claim_value: Historische Vereniging Sijbekarspel & Benningbroek
|
||
source: manual_correction
|
||
confidence: 0.95
|
||
consensus_method: false
|
||
sources_checked: 127
|
||
sources_matched: 4
|
||
extraction_timestamp: '2025-12-02T17:30:00.000000+00:00'
|
||
previous_value: Lijnen door de Tijd
|
||
previous_source: google_maps
|
||
correction_note: '"Lijnen door de Tijd" is the name of the organization''s WEBSITE,
|
||
not the organization itself. The actual heritage custodian is "Historische Vereniging Sijbekarspel
|
||
& Benningbroek" which operates the "Lijnen door de Tijd" website as their digital
|
||
platform for historical research about these two villages.'
|
||
digital_platform:
|
||
platform_name: Lijnen door de Tijd
|
||
platform_url: https://www.lijnendoordetijd.nl/
|
||
platform_type: WEBSITE
|
||
description: Historical research portal operated by Historische Vereniging Sijbekarspel
|
||
& Benningbroek, containing genealogical data, historical photos, and local history
|
||
of the Sijbekarspel and Benningbroek villages.
|
||
note: Previously incorrectly used as custodian_name
|
||
genealogiewerkbalk_enrichment:
|
||
source: Genealogiewerkbalk.nl Municipality Archives Registry
|
||
source_url: https://www.genealogiewerkbalk.nl/archieven.html
|
||
data_url: https://docs.google.com/spreadsheets/d/1rS_Z5L6L2vvfGLS6eHI8wfyiwB-KUfHEr7W1VNY3rpg/export?format=csv
|
||
data_tier: TIER_2_VERIFIED
|
||
enrichment_timestamp: '2025-12-03T13:50:49.180936+00:00'
|
||
match_method: google_maps_admin2
|
||
match_confidence: 0.95
|
||
municipality:
|
||
name: Medemblik
|
||
code: '420'
|
||
municipal_archive:
|
||
name: Westfries Archief
|
||
website: https://www.westfriesarchief.nl/
|
||
isil: NL-HnWFA
|
||
province:
|
||
name: Noord-Holland
|
||
code: '27'
|
||
provincial_archive:
|
||
name: Noord-Hollands Archief
|
||
website: https://noord-hollandsarchief.nl/
|
||
digital_platforms:
|
||
- platform_name: Historische Vereniging van Sijbekarspel/Benningbroek 'Lijnen Door
|
||
De Tijd' Website
|
||
platform_url: http://lijnendoordetijd.nl/activiteiten
|
||
platform_type: WEBSITE
|
||
platform_category:
|
||
- Organizational website
|
||
digital_collections: Organizational website
|
||
technology_stack: ZCBS
|
||
data_standards:
|
||
- HTML5
|
||
user_services: General information, Contact
|
||
sustainability_model: Institutional funding
|
||
enrichment_timestamp: '2025-12-05T11:19:31.472989+00:00'
|
||
source_method: automated_extraction
|
||
wikidata_enrichment:
|
||
status: NOT_FOUND
|
||
fetch_timestamp: '2025-12-06T19:39:12.481809+00:00'
|
||
search_query: Historische Vereniging Sijbekarspel & Benningbroek
|
||
location:
|
||
latitude: 52.7071353
|
||
longitude: 4.9988946
|
||
coordinate_provenance:
|
||
source_type: GOOGLE_MAPS
|
||
source_path: google_maps_enrichment.coordinates
|
||
original_timestamp: '2025-11-28T09:55:38.711020+00:00'
|
||
entity_id: ChIJ6f47WsStyEcRar6N9sz81jA
|
||
api_endpoint: https://maps.googleapis.com/maps/api/place/textsearch
|
||
city: Sijbekarspel
|
||
region: Noord-Holland
|
||
region_code: NH
|
||
country: NL
|
||
postal_code: 1655 LE
|
||
street_address: Westerstraat 92, Sijbekarspel
|
||
formatted_address: Westerstraat 92, 1655 LE Sijbekarspel
|
||
geonames_id: 2747332
|
||
geonames_name: Sijbekarspel
|
||
feature_code: PPL
|
||
normalization_timestamp: '2025-12-09T07:07:16.679587+00:00'
|
||
web_contact_data:
|
||
extraction_date: '2025-12-12T22:53:57.170829+00:00'
|
||
extraction_method: contact_page_pattern_matching
|
||
source_files:
|
||
- web/0691/lijnendoordetijd.nl/pages/contact_index.html
|
||
persons: []
|
||
cleanup_date: '2025-12-13T10:46:08.573266+00:00'
|
||
cleanup_v2_removed: 1
|
||
crawl4ai_enrichment:
|
||
retrieval_timestamp: '2025-12-14T18:08:40.448953+00:00'
|
||
retrieval_agent: crawl4ai
|
||
source_url: http://lijnendoordetijd.nl/activiteiten
|
||
status_code: null
|
||
error: Crawl failed with status None
|
||
digital_platform_v2:
|
||
transformation_metadata:
|
||
transformed_from: httpx_beautifulsoup
|
||
transformation_date: '2025-12-14T23:13:18.669147+00:00'
|
||
transformation_version: '2.1'
|
||
source_status_code: 200
|
||
primary_platform:
|
||
platform_id: primary_website_lijnendoordetijd_nl
|
||
platform_name: Activiteiten – Lijnen door de Tijd Website
|
||
platform_url: https://www.lijnendoordetijd.nl/activiteiten/
|
||
platform_type: INSTITUTIONAL_WEBSITE
|
||
description: ''
|
||
language: nl
|
||
og_image: null
|
||
favicon: https://www.lijnendoordetijd.nl/wp-content/uploads/2016/10/cropped-logo-32x32.jpg
|
||
navigation_links:
|
||
- https://www.lijnendoordetijd.nl/
|
||
- https://www.lijnendoordetijd.nl
|
||
- https://www.lijnendoordetijd.nl/nieuws/
|
||
- https://www.lijnendoordetijd.nl/vereniging/
|
||
- https://www.lijnendoordetijd.nl/vereniging/commissies/
|
||
- https://www.lijnendoordetijd.nl/vereniging/bestuur/
|
||
- https://www.lijnendoordetijd.nl/jaarverslagen/
|
||
- https://www.lijnendoordetijd.nl/wp-content/uploads/2019/05/Privacyreglement-LddT.pdf
|
||
- https://www.lijnendoordetijd.nl/wp-login.php
|
||
- https://www.lijnendoordetijd.nl/geschiedenis/
|
||
- https://www.lijnendoordetijd.nl/activiteiten/
|
||
- https://www.lijnendoordetijd.nl/downloads/
|
||
- https://www.lijnendoordetijd.nl/kronieken/
|
||
- https://www.lijnendoordetijd.nl/dorpsfilm/
|
||
- https://www.lijnendoordetijd.nl/dorpsdruppie/
|
||
- https://www.lijnendoordetijd.nl/links/
|
||
- https://www.lijnendoordetijd.nl/contact/
|
||
- https://www.lijnendoordetijd.nl/activiteiten/page/2/
|
||
- https://www.lijnendoordetijd.nl/author/tjomme/
|
||
timespan:
|
||
begin_of_the_begin: '1930-02-06T00:00:00Z'
|
||
end_of_the_begin: '1930-02-06T00:00:00Z'
|
||
begin_of_the_end: null
|
||
end_of_the_end: null
|
||
sources:
|
||
- 'Linkup web search: https://docplayer.nl/2622232-Historische-vereniging-sijbekarspel-benningbroek-kroniek-2010-kroniek-2010-lijnen-door-de-tijd-historische-vereniging-sijbekarspel-benningbroek.html'
|
||
notes: 'Found via pattern: full_date_nl'
|
||
web_enrichments:
|
||
extraction_timestamp: '2025-12-13T19:46:01.479928+00:00'
|
||
extraction_method: hybrid_llm_pattern_layout_v1
|
||
confidence_threshold: 0.6
|
||
entities_count: 6
|
||
claims:
|
||
- entity: Historische Vereniging Sijbekarspel & Benningbroek 'Lijnen Door De Tijd'
|
||
entity_type: GRP.ASS
|
||
xpath: /html/head/title
|
||
base_confidence: 0.95
|
||
layout_score: 0.15
|
||
pattern_score: 0.15
|
||
final_confidence: 1.0
|
||
layout_match: high_conf:head/title
|
||
pattern_match: \b(vereniging|stichting|genootschap|kring)\b
|
||
- entity: Historische Vereniging van Sijbekarspel/Benningbroek 'Lijnen Door De Tijd'
|
||
entity_type: GRP.ASS
|
||
xpath: /html/body/div[2]/div[2]/main/article/div[2]/p/center[1]
|
||
base_confidence: 0.95
|
||
layout_score: 0.0
|
||
pattern_score: 0.15
|
||
final_confidence: 1.0
|
||
pattern_match: \b(vereniging|stichting|genootschap|kring)\b
|
||
- entity: https://www.lijnendoordetijd.nl/feed/
|
||
entity_type: APP.URL
|
||
xpath: /html/head/link[4]
|
||
base_confidence: 1.0
|
||
layout_score: 0.0
|
||
pattern_score: 0.0
|
||
final_confidence: 1.0
|
||
- entity: https://www.lijnendoordetijd.nl/
|
||
entity_type: APP.URL
|
||
xpath: /html/head/link[28]
|
||
base_confidence: 1.0
|
||
layout_score: 0.0
|
||
pattern_score: 0.0
|
||
final_confidence: 1.0
|
||
- entity: Lijnen door de Tijd
|
||
entity_type: APP.EXH
|
||
xpath: /html/head/title
|
||
base_confidence: 0.95
|
||
layout_score: 0.0
|
||
pattern_score: 0.0
|
||
final_confidence: 0.95
|
||
- entity: logo.jpg
|
||
entity_type: THG.OBJ
|
||
xpath: /html/body/div[2]/div[2]/main/article/div[2]/p/center[4]/img
|
||
base_confidence: 0.9
|
||
layout_score: 0.0
|
||
pattern_score: 0.0
|
||
final_confidence: 0.9
|
||
logo_enrichment:
|
||
enrichment_timestamp: '2025-12-22T09:59:32.461104+00:00'
|
||
source_url: http://lijnendoordetijd.nl/activiteiten
|
||
extraction_method: crawl4ai
|
||
claims:
|
||
- claim_type: favicon_url
|
||
claim_value: https://www.lijnendoordetijd.nl/wp-content/uploads/2016/10/cropped-logo-180x180.jpg
|
||
source_url: http://lijnendoordetijd.nl/activiteiten
|
||
css_selector: '[document] > html > body > link:nth-of-type(23)'
|
||
retrieved_on: '2025-12-22T09:59:32.461104+00:00'
|
||
extraction_method: crawl4ai_link_rel
|
||
favicon_type: ''
|
||
favicon_sizes: ''
|
||
summary:
|
||
total_claims: 1
|
||
has_primary_logo: false
|
||
has_favicon: true
|
||
has_og_image: false
|
||
favicon_count: 3
|