424 lines
14 KiB
YAML
424 lines
14 KiB
YAML
original_entry:
|
|
plaatsnaam_bezoekadres: Noordwijk aan Zee
|
|
organisatie: Stichting Kurt Carlsen
|
|
systeem: Atlantis
|
|
versnellen: ja
|
|
reference:
|
|
- label: https://www.kurtcarlsen.nl/cms/
|
|
type:
|
|
- N
|
|
entry_index: 1160
|
|
processing_timestamp: '2025-11-27T16:48:03.232144+00:00'
|
|
enrichment_status: skipped
|
|
provenance:
|
|
schema_version: 1.0.0
|
|
generated_at: '2025-11-28T23:47:34.172445+00:00'
|
|
sources:
|
|
original_entry:
|
|
- source_type: nde_csv_registry
|
|
data_tier: TIER_1_AUTHORITATIVE
|
|
claims_extracted:
|
|
- plaatsnaam_bezoekadres
|
|
- organisatie
|
|
- systeem
|
|
- versnellen
|
|
- reference
|
|
- type
|
|
google_maps:
|
|
- source_type: google_maps_api
|
|
fetch_timestamp: '2025-11-28T10:00:26.615070+00:00'
|
|
api_endpoint: https://maps.googleapis.com/maps/api/place/textsearch
|
|
place_id: ChIJUzVDWYvAxUcRpTNAa6LsDyM
|
|
claims_extracted:
|
|
- coordinates
|
|
- formatted_address
|
|
- address_components
|
|
- business_status
|
|
- website
|
|
- phone
|
|
genealogiewerkbalk:
|
|
- source_type: genealogiewerkbalk_registry
|
|
fetch_timestamp: '2025-12-03T13:51:55.225603+00:00'
|
|
data_url: https://docs.google.com/spreadsheets/d/1rS_Z5L6L2vvfGLS6eHI8wfyiwB-KUfHEr7W1VNY3rpg/export?format=csv
|
|
match_method: google_maps_admin2
|
|
claims_extracted:
|
|
- municipality_name
|
|
- municipality_code
|
|
- municipal_archive_name
|
|
- municipal_archive_website
|
|
- municipal_archive_isil
|
|
- province_name
|
|
- province_code
|
|
- provincial_archive_name
|
|
- provincial_archive_website
|
|
data_tier_summary:
|
|
TIER_1_AUTHORITATIVE:
|
|
- original_entry (NDE CSV)
|
|
TIER_2_VERIFIED:
|
|
- wikidata_api
|
|
- google_maps_api
|
|
- genealogiewerkbalk_registry
|
|
TIER_3_CROWD_SOURCED: []
|
|
TIER_4_INFERRED:
|
|
- website_scrape
|
|
- exa_web_search
|
|
notes:
|
|
- Provenance tracking added retroactively
|
|
- claim_level_provenance available in sources section
|
|
- Canonical location normalized on 2025-12-09T13:15:36Z
|
|
skip_reason: no_wikidata_id
|
|
google_maps_enrichment:
|
|
place_id: ChIJUzVDWYvAxUcRpTNAa6LsDyM
|
|
name: Stichting Kurt Carlsen
|
|
fetch_timestamp: '2025-11-28T10:00:26.615070+00:00'
|
|
api_status: OK
|
|
coordinates:
|
|
latitude: 52.2301005
|
|
longitude: 4.4479627
|
|
formatted_address: Hofvennepark 5, 2201 PZ Noordwijk
|
|
short_address: Hofvennepark 5, Noordwijk
|
|
address_components:
|
|
- long_name: '5'
|
|
short_name: '5'
|
|
types:
|
|
- street_number
|
|
- long_name: Hofvennepark
|
|
short_name: Hofvennepark
|
|
types:
|
|
- route
|
|
- long_name: Noordwijk
|
|
short_name: Noordwijk
|
|
types:
|
|
- locality
|
|
- political
|
|
- long_name: Noordwijk
|
|
short_name: Noordwijk
|
|
types:
|
|
- administrative_area_level_2
|
|
- political
|
|
- long_name: Zuid-Holland
|
|
short_name: ZH
|
|
types:
|
|
- administrative_area_level_1
|
|
- political
|
|
- long_name: Nederland
|
|
short_name: NL
|
|
types:
|
|
- country
|
|
- political
|
|
- long_name: 2201 PZ
|
|
short_name: 2201 PZ
|
|
types:
|
|
- postal_code
|
|
phone_local: 015 662 4079
|
|
phone_international: +31 15 662 4079
|
|
website: https://www.kurtcarlsen.nl/
|
|
google_place_types:
|
|
- point_of_interest
|
|
- establishment
|
|
business_status: OPERATIONAL
|
|
google_maps_url: https://maps.google.com/?cid=2526498098306364325&g_mp=Cidnb29nbGUubWFwcy5wbGFjZXMudjEuUGxhY2VzLlNlYXJjaFRleHQQAhgEIAA
|
|
street_view_url: https://maps.googleapis.com/maps/api/streetview?size=600x400&location=52.2301005,4.4479627&key=AIzaSyAHuazNth9ZvfRFYk5-v49CwXwhABH8Ri0
|
|
icon_mask_uri: https://maps.gstatic.com/mapfiles/place_api/icons/v2/generic_pinlet
|
|
icon_background_color: '#7B9EB0'
|
|
utc_offset_minutes: 60
|
|
google_maps_status: SUCCESS
|
|
google_maps_search_query: Stichting Kurt Carlsen, Noordwijk aan Zee, Netherlands
|
|
web_enrichment:
|
|
web_archives:
|
|
- url: https://www.kurtcarlsen.nl/cms/
|
|
directory: web/1160/kurtcarlsen.nl
|
|
pages_archived: 28
|
|
archive_method: wget_warc_deep
|
|
warc_file: archive.warc.gz
|
|
warc_size_bytes: 1676326
|
|
warc_format: ISO 28500
|
|
full_site_archive_timestamp: '2025-11-29T18:25:00.975116+00:00'
|
|
ghcid:
|
|
ghcid_current: NL-ZH-NOO-N-KC
|
|
ghcid_original: NL-ZH-NOO-N-KC
|
|
ghcid_uuid: 400d70ba-f87a-55b4-be57-b782a8262061
|
|
ghcid_uuid_sha256: 8e46965d-3b28-8903-8c62-f080b35e2449
|
|
ghcid_numeric: 10252046928924162307
|
|
record_id: 019adf94-d2fc-7a97-ac27-5265d40b99a6
|
|
generation_timestamp: '2025-12-02T14:56:45.615377+00:00'
|
|
ghcid_history:
|
|
- ghcid: NL-ZH-NOO-N-KC
|
|
ghcid_numeric: 10252046928924162307
|
|
valid_from: '2025-12-02T14:56:45.615377+00:00'
|
|
valid_to: null
|
|
reason: GHCID regenerated with Google Maps locality fix (Dec 2025)
|
|
location_resolution:
|
|
method: GOOGLE_MAPS_LOCALITY
|
|
google_maps_locality: Noordwijk
|
|
geonames_id: 2749816
|
|
geonames_name: Noordwijk
|
|
feature_code: PPL
|
|
population: 235
|
|
admin1_code: '04'
|
|
region_code: ZH
|
|
country_code: NL
|
|
source_coordinates:
|
|
latitude: 52.2301005
|
|
longitude: 4.4479627
|
|
source: google_maps
|
|
geonames_id: 2749816
|
|
identifiers:
|
|
- identifier_scheme: GHCID
|
|
identifier_value: NL-ZH-NOO-N-KC
|
|
- identifier_scheme: GHCID_UUID
|
|
identifier_value: 400d70ba-f87a-55b4-be57-b782a8262061
|
|
identifier_url: urn:uuid:400d70ba-f87a-55b4-be57-b782a8262061
|
|
- identifier_scheme: GHCID_UUID_SHA256
|
|
identifier_value: 8e46965d-3b28-8903-8c62-f080b35e2449
|
|
identifier_url: urn:uuid:8e46965d-3b28-8903-8c62-f080b35e2449
|
|
- identifier_scheme: GHCID_NUMERIC
|
|
identifier_value: '10252046928924162307'
|
|
- identifier_scheme: RECORD_ID
|
|
identifier_value: 019adf94-d2fc-7a97-ac27-5265d40b99a6
|
|
identifier_url: urn:uuid:019adf94-d2fc-7a97-ac27-5265d40b99a6
|
|
custodian_name:
|
|
claim_type: custodian_name
|
|
claim_value: Kurt Carlsen
|
|
source: google_maps
|
|
confidence: 0.466
|
|
consensus_method: true
|
|
sources_checked: 29
|
|
sources_matched: 4
|
|
extraction_timestamp: '2025-12-02T13:08:59.565659+00:00'
|
|
matching_sources:
|
|
- source: original_entry
|
|
name: Kurt Carlsen
|
|
score: 1.0
|
|
- source: web_title_tag
|
|
name: Kurt Carlsen
|
|
score: 1.0
|
|
- source: web_title_tag
|
|
name: De historie van de Kurt Carlsen
|
|
score: 1.0
|
|
previous_value: Stichting Kurt Carlsen
|
|
previous_source: web_title_tag
|
|
custodian_legal_name:
|
|
claim_type: legal_name
|
|
claim_value: Stichting Kurt Carlsen
|
|
extraction_timestamp: '2025-12-02T13:08:59.565673+00:00'
|
|
note: Legal form detected in source name (e.g., Stichting, Vereniging, B.V.)
|
|
genealogiewerkbalk_enrichment:
|
|
source: Genealogiewerkbalk.nl Municipality Archives Registry
|
|
source_url: https://www.genealogiewerkbalk.nl/archieven.html
|
|
data_url: https://docs.google.com/spreadsheets/d/1rS_Z5L6L2vvfGLS6eHI8wfyiwB-KUfHEr7W1VNY3rpg/export?format=csv
|
|
data_tier: TIER_2_VERIFIED
|
|
enrichment_timestamp: '2025-12-03T13:51:55.225587+00:00'
|
|
match_method: google_maps_admin2
|
|
match_confidence: 0.95
|
|
municipality:
|
|
name: Noordwijk
|
|
code: '575'
|
|
municipal_archive:
|
|
name: Erfgoed Leiden en Omstreken
|
|
website: https://www.erfgoedleiden.nl/
|
|
isil: NL-LdnRAL
|
|
province:
|
|
name: Zuid-Holland
|
|
code: '28'
|
|
provincial_archive:
|
|
name: Nationaal Archief
|
|
website: https://www.nationaalarchief.nl/
|
|
digital_platforms:
|
|
- platform_name: Stichting Kurt Carlsen Website
|
|
platform_url: https://www.kurtcarlsen.nl/
|
|
platform_type: WEBSITE
|
|
platform_category:
|
|
- Organizational website
|
|
digital_collections: Organizational website
|
|
technology_stack: Atlantis
|
|
data_standards:
|
|
- HTML5
|
|
user_services: General information, Contact
|
|
sustainability_model: Institutional funding
|
|
enrichment_timestamp: '2025-12-05T11:22:23.273194+00:00'
|
|
source_method: automated_extraction
|
|
wikidata_enrichment:
|
|
wikidata_entity_id: Q112627165
|
|
api_metadata:
|
|
api_endpoint: https://www.wikidata.org/w/rest.php/wikibase/v1
|
|
fetch_timestamp: '2025-12-09T12:29:21.327538+00:00'
|
|
user_agent: GLAMDataExtractor/1.1 (glam-data@example.com) Python/httpx
|
|
enrichment_version: 2.0_full
|
|
properties_found:
|
|
- P31
|
|
- P18
|
|
- P373
|
|
- P856
|
|
- P1435
|
|
- P571
|
|
wikidata_labels:
|
|
nl: Kurt Carlsen
|
|
en: Kurt Carlsen
|
|
wikidata_label_en: Kurt Carlsen
|
|
wikidata_label_nl: Kurt Carlsen
|
|
wikidata_descriptions:
|
|
nl: Nederlandse spitsgatsloep en reddingsboot
|
|
en: Dutch lifeboat launched in 1953
|
|
wikidata_description_en: Dutch lifeboat launched in 1953
|
|
wikidata_aliases:
|
|
nl:
|
|
- Kurt Carlsen (schip, 1953)
|
|
wikidata_sitelinks:
|
|
nlwiki: Kurt Carlsen (schip, 1953)
|
|
commonswiki: Category:Kurt Carlsen (ship, 1953)
|
|
wikidata_temporal:
|
|
inception: '1953-00-00'
|
|
wikidata_inception: '1953-00-00'
|
|
wikidata_classification:
|
|
instance_of: &id001
|
|
- id: Q9588290
|
|
label: longboat
|
|
description: type of boat
|
|
- id: Q1746393
|
|
label: lifeboat
|
|
description: boat used primarily as an emergency means of leaving a larger boat
|
|
or ship in case of emergency scene
|
|
- id: Q1842295
|
|
label: Register Varend Erfgoed Nederland
|
|
description: ''
|
|
heritage_designation:
|
|
- id: Q2061317
|
|
label: varend erfgoed
|
|
description: monumentstatus cultureel erfgoed in Nederland
|
|
wikidata_instance_of: *id001
|
|
wikidata_web:
|
|
official_website: https://www.kurtcarlsen.nl/
|
|
wikidata_official_website: https://www.kurtcarlsen.nl/
|
|
wikidata_media:
|
|
image: Onthulling nieuwe reddingsboot te Noordwijk door Kurt Carlsen, Bestanddeelnr
|
|
905-7789.jpg
|
|
commons_category: Kurt Carlsen (ship, 1953)
|
|
wikidata_image: Onthulling nieuwe reddingsboot te Noordwijk door Kurt Carlsen, Bestanddeelnr
|
|
905-7789.jpg
|
|
timespan:
|
|
begin_of_the_begin: '1953-01-01T00:00:00Z'
|
|
end_of_the_begin: '1953-12-31T00:00:00Z'
|
|
begin_of_the_end: null
|
|
end_of_the_end: null
|
|
sources:
|
|
- 'Wikidata P571 (inception): https://www.wikidata.org/wiki/Q112627165'
|
|
notes: Stichting Kurt Carlsen founded 1953. Foundation preserving the rescue boat
|
|
named after Captain Kurt Carlsen, famous for his heroic efforts aboard the Flying
|
|
Enterprise in 1952
|
|
location:
|
|
latitude: 52.2301005
|
|
longitude: 4.4479627
|
|
coordinate_provenance:
|
|
source_type: GOOGLE_MAPS
|
|
source_path: google_maps_enrichment.coordinates
|
|
original_timestamp: '2025-11-28T10:00:26.615070+00:00'
|
|
entity_id: ChIJUzVDWYvAxUcRpTNAa6LsDyM
|
|
api_endpoint: https://maps.googleapis.com/maps/api/place/textsearch
|
|
city: Noordwijk
|
|
region: Zuid-Holland
|
|
region_code: ZH
|
|
country: NL
|
|
postal_code: 2201 PZ
|
|
street_address: Hofvennepark 5, Noordwijk
|
|
formatted_address: Hofvennepark 5, 2201 PZ Noordwijk
|
|
geonames_id: 2749816
|
|
geonames_name: Noordwijk
|
|
feature_code: PPL
|
|
normalization_timestamp: '2025-12-09T13:15:36.307672+00:00'
|
|
crawl4ai_enrichment:
|
|
retrieval_timestamp: '2025-12-14T18:49:31.294771+00:00'
|
|
retrieval_agent: crawl4ai
|
|
source_url: https://www.kurtcarlsen.nl/
|
|
status_code: null
|
|
error: Crawl failed with status None
|
|
digital_platform_v2:
|
|
transformation_metadata:
|
|
transformed_from: httpx_beautifulsoup
|
|
transformation_date: '2025-12-14T23:50:04.594210+00:00'
|
|
transformation_version: '2.1'
|
|
source_status_code: 200
|
|
primary_platform:
|
|
platform_id: primary_website_kurtcarlsen_nl
|
|
platform_name: Stichting Kurt Carlsen Website
|
|
platform_url: https://www.kurtcarlsen.nl/cms/
|
|
platform_type: DISCOVERY_PORTAL
|
|
description: ''
|
|
language: nl
|
|
og_image: null
|
|
favicon: null
|
|
navigation_links:
|
|
- https://www.kurtcarlsen.nl/cms
|
|
- https://www.kurtcarlsen.nl/cms/home
|
|
- https://www.kurtcarlsen.nl/cms/de-historie-van-de-kurt-carlsen/
|
|
- https://www.kurtcarlsen.nl/cms/boot-informatie/
|
|
- https://www.kurtcarlsen.nl/cms/vrijwilligers/
|
|
- https://www.kurtcarlsen.nl/cms/sponsors/
|
|
- https://www.kurtcarlsen.nl/cms/contact-donateurs/
|
|
- https://www.kurtcarlsen.nl/cms/gallery-2/
|
|
- https://www.kurtcarlsen.nl/cms/fotos-2010/
|
|
- https://www.kurtcarlsen.nl/cms/fotos-2011/
|
|
- https://www.kurtcarlsen.nl/cms/fotos-2012/
|
|
- https://www.kurtcarlsen.nl/cms/fotos-2013/
|
|
- https://www.kurtcarlsen.nl/cms/fotos-2014/
|
|
- https://www.kurtcarlsen.nl/cms/fotos-2015/
|
|
- https://www.kurtcarlsen.nl/cms/fotos-2016/
|
|
- https://www.kurtcarlsen.nl/cms/fotos-2017/
|
|
- https://www.kurtcarlsen.nl/cms/fotos-2018/
|
|
- https://www.kurtcarlsen.nl/cms/videos/
|
|
- https://www.kurtcarlsen.nl/cms/nieuws/
|
|
- https://www.kurtcarlsen.nl/cms/contact/
|
|
web_enrichments:
|
|
extraction_timestamp: '2025-12-13T19:48:10.164354+00:00'
|
|
extraction_method: hybrid_llm_pattern_layout_v1
|
|
confidence_threshold: 0.6
|
|
entities_count: 3
|
|
cleanup_applied: '2025-12-13T19:49:35.891941+00:00'
|
|
claims:
|
|
- entity: Stichting Kurt Carlsen
|
|
entity_type: GRP.ASS
|
|
xpath: /html/head/title
|
|
base_confidence: 0.95
|
|
layout_score: 0.15
|
|
pattern_score: 0.15
|
|
final_confidence: 1.0
|
|
layout_match: high_conf:head/title
|
|
- entity: https://www.kurtcarlsen.nl/cms/xmlrpc.php
|
|
entity_type: APP.URL
|
|
xpath: /html/head/link[3]/@href
|
|
base_confidence: 1.0
|
|
layout_score: 0.0
|
|
pattern_score: 0.0
|
|
final_confidence: 1.0
|
|
- entity: https://www.kurtcarlsen.nl/cms
|
|
entity_type: APP.URL
|
|
xpath: /html/head/link[11]/@href
|
|
base_confidence: 1.0
|
|
layout_score: 0.0
|
|
pattern_score: 0.0
|
|
final_confidence: 1.0
|
|
logo_enrichment:
|
|
enrichment_timestamp: '2025-12-22T12:23:00.071420+00:00'
|
|
source_url: https://www.kurtcarlsen.nl
|
|
extraction_method: crawl4ai
|
|
claims:
|
|
- claim_type: logo_url
|
|
claim_value: https://www.kurtcarlsen.nl/cms/wp-content/uploads/2023/03/logo_Kurt-Carlsen.jpg
|
|
source_url: https://www.kurtcarlsen.nl
|
|
css_selector: '#masthead > div.elementor.elementor-10243 > section.elementor-section.elementor-top-section
|
|
> div.elementor-container.elementor-column-gap-default > div.elementor-column.elementor-col-100
|
|
> div.elementor-widget-wrap.elementor-element-populated > section.elementor-section.elementor-inner-section
|
|
> div.elementor-container.elementor-column-gap-default > div.elementor-column.elementor-col-50
|
|
> div.elementor-widget-wrap.elementor-element-populated > div.elementor-element.elementor-element-2cd0afe
|
|
> div.elementor-widget-container > div.hfe-site-logo > a.elementor-clickable
|
|
> div.hfe-site-logo-set > div.hfe-site-logo-container > img.hfe-site-logo-img.elementor-animation-'
|
|
retrieved_on: '2025-12-22T12:23:00.071420+00:00'
|
|
extraction_method: crawl4ai_header_logo
|
|
detection_confidence: high
|
|
alt_text: ''
|
|
summary:
|
|
total_claims: 1
|
|
has_primary_logo: true
|
|
has_favicon: false
|
|
has_og_image: false
|
|
favicon_count: 0
|