glam/data/custodian/NL-ZH-NOO-N-KC.yaml
2026-01-18 01:23:32 +01:00

424 lines
14 KiB
YAML

original_entry:
plaatsnaam_bezoekadres: Noordwijk aan Zee
organisatie: Stichting Kurt Carlsen
systeem: Atlantis
versnellen: ja
reference:
- label: https://www.kurtcarlsen.nl/cms/
type:
- N
entry_index: 1160
processing_timestamp: '2025-11-27T16:48:03.232144+00:00'
enrichment_status: skipped
provenance:
schema_version: 1.0.0
generated_at: '2025-11-28T23:47:34.172445+00:00'
sources:
original_entry:
- source_type: nde_csv_registry
data_tier: TIER_1_AUTHORITATIVE
claims_extracted:
- plaatsnaam_bezoekadres
- organisatie
- systeem
- versnellen
- reference
- type
google_maps:
- source_type: google_maps_api
fetch_timestamp: '2025-11-28T10:00:26.615070+00:00'
api_endpoint: https://maps.googleapis.com/maps/api/place/textsearch
place_id: ChIJUzVDWYvAxUcRpTNAa6LsDyM
claims_extracted:
- coordinates
- formatted_address
- address_components
- business_status
- website
- phone
genealogiewerkbalk:
- source_type: genealogiewerkbalk_registry
fetch_timestamp: '2025-12-03T13:51:55.225603+00:00'
data_url: https://docs.google.com/spreadsheets/d/1rS_Z5L6L2vvfGLS6eHI8wfyiwB-KUfHEr7W1VNY3rpg/export?format=csv
match_method: google_maps_admin2
claims_extracted:
- municipality_name
- municipality_code
- municipal_archive_name
- municipal_archive_website
- municipal_archive_isil
- province_name
- province_code
- provincial_archive_name
- provincial_archive_website
data_tier_summary:
TIER_1_AUTHORITATIVE:
- original_entry (NDE CSV)
TIER_2_VERIFIED:
- wikidata_api
- google_maps_api
- genealogiewerkbalk_registry
TIER_3_CROWD_SOURCED: []
TIER_4_INFERRED:
- website_scrape
- exa_web_search
notes:
- Provenance tracking added retroactively
- claim_level_provenance available in sources section
- Canonical location normalized on 2025-12-09T13:15:36Z
skip_reason: no_wikidata_id
google_maps_enrichment:
place_id: ChIJUzVDWYvAxUcRpTNAa6LsDyM
name: Stichting Kurt Carlsen
fetch_timestamp: '2025-11-28T10:00:26.615070+00:00'
api_status: OK
coordinates:
latitude: 52.2301005
longitude: 4.4479627
formatted_address: Hofvennepark 5, 2201 PZ Noordwijk
short_address: Hofvennepark 5, Noordwijk
address_components:
- long_name: '5'
short_name: '5'
types:
- street_number
- long_name: Hofvennepark
short_name: Hofvennepark
types:
- route
- long_name: Noordwijk
short_name: Noordwijk
types:
- locality
- political
- long_name: Noordwijk
short_name: Noordwijk
types:
- administrative_area_level_2
- political
- long_name: Zuid-Holland
short_name: ZH
types:
- administrative_area_level_1
- political
- long_name: Nederland
short_name: NL
types:
- country
- political
- long_name: 2201 PZ
short_name: 2201 PZ
types:
- postal_code
phone_local: 015 662 4079
phone_international: +31 15 662 4079
website: https://www.kurtcarlsen.nl/
google_place_types:
- point_of_interest
- establishment
business_status: OPERATIONAL
google_maps_url: https://maps.google.com/?cid=2526498098306364325&g_mp=Cidnb29nbGUubWFwcy5wbGFjZXMudjEuUGxhY2VzLlNlYXJjaFRleHQQAhgEIAA
street_view_url: https://maps.googleapis.com/maps/api/streetview?size=600x400&location=52.2301005,4.4479627&key=AIzaSyAHuazNth9ZvfRFYk5-v49CwXwhABH8Ri0
icon_mask_uri: https://maps.gstatic.com/mapfiles/place_api/icons/v2/generic_pinlet
icon_background_color: '#7B9EB0'
utc_offset_minutes: 60
google_maps_status: SUCCESS
google_maps_search_query: Stichting Kurt Carlsen, Noordwijk aan Zee, Netherlands
web_enrichment:
web_archives:
- url: https://www.kurtcarlsen.nl/cms/
directory: web/1160/kurtcarlsen.nl
pages_archived: 28
archive_method: wget_warc_deep
warc_file: archive.warc.gz
warc_size_bytes: 1676326
warc_format: ISO 28500
full_site_archive_timestamp: '2025-11-29T18:25:00.975116+00:00'
ghcid:
ghcid_current: NL-ZH-NOO-N-KC
ghcid_original: NL-ZH-NOO-N-KC
ghcid_uuid: 400d70ba-f87a-55b4-be57-b782a8262061
ghcid_uuid_sha256: 8e46965d-3b28-8903-8c62-f080b35e2449
ghcid_numeric: 10252046928924162307
record_id: 019adf94-d2fc-7a97-ac27-5265d40b99a6
generation_timestamp: '2025-12-02T14:56:45.615377+00:00'
ghcid_history:
- ghcid: NL-ZH-NOO-N-KC
ghcid_numeric: 10252046928924162307
valid_from: '2025-12-02T14:56:45.615377+00:00'
valid_to: null
reason: GHCID regenerated with Google Maps locality fix (Dec 2025)
location_resolution:
method: GOOGLE_MAPS_LOCALITY
google_maps_locality: Noordwijk
geonames_id: 2749816
geonames_name: Noordwijk
feature_code: PPL
population: 235
admin1_code: '04'
region_code: ZH
country_code: NL
source_coordinates:
latitude: 52.2301005
longitude: 4.4479627
source: google_maps
geonames_id: 2749816
identifiers:
- identifier_scheme: GHCID
identifier_value: NL-ZH-NOO-N-KC
- identifier_scheme: GHCID_UUID
identifier_value: 400d70ba-f87a-55b4-be57-b782a8262061
identifier_url: urn:uuid:400d70ba-f87a-55b4-be57-b782a8262061
- identifier_scheme: GHCID_UUID_SHA256
identifier_value: 8e46965d-3b28-8903-8c62-f080b35e2449
identifier_url: urn:uuid:8e46965d-3b28-8903-8c62-f080b35e2449
- identifier_scheme: GHCID_NUMERIC
identifier_value: '10252046928924162307'
- identifier_scheme: RECORD_ID
identifier_value: 019adf94-d2fc-7a97-ac27-5265d40b99a6
identifier_url: urn:uuid:019adf94-d2fc-7a97-ac27-5265d40b99a6
custodian_name:
claim_type: custodian_name
claim_value: Kurt Carlsen
source: google_maps
confidence: 0.466
consensus_method: true
sources_checked: 29
sources_matched: 4
extraction_timestamp: '2025-12-02T13:08:59.565659+00:00'
matching_sources:
- source: original_entry
name: Kurt Carlsen
score: 1.0
- source: web_title_tag
name: Kurt Carlsen
score: 1.0
- source: web_title_tag
name: De historie van de Kurt Carlsen
score: 1.0
previous_value: Stichting Kurt Carlsen
previous_source: web_title_tag
custodian_legal_name:
claim_type: legal_name
claim_value: Stichting Kurt Carlsen
extraction_timestamp: '2025-12-02T13:08:59.565673+00:00'
note: Legal form detected in source name (e.g., Stichting, Vereniging, B.V.)
genealogiewerkbalk_enrichment:
source: Genealogiewerkbalk.nl Municipality Archives Registry
source_url: https://www.genealogiewerkbalk.nl/archieven.html
data_url: https://docs.google.com/spreadsheets/d/1rS_Z5L6L2vvfGLS6eHI8wfyiwB-KUfHEr7W1VNY3rpg/export?format=csv
data_tier: TIER_2_VERIFIED
enrichment_timestamp: '2025-12-03T13:51:55.225587+00:00'
match_method: google_maps_admin2
match_confidence: 0.95
municipality:
name: Noordwijk
code: '575'
municipal_archive:
name: Erfgoed Leiden en Omstreken
website: https://www.erfgoedleiden.nl/
isil: NL-LdnRAL
province:
name: Zuid-Holland
code: '28'
provincial_archive:
name: Nationaal Archief
website: https://www.nationaalarchief.nl/
digital_platforms:
- platform_name: Stichting Kurt Carlsen Website
platform_url: https://www.kurtcarlsen.nl/
platform_type: WEBSITE
platform_category:
- Organizational website
digital_collections: Organizational website
technology_stack: Atlantis
data_standards:
- HTML5
user_services: General information, Contact
sustainability_model: Institutional funding
enrichment_timestamp: '2025-12-05T11:22:23.273194+00:00'
source_method: automated_extraction
wikidata_enrichment:
wikidata_entity_id: Q112627165
api_metadata:
api_endpoint: https://www.wikidata.org/w/rest.php/wikibase/v1
fetch_timestamp: '2025-12-09T12:29:21.327538+00:00'
user_agent: GLAMDataExtractor/1.1 (glam-data@example.com) Python/httpx
enrichment_version: 2.0_full
properties_found:
- P31
- P18
- P373
- P856
- P1435
- P571
wikidata_labels:
nl: Kurt Carlsen
en: Kurt Carlsen
wikidata_label_en: Kurt Carlsen
wikidata_label_nl: Kurt Carlsen
wikidata_descriptions:
nl: Nederlandse spitsgatsloep en reddingsboot
en: Dutch lifeboat launched in 1953
wikidata_description_en: Dutch lifeboat launched in 1953
wikidata_aliases:
nl:
- Kurt Carlsen (schip, 1953)
wikidata_sitelinks:
nlwiki: Kurt Carlsen (schip, 1953)
commonswiki: Category:Kurt Carlsen (ship, 1953)
wikidata_temporal:
inception: '1953-00-00'
wikidata_inception: '1953-00-00'
wikidata_classification:
instance_of: &id001
- id: Q9588290
label: longboat
description: type of boat
- id: Q1746393
label: lifeboat
description: boat used primarily as an emergency means of leaving a larger boat
or ship in case of emergency scene
- id: Q1842295
label: Register Varend Erfgoed Nederland
description: ''
heritage_designation:
- id: Q2061317
label: varend erfgoed
description: monumentstatus cultureel erfgoed in Nederland
wikidata_instance_of: *id001
wikidata_web:
official_website: https://www.kurtcarlsen.nl/
wikidata_official_website: https://www.kurtcarlsen.nl/
wikidata_media:
image: Onthulling nieuwe reddingsboot te Noordwijk door Kurt Carlsen, Bestanddeelnr
905-7789.jpg
commons_category: Kurt Carlsen (ship, 1953)
wikidata_image: Onthulling nieuwe reddingsboot te Noordwijk door Kurt Carlsen, Bestanddeelnr
905-7789.jpg
timespan:
begin_of_the_begin: '1953-01-01T00:00:00Z'
end_of_the_begin: '1953-12-31T00:00:00Z'
begin_of_the_end: null
end_of_the_end: null
sources:
- 'Wikidata P571 (inception): https://www.wikidata.org/wiki/Q112627165'
notes: Stichting Kurt Carlsen founded 1953. Foundation preserving the rescue boat
named after Captain Kurt Carlsen, famous for his heroic efforts aboard the Flying
Enterprise in 1952
location:
latitude: 52.2301005
longitude: 4.4479627
coordinate_provenance:
source_type: GOOGLE_MAPS
source_path: google_maps_enrichment.coordinates
original_timestamp: '2025-11-28T10:00:26.615070+00:00'
entity_id: ChIJUzVDWYvAxUcRpTNAa6LsDyM
api_endpoint: https://maps.googleapis.com/maps/api/place/textsearch
city: Noordwijk
region: Zuid-Holland
region_code: ZH
country: NL
postal_code: 2201 PZ
street_address: Hofvennepark 5, Noordwijk
formatted_address: Hofvennepark 5, 2201 PZ Noordwijk
geonames_id: 2749816
geonames_name: Noordwijk
feature_code: PPL
normalization_timestamp: '2025-12-09T13:15:36.307672+00:00'
crawl4ai_enrichment:
retrieval_timestamp: '2025-12-14T18:49:31.294771+00:00'
retrieval_agent: crawl4ai
source_url: https://www.kurtcarlsen.nl/
status_code: null
error: Crawl failed with status None
digital_platform_v2:
transformation_metadata:
transformed_from: httpx_beautifulsoup
transformation_date: '2025-12-14T23:50:04.594210+00:00'
transformation_version: '2.1'
source_status_code: 200
primary_platform:
platform_id: primary_website_kurtcarlsen_nl
platform_name: Stichting Kurt Carlsen Website
platform_url: https://www.kurtcarlsen.nl/cms/
platform_type: DISCOVERY_PORTAL
description: ''
language: nl
og_image: null
favicon: null
navigation_links:
- https://www.kurtcarlsen.nl/cms
- https://www.kurtcarlsen.nl/cms/home
- https://www.kurtcarlsen.nl/cms/de-historie-van-de-kurt-carlsen/
- https://www.kurtcarlsen.nl/cms/boot-informatie/
- https://www.kurtcarlsen.nl/cms/vrijwilligers/
- https://www.kurtcarlsen.nl/cms/sponsors/
- https://www.kurtcarlsen.nl/cms/contact-donateurs/
- https://www.kurtcarlsen.nl/cms/gallery-2/
- https://www.kurtcarlsen.nl/cms/fotos-2010/
- https://www.kurtcarlsen.nl/cms/fotos-2011/
- https://www.kurtcarlsen.nl/cms/fotos-2012/
- https://www.kurtcarlsen.nl/cms/fotos-2013/
- https://www.kurtcarlsen.nl/cms/fotos-2014/
- https://www.kurtcarlsen.nl/cms/fotos-2015/
- https://www.kurtcarlsen.nl/cms/fotos-2016/
- https://www.kurtcarlsen.nl/cms/fotos-2017/
- https://www.kurtcarlsen.nl/cms/fotos-2018/
- https://www.kurtcarlsen.nl/cms/videos/
- https://www.kurtcarlsen.nl/cms/nieuws/
- https://www.kurtcarlsen.nl/cms/contact/
web_enrichments:
extraction_timestamp: '2025-12-13T19:48:10.164354+00:00'
extraction_method: hybrid_llm_pattern_layout_v1
confidence_threshold: 0.6
entities_count: 3
cleanup_applied: '2025-12-13T19:49:35.891941+00:00'
claims:
- entity: Stichting Kurt Carlsen
entity_type: GRP.ASS
xpath: /html/head/title
base_confidence: 0.95
layout_score: 0.15
pattern_score: 0.15
final_confidence: 1.0
layout_match: high_conf:head/title
- entity: https://www.kurtcarlsen.nl/cms/xmlrpc.php
entity_type: APP.URL
xpath: /html/head/link[3]/@href
base_confidence: 1.0
layout_score: 0.0
pattern_score: 0.0
final_confidence: 1.0
- entity: https://www.kurtcarlsen.nl/cms
entity_type: APP.URL
xpath: /html/head/link[11]/@href
base_confidence: 1.0
layout_score: 0.0
pattern_score: 0.0
final_confidence: 1.0
logo_enrichment:
enrichment_timestamp: '2025-12-22T12:23:00.071420+00:00'
source_url: https://www.kurtcarlsen.nl
extraction_method: crawl4ai
claims:
- claim_type: logo_url
claim_value: https://www.kurtcarlsen.nl/cms/wp-content/uploads/2023/03/logo_Kurt-Carlsen.jpg
source_url: https://www.kurtcarlsen.nl
css_selector: '#masthead > div.elementor.elementor-10243 > section.elementor-section.elementor-top-section
> div.elementor-container.elementor-column-gap-default > div.elementor-column.elementor-col-100
> div.elementor-widget-wrap.elementor-element-populated > section.elementor-section.elementor-inner-section
> div.elementor-container.elementor-column-gap-default > div.elementor-column.elementor-col-50
> div.elementor-widget-wrap.elementor-element-populated > div.elementor-element.elementor-element-2cd0afe
> div.elementor-widget-container > div.hfe-site-logo > a.elementor-clickable
> div.hfe-site-logo-set > div.hfe-site-logo-container > img.hfe-site-logo-img.elementor-animation-'
retrieved_on: '2025-12-22T12:23:00.071420+00:00'
extraction_method: crawl4ai_header_logo
detection_confidence: high
alt_text: ''
summary:
total_claims: 1
has_primary_logo: true
has_favicon: false
has_og_image: false
favicon_count: 0