glam/data/nde/enriched/entries/1021_unknown.yaml
2025-12-05 15:30:23 +01:00

382 lines
14 KiB
YAML

original_entry:
organisatie: Club van Suikerzakjesverzamelaars in Nederland
collectie_nederland: ja
reference:
- label: https://www.suikerzak.nl/
type:
- S
entry_index: 1021
processing_timestamp: '2025-11-27T16:43:59.817431+00:00'
enrichment_status: skipped
provenance:
schema_version: 1.0.0
generated_at: '2025-11-28T23:47:30.547276+00:00'
sources:
original_entry:
- source_type: nde_csv_registry
data_tier: TIER_1_AUTHORITATIVE
claims_extracted:
- organisatie
- collectie_nederland
- reference
- type
google_maps:
- source_type: google_maps_api
fetch_timestamp: '2025-11-28T09:58:58.954001+00:00'
api_endpoint: https://maps.googleapis.com/maps/api/place/textsearch
place_id: ChIJWzo_OP9mxkcRP9DdY57bTtM
claims_extracted:
- coordinates
- formatted_address
- address_components
- business_status
- website
- phone
- rating
- reviews
- opening_hours
genealogiewerkbalk:
- source_type: genealogiewerkbalk_registry
fetch_timestamp: '2025-12-03T13:51:42.061162+00:00'
data_url: https://docs.google.com/spreadsheets/d/1rS_Z5L6L2vvfGLS6eHI8wfyiwB-KUfHEr7W1VNY3rpg/export?format=csv
match_method: google_maps_admin2
claims_extracted:
- municipality_name
- municipality_code
- municipal_archive_name
- municipal_archive_website
- municipal_archive_isil
- province_name
- province_code
- provincial_archive_name
- provincial_archive_website
data_tier_summary:
TIER_1_AUTHORITATIVE:
- original_entry (NDE CSV)
TIER_2_VERIFIED:
- wikidata_api
- google_maps_api
- genealogiewerkbalk_registry
TIER_3_CROWD_SOURCED: []
TIER_4_INFERRED:
- website_scrape
- exa_web_search
notes:
- Provenance tracking added retroactively
- claim_level_provenance available in sources section
skip_reason: no_wikidata_id
google_maps_enrichment:
place_id: ChIJWzo_OP9mxkcRP9DdY57bTtM
name: Club van Suikerzakjesverzamelaars in Nederland
fetch_timestamp: '2025-11-28T09:58:58.954001+00:00'
api_status: OK
coordinates:
latitude: 52.0339982
longitude: 5.1726966999999995
formatted_address: De Fuik 29, 3995 BJ Houten
short_address: De Fuik 29, Houten
address_components:
- long_name: '29'
short_name: '29'
types:
- street_number
- long_name: De Fuik
short_name: De Fuik
types:
- route
- long_name: Houten
short_name: Houten
types:
- locality
- political
- long_name: Houten
short_name: Houten
types:
- administrative_area_level_2
- political
- long_name: Utrecht
short_name: UT
types:
- administrative_area_level_1
- political
- long_name: Nederland
short_name: NL
types:
- country
- political
- long_name: 3995 BJ
short_name: 3995 BJ
types:
- postal_code
phone_local: 06 22111485
phone_international: +31 6 22111485
website: http://www.suikerzak.nl/
google_place_types:
- point_of_interest
- store
- establishment
primary_type: store
business_status: OPERATIONAL
opening_hours:
open_now: true
periods:
- open:
day: 0
hour: 0
minute: 0
weekday_text:
- 'maandag: 24 uur geopend'
- 'dinsdag: 24 uur geopend'
- 'woensdag: 24 uur geopend'
- 'donderdag: 24 uur geopend'
- 'vrijdag: 24 uur geopend'
- 'zaterdag: 24 uur geopend'
- 'zondag: 24 uur geopend'
rating: 5
total_ratings: 1
reviews:
- author_name: P.J V Krieken
author_uri: https://www.google.com/maps/contrib/103613345661508403588/reviews
rating: 5
relative_time_description: 7 maanden geleden
text: Leuke site en dat helemaal opgezet vj hobby en met een catalogus van alle
bekend zijnde suikerzakjes. (Ned.erfgoed )
publish_time: '2025-04-16T14:08:41.123310Z'
google_maps_url: https://maps.google.com/?cid=15226348863513022527&g_mp=Cidnb29nbGUubWFwcy5wbGFjZXMudjEuUGxhY2VzLlNlYXJjaFRleHQQAhgEIAA
street_view_url: https://maps.googleapis.com/maps/api/streetview?size=600x400&location=52.0339982,5.1726966999999995&key=AIzaSyAHuazNth9ZvfRFYk5-v49CwXwhABH8Ri0
icon_mask_uri: https://maps.gstatic.com/mapfiles/place_api/icons/v2/shopping_pinlet
icon_background_color: '#4B96F3'
utc_offset_minutes: 60
google_maps_status: SUCCESS
google_maps_search_query: Club van Suikerzakjesverzamelaars in Nederland, Netherlands
web_enrichment:
web_archives:
- url: https://www.suikerzak.nl/
directory: web/1021/suikerzak.nl
pages_archived: 13
archive_method: wget_warc_deep
warc_file: archive.warc.gz
warc_size_bytes: 109629
warc_format: ISO 28500
full_site_archive_timestamp: '2025-11-29T17:46:40.278592+00:00'
ghcid:
ghcid_current: NL-UT-HOU-S-CSN
ghcid_original: NL-UT-HOU-S-CSN
ghcid_uuid: 1754a45a-8bf0-569e-9c6b-8c1b65e63c70
ghcid_uuid_sha256: 5cc2a09d-0cfb-8ad5-a5c6-5a3e8d4a69e3
ghcid_numeric: 6684081393359330005
record_id: 019adf94-bae2-7a75-a550-1a466f6b1663
generation_timestamp: '2025-12-02T14:56:45.615377+00:00'
ghcid_history:
- ghcid: NL-UT-HOU-S-CSN
ghcid_numeric: 6684081393359330005
valid_from: '2025-12-02T14:56:45.615377+00:00'
valid_to: null
reason: GHCID regenerated with Google Maps locality fix (Dec 2025)
location_resolution:
method: GOOGLE_MAPS_LOCALITY
google_maps_locality: Houten
geonames_id: 2753557
geonames_name: Houten
feature_code: PPL
population: 1335
admin1_code: 09
region_code: UT
country_code: NL
source_coordinates:
latitude: 52.0339982
longitude: 5.1726966999999995
source: google_maps
geonames_id: 2753557
identifiers:
- identifier_scheme: GHCID
identifier_value: NL-UT-HOU-S-CSN
- identifier_scheme: GHCID_UUID
identifier_value: 1754a45a-8bf0-569e-9c6b-8c1b65e63c70
identifier_url: urn:uuid:1754a45a-8bf0-569e-9c6b-8c1b65e63c70
- identifier_scheme: GHCID_UUID_SHA256
identifier_value: 5cc2a09d-0cfb-8ad5-a5c6-5a3e8d4a69e3
identifier_url: urn:uuid:5cc2a09d-0cfb-8ad5-a5c6-5a3e8d4a69e3
- identifier_scheme: GHCID_NUMERIC
identifier_value: '6684081393359330005'
- identifier_scheme: RECORD_ID
identifier_value: 019adf94-bae2-7a75-a550-1a466f6b1663
identifier_url: urn:uuid:019adf94-bae2-7a75-a550-1a466f6b1663
web_claims:
extraction_timestamp: '2025-12-02T08:49:54.348212+00:00'
source_archive: web/1021/suikerzak.nl
claims_count: 12
claims:
- claim_type: org_name
claim_value: Club van Suikerzakjesverzamelaars in Nederland
raw_value: Club van Suikerzakjesverzamelaars in Nederland
source_url: https://www.suikerzak.nl/
retrieved_on: '2025-11-29T17:46:40.094028+00:00'
xpath: /html/head/title
html_file: web/1021/suikerzak.nl/pages/index.html@start=99.tmp.html
xpath_match_score: 1.0
extraction_method: title_tag
extraction_timestamp: '2025-12-02T08:49:54.169810+00:00'
- claim_type: description_short
claim_value: Website van de Club van Suikerzakjesverzamelaars in Nederland
raw_value: Website van de Club van Suikerzakjesverzamelaars in Nederland
source_url: https://www.suikerzak.nl/
retrieved_on: '2025-11-29T17:46:40.094028+00:00'
xpath: /html/head/meta[7]
html_file: web/1021/suikerzak.nl/pages/index.html@start=99.tmp.html
xpath_match_score: 1.0
extraction_method: meta_description
extraction_timestamp: '2025-12-02T08:49:54.169941+00:00'
- claim_type: social_facebook
claim_value: https://www.facebook.com/ttfestivalassen
raw_value: https://www.facebook.com/ttfestivalassen
source_url: https://www.suikerzak.nl/
retrieved_on: '2025-11-29T17:46:40.094028+00:00'
xpath: /html/body/div/div[3]/div/div[2]/section/div[9]/article/p[1]/a
html_file: web/1021/suikerzak.nl/pages/index.html@start=99.tmp.html
xpath_match_score: 1.0
extraction_method: social_link
extraction_timestamp: '2025-12-02T08:49:54.170412+00:00'
- claim_type: video_youtube
claim_value: https://www.youtube.com/watch?v=TSP0e5rXUl8
raw_value: https://www.youtube.com/embed/TSP0e5rXUl8
source_url: https://www.suikerzak.nl/
retrieved_on: '2025-11-29T17:46:40.094028+00:00'
xpath: /html/body/div/div[3]/div/div[2]/section/div[1]/article/p[2]/iframe
html_file: web/1021/suikerzak.nl/pages/index.html@start=99.tmp.html
xpath_match_score: 1.0
extraction_method: youtube_iframe
extraction_timestamp: '2025-12-02T08:49:54.170606+00:00'
- claim_type: page_title
claim_value: Club van Suikerzakjesverzamelaars in Nederland
raw_value: Club van Suikerzakjesverzamelaars in Nederland
source_url: https://www.suikerzak.nl/
retrieved_on: '2025-11-29T17:46:40.094028+00:00'
xpath: /html/head/title
html_file: web/1021/suikerzak.nl/pages/index.html@start=99.tmp.html
xpath_match_score: 1.0
extraction_method: title_tag_full
extraction_timestamp: '2025-12-02T08:49:54.175014+00:00'
- claim_type: favicon
claim_value: /templates/suikerzakjes2016/favicon.ico
raw_value: type=image/vnd.microsoft.icon
source_url: https://www.suikerzak.nl/
retrieved_on: '2025-11-29T17:46:40.094028+00:00'
xpath: /html/head/link[6]
html_file: web/1021/suikerzak.nl/pages/index.html@start=99.tmp.html
xpath_match_score: 1.0
extraction_method: favicon_link
extraction_timestamp: '2025-12-02T08:49:54.175147+00:00'
- claim_type: favicon
claim_value: /images/template/engage.png
raw_value: /images/template/engage.png
source_url: https://www.suikerzak.nl/
retrieved_on: '2025-11-29T17:46:40.094028+00:00'
xpath: /html/head/link[3]
html_file: web/1021/suikerzak.nl/pages/index.html@start=99.tmp.html
xpath_match_score: 1.0
extraction_method: favicon_link
extraction_timestamp: '2025-12-02T08:49:54.175329+00:00'
- claim_type: email
claim_value: verkaaik2@gmail.com
raw_value: verkaaik2@gmail.com
source_url: https://www.suikerzak.nl/
retrieved_on: '2025-11-29T17:46:40.094028+00:00'
xpath: /html/body/div/div[3]/div/div[2]/section/div[6]/article/p[1]/a[1]
html_file: web/1021/suikerzak.nl/pages/index.html@start=55.tmp.html
xpath_match_score: 1.0
extraction_method: mailto_link
extraction_timestamp: '2025-12-02T08:49:54.197918+00:00'
- claim_type: social_facebook
claim_value: https://www.facebook.com/suikerzak
raw_value: https://www.facebook.com/suikerzak
source_url: https://www.suikerzak.nl/
retrieved_on: '2025-11-29T17:46:40.094028+00:00'
xpath: /html/body/div/div[3]/div/div[2]/section/div[6]/article/p[2]/a
html_file: web/1021/suikerzak.nl/pages/index.html@start=110.tmp.html
xpath_match_score: 1.0
extraction_method: social_link
extraction_timestamp: '2025-12-02T08:49:54.211903+00:00'
- claim_type: social_facebook
claim_value: https://www.facebook.com/ttfestivalassen/
raw_value: https://www.facebook.com/ttfestivalassen/
source_url: https://www.suikerzak.nl/
retrieved_on: '2025-11-29T17:46:40.094028+00:00'
xpath: /html/body/div/div[3]/div/div[2]/section/div[10]/article/p[2]/a
html_file: web/1021/suikerzak.nl/pages/index.html@start=88.tmp.html
xpath_match_score: 1.0
extraction_method: social_link
extraction_timestamp: '2025-12-02T08:49:54.219259+00:00'
- claim_type: social_facebook
claim_value: https://www.facebook.com/pg/Verzamelkrant/about/?ref=page_internal
raw_value: https://www.facebook.com/pg/Verzamelkrant/about/?ref=page_internal
source_url: https://www.suikerzak.nl/
retrieved_on: '2025-11-29T17:46:40.094028+00:00'
xpath: /html/body/div/div[3]/div/div[2]/section/div[5]/article/p[2]/a[2]
html_file: web/1021/suikerzak.nl/pages/index.html@start=66.tmp.html
xpath_match_score: 1.0
extraction_method: social_link
extraction_timestamp: '2025-12-02T08:49:54.236761+00:00'
- claim_type: video_youtube
claim_value: https://www.youtube.com/watch?v=aFV9lo1m5HE
raw_value: https://www.youtube.com/embed/aFV9lo1m5HE
source_url: https://www.suikerzak.nl/
retrieved_on: '2025-11-29T17:46:40.094028+00:00'
xpath: /html/body/div/div[3]/div/div[2]/section/div[4]/article/p[4]/iframe
html_file: web/1021/suikerzak.nl/pages/index.html@start=66.tmp.html
xpath_match_score: 1.0
extraction_method: youtube_iframe
extraction_timestamp: '2025-12-02T08:49:54.236865+00:00'
custodian_name:
claim_type: custodian_name
claim_value: Club van Suikerzakjesverzamelaars in Nederland
source: web_title_tag
confidence: 0.8
consensus_method: true
sources_checked: 3
sources_matched: 3
extraction_timestamp: '2025-12-02T13:08:44.258272+00:00'
matching_sources:
- source: google_maps
name: Club van Suikerzakjesverzamelaars in Nederland
score: 1.0
- source: original_entry
name: Club van Suikerzakjesverzamelaars in Nederland
score: 1.0
genealogiewerkbalk_enrichment:
source: Genealogiewerkbalk.nl Municipality Archives Registry
source_url: https://www.genealogiewerkbalk.nl/archieven.html
data_url: https://docs.google.com/spreadsheets/d/1rS_Z5L6L2vvfGLS6eHI8wfyiwB-KUfHEr7W1VNY3rpg/export?format=csv
data_tier: TIER_2_VERIFIED
enrichment_timestamp: '2025-12-03T13:51:42.061149+00:00'
match_method: google_maps_admin2
match_confidence: 0.95
municipality:
name: Houten
code: '321'
municipal_archive:
name: Regionaal Archief Zuid-Utrecht
website: https://www.razu.nl/
isil: null
isil_note: geenRAZU
province:
name: Utrecht
code: '26'
provincial_archive:
name: Het Utrechts Archief
website: https://hetutrechtsarchief.nl/
extra_info: Kijk voor meer info over archieven in Utrecht op https://www.landschaperfgoedutrecht.nl/erfgoed/historische-verenigingen-en-archieven/archieven/
digital_platforms:
- platform_name: Club van Suikerzakjesverzamelaars in Nederland Website
platform_url: http://www.suikerzak.nl/
platform_type: WEBSITE
platform_category:
- Organizational website
digital_collections: Organizational website
technology_stack: Standard web technology
data_standards:
- HTML5
user_services: General information, Contact
sustainability_model: Institutional funding
enrichment_timestamp: '2025-12-05T11:21:46.303886+00:00'
source_method: automated_extraction