382 lines
14 KiB
YAML
382 lines
14 KiB
YAML
original_entry:
|
|
organisatie: Club van Suikerzakjesverzamelaars in Nederland
|
|
collectie_nederland: ja
|
|
reference:
|
|
- label: https://www.suikerzak.nl/
|
|
type:
|
|
- S
|
|
entry_index: 1021
|
|
processing_timestamp: '2025-11-27T16:43:59.817431+00:00'
|
|
enrichment_status: skipped
|
|
provenance:
|
|
schema_version: 1.0.0
|
|
generated_at: '2025-11-28T23:47:30.547276+00:00'
|
|
sources:
|
|
original_entry:
|
|
- source_type: nde_csv_registry
|
|
data_tier: TIER_1_AUTHORITATIVE
|
|
claims_extracted:
|
|
- organisatie
|
|
- collectie_nederland
|
|
- reference
|
|
- type
|
|
google_maps:
|
|
- source_type: google_maps_api
|
|
fetch_timestamp: '2025-11-28T09:58:58.954001+00:00'
|
|
api_endpoint: https://maps.googleapis.com/maps/api/place/textsearch
|
|
place_id: ChIJWzo_OP9mxkcRP9DdY57bTtM
|
|
claims_extracted:
|
|
- coordinates
|
|
- formatted_address
|
|
- address_components
|
|
- business_status
|
|
- website
|
|
- phone
|
|
- rating
|
|
- reviews
|
|
- opening_hours
|
|
genealogiewerkbalk:
|
|
- source_type: genealogiewerkbalk_registry
|
|
fetch_timestamp: '2025-12-03T13:51:42.061162+00:00'
|
|
data_url: https://docs.google.com/spreadsheets/d/1rS_Z5L6L2vvfGLS6eHI8wfyiwB-KUfHEr7W1VNY3rpg/export?format=csv
|
|
match_method: google_maps_admin2
|
|
claims_extracted:
|
|
- municipality_name
|
|
- municipality_code
|
|
- municipal_archive_name
|
|
- municipal_archive_website
|
|
- municipal_archive_isil
|
|
- province_name
|
|
- province_code
|
|
- provincial_archive_name
|
|
- provincial_archive_website
|
|
data_tier_summary:
|
|
TIER_1_AUTHORITATIVE:
|
|
- original_entry (NDE CSV)
|
|
TIER_2_VERIFIED:
|
|
- wikidata_api
|
|
- google_maps_api
|
|
- genealogiewerkbalk_registry
|
|
TIER_3_CROWD_SOURCED: []
|
|
TIER_4_INFERRED:
|
|
- website_scrape
|
|
- exa_web_search
|
|
notes:
|
|
- Provenance tracking added retroactively
|
|
- claim_level_provenance available in sources section
|
|
skip_reason: no_wikidata_id
|
|
google_maps_enrichment:
|
|
place_id: ChIJWzo_OP9mxkcRP9DdY57bTtM
|
|
name: Club van Suikerzakjesverzamelaars in Nederland
|
|
fetch_timestamp: '2025-11-28T09:58:58.954001+00:00'
|
|
api_status: OK
|
|
coordinates:
|
|
latitude: 52.0339982
|
|
longitude: 5.1726966999999995
|
|
formatted_address: De Fuik 29, 3995 BJ Houten
|
|
short_address: De Fuik 29, Houten
|
|
address_components:
|
|
- long_name: '29'
|
|
short_name: '29'
|
|
types:
|
|
- street_number
|
|
- long_name: De Fuik
|
|
short_name: De Fuik
|
|
types:
|
|
- route
|
|
- long_name: Houten
|
|
short_name: Houten
|
|
types:
|
|
- locality
|
|
- political
|
|
- long_name: Houten
|
|
short_name: Houten
|
|
types:
|
|
- administrative_area_level_2
|
|
- political
|
|
- long_name: Utrecht
|
|
short_name: UT
|
|
types:
|
|
- administrative_area_level_1
|
|
- political
|
|
- long_name: Nederland
|
|
short_name: NL
|
|
types:
|
|
- country
|
|
- political
|
|
- long_name: 3995 BJ
|
|
short_name: 3995 BJ
|
|
types:
|
|
- postal_code
|
|
phone_local: 06 22111485
|
|
phone_international: +31 6 22111485
|
|
website: http://www.suikerzak.nl/
|
|
google_place_types:
|
|
- point_of_interest
|
|
- store
|
|
- establishment
|
|
primary_type: store
|
|
business_status: OPERATIONAL
|
|
opening_hours:
|
|
open_now: true
|
|
periods:
|
|
- open:
|
|
day: 0
|
|
hour: 0
|
|
minute: 0
|
|
weekday_text:
|
|
- 'maandag: 24 uur geopend'
|
|
- 'dinsdag: 24 uur geopend'
|
|
- 'woensdag: 24 uur geopend'
|
|
- 'donderdag: 24 uur geopend'
|
|
- 'vrijdag: 24 uur geopend'
|
|
- 'zaterdag: 24 uur geopend'
|
|
- 'zondag: 24 uur geopend'
|
|
rating: 5
|
|
total_ratings: 1
|
|
reviews:
|
|
- author_name: P.J V Krieken
|
|
author_uri: https://www.google.com/maps/contrib/103613345661508403588/reviews
|
|
rating: 5
|
|
relative_time_description: 7 maanden geleden
|
|
text: Leuke site en dat helemaal opgezet vj hobby en met een catalogus van alle
|
|
bekend zijnde suikerzakjes. (Ned.erfgoed )
|
|
publish_time: '2025-04-16T14:08:41.123310Z'
|
|
google_maps_url: https://maps.google.com/?cid=15226348863513022527&g_mp=Cidnb29nbGUubWFwcy5wbGFjZXMudjEuUGxhY2VzLlNlYXJjaFRleHQQAhgEIAA
|
|
street_view_url: https://maps.googleapis.com/maps/api/streetview?size=600x400&location=52.0339982,5.1726966999999995&key=AIzaSyAHuazNth9ZvfRFYk5-v49CwXwhABH8Ri0
|
|
icon_mask_uri: https://maps.gstatic.com/mapfiles/place_api/icons/v2/shopping_pinlet
|
|
icon_background_color: '#4B96F3'
|
|
utc_offset_minutes: 60
|
|
google_maps_status: SUCCESS
|
|
google_maps_search_query: Club van Suikerzakjesverzamelaars in Nederland, Netherlands
|
|
web_enrichment:
|
|
web_archives:
|
|
- url: https://www.suikerzak.nl/
|
|
directory: web/1021/suikerzak.nl
|
|
pages_archived: 13
|
|
archive_method: wget_warc_deep
|
|
warc_file: archive.warc.gz
|
|
warc_size_bytes: 109629
|
|
warc_format: ISO 28500
|
|
full_site_archive_timestamp: '2025-11-29T17:46:40.278592+00:00'
|
|
ghcid:
|
|
ghcid_current: NL-UT-HOU-S-CSN
|
|
ghcid_original: NL-UT-HOU-S-CSN
|
|
ghcid_uuid: 1754a45a-8bf0-569e-9c6b-8c1b65e63c70
|
|
ghcid_uuid_sha256: 5cc2a09d-0cfb-8ad5-a5c6-5a3e8d4a69e3
|
|
ghcid_numeric: 6684081393359330005
|
|
record_id: 019adf94-bae2-7a75-a550-1a466f6b1663
|
|
generation_timestamp: '2025-12-02T14:56:45.615377+00:00'
|
|
ghcid_history:
|
|
- ghcid: NL-UT-HOU-S-CSN
|
|
ghcid_numeric: 6684081393359330005
|
|
valid_from: '2025-12-02T14:56:45.615377+00:00'
|
|
valid_to: null
|
|
reason: GHCID regenerated with Google Maps locality fix (Dec 2025)
|
|
location_resolution:
|
|
method: GOOGLE_MAPS_LOCALITY
|
|
google_maps_locality: Houten
|
|
geonames_id: 2753557
|
|
geonames_name: Houten
|
|
feature_code: PPL
|
|
population: 1335
|
|
admin1_code: 09
|
|
region_code: UT
|
|
country_code: NL
|
|
source_coordinates:
|
|
latitude: 52.0339982
|
|
longitude: 5.1726966999999995
|
|
source: google_maps
|
|
geonames_id: 2753557
|
|
identifiers:
|
|
- identifier_scheme: GHCID
|
|
identifier_value: NL-UT-HOU-S-CSN
|
|
- identifier_scheme: GHCID_UUID
|
|
identifier_value: 1754a45a-8bf0-569e-9c6b-8c1b65e63c70
|
|
identifier_url: urn:uuid:1754a45a-8bf0-569e-9c6b-8c1b65e63c70
|
|
- identifier_scheme: GHCID_UUID_SHA256
|
|
identifier_value: 5cc2a09d-0cfb-8ad5-a5c6-5a3e8d4a69e3
|
|
identifier_url: urn:uuid:5cc2a09d-0cfb-8ad5-a5c6-5a3e8d4a69e3
|
|
- identifier_scheme: GHCID_NUMERIC
|
|
identifier_value: '6684081393359330005'
|
|
- identifier_scheme: RECORD_ID
|
|
identifier_value: 019adf94-bae2-7a75-a550-1a466f6b1663
|
|
identifier_url: urn:uuid:019adf94-bae2-7a75-a550-1a466f6b1663
|
|
web_claims:
|
|
extraction_timestamp: '2025-12-02T08:49:54.348212+00:00'
|
|
source_archive: web/1021/suikerzak.nl
|
|
claims_count: 12
|
|
claims:
|
|
- claim_type: org_name
|
|
claim_value: Club van Suikerzakjesverzamelaars in Nederland
|
|
raw_value: Club van Suikerzakjesverzamelaars in Nederland
|
|
source_url: https://www.suikerzak.nl/
|
|
retrieved_on: '2025-11-29T17:46:40.094028+00:00'
|
|
xpath: /html/head/title
|
|
html_file: web/1021/suikerzak.nl/pages/index.html@start=99.tmp.html
|
|
xpath_match_score: 1.0
|
|
extraction_method: title_tag
|
|
extraction_timestamp: '2025-12-02T08:49:54.169810+00:00'
|
|
- claim_type: description_short
|
|
claim_value: Website van de Club van Suikerzakjesverzamelaars in Nederland
|
|
raw_value: Website van de Club van Suikerzakjesverzamelaars in Nederland
|
|
source_url: https://www.suikerzak.nl/
|
|
retrieved_on: '2025-11-29T17:46:40.094028+00:00'
|
|
xpath: /html/head/meta[7]
|
|
html_file: web/1021/suikerzak.nl/pages/index.html@start=99.tmp.html
|
|
xpath_match_score: 1.0
|
|
extraction_method: meta_description
|
|
extraction_timestamp: '2025-12-02T08:49:54.169941+00:00'
|
|
- claim_type: social_facebook
|
|
claim_value: https://www.facebook.com/ttfestivalassen
|
|
raw_value: https://www.facebook.com/ttfestivalassen
|
|
source_url: https://www.suikerzak.nl/
|
|
retrieved_on: '2025-11-29T17:46:40.094028+00:00'
|
|
xpath: /html/body/div/div[3]/div/div[2]/section/div[9]/article/p[1]/a
|
|
html_file: web/1021/suikerzak.nl/pages/index.html@start=99.tmp.html
|
|
xpath_match_score: 1.0
|
|
extraction_method: social_link
|
|
extraction_timestamp: '2025-12-02T08:49:54.170412+00:00'
|
|
- claim_type: video_youtube
|
|
claim_value: https://www.youtube.com/watch?v=TSP0e5rXUl8
|
|
raw_value: https://www.youtube.com/embed/TSP0e5rXUl8
|
|
source_url: https://www.suikerzak.nl/
|
|
retrieved_on: '2025-11-29T17:46:40.094028+00:00'
|
|
xpath: /html/body/div/div[3]/div/div[2]/section/div[1]/article/p[2]/iframe
|
|
html_file: web/1021/suikerzak.nl/pages/index.html@start=99.tmp.html
|
|
xpath_match_score: 1.0
|
|
extraction_method: youtube_iframe
|
|
extraction_timestamp: '2025-12-02T08:49:54.170606+00:00'
|
|
- claim_type: page_title
|
|
claim_value: Club van Suikerzakjesverzamelaars in Nederland
|
|
raw_value: Club van Suikerzakjesverzamelaars in Nederland
|
|
source_url: https://www.suikerzak.nl/
|
|
retrieved_on: '2025-11-29T17:46:40.094028+00:00'
|
|
xpath: /html/head/title
|
|
html_file: web/1021/suikerzak.nl/pages/index.html@start=99.tmp.html
|
|
xpath_match_score: 1.0
|
|
extraction_method: title_tag_full
|
|
extraction_timestamp: '2025-12-02T08:49:54.175014+00:00'
|
|
- claim_type: favicon
|
|
claim_value: /templates/suikerzakjes2016/favicon.ico
|
|
raw_value: type=image/vnd.microsoft.icon
|
|
source_url: https://www.suikerzak.nl/
|
|
retrieved_on: '2025-11-29T17:46:40.094028+00:00'
|
|
xpath: /html/head/link[6]
|
|
html_file: web/1021/suikerzak.nl/pages/index.html@start=99.tmp.html
|
|
xpath_match_score: 1.0
|
|
extraction_method: favicon_link
|
|
extraction_timestamp: '2025-12-02T08:49:54.175147+00:00'
|
|
- claim_type: favicon
|
|
claim_value: /images/template/engage.png
|
|
raw_value: /images/template/engage.png
|
|
source_url: https://www.suikerzak.nl/
|
|
retrieved_on: '2025-11-29T17:46:40.094028+00:00'
|
|
xpath: /html/head/link[3]
|
|
html_file: web/1021/suikerzak.nl/pages/index.html@start=99.tmp.html
|
|
xpath_match_score: 1.0
|
|
extraction_method: favicon_link
|
|
extraction_timestamp: '2025-12-02T08:49:54.175329+00:00'
|
|
- claim_type: email
|
|
claim_value: verkaaik2@gmail.com
|
|
raw_value: verkaaik2@gmail.com
|
|
source_url: https://www.suikerzak.nl/
|
|
retrieved_on: '2025-11-29T17:46:40.094028+00:00'
|
|
xpath: /html/body/div/div[3]/div/div[2]/section/div[6]/article/p[1]/a[1]
|
|
html_file: web/1021/suikerzak.nl/pages/index.html@start=55.tmp.html
|
|
xpath_match_score: 1.0
|
|
extraction_method: mailto_link
|
|
extraction_timestamp: '2025-12-02T08:49:54.197918+00:00'
|
|
- claim_type: social_facebook
|
|
claim_value: https://www.facebook.com/suikerzak
|
|
raw_value: https://www.facebook.com/suikerzak
|
|
source_url: https://www.suikerzak.nl/
|
|
retrieved_on: '2025-11-29T17:46:40.094028+00:00'
|
|
xpath: /html/body/div/div[3]/div/div[2]/section/div[6]/article/p[2]/a
|
|
html_file: web/1021/suikerzak.nl/pages/index.html@start=110.tmp.html
|
|
xpath_match_score: 1.0
|
|
extraction_method: social_link
|
|
extraction_timestamp: '2025-12-02T08:49:54.211903+00:00'
|
|
- claim_type: social_facebook
|
|
claim_value: https://www.facebook.com/ttfestivalassen/
|
|
raw_value: https://www.facebook.com/ttfestivalassen/
|
|
source_url: https://www.suikerzak.nl/
|
|
retrieved_on: '2025-11-29T17:46:40.094028+00:00'
|
|
xpath: /html/body/div/div[3]/div/div[2]/section/div[10]/article/p[2]/a
|
|
html_file: web/1021/suikerzak.nl/pages/index.html@start=88.tmp.html
|
|
xpath_match_score: 1.0
|
|
extraction_method: social_link
|
|
extraction_timestamp: '2025-12-02T08:49:54.219259+00:00'
|
|
- claim_type: social_facebook
|
|
claim_value: https://www.facebook.com/pg/Verzamelkrant/about/?ref=page_internal
|
|
raw_value: https://www.facebook.com/pg/Verzamelkrant/about/?ref=page_internal
|
|
source_url: https://www.suikerzak.nl/
|
|
retrieved_on: '2025-11-29T17:46:40.094028+00:00'
|
|
xpath: /html/body/div/div[3]/div/div[2]/section/div[5]/article/p[2]/a[2]
|
|
html_file: web/1021/suikerzak.nl/pages/index.html@start=66.tmp.html
|
|
xpath_match_score: 1.0
|
|
extraction_method: social_link
|
|
extraction_timestamp: '2025-12-02T08:49:54.236761+00:00'
|
|
- claim_type: video_youtube
|
|
claim_value: https://www.youtube.com/watch?v=aFV9lo1m5HE
|
|
raw_value: https://www.youtube.com/embed/aFV9lo1m5HE
|
|
source_url: https://www.suikerzak.nl/
|
|
retrieved_on: '2025-11-29T17:46:40.094028+00:00'
|
|
xpath: /html/body/div/div[3]/div/div[2]/section/div[4]/article/p[4]/iframe
|
|
html_file: web/1021/suikerzak.nl/pages/index.html@start=66.tmp.html
|
|
xpath_match_score: 1.0
|
|
extraction_method: youtube_iframe
|
|
extraction_timestamp: '2025-12-02T08:49:54.236865+00:00'
|
|
custodian_name:
|
|
claim_type: custodian_name
|
|
claim_value: Club van Suikerzakjesverzamelaars in Nederland
|
|
source: web_title_tag
|
|
confidence: 0.8
|
|
consensus_method: true
|
|
sources_checked: 3
|
|
sources_matched: 3
|
|
extraction_timestamp: '2025-12-02T13:08:44.258272+00:00'
|
|
matching_sources:
|
|
- source: google_maps
|
|
name: Club van Suikerzakjesverzamelaars in Nederland
|
|
score: 1.0
|
|
- source: original_entry
|
|
name: Club van Suikerzakjesverzamelaars in Nederland
|
|
score: 1.0
|
|
genealogiewerkbalk_enrichment:
|
|
source: Genealogiewerkbalk.nl Municipality Archives Registry
|
|
source_url: https://www.genealogiewerkbalk.nl/archieven.html
|
|
data_url: https://docs.google.com/spreadsheets/d/1rS_Z5L6L2vvfGLS6eHI8wfyiwB-KUfHEr7W1VNY3rpg/export?format=csv
|
|
data_tier: TIER_2_VERIFIED
|
|
enrichment_timestamp: '2025-12-03T13:51:42.061149+00:00'
|
|
match_method: google_maps_admin2
|
|
match_confidence: 0.95
|
|
municipality:
|
|
name: Houten
|
|
code: '321'
|
|
municipal_archive:
|
|
name: Regionaal Archief Zuid-Utrecht
|
|
website: https://www.razu.nl/
|
|
isil: null
|
|
isil_note: geenRAZU
|
|
province:
|
|
name: Utrecht
|
|
code: '26'
|
|
provincial_archive:
|
|
name: Het Utrechts Archief
|
|
website: https://hetutrechtsarchief.nl/
|
|
extra_info: Kijk voor meer info over archieven in Utrecht op https://www.landschaperfgoedutrecht.nl/erfgoed/historische-verenigingen-en-archieven/archieven/
|
|
digital_platforms:
|
|
- platform_name: Club van Suikerzakjesverzamelaars in Nederland Website
|
|
platform_url: http://www.suikerzak.nl/
|
|
platform_type: WEBSITE
|
|
platform_category:
|
|
- Organizational website
|
|
digital_collections: Organizational website
|
|
technology_stack: Standard web technology
|
|
data_standards:
|
|
- HTML5
|
|
user_services: General information, Contact
|
|
sustainability_model: Institutional funding
|
|
enrichment_timestamp: '2025-12-05T11:21:46.303886+00:00'
|
|
source_method: automated_extraction
|