glam/data/custodian_sample/NL-ZH-SAS-S-OS.yaml
2025-12-11 22:32:09 +01:00

401 lines
16 KiB
YAML

original_entry:
plaatsnaam_bezoekadres: Sassenheim
organisatie: Stichting Oud Sassenheim
systeem: ZCBS
reference:
- label: https://www.stichtingoudsassenheim.nl/
type:
- S
entry_index: 1319
processing_timestamp: '2025-11-27T20:43:02.023623+00:00'
enrichment_status: skipped
provenance:
schema_version: 1.0.0
generated_at: '2025-11-28T23:47:38.737650+00:00'
sources:
original_entry:
- source_type: nde_csv_registry
data_tier: TIER_1_AUTHORITATIVE
claims_extracted:
- plaatsnaam_bezoekadres
- organisatie
- systeem
- reference
- type
google_maps:
- source_type: google_maps_api
fetch_timestamp: '2025-11-28T10:02:08.900854+00:00'
api_endpoint: https://maps.googleapis.com/maps/api/place/textsearch
place_id: ChIJp-q2CnnBxUcRDCnsa6DkP0Y
claims_extracted:
- coordinates
- formatted_address
- address_components
- business_status
- website
- rating
- reviews
genealogiewerkbalk:
- source_type: genealogiewerkbalk_registry
fetch_timestamp: '2025-12-03T13:43:45.642701+00:00'
data_url: https://docs.google.com/spreadsheets/d/1rS_Z5L6L2vvfGLS6eHI8wfyiwB-KUfHEr7W1VNY3rpg/export?format=csv
match_method: google_maps_admin2
claims_extracted:
- municipality_name
- municipality_code
- municipal_archive_name
- municipal_archive_website
- municipal_archive_isil
- province_name
- province_code
- provincial_archive_name
- provincial_archive_website
data_tier_summary:
TIER_1_AUTHORITATIVE:
- original_entry (NDE CSV)
TIER_2_VERIFIED:
- wikidata_api
- google_maps_api
- genealogiewerkbalk_registry
TIER_3_CROWD_SOURCED: []
TIER_4_INFERRED:
- website_scrape
- exa_web_search
notes:
- Provenance tracking added retroactively
- claim_level_provenance available in sources section
- Canonical location added via normalize_custodian_files.py on 2025-12-09T07:13:25Z
skip_reason: no_wikidata_id
google_maps_enrichment:
place_id: ChIJp-q2CnnBxUcRDCnsa6DkP0Y
name: Stichting Oud Sassenheim
fetch_timestamp: '2025-11-28T10:02:08.900854+00:00'
api_status: OK
coordinates:
latitude: 52.228516799999994
longitude: 4.5178693999999995
formatted_address: Ridderhof 20, 2171 TK Sassenheim
short_address: Ridderhof 20, Sassenheim
address_components:
- long_name: '20'
short_name: '20'
types:
- street_number
- long_name: Ridderhof
short_name: Ridderhof
types:
- route
- long_name: Sassenheim
short_name: Sassenheim
types:
- locality
- political
- long_name: Teylingen
short_name: Teylingen
types:
- administrative_area_level_2
- political
- long_name: Zuid-Holland
short_name: ZH
types:
- administrative_area_level_1
- political
- long_name: Nederland
short_name: NL
types:
- country
- political
- long_name: 2171 TK
short_name: 2171 TK
types:
- postal_code
website: https://www.stichtingoudsassenheim.nl/index.php/contact-126
google_place_types:
- point_of_interest
- establishment
business_status: OPERATIONAL
rating: 4
total_ratings: 1
reviews:
- author_name: Marco van Oostrum
author_uri: https://www.google.com/maps/contrib/112567992905171043013/reviews
rating: 4
relative_time_description: 5 jaar geleden
text: null
publish_time: '2020-08-09T21:15:23.875645Z'
photo_urls:
- https://places.googleapis.com/v1/places/ChIJp-q2CnnBxUcRDCnsa6DkP0Y/photos/AWn5SU6X68d3BWHDq1IDIRXCqRzKyWPPzTZhupEn8Vwjd1yfE-UbYuSVFuppttfY28WTGgDuA9YpFxE2Gl4Id8pDUvlWLYrbUzCBZ0o3eTNGaEG-q2daSfm2MSSnN7mmUPp2tKXYinxWhVHsnFr0k7F5FsBoaGxw4v3qCq0AqyTzWy0Oa3h2jwQDCO6R-8fKf8WgyJTMUfIrDFkkzgsshenrnZ8oBhrVbDyw0BEm_1LseT-aE4M3ELUgJGaROcum6tITujQjYY978m4Nw7NB4BD0Q5K1gC0r1-l196xkmhyP1F9vW7U4eTIWiya9eHTj_RZkvfuO5Cy2jhglS0fpnail73E8pCEktkkwWs91PrZFFljU7BAz9jRVO8XU5PLk5crKd5OHih3IX-5r98qu19KL-3kb0ktz3WeXSu9SKY_I_llecA/media?maxWidthPx=800&key=AIzaSyAHuazNth9ZvfRFYk5-v49CwXwhABH8Ri0
photos_metadata:
- name: places/ChIJp-q2CnnBxUcRDCnsa6DkP0Y/photos/AWn5SU6X68d3BWHDq1IDIRXCqRzKyWPPzTZhupEn8Vwjd1yfE-UbYuSVFuppttfY28WTGgDuA9YpFxE2Gl4Id8pDUvlWLYrbUzCBZ0o3eTNGaEG-q2daSfm2MSSnN7mmUPp2tKXYinxWhVHsnFr0k7F5FsBoaGxw4v3qCq0AqyTzWy0Oa3h2jwQDCO6R-8fKf8WgyJTMUfIrDFkkzgsshenrnZ8oBhrVbDyw0BEm_1LseT-aE4M3ELUgJGaROcum6tITujQjYY978m4Nw7NB4BD0Q5K1gC0r1-l196xkmhyP1F9vW7U4eTIWiya9eHTj_RZkvfuO5Cy2jhglS0fpnail73E8pCEktkkwWs91PrZFFljU7BAz9jRVO8XU5PLk5crKd5OHih3IX-5r98qu19KL-3kb0ktz3WeXSu9SKY_I_llecA
height: 1836
width: 3264
author_attributions:
- displayName: John V.
uri: https://maps.google.com/maps/contrib/104610170158827874093
photoUri: https://lh3.googleusercontent.com/a-/ALV-UjVNEgxbeoM8awArrA1D7GR-hRatiqOKRGFVBWXJ0JJgYugNcSSgqw=s100-p-k-no-mo
google_maps_url: https://maps.google.com/?cid=5062015883844266252&g_mp=Cidnb29nbGUubWFwcy5wbGFjZXMudjEuUGxhY2VzLlNlYXJjaFRleHQQAhgEIAA
street_view_url: https://maps.googleapis.com/maps/api/streetview?size=600x400&location=52.228516799999994,4.5178693999999995&key=AIzaSyAHuazNth9ZvfRFYk5-v49CwXwhABH8Ri0
icon_mask_uri: https://maps.gstatic.com/mapfiles/place_api/icons/v2/generic_pinlet
icon_background_color: '#7B9EB0'
utc_offset_minutes: 60
google_maps_status: SUCCESS
google_maps_search_query: Stichting Oud Sassenheim, Sassenheim, Netherlands
web_enrichment:
web_archives:
- url: https://www.stichtingoudsassenheim.nl/
directory: web/1319/stichtingoudsassenheim.nl
pages_archived: 2
archive_method: wget_warc_deep
warc_file: archive.warc.gz
warc_size_bytes: 20080
warc_format: ISO 28500
full_site_archive_timestamp: '2025-11-29T19:39:17.411572+00:00'
zcbs_enrichment:
zcbs_id: 145
zcbs_name: Stichting Oud Sassenheim
platform_urls:
photos: https://www.beeldbankstichtingoudsassenheim.nl/cgi-bin/fotos.pl
enrichment_timestamp: '2025-11-30T19:09:04.005442+00:00'
source: https://www.dezijpe.nl/cgi-bin/boerderij.pl?misc=90
match_score: 1.0
ghcid:
ghcid_current: NL-ZH-SAS-S-OS
ghcid_original: NL-ZH-SAS-S-OS
ghcid_uuid: 2a6e585a-0205-53bd-9948-7c33971e03e9
ghcid_uuid_sha256: 3e604b44-167e-87b2-9f40-99fdd5e3f893
ghcid_numeric: 4494675183923029938
record_id: 019adf94-eae9-76f6-9eb4-d4b1db34ed41
generation_timestamp: '2025-12-02T14:56:45.615377+00:00'
ghcid_history:
- ghcid: NL-ZH-SAS-S-OS
ghcid_numeric: 4494675183923029938
valid_from: '2025-12-02T14:56:45.615377+00:00'
valid_to: null
reason: GHCID regenerated with Google Maps locality fix (Dec 2025)
location_resolution:
method: GOOGLE_MAPS_LOCALITY
google_maps_locality: Sassenheim
geonames_id: 2747751
geonames_name: Sassenheim
feature_code: PPL
population: 15510
admin1_code: '11'
region_code: ZH
country_code: NL
source_coordinates:
latitude: 52.228516799999994
longitude: 4.5178693999999995
source: google_maps
geonames_id: 2747751
identifiers:
- identifier_scheme: GHCID
identifier_value: NL-ZH-SAS-S-OS
- identifier_scheme: GHCID_UUID
identifier_value: 2a6e585a-0205-53bd-9948-7c33971e03e9
identifier_url: urn:uuid:2a6e585a-0205-53bd-9948-7c33971e03e9
- identifier_scheme: GHCID_UUID_SHA256
identifier_value: 3e604b44-167e-87b2-9f40-99fdd5e3f893
identifier_url: urn:uuid:3e604b44-167e-87b2-9f40-99fdd5e3f893
- identifier_scheme: GHCID_NUMERIC
identifier_value: '4494675183923029938'
- identifier_scheme: RECORD_ID
identifier_value: 019adf94-eae9-76f6-9eb4-d4b1db34ed41
identifier_url: urn:uuid:019adf94-eae9-76f6-9eb4-d4b1db34ed41
web_claims:
extraction_timestamp: '2025-12-02T08:53:09.960194+00:00'
source_archive: web/1319/stichtingoudsassenheim.nl
claims_count: 11
claims:
- claim_type: org_name
claim_value: Welkom op de Site
raw_value: Welkom op de Site
source_url: https://www.stichtingoudsassenheim.nl/
retrieved_on: '2025-11-29T19:39:17.334070+00:00'
xpath: /html/head/title
html_file: web/1319/stichtingoudsassenheim.nl/pages/index.html
xpath_match_score: 1.0
extraction_method: title_tag
extraction_timestamp: '2025-12-02T08:53:09.932121+00:00'
- claim_type: description_short
claim_value: 'Stichting Oud Sassenheim, voor de historie over oud Sassenheim en oude Sassemers
De bollenteelt en de kust en duinstreek'
raw_value: 'Stichting Oud Sassenheim, voor de historie over oud Sassenheim en oude Sassemers
De bollenteelt en de kust en duinstreek'
source_url: https://www.stichtingoudsassenheim.nl/
retrieved_on: '2025-11-29T19:39:17.334070+00:00'
xpath: /html/head/meta[5]
html_file: web/1319/stichtingoudsassenheim.nl/pages/index.html
xpath_match_score: 1.0
extraction_method: meta_description
extraction_timestamp: '2025-12-02T08:53:09.932207+00:00'
- claim_type: social_facebook
claim_value: https://www.facebook.com/StichtingOudSassenheim/
raw_value: https://www.facebook.com/StichtingOudSassenheim/
source_url: https://www.stichtingoudsassenheim.nl/
retrieved_on: '2025-11-29T19:39:17.334070+00:00'
xpath: /html/body/div[2]/ul/li[1]/a
html_file: web/1319/stichtingoudsassenheim.nl/pages/index.html
xpath_match_score: 1.0
extraction_method: social_link
extraction_timestamp: '2025-12-02T08:53:09.932773+00:00'
- claim_type: social_youtube
claim_value: https://www.youtube.com/channel/UC7IbW74wWSVM18YMYTfv1rw
raw_value: https://www.youtube.com/channel/UC7IbW74wWSVM18YMYTfv1rw
source_url: https://www.stichtingoudsassenheim.nl/
retrieved_on: '2025-11-29T19:39:17.334070+00:00'
xpath: /html/body/div[2]/ul/li[2]/a
html_file: web/1319/stichtingoudsassenheim.nl/pages/index.html
xpath_match_score: 1.0
extraction_method: social_link
extraction_timestamp: '2025-12-02T08:53:09.932840+00:00'
- claim_type: org_name
claim_value: Welkom
raw_value: Welkom
source_url: https://www.stichtingoudsassenheim.nl/
retrieved_on: '2025-11-29T19:39:17.334070+00:00'
xpath: /html/body/div[1]/div/div/main/div/div[2]/div/section/div/div/div[1]/div/div/div[2]/div/h1
html_file: web/1319/stichtingoudsassenheim.nl/pages/index.html
xpath_match_score: 0.9
extraction_method: h1_tag
extraction_timestamp: '2025-12-02T08:53:09.932933+00:00'
- claim_type: page_title
claim_value: Welkom op de Site
raw_value: Welkom op de Site
source_url: https://www.stichtingoudsassenheim.nl/
retrieved_on: '2025-11-29T19:39:17.334070+00:00'
xpath: /html/head/title
html_file: web/1319/stichtingoudsassenheim.nl/pages/index.html
xpath_match_score: 1.0
extraction_method: title_tag_full
extraction_timestamp: '2025-12-02T08:53:09.936253+00:00'
- claim_type: favicon
claim_value: /images/logososklein.png
raw_value: type=image
source_url: https://www.stichtingoudsassenheim.nl/
retrieved_on: '2025-11-29T19:39:17.334070+00:00'
xpath: /html/head/link[15]
html_file: web/1319/stichtingoudsassenheim.nl/pages/index.html
xpath_match_score: 1.0
extraction_method: favicon_link
extraction_timestamp: '2025-12-02T08:53:09.936296+00:00'
- claim_type: logo
claim_value: https://www.stichtingoudsassenheim.nl/images/LogoSOS17.png
raw_value: alt=Stichting Oud Sassenheim
source_url: https://www.stichtingoudsassenheim.nl/
retrieved_on: '2025-11-29T19:39:17.334070+00:00'
xpath: /html/body/div[1]/div/div/header/div/div/section/div/div/div[1]/a/img
html_file: web/1319/stichtingoudsassenheim.nl/pages/index.html
xpath_match_score: 1.0
extraction_method: logo_img_attr
extraction_timestamp: '2025-12-02T08:53:09.936470+00:00'
- claim_type: ui_login
claim_value: https://www.stichtingoudsassenheim.nl/index.php/inloggen
raw_value: text=inloggen, pattern=inloggen
source_url: https://www.stichtingoudsassenheim.nl/
retrieved_on: '2025-11-29T19:39:17.334070+00:00'
xpath: /html/body/div[1]/div/div/nav/div/nav/div/div[1]/ul/li[9]/a
html_file: web/1319/stichtingoudsassenheim.nl/pages/index.html
xpath_match_score: 1.0
extraction_method: login_button
extraction_timestamp: '2025-12-02T08:53:09.937795+00:00'
- claim_type: ui_login
claim_value: https://www.stichtingoudsassenheim.nl/index.php/aanmeldenalsdonateur
raw_value: text=aanmelden als donateur, pattern=aanmelden
source_url: https://www.stichtingoudsassenheim.nl/
retrieved_on: '2025-11-29T19:39:17.334070+00:00'
xpath: /html/body/div[1]/div/div/footer/div/div/section/div/div/div[4]/div[1]/ul/li/a
html_file: web/1319/stichtingoudsassenheim.nl/pages/index.html
xpath_match_score: 1.0
extraction_method: login_button
extraction_timestamp: '2025-12-02T08:53:09.937971+00:00'
- claim_type: ui_login
claim_value: https://www.stichtingoudsassenheim.nl/index.php/aanmeldennieuwsbrief
raw_value: text=aanmelden nieuwsbrief, pattern=aanmelden
source_url: https://www.stichtingoudsassenheim.nl/
retrieved_on: '2025-11-29T19:39:17.334070+00:00'
xpath: /html/body/div[1]/div/div/footer/div/div/section/div/div/div[4]/div[2]/ul/li/a
html_file: web/1319/stichtingoudsassenheim.nl/pages/index.html
xpath_match_score: 1.0
extraction_method: login_button
extraction_timestamp: '2025-12-02T08:53:09.937986+00:00'
custodian_name:
claim_type: custodian_name
claim_value: Oud Sassenheim
source: original_entry
confidence: 0.601
consensus_method: true
sources_checked: 3
sources_matched: 2
extraction_timestamp: '2025-12-02T13:09:14.978402+00:00'
matching_sources:
- source: google_maps
name: Oud Sassenheim
score: 1.0
previous_value: Stichting Oud Sassenheim
previous_source: original_entry
custodian_legal_name:
claim_type: legal_name
claim_value: Stichting Oud Sassenheim
extraction_timestamp: '2025-12-02T13:09:14.978410+00:00'
note: Legal form detected in source name (e.g., Stichting, Vereniging, B.V.)
genealogiewerkbalk_enrichment:
source: Genealogiewerkbalk.nl Municipality Archives Registry
source_url: https://www.genealogiewerkbalk.nl/archieven.html
data_url: https://docs.google.com/spreadsheets/d/1rS_Z5L6L2vvfGLS6eHI8wfyiwB-KUfHEr7W1VNY3rpg/export?format=csv
data_tier: TIER_2_VERIFIED
enrichment_timestamp: '2025-12-03T13:43:45.642690+00:00'
match_method: google_maps_admin2
match_confidence: 0.95
municipality:
name: Teylingen
code: '1525'
municipal_archive:
name: Erfgoed Leiden en Omstreken
website: https://www.erfgoedleiden.nl/
isil: NL-LdnRAL
province:
name: Zuid-Holland
code: '28'
provincial_archive:
name: Nationaal Archief
website: https://www.nationaalarchief.nl/
digital_platforms:
- platform_name: Stichting Oud Sassenheim Website
platform_url: https://www.stichtingoudsassenheim.nl/index.php/contact-126
platform_type: WEBSITE
platform_category:
- Organizational website
digital_collections: Organizational website with heritage information
technology_stack: ZCBS
data_standards:
- HTML5
user_services: General information, Contact
sustainability_model: Institutional funding
enrichment_timestamp: '2025-12-05T11:36:16.589670+00:00'
source_method: automated_extraction
wikidata_enrichment:
status: NOT_FOUND
fetch_timestamp: '2025-12-06T19:42:31.835546+00:00'
search_query: Oud Sassenheim
location:
latitude: 52.228516799999994
longitude: 4.5178693999999995
coordinate_provenance:
source_type: GOOGLE_MAPS
source_path: google_maps_enrichment.coordinates
original_timestamp: '2025-11-28T10:02:08.900854+00:00'
entity_id: ChIJp-q2CnnBxUcRDCnsa6DkP0Y
api_endpoint: https://maps.googleapis.com/maps/api/place/textsearch
city: Sassenheim
region: Zuid-Holland
region_code: ZH
country: NL
postal_code: 2171 TK
street_address: Ridderhof 20, Sassenheim
formatted_address: Ridderhof 20, 2171 TK Sassenheim
geonames_id: 2747751
geonames_name: Sassenheim
feature_code: PPL
normalization_timestamp: '2025-12-09T07:13:25.942341+00:00'