glam/data/nde/bu/enriched/entries/1231_invalid_id.yaml
2025-12-23 13:27:35 +01:00

302 lines
8.9 KiB
YAML
Raw Blame History

This file contains ambiguous Unicode characters

This file contains Unicode characters that might be confused with other characters. If you think that this is intentional, you can safely ignore this warning. Use the Escape button to reveal them.

original_entry:
plaatsnaam_bezoekadres: Leiden
organisatie: Leidse Deken Register
systeem: ZCBS
reference:
- label: https://www.dekenregister.nl/
type:
- D
entry_index: 1231
processing_timestamp: '2025-11-27T20:40:02.519122+00:00'
enrichment_status: skipped
provenance:
schema_version: 1.0.0
generated_at: '2025-11-28T23:47:35.938008+00:00'
sources:
original_entry:
- source_type: nde_csv_registry
data_tier: TIER_1_AUTHORITATIVE
claims_extracted:
- plaatsnaam_bezoekadres
- organisatie
- systeem
- reference
- type
google_maps:
- source_type: google_maps_api
fetch_timestamp: '2025-11-28T10:01:11.463251+00:00'
api_endpoint: https://maps.googleapis.com/maps/api/place/textsearch
place_id: ChIJN7ttKADHxUcROn9zRJBzaBM
claims_extracted:
- coordinates
- formatted_address
- address_components
- business_status
- website
- opening_hours
genealogiewerkbalk:
- source_type: genealogiewerkbalk_registry
fetch_timestamp: '2025-12-03T13:52:01.097947+00:00'
data_url: https://docs.google.com/spreadsheets/d/1rS_Z5L6L2vvfGLS6eHI8wfyiwB-KUfHEr7W1VNY3rpg/export?format=csv
match_method: plaatsnaam_bezoekadres
claims_extracted:
- municipality_name
- municipality_code
- municipal_archive_name
- municipal_archive_website
- municipal_archive_isil
- province_name
- province_code
- provincial_archive_name
- provincial_archive_website
data_tier_summary:
TIER_1_AUTHORITATIVE:
- original_entry (NDE CSV)
TIER_2_VERIFIED:
- wikidata_api
- google_maps_api
- genealogiewerkbalk_registry
TIER_3_CROWD_SOURCED: []
TIER_4_INFERRED:
- website_scrape
- exa_web_search
notes:
- Provenance tracking added retroactively
- claim_level_provenance available in sources section
skip_reason: no_wikidata_id
google_maps_enrichment:
place_id: ChIJN7ttKADHxUcROn9zRJBzaBM
name: Leidse Deken
fetch_timestamp: '2025-11-28T10:01:11.463251+00:00'
api_status: OK
coordinates:
latitude: 52.1645459
longitude: 4.4936875999999994
formatted_address: Papegaaisbolwerk 18, 2312 LW Leiden
short_address: Papegaaisbolwerk 18, Leiden
address_components:
- long_name: '18'
short_name: '18'
types:
- street_number
- long_name: Papegaaisbolwerk
short_name: Papegaaisbolwerk
types:
- route
- long_name: Leiden
short_name: Leiden
types:
- locality
- political
- long_name: Leiden
short_name: Leiden
types:
- administrative_area_level_2
- political
- long_name: Zuid-Holland
short_name: ZH
types:
- administrative_area_level_1
- political
- long_name: Nederland
short_name: NL
types:
- country
- political
- long_name: 2312 LW
short_name: 2312 LW
types:
- postal_code
website: https://www.leidsedeken.nl/
google_place_types:
- home_goods_store
- point_of_interest
- store
- establishment
primary_type: home_goods_store
business_status: OPERATIONAL
opening_hours:
open_now: false
periods:
- open:
day: 2
hour: 10
minute: 0
close:
day: 2
hour: 17
minute: 0
- open:
day: 3
hour: 10
minute: 0
close:
day: 3
hour: 17
minute: 0
- open:
day: 4
hour: 10
minute: 0
close:
day: 4
hour: 17
minute: 0
- open:
day: 6
hour: 10
minute: 0
close:
day: 6
hour: 14
minute: 0
weekday_text:
- 'maandag: Gesloten'
- 'dinsdag: 10:00–17:00'
- 'woensdag: 10:00–17:00'
- 'donderdag: 10:00–17:00'
- 'vrijdag: Gesloten'
- 'zaterdag: 10:00–14:00'
- 'zondag: Gesloten'
google_maps_url: https://maps.google.com/?cid=1398494747759443770&g_mp=Cidnb29nbGUubWFwcy5wbGFjZXMudjEuUGxhY2VzLlNlYXJjaFRleHQQAhgEIAA
street_view_url: https://maps.googleapis.com/maps/api/streetview?size=600x400&location=52.1645459,4.4936875999999994&key=AIzaSyAHuazNth9ZvfRFYk5-v49CwXwhABH8Ri0
icon_mask_uri: https://maps.gstatic.com/mapfiles/place_api/icons/v2/shopping_pinlet
icon_background_color: '#4B96F3'
utc_offset_minutes: 60
google_maps_status: SUCCESS
google_maps_search_query: Leidse Deken Register, Leiden, Netherlands
web_enrichment:
web_archives:
- url: https://www.dekenregister.nl/
directory: web/1231/dekenregister.nl
pages_archived: 1
archive_method: wget_warc_deep
warc_file: archive.warc.gz
warc_size_bytes: 3738
warc_format: ISO 28500
full_site_archive_timestamp: '2025-11-29T19:22:39.123147+00:00'
zcbs_enrichment:
zcbs_id: 148
zcbs_name: Leidse Deken Register
platform_urls:
objects: https://www.dekenregister.nl/cgi-bin/objecten.pl
enrichment_timestamp: '2025-11-30T20:15:00.000000+00:00'
source: https://www.dezijpe.nl/cgi-bin/boerderij.pl?misc=90
match_score: 1.0
match_note: Exact name match - corrected from wrong ZCBS
ghcid:
ghcid_current: NL-ZH-LEI-D-LDR
ghcid_original: NL-ZH-LEI-D-LDR
ghcid_uuid: edb4dce8-255b-5cf5-ab9e-3c8039ec64ad
ghcid_uuid_sha256: a3e7cd5a-7173-8872-b89c-3723442b1caa
ghcid_numeric: 11810634336136587378
record_id: 019adf94-dddb-7592-bf3d-3788696c6e02
generation_timestamp: '2025-12-02T14:56:45.615377+00:00'
ghcid_history:
- ghcid: NL-ZH-LEI-D-LDR
ghcid_numeric: 11810634336136587378
valid_from: '2025-12-02T14:56:45.615377+00:00'
valid_to: null
reason: GHCID regenerated with Google Maps locality fix (Dec 2025)
location_resolution:
method: GOOGLE_MAPS_LOCALITY
google_maps_locality: Leiden
geonames_id: 2751773
geonames_name: Leiden
feature_code: PPL
population: 119713
admin1_code: '11'
region_code: ZH
country_code: NL
source_coordinates:
latitude: 52.1645459
longitude: 4.4936875999999994
source: google_maps
geonames_id: 2751773
identifiers:
- identifier_scheme: GHCID
identifier_value: NL-ZH-LEI-D-LDR
- identifier_scheme: GHCID_UUID
identifier_value: edb4dce8-255b-5cf5-ab9e-3c8039ec64ad
identifier_url: urn:uuid:edb4dce8-255b-5cf5-ab9e-3c8039ec64ad
- identifier_scheme: GHCID_UUID_SHA256
identifier_value: a3e7cd5a-7173-8872-b89c-3723442b1caa
identifier_url: urn:uuid:a3e7cd5a-7173-8872-b89c-3723442b1caa
- identifier_scheme: GHCID_NUMERIC
identifier_value: '11810634336136587378'
- identifier_scheme: RECORD_ID
identifier_value: 019adf94-dddb-7592-bf3d-3788696c6e02
identifier_url: urn:uuid:019adf94-dddb-7592-bf3d-3788696c6e02
web_claims:
extraction_timestamp: '2025-12-02T08:52:27.870434+00:00'
source_archive: web/1231/dekenregister.nl
claims_count: 2
claims:
- claim_type: org_name
claim_value: Goto ZBBS
raw_value: Goto ZBBS
source_url: https://www.dekenregister.nl/
retrieved_on: '2025-11-29T19:22:39.053875+00:00'
xpath: /html/head/title
html_file: web/1231/dekenregister.nl/pages/index.html
xpath_match_score: 1.0
extraction_method: title_tag
extraction_timestamp: '2025-12-02T08:52:27.868146+00:00'
- claim_type: page_title
claim_value: Goto ZBBS
raw_value: Goto ZBBS
source_url: https://www.dekenregister.nl/
retrieved_on: '2025-11-29T19:22:39.053875+00:00'
xpath: /html/head/title
html_file: web/1231/dekenregister.nl/pages/index.html
xpath_match_score: 1.0
extraction_method: title_tag_full
extraction_timestamp: '2025-12-02T08:52:27.868873+00:00'
custodian_name:
claim_type: custodian_name
claim_value: Leidse Deken Register
source: original_entry
confidence: 0.575
consensus_method: true
sources_checked: 3
sources_matched: 2
extraction_timestamp: '2025-12-02T13:09:06.790356+00:00'
matching_sources:
- source: google_maps
name: Leidse Deken
score: 1.0
genealogiewerkbalk_enrichment:
source: Genealogiewerkbalk.nl Municipality Archives Registry
source_url: https://www.genealogiewerkbalk.nl/archieven.html
data_url: https://docs.google.com/spreadsheets/d/1rS_Z5L6L2vvfGLS6eHI8wfyiwB-KUfHEr7W1VNY3rpg/export?format=csv
data_tier: TIER_2_VERIFIED
enrichment_timestamp: '2025-12-03T13:52:01.097939+00:00'
match_method: plaatsnaam_bezoekadres
match_confidence: 1.0
municipality:
name: Leiden
code: '546'
municipal_archive:
name: Erfgoed Leiden en Omstreken
website: https://www.erfgoedleiden.nl/
isil: NL-LdnRAL
province:
name: Zuid-Holland
code: '28'
provincial_archive:
name: Nationaal Archief
website: https://www.nationaalarchief.nl/
digital_platforms:
- platform_name: Leidse Deken Register Website
platform_url: https://www.leidsedeken.nl/
platform_type: WEBSITE
platform_category:
- Organizational website
digital_collections: Organizational website with heritage information
technology_stack: ZCBS
data_standards:
- HTML5
user_services: General information, Contact
sustainability_model: Institutional funding
enrichment_timestamp: '2025-12-05T11:39:10.528358+00:00'
source_method: automated_extraction