glam/data/custodian/NL-UT-BUN-L-B.yaml
2026-01-18 01:23:32 +01:00

568 lines
19 KiB
YAML
Raw Permalink Blame History

This file contains ambiguous Unicode characters

This file contains Unicode characters that might be confused with other characters. If you think that this is intentional, you can safely ignore this warning. Use the Escape button to reveal them.

original_entry:
plaatsnaam_bezoekadres: Houten
organisatie: BiSC Utrecht
type_organisatie: bibliotheek
isil_code_kb: NL-0702940000
type:
- L
opmerkingen: POI
entry_index: 1363
processing_timestamp: '2025-11-28T12:19:25.739468+00:00'
kb_enrichment:
source: KB Netherlands Library Network
source_file: KB_Netherlands_ISIL_2025-04-01.xlsx
source_url: https://www.bibliotheeknetwerk.nl/
extraction_date: '2025-11-17T13:02:03.421813+00:00'
enrichment_timestamp: '2025-11-28T12:19:25.739468+00:00'
enrichment_method: automated_integration
isil_code: NL-0702940000
name: BiSC Utrecht
city: Houten
registry: KB Netherlands Library Network
notes: POI
country: Netherlands
enrichment_status: isil_kb_source
provenance:
schema_version: 1.0.0
generated_at: '2025-11-28T23:47:39.512678+00:00'
sources:
original_entry:
- source_type: nde_csv_registry
data_tier: TIER_1_AUTHORITATIVE
claims_extracted:
- plaatsnaam_bezoekadres
- organisatie
- type_organisatie
- isil_code_kb
- type
- opmerkingen
google_maps:
- source_type: google_maps_api
fetch_timestamp: '2025-11-28T12:24:34.534295+00:00'
api_endpoint: https://maps.googleapis.com/maps/api/place/textsearch
place_id: ChIJd3CnRPhmxkcRCkQsNtznxtI
claims_extracted:
- coordinates
- formatted_address
- address_components
- business_status
- website
- phone
- rating
- opening_hours
genealogiewerkbalk:
- source_type: genealogiewerkbalk_registry
fetch_timestamp: '2025-12-03T13:43:49.480299+00:00'
data_url: https://docs.google.com/spreadsheets/d/1rS_Z5L6L2vvfGLS6eHI8wfyiwB-KUfHEr7W1VNY3rpg/export?format=csv
match_method: plaatsnaam_bezoekadres
claims_extracted:
- municipality_name
- municipality_code
- municipal_archive_name
- municipal_archive_website
- municipal_archive_isil
- province_name
- province_code
- provincial_archive_name
- provincial_archive_website
linkup_timespan:
- source_type: linkup_web_search
fetch_timestamp: '2025-12-15T21:31:00.759480+00:00'
search_query: '"BiSC" Bunnik opgericht OR gesticht OR sinds'
source_urls:
- https://www.biscutrecht.nl/wp-content/uploads/2019/06/Bestuursverslag-BiSC-2018.pdf
- https://bunnik-projekten.nl/over-ons
- https://nl.wikipedia.org/wiki/Bunnik_(gemeente)
- https://www.geschiedenisextra.nl/nl/bunnik.htm
- https://www.bunnik.nl/ondernemen/winkeliers-en-ondernemersverenigingen
claims_extracted:
- timespan_begin
data_tier: TIER_4_INFERRED
archive_path: data/custodian/web/1363/linkup/linkup_founding_20251215T213100Z.json
data_tier_summary:
TIER_1_AUTHORITATIVE:
- original_entry (NDE CSV)
TIER_2_VERIFIED:
- wikidata_api
- google_maps_api
- genealogiewerkbalk_registry
TIER_3_CROWD_SOURCED: []
TIER_4_INFERRED:
- website_scrape
- exa_web_search
notes:
- Provenance tracking added retroactively
- claim_level_provenance available in sources section
- Canonical location normalized on 2025-12-09T13:16:11Z
corrections:
- correction_date: '2025-12-14T00:00:00Z'
correction_type: wikidata_enrichment_removal
description: Removed hallucinated Wikidata enrichment. The enrichment pipeline incorrectly added data for Q22431 (Bischwiller
- a commune in Bas-Rhin, France) which has no relation to BiSC Utrecht (Dutch library service organization in Houten/Bunnik).
Original wikidata_enrichment_status correctly showed NOT_FOUND, but a later enrichment run erroneously added the French
commune data. No Wikidata entity exists for BiSC Utrecht (verified via SPARQL search for ISIL NL-0702940000 and name
searches). Removed 331 lines of incorrect French geographic data.
old_value: Q22431 (Bischwiller, France)
new_value: null (no Wikidata entity exists)
corrected_by: claude-opus-4
enrichment_source: KB Netherlands Library Network
enrichment_timestamp: '2025-11-28T12:19:25.739468+00:00'
wikidata_enrichment_status: NOT_FOUND
wikidata_search_timestamp: '2025-11-28T12:22:38.808890+00:00'
google_maps_enrichment:
place_id: ChIJd3CnRPhmxkcRCkQsNtznxtI
name: BiSC
fetch_timestamp: '2025-11-28T12:24:34.534295+00:00'
api_status: OK
coordinates:
latitude: 52.063488899999996
longitude: 5.2116562
formatted_address: Fruitweg 48, 3981 PA Bunnik
short_address: De Rumpst, Fruitweg 48, Bunnik
address_components:
- long_name: '48'
short_name: '48'
types:
- street_number
- long_name: Fruitweg
short_name: Fruitweg
types:
- route
- long_name: Bunnik
short_name: Bunnik
types:
- locality
- political
- long_name: Bunnik
short_name: Bunnik
types:
- administrative_area_level_2
- political
- long_name: Utrecht
short_name: UT
types:
- administrative_area_level_1
- political
- long_name: Nederland
short_name: NL
types:
- country
- political
- long_name: 3981 PA
short_name: 3981 PA
types:
- postal_code
phone_local: 030 635 4635
phone_international: +31 30 635 4635
website: http://www.biscutrecht.nl/
google_place_types:
- point_of_interest
- establishment
business_status: OPERATIONAL
opening_hours:
periods:
- open:
day: 1
hour: 9
minute: 0
close:
day: 1
hour: 17
minute: 0
- open:
day: 2
hour: 9
minute: 0
close:
day: 2
hour: 17
minute: 0
- open:
day: 3
hour: 9
minute: 0
close:
day: 3
hour: 17
minute: 0
- open:
day: 4
hour: 9
minute: 0
close:
day: 4
hour: 17
minute: 0
- open:
day: 5
hour: 9
minute: 0
close:
day: 5
hour: 17
minute: 0
weekday_text:
- 'maandag: 09:00–17:00'
- 'dinsdag: 09:00–17:00'
- 'woensdag: 09:00–17:00'
- 'donderdag: 09:00–17:00'
- 'vrijdag: 09:00–17:00'
- 'zaterdag: Gesloten'
- 'zondag: Gesloten'
rating: 4.7
total_ratings: 3
google_maps_url: https://maps.google.com/?cid=15188081726341268490&g_mp=Cidnb29nbGUubWFwcy5wbGFjZXMudjEuUGxhY2VzLlNlYXJjaFRleHQQAhgEIAA
google_maps_status: SUCCESS
google_maps_search_query: Bibliotheek BiSC Utrecht, Houten, Netherlands
ghcid:
ghcid_current: NL-UT-BUN-L-B
ghcid_original: NL-UT-BUN-L-B
ghcid_uuid: 89121393-c288-5a2b-9c32-a5fe478022d4
ghcid_uuid_sha256: a59d3563-3465-8afc-9dd1-742becf62a2a
ghcid_numeric: 11933753287798754044
record_id: 019adf94-f202-7ad4-89c2-42b226c04bbc
generation_timestamp: '2025-12-02T14:56:45.615377+00:00'
ghcid_history:
- ghcid: NL-UT-BUN-L-B
ghcid_numeric: 11933753287798754044
valid_from: '2025-12-02T14:56:45.615377+00:00'
valid_to: null
reason: GHCID regenerated with Google Maps locality fix (Dec 2025)
location_resolution:
method: GOOGLE_MAPS_LOCALITY
google_maps_locality: Bunnik
geonames_id: 2758106
geonames_name: Bunnik
feature_code: PPL
population: 6315
admin1_code: '09'
region_code: UT
country_code: NL
source_coordinates:
latitude: 52.063488899999996
longitude: 5.2116562
source: google_maps
geonames_id: 2758106
identifiers:
- identifier_scheme: GHCID
identifier_value: NL-UT-BUN-L-B
- identifier_scheme: GHCID_UUID
identifier_value: 89121393-c288-5a2b-9c32-a5fe478022d4
identifier_url: urn:uuid:89121393-c288-5a2b-9c32-a5fe478022d4
- identifier_scheme: GHCID_UUID_SHA256
identifier_value: a59d3563-3465-8afc-9dd1-742becf62a2a
identifier_url: urn:uuid:a59d3563-3465-8afc-9dd1-742becf62a2a
- identifier_scheme: GHCID_NUMERIC
identifier_value: '11933753287798754044'
- identifier_scheme: RECORD_ID
identifier_value: 019adf94-f202-7ad4-89c2-42b226c04bbc
identifier_url: urn:uuid:019adf94-f202-7ad4-89c2-42b226c04bbc
custodian_name:
claim_type: custodian_name
claim_value: BiSC
source: google_maps
confidence: 0.439
consensus_method: true
sources_checked: 77
sources_matched: 8
extraction_timestamp: '2025-12-02T13:09:19.402640+00:00'
matching_sources:
- source: original_entry
name: BiSC Utrecht
score: 1.0
- source: web_title_tag
name: BiSC Utrecht
score: 1.0
- source: web_title_tag
name: Mooi rapportcijfer vervoersdienst BiSC in 2022
score: 1.0
- source: web_title_tag
name: Jaarrekening BiSC 2022
score: 1.0
- source: web_title_tag
name: Over BiSC
score: 1.0
- source: web_title_tag
name: Jaarrekening BiSC 2024
score: 1.0
- source: web_title_tag
name: Jaarrekening BiSC 2021
score: 1.0
previous_value: BiSC Utrecht
previous_source: web_title_tag
genealogiewerkbalk_enrichment:
source: Genealogiewerkbalk.nl Municipality Archives Registry
source_url: https://www.genealogiewerkbalk.nl/archieven.html
data_url: https://docs.google.com/spreadsheets/d/1rS_Z5L6L2vvfGLS6eHI8wfyiwB-KUfHEr7W1VNY3rpg/export?format=csv
data_tier: TIER_2_VERIFIED
enrichment_timestamp: '2025-12-03T13:43:49.480282+00:00'
match_method: plaatsnaam_bezoekadres
match_confidence: 1.0
municipality:
name: Houten
code: '321'
municipal_archive:
name: Regionaal Archief Zuid-Utrecht
website: https://www.razu.nl/
isil: null
isil_note: geenRAZU
province:
name: Utrecht
code: '26'
provincial_archive:
name: Het Utrechts Archief
website: https://hetutrechtsarchief.nl/
extra_info: Kijk voor meer info over archieven in Utrecht op https://www.landschaperfgoedutrecht.nl/erfgoed/historische-verenigingen-en-archieven/archieven/
digital_platforms:
- platform_name: BiSC Utrecht Website
platform_url: http://www.biscutrecht.nl/
platform_type: ONLINE_DATABASE
platform_category:
- Organizational website
- Collection catalog
digital_collections: Organizational website with heritage information
technology_stack: Standard web technology
data_standards:
- HTML5
user_services: Catalog search
sustainability_model: Institutional funding
enrichment_timestamp: '2025-12-05T11:36:30.929536+00:00'
source_method: automated_extraction
ch_annotator:
convention_id: ch_annotator-v1_7_0
convention_version: 1.7.0
entity_classification:
hypernym: GRP
hypernym_label: GROUP
subtype: GRP.HER.LIB
subtype_label: LIBRARY
ontology_class: schema:Library
alternative_classes:
- org:FormalOrganization
- rov:RegisteredOrganization
- glam:HeritageCustodian
extraction_provenance:
namespace: glam
path: /files/netherlands_complete.yaml
agent: batch-script-create-custodian-from-ch-annotator
context_convention: ch_annotator-v1_7_0
source_archived_at: '2025-11-18T17:16:16.901941+00:00'
statement_created_at: '2026-01-01T13:15:32.156780+00:00'
migration_note: Migrated from agent:claude-conversation on 2026-01-01 (ch_annotator.extraction_provenance)
annotation_provenance:
annotation_agent: opencode-claude-sonnet-4
annotation_date: '2025-12-06T21:13:11.947020+00:00'
annotation_method: retroactive CH-Annotator application via batch script
source_file: netherlands_complete.yaml
annotation_metadata:
confidence_score: 1.0
verified: false
verification_date: null
verified_by: null
entity_claims:
- claim_type: full_name
claim_value: BiSC Utrecht
property_uri: skos:prefLabel
provenance:
namespace: glam
path: /files/netherlands_complete.yaml
agent: batch-script-create-custodian-from-ch-annotator
context_convention: ch_annotator-v1_7_0
source_archived_at: '2025-11-18T17:16:16.901941+00:00'
statement_created_at: '2026-01-01T13:15:32.156799+00:00'
migration_note: Migrated from agent:claude-conversation on 2026-01-01 (entity_claims[0].provenance)
confidence: 1.0
- claim_type: institution_type
claim_value: LIBRARY
property_uri: rdf:type
provenance:
namespace: glam
path: /files/netherlands_complete.yaml
agent: batch-script-create-custodian-from-ch-annotator
context_convention: ch_annotator-v1_7_0
source_archived_at: '2025-11-18T17:16:16.901941+00:00'
statement_created_at: '2026-01-01T13:15:32.156802+00:00'
migration_note: Migrated from agent:claude-conversation on 2026-01-01 (entity_claims[1].provenance)
confidence: 0.95
- claim_type: located_in_city
claim_value: Houten
property_uri: schema:addressLocality
provenance:
namespace: glam
path: /files/netherlands_complete.yaml
agent: batch-script-create-custodian-from-ch-annotator
context_convention: ch_annotator-v1_7_0
source_archived_at: '2025-11-18T17:16:16.901941+00:00'
statement_created_at: '2026-01-01T13:15:32.156804+00:00'
migration_note: Migrated from agent:claude-conversation on 2026-01-01 (entity_claims[2].provenance)
confidence: 0.9
integration_note:
integrated_from: netherlands_complete_ch_annotator.yaml
integration_date: '2025-12-06T23:20:34.310667+00:00'
match_type: name
location:
latitude: 52.063488899999996
longitude: 5.2116562
coordinate_provenance:
source_type: GOOGLE_MAPS
source_path: google_maps_enrichment.coordinates
original_timestamp: '2025-11-28T12:24:34.534295+00:00'
entity_id: ChIJd3CnRPhmxkcRCkQsNtznxtI
api_endpoint: https://maps.googleapis.com/maps/api/place/textsearch
city: Bunnik
region: Utrecht
region_code: UT
country: NL
postal_code: 3981 PA
street_address: De Rumpst, Fruitweg 48, Bunnik
formatted_address: Fruitweg 48, 3981 PA Bunnik
geonames_id: 2758106
geonames_name: Bunnik
feature_code: PPL
normalization_timestamp: '2025-12-09T13:16:11.602213+00:00'
crawl4ai_enrichment:
retrieval_timestamp: '2025-12-14T18:19:38.859580+00:00'
retrieval_agent: crawl4ai
source_url: http://www.biscutrecht.nl/
status_code: null
error: Crawl failed with status None
digital_platform_v2:
transformation_metadata:
transformed_from: httpx_beautifulsoup
transformation_date: '2025-12-14T23:22:51.032979+00:00'
transformation_version: '2.1'
source_status_code: 200
primary_platform:
platform_id: primary_website_biscutrecht_nl
platform_name: BiSC Utrecht | Voor bibliotheken in transitie Website
platform_url: https://www.biscutrecht.nl/
platform_type: INSTITUTIONAL_WEBSITE
description: ''
language: nl
og_image: null
favicon: https://www.biscutrecht.nl/wp-content/uploads/2015/06/cropped-favicon-32x32.png
navigation_links:
- http://www.biscutrecht.nl/
- https://www.biscutrecht.nl/
- https://www.biscutrecht.nl/diensten/
- https://www.biscutrecht.nl/projecten/
- https://www.biscutrecht.nl/over-bisc/
- https://www.biscutrecht.nl/ons-team/
- https://www.biscutrecht.nl/contact/
- https://www.biscutrecht.nl/news-cat/masterclass-toekomstbestendige-bibliotheken-van-cubiss-bisc-en-tias/
- https://www.biscutrecht.nl/news-cat/alle-informatie-over-de-vernieuwde-wsob-op-een-rij/
- https://www.biscutrecht.nl/news-cat/ga-goed-van-start-in-de-bibliotheekbranche/
- https://www.biscutrecht.nl/news-cat/de-robuuste-toekomstgerichte-bibliotheek/
- https://www.biscutrecht.nl/news-cat/basistraining-projectmatig-creeren-pmc/
- https://www.biscutrecht.nl/news-cat/democratie-fitness-in-de-bibliotheek/
- https://www.biscutrecht.nl/page/2/?et_blog
- http://www.biscutrecht.nl/agenda/
- http://www.biscutrecht.nl/contact/
- http://www.biscutrecht.nl/algemenevoorwaarden/
- https://www.biscutrecht.nl/wp-content/uploads/2025/06/Algemene_Inkoopvoorwaarden_BiSC-juni_2025.pdf
- http://www.biscutrecht.nl/privacyverklaring/
- http://www.biscutrecht.nl/disclaimer/
timespan:
begin_of_the_begin: '2018-01-10T00:00:00Z'
end_of_the_begin: '2018-01-10T00:00:00Z'
begin_of_the_end: null
end_of_the_end: null
sources:
- 'Linkup web search: https://www.bunnikgroep.nl/over-ons/organisatie/historie/'
notes: 'Found via pattern: full_date_nl'
web_enrichments:
extraction_timestamp: '2025-12-13T19:46:59.985404+00:00'
extraction_method: hybrid_llm_pattern_layout_v1
confidence_threshold: 0.6
entities_count: 5
cleanup_applied: '2025-12-13T19:49:34.408715+00:00'
claims:
- entity: BiSC Utrecht
entity_type: GRP.HER
xpath: /html/head/title
base_confidence: 0.9
layout_score: 0.2
pattern_score: 0.0
final_confidence: 1.0
layout_match: high_conf:head/title
- entity: https://www.biscutrecht.nl
entity_type: APP.URL
xpath: /html/head/link[@rel='pingback']/@href
base_confidence: 1.0
layout_score: 0.0
pattern_score: 0.0
final_confidence: 1.0
- entity: https://www.biscutrecht.nl/feed/
entity_type: WRK.WEB
xpath: /html/head/link[@type='application/rss+xml' and contains(@title, 'feed')]/@href
base_confidence: 1.0
layout_score: 0.0
pattern_score: 0.0
final_confidence: 1.0
- entity: https://www.biscutrecht.nl/comments/feed/
entity_type: WRK.WEB
xpath: /html/head/link[@type='application/rss+xml' and contains(@title, 'reacties')]/@href
base_confidence: 1.0
layout_score: 0.0
pattern_score: 0.0
final_confidence: 1.0
- entity: https://www.biscutrecht.nl/agenda/?ical=1
entity_type: WRK.WEB
xpath: /html/head/link[@type='text/calendar']/@href
base_confidence: 1.0
layout_score: 0.0
pattern_score: 0.0
final_confidence: 1.0
web_enrichment:
archive_metadata:
archive_method: httpx_fetch
archive_timestamp: '2025-12-21T10:13:25.908785+00:00'
archive_location: web/NL/UT/BUN/L/B
source_url: https://www.biscutrecht.nl/
html_file: web/NL/UT/BUN/L/B/www.biscutrecht.nl_index.html
claims:
- claim_type: page_title
claim_value: BiSC Utrecht | Voor bibliotheken in transitie
source_url: https://www.biscutrecht.nl/
retrieved_on: '2025-12-21T10:13:25.904838+00:00'
xpath: /html/head/title
xpath_match_score: 1.0
extraction_method: title_tag
html_file: web/NL/UT/BUN/L/B/www.biscutrecht.nl_index.html
- claim_type: social_linkedin
claim_value: https://www.linkedin.com/company/bisc-utrecht
source_url: https://www.biscutrecht.nl/
retrieved_on: '2025-12-21T10:13:25.904838+00:00'
xpath: /html/body/div/div/header/div/div/div[1]/div[3]/ul/li/a
xpath_match_score: 1.0
extraction_method: social_link
html_file: web/NL/UT/BUN/L/B/www.biscutrecht.nl_index.html
logo_enrichment:
enrichment_timestamp: '2025-12-22T10:38:55.993637+00:00'
source_url: http://www.biscutrecht.nl
extraction_method: crawl4ai
claims:
- claim_type: logo_url
claim_value: https://www.biscutrecht.nl/wp-content/uploads/2019/04/logo-bisc-utrecht.png
source_url: http://www.biscutrecht.nl
css_selector: '#et-boc > header.et-l.et-l--header > div.et_builder_inner_content.et_pb_gutters3 > div.et_pb_section.et_pb_section_0_tb_header
> div.et_pb_row.et_pb_row_1_tb_header:nth-of-type(2) > div.et_pb_column.et_pb_column_1_4 > div.et_pb_module.et_pb_image
> a > span.et_pb_image_wrap > img.wp-image-3731'
retrieved_on: '2025-12-22T10:38:55.993637+00:00'
extraction_method: crawl4ai_header_logo
detection_confidence: high
alt_text: ''
- claim_type: favicon_url
claim_value: https://www.biscutrecht.nl/wp-content/uploads/2015/06/cropped-favicon-180x180.png
source_url: http://www.biscutrecht.nl
css_selector: '[document] > html.js > head > link:nth-of-type(25)'
retrieved_on: '2025-12-22T10:38:55.993637+00:00'
extraction_method: crawl4ai_link_rel
favicon_type: ''
favicon_sizes: ''
summary:
total_claims: 2
has_primary_logo: true
has_favicon: true
has_og_image: false
favicon_count: 3