glam/data/custodian/NL-NH-AMS-R-HI.yaml
kempersc 181b1cf705 data: enrich Dutch heritage custodians (DR, FL, FR, GE, GR, LI provinces)
- Add digital platform discovery data with provenance
- Cleanup duplicate/incorrect custodian entries
- Add GHCID collision resolution suffixes where needed
- Update person entity profiles with career history
2025-12-15 01:34:38 +01:00

676 lines
24 KiB
YAML
Raw Blame History

This file contains ambiguous Unicode characters

This file contains Unicode characters that might be confused with other characters. If you think that this is intentional, you can safely ignore this warning. Use the Escape button to reveal them.

original_entry:
plaatsnaam_bezoekadres: Amsterdam
organisatie: Huygens Instituut (HI)
type_organisatie: unknown
source: nan_isil_2025-11-06
type:
- R
entry_index: 1502
processing_timestamp: '2025-11-30T09:58:13.945408+00:00'
nan_isil_enrichment:
source: Nationaal Archief ISIL Registry
source_file: ISIL-codes_2025-11-06.yaml
source_url: https://www.nationaalarchief.nl/isil
data_tier: TIER_1_AUTHORITATIVE
extraction_date: '2025-11-17T12:27:31.711551+00:00'
enrichment_timestamp: '2025-11-30T09:58:13.945408+00:00'
enrichment_method: new_entry_from_nan_isil
match_confidence: 1.0
isil_code: NL-AsdHI
nan_name: Huygens Instituut (HI)
nan_city: Amsterdam
nan_toegekend_op: '2025-07-30'
nan_opmerking: ''
identifiers:
- identifier_scheme: ISIL
identifier_value: NL-AsdHI
identifier_url: https://isil.org/NL-AsdHI
assigned_date: '2025-07-30'
source: Nationaal Archief ISIL Registry 2025-11-06
- identifier_scheme: GHCID
identifier_value: NL-NH-AMS-R-HI
- identifier_scheme: GHCID_UUID
identifier_value: 46379c78-595e-50e9-b38a-5f4fe37d9120
identifier_url: urn:uuid:46379c78-595e-50e9-b38a-5f4fe37d9120
- identifier_scheme: GHCID_UUID_SHA256
identifier_value: 133d2a88-53f0-858b-980e-c6684586f926
identifier_url: urn:uuid:133d2a88-53f0-858b-980e-c6684586f926
- identifier_scheme: GHCID_NUMERIC
identifier_value: '1386311025312187787'
- identifier_scheme: RECORD_ID
identifier_value: 019adf95-07a2-7df1-8fe6-322188cb38ab
identifier_url: urn:uuid:019adf95-07a2-7df1-8fe6-322188cb38ab
enrichment_status: enriched
provenance:
schema_version: 1.0.0
generated_at: '2025-11-30T09:58:13.945408+00:00'
sources:
original_entry:
- source_type: nan_isil_registry
data_tier: TIER_1_AUTHORITATIVE
claims_extracted:
- organisatie
- plaatsnaam_bezoekadres
- isil_code
genealogiewerkbalk:
- source_type: genealogiewerkbalk_registry
fetch_timestamp: '2025-12-03T13:44:00.744314+00:00'
data_url: https://docs.google.com/spreadsheets/d/1rS_Z5L6L2vvfGLS6eHI8wfyiwB-KUfHEr7W1VNY3rpg/export?format=csv
match_method: plaatsnaam_bezoekadres
claims_extracted:
- municipality_name
- municipality_code
- municipal_archive_name
- municipal_archive_website
- municipal_archive_isil
- province_name
- province_code
- provincial_archive_name
- provincial_archive_website
data_tier_summary:
TIER_1_AUTHORITATIVE:
- nan_isil_registry
TIER_2_VERIFIED:
- genealogiewerkbalk_registry
TIER_3_CROWD_SOURCED: []
TIER_4_INFERRED: []
notes:
- Entry created from NAN ISIL Registry 2025-11-06 - needs further enrichment
- Enrichment status updated to 'enriched' on 2025-12-01T15:19:28.134408+00:00
- Canonical location normalized on 2025-12-09T12:55:34Z
google_maps_enrichment:
place_id: ChIJO6dE4bgJxkcRBil_dsYIKsY
name: Huygens Institute
fetch_timestamp: '2025-11-30T17:51:37.529451+00:00'
api_status: OK
coordinates:
latitude: 52.3705747
longitude: 4.8965239
formatted_address: Oudezijds Achterburgwal 185, 1012 DK Amsterdam
short_address: De Wallen Red Light District Amsterdam, Oudezijds Achterburgwal 185,
Amsterdam
address_components:
- long_name: '185'
short_name: '185'
types:
- street_number
- long_name: Oudezijds Achterburgwal
short_name: Oudezijds Achterburgwal
types:
- route
- long_name: Amsterdam-Centrum
short_name: Amsterdam-Centrum
types:
- sublocality_level_1
- sublocality
- political
- long_name: Amsterdam
short_name: Amsterdam
types:
- locality
- political
- long_name: Amsterdam
short_name: Amsterdam
types:
- administrative_area_level_2
- political
- long_name: Noord-Holland
short_name: NH
types:
- administrative_area_level_1
- political
- long_name: Nederland
short_name: NL
types:
- country
- political
- long_name: 1012 DK
short_name: 1012 DK
types:
- postal_code
phone_local: 020 224 6800
phone_international: +31 20 224 6800
website: http://www.huygens.knaw.nl/
google_place_types:
- point_of_interest
- establishment
business_status: OPERATIONAL
opening_hours:
periods:
- open:
day: 1
hour: 9
minute: 0
close:
day: 1
hour: 17
minute: 0
- open:
day: 2
hour: 9
minute: 0
close:
day: 2
hour: 17
minute: 0
- open:
day: 3
hour: 9
minute: 0
close:
day: 3
hour: 17
minute: 0
- open:
day: 4
hour: 9
minute: 0
close:
day: 4
hour: 17
minute: 0
- open:
day: 5
hour: 9
minute: 0
close:
day: 5
hour: 17
minute: 0
weekday_text:
- 'maandag: 09:00–17:00'
- 'dinsdag: 09:00–17:00'
- 'woensdag: 09:00–17:00'
- 'donderdag: 09:00–17:00'
- 'vrijdag: 09:00–17:00'
- 'zaterdag: Gesloten'
- 'zondag: Gesloten'
google_maps_url: https://maps.google.com/?cid=14279235217016170758&g_mp=Cidnb29nbGUubWFwcy5wbGFjZXMudjEuUGxhY2VzLlNlYXJjaFRleHQQAhgEIAA
google_maps_status: SUCCESS
google_maps_search_query: Huygens Instituut (HI), Amsterdam, Netherlands
ghcid:
ghcid_current: NL-NH-AMS-R-HI
ghcid_original: NL-NH-AMS-U-HI
ghcid_uuid: 46379c78-595e-50e9-b38a-5f4fe37d9120
ghcid_uuid_sha256: 133d2a88-53f0-858b-980e-c6684586f926
ghcid_numeric: 1386311025312187787
record_id: 019adf95-07a2-7df1-8fe6-322188cb38ab
generation_timestamp: '2025-12-02T14:56:45.615377+00:00'
ghcid_history:
- ghcid: NL-NH-AMS-R-HI
ghcid_numeric: 1386311025312187787
valid_from: '2025-12-14T21:43:45.066494+00:00'
reason: 'Type corrected: U → R (manual correction)'
- ghcid: NL-NH-AMS-U-HI
ghcid_numeric: 3330535727189814456
valid_from: '2025-12-02T14:56:45.615377+00:00'
valid_to: '2025-12-14T21:43:45.066494+00:00'
reason: GHCID regenerated with Google Maps locality fix (Dec 2025)
superseded_by: NL-NH-AMS-R-HI
location_resolution:
method: GOOGLE_MAPS_LOCALITY
google_maps_locality: Amsterdam
geonames_id: 2759794
geonames_name: Amsterdam
feature_code: PPLC
population: 741636
admin1_code: '07'
region_code: NH
country_code: NL
source_coordinates:
latitude: 52.3705747
longitude: 4.8965239
source: google_maps
geonames_id: 2759794
custodian_name:
claim_type: custodian_name
claim_value: Huygens Instituut
source: web_og_site_name
confidence: 0.864
consensus_method: true
sources_checked: 4
sources_matched: 4
extraction_timestamp: '2025-12-02T13:09:32.195503+00:00'
matching_sources:
- source: google_maps
name: Huygens Institute
score: 0.95
- source: nan_isil
name: Huygens Instituut (HI)
score: 1.0
- source: original_entry
name: Huygens Instituut (HI)
score: 1.0
web_enrichment:
web_archives:
- url: http://www.huygens.knaw.nl/
directory: web/1502/huygens.knaw.nl
web_archive_timestamp: '2025-12-01T11:57:10.165322+00:00'
web_claims:
extraction_timestamp: '2025-12-02T08:57:04.671833+00:00'
source_archive: web/1502/huygens.knaw.nl
claims_count: 18
claims:
- claim_type: org_name
claim_value: Home
raw_value: Home - Huygens Instituut
source_url: http://www.huygens.knaw.nl/
retrieved_on: ''
xpath: /html/head/title
html_file: web/1502/huygens.knaw.nl/rendered.html
xpath_match_score: 1.0
extraction_method: title_tag
extraction_timestamp: '2025-12-02T08:57:04.659013+00:00'
- claim_type: description_short
claim_value: Het Huygens Instituut is het toonaangevende onderzoeksinstituut op
het gebied van geschiedenis en cultuur van Nederland.
raw_value: Het Huygens Instituut is het toonaangevende onderzoeksinstituut op
het gebied van geschiedenis en cultuur van Nederland.
source_url: http://www.huygens.knaw.nl/
retrieved_on: ''
xpath: /html/head/meta[7]
html_file: web/1502/huygens.knaw.nl/rendered.html
xpath_match_score: 1.0
extraction_method: meta_description
extraction_timestamp: '2025-12-02T08:57:04.659226+00:00'
- claim_type: org_name
claim_value: Huygens Instituut
raw_value: Huygens Instituut
source_url: http://www.huygens.knaw.nl/
retrieved_on: ''
xpath: /html/head/meta[14]
html_file: web/1502/huygens.knaw.nl/rendered.html
xpath_match_score: 1.0
extraction_method: og_site_name
extraction_timestamp: '2025-12-02T08:57:04.659583+00:00'
- claim_type: email
claim_value: info@huygens.knaw.nl
raw_value: info@huygens.knaw.nl
source_url: http://www.huygens.knaw.nl/
retrieved_on: ''
xpath: /html/body/footer/div/div[1]/p[3]/a
html_file: web/1502/huygens.knaw.nl/rendered.html
xpath_match_score: 1.0
extraction_method: mailto_link
extraction_timestamp: '2025-12-02T08:57:04.659757+00:00'
- claim_type: gallery_detected
claim_value: carousel
raw_value: 'carousel: 20 elements'
source_url: http://www.huygens.knaw.nl/
retrieved_on: ''
xpath: /html/body/div[4]/div/div[1]
html_file: web/1502/huygens.knaw.nl/rendered.html
xpath_match_score: 0.85
extraction_method: gallery_pattern
extraction_timestamp: '2025-12-02T08:57:04.666922+00:00'
- claim_type: image_count
claim_value: '4'
raw_value: 4 images in carousel container
source_url: http://www.huygens.knaw.nl/
retrieved_on: ''
xpath: /html/body/div[4]/div/div[1]
html_file: web/1502/huygens.knaw.nl/rendered.html
xpath_match_score: 0.8
extraction_method: gallery_image_count
extraction_timestamp: '2025-12-02T08:57:04.667386+00:00'
- claim_type: page_title
claim_value: Home - Huygens Instituut
raw_value: Home - Huygens Instituut
source_url: http://www.huygens.knaw.nl/
retrieved_on: ''
xpath: /html/head/title
html_file: web/1502/huygens.knaw.nl/rendered.html
xpath_match_score: 1.0
extraction_method: title_tag_full
extraction_timestamp: '2025-12-02T08:57:04.667657+00:00'
- claim_type: favicon
claim_value: /favicon-32x32.png
raw_value: sizes=32x32, type=image/png
source_url: http://www.huygens.knaw.nl/
retrieved_on: ''
xpath: /html/head/link[8]
html_file: web/1502/huygens.knaw.nl/rendered.html
xpath_match_score: 1.0
extraction_method: favicon_link
extraction_timestamp: '2025-12-02T08:57:04.667717+00:00'
- claim_type: favicon
claim_value: /favicon-16x16.png
raw_value: sizes=16x16, type=image/png
source_url: http://www.huygens.knaw.nl/
retrieved_on: ''
xpath: /html/head/link[9]
html_file: web/1502/huygens.knaw.nl/rendered.html
xpath_match_score: 1.0
extraction_method: favicon_link
extraction_timestamp: '2025-12-02T08:57:04.667721+00:00'
- claim_type: favicon
claim_value: https://www.huygens.knaw.nl/wp-content/uploads/2022/07/H_Blue_RGB_2x-80x80.png
raw_value: sizes=32x32
source_url: http://www.huygens.knaw.nl/
retrieved_on: ''
xpath: /html/head/link[21]
html_file: web/1502/huygens.knaw.nl/rendered.html
xpath_match_score: 1.0
extraction_method: favicon_link
extraction_timestamp: '2025-12-02T08:57:04.667726+00:00'
- claim_type: favicon
claim_value: https://www.huygens.knaw.nl/wp-content/uploads/2022/07/H_Blue_RGB_2x-320x320.png
raw_value: sizes=192x192
source_url: http://www.huygens.knaw.nl/
retrieved_on: ''
xpath: /html/head/link[22]
html_file: web/1502/huygens.knaw.nl/rendered.html
xpath_match_score: 1.0
extraction_method: favicon_link
extraction_timestamp: '2025-12-02T08:57:04.667730+00:00'
- claim_type: favicon
claim_value: /apple-touch-icon.png
raw_value: sizes=180x180
source_url: http://www.huygens.knaw.nl/
retrieved_on: ''
xpath: /html/head/link[7]
html_file: web/1502/huygens.knaw.nl/rendered.html
xpath_match_score: 1.0
extraction_method: favicon_link
extraction_timestamp: '2025-12-02T08:57:04.667826+00:00'
- claim_type: favicon
claim_value: /safari-pinned-tab.svg
raw_value: /safari-pinned-tab.svg
source_url: http://www.huygens.knaw.nl/
retrieved_on: ''
xpath: /html/head/link[11]
html_file: web/1502/huygens.knaw.nl/rendered.html
xpath_match_score: 1.0
extraction_method: favicon_link
extraction_timestamp: '2025-12-02T08:57:04.667831+00:00'
- claim_type: logo
claim_value: https://www.huygens.knaw.nl/wp-content/themes/huygens-2026/img/logo_huygens.png
raw_value: alt=Huygens ING
source_url: http://www.huygens.knaw.nl/
retrieved_on: ''
xpath: /html/body/header/a[1]/img[1]
html_file: web/1502/huygens.knaw.nl/rendered.html
xpath_match_score: 1.0
extraction_method: logo_img_attr
extraction_timestamp: '2025-12-02T08:57:04.668013+00:00'
- claim_type: logo
claim_value: https://www.huygens.knaw.nl/wp-content/themes/huygens-2026/img/footer-logo-knaw-humanities-cluster.png
raw_value: alt=Bezoek KNAW Humanities Cluster
source_url: http://www.huygens.knaw.nl/
retrieved_on: ''
xpath: /html/body/footer/div/div[1]/div/div[2]/a[1]/img
html_file: web/1502/huygens.knaw.nl/rendered.html
xpath_match_score: 1.0
extraction_method: logo_img_attr
extraction_timestamp: '2025-12-02T08:57:04.668019+00:00'
- claim_type: logo
claim_value: https://www.huygens.knaw.nl/wp-content/themes/huygens-2026/img/footer-logo-knaw.png
raw_value: alt=Bezoek KNAW
source_url: http://www.huygens.knaw.nl/
retrieved_on: ''
xpath: /html/body/footer/div/div[1]/div/div[2]/a[2]/img
html_file: web/1502/huygens.knaw.nl/rendered.html
xpath_match_score: 1.0
extraction_method: logo_img_attr
extraction_timestamp: '2025-12-02T08:57:04.668023+00:00'
- claim_type: logo
claim_value: https://www.huygens.knaw.nl/wp-content/uploads/2018/05/logo-historici-198x30.png
raw_value: alt=Bezoek historici.nl
source_url: http://www.huygens.knaw.nl/
retrieved_on: ''
xpath: /html/body/footer/div/div[3]/ul/li/a/img
html_file: web/1502/huygens.knaw.nl/rendered.html
xpath_match_score: 1.0
extraction_method: logo_img_attr
extraction_timestamp: '2025-12-02T08:57:04.668028+00:00'
- claim_type: ui_login
claim_value: https://nieuwsbrief.huygens.knaw.nl/nl/aanmelden-voor-de-huygens-nieuwsbrief
raw_value: text=abonneer u op onze nieuwsbrief, pattern=aanmelden
source_url: http://www.huygens.knaw.nl/
retrieved_on: ''
xpath: /html/body/footer/div/div[2]/p[2]/a
html_file: web/1502/huygens.knaw.nl/rendered.html
xpath_match_score: 1.0
extraction_method: login_button
extraction_timestamp: '2025-12-02T08:57:04.671443+00:00'
url: http://www.huygens.knaw.nl/
genealogiewerkbalk_enrichment:
source: Genealogiewerkbalk.nl Municipality Archives Registry
source_url: https://www.genealogiewerkbalk.nl/archieven.html
data_url: https://docs.google.com/spreadsheets/d/1rS_Z5L6L2vvfGLS6eHI8wfyiwB-KUfHEr7W1VNY3rpg/export?format=csv
data_tier: TIER_2_VERIFIED
enrichment_timestamp: '2025-12-03T13:44:00.744306+00:00'
match_method: plaatsnaam_bezoekadres
match_confidence: 1.0
municipality:
name: Amsterdam
code: '363'
municipal_archive:
name: Stadsarchief Amsterdam
website: https://archief.amsterdam/
isil: NL-AsdSAA
province:
name: Noord-Holland
code: '27'
provincial_archive:
name: Noord-Hollands Archief
website: https://noord-hollandsarchief.nl/
digital_platforms:
- platform_name: Huygens Instituut (HI) Website
platform_url: http://www.huygens.knaw.nl/
platform_type: WEBSITE
platform_category:
- Organizational website
digital_collections: Organizational website with heritage information
technology_stack: Standard web technology
data_standards:
- Open Graph
user_services: General information, Contact
sustainability_model: Institutional funding
enrichment_timestamp: '2025-12-05T11:36:09.574036+00:00'
source_method: automated_extraction
wikidata_enrichment:
wikidata_entity_id: Q2353809
api_metadata:
api_endpoint: https://www.wikidata.org/w/rest.php/wikibase/v1
fetch_timestamp: '2025-12-09T12:15:50.156808+00:00'
user_agent: GLAMDataExtractor/1.1 (glam-data@example.com) Python/httpx
enrichment_version: 2.0_full
properties_found:
- P31
- P17
- P576
wikidata_labels:
nl: Huygens Instituut
fy: Huygens Ynstitút
en: Huygens Institute
mk: Институт „Хајгенс“
fr: Institut Huygens
sl: Huygensov inštitut
wikidata_label_en: Huygens Institute
wikidata_label_nl: Huygens Instituut
wikidata_label_fr: Institut Huygens
wikidata_descriptions:
nl: voormalig onderzoeksinstituut in Nederland
fr: ancien institut de recherche aux Pays-Bas
sl: nekdanji raziskovalni inštitut na Nizozemskem
wikidata_aliases:
sl:
- Huygens Instituut
wikidata_temporal:
dissolution: '2010-12-31'
wikidata_dissolution: '2010-12-31'
wikidata_classification:
instance_of: &id001
- id: Q31855
label: research institute
description: organization whose primary purpose is research
wikidata_instance_of: *id001
wikidata_location:
country: &id002
id: Q55
label: Netherlands
description: country in Northwestern Europe with territories in the Caribbean
wikidata_country: *id002
unesco_ich_enrichment:
country_code: NL
total_elements_in_country: 5
enrichment_timestamp: '2025-12-06T20:20:52.615456+00:00'
elements:
- unesco_ich_id: '1870'
name: Rotterdam Summer Carnival
list_type: RL
list_name: Representative List of the Intangible Cultural Heritage of Humanity
inscription_year: 2023
multinational: false
url: https://ich.unesco.org/en/RL/rotterdam-summer-carnival-01870
description: The Rotterdam Summer Carnival is a multicultural celebration that
unites participants from the Caribbean and European Netherlands, as well as
ethnic minority groups from Central and South America and Africa living in the
Netherlands. The event includes a street parade, a brass band competition and
a...
- unesco_ich_id: '1979'
name: 'Traditional irrigation: knowledge, technique, and organization'
list_type: RL
list_name: Representative List of the Intangible Cultural Heritage of Humanity
inscription_year: 2023
multinational: true
url: https://ich.unesco.org/en/RL/traditional-irrigation-knowledge-technique-and-organization-01979
description: Traditional irrigation uses gravity and hand-made constructions such
as channels and ditches to distribute water from naturally-occurring water catchment
points (such as springs, streams and glaciers) to the fields. Practitioners
choose specific days and periods to manually divert the water, and the...
- unesco_ich_id: '1707'
name: Corso culture, flower and fruit parades in the Netherlands
list_type: RL
list_name: Representative List of the Intangible Cultural Heritage of Humanity
inscription_year: 2021
multinational: false
url: https://ich.unesco.org/en/RL/corso-culture-flower-and-fruit-parades-in-the-netherlands-01707
description: Dating back to the late nineteenth century, a corso is an annual
parade of floats or boats decorated with flowers, fruit, vegetables and, in
some cases, people in costumes. Originating in the south of France and Italy,
the practice spread to the Netherlands in the nineteenth century. The parade
take...
- unesco_ich_id: '1708'
name: Falconry, a living human heritage
list_type: RL
list_name: Representative List of the Intangible Cultural Heritage of Humanity
inscription_year: 2021
multinational: true
url: https://ich.unesco.org/en/RL/falconry-a-living-human-heritage-01708
description: Falconry is the traditional art and practice of training and flying
falcons (and sometimes eagles, hawks, buzzards and other birds of prey). It
has been practised for over 4000 years. The practice of falconry in early and
medieval periods of history is documented in many parts of the world. Original...
- unesco_ich_id: '1265'
name: Craft of the miller operating windmills and watermills
list_type: RL
list_name: Representative List of the Intangible Cultural Heritage of Humanity
inscription_year: 2017
multinational: false
url: https://ich.unesco.org/en/RL/craft-of-the-miller-operating-windmills-and-watermills-01265
description: The craft of the miller operating windmills and watermills involves
the knowledge and skills necessary to operate a mill and maintain it in a good
state of repair. With a declining number of people earning their livelihood
from the craft, millers today also play a key role in transmitting the cultur...
location:
latitude: 52.3705747
longitude: 4.8965239
coordinate_provenance:
source_type: GOOGLE_MAPS
source_path: google_maps_enrichment.coordinates
original_timestamp: '2025-11-30T17:51:37.529451+00:00'
entity_id: ChIJO6dE4bgJxkcRBil_dsYIKsY
city: Amsterdam
region: Noord-Holland
region_code: NH
country: NL
postal_code: 1012 DK
street_address: De Wallen Red Light District Amsterdam, Oudezijds Achterburgwal
185, Amsterdam
formatted_address: Oudezijds Achterburgwal 185, 1012 DK Amsterdam
geonames_id: 2759794
geonames_name: Amsterdam
feature_code: PPLC
normalization_timestamp: '2025-12-09T12:55:34.169592+00:00'
validated_entity_claims:
extraction_timestamp: '2025-12-13T19:45:31.929963+00:00'
extraction_method: hybrid_llm_pattern_layout_v1
confidence_threshold: 0.6
entities_count: 9
cleanup_applied: '2025-12-13T19:49:31.637601+00:00'
claims:
- entity: Huygens Instituut
entity_type: GRP.HER
xpath: /html/head/title
base_confidence: 0.95
layout_score: 0.2
pattern_score: 0.0
final_confidence: 1.0
layout_match: high_conf:head/title
- entity: '2025-11-20T09:51:53+00:00'
entity_type: TMP.DAB
xpath: /html/head/meta[property='article:modified_time']
base_confidence: 1.0
layout_score: 0.0
pattern_score: 0.0
final_confidence: 1.0
- entity: https://www.huygens.knaw.nl/
entity_type: APP.URL
xpath: /html/head/link[rel='canonical']
base_confidence: 0.98
layout_score: 0.0
pattern_score: 0.0
final_confidence: 0.98
- entity: https://www.huygens.knaw.nl/en/institute-dutch-history-culture/
entity_type: APP.URL
xpath: /html/head/link[@hreflang='en']
base_confidence: 0.98
layout_score: 0.0
pattern_score: 0.0
final_confidence: 0.98
- entity: Home - Huygens Instituut
entity_type: APP.TTL
xpath: /html/head/title
base_confidence: 0.95
layout_score: 0.0
pattern_score: 0.0
final_confidence: 0.95
- entity: https://www.huygens.knaw.nl/
entity_type: APP.WKD
xpath: /html/head/meta[property='og:url']
base_confidence: 0.95
layout_score: 0.0
pattern_score: 0.0
final_confidence: 0.95
- entity: Nederland
entity_type: TOP.CTY
xpath: /html/head/meta[@name='description']
base_confidence: 0.9
layout_score: 0.0
pattern_score: 0.0
final_confidence: 0.9
wikidata_id: Q55
wikidata_label: Netherlands
- entity: geschiedenis
entity_type: THG.CON
xpath: /html/head/meta[@name='description']
base_confidence: 0.9
layout_score: 0.0
pattern_score: 0.0
final_confidence: 0.9
- entity: cultuur
entity_type: THG.CON
xpath: /html/head/meta[@name='description']
base_confidence: 0.9
layout_score: 0.0
pattern_score: 0.0
final_confidence: 0.9
wikidata_linking_timestamp: '2025-12-13T23:07:16.175736'
crawl4ai_enrichment:
retrieval_timestamp: '2025-12-14T17:58:58.937743+00:00'
retrieval_agent: crawl4ai
source_url: http://www.huygens.knaw.nl/
status_code: null
error: Crawl failed with status None