glam/frontend/public/data/nde_statistics.json
kempersc 30162e6526 Add script to validate KB library entries and generate enrichment report
- Implemented a Python script to validate KB library YAML files for required fields and data quality.
- Analyzed enrichment coverage from Wikidata and Google Maps, generating statistics.
- Created a comprehensive markdown report summarizing validation results and enrichment quality.
- Included error handling for file loading and validation processes.
- Generated JSON statistics for further analysis.
2025-11-28 14:48:33 +01:00

1685 lines
No EOL
32 KiB
JSON

{
"generated_at": "2025-11-28T12:24:11.193129+00:00",
"total_entries": 1502,
"summary": {
"total_institutions": 1502,
"enriched": 1466,
"not_enriched": 36,
"with_coordinates": 1411,
"with_wikidata": 1216,
"with_google_maps": 1345,
"google_maps_not_found": 0,
"unique_cities": 511,
"unique_provinces": 12,
"institution_types": 14
},
"charts": {
"institution_types": [
{
"code": "M",
"name": "Museum",
"count": 605,
"percentage": 40.3,
"color": "#e74c3c"
},
{
"code": "S",
"name": "Society",
"count": 346,
"percentage": 23.0,
"color": "#9b59b6"
},
{
"code": "A",
"name": "Archive",
"count": 222,
"percentage": 14.8,
"color": "#3498db"
},
{
"code": "L",
"name": "Library",
"count": 176,
"percentage": 11.7,
"color": "#2ecc71"
},
{
"code": "O",
"name": "Official",
"count": 52,
"percentage": 3.5,
"color": "#f39c12"
},
{
"code": "D",
"name": "Digital",
"count": 30,
"percentage": 2.0,
"color": "#34495e"
},
{
"code": "N",
"name": "NGO",
"count": 12,
"percentage": 0.8,
"color": "#e91e63"
},
{
"code": "B",
"name": "Botanical",
"count": 11,
"percentage": 0.7,
"color": "#4caf50"
},
{
"code": "R",
"name": "Research",
"count": 10,
"percentage": 0.7,
"color": "#1abc9c"
},
{
"code": "F",
"name": "Features",
"count": 9,
"percentage": 0.6,
"color": "#95a5a6"
},
{
"code": "E",
"name": "Education",
"count": 9,
"percentage": 0.6,
"color": "#ff9800"
},
{
"code": "C",
"name": "Corporation",
"count": 4,
"percentage": 0.3,
"color": "#795548"
},
{
"code": "I",
"name": "Intangible",
"count": 2,
"percentage": 0.1,
"color": "#673ab7"
},
{
"code": "G",
"name": "Gallery",
"count": 1,
"percentage": 0.1,
"color": "#00bcd4"
}
],
"top_cities": [
{
"city": "Den Haag",
"count": 53
},
{
"city": "Amsterdam",
"count": 43
},
{
"city": "Arnhem",
"count": 19
},
{
"city": "Groningen",
"count": 19
},
{
"city": "Rotterdam",
"count": 19
},
{
"city": "Zwolle",
"count": 15
},
{
"city": "Leeuwarden",
"count": 14
},
{
"city": "Nijmegen",
"count": 12
},
{
"city": "Utrecht",
"count": 12
},
{
"city": "Leiden",
"count": 11
},
{
"city": "Maastricht",
"count": 10
},
{
"city": "Enschede",
"count": 10
},
{
"city": "Deventer",
"count": 10
},
{
"city": "Assen",
"count": 8
},
{
"city": "Roermond",
"count": 8
},
{
"city": "Haarlem",
"count": 8
},
{
"city": "Den Bosch",
"count": 7
},
{
"city": "Apeldoorn",
"count": 6
},
{
"city": "Hardenberg",
"count": 6
},
{
"city": "Heerlen",
"count": 6
}
],
"collection_systems": [],
"wikidata_types": [
{
"type": "museum",
"count": 492
},
{
"type": "historical society",
"count": 125
},
{
"type": "Municipal Archive",
"count": 113
},
{
"type": "cultural association",
"count": 57
},
{
"type": "organization",
"count": 43
},
{
"type": "archive",
"count": 42
},
{
"type": "art museum",
"count": 24
},
{
"type": "regional archive",
"count": 21
},
{
"type": "regional historic center",
"count": 17
},
{
"type": "national museum",
"count": 15
},
{
"type": "nonprofit organization",
"count": 15
},
{
"type": "public library",
"count": 13
},
{
"type": "building",
"count": 11
},
{
"type": "library",
"count": 11
},
{
"type": "château",
"count": 11
},
{
"type": "ministry of the Netherlands",
"count": 11
},
{
"type": "library network",
"count": 10
},
{
"type": "military museum",
"count": 10
},
{
"type": "research institute",
"count": 10
},
{
"type": "State archive from the Netherlands",
"count": 8
}
],
"enrichment_status": [
{
"status": "Enriched",
"count": 1466,
"percentage": 97.6,
"color": "#2ecc71"
},
{
"status": "Not Enriched",
"count": 36,
"percentage": 2.4,
"color": "#e74c3c"
}
],
"enrichment_sources": [
{
"source": "Google Maps",
"count": 1345,
"percentage": 89.5,
"color": "#e74c3c"
},
{
"source": "Wikidata",
"count": 1216,
"percentage": 81.0,
"color": "#3498db"
},
{
"source": "Website",
"count": 425,
"percentage": 28.3,
"color": "#9b59b6"
},
{
"source": "ISIL",
"count": 357,
"percentage": 23.8,
"color": "#2ecc71"
}
],
"identifier_coverage": [
{
"identifier": "Coordinates",
"count": 1411,
"percentage": 93.9
},
{
"identifier": "Website",
"count": 940,
"percentage": 62.6
},
{
"identifier": "Wikipedia NL",
"count": 620,
"percentage": 41.3
},
{
"identifier": "Image",
"count": 532,
"percentage": 35.4
},
{
"identifier": "ISIL Code",
"count": 357,
"percentage": 23.8
}
],
"google_maps_coverage": [
{
"feature": "Street View",
"count": 1341,
"percentage": 89.3
},
{
"feature": "Rating",
"count": 1167,
"percentage": 77.7
},
{
"feature": "Reviews",
"count": 1160,
"percentage": 77.2
},
{
"feature": "Photos",
"count": 1151,
"percentage": 76.6
},
{
"feature": "Opening Hours",
"count": 989,
"percentage": 65.8
}
],
"founding_timeline": [
{
"decade": 600,
"count": 1
},
{
"decade": 610,
"count": 0
},
{
"decade": 620,
"count": 0
},
{
"decade": 630,
"count": 0
},
{
"decade": 640,
"count": 0
},
{
"decade": 650,
"count": 0
},
{
"decade": 660,
"count": 0
},
{
"decade": 670,
"count": 0
},
{
"decade": 680,
"count": 0
},
{
"decade": 690,
"count": 0
},
{
"decade": 700,
"count": 0
},
{
"decade": 710,
"count": 0
},
{
"decade": 720,
"count": 0
},
{
"decade": 730,
"count": 0
},
{
"decade": 740,
"count": 0
},
{
"decade": 750,
"count": 0
},
{
"decade": 760,
"count": 0
},
{
"decade": 770,
"count": 0
},
{
"decade": 780,
"count": 0
},
{
"decade": 790,
"count": 0
},
{
"decade": 800,
"count": 0
},
{
"decade": 810,
"count": 0
},
{
"decade": 820,
"count": 0
},
{
"decade": 830,
"count": 0
},
{
"decade": 840,
"count": 0
},
{
"decade": 850,
"count": 0
},
{
"decade": 860,
"count": 0
},
{
"decade": 870,
"count": 0
},
{
"decade": 880,
"count": 0
},
{
"decade": 890,
"count": 0
},
{
"decade": 900,
"count": 0
},
{
"decade": 910,
"count": 0
},
{
"decade": 920,
"count": 0
},
{
"decade": 930,
"count": 0
},
{
"decade": 940,
"count": 0
},
{
"decade": 950,
"count": 0
},
{
"decade": 960,
"count": 0
},
{
"decade": 970,
"count": 0
},
{
"decade": 980,
"count": 0
},
{
"decade": 990,
"count": 0
},
{
"decade": 1000,
"count": 0
},
{
"decade": 1010,
"count": 0
},
{
"decade": 1020,
"count": 0
},
{
"decade": 1030,
"count": 0
},
{
"decade": 1040,
"count": 0
},
{
"decade": 1050,
"count": 0
},
{
"decade": 1060,
"count": 0
},
{
"decade": 1070,
"count": 0
},
{
"decade": 1080,
"count": 0
},
{
"decade": 1090,
"count": 0
},
{
"decade": 1100,
"count": 0
},
{
"decade": 1110,
"count": 0
},
{
"decade": 1120,
"count": 0
},
{
"decade": 1130,
"count": 0
},
{
"decade": 1140,
"count": 0
},
{
"decade": 1150,
"count": 0
},
{
"decade": 1160,
"count": 0
},
{
"decade": 1170,
"count": 0
},
{
"decade": 1180,
"count": 0
},
{
"decade": 1190,
"count": 0
},
{
"decade": 1200,
"count": 0
},
{
"decade": 1210,
"count": 0
},
{
"decade": 1220,
"count": 0
},
{
"decade": 1230,
"count": 0
},
{
"decade": 1240,
"count": 0
},
{
"decade": 1250,
"count": 1
},
{
"decade": 1260,
"count": 0
},
{
"decade": 1270,
"count": 0
},
{
"decade": 1280,
"count": 2
},
{
"decade": 1290,
"count": 0
},
{
"decade": 1300,
"count": 0
},
{
"decade": 1310,
"count": 0
},
{
"decade": 1320,
"count": 0
},
{
"decade": 1330,
"count": 0
},
{
"decade": 1340,
"count": 0
},
{
"decade": 1350,
"count": 0
},
{
"decade": 1360,
"count": 0
},
{
"decade": 1370,
"count": 0
},
{
"decade": 1380,
"count": 0
},
{
"decade": 1390,
"count": 0
},
{
"decade": 1400,
"count": 3
},
{
"decade": 1410,
"count": 0
},
{
"decade": 1420,
"count": 0
},
{
"decade": 1430,
"count": 0
},
{
"decade": 1440,
"count": 0
},
{
"decade": 1450,
"count": 0
},
{
"decade": 1460,
"count": 0
},
{
"decade": 1470,
"count": 0
},
{
"decade": 1480,
"count": 0
},
{
"decade": 1490,
"count": 0
},
{
"decade": 1500,
"count": 0
},
{
"decade": 1510,
"count": 1
},
{
"decade": 1520,
"count": 0
},
{
"decade": 1530,
"count": 1
},
{
"decade": 1540,
"count": 1
},
{
"decade": 1550,
"count": 0
},
{
"decade": 1560,
"count": 0
},
{
"decade": 1570,
"count": 0
},
{
"decade": 1580,
"count": 1
},
{
"decade": 1590,
"count": 2
},
{
"decade": 1600,
"count": 0
},
{
"decade": 1610,
"count": 2
},
{
"decade": 1620,
"count": 0
},
{
"decade": 1630,
"count": 1
},
{
"decade": 1640,
"count": 2
},
{
"decade": 1650,
"count": 0
},
{
"decade": 1660,
"count": 2
},
{
"decade": 1670,
"count": 0
},
{
"decade": 1680,
"count": 0
},
{
"decade": 1690,
"count": 0
},
{
"decade": 1700,
"count": 0
},
{
"decade": 1710,
"count": 1
},
{
"decade": 1720,
"count": 0
},
{
"decade": 1730,
"count": 0
},
{
"decade": 1740,
"count": 0
},
{
"decade": 1750,
"count": 0
},
{
"decade": 1760,
"count": 2
},
{
"decade": 1770,
"count": 0
},
{
"decade": 1780,
"count": 2
},
{
"decade": 1790,
"count": 6
},
{
"decade": 1800,
"count": 3
},
{
"decade": 1810,
"count": 4
},
{
"decade": 1820,
"count": 2
},
{
"decade": 1830,
"count": 3
},
{
"decade": 1840,
"count": 7
},
{
"decade": 1850,
"count": 5
},
{
"decade": 1860,
"count": 4
},
{
"decade": 1870,
"count": 9
},
{
"decade": 1880,
"count": 9
},
{
"decade": 1890,
"count": 6
},
{
"decade": 1900,
"count": 3
},
{
"decade": 1910,
"count": 12
},
{
"decade": 1920,
"count": 8
},
{
"decade": 1930,
"count": 15
},
{
"decade": 1940,
"count": 10
},
{
"decade": 1950,
"count": 16
},
{
"decade": 1960,
"count": 8
},
{
"decade": 1970,
"count": 29
},
{
"decade": 1980,
"count": 27
},
{
"decade": 1990,
"count": 40
},
{
"decade": 2000,
"count": 32
},
{
"decade": 2010,
"count": 25
},
{
"decade": 2020,
"count": 5
}
],
"provinces": [
{
"province": "Zuid-Holland",
"count": 224,
"color": "#bcbd22",
"types": {
"S": {
"code": "S",
"name": "Society",
"count": 25,
"color": "#9b59b6"
},
"M": {
"code": "M",
"name": "Museum",
"count": 102,
"color": "#e74c3c"
},
"D": {
"code": "D",
"name": "Digital",
"count": 4,
"color": "#34495e"
},
"A": {
"code": "A",
"name": "Archive",
"count": 29,
"color": "#3498db"
},
"N": {
"code": "N",
"name": "NGO",
"count": 5,
"color": "#e91e63"
},
"O": {
"code": "O",
"name": "Official",
"count": 33,
"color": "#f39c12"
},
"U": {
"code": "U",
"name": "Unknown",
"count": 3,
"color": "#9e9e9e"
},
"L": {
"code": "L",
"name": "Library",
"count": 19,
"color": "#2ecc71"
},
"F": {
"code": "F",
"name": "Features",
"count": 2,
"color": "#95a5a6"
},
"B": {
"code": "B",
"name": "Botanical",
"count": 1,
"color": "#4caf50"
},
"R": {
"code": "R",
"name": "Research",
"count": 1,
"color": "#1abc9c"
}
}
},
{
"province": "Gelderland",
"count": 220,
"color": "#8c564b",
"types": {
"A": {
"code": "A",
"name": "Archive",
"count": 29,
"color": "#3498db"
},
"M": {
"code": "M",
"name": "Museum",
"count": 105,
"color": "#e74c3c"
},
"S": {
"code": "S",
"name": "Society",
"count": 46,
"color": "#9b59b6"
},
"D": {
"code": "D",
"name": "Digital",
"count": 10,
"color": "#34495e"
},
"L": {
"code": "L",
"name": "Library",
"count": 13,
"color": "#2ecc71"
},
"O": {
"code": "O",
"name": "Official",
"count": 5,
"color": "#f39c12"
},
"E": {
"code": "E",
"name": "Education",
"count": 3,
"color": "#ff9800"
},
"B": {
"code": "B",
"name": "Botanical",
"count": 2,
"color": "#4caf50"
},
"N": {
"code": "N",
"name": "NGO",
"count": 3,
"color": "#e91e63"
},
"U": {
"code": "U",
"name": "Unknown",
"count": 2,
"color": "#9e9e9e"
},
"C": {
"code": "C",
"name": "Corporation",
"count": 1,
"color": "#795548"
},
"F": {
"code": "F",
"name": "Features",
"count": 1,
"color": "#95a5a6"
}
}
},
{
"province": "Overijssel",
"count": 218,
"color": "#d62728",
"types": {
"M": {
"code": "M",
"name": "Museum",
"count": 65,
"color": "#e74c3c"
},
"U": {
"code": "U",
"name": "Unknown",
"count": 3,
"color": "#9e9e9e"
},
"L": {
"code": "L",
"name": "Library",
"count": 20,
"color": "#2ecc71"
},
"A": {
"code": "A",
"name": "Archive",
"count": 38,
"color": "#3498db"
},
"S": {
"code": "S",
"name": "Society",
"count": 79,
"color": "#9b59b6"
},
"D": {
"code": "D",
"name": "Digital",
"count": 6,
"color": "#34495e"
},
"N": {
"code": "N",
"name": "NGO",
"count": 1,
"color": "#e91e63"
},
"C": {
"code": "C",
"name": "Corporation",
"count": 2,
"color": "#795548"
},
"I": {
"code": "I",
"name": "Intangible",
"count": 1,
"color": "#673ab7"
},
"O": {
"code": "O",
"name": "Official",
"count": 2,
"color": "#f39c12"
},
"R": {
"code": "R",
"name": "Research",
"count": 1,
"color": "#1abc9c"
}
}
},
{
"province": "Noord-Holland",
"count": 176,
"color": "#7f7f7f",
"types": {
"O": {
"code": "O",
"name": "Official",
"count": 5,
"color": "#f39c12"
},
"M": {
"code": "M",
"name": "Museum",
"count": 90,
"color": "#e74c3c"
},
"S": {
"code": "S",
"name": "Society",
"count": 36,
"color": "#9b59b6"
},
"N": {
"code": "N",
"name": "NGO",
"count": 2,
"color": "#e91e63"
},
"R": {
"code": "R",
"name": "Research",
"count": 5,
"color": "#1abc9c"
},
"C": {
"code": "C",
"name": "Corporation",
"count": 1,
"color": "#795548"
},
"L": {
"code": "L",
"name": "Library",
"count": 12,
"color": "#2ecc71"
},
"G": {
"code": "G",
"name": "Gallery",
"count": 1,
"color": "#00bcd4"
},
"A": {
"code": "A",
"name": "Archive",
"count": 16,
"color": "#3498db"
},
"U": {
"code": "U",
"name": "Unknown",
"count": 2,
"color": "#9e9e9e"
},
"B": {
"code": "B",
"name": "Botanical",
"count": 2,
"color": "#4caf50"
},
"I": {
"code": "I",
"name": "Intangible",
"count": 1,
"color": "#673ab7"
},
"E": {
"code": "E",
"name": "Education",
"count": 1,
"color": "#ff9800"
},
"D": {
"code": "D",
"name": "Digital",
"count": 2,
"color": "#34495e"
}
}
},
{
"province": "Noord-Brabant",
"count": 172,
"color": "#aec7e8",
"types": {
"S": {
"code": "S",
"name": "Society",
"count": 75,
"color": "#9b59b6"
},
"M": {
"code": "M",
"name": "Museum",
"count": 70,
"color": "#e74c3c"
},
"O": {
"code": "O",
"name": "Official",
"count": 2,
"color": "#f39c12"
},
"A": {
"code": "A",
"name": "Archive",
"count": 13,
"color": "#3498db"
},
"D": {
"code": "D",
"name": "Digital",
"count": 1,
"color": "#34495e"
},
"L": {
"code": "L",
"name": "Library",
"count": 8,
"color": "#2ecc71"
},
"N": {
"code": "N",
"name": "NGO",
"count": 1,
"color": "#e91e63"
},
"E": {
"code": "E",
"name": "Education",
"count": 2,
"color": "#ff9800"
}
}
},
{
"province": "Friesland",
"count": 80,
"color": "#ff7f0e",
"types": {
"A": {
"code": "A",
"name": "Archive",
"count": 24,
"color": "#3498db"
},
"M": {
"code": "M",
"name": "Museum",
"count": 42,
"color": "#e74c3c"
},
"U": {
"code": "U",
"name": "Unknown",
"count": 1,
"color": "#9e9e9e"
},
"O": {
"code": "O",
"name": "Official",
"count": 2,
"color": "#f39c12"
},
"B": {
"code": "B",
"name": "Botanical",
"count": 3,
"color": "#4caf50"
},
"D": {
"code": "D",
"name": "Digital",
"count": 1,
"color": "#34495e"
},
"F": {
"code": "F",
"name": "Features",
"count": 1,
"color": "#95a5a6"
},
"R": {
"code": "R",
"name": "Research",
"count": 1,
"color": "#1abc9c"
},
"S": {
"code": "S",
"name": "Society",
"count": 3,
"color": "#9b59b6"
},
"L": {
"code": "L",
"name": "Library",
"count": 2,
"color": "#2ecc71"
}
}
},
{
"province": "Limburg",
"count": 79,
"color": "#ffbb78",
"types": {
"S": {
"code": "S",
"name": "Society",
"count": 31,
"color": "#9b59b6"
},
"O": {
"code": "O",
"name": "Official",
"count": 1,
"color": "#f39c12"
},
"M": {
"code": "M",
"name": "Museum",
"count": 26,
"color": "#e74c3c"
},
"L": {
"code": "L",
"name": "Library",
"count": 6,
"color": "#2ecc71"
},
"A": {
"code": "A",
"name": "Archive",
"count": 13,
"color": "#3498db"
},
"B": {
"code": "B",
"name": "Botanical",
"count": 1,
"color": "#4caf50"
},
"E": {
"code": "E",
"name": "Education",
"count": 1,
"color": "#ff9800"
}
}
},
{
"province": "Groningen",
"count": 70,
"color": "#1f77b4",
"types": {
"M": {
"code": "M",
"name": "Museum",
"count": 25,
"color": "#e74c3c"
},
"A": {
"code": "A",
"name": "Archive",
"count": 27,
"color": "#3498db"
},
"S": {
"code": "S",
"name": "Society",
"count": 6,
"color": "#9b59b6"
},
"F": {
"code": "F",
"name": "Features",
"count": 1,
"color": "#95a5a6"
},
"L": {
"code": "L",
"name": "Library",
"count": 4,
"color": "#2ecc71"
},
"R": {
"code": "R",
"name": "Research",
"count": 1,
"color": "#1abc9c"
},
"O": {
"code": "O",
"name": "Official",
"count": 1,
"color": "#f39c12"
},
"E": {
"code": "E",
"name": "Education",
"count": 1,
"color": "#ff9800"
},
"B": {
"code": "B",
"name": "Botanical",
"count": 2,
"color": "#4caf50"
},
"D": {
"code": "D",
"name": "Digital",
"count": 2,
"color": "#34495e"
}
}
},
{
"province": "Zeeland",
"count": 51,
"color": "#17becf",
"types": {
"A": {
"code": "A",
"name": "Archive",
"count": 10,
"color": "#3498db"
},
"S": {
"code": "S",
"name": "Society",
"count": 3,
"color": "#9b59b6"
},
"M": {
"code": "M",
"name": "Museum",
"count": 30,
"color": "#e74c3c"
},
"R": {
"code": "R",
"name": "Research",
"count": 1,
"color": "#1abc9c"
},
"D": {
"code": "D",
"name": "Digital",
"count": 1,
"color": "#34495e"
},
"F": {
"code": "F",
"name": "Features",
"count": 3,
"color": "#95a5a6"
},
"L": {
"code": "L",
"name": "Library",
"count": 3,
"color": "#2ecc71"
}
}
},
{
"province": "Drenthe",
"count": 45,
"color": "#2ca02c",
"types": {
"M": {
"code": "M",
"name": "Museum",
"count": 16,
"color": "#e74c3c"
},
"A": {
"code": "A",
"name": "Archive",
"count": 13,
"color": "#3498db"
},
"S": {
"code": "S",
"name": "Society",
"count": 14,
"color": "#9b59b6"
},
"L": {
"code": "L",
"name": "Library",
"count": 2,
"color": "#2ecc71"
}
}
},
{
"province": "Flevoland",
"count": 42,
"color": "#9467bd",
"types": {
"S": {
"code": "S",
"name": "Society",
"count": 12,
"color": "#9b59b6"
},
"L": {
"code": "L",
"name": "Library",
"count": 5,
"color": "#2ecc71"
},
"A": {
"code": "A",
"name": "Archive",
"count": 4,
"color": "#3498db"
},
"M": {
"code": "M",
"name": "Museum",
"count": 17,
"color": "#e74c3c"
},
"F": {
"code": "F",
"name": "Features",
"count": 1,
"color": "#95a5a6"
},
"U": {
"code": "U",
"name": "Unknown",
"count": 1,
"color": "#9e9e9e"
},
"O": {
"code": "O",
"name": "Official",
"count": 1,
"color": "#f39c12"
},
"D": {
"code": "D",
"name": "Digital",
"count": 1,
"color": "#34495e"
}
}
},
{
"province": "Utrecht",
"count": 33,
"color": "#e377c2",
"types": {
"M": {
"code": "M",
"name": "Museum",
"count": 13,
"color": "#e74c3c"
},
"A": {
"code": "A",
"name": "Archive",
"count": 6,
"color": "#3498db"
},
"S": {
"code": "S",
"name": "Society",
"count": 11,
"color": "#9b59b6"
},
"E": {
"code": "E",
"name": "Education",
"count": 1,
"color": "#ff9800"
},
"D": {
"code": "D",
"name": "Digital",
"count": 1,
"color": "#34495e"
},
"L": {
"code": "L",
"name": "Library",
"count": 1,
"color": "#2ecc71"
}
}
}
]
}
}