- Add display_name and name_romanized fields to all 7948 person profiles
- Resolve UNKNOWN-UNKNOWN collision group (Hebrew/Arabic names now properly romanize)
- Hebrew names like אבישי דנינו now generate PPID AVISHI-DANINO instead of UNKNOWN-UNKNOWN
- Collision count reduced from 82 to 81 groups
Regenerated using generate_ppids.py with unidecode support (commit abe30cb)
341 lines
No EOL
10 KiB
JSON
341 lines
No EOL
10 KiB
JSON
{
|
|
"generation_timestamp": "2026-01-09T17:29:51.769166+00:00",
|
|
"input_directory": "/Users/kempersc/apps/glam/data/custodian/person/entity",
|
|
"output_directory": "/Users/kempersc/apps/glam/data/person",
|
|
"statistics": {
|
|
"input_files": 10871,
|
|
"unique_persons": 10325,
|
|
"heritage_relevant": 7949,
|
|
"ppids_generated": 7948,
|
|
"collisions_resolved": 81,
|
|
"files_saved": 7948
|
|
},
|
|
"collisions": {
|
|
"ID_XX-XX-XXX_XXXX_XX-XX-XXX_XXXX_THIJS-JANSSEN": [
|
|
"thijs-janssen-5b6004282",
|
|
"thijs-janssen-3256a4237"
|
|
],
|
|
"ID_XX-XX-XXX_XXXX_XX-XX-XXX_XXXX_WIM-SCHOT": [
|
|
"wim-schot-70319312",
|
|
"wim-schot-34aa17153"
|
|
],
|
|
"ID_XX-XX-XXX_XXXX_XX-XX-XXX_XXXX_HENRI-OMMEN": [
|
|
"henri-van-ommen-55176029a",
|
|
"henri-van-ommen-2565ba21"
|
|
],
|
|
"ID_XX-XX-XXX_XXXX_XX-XX-XXX_XXXX_DION-CROON": [
|
|
"dion-croon-0845b9182",
|
|
"dion-croon-7293a62"
|
|
],
|
|
"ID_XX-XX-XXX_XXXX_XX-XX-XXX_XXXX_LIDY-KUTSCHRUITER": [
|
|
"lidy-kutschruiter-33934b107",
|
|
"lidy-kutschruiter-948651199"
|
|
],
|
|
"ID_XX-XX-XXX_XXXX_XX-XX-XXX_XXXX_JESSICA-V": [
|
|
"jessica-v-aa894535",
|
|
"jessica-v-b9a08747"
|
|
],
|
|
"ID_XX-XX-XXX_XXXX_XX-XX-XXX_XXXX_PETER-NIJHUIS": [
|
|
"peter-peter-nijhuis-41b43a9a",
|
|
"peter-nijhuis-b6735b83",
|
|
"peter-nijhuis-a502b4249"
|
|
],
|
|
"ID_XX-XX-XXX_XXXX_XX-XX-XXX_XXXX_INGE-SCHOONE": [
|
|
"ingejolijnschoone",
|
|
"inge-jolijn-schoone-b242843a"
|
|
],
|
|
"ID_XX-XX-XXX_XXXX_XX-XX-XXX_XXXX_FLEUR-SMITH": [
|
|
"fleur-smith-788b8618",
|
|
"fleur-howes-smith-23b4b7b"
|
|
],
|
|
"ID_XX-XX-XXX_XXXX_XX-XX-XXX_XXXX_WIM-ES": [
|
|
"wim-van-es-8104aa139",
|
|
"wimvanderes"
|
|
],
|
|
"ID_XX-XX-XXX_XXXX_XX-XX-XXX_XXXX_DJOKE-DAM": [
|
|
"djoke-dam-9321a1139",
|
|
"djoke-dam-3a92a3139"
|
|
],
|
|
"ID_XX-XX-XXX_XXXX_XX-XX-XXX_XXXX_ANNEMARIE-DEKKER": [
|
|
"annemarie-dekker-025477132",
|
|
"annemarie-dekker-2aa03a43"
|
|
],
|
|
"ID_XX-XX-XXX_XXXX_XX-XX-XXX_XXXX_RICHARD-JANSEN": [
|
|
"richard-jansen-b009878a",
|
|
"richardjansenhinttech"
|
|
],
|
|
"ID_XX-XX-XXX_XXXX_XX-XX-XXX_XXXX_ERWIN-VOORHAAR": [
|
|
"erwin-voorhaar-03a678274",
|
|
"erwin-voorhaar-1901b717"
|
|
],
|
|
"ID_XX-XX-XXX_XXXX_XX-XX-XXX_XXXX_ANNEMARIE-ETTEKOVEN": [
|
|
"annemarie-ettekoven-62446415",
|
|
"annemarie-ettekoven-9b6471158"
|
|
],
|
|
"ID_XX-XX-XXX_XXXX_XX-XX-XXX_XXXX_PIETER-DREU": [
|
|
"pieter-de-dreu-b124504b",
|
|
"pieter-de-dreu-b6a4b34"
|
|
],
|
|
"ID_XX-XX-XXX_XXXX_XX-XX-XXX_XXXX_ANNEMARIE-BEZOOIJEN": [
|
|
"annemarie-bezooijen-b99034172",
|
|
"annemarie-bezooijen-56a66185"
|
|
],
|
|
"ID_XX-XX-XXX_XXXX_XX-XX-XXX_XXXX_BENNO-TEMPEL": [
|
|
"benno-tempel-b40a445",
|
|
"bennotempel"
|
|
],
|
|
"ID_XX-XX-XXX_XXXX_XX-XX-XXX_XXXX_JOKE-PUTTEN": [
|
|
"joke-van-putten-537067b2",
|
|
"joke-van-putten-64048b238"
|
|
],
|
|
"ID_XX-XX-XXX_XXXX_XX-XX-XXX_XXXX_REBECCA-TIMMERMANS": [
|
|
"rebecca-timmermans-95084021a",
|
|
"rebecca-timmermans-81717266"
|
|
],
|
|
"ID_XX-XX-XXX_XXXX_XX-XX-XXX_XXXX_JET-BARUCH": [
|
|
"jet-baruch-5209a0b",
|
|
"jet-baruch-829083110"
|
|
],
|
|
"ID_XX-XX-XXX_XXXX_XX-XX-XXX_XXXX_JOHAN-OOMEN": [
|
|
"johanoomen",
|
|
"johan-oomen-98b5b631"
|
|
],
|
|
"ID_XX-XX-XXX_XXXX_XX-XX-XXX_XXXX_JASPER-V": [
|
|
"jvh1988",
|
|
"jaspervdm"
|
|
],
|
|
"ID_XX-XX-XXX_XXXX_XX-XX-XXX_XXXX_WIES-ERKELENS": [
|
|
"wies-erkelens-b4735219",
|
|
"wies-erkelens-5a6969161"
|
|
],
|
|
"ID_XX-XX-XXX_XXXX_XX-XX-XXX_XXXX_NOVITA-DWIHAPSARI": [
|
|
"novita-dwihapsari-17983031",
|
|
"novita-dwihapsari-27788027"
|
|
],
|
|
"ID_XX-XX-XXX_XXXX_XX-XX-XXX_XXXX_HANS-JANSEN": [
|
|
"hans-jansen-6a075530",
|
|
"hansjansen5"
|
|
],
|
|
"ID_XX-XX-XXX_XXXX_XX-XX-XXX_XXXX_ROBERT-GEBHARDT": [
|
|
"robert-gebhardt-524a37113",
|
|
"robert-gebhardt-a79567276"
|
|
],
|
|
"ID_XX-XX-XXX_XXXX_XX-XX-XXX_XXXX_RENE-BROUWER": [
|
|
"rené-brouwer-413a1289",
|
|
"rene-brouwer-413a1289"
|
|
],
|
|
"ID_XX-XX-XXX_XXXX_XX-XX-XXX_XXXX_MAX-KLEEF": [
|
|
"max-van-kleef-321945195",
|
|
"max-kleef-325b1a161"
|
|
],
|
|
"ID_XX-XX-XXX_XXXX_XX-XX-XXX_XXXX_STEPHAN-MANTEL": [
|
|
"stephan-mantel-b77b1b348",
|
|
"stephanmantel"
|
|
],
|
|
"ID_XX-XX-XXX_XXXX_XX-XX-XXX_XXXX_JH-SCHUITE": [
|
|
"j-h-schuite-41462750",
|
|
"j-h-schuite-8939751a4"
|
|
],
|
|
"ID_XX-XX-XXX_XXXX_XX-XX-XXX_XXXX_MICHIEL-WIJK": [
|
|
"michiel-van-wijk-85a8b754",
|
|
"michiel-van-wijk-53858154"
|
|
],
|
|
"ID_XX-XX-XXX_XXXX_XX-XX-XXX_XXXX_ANNE-B": [
|
|
"anne-b-a6023522",
|
|
"anne-v-b-832796186"
|
|
],
|
|
"ID_XX-XX-XXX_XXXX_XX-XX-XXX_XXXX_DORINE-STUGER": [
|
|
"dorine-stuger-b3551894",
|
|
"dorine-stuger-56005083"
|
|
],
|
|
"ID_XX-XX-XXX_XXXX_XX-XX-XXX_XXXX_AAT-HOUT": [
|
|
"aat-in-t-hout-2a164a22",
|
|
"aat-in-t-hout-6a28867"
|
|
],
|
|
"ID_XX-XX-XXX_XXXX_XX-XX-XXX_XXXX_MICHAEL-BAL": [
|
|
"michaël-bal-27884718",
|
|
"michaël-m-bal-63ba8313"
|
|
],
|
|
"ID_XX-XX-XXX_XXXX_XX-XX-XXX_XXXX_GERARD-POEL": [
|
|
"gerard-van-der-poel-13a60b37",
|
|
"gerard-van-der-poel-11b20570"
|
|
],
|
|
"ID_XX-XX-XXX_XXXX_XX-XX-XXX_XXXX_ANGELIQUE-EERENBEEMD": [
|
|
"angelique-van-den-eerenbeemd-b754248",
|
|
"angelique-van-den-eerenbeemd-71415832"
|
|
],
|
|
"ID_XX-XX-XXX_XXXX_XX-XX-XXX_XXXX_ERIC-BOES": [
|
|
"eric-boes-5ba50b11a",
|
|
"eric-boes-8262b5124"
|
|
],
|
|
"ID_XX-XX-XXX_XXXX_XX-XX-XXX_XXXX_ARIE-WALLERT": [
|
|
"arie-wallert-a533b516",
|
|
"arie-wallert-7a7a0442"
|
|
],
|
|
"ID_XX-XX-XXX_XXXX_XX-XX-XXX_XXXX_JEROEN-BOS": [
|
|
"jvdbos",
|
|
"jeroen-bos-5aa600305"
|
|
],
|
|
"ID_XX-XX-XXX_XXXX_XX-XX-XXX_XXXX_CASPER-HUIS": [
|
|
"casper-huis-8b1350180",
|
|
"casper-huis-ab8452179"
|
|
],
|
|
"ID_XX-XX-XXX_XXXX_XX-XX-XXX_XXXX_RAISTIWAR-PRATAMA": [
|
|
"raistiwar-pratama-4bb2404a",
|
|
"raistiwar-pratama-0874ba290"
|
|
],
|
|
"ID_XX-XX-XXX_XXXX_XX-XX-XXX_XXXX_JOHN-DEE": [
|
|
"john-dee-64b31aa0",
|
|
"john-dee-7a69652b6"
|
|
],
|
|
"ID_XX-XX-XXX_XXXX_XX-XX-XXX_XXXX_SEFANJA-BROUWER": [
|
|
"sefanja-brouwer-7b9b091a3",
|
|
"sefanja-brouwer-12b3368a"
|
|
],
|
|
"ID_XX-XX-XXX_XXXX_XX-XX-XXX_XXXX_HELEN-MEIJER": [
|
|
"helen-meijer-4971b056",
|
|
"helenmeijer"
|
|
],
|
|
"ID_XX-XX-XXX_XXXX_XX-XX-XXX_XXXX_TANJA-KUSTERS": [
|
|
"kusterscommunicatie",
|
|
"tanja-kusters-04589a203"
|
|
],
|
|
"ID_XX-XX-XXX_XXXX_XX-XX-XXX_XXXX_MARYSA-OTTE": [
|
|
"marysa-otte-a8632012",
|
|
"marysa-otte-853b6b23"
|
|
],
|
|
"ID_XX-XX-XXX_XXXX_XX-XX-XXX_XXXX_GUUS-GEURTS": [
|
|
"guus-geurts-149948158",
|
|
"guus-geurts-637447a0"
|
|
],
|
|
"ID_XX-XX-XXX_XXXX_XX-XX-XXX_XXXX_VESNA-INJAC": [
|
|
"vesna-injac-735b911",
|
|
"vesna-injac-07b2749"
|
|
],
|
|
"ID_XX-XX-XXX_XXXX_XX-XX-XXX_XXXX_ARNO-DIETEREN": [
|
|
"arno-dieteren-24304519",
|
|
"arno-dieteren-37914a30"
|
|
],
|
|
"ID_XX-XX-XXX_XXXX_XX-XX-XXX_XXXX_HANNEKE-ZUTHEM": [
|
|
"hanneke-van-zuthem-3065bb11",
|
|
"hanneke-van-zuthem-20855311"
|
|
],
|
|
"ID_XX-XX-XXX_XXXX_XX-XX-XXX_XXXX_JULIETTE-ROMIJN": [
|
|
"julietteromijn",
|
|
"juliette-romijn-963374236"
|
|
],
|
|
"ID_XX-XX-XXX_XXXX_XX-XX-XXX_XXXX_MARIEJOSE-RAVEN": [
|
|
"marie-josé-raven-0413007",
|
|
"marie-josé-raven-18283711"
|
|
],
|
|
"ID_XX-XX-XXX_XXXX_XX-XX-XXX_XXXX_ERIK-VRIES": [
|
|
"erik-de-vries-075662171",
|
|
"erik-de-vries-6976083"
|
|
],
|
|
"ID_XX-XX-XXX_XXXX_XX-XX-XXX_XXXX_TIM-ZEGGEREN": [
|
|
"tim-van-zeggeren-448539150",
|
|
"tim-van-zeggeren-96a20a29"
|
|
],
|
|
"ID_XX-XX-XXX_XXXX_XX-XX-XXX_XXXX_MAURITS-RAVESTEYN": [
|
|
"maurits-van-ravesteyn-916808154",
|
|
"maurits-van-ravesteyn-709517ab"
|
|
],
|
|
"ID_XX-XX-XXX_XXXX_XX-XX-XXX_XXXX_NUR-ARIANI": [
|
|
"nur-indah-ariani-570514280",
|
|
"nur-indah-ariani-090920362"
|
|
],
|
|
"ID_XX-XX-XXX_XXXX_XX-XX-XXX_XXXX_KELLY-V": [
|
|
"kelly-vink",
|
|
"kelly-v-0260305a"
|
|
],
|
|
"ID_XX-XX-XXX_XXXX_XX-XX-XXX_XXXX_DAAN-JANSEN": [
|
|
"daan-jansen-6aa28225a",
|
|
"daan-jansen-85278640"
|
|
],
|
|
"ID_XX-XX-XXX_XXXX_XX-XX-XXX_XXXX_BJRN-DEKKER": [
|
|
"bjørn-dekker-8447068a",
|
|
"bjorn-dekker-8447068a"
|
|
],
|
|
"ID_XX-XX-XXX_XXXX_XX-XX-XXX_XXXX_MARCEL-LAAR": [
|
|
"marcel-van-laar-5b4725294",
|
|
"marcel-van-laar-163a4a45"
|
|
],
|
|
"ID_XX-XX-XXX_XXXX_XX-XX-XXX_XXXX_JAN-BEENS": [
|
|
"jan-beens-86b42013",
|
|
"jan-beens-5b6448335"
|
|
],
|
|
"ID_XX-XX-XXX_XXXX_XX-XX-XXX_XXXX_HARRY-HOLLEMAN": [
|
|
"harry-holleman-a136059",
|
|
"harry-holleman-b205692a3",
|
|
"harryholleman"
|
|
],
|
|
"ID_XX-XX-XXX_XXXX_XX-XX-XXX_XXXX_SIMONE-SOUER": [
|
|
"simone-souër-781bb126",
|
|
"simone-souer-781bb126"
|
|
],
|
|
"ID_XX-XX-XXX_XXXX_XX-XX-XXX_XXXX_MANJA-ZELDENRUST": [
|
|
"manja-zeldenrust-31475912",
|
|
"manja-zeldenrust-23678411"
|
|
],
|
|
"ID_XX-XX-XXX_XXXX_XX-XX-XXX_XXXX_MARENTE-BLOEMHEUVEL": [
|
|
"marente-bloemheuvel-9a65078",
|
|
"marente-bloemheuvel-a97aab355"
|
|
],
|
|
"ID_XX-XX-XXX_XXXX_XX-XX-XXX_XXXX_SARAH-S": [
|
|
"sarahsarah",
|
|
"sarah-s-1699b2a3"
|
|
],
|
|
"ID_XX-XX-XXX_XXXX_XX-XX-XXX_XXXX_MARK-JONG": [
|
|
"mark-de-jong-405678",
|
|
"mark-de-jong-942663222"
|
|
],
|
|
"ID_XX-XX-XXX_XXXX_XX-XX-XXX_XXXX_NIENKE-JANSEN": [
|
|
"nienke-jansen-2b8a1a6",
|
|
"nienke-jansen-3a906964"
|
|
],
|
|
"ID_XX-XX-XXX_XXXX_XX-XX-XXX_XXXX_KARIN-VERSCHOOR": [
|
|
"karin-verschoor-b5136157",
|
|
"karinzwartverschoor"
|
|
],
|
|
"ID_XX-XX-XXX_XXXX_XX-XX-XXX_XXXX_WILMA-TOOREN": [
|
|
"wilma-van-den-tooren-895203227",
|
|
"wilma-van-den-tooren-934b9674"
|
|
],
|
|
"ID_XX-XX-XXX_XXXX_XX-XX-XXX_XXXX_ISKANDER-BREEBAART": [
|
|
"iskander-breebaart-73b964b4",
|
|
"iskander-breebaart-854799b3"
|
|
],
|
|
"ID_XX-XX-XXX_XXXX_XX-XX-XXX_XXXX_TEIO-MEEDENDORP": [
|
|
"teio-meedendorp-2ab21519",
|
|
"teio-meedendorp-634442a"
|
|
],
|
|
"ID_XX-XX-XXX_XXXX_XX-XX-XXX_XXXX_MATTIE-BOOM": [
|
|
"mattie-boom-76a122386",
|
|
"mattie-boom-8346bb79"
|
|
],
|
|
"ID_XX-XX-XXX_XXXX_XX-XX-XXX_XXXX_ANDRE-KLAVER": [
|
|
"andré-klaver-9535932b",
|
|
"andré-klaver-982b79239"
|
|
],
|
|
"ID_XX-XX-XXX_XXXX_XX-XX-XXX_XXXX_NATASCHA-RENSWOUW": [
|
|
"natascha-van-renswouw-69328a10b",
|
|
"natascha-van-renswouw-703b5a19"
|
|
],
|
|
"ID_XX-XX-XXX_XXXX_XX-XX-XXX_XXXX_KRISTA-VERMEULENRIJKER": [
|
|
"krista-vermeulen-rijker-022011346",
|
|
"krista-vermeulen-rijker-b4210a356"
|
|
],
|
|
"ID_XX-XX-XXX_XXXX_XX-XX-XXX_XXXX_RUUD-HOGERWERF": [
|
|
"ruud-hogerwerf-377683294",
|
|
"ruud-hogerwerf-b583313b"
|
|
],
|
|
"ID_XX-XX-XXX_XXXX_XX-XX-XXX_XXXX_RINSKE-HAAN": [
|
|
"rinske-haan-248778151",
|
|
"rinske-de-haan-0b529712"
|
|
],
|
|
"ID_XX-XX-XXX_XXXX_XX-XX-XXX_XXXX_MARJAN-NANNINGA": [
|
|
"marjan-nanninga-39353254",
|
|
"marjan-nanninga-55841b247"
|
|
]
|
|
}
|
|
} |