diff --git a/backend/rag/main.py b/backend/rag/main.py index 95fd25a519..4d565ceefd 100644 --- a/backend/rag/main.py +++ b/backend/rag/main.py @@ -2485,20 +2485,28 @@ async def dspy_query(request: DSPyQueryRequest) -> DSPyQueryResponse: elapsed_ms = (time.time() - start_time) * 1000 + # Extract retrieved results for frontend visualization (tables, graphs) + retrieved_results = getattr(result, "retrieved_results", None) + query_type = getattr(result, "query_type", None) + # Extract visualization if present visualization = None if request.include_visualization and hasattr(result, "visualization"): viz = result.visualization if viz: + # Only include SPARQL for institution queries - person queries use wrong schema + # The HeritageSPARQLGenerator generates queries using crm:E39_Actor and hc:institutionType + # but person data uses schema:Person, schema:name, schema:jobTitle predicates. + # TODO: Create HeritagePersonSPARQLGenerator with correct schema:Person predicates + sparql_to_show = None + if query_type != "person": + sparql_to_show = getattr(result, "sparql", None) + visualization = { "type": getattr(viz, "viz_type", "table"), - "sparql_query": getattr(result, "sparql", None), + "sparql_query": sparql_to_show, } - # Extract retrieved results for frontend visualization (tables, graphs) - retrieved_results = getattr(result, "retrieved_results", None) - query_type = getattr(result, "query_type", None) - # Extract LLM response metadata from DSPy history (GLM 4.7 reasoning_content support) llm_response_metadata = extract_llm_response_metadata( lm=lm, @@ -2971,17 +2979,26 @@ async def stream_dspy_query_response( elapsed_ms = (time.time() - start_time) * 1000 + # Extract query_type first - needed for SPARQL visibility decision + query_type = getattr(result, "query_type", None) + visualization = None if request.include_visualization and hasattr(result, "visualization"): viz = result.visualization if viz: + # Only include SPARQL for institution queries - person SPARQL uses wrong schema + # (HeritageSPARQLGenerator uses crm:E39_Actor but person data uses schema:Person) + # TODO: Create HeritagePersonSPARQLGenerator with correct schema:Person predicates + sparql_to_show = None + if query_type != "person": + sparql_to_show = getattr(result, "sparql", None) + visualization = { "type": getattr(viz, "viz_type", "table"), - "sparql_query": getattr(result, "sparql", None), + "sparql_query": sparql_to_show, } retrieved_results = getattr(result, "retrieved_results", None) - query_type = getattr(result, "query_type", None) # Extract LLM response metadata from DSPy history (GLM 4.7 reasoning_content support) llm_response_metadata = extract_llm_response_metadata( diff --git a/data/custodian/.logo_enrichment_crawl4ai_checkpoint.json b/data/custodian/.logo_enrichment_crawl4ai_checkpoint.json index a896d67c22..8fe317cb56 100644 --- a/data/custodian/.logo_enrichment_crawl4ai_checkpoint.json +++ b/data/custodian/.logo_enrichment_crawl4ai_checkpoint.json @@ -10912,7 +10912,757 @@ "JP-13-CHU-L-NL.yaml", "JP-13-CHU-L-RLT.yaml", "JP-13-CHU-L-S-shimizukensetsukabushikigaishajohoshiryosenta.yaml", - "JP-13-CHU-L-S.yaml" + "JP-13-CHU-L-S.yaml", + "JP-13-CHU-L-SL.yaml", + "JP-13-CHU-L-SOL.yaml", + "JP-13-CHU-L-T.yaml", + "JP-13-CHU-L-TIITL.yaml", + "JP-13-CHU-M-AMIF.yaml", + "JP-13-CHU-M-CCCHM.yaml", + "JP-13-CHU-M-CMIMESBJ.yaml", + "JP-13-CHU-M-KM.yaml", + "JP-13-CHU-M-MHYYC.yaml", + "JP-13-CHU-M-MMM.yaml", + "JP-13-CHU-M-NFAJ.yaml", + "JP-13-CHU-M-SMG.yaml", + "JP-13-EDO-L-AGJCL.yaml", + "JP-13-EDO-L-ECCL.yaml", + "JP-13-EDO-L-ECHKL.yaml", + "JP-13-EDO-L-ECKL-edogawa_city_kasai_library.yaml", + "JP-13-EDO-L-ECKL-edogawa_city_komatsugawa_library.yaml", + "JP-13-EDO-L-ECKL.yaml", + "JP-13-EDO-L-ECML.yaml", + "JP-13-EDO-L-ECNKL.yaml", + "JP-13-EDO-L-ECSCL.yaml", + "JP-13-EDO-L-ECSL.yaml", + "JP-13-EDO-L-ECSLY.yaml", + "JP-13-EDO-L-ECTL.yaml", + "JP-13-EDO-L-EL.yaml", + "JP-13-EDO-L-SLN.yaml", + "JP-13-EDO-L-TCWL.yaml", + "JP-13-EDO-M-EKLM.yaml", + "JP-13-EDO-M-MM.yaml", + "JP-13-EDO-M-TSLP.yaml", + "JP-13-ETO-L-TPUHSL.yaml", + "JP-13-FUC-A-FF-fuchushiritsu_furusatofuchurekishikan.yaml", + "JP-13-FUC-A-FF.yaml", + "JP-13-FUC-A-TUFSA-tokyo_university_of_foreign_studies_archives.yaml", + "JP-13-FUC-A-TUFSA.yaml", + "JP-13-FUC-L-FL-fuchushiritsukatamachi_library.yaml", + "JP-13-FUC-L-FL-fuchushiritsukoremasa_library.yaml", + "JP-13-FUC-L-FL-fuchushiritsumiyamachi_library.yaml", + "JP-13-FUC-L-FL-fuchushiritsumomijigaoka_library.yaml", + "JP-13-FUC-L-FL-fuchushiritsumusashidai_library.yaml", + "JP-13-FUC-L-FL-fuchushiritsunishifu_library.yaml", + "JP-13-FUC-L-FL-fuchushiritsuoshitate_library.yaml", + "JP-13-FUC-L-FL-fuchushiritsushimmachi_library.yaml", + "JP-13-FUC-L-FL-fuchushiritsushiraitodai_library.yaml", + "JP-13-FUC-L-FL-fuchushiritsushogaigakushusenta_library.yaml", + "JP-13-FUC-L-FL-fuchushiritsusumiyoshi_library.yaml", + "JP-13-FUC-L-FL-fuchushiritsuyotsuya_library.yaml", + "JP-13-FUC-L-FL.yaml", + "JP-13-FUC-L-ITMRTPSSL.yaml", + "JP-13-FUC-L-TLFL.yaml", + "JP-13-FUC-L-TUFSL.yaml", + "JP-13-FUC-M-FAM.yaml", + "JP-13-FUC-M-JRM.yaml", + "JP-13-FUC-M-KMFCM.yaml", + "JP-13-FUC-M-OST.yaml", + "JP-13-FUS-L-FL-fussashiritsumusashinodai_library.yaml", + "JP-13-FUS-L-FL-fussashiritsuwakagiri_library.yaml", + "JP-13-FUS-L-FL-fussashiritsuwakatake_library.yaml", + "JP-13-FUS-L-FL.yaml", + "JP-13-FUS-M-FMLH.yaml", + "JP-13-HAC-L-C-chuodaigakuhogakubugakuseitoshoshitsu.yaml", + "JP-13-HAC-L-C-chuodaigakujimbunkagakukenkyusho.yaml", + "JP-13-HAC-L-C-chuodaigakukeizaigakubugakuseitoshoshitsu.yaml", + "JP-13-HAC-L-C-chuodaigakukeizaikenkyujo.yaml", + "JP-13-HAC-L-C-chuodaigakukigyokenkyujo.yaml", + "JP-13-HAC-L-C-chuodaigakuseisakubunkasogokenkyujo.yaml", + "JP-13-HAC-L-C-chuodaigakushakaikagakukenkyujo.yaml", + "JP-13-HAC-L-C-chuodaigakushogakubugakuseitoshoshitsu.yaml", + "JP-13-HAC-L-C.yaml", + "JP-13-HAC-L-CL.yaml", + "JP-13-HAC-L-CLTMU.yaml", + "JP-13-HAC-L-HL-hachijochoritsu_library.yaml", + "JP-13-HAC-L-HL-hachiojishiikoi_library.yaml", + "JP-13-HAC-L-HL-hachiojishiishikawashiminsenta_library.yaml", + "JP-13-HAC-L-HL-hachiojishikawaguchi_library.yaml", + "JP-13-HAC-L-HL-hachiojishikitanoshiminsenta_library.yaml", + "JP-13-HAC-L-HL-hachiojishiminamiosawa_library.yaml", + "JP-13-HAC-L-HL-hachiojishiongatashiminsenta_library.yaml", + "JP-13-HAC-L-HL-hachiojishishogaigakushusenta_library.yaml", + "JP-13-HAC-L-HL-hachiojishiyugichuoshiminsenta_library.yaml", + "JP-13-HAC-L-HL-hachiojishiyuishiminsentaminamino_library.yaml", + "JP-13-HAC-L-HL.yaml", + "JP-13-HAC-L-ICLJCU.yaml", + "JP-13-HAC-L-ICLTUPLS.yaml", + "JP-13-HAC-L-IHSSCU.yaml", + "JP-13-HAC-L-KLH.yaml", + "JP-13-HAC-L-NL.yaml", + "JP-13-HAC-L-OC.yaml", + "JP-13-HAC-L-SUFLFSEA.yaml", + "JP-13-HAC-L-SUL.yaml", + "JP-13-HAC-L-SULSL.yaml", + "JP-13-HAC-L-SUSL.yaml", + "JP-13-HAC-L-SWSCL.yaml", + "JP-13-HAC-L-TL-tokyojunshindaigaku_library.yaml", + "JP-13-HAC-L-TL-tokyokogyokotosemmongakko_library.yaml", + "JP-13-HAC-L-TL-tokyozokeidaigakufuzoku_library.yaml", + "JP-13-HAC-L-TL.yaml", + "JP-13-HAC-L-TLI.yaml", + "JP-13-HAC-L-TUHL.yaml", + "JP-13-HAC-L-TUMLC.yaml", + "JP-13-HAC-L-TUTMCL.yaml", + "JP-13-HAC-L-UASPROCU.yaml", + "JP-13-HAC-L-YL.yaml", + "JP-13-HAC-L-YUANL.yaml", + "JP-13-HAC-M-HCHM.yaml", + "JP-13-HAC-M-HSC.yaml", + "JP-13-HAC-M-MPGTUPLS.yaml", + "JP-13-HAC-M-TFAM.yaml", + "JP-13-HAC-M-TFSG.yaml", + "JP-13-HAC-M-TM.yaml", + "JP-13-HAC-M-TUM.yaml", + "JP-13-HAC-M-TVC.yaml", + "JP-13-HAC-M-TZUAM.yaml", + "JP-13-HAG-A-HTA-haga_town_archives.yaml", + "JP-13-HAG-A-HTA.yaml", + "JP-13-HAG-L-HTL.yaml", + "JP-13-HAG-L-IPL.yaml", + "JP-13-HAG-L-M.yaml", + "JP-13-HAG-L-ML.yaml", + "JP-13-HAG-M-HTM.yaml", + "JP-13-HAG-M-IHFM.yaml", + "JP-13-HAG-M-MMCA.yaml", + "JP-13-HAG-M-MMF.yaml", + "JP-13-HAG-M-WNAG.yaml", + "JP-13-HAM-L-H-hamurashifujimidairabunshitsu.yaml", + "JP-13-HAM-L-H-hamurashikamibunshitsu.yaml", + "JP-13-HAM-L-H-hamurashikawasakibunshitsu.yaml", + "JP-13-HAM-L-H.yaml", + "JP-13-HAM-L-HCL.yaml", + "JP-13-HAM-M-HM.yaml", + "JP-13-HAM-M-HZP.yaml", + "JP-13-HIE-M-NESMTD.yaml", + "JP-13-HIE-M-NOMA.yaml", + "JP-13-HIG-L-CL.yaml", + "JP-13-HIG-L-HAL.yaml", + "JP-13-HIG-L-HCL.yaml", + "JP-13-HIG-L-HFL.yaml", + "JP-13-HIG-L-HHL.yaml", + "JP-13-HIG-L-HL-higashikurumeshiritsuchuo_library.yaml", + "JP-13-HIG-L-HL-higashiyamatoshiritsukiyohara_library.yaml", + "JP-13-HIG-L-HL-higashiyamatoshiritsusakuragaoka_library.yaml", + "JP-13-HIG-L-HL.yaml", + "JP-13-HIG-L-HLHC.yaml", + "JP-13-HIG-L-HML.yaml", + "JP-13-HIG-L-HTL.yaml", + "JP-13-HIG-L-KCLTNDRLL.yaml", + "JP-13-HIG-L-TBSL.yaml", + "JP-13-HIG-L-TLHC.yaml", + "JP-13-HIG-M-FMH.yaml", + "JP-13-HIG-M-HCM.yaml", + "JP-13-HIG-M-NHSDM.yaml", + "JP-13-HIG-M-TAMF.yaml", + "JP-13-HIG-M-TCBM.yaml", + "JP-13-HIM-L-H-himishijusankominkantoshoshitsu.yaml", + "JP-13-HIM-L-H-himishiunamikominkantoshoshitsu.yaml", + "JP-13-HIM-L-H.yaml", + "JP-13-HIM-L-HCL.yaml", + "JP-13-HIM-M-HCM.yaml", + "JP-13-HIM-M-HSBG.yaml", + "JP-13-HIN-L-AMHIL.yaml", + "JP-13-HIN-L-H.yaml", + "JP-13-HIN-L-HL-hinocho_library.yaml", + "JP-13-HIN-L-HL-hinoshiritsuhino_library.yaml", + "JP-13-HIN-L-HL-hinoshiritsuhirayama_library.yaml", + "JP-13-HIN-L-HL-hinoshiritsumogusa_library.yaml", + "JP-13-HIN-L-HL-hinoshiritsutakahata_library.yaml", + "JP-13-HIN-L-HL-hinoshiritsutamadaira_library.yaml", + "JP-13-HIN-L-HL.yaml", + "JP-13-HIN-L-JWSUL.yaml", + "JP-13-HIN-L-KL.yaml", + "JP-13-HIN-L-MUL.yaml", + "JP-13-HIN-L-NL.yaml", + "JP-13-HIN-L-SDLTMU.yaml", + "JP-13-HIN-M-HCHM.yaml", + "JP-13-HIN-M-LMHC.yaml", + "JP-13-HIN-M-NTMA.yaml", + "JP-13-HIN-M-TZP.yaml", + "JP-13-HIU-L-KCL.yaml", + "JP-13-IMI-L-IL-imizushishimminato_library.yaml", + "JP-13-IMI-L-IL-imizushishimomura_library.yaml", + "JP-13-IMI-L-IL-imizushishoriki_library.yaml", + "JP-13-IMI-L-IL.yaml", + "JP-13-IMI-L-TL.yaml", + "JP-13-IMI-L-TLJL.yaml", + "JP-13-IMI-L-TPUL.yaml", + "JP-13-IMI-M-DMOC.yaml", + "JP-13-IMI-M-ICSM.yaml", + "JP-13-IMI-M-ITT.yaml", + "JP-13-INA-L-ICCL.yaml", + "JP-13-INA-L-ICDIL.yaml", + "JP-13-INA-L-ICDNL.yaml", + "JP-13-INA-L-ICDSL.yaml", + "JP-13-INA-L-ICDYL.yaml", + "JP-13-INA-L-IL.yaml", + "JP-13-INA-L-KTL.yaml", + "JP-13-ITA-A-IK-itabashiku_koubunshokan.yaml", + "JP-13-ITA-A-IK.yaml", + "JP-13-ITA-L-AL.yaml", + "JP-13-ITA-L-DBUL.yaml", + "JP-13-ITA-L-IBCSBH.yaml", + "JP-13-ITA-L-ICAL.yaml", + "JP-13-ITA-L-ICCL.yaml", + "JP-13-ITA-L-ICHIL.yaml", + "JP-13-ITA-L-ICHL-itabashi_city_hikawa_library.yaml", + "JP-13-ITA-L-ICHL.yaml", + "JP-13-ITA-L-ICKL.yaml", + "JP-13-ITA-L-ICNL-itabashi_city_narimasu_library.yaml", + "JP-13-ITA-L-ICNL.yaml", + "JP-13-ITA-L-ICSL-itabashi_city_shimura_library.yaml", + "JP-13-ITA-L-ICSL.yaml", + "JP-13-ITA-L-ICTL.yaml", + "JP-13-ITA-L-IL.yaml", + "JP-13-ITA-L-K.yaml", + "JP-13-ITA-L-KLS.yaml", + "JP-13-ITA-L-ML.yaml", + "JP-13-ITA-L-NUSM.yaml", + "JP-13-ITA-L-SL.yaml", + "JP-13-ITA-L-TL-tokushimakogyotankidaigaku_library.yaml", + "JP-13-ITA-L-TL.yaml", + "JP-13-ITA-L-TULMS.yaml", + "JP-13-ITA-M-AHM.yaml", + "JP-13-ITA-M-ASMR.yaml", + "JP-13-ITA-M-IAM.yaml", + "JP-13-ITA-M-IBG.yaml", + "JP-13-ITA-M-IHM.yaml", + "JP-13-ITA-M-ISEH.yaml", + "JP-13-ITA-M-JCM.yaml", + "JP-13-ITA-M-KCHFMH.yaml", + "JP-13-ITA-M-MB.yaml", + "JP-13-ITA-M-MHFMJPM.yaml", + "JP-13-ITA-M-TKUM.yaml", + "JP-13-ITA-M-TPCBCP.yaml", + "JP-13-IWA-L-IL.yaml", + "JP-13-IWA-M-BPMA.yaml", + "JP-13-IWA-M-KOZ.yaml", + "JP-13-IZU-M-TCFA.yaml", + "JP-13-IZU-M-TCMAIKMH.yaml", + "JP-13-KAI-L-KL-kaiyochoritsushishikui_library.yaml", + "JP-13-KAI-L-KL.yaml", + "JP-13-KAI-L-M.yaml", + "JP-13-KAI-L-ML.yaml", + "JP-13-KAI-L-Y.yaml", + "JP-13-KAI-M-KCM.yaml", + "JP-13-KAN-L-KCL.yaml", + "JP-13-KAN-L-KLA.yaml", + "JP-13-KAN-L-KLH.yaml", + "JP-13-KAN-M-KMAMKS.yaml", + "JP-13-KAN-M-KMFAW.yaml", + "JP-13-KAN-M-KSFHMH.yaml", + "JP-13-KAT-L-K-kamikatsuchokyoikuiinkai.yaml", + "JP-13-KAT-L-K.yaml", + "JP-13-KAT-L-KL-katsushikakuritsuaotochiku_library.yaml", + "JP-13-KAT-L-KL-katsushikakuritsuchuo_library.yaml", + "JP-13-KAT-L-KL-katsushikakuritsukamakura_library.yaml", + "JP-13-KAT-L-KL-katsushikakuritsukameari_library.yaml", + "JP-13-KAT-L-KL-katsushikakuritsukamikomatsu_library.yaml", + "JP-13-KAT-L-KL-katsushikakuritsukosugechiku_library.yaml", + "JP-13-KAT-L-KL-katsushikakuritsumizumoto_library.yaml", + "JP-13-KAT-L-KL-katsushikakuritsunishimizumotochiku_library.yaml", + "JP-13-KAT-L-KL-katsushikakuritsutateishi_library.yaml", + "JP-13-KAT-L-KL-katsushikakuritsuyotsugichiku_library.yaml", + "JP-13-KAT-L-KL.yaml", + "JP-13-KAT-L-KOL.yaml", + "JP-13-KAT-L-KTL.yaml", + "JP-13-KAT-L-TL.yaml", + "JP-13-KAT-L-TUSKL.yaml", + "JP-13-KAT-M-PG.yaml", + "JP-13-KAW-L-KL.yaml", + "JP-13-KIN-M-KAM.yaml", + "JP-13-KIN-M-KBK.yaml", + "JP-13-KIO-L-KL.yaml", + "JP-13-KIO-L-OL.yaml", + "JP-13-KIT-L-IRCSEMF.yaml", + "JP-13-KIT-L-JCARDLL.yaml", + "JP-13-KIT-L-KCCLB.yaml", + "JP-13-KIT-L-KJL.yaml", + "JP-13-KIT-L-KL-kitakuritsuakabane_library.yaml", + "JP-13-KIT-L-KL-kitakuritsuakabanekita_library.yaml", + "JP-13-KIT-L-KL-kitakuritsuakabanenishi_library.yaml", + "JP-13-KIT-L-KL-kitakuritsuhigashijujo_library.yaml", + "JP-13-KIT-L-KL-kitakuritsuhigashitabata_library.yaml", + "JP-13-KIT-L-KL-kitakuritsukamijujo_library.yaml", + "JP-13-KIT-L-KL-kitakuritsukamiya_library.yaml", + "JP-13-KIT-L-KL-kitakuritsukima_library.yaml", + "JP-13-KIT-L-KL-kitakuritsushowamachi_library.yaml", + "JP-13-KIT-L-KL-kitakuritsutabata_library.yaml", + "JP-13-KIT-L-KL-kitakuritsutakinogawa_library.yaml", + "JP-13-KIT-L-KL-kitakuritsutakinogawanishi_library.yaml", + "JP-13-KIT-L-KL-kitakuritsutoshima_library.yaml", + "JP-13-KIT-L-KL.yaml", + "JP-13-KIT-L-NKCLRDGL.yaml", + "JP-13-KIT-L-PML.yaml", + "JP-13-KIT-L-SL.yaml", + "JP-13-KIT-L-TLO.yaml", + "JP-13-KIT-L-TSTLTB.yaml", + "JP-13-KIT-L-TSU.yaml", + "JP-13-KIT-L-TULAL.yaml", + "JP-13-KIT-M-KCAM.yaml", + "JP-13-KIT-M-OAM.yaml", + "JP-13-KIT-M-PM.yaml", + "JP-13-KIT-M-TMMWA.yaml", + "JP-13-KIY-L-GLJNA.yaml", + "JP-13-KIY-L-JCSWL.yaml", + "JP-13-KIY-L-KCL.yaml", + "JP-13-KIY-L-KEL.yaml", + "JP-13-KIY-L-KMKL.yaml", + "JP-13-KIY-L-KNL.yaml", + "JP-13-KIY-L-KSL.yaml", + "JP-13-KIY-L-KTL.yaml", + "JP-13-KIY-L-LMPU.yaml", + "JP-13-KIY-L-NIOSH.yaml", + "JP-13-KIY-L-ORCTRI.yaml", + "JP-13-KIY-M-KMM.yaml", + "JP-13-KIY-M-MPGMPU.yaml", + "JP-13-KOD-L-BCTCL.yaml", + "JP-13-KOD-L-BGUKL.yaml", + "JP-13-KOD-L-CL.yaml", + "JP-13-KOD-L-KIMC.yaml", + "JP-13-KOD-L-KL-kodairashiritsuhanakoganei_library.yaml", + "JP-13-KOD-L-KL-kodairashiritsukamijuku_library.yaml", + "JP-13-KOD-L-KL-kodairashiritsukihei_library.yaml", + "JP-13-KOD-L-KL-kodairashiritsunakamachi_library.yaml", + "JP-13-KOD-L-KL-kodairashiritsuogawanishimachi_library.yaml", + "JP-13-KOD-L-KL-kodairashiritsuonuma_library.yaml", + "JP-13-KOD-L-KL-kodairashiritsutsuda_library.yaml", + "JP-13-KOD-L-KL.yaml", + "JP-13-KOD-L-KLH.yaml", + "JP-13-KOD-L-KLJ.yaml", + "JP-13-KOD-L-KLO.yaml", + "JP-13-KOD-L-PUL.yaml", + "JP-13-KOD-L-SGUCL.yaml", + "JP-13-KOD-L-TL.yaml", + "JP-13-KOD-M-FMS.yaml", + "JP-13-KOD-M-GM.yaml", + "JP-13-KOD-M-KHDAM.yaml", + "JP-13-KOD-M-MAUML.yaml", + "JP-13-KOD-M-TMMPG.yaml", + "JP-13-KOG-L-HL.yaml", + "JP-13-KOG-L-K-kokuritsukenkyukaihatsuhojinjohotsushinkenkyukikok.yaml", + "JP-13-KOG-L-K.yaml", + "JP-13-KOG-L-KCL.yaml", + "JP-13-KOG-L-KLH.yaml", + "JP-13-KOG-L-KLM.yaml", + "JP-13-KOG-L-KLN.yaml", + "JP-13-KOG-L-TGUCRIE.yaml", + "JP-13-KOG-L-TGUL.yaml", + "JP-13-KOG-L-TLKL.yaml", + "JP-13-KOG-M-NIICT.yaml", + "JP-13-KOG-M-NSMTUAT.yaml", + "JP-13-KOK-L-K.yaml", + "JP-13-KOK-L-KCHL-kokubunji_city_honda_library.yaml", + "JP-13-KOK-L-KCHL.yaml", + "JP-13-KOK-L-KCHLSB.yaml", + "JP-13-KOK-L-KCKL.yaml", + "JP-13-KOK-L-KCML.yaml", + "JP-13-KOK-L-KCNL.yaml", + "JP-13-KOK-L-LCRLHL.yaml", + "JP-13-KOK-L-TKUL.yaml", + "JP-13-KOK-L-TMTL.yaml", + "JP-13-KOK-M-KCMCA.yaml", + "JP-13-KOK-M-MKTRM.yaml", + "JP-13-KOM-L-K-komaeshiiwadochiikisentatoshoshitsu.yaml", + "JP-13-KOM-L-K-komaeshikamiizumichiikisentatoshoshitsu.yaml", + "JP-13-KOM-L-K-komaeshinambuchiikisentatoshoshitsu.yaml", + "JP-13-KOM-L-K-komaeshinogawachiikisentatoshoshitsu.yaml", + "JP-13-KOM-L-K.yaml", + "JP-13-KOM-L-KL.yaml", + "JP-13-KOM-L-SL.yaml", + "JP-13-KOT-L-AL.yaml", + "JP-13-KOT-L-ALMCAT.yaml", + "JP-13-KOT-L-CIL.yaml", + "JP-13-KOT-L-ITSC.yaml", + "JP-13-KOT-L-JTRCL.yaml", + "JP-13-KOT-L-KL-kotokuritsufukagawa_library.yaml", + "JP-13-KOT-L-KL-kotokuritsufuruishiba_library.yaml", + "JP-13-KOT-L-KL-kotokuritsuhigashiojima_library.yaml", + "JP-13-KOT-L-KL-kotokuritsujoto_library.yaml", + "JP-13-KOT-L-KL-kotokuritsukameido_library.yaml", + "JP-13-KOT-L-KL-kotokuritsukodomopuraza_library.yaml", + "JP-13-KOT-L-KL-kotokuritsushinonome_library.yaml", + "JP-13-KOT-L-KL-kotokuritsusunamachi_library.yaml", + "JP-13-KOT-L-KL-kotokuritsutoyo_library.yaml", + "JP-13-KOT-L-KL-kotokuritsutoyosu_library.yaml", + "JP-13-KOT-L-KL.yaml", + "JP-13-KOT-L-LLB.yaml", + "JP-13-KOT-L-ML.yaml", + "JP-13-KOT-L-SITTL.yaml", + "JP-13-KOT-L-TCTMOLLI.yaml", + "JP-13-KOT-L-TEPSCTMRIE.yaml", + "JP-13-KOT-L-TL.yaml", + "JP-13-KOT-L-TUMSTLEB.yaml", + "JP-13-KOT-M-CTARWD.yaml", + "JP-13-KOT-M-DFEH.yaml", + "JP-13-KOT-M-GSM.yaml", + "JP-13-KOT-M-KCBM.yaml", + "JP-13-KOT-M-KCFEM.yaml", + "JP-13-KOT-M-MCAT.yaml", + "JP-13-KOT-M-MNMESI.yaml", + "JP-13-KOT-M-NFM.yaml", + "JP-13-KOT-M-YSTGD.yaml", + "JP-13-KOZ-L-KPL.yaml", + "JP-13-KOZ-M-KILMH.yaml", + "JP-13-KUB-L-FL.yaml", + "JP-13-KUN-L-HUCHSSL.yaml", + "JP-13-KUN-L-HUL.yaml", + "JP-13-KUN-L-IERLHU.yaml", + "JP-13-KUN-L-K.yaml", + "JP-13-KUN-L-KL-kunitachikitashimimpuraza_library.yaml", + "JP-13-KUN-L-KL.yaml", + "JP-13-KUN-L-KLA.yaml", + "JP-13-KUN-L-KLH.yaml", + "JP-13-KUN-L-KLM.yaml", + "JP-13-KUN-L-KLS.yaml", + "JP-13-KUN-L-KLY.yaml", + "JP-13-KUN-L-RCISSSIERH.yaml", + "JP-13-KUN-L-TCF.yaml", + "JP-13-KUN-L-TWSCPEL.yaml", + "JP-13-KUN-L-YCIL.yaml", + "JP-13-KUN-M-KKBK.yaml", + "JP-13-KUN-M-THAM.yaml", + "JP-13-KUR-L-K-kurayoshishiageikominkantoshoshitsu.yaml", + "JP-13-KUR-L-K-kurayoshishikamiogamokominkantoshosupesu.yaml", + "JP-13-KUR-L-K-kurayoshishikitadanikominkantoshoshitsu.yaml", + "JP-13-KUR-L-K-kurayoshishimeirinkominkantoshokona.yaml", + "JP-13-KUR-L-K-kurayoshishinadatekominkantoshoshitsu.yaml", + "JP-13-KUR-L-K-kurayoshishiogamokominkantoshoshitsu.yaml", + "JP-13-KUR-L-K-kurayoshishisaigokominkantoshoshitsu.yaml", + "JP-13-KUR-L-K-kurayoshishiuwanadakominkankenshutoshoshitsu.yaml", + "JP-13-KUR-L-K-kurobeshiritsuaimotokominkantoshoshitsu.yaml", + "JP-13-KUR-L-K-kurobeshiritsuhigashifusekominkantoshoshitsu.yaml", + "JP-13-KUR-L-K-kurobeshiritsumikkaichikominkantoshoshitsu.yaml", + "JP-13-KUR-L-K-kurobeshiritsuogyukominkantoshoshitsu.yaml", + "JP-13-KUR-L-K-kurobeshiritsurayamakominkantoshoshitsu.yaml", + "JP-13-KUR-L-K-kurobeshiritsuwakagurikominkantoshoshitsu.yaml", + "JP-13-KUR-L-K.yaml", + "JP-13-KUR-L-KCAL.yaml", + "JP-13-KUR-L-KCL.yaml", + "JP-13-KUR-L-KL.yaml", + "JP-13-KUR-L-KST.yaml", + "JP-13-KUR-L-KUL.yaml", + "JP-13-KUR-L-TTL.yaml", + "JP-13-KUR-M-KCAM.yaml", + "JP-13-KUR-M-KFHM.yaml", + "JP-13-KUR-M-KMEP.yaml", + "JP-13-KUR-M-KVC.yaml", + "JP-13-KUR-M-KYSM.yaml", + "JP-13-KUR-M-SMA.yaml", + "JP-13-KUR-M-TNPM.yaml", + "JP-13-MAC-L-D.yaml", + "JP-13-MAC-L-FCCEL.yaml", + "JP-13-MAC-L-H-hoseidaigakushakaigakubushiryoshitsu.yaml", + "JP-13-MAC-L-H.yaml", + "JP-13-MAC-L-HL.yaml", + "JP-13-MAC-L-HUFSHS.yaml", + "JP-13-MAC-L-HUJSRI.yaml", + "JP-13-MAC-L-HURRFSPA.yaml", + "JP-13-MAC-L-ICESHU.yaml", + "JP-13-MAC-L-JFOUL.yaml", + "JP-13-MAC-L-KLJ.yaml", + "JP-13-MAC-L-ML-machidashiritsukanamori_library.yaml", + "JP-13-MAC-L-ML-machidashiritsukisoyamasaki_library.yaml", + "JP-13-MAC-L-ML-machidashiritsusakai_library.yaml", + "JP-13-MAC-L-ML-machidashiritsusarubia_library.yaml", + "JP-13-MAC-L-ML-machidashiritsutadao_library.yaml", + "JP-13-MAC-L-ML-machidashiritsutsurukawa_library.yaml", + "JP-13-MAC-L-ML-machidashiritsutsurukawaekimae_library.yaml", + "JP-13-MAC-L-ML-mukyukai_library.yaml", + "JP-13-MAC-L-ML.yaml", + "JP-13-MAC-L-OISRHU.yaml", + "JP-13-MAC-L-SL.yaml", + "JP-13-MAC-L-SPUL.yaml", + "JP-13-MAC-L-TKGULOML.yaml", + "JP-13-MAC-L-TUL.yaml", + "JP-13-MAC-L-WUUMLIC.yaml", + "JP-13-MAC-M-JMIMC.yaml", + "JP-13-MAC-M-SPUY.yaml", + "JP-13-MAC-M-TKGMDL.yaml", + "JP-13-MAC-M-TUME.yaml", + "JP-13-MEG-L-CPASLGSASU.yaml", + "JP-13-MEG-L-IISLUT.yaml", + "JP-13-MEG-L-ISTOL.yaml", + "JP-13-MEG-L-KLUT.yaml", + "JP-13-MEG-L-LTMMP.yaml", + "JP-13-MEG-L-MCOL.yaml", + "JP-13-MEG-L-MCYCL.yaml", + "JP-13-MEG-L-ML-megurokuritsumegurohoncho_library.yaml", + "JP-13-MEG-L-ML-megurokuritsumegurokuminsenta_library.yaml", + "JP-13-MEG-L-ML-megurokuritsumidorigaoka_library.yaml", + "JP-13-MEG-L-ML-megurokuritsunakameguroekimae_library.yaml", + "JP-13-MEG-L-ML-megurokuritsusenzoku_library.yaml", + "CZ-42-POL-L-MKP.yaml", + "CZ-42-POL-L-MLKVP.yaml", + "CZ-42-POV-L-MPS.yaml", + "CZ-42-POV-L-OKVP.yaml", + "CZ-42-PRA-L-MKPNL.yaml", + "CZ-42-PRA-L-MKVLNL.yaml", + "CZ-42-PRE-L-OKVP.yaml", + "CZ-42-PRO-L-MKP.yaml", + "CZ-42-RAD-L-MKR.yaml", + "CZ-42-RAD-L-OKR.yaml", + "CZ-42-REH-L-VKD.yaml", + "CZ-42-REJ-G-GBR.yaml", + "CZ-42-ROH-L-MKR.yaml", + "CZ-42-ROU-G-GMUVRNLPOU.yaml", + "CZ-42-ROU-L-A.yaml", + "CZ-42-ROU-L-KES.yaml", + "CZ-42-ROU-L-MKC.yaml", + "CZ-42-ROU-L-MKD-mistni_knihovna_dobrin.yaml", + "CZ-42-ROU-L-MKD.yaml", + "CZ-42-ROU-L-MKK-mistni_knihovna_kyskovice.yaml", + "CZ-42-ROU-L-MKV-mistni_knihovna_vetla.yaml", + "CZ-42-ROU-L-MKV.yaml", + "CZ-42-ROU-L-MKVDNO.yaml", + "CZ-42-ROU-M-PMK.yaml", + "CZ-42-RTY-L-OKRNB.yaml", + "CZ-42-RUM-L-KZSMNVUNLZ.yaml", + "CZ-42-RUM-L-MKR.yaml", + "CZ-42-RUM-M-KOMVDPOPR.yaml", + "CZ-42-RYJ-L-LPDN.yaml", + "CZ-42-SLU-L-MKS.yaml", + "CZ-42-SLU-L-T.yaml", + "CZ-42-SNE-L-MKS.yaml", + "CZ-42-SPO-L-OKVOS.yaml", + "CZ-42-STA-L-OKS.yaml", + "CZ-42-STA-L-OKSK.yaml", + "CZ-42-STE-E-VOSOTSSSKP.yaml", + "CZ-42-STE-L-IVP.yaml", + "CZ-42-STE-L-MPS.yaml", + "CZ-42-STR-L-MKSV.yaml", + "CZ-42-SUL-L-MKS.yaml", + "CZ-42-SVE-L-OKS.yaml", + "CZ-42-TEP-A-SOAT-statni_okresni_archiv_teplice.yaml", + "CZ-42-TEP-E-KTCK.yaml", + "CZ-42-TEP-E-VOSZSSZPK.yaml", + "CZ-42-TEP-L-BPTS.yaml", + "CZ-42-TEP-L-KZ.yaml", + "CZ-42-TEP-L-KZSNTZLKUN.yaml", + "CZ-42-TEP-L-LTVC.yaml", + "CZ-42-TEP-L-R.yaml", + "CZ-42-TEP-L-RKTPO.yaml", + "CZ-42-TEP-L-SSP.yaml", + "CZ-42-TEP-L-SUO.yaml", + "CZ-42-TEP-L-SUVP.yaml", + "CZ-42-TEP-L-VOD.yaml", + "CZ-42-TEP-L-VSTK.yaml", + "CZ-42-TEP-M-RMVTPK.yaml", + "CZ-42-TEP-M-RMVTPO.yaml", + "CZ-42-TEP-O-SOAVLSOAT.yaml", + "CZ-42-TER-L-DSR.yaml", + "CZ-42-TER-L-MKT.yaml", + "CZ-42-TER-L-VSAPSRK.yaml", + "CZ-42-TER-M-PTNKP.yaml", + "CZ-42-TRE-L-MKP.yaml", + "CZ-42-TRE-L-MKVS.yaml", + "CZ-42-TRM-L-MKT.yaml", + "CZ-42-TRU-A-AUMAVEST-archivalie_ulozene_mimo_archivy_v_evidenci_soka_tr.yaml", + "CZ-42-TUC-L-MKT.yaml", + "CZ-42-UDL-L-OKVU.yaml", + "CZ-42-UJE-L-MLKU.yaml", + "CZ-42-UNL-M-MMUNL.yaml", + "CZ-42-UST-L-AVCSUPSEU.yaml", + "CZ-42-UST-L-CLZUNL.yaml", + "CZ-42-UST-L-ES.yaml", + "CZ-42-UST-L-KHSUKSSVUN.yaml", + "CZ-42-UST-L-MKR.yaml", + "CZ-42-UST-L-NPUUOPVUNL.yaml", + "CZ-42-UST-L-OKC.yaml", + "CZ-42-UST-L-OUSTK.yaml", + "CZ-42-UST-L-PKUSPTK.yaml", + "CZ-42-UST-L-S.yaml", + "CZ-42-UST-L-SSTK.yaml", + "CZ-42-UST-L-THZ.yaml", + "CZ-42-UST-L-TS.yaml", + "CZ-42-UST-L-UJPFSE.yaml", + "CZ-42-UST-L-UJPFUDK.yaml", + "CZ-42-UST-L-UJPVK.yaml", + "CZ-42-UST-L-VS.yaml", + "CZ-42-UST-L-ZCUNLTK.yaml", + "CZ-42-UST-L-ZESR.yaml", + "CZ-42-UST-M-OMVUNLPOK.yaml", + "CZ-42-VAL-L-OKV.yaml", + "CZ-42-VAR-L-E.yaml", + "CZ-42-VAR-L-TST.yaml", + "CZ-42-VAR-L-VS.yaml", + "CZ-42-VEJ-L-MKSS.yaml", + "CZ-42-VEJ-L-MKVV.yaml", + "CZ-42-VEJ-L-OKVKH.yaml", + "CZ-42-VEL-L-MKV-mistni_knihovna_velteze.yaml", + "CZ-42-VEL-L-MKVM.yaml", + "CZ-42-VEL-L-MKVS.yaml", + "CZ-42-VEL-L-OKVVB-obecni_knihovna_ve_velke_bukovine.yaml", + "CZ-42-VEL-L-OKVVB.yaml", + "CZ-42-VEL-L-OKVVC.yaml", + "CZ-42-VER-L-OKVV.yaml", + "CZ-42-VIL-L-OVKV.yaml", + "CZ-42-VIL-L-SS.yaml", + "CZ-42-VRS-L-MVKV.yaml", + "CZ-42-VSE-L-OKVV.yaml", + "CZ-42-VYS-L-OKVV.yaml", + "CZ-42-VYS-L-OKVVP.yaml", + "CZ-42-ZAB-L-MKZ.yaml", + "CZ-42-ZAC-M-MMZ-mestske_muzeum_zacler.yaml", + "CZ-42-ZAL-L-MKZ-mistni_knihovna_zalhostice.yaml", + "CZ-42-ZAL-L-MKZ.yaml", + "CZ-42-ZAL-L-SDVU.yaml", + "CZ-42-ZAT-L-CISR.yaml", + "CZ-42-ZAT-L-SZS.yaml", + "CZ-42-ZAT-M-RMKPVZ.yaml", + "CZ-42-ZEL-M-MVMZ.yaml", + "CZ-42-ZIT-L-MKZ.yaml", + "CZ-42-ZIZ-L-OKZ.yaml", + "CZ-51-BEN-L-MKVBUS.yaml", + "CZ-51-BEN-L-OKBLS.yaml", + "CZ-51-BEN-L-OKDS.yaml", + "CZ-51-BOL-A-AUMAVESMB.yaml", + "CZ-51-BRA-L-OKB.yaml", + "CZ-51-BRA-L-OKH.yaml", + "CZ-51-BRA-L-OKJ.yaml", + "CZ-51-BUL-L-MKA.yaml", + "CZ-51-BYS-L-MKVBNJ.yaml", + "CZ-51-CED-M-PM-podjestedske_muzeum.yaml", + "CZ-51-CES-A-SOACL.yaml", + "CZ-51-CES-L-MKCL.yaml", + "CZ-51-CES-L-MKSPJR.yaml", + "CZ-51-CES-L-MKVPPJ.yaml", + "CZ-51-CES-L-N.yaml", + "CZ-51-CES-L-NCLS.yaml", + "CZ-51-CES-L-NSPCLSLK.yaml", + "CZ-51-CES-L-OKB.yaml", + "CZ-51-CES-L-OKVS.yaml", + "CZ-51-CES-L-PMKCD.yaml", + "CZ-51-CES-L-V.yaml", + "CZ-51-CES-M-VMGVCL.yaml", + "CZ-51-CET-L-MKVCHL.yaml", + "CZ-51-CHR-L-ECS.yaml", + "CZ-51-CHR-L-MKC.yaml", + "CZ-51-CHR-L-MLKV.yaml", + "CZ-51-CHR-M-MMIC.yaml", + "CZ-51-CIS-L-OKCUH.yaml", + "CZ-51-CRA-M-MCR.yaml", + "CZ-51-CVI-L-MKVC.yaml", + "CZ-51-CVI-L-S.yaml", + "CZ-51-DES-L-MKD.yaml", + "CZ-51-DES-M-MRV.yaml", + "CZ-51-DOK-L-MKB.yaml", + "CZ-51-DOK-L-MKT-mistni_knihovna_tuhan.yaml", + "CZ-51-DOK-L-MKT.yaml", + "CZ-51-DRZ-L-MKD.yaml", + "CZ-51-DUB-L-MKVD.yaml", + "CZ-51-DUB-L-OKVD.yaml", + "CZ-51-FRY-L-MKF.yaml", + "CZ-51-FRY-L-MKVV.yaml", + "CZ-51-FRY-M-MMF.yaml", + "CZ-51-FRY-M-MUFOKMMFK.yaml", + "CZ-51-HAB-L-MKVC.yaml", + "CZ-51-HAB-L-MKVH.yaml", + "CZ-51-HAB-L-MKVP.yaml", + "CZ-51-HAR-L-MKH.yaml", + "CZ-51-HEJ-L-OKBP.yaml", + "CZ-51-HEJ-L-OKLL.yaml", + "CZ-51-HOD-L-MKHNM.yaml", + "CZ-51-HOR-L-MKHP.yaml", + "CZ-51-HOR-L-MKVHB.yaml", + "CZ-51-HOR-L-MKVHR.yaml", + "CZ-51-HOR-L-MKVHUSP.yaml", + "CZ-51-HOR-L-MKVV.yaml", + "CZ-51-HRA-L-BZV.yaml", + "CZ-51-HRA-L-MKC.yaml", + "CZ-51-HUN-L-OKS.yaml", + "CZ-51-JAB-A-SOAJNN.yaml", + "CZ-51-JAB-L-AS.yaml", + "CZ-51-JAB-L-ASREPJNN.yaml", + "CZ-51-JAB-L-B.yaml", + "CZ-51-JAB-L-JOPMPS.yaml", + "CZ-51-JAB-L-JS.yaml", + "CZ-51-JAB-L-MKJNJ.yaml", + "CZ-51-JAB-L-MKJNN.yaml", + "CZ-51-JAB-L-MKM.yaml", + "CZ-51-JAB-L-MKVV.yaml", + "CZ-51-JAB-L-NJNNPLK.yaml", + "CZ-51-JAB-L-PSOSRT.yaml", + "CZ-51-JAB-L-UPHULPJNN.yaml", + "CZ-51-JAB-L-ZBZN.yaml", + "CZ-51-JAN-L-OKJNN.yaml", + "CZ-51-JEN-L-OKVJ.yaml", + "CZ-51-JER-L-MKVJ.yaml", + "CZ-51-JES-L-MKVJ.yaml", + "CZ-51-JIL-L-MKJH.yaml", + "CZ-51-JIL-L-MKJVK.yaml", + "CZ-51-JIL-L-MKLO.yaml", + "CZ-51-JIL-L-MLKVBUC.yaml", + "CZ-51-JIL-L-MMNJLK.yaml", + "CZ-51-JIL-L-OKK-obecni_knihovna_kundratice.yaml", + "CZ-51-JIL-L-OKK.yaml", + "CZ-51-JIL-M-KMJ.yaml", + "CZ-51-JIN-L-OKVJPS.yaml", + "CZ-51-JNN-A-AUMAVESJNN.yaml", + "CZ-51-JNN-M-MSBJNN.yaml", + "CZ-51-JOS-L-OKJD.yaml", + "CZ-51-KAM-L-PLSTK.yaml", + "CZ-51-KOS-L-OKVK.yaml", + "CZ-51-KRA-L-MKK.yaml", + "CZ-51-KRI-L-MKK.yaml", + "CZ-51-KRI-L-MKR.yaml", + "CZ-51-KRI-L-MKZ-mistni_knihovna_zibridice.yaml", + "CZ-51-KRI-L-MKZ.yaml", + "CZ-51-LIB-A-AUMAVESL-archivalie_ulozene_mimo_archivy_v_evidenci_soka_li.yaml", + "CZ-51-LIB-A-SOAL-statni_okresni_archiv_liberec.yaml", + "CZ-51-LIB-E-SZSVOSZLK.yaml", + "CZ-51-LIB-G-OGL.yaml", + "CZ-51-LIB-G-OGLPK.yaml", + "CZ-51-LIB-L-CMIOIL.yaml", + "CZ-51-LIB-L-DZVK.yaml", + "CZ-51-LIB-L-IS.yaml", + "CZ-51-LIB-L-KNLSLK.yaml", + "CZ-51-LIB-L-KSRSSV.yaml", + "CZ-51-LIB-L-KVKVL.yaml", + "CZ-51-LIB-L-LS.yaml", + "CZ-51-LIB-L-LVZ.yaml", + "CZ-51-LIB-L-MKVKU.yaml", + "CZ-51-LIB-L-MLKL.yaml", + "CZ-51-LIB-L-OZCEPP.yaml", + "CZ-51-LIB-L-S.yaml", + "CZ-51-LIB-L-SVUT.yaml", + "CZ-51-LIB-L-TL.yaml", + "CZ-51-LIB-L-TS.yaml", + "CZ-51-LIB-L-TUVLUK.yaml", + "CZ-51-LIB-L-UP.yaml", + "CZ-51-LIB-L-UPVMVSROP.yaml", + "CZ-51-LIB-L-VL.yaml", + "CZ-51-LIB-L-VSOITK.yaml", + "CZ-51-LIB-L-VSSTFS.yaml", + "CZ-51-LIB-M-SMLPO.yaml", + "CZ-51-LIB-O-KOPRTMHSKS.yaml", + "CZ-51-LIB-O-SOAVLSOAL.yaml", + "CZ-51-LNP-M-MMGLNP.yaml", + "CZ-51-LOM-L-KISPOMK.yaml", + "CZ-51-LOM-L-MKVS-mistni_knihovna_ve_struzinci.yaml", + "CZ-51-LOM-L-MKVS.yaml", + "CZ-51-LOM-L-TTTS.yaml", + "CZ-51-LUC-L-MKLNN.yaml", + "CZ-51-MAL-L-VKVMS.yaml", + "CZ-51-MAR-L-MKM.yaml", + "CZ-51-MAR-L-OKMVK.yaml", + "CZ-51-MAS-A-BSS.yaml", + "CZ-51-MIM-L-MKM.yaml", + "CZ-51-MIM-L-MKVK.yaml", + "CZ-51-MIM-L-MKVNPR.yaml", + "CZ-51-MIM-L-MKVPPR.yaml", + "CZ-51-MIM-L-MSK.yaml" ], - "last_index": 499 + "last_index": 259 } \ No newline at end of file diff --git a/data/custodian/CZ-42-ROU-L-KES.yaml b/data/custodian/CZ-42-ROU-L-KES.yaml index 6e4adc03ab..f2aef085a7 100644 --- a/data/custodian/CZ-42-ROU-L-KES.yaml +++ b/data/custodian/CZ-42-ROU-L-KES.yaml @@ -192,3 +192,22 @@ wikidata_enrichment: - Q7075 - Q41176 located_in: Q63855 +logo_enrichment: + enrichment_timestamp: '2025-12-25T13:55:31.266468+00:00' + source_url: https://katalog.mk-roudnice.cz + extraction_method: crawl4ai + claims: + - claim_type: favicon_url + claim_value: https://katalog.mk-roudnice.cz/themes/root/images/vufind-favicon.ico + source_url: https://katalog.mk-roudnice.cz + css_selector: '[document] > html > head > link:nth-of-type(7)' + retrieved_on: '2025-12-25T13:55:31.266468+00:00' + extraction_method: crawl4ai_link_rel + favicon_type: image/x-icon + favicon_sizes: '' + summary: + total_claims: 1 + has_primary_logo: false + has_favicon: true + has_og_image: false + favicon_count: 1 diff --git a/data/custodian/CZ-42-SLU-L-MKS.yaml b/data/custodian/CZ-42-SLU-L-MKS.yaml index 1799400d39..20451e0d3f 100644 --- a/data/custodian/CZ-42-SLU-L-MKS.yaml +++ b/data/custodian/CZ-42-SLU-L-MKS.yaml @@ -229,3 +229,22 @@ location: postal_code: 407 77 street_address: T.G. Masaryka 638 normalization_timestamp: '2025-12-09T10:54:19.705290+00:00' +logo_enrichment: + enrichment_timestamp: '2025-12-25T13:56:35.796505+00:00' + source_url: https://decin.tritius.cz/library/skat + extraction_method: crawl4ai + claims: + - claim_type: favicon_url + claim_value: https://decin.tritius.cz/apple-touch-icon-180x180.png + source_url: https://decin.tritius.cz/library/skat + css_selector: '[document] > html > head > link:nth-of-type(14)' + retrieved_on: '2025-12-25T13:56:35.796505+00:00' + extraction_method: crawl4ai_link_rel + favicon_type: '' + favicon_sizes: 180x180 + summary: + total_claims: 1 + has_primary_logo: false + has_favicon: true + has_og_image: false + favicon_count: 14 diff --git a/data/custodian/CZ-52-DVU-L-MKSVDKNL.yaml b/data/custodian/CZ-52-DVU-L-MKSVDKNL.yaml index 4aa20d9b82..594155468d 100644 --- a/data/custodian/CZ-52-DVU-L-MKSVDKNL.yaml +++ b/data/custodian/CZ-52-DVU-L-MKSVDKNL.yaml @@ -182,3 +182,22 @@ wikidata_enrichment: instance_of: - Q7075 located_in: Q143664 +logo_enrichment: + enrichment_timestamp: '2025-12-25T15:46:20.429989+00:00' + source_url: https://katalog.slavoj.cz + extraction_method: crawl4ai + claims: + - claim_type: favicon_url + claim_value: https://katalog.slavoj.cz/themes/root/images/vufind-favicon.ico + source_url: https://katalog.slavoj.cz + css_selector: '[document] > html > head > link:nth-of-type(7)' + retrieved_on: '2025-12-25T15:46:20.429989+00:00' + extraction_method: crawl4ai_link_rel + favicon_type: image/x-icon + favicon_sizes: '' + summary: + total_claims: 1 + has_primary_logo: false + has_favicon: true + has_og_image: false + favicon_count: 1 diff --git a/data/custodian/JP-13-CHU-L-SOL.yaml b/data/custodian/JP-13-CHU-L-SOL.yaml index a5dcc33106..1d8b5f8c77 100644 --- a/data/custodian/JP-13-CHU-L-SOL.yaml +++ b/data/custodian/JP-13-CHU-L-SOL.yaml @@ -32,13 +32,14 @@ ghcid: method: CH_ANNOTATOR_SOURCE ghcid_history: - ghcid: JP-13-CHU-L-SOL - valid_from: "2025-12-10T09:44:02Z" + valid_from: '2025-12-10T09:44:02Z' valid_to: null - reason: "Corrected region code from JP-TO (abbreviation) to JP-13 (Tokyo) per ISO 3166-2:JP" + reason: Corrected region code from JP-TO (abbreviation) to JP-13 (Tokyo) per ISO + 3166-2:JP - ghcid: JP-TO-CHU-L-SOL valid_from: null - valid_to: "2025-12-10T09:44:02Z" - reason: "Previous GHCID with incorrect region code" + valid_to: '2025-12-10T09:44:02Z' + reason: Previous GHCID with incorrect region code - ghcid: JP-TO-CHU-L-SOL ghcid_numeric: 5734815799153242372 valid_from: '2025-12-06T23:38:57.776064+00:00' @@ -96,8 +97,8 @@ ch_annotator: annotation_metadata: confidence_score: 0.98 verified: false - verification_date: - verified_by: + verification_date: null + verified_by: null entity_claims: - claim_type: full_name claim_value: Shochiku Otani Library @@ -151,3 +152,28 @@ location: geonames_id: 13353695 geonames_name: Chūō feature_code: PPLA2 +logo_enrichment: + enrichment_timestamp: '2025-12-25T12:45:01.704325+00:00' + source_url: http://www.shochiku.co.jp/shochiku-otani-toshokan + extraction_method: crawl4ai + claims: + - claim_type: favicon_url + claim_value: https://www.shochiku.co.jp/shochiku-otani-toshokan/wp-content/themes/otani2024/assets/images/favicon/apple-touch-icon-180x180.png + source_url: http://www.shochiku.co.jp/shochiku-otani-toshokan + css_selector: '[document] > html > head > link:nth-of-type(12)' + retrieved_on: '2025-12-25T12:45:01.704325+00:00' + extraction_method: crawl4ai_link_rel + favicon_type: '' + favicon_sizes: 180x180 + - claim_type: og_image_url + claim_value: https://www.shochiku.co.jp/shochiku-otani-toshokan/wp-content/themes/otani2024/images/ogp.png + source_url: http://www.shochiku.co.jp/shochiku-otani-toshokan + css_selector: '[document] > html > head > meta:nth-of-type(11)' + retrieved_on: '2025-12-25T12:45:01.704325+00:00' + extraction_method: crawl4ai_meta_og + summary: + total_claims: 2 + has_primary_logo: false + has_favicon: true + has_og_image: true + favicon_count: 3 diff --git a/data/custodian/JP-13-CHU-L-T.yaml b/data/custodian/JP-13-CHU-L-T.yaml index 1589effc6e..d122555485 100644 --- a/data/custodian/JP-13-CHU-L-T.yaml +++ b/data/custodian/JP-13-CHU-L-T.yaml @@ -152,3 +152,28 @@ location: geonames_id: 13353695 geonames_name: Chūō feature_code: PPLA2 +logo_enrichment: + enrichment_timestamp: '2025-12-25T12:45:11.533645+00:00' + source_url: http://www.toyokeizai.net + extraction_method: crawl4ai + claims: + - claim_type: favicon_url + claim_value: http://www.toyokeizai.net/apple-touch-icon.png?rd=202512040900 + source_url: http://www.toyokeizai.net + css_selector: '[document] > html > head > link:nth-of-type(21)' + retrieved_on: '2025-12-25T12:45:11.533645+00:00' + extraction_method: crawl4ai_link_rel + favicon_type: '' + favicon_sizes: '' + - claim_type: og_image_url + claim_value: https://toyokeizai.net/common/images/v5/common/tkollogo_130th.jpg + source_url: http://www.toyokeizai.net + css_selector: '[document] > html > head > meta:nth-of-type(12)' + retrieved_on: '2025-12-25T12:45:11.533645+00:00' + extraction_method: crawl4ai_meta_og + summary: + total_claims: 2 + has_primary_logo: false + has_favicon: true + has_og_image: true + favicon_count: 2 diff --git a/data/custodian/JP-13-CHU-M-AMIF.yaml b/data/custodian/JP-13-CHU-M-AMIF.yaml index 1cf1334f0e..115d24e878 100644 --- a/data/custodian/JP-13-CHU-M-AMIF.yaml +++ b/data/custodian/JP-13-CHU-M-AMIF.yaml @@ -326,3 +326,22 @@ wikidata_enrichment: commons_category: Artizon Museum commons_gallery: Artizon Museum wikidata_image: Bridgestone Museum.jpg +logo_enrichment: + enrichment_timestamp: '2025-12-25T12:45:21.521987+00:00' + source_url: https://www.artizon.museum + extraction_method: crawl4ai + claims: + - claim_type: favicon_url + claim_value: https://www.artizon.museum/wp-content/themes/artizon_jp/images/favicon.ico + source_url: https://www.artizon.museum + css_selector: '[document] > html.cc--darkmode.show--consent > head > link' + retrieved_on: '2025-12-25T12:45:21.521987+00:00' + extraction_method: crawl4ai_link_rel + favicon_type: '' + favicon_sizes: 32x32 + summary: + total_claims: 1 + has_primary_logo: false + has_favicon: true + has_og_image: false + favicon_count: 1 diff --git a/data/custodian/JP-13-CHU-M-NFAJ.yaml b/data/custodian/JP-13-CHU-M-NFAJ.yaml index 6014f86ba0..b105489435 100644 --- a/data/custodian/JP-13-CHU-M-NFAJ.yaml +++ b/data/custodian/JP-13-CHU-M-NFAJ.yaml @@ -296,3 +296,30 @@ wikidata_enrichment: image: MOMAT FilmCenter.jpg commons_category: National Film Archive of Japan wikidata_image: MOMAT FilmCenter.jpg +logo_enrichment: + enrichment_timestamp: '2025-12-25T13:55:35.159832+00:00' + source_url: https://www.nfaj.go.jp + extraction_method: crawl4ai + claims: + - claim_type: logo_url + claim_value: https://www.nfaj.go.jp/wp-content/uploads/nfajlogo.png + source_url: https://www.nfaj.go.jp + css_selector: '#header > div.logo > a > img' + retrieved_on: '2025-12-25T13:55:35.159832+00:00' + extraction_method: crawl4ai_header_logo + detection_confidence: high + alt_text: 国立映画アーカイブ National Film Archive of JAPAN + - claim_type: favicon_url + claim_value: https://www.nfaj.go.jp/wp-content/uploads/cropped-logo1-1.png + source_url: https://www.nfaj.go.jp + css_selector: '[document] > html > head > link:nth-of-type(16)' + retrieved_on: '2025-12-25T13:55:35.159832+00:00' + extraction_method: crawl4ai_link_rel + favicon_type: '' + favicon_sizes: 32x32 + summary: + total_claims: 2 + has_primary_logo: true + has_favicon: true + has_og_image: false + favicon_count: 1 diff --git a/data/custodian/JP-13-CHU-M-SMG.yaml b/data/custodian/JP-13-CHU-M-SMG.yaml index c59134360d..94940f8a6d 100644 --- a/data/custodian/JP-13-CHU-M-SMG.yaml +++ b/data/custodian/JP-13-CHU-M-SMG.yaml @@ -32,13 +32,14 @@ ghcid: method: CH_ANNOTATOR_SOURCE ghcid_history: - ghcid: JP-13-CHU-M-SMG - valid_from: "2025-12-10T09:44:02Z" + valid_from: '2025-12-10T09:44:02Z' valid_to: null - reason: "Corrected region code from JP-TO (abbreviation) to JP-13 (Tokyo) per ISO 3166-2:JP" + reason: Corrected region code from JP-TO (abbreviation) to JP-13 (Tokyo) per ISO + 3166-2:JP - ghcid: JP-TO-CHU-M-SMG valid_from: null - valid_to: "2025-12-10T09:44:02Z" - reason: "Previous GHCID with incorrect region code" + valid_to: '2025-12-10T09:44:02Z' + reason: Previous GHCID with incorrect region code - ghcid: JP-TO-CHU-M-SMG ghcid_numeric: 10445667631050794321 valid_from: '2025-12-06T23:38:32.997005+00:00' @@ -96,8 +97,8 @@ ch_annotator: annotation_metadata: confidence_score: 0.98 verified: false - verification_date: - verified_by: + verification_date: null + verified_by: null entity_claims: - claim_type: full_name claim_value: THE SEIKO MUSEUM GINZA @@ -151,3 +152,20 @@ location: geonames_id: 13353695 geonames_name: Chūō feature_code: PPLA2 +logo_enrichment: + enrichment_timestamp: '2025-12-25T13:55:42.427721+00:00' + source_url: https://museum.seiko.co.jp + extraction_method: crawl4ai + claims: + - claim_type: og_image_url + claim_value: https://museum.seiko.co.jp/common/img/ogp.jpg + source_url: https://museum.seiko.co.jp + css_selector: '[document] > html.webkit.chrome > head > meta:nth-of-type(11)' + retrieved_on: '2025-12-25T13:55:42.427721+00:00' + extraction_method: crawl4ai_meta_og + summary: + total_claims: 1 + has_primary_logo: false + has_favicon: false + has_og_image: true + favicon_count: 0 diff --git a/data/custodian/JP-13-EDO-L-AGJCL.yaml b/data/custodian/JP-13-EDO-L-AGJCL.yaml index 2d54152f2c..c4a5ea717f 100644 --- a/data/custodian/JP-13-EDO-L-AGJCL.yaml +++ b/data/custodian/JP-13-EDO-L-AGJCL.yaml @@ -37,13 +37,14 @@ ghcid: method: CH_ANNOTATOR_SOURCE ghcid_history: - ghcid: JP-13-EDO-L-AGJCL - valid_from: "2025-12-10T09:44:02Z" + valid_from: '2025-12-10T09:44:02Z' valid_to: null - reason: "Corrected region code from JP-TO (abbreviation) to JP-13 (Tokyo) per ISO 3166-2:JP" + reason: Corrected region code from JP-TO (abbreviation) to JP-13 (Tokyo) per ISO + 3166-2:JP - ghcid: JP-TO-EDO-L-AGJCL valid_from: null - valid_to: "2025-12-10T09:44:02Z" - reason: "Previous GHCID with incorrect region code" + valid_to: '2025-12-10T09:44:02Z' + reason: Previous GHCID with incorrect region code - ghcid: JP-TO-EDO-L-AGJCL ghcid_numeric: 8511444997913181785 valid_from: '2025-12-06T23:38:56.934641+00:00' @@ -101,8 +102,8 @@ ch_annotator: annotation_metadata: confidence_score: 0.98 verified: false - verification_date: - verified_by: + verification_date: null + verified_by: null entity_claims: - claim_type: full_name claim_value: Aikoku Gakuen Junior College Library @@ -204,3 +205,28 @@ location: geonames_id: 1907124 geonames_name: Edogawadai-higashi feature_code: PPL +logo_enrichment: + enrichment_timestamp: '2025-12-25T13:55:55.069181+00:00' + source_url: https://www.aikoku-jc.ac.jp/student/library + extraction_method: crawl4ai + claims: + - claim_type: favicon_url + claim_value: https://www.aikoku-jc.ac.jp/contents/wp-content/themes/aitan_re/image/apple-touch-icon.png + source_url: https://www.aikoku-jc.ac.jp/student/library + css_selector: '[document] > html > head > link:nth-of-type(4)' + retrieved_on: '2025-12-25T13:55:55.069181+00:00' + extraction_method: crawl4ai_link_rel + favicon_type: '' + favicon_sizes: '' + - claim_type: og_image_url + claim_value: https://www.aikoku-jc.ac.jp/contents/wp-content/themes/aitan_re/screenshot.jpg + source_url: https://www.aikoku-jc.ac.jp/student/library + css_selector: '[document] > html > head > meta:nth-of-type(13)' + retrieved_on: '2025-12-25T13:55:55.069181+00:00' + extraction_method: crawl4ai_meta_og + summary: + total_claims: 2 + has_primary_logo: false + has_favicon: true + has_og_image: true + favicon_count: 2 diff --git a/data/custodian/JP-13-EDO-L-ECCL.yaml b/data/custodian/JP-13-EDO-L-ECCL.yaml index 91608aac31..17f35a8732 100644 --- a/data/custodian/JP-13-EDO-L-ECCL.yaml +++ b/data/custodian/JP-13-EDO-L-ECCL.yaml @@ -37,13 +37,14 @@ ghcid: method: CH_ANNOTATOR_SOURCE ghcid_history: - ghcid: JP-13-EDO-L-ECCL - valid_from: "2025-12-10T09:44:02Z" + valid_from: '2025-12-10T09:44:02Z' valid_to: null - reason: "Corrected region code from JP-TO (abbreviation) to JP-13 (Tokyo) per ISO 3166-2:JP" + reason: Corrected region code from JP-TO (abbreviation) to JP-13 (Tokyo) per ISO + 3166-2:JP - ghcid: JP-TO-EDO-L-ECCL valid_from: null - valid_to: "2025-12-10T09:44:02Z" - reason: "Previous GHCID with incorrect region code" + valid_to: '2025-12-10T09:44:02Z' + reason: Previous GHCID with incorrect region code - ghcid: JP-TO-EDO-L-ECCL ghcid_numeric: 15426129734398471141 valid_from: '2025-12-06T23:38:43.599591+00:00' @@ -101,8 +102,8 @@ ch_annotator: annotation_metadata: confidence_score: 0.98 verified: false - verification_date: - verified_by: + verification_date: null + verified_by: null entity_claims: - claim_type: full_name claim_value: Edogawa City Central Library @@ -192,8 +193,9 @@ wikidata_enrichment: instance_of: &id004 - id: Q7075 label: library - description: institution charged with the care of a collection of literary, musical, artistic, or reference materials, - such as books, manuscripts, recordings, or films + description: institution charged with the care of a collection of literary, + musical, artistic, or reference materials, such as books, manuscripts, recordings, + or films wikidata_instance_of: *id004 wikidata_location: country: &id005 @@ -225,3 +227,23 @@ location: geonames_id: 1907124 geonames_name: Edogawadai-higashi feature_code: PPL +logo_enrichment: + enrichment_timestamp: '2025-12-25T13:56:06.495061+00:00' + source_url: https://www.library.city.edogawa.tokyo.jp/toshow/introduction/html/edg_chuo.php + extraction_method: crawl4ai + claims: + - claim_type: logo_url + claim_value: https://www.library.city.edogawa.tokyo.jp/images/common/logo.gif + source_url: https://www.library.city.edogawa.tokyo.jp/toshow/introduction/html/edg_chuo.php + css_selector: '[document] > html > body > header > div.block-header > h1 > a > + img' + retrieved_on: '2025-12-25T13:56:06.495061+00:00' + extraction_method: crawl4ai_header_logo + detection_confidence: high + alt_text: 江戸川区立図書館 + summary: + total_claims: 1 + has_primary_logo: true + has_favicon: false + has_og_image: false + favicon_count: 0 diff --git a/data/custodian/JP-13-EDO-L-ECHKL.yaml b/data/custodian/JP-13-EDO-L-ECHKL.yaml index 1939ee42e6..bd7154a1b0 100644 --- a/data/custodian/JP-13-EDO-L-ECHKL.yaml +++ b/data/custodian/JP-13-EDO-L-ECHKL.yaml @@ -205,3 +205,23 @@ wikidata_enrichment: wikidata_web: official_website: https://www.library.city.edogawa.tokyo.jp/TOSHOW/introduction/html/h_kasai.php wikidata_official_website: https://www.library.city.edogawa.tokyo.jp/TOSHOW/introduction/html/h_kasai.php +logo_enrichment: + enrichment_timestamp: '2025-12-25T13:56:16.135120+00:00' + source_url: https://www.library.city.edogawa.tokyo.jp/toshow/introduction/html/edg_h_kasai.php + extraction_method: crawl4ai + claims: + - claim_type: logo_url + claim_value: https://www.library.city.edogawa.tokyo.jp/images/common/logo.gif + source_url: https://www.library.city.edogawa.tokyo.jp/toshow/introduction/html/edg_h_kasai.php + css_selector: '[document] > html > body > header > div.block-header > h1 > a > + img' + retrieved_on: '2025-12-25T13:56:16.135120+00:00' + extraction_method: crawl4ai_header_logo + detection_confidence: high + alt_text: 江戸川区立図書館 + summary: + total_claims: 1 + has_primary_logo: true + has_favicon: false + has_og_image: false + favicon_count: 0 diff --git a/data/custodian/JP-13-EDO-L-ECKL-edogawa_city_kasai_library.yaml b/data/custodian/JP-13-EDO-L-ECKL-edogawa_city_kasai_library.yaml index 1f98e9bf03..923589e79a 100644 --- a/data/custodian/JP-13-EDO-L-ECKL-edogawa_city_kasai_library.yaml +++ b/data/custodian/JP-13-EDO-L-ECKL-edogawa_city_kasai_library.yaml @@ -205,3 +205,23 @@ wikidata_enrichment: wikidata_web: official_website: https://www.library.city.edogawa.tokyo.jp/TOSHOW/introduction/html/kasai.php wikidata_official_website: https://www.library.city.edogawa.tokyo.jp/TOSHOW/introduction/html/kasai.php +logo_enrichment: + enrichment_timestamp: '2025-12-25T13:56:26.276203+00:00' + source_url: https://www.library.city.edogawa.tokyo.jp/toshow/introduction/html/edg_kasai.php + extraction_method: crawl4ai + claims: + - claim_type: logo_url + claim_value: https://www.library.city.edogawa.tokyo.jp/images/common/logo.gif + source_url: https://www.library.city.edogawa.tokyo.jp/toshow/introduction/html/edg_kasai.php + css_selector: '[document] > html > body > header > div.block-header > h1 > a > + img' + retrieved_on: '2025-12-25T13:56:26.276203+00:00' + extraction_method: crawl4ai_header_logo + detection_confidence: high + alt_text: 江戸川区立図書館 + summary: + total_claims: 1 + has_primary_logo: true + has_favicon: false + has_og_image: false + favicon_count: 0 diff --git a/data/custodian/JP-13-EDO-L-ECKL-edogawa_city_komatsugawa_library.yaml b/data/custodian/JP-13-EDO-L-ECKL-edogawa_city_komatsugawa_library.yaml index 9f8576bd45..f6e0861b2f 100644 --- a/data/custodian/JP-13-EDO-L-ECKL-edogawa_city_komatsugawa_library.yaml +++ b/data/custodian/JP-13-EDO-L-ECKL-edogawa_city_komatsugawa_library.yaml @@ -205,3 +205,23 @@ wikidata_enrichment: wikidata_web: official_website: https://www.library.city.edogawa.tokyo.jp/TOSHOW/introduction/html/komatsu.php wikidata_official_website: https://www.library.city.edogawa.tokyo.jp/TOSHOW/introduction/html/komatsu.php +logo_enrichment: + enrichment_timestamp: '2025-12-25T13:56:36.248575+00:00' + source_url: https://www.library.city.edogawa.tokyo.jp/toshow/introduction/html/edg_komatsu.php + extraction_method: crawl4ai + claims: + - claim_type: logo_url + claim_value: https://www.library.city.edogawa.tokyo.jp/images/common/logo.gif + source_url: https://www.library.city.edogawa.tokyo.jp/toshow/introduction/html/edg_komatsu.php + css_selector: '[document] > html > body > header > div.block-header > h1 > a > + img' + retrieved_on: '2025-12-25T13:56:36.248575+00:00' + extraction_method: crawl4ai_header_logo + detection_confidence: high + alt_text: 江戸川区立図書館 + summary: + total_claims: 1 + has_primary_logo: true + has_favicon: false + has_og_image: false + favicon_count: 0 diff --git a/data/custodian/JP-13-EDO-L-ECKL.yaml b/data/custodian/JP-13-EDO-L-ECKL.yaml index 536f5175ea..17959f1d10 100644 --- a/data/custodian/JP-13-EDO-L-ECKL.yaml +++ b/data/custodian/JP-13-EDO-L-ECKL.yaml @@ -212,3 +212,23 @@ wikidata_enrichment: wikidata_web: official_website: https://www.library.city.edogawa.tokyo.jp/toshow/introduction/html/koiwa.php wikidata_official_website: https://www.library.city.edogawa.tokyo.jp/toshow/introduction/html/koiwa.php +logo_enrichment: + enrichment_timestamp: '2025-12-25T13:56:46.131530+00:00' + source_url: https://www.library.city.edogawa.tokyo.jp/toshow/introduction/html/edg_koiwa.php + extraction_method: crawl4ai + claims: + - claim_type: logo_url + claim_value: https://www.library.city.edogawa.tokyo.jp/images/common/logo.gif + source_url: https://www.library.city.edogawa.tokyo.jp/toshow/introduction/html/edg_koiwa.php + css_selector: '[document] > html > body > header > div.block-header > h1 > a > + img' + retrieved_on: '2025-12-25T13:56:46.131530+00:00' + extraction_method: crawl4ai_header_logo + detection_confidence: high + alt_text: 江戸川区立図書館 + summary: + total_claims: 1 + has_primary_logo: true + has_favicon: false + has_og_image: false + favicon_count: 0 diff --git a/data/custodian/JP-13-EDO-L-ECML.yaml b/data/custodian/JP-13-EDO-L-ECML.yaml index 23340f6aec..e44b76fbbc 100644 --- a/data/custodian/JP-13-EDO-L-ECML.yaml +++ b/data/custodian/JP-13-EDO-L-ECML.yaml @@ -205,3 +205,23 @@ wikidata_enrichment: wikidata_web: official_website: https://www.library.city.edogawa.tokyo.jp/TOSHOW/introduction/html/matsue.php wikidata_official_website: https://www.library.city.edogawa.tokyo.jp/TOSHOW/introduction/html/matsue.php +logo_enrichment: + enrichment_timestamp: '2025-12-25T13:56:56.467101+00:00' + source_url: https://www.library.city.edogawa.tokyo.jp/toshow/introduction/html/edg_matsue.php + extraction_method: crawl4ai + claims: + - claim_type: logo_url + claim_value: https://www.library.city.edogawa.tokyo.jp/images/common/logo.gif + source_url: https://www.library.city.edogawa.tokyo.jp/toshow/introduction/html/edg_matsue.php + css_selector: '[document] > html > body > header > div.block-header > h1 > a > + img' + retrieved_on: '2025-12-25T13:56:56.467101+00:00' + extraction_method: crawl4ai_header_logo + detection_confidence: high + alt_text: 江戸川区立図書館 + summary: + total_claims: 1 + has_primary_logo: true + has_favicon: false + has_og_image: false + favicon_count: 0 diff --git a/data/custodian/JP-13-EDO-L-ECNKL.yaml b/data/custodian/JP-13-EDO-L-ECNKL.yaml index 1fbc7d1b61..e5ff276a9c 100644 --- a/data/custodian/JP-13-EDO-L-ECNKL.yaml +++ b/data/custodian/JP-13-EDO-L-ECNKL.yaml @@ -205,3 +205,23 @@ wikidata_enrichment: wikidata_web: official_website: https://www.library.city.edogawa.tokyo.jp/TOSHOW/introduction/html/n_kasai.php wikidata_official_website: https://www.library.city.edogawa.tokyo.jp/TOSHOW/introduction/html/n_kasai.php +logo_enrichment: + enrichment_timestamp: '2025-12-25T13:57:07.187504+00:00' + source_url: https://www.library.city.edogawa.tokyo.jp/toshow/introduction/html/edg_n_kasai.php + extraction_method: crawl4ai + claims: + - claim_type: logo_url + claim_value: https://www.library.city.edogawa.tokyo.jp/images/common/logo.gif + source_url: https://www.library.city.edogawa.tokyo.jp/toshow/introduction/html/edg_n_kasai.php + css_selector: '[document] > html > body > header > div.block-header > h1 > a > + img' + retrieved_on: '2025-12-25T13:57:07.187504+00:00' + extraction_method: crawl4ai_header_logo + detection_confidence: high + alt_text: 江戸川区立図書館 + summary: + total_claims: 1 + has_primary_logo: true + has_favicon: false + has_og_image: false + favicon_count: 0 diff --git a/data/custodian/JP-13-EDO-L-ECSCL.yaml b/data/custodian/JP-13-EDO-L-ECSCL.yaml index 79467d59af..dd482d25ee 100644 --- a/data/custodian/JP-13-EDO-L-ECSCL.yaml +++ b/data/custodian/JP-13-EDO-L-ECSCL.yaml @@ -205,3 +205,23 @@ wikidata_enrichment: wikidata_web: official_website: https://www.library.city.edogawa.tokyo.jp/TOSHOW/introduction/html/seishin.php wikidata_official_website: https://www.library.city.edogawa.tokyo.jp/TOSHOW/introduction/html/seishin.php +logo_enrichment: + enrichment_timestamp: '2025-12-25T13:57:17.467467+00:00' + source_url: https://www.library.city.edogawa.tokyo.jp/toshow/introduction/html/edg_seishin.php + extraction_method: crawl4ai + claims: + - claim_type: logo_url + claim_value: https://www.library.city.edogawa.tokyo.jp/images/common/logo.gif + source_url: https://www.library.city.edogawa.tokyo.jp/toshow/introduction/html/edg_seishin.php + css_selector: '[document] > html > body > header > div.block-header > h1 > a > + img' + retrieved_on: '2025-12-25T13:57:17.467467+00:00' + extraction_method: crawl4ai_header_logo + detection_confidence: high + alt_text: 江戸川区立図書館 + summary: + total_claims: 1 + has_primary_logo: true + has_favicon: false + has_og_image: false + favicon_count: 0 diff --git a/data/custodian/JP-13-EDO-L-ECSL.yaml b/data/custodian/JP-13-EDO-L-ECSL.yaml index 2b03eac366..6fd4884cfe 100644 --- a/data/custodian/JP-13-EDO-L-ECSL.yaml +++ b/data/custodian/JP-13-EDO-L-ECSL.yaml @@ -205,3 +205,23 @@ wikidata_enrichment: wikidata_web: official_website: http://www.shinozaki-bunkaplaza.com/library/ wikidata_official_website: http://www.shinozaki-bunkaplaza.com/library/ +logo_enrichment: + enrichment_timestamp: '2025-12-25T13:57:28.209619+00:00' + source_url: https://www.library.city.edogawa.tokyo.jp/toshow/introduction/html/edg_shino.php + extraction_method: crawl4ai + claims: + - claim_type: logo_url + claim_value: https://www.library.city.edogawa.tokyo.jp/images/common/logo.gif + source_url: https://www.library.city.edogawa.tokyo.jp/toshow/introduction/html/edg_shino.php + css_selector: '[document] > html > body > header > div.block-header > h1 > a > + img' + retrieved_on: '2025-12-25T13:57:28.209619+00:00' + extraction_method: crawl4ai_header_logo + detection_confidence: high + alt_text: 江戸川区立図書館 + summary: + total_claims: 1 + has_primary_logo: true + has_favicon: false + has_og_image: false + favicon_count: 0 diff --git a/data/custodian/JP-13-EDO-L-ECTL.yaml b/data/custodian/JP-13-EDO-L-ECTL.yaml index c88aaba67b..f5e98d6771 100644 --- a/data/custodian/JP-13-EDO-L-ECTL.yaml +++ b/data/custodian/JP-13-EDO-L-ECTL.yaml @@ -205,3 +205,23 @@ wikidata_enrichment: wikidata_web: official_website: https://www.library.city.edogawa.tokyo.jp/TOSHOW/introduction/html/tobu.php wikidata_official_website: https://www.library.city.edogawa.tokyo.jp/TOSHOW/introduction/html/tobu.php +logo_enrichment: + enrichment_timestamp: '2025-12-25T13:57:48.438298+00:00' + source_url: https://www.library.city.edogawa.tokyo.jp/toshow/introduction/html/edg_tobu.php + extraction_method: crawl4ai + claims: + - claim_type: logo_url + claim_value: https://www.library.city.edogawa.tokyo.jp/images/common/logo.gif + source_url: https://www.library.city.edogawa.tokyo.jp/toshow/introduction/html/edg_tobu.php + css_selector: '[document] > html > body > header > div.block-header > h1 > a > + img' + retrieved_on: '2025-12-25T13:57:48.438298+00:00' + extraction_method: crawl4ai_header_logo + detection_confidence: high + alt_text: 江戸川区立図書館 + summary: + total_claims: 1 + has_primary_logo: true + has_favicon: false + has_og_image: false + favicon_count: 0 diff --git a/data/custodian/JP-13-EDO-L-EL.yaml b/data/custodian/JP-13-EDO-L-EL.yaml index 19a3b47f33..36cc7c7b06 100644 --- a/data/custodian/JP-13-EDO-L-EL.yaml +++ b/data/custodian/JP-13-EDO-L-EL.yaml @@ -205,3 +205,23 @@ wikidata_enrichment: wikidata_web: official_website: https://www.library.city.edogawa.tokyo.jp/TOSHOW/introduction/html/shishi.php wikidata_official_website: https://www.library.city.edogawa.tokyo.jp/TOSHOW/introduction/html/shishi.php +logo_enrichment: + enrichment_timestamp: '2025-12-25T13:57:57.865530+00:00' + source_url: https://www.library.city.edogawa.tokyo.jp/toshow/introduction/html/edg_shishi.php + extraction_method: crawl4ai + claims: + - claim_type: logo_url + claim_value: https://www.library.city.edogawa.tokyo.jp/images/common/logo.gif + source_url: https://www.library.city.edogawa.tokyo.jp/toshow/introduction/html/edg_shishi.php + css_selector: '[document] > html > body > header > div.block-header > h1 > a > + img' + retrieved_on: '2025-12-25T13:57:57.865530+00:00' + extraction_method: crawl4ai_header_logo + detection_confidence: high + alt_text: 江戸川区立図書館 + summary: + total_claims: 1 + has_primary_logo: true + has_favicon: false + has_og_image: false + favicon_count: 0 diff --git a/data/custodian/JP-13-EDO-L-TCWL.yaml b/data/custodian/JP-13-EDO-L-TCWL.yaml index 88ad13a5f3..f993b2d556 100644 --- a/data/custodian/JP-13-EDO-L-TCWL.yaml +++ b/data/custodian/JP-13-EDO-L-TCWL.yaml @@ -157,3 +157,20 @@ location: geonames_id: 1907124 geonames_name: Edogawadai-higashi feature_code: PPL +logo_enrichment: + enrichment_timestamp: '2025-12-25T13:58:19.011490+00:00' + source_url: https://www.tcw.ac.jp + extraction_method: crawl4ai + claims: + - claim_type: og_image_url + claim_value: https://www.tcw.ac.jp/wp-content/uploads/2024/12/TOP2026.jpg + source_url: https://www.tcw.ac.jp + css_selector: '[document] > html > head > meta:nth-of-type(8)' + retrieved_on: '2025-12-25T13:58:19.011490+00:00' + extraction_method: crawl4ai_meta_og + summary: + total_claims: 1 + has_primary_logo: false + has_favicon: false + has_og_image: true + favicon_count: 0 diff --git a/data/custodian/JP-13-EDO-M-MM.yaml b/data/custodian/JP-13-EDO-M-MM.yaml index e265d8f8d9..abe7241673 100644 --- a/data/custodian/JP-13-EDO-M-MM.yaml +++ b/data/custodian/JP-13-EDO-M-MM.yaml @@ -359,3 +359,32 @@ youtube_enrichment: comments: [] thumbnail_url: https://i.ytimg.com/vi/Am3a8LqzHbw/hqdefault.jpg status: SUCCESS +logo_enrichment: + enrichment_timestamp: '2025-12-25T14:01:22.469144+00:00' + source_url: https://www.chikahaku.jp + extraction_method: crawl4ai + claims: + - claim_type: logo_url + claim_value: https://www.chikahaku.jp/images/logo-01a_v2.svg + source_url: https://www.chikahaku.jp + css_selector: '#top > div.wrapper > header > section.header-sp.fixed-top > div.container-fluid.global-link + > div.row.justify-content-between > div.col-6 > a > img.img-fluid.w-75' + retrieved_on: '2025-12-25T14:01:22.469144+00:00' + extraction_method: crawl4ai_header_logo + detection_confidence: high + alt_text: '' + - claim_type: favicon_url + claim_value: https://www.chikahaku.jp/images/apple-icon-180x180.png + source_url: https://www.chikahaku.jp + css_selector: '[document] > html.fontawesome-i2svg-active.fontawesome-i2svg-complete + > head > link:nth-of-type(2)' + retrieved_on: '2025-12-25T14:01:22.469144+00:00' + extraction_method: crawl4ai_link_rel + favicon_type: '' + favicon_sizes: 180x180 + summary: + total_claims: 2 + has_primary_logo: true + has_favicon: true + has_og_image: false + favicon_count: 2 diff --git a/data/custodian/JP-13-ETO-L-TPUHSL.yaml b/data/custodian/JP-13-ETO-L-TPUHSL.yaml index 8e914fe6ea..2c712b1b5a 100644 --- a/data/custodian/JP-13-ETO-L-TPUHSL.yaml +++ b/data/custodian/JP-13-ETO-L-TPUHSL.yaml @@ -37,13 +37,14 @@ ghcid: method: CH_ANNOTATOR_SOURCE ghcid_history: - ghcid: JP-13-ETO-L-TPUHSL - valid_from: "2025-12-10T09:44:02Z" + valid_from: '2025-12-10T09:44:02Z' valid_to: null - reason: "Corrected region code from JP-TO (abbreviation) to JP-13 (Tokyo) per ISO 3166-2:JP" + reason: Corrected region code from JP-TO (abbreviation) to JP-13 (Tokyo) per ISO + 3166-2:JP - ghcid: JP-TO-ETO-L-TPUHSL valid_from: null - valid_to: "2025-12-10T09:44:02Z" - reason: "Previous GHCID with incorrect region code" + valid_to: '2025-12-10T09:44:02Z' + reason: Previous GHCID with incorrect region code - ghcid: JP-TO-ETO-L-TPUHSL ghcid_numeric: 7835861160977250323 valid_from: '2025-12-06T23:38:59.908091+00:00' @@ -101,8 +102,8 @@ ch_annotator: annotation_metadata: confidence_score: 0.98 verified: false - verification_date: - verified_by: + verification_date: null + verified_by: null entity_claims: - claim_type: full_name claim_value: Tokyo Professional University of Health Sciences Library @@ -182,7 +183,8 @@ wikidata_enrichment: part_of: id: Q97162036 label: Tokyo Professional University of Health Sciences - description: professional and vocational university in Kōtō Ward, Tōkyō Metropolis, Japan + description: professional and vocational university in Kōtō Ward, Tōkyō Metropolis, + Japan wikidata_web: official_website: https://lib-tpu.opac.jp/opac/Top wikidata_official_website: https://lib-tpu.opac.jp/opac/Top @@ -204,3 +206,28 @@ location: geonames_id: 1852663 geonames_name: Seto feature_code: PPLA2 +logo_enrichment: + enrichment_timestamp: '2025-12-25T14:01:40.304002+00:00' + source_url: https://lib-tpu.opac.jp/opac/Top + extraction_method: crawl4ai + claims: + - claim_type: favicon_url + claim_value: https://lib-tpu.opac.jp/common/images/op4-favicon.ico + source_url: https://lib-tpu.opac.jp/opac/Top + css_selector: '[document] > html > head > link' + retrieved_on: '2025-12-25T14:01:40.304002+00:00' + extraction_method: crawl4ai_link_rel + favicon_type: image/vnd.microsoft.icon + favicon_sizes: '' + - claim_type: og_image_url + claim_value: https://lib-tpu.opac.jp/common/images/ogp-image.jpg + source_url: https://lib-tpu.opac.jp/opac/Top + css_selector: '[document] > html > head > meta:nth-of-type(12)' + retrieved_on: '2025-12-25T14:01:40.304002+00:00' + extraction_method: crawl4ai_meta_og + summary: + total_claims: 2 + has_primary_logo: false + has_favicon: true + has_og_image: true + favicon_count: 1 diff --git a/data/custodian/JP-13-FUC-L-FL-fuchushiritsukatamachi_library.yaml b/data/custodian/JP-13-FUC-L-FL-fuchushiritsukatamachi_library.yaml index ca6fec0f63..8a93ef3045 100644 --- a/data/custodian/JP-13-FUC-L-FL-fuchushiritsukatamachi_library.yaml +++ b/data/custodian/JP-13-FUC-L-FL-fuchushiritsukatamachi_library.yaml @@ -205,3 +205,30 @@ wikidata_enrichment: wikidata_web: official_website: http://library.city.fuchu.tokyo.jp/about/map11.html wikidata_official_website: http://library.city.fuchu.tokyo.jp/about/map11.html +logo_enrichment: + enrichment_timestamp: '2025-12-25T14:02:17.698885+00:00' + source_url: https://library.city.fuchu.tokyo.jp/lib_info/katamachi.html + extraction_method: crawl4ai + claims: + - claim_type: logo_url + claim_value: https://library.city.fuchu.tokyo.jp/themes/lib_theme/images/logo.png + source_url: https://library.city.fuchu.tokyo.jp/lib_info/katamachi.html + css_selector: '#header_logo > a.active > img' + retrieved_on: '2025-12-25T14:02:17.698885+00:00' + extraction_method: crawl4ai_header_logo + detection_confidence: high + alt_text: 府中市立図書館 + - claim_type: favicon_url + claim_value: https://library.city.fuchu.tokyo.jp/themes/lib_theme/favicon.ico + source_url: https://library.city.fuchu.tokyo.jp/lib_info/katamachi.html + css_selector: '[document] > html > head.notranslate > link' + retrieved_on: '2025-12-25T14:02:17.698885+00:00' + extraction_method: crawl4ai_link_rel + favicon_type: '' + favicon_sizes: '' + summary: + total_claims: 2 + has_primary_logo: true + has_favicon: true + has_og_image: false + favicon_count: 1 diff --git a/data/custodian/JP-13-FUC-L-FL-fuchushiritsukoremasa_library.yaml b/data/custodian/JP-13-FUC-L-FL-fuchushiritsukoremasa_library.yaml index 8858252c36..e8839188a0 100644 --- a/data/custodian/JP-13-FUC-L-FL-fuchushiritsukoremasa_library.yaml +++ b/data/custodian/JP-13-FUC-L-FL-fuchushiritsukoremasa_library.yaml @@ -205,3 +205,30 @@ wikidata_enrichment: wikidata_web: official_website: http://library.city.fuchu.tokyo.jp/about/map07.html wikidata_official_website: http://library.city.fuchu.tokyo.jp/about/map07.html +logo_enrichment: + enrichment_timestamp: '2025-12-25T14:02:28.813880+00:00' + source_url: https://library.city.fuchu.tokyo.jp/lib_info/koremasa.html + extraction_method: crawl4ai + claims: + - claim_type: logo_url + claim_value: https://library.city.fuchu.tokyo.jp/themes/lib_theme/images/logo.png + source_url: https://library.city.fuchu.tokyo.jp/lib_info/koremasa.html + css_selector: '#header_logo > a.active > img' + retrieved_on: '2025-12-25T14:02:28.813880+00:00' + extraction_method: crawl4ai_header_logo + detection_confidence: high + alt_text: 府中市立図書館 + - claim_type: favicon_url + claim_value: https://library.city.fuchu.tokyo.jp/themes/lib_theme/favicon.ico + source_url: https://library.city.fuchu.tokyo.jp/lib_info/koremasa.html + css_selector: '[document] > html > head.notranslate > link' + retrieved_on: '2025-12-25T14:02:28.813880+00:00' + extraction_method: crawl4ai_link_rel + favicon_type: '' + favicon_sizes: '' + summary: + total_claims: 2 + has_primary_logo: true + has_favicon: true + has_og_image: false + favicon_count: 1 diff --git a/data/custodian/JP-13-FUC-L-FL-fuchushiritsumiyamachi_library.yaml b/data/custodian/JP-13-FUC-L-FL-fuchushiritsumiyamachi_library.yaml index 1adafa3ac2..5a5e422752 100644 --- a/data/custodian/JP-13-FUC-L-FL-fuchushiritsumiyamachi_library.yaml +++ b/data/custodian/JP-13-FUC-L-FL-fuchushiritsumiyamachi_library.yaml @@ -205,3 +205,30 @@ wikidata_enrichment: wikidata_web: official_website: http://library.city.fuchu.tokyo.jp/about/map12.html wikidata_official_website: http://library.city.fuchu.tokyo.jp/about/map12.html +logo_enrichment: + enrichment_timestamp: '2025-12-25T14:02:39.848691+00:00' + source_url: https://library.city.fuchu.tokyo.jp/lib_info/miyamachi.html + extraction_method: crawl4ai + claims: + - claim_type: logo_url + claim_value: https://library.city.fuchu.tokyo.jp/themes/lib_theme/images/logo.png + source_url: https://library.city.fuchu.tokyo.jp/lib_info/miyamachi.html + css_selector: '#header_logo > a.active > img' + retrieved_on: '2025-12-25T14:02:39.848691+00:00' + extraction_method: crawl4ai_header_logo + detection_confidence: high + alt_text: 府中市立図書館 + - claim_type: favicon_url + claim_value: https://library.city.fuchu.tokyo.jp/themes/lib_theme/favicon.ico + source_url: https://library.city.fuchu.tokyo.jp/lib_info/miyamachi.html + css_selector: '[document] > html > head.notranslate > link' + retrieved_on: '2025-12-25T14:02:39.848691+00:00' + extraction_method: crawl4ai_link_rel + favicon_type: '' + favicon_sizes: '' + summary: + total_claims: 2 + has_primary_logo: true + has_favicon: true + has_og_image: false + favicon_count: 1 diff --git a/data/custodian/JP-13-FUC-L-FL-fuchushiritsumomijigaoka_library.yaml b/data/custodian/JP-13-FUC-L-FL-fuchushiritsumomijigaoka_library.yaml index d8f485a8f6..bac730849a 100644 --- a/data/custodian/JP-13-FUC-L-FL-fuchushiritsumomijigaoka_library.yaml +++ b/data/custodian/JP-13-FUC-L-FL-fuchushiritsumomijigaoka_library.yaml @@ -205,3 +205,30 @@ wikidata_enrichment: wikidata_web: official_website: http://library.city.fuchu.tokyo.jp/about/map08.html wikidata_official_website: http://library.city.fuchu.tokyo.jp/about/map08.html +logo_enrichment: + enrichment_timestamp: '2025-12-25T14:02:49.647654+00:00' + source_url: https://library.city.fuchu.tokyo.jp/lib_info/momijigaoka.html + extraction_method: crawl4ai + claims: + - claim_type: logo_url + claim_value: https://library.city.fuchu.tokyo.jp/themes/lib_theme/images/logo.png + source_url: https://library.city.fuchu.tokyo.jp/lib_info/momijigaoka.html + css_selector: '#header_logo > a.active > img' + retrieved_on: '2025-12-25T14:02:49.647654+00:00' + extraction_method: crawl4ai_header_logo + detection_confidence: high + alt_text: 府中市立図書館 + - claim_type: favicon_url + claim_value: https://library.city.fuchu.tokyo.jp/themes/lib_theme/favicon.ico + source_url: https://library.city.fuchu.tokyo.jp/lib_info/momijigaoka.html + css_selector: '[document] > html > head.notranslate > link' + retrieved_on: '2025-12-25T14:02:49.647654+00:00' + extraction_method: crawl4ai_link_rel + favicon_type: '' + favicon_sizes: '' + summary: + total_claims: 2 + has_primary_logo: true + has_favicon: true + has_og_image: false + favicon_count: 1 diff --git a/data/custodian/JP-13-FUC-L-FL-fuchushiritsumusashidai_library.yaml b/data/custodian/JP-13-FUC-L-FL-fuchushiritsumusashidai_library.yaml index 236cc1c589..091be14dff 100644 --- a/data/custodian/JP-13-FUC-L-FL-fuchushiritsumusashidai_library.yaml +++ b/data/custodian/JP-13-FUC-L-FL-fuchushiritsumusashidai_library.yaml @@ -205,3 +205,30 @@ wikidata_enrichment: wikidata_web: official_website: http://library.city.fuchu.tokyo.jp/about/map04.html wikidata_official_website: http://library.city.fuchu.tokyo.jp/about/map04.html +logo_enrichment: + enrichment_timestamp: '2025-12-25T14:03:00.895034+00:00' + source_url: https://library.city.fuchu.tokyo.jp/lib_info/musashidai.html + extraction_method: crawl4ai + claims: + - claim_type: logo_url + claim_value: https://library.city.fuchu.tokyo.jp/themes/lib_theme/images/logo.png + source_url: https://library.city.fuchu.tokyo.jp/lib_info/musashidai.html + css_selector: '#header_logo > a.active > img' + retrieved_on: '2025-12-25T14:03:00.895034+00:00' + extraction_method: crawl4ai_header_logo + detection_confidence: high + alt_text: 府中市立図書館 + - claim_type: favicon_url + claim_value: https://library.city.fuchu.tokyo.jp/themes/lib_theme/favicon.ico + source_url: https://library.city.fuchu.tokyo.jp/lib_info/musashidai.html + css_selector: '[document] > html > head.notranslate > link' + retrieved_on: '2025-12-25T14:03:00.895034+00:00' + extraction_method: crawl4ai_link_rel + favicon_type: '' + favicon_sizes: '' + summary: + total_claims: 2 + has_primary_logo: true + has_favicon: true + has_og_image: false + favicon_count: 1 diff --git a/data/custodian/JP-13-FUC-L-FL-fuchushiritsunishifu_library.yaml b/data/custodian/JP-13-FUC-L-FL-fuchushiritsunishifu_library.yaml index fa53022bbf..460f96c796 100644 --- a/data/custodian/JP-13-FUC-L-FL-fuchushiritsunishifu_library.yaml +++ b/data/custodian/JP-13-FUC-L-FL-fuchushiritsunishifu_library.yaml @@ -205,3 +205,30 @@ wikidata_enrichment: wikidata_web: official_website: http://library.city.fuchu.tokyo.jp/about/map03.html wikidata_official_website: http://library.city.fuchu.tokyo.jp/about/map03.html +logo_enrichment: + enrichment_timestamp: '2025-12-25T14:03:11.066954+00:00' + source_url: https://library.city.fuchu.tokyo.jp/lib_info/nishifu.html + extraction_method: crawl4ai + claims: + - claim_type: logo_url + claim_value: https://library.city.fuchu.tokyo.jp/themes/lib_theme/images/logo.png + source_url: https://library.city.fuchu.tokyo.jp/lib_info/nishifu.html + css_selector: '#header_logo > a.active > img' + retrieved_on: '2025-12-25T14:03:11.066954+00:00' + extraction_method: crawl4ai_header_logo + detection_confidence: high + alt_text: 府中市立図書館 + - claim_type: favicon_url + claim_value: https://library.city.fuchu.tokyo.jp/themes/lib_theme/favicon.ico + source_url: https://library.city.fuchu.tokyo.jp/lib_info/nishifu.html + css_selector: '[document] > html > head.notranslate > link' + retrieved_on: '2025-12-25T14:03:11.066954+00:00' + extraction_method: crawl4ai_link_rel + favicon_type: '' + favicon_sizes: '' + summary: + total_claims: 2 + has_primary_logo: true + has_favicon: true + has_og_image: false + favicon_count: 1 diff --git a/data/custodian/JP-13-FUC-L-FL-fuchushiritsuoshitate_library.yaml b/data/custodian/JP-13-FUC-L-FL-fuchushiritsuoshitate_library.yaml index 55b91bb758..93f4f8b78c 100644 --- a/data/custodian/JP-13-FUC-L-FL-fuchushiritsuoshitate_library.yaml +++ b/data/custodian/JP-13-FUC-L-FL-fuchushiritsuoshitate_library.yaml @@ -205,3 +205,30 @@ wikidata_enrichment: wikidata_web: official_website: http://library.city.fuchu.tokyo.jp/about/map10.html wikidata_official_website: http://library.city.fuchu.tokyo.jp/about/map10.html +logo_enrichment: + enrichment_timestamp: '2025-12-25T14:03:22.606545+00:00' + source_url: https://library.city.fuchu.tokyo.jp/lib_info/oshitate.html + extraction_method: crawl4ai + claims: + - claim_type: logo_url + claim_value: https://library.city.fuchu.tokyo.jp/themes/lib_theme/images/logo.png + source_url: https://library.city.fuchu.tokyo.jp/lib_info/oshitate.html + css_selector: '#header_logo > a.active > img' + retrieved_on: '2025-12-25T14:03:22.606545+00:00' + extraction_method: crawl4ai_header_logo + detection_confidence: high + alt_text: 府中市立図書館 + - claim_type: favicon_url + claim_value: https://library.city.fuchu.tokyo.jp/themes/lib_theme/favicon.ico + source_url: https://library.city.fuchu.tokyo.jp/lib_info/oshitate.html + css_selector: '[document] > html > head.notranslate > link' + retrieved_on: '2025-12-25T14:03:22.606545+00:00' + extraction_method: crawl4ai_link_rel + favicon_type: '' + favicon_sizes: '' + summary: + total_claims: 2 + has_primary_logo: true + has_favicon: true + has_og_image: false + favicon_count: 1 diff --git a/data/custodian/JP-13-FUC-L-FL-fuchushiritsushimmachi_library.yaml b/data/custodian/JP-13-FUC-L-FL-fuchushiritsushimmachi_library.yaml index 8e3f6b496c..db688a2e0e 100644 --- a/data/custodian/JP-13-FUC-L-FL-fuchushiritsushimmachi_library.yaml +++ b/data/custodian/JP-13-FUC-L-FL-fuchushiritsushimmachi_library.yaml @@ -205,3 +205,30 @@ wikidata_enrichment: wikidata_web: official_website: http://library.city.fuchu.tokyo.jp/about/map05.html wikidata_official_website: http://library.city.fuchu.tokyo.jp/about/map05.html +logo_enrichment: + enrichment_timestamp: '2025-12-25T14:03:34.721855+00:00' + source_url: https://library.city.fuchu.tokyo.jp/lib_info/sinmachi.html + extraction_method: crawl4ai + claims: + - claim_type: logo_url + claim_value: https://library.city.fuchu.tokyo.jp/themes/lib_theme/images/logo.png + source_url: https://library.city.fuchu.tokyo.jp/lib_info/sinmachi.html + css_selector: '#header_logo > a.active > img' + retrieved_on: '2025-12-25T14:03:34.721855+00:00' + extraction_method: crawl4ai_header_logo + detection_confidence: high + alt_text: 府中市立図書館 + - claim_type: favicon_url + claim_value: https://library.city.fuchu.tokyo.jp/themes/lib_theme/favicon.ico + source_url: https://library.city.fuchu.tokyo.jp/lib_info/sinmachi.html + css_selector: '[document] > html > head.notranslate > link' + retrieved_on: '2025-12-25T14:03:34.721855+00:00' + extraction_method: crawl4ai_link_rel + favicon_type: '' + favicon_sizes: '' + summary: + total_claims: 2 + has_primary_logo: true + has_favicon: true + has_og_image: false + favicon_count: 1 diff --git a/data/custodian/JP-13-FUC-L-FL-fuchushiritsushiraitodai_library.yaml b/data/custodian/JP-13-FUC-L-FL-fuchushiritsushiraitodai_library.yaml index 26ec32d53e..35d0ada54e 100644 --- a/data/custodian/JP-13-FUC-L-FL-fuchushiritsushiraitodai_library.yaml +++ b/data/custodian/JP-13-FUC-L-FL-fuchushiritsushiraitodai_library.yaml @@ -205,3 +205,30 @@ wikidata_enrichment: wikidata_web: official_website: http://library.city.fuchu.tokyo.jp/about/map02.html wikidata_official_website: http://library.city.fuchu.tokyo.jp/about/map02.html +logo_enrichment: + enrichment_timestamp: '2025-12-25T14:03:45.061892+00:00' + source_url: https://library.city.fuchu.tokyo.jp/lib_info/shiraitodai.html + extraction_method: crawl4ai + claims: + - claim_type: logo_url + claim_value: https://library.city.fuchu.tokyo.jp/themes/lib_theme/images/logo.png + source_url: https://library.city.fuchu.tokyo.jp/lib_info/shiraitodai.html + css_selector: '#header_logo > a.active > img' + retrieved_on: '2025-12-25T14:03:45.061892+00:00' + extraction_method: crawl4ai_header_logo + detection_confidence: high + alt_text: 府中市立図書館 + - claim_type: favicon_url + claim_value: https://library.city.fuchu.tokyo.jp/themes/lib_theme/favicon.ico + source_url: https://library.city.fuchu.tokyo.jp/lib_info/shiraitodai.html + css_selector: '[document] > html > head.notranslate > link' + retrieved_on: '2025-12-25T14:03:45.061892+00:00' + extraction_method: crawl4ai_link_rel + favicon_type: '' + favicon_sizes: '' + summary: + total_claims: 2 + has_primary_logo: true + has_favicon: true + has_og_image: false + favicon_count: 1 diff --git a/data/custodian/JP-13-FUC-L-FL-fuchushiritsushogaigakushusenta_library.yaml b/data/custodian/JP-13-FUC-L-FL-fuchushiritsushogaigakushusenta_library.yaml index 79ebea4561..00801be1f2 100644 --- a/data/custodian/JP-13-FUC-L-FL-fuchushiritsushogaigakushusenta_library.yaml +++ b/data/custodian/JP-13-FUC-L-FL-fuchushiritsushogaigakushusenta_library.yaml @@ -205,3 +205,30 @@ wikidata_enrichment: wikidata_web: official_website: http://library.city.fuchu.tokyo.jp/about/map13.html wikidata_official_website: http://library.city.fuchu.tokyo.jp/about/map13.html +logo_enrichment: + enrichment_timestamp: '2025-12-25T14:03:54.207190+00:00' + source_url: https://library.city.fuchu.tokyo.jp/lib_info/gakushu.html + extraction_method: crawl4ai + claims: + - claim_type: logo_url + claim_value: https://library.city.fuchu.tokyo.jp/themes/lib_theme/images/logo.png + source_url: https://library.city.fuchu.tokyo.jp/lib_info/gakushu.html + css_selector: '#header_logo > a.active > img' + retrieved_on: '2025-12-25T14:03:54.207190+00:00' + extraction_method: crawl4ai_header_logo + detection_confidence: high + alt_text: 府中市立図書館 + - claim_type: favicon_url + claim_value: https://library.city.fuchu.tokyo.jp/themes/lib_theme/favicon.ico + source_url: https://library.city.fuchu.tokyo.jp/lib_info/gakushu.html + css_selector: '[document] > html > head.notranslate > link' + retrieved_on: '2025-12-25T14:03:54.207190+00:00' + extraction_method: crawl4ai_link_rel + favicon_type: '' + favicon_sizes: '' + summary: + total_claims: 2 + has_primary_logo: true + has_favicon: true + has_og_image: false + favicon_count: 1 diff --git a/data/custodian/JP-13-FUC-L-FL-fuchushiritsusumiyoshi_library.yaml b/data/custodian/JP-13-FUC-L-FL-fuchushiritsusumiyoshi_library.yaml index e143b7b18b..906eca8479 100644 --- a/data/custodian/JP-13-FUC-L-FL-fuchushiritsusumiyoshi_library.yaml +++ b/data/custodian/JP-13-FUC-L-FL-fuchushiritsusumiyoshi_library.yaml @@ -205,3 +205,30 @@ wikidata_enrichment: wikidata_web: official_website: http://library.city.fuchu.tokyo.jp/about/map06.html wikidata_official_website: http://library.city.fuchu.tokyo.jp/about/map06.html +logo_enrichment: + enrichment_timestamp: '2025-12-25T14:04:01.969737+00:00' + source_url: https://library.city.fuchu.tokyo.jp/lib_info/sumiyoshi.html + extraction_method: crawl4ai + claims: + - claim_type: logo_url + claim_value: https://library.city.fuchu.tokyo.jp/themes/lib_theme/images/logo.png + source_url: https://library.city.fuchu.tokyo.jp/lib_info/sumiyoshi.html + css_selector: '#header_logo > a.active > img' + retrieved_on: '2025-12-25T14:04:01.969737+00:00' + extraction_method: crawl4ai_header_logo + detection_confidence: high + alt_text: 府中市立図書館 + - claim_type: favicon_url + claim_value: https://library.city.fuchu.tokyo.jp/themes/lib_theme/favicon.ico + source_url: https://library.city.fuchu.tokyo.jp/lib_info/sumiyoshi.html + css_selector: '[document] > html > head.notranslate > link' + retrieved_on: '2025-12-25T14:04:01.969737+00:00' + extraction_method: crawl4ai_link_rel + favicon_type: '' + favicon_sizes: '' + summary: + total_claims: 2 + has_primary_logo: true + has_favicon: true + has_og_image: false + favicon_count: 1 diff --git a/data/custodian/JP-13-FUC-L-FL-fuchushiritsuyotsuya_library.yaml b/data/custodian/JP-13-FUC-L-FL-fuchushiritsuyotsuya_library.yaml index 5fa2ab0c90..4f8d8fef9b 100644 --- a/data/custodian/JP-13-FUC-L-FL-fuchushiritsuyotsuya_library.yaml +++ b/data/custodian/JP-13-FUC-L-FL-fuchushiritsuyotsuya_library.yaml @@ -205,3 +205,30 @@ wikidata_enrichment: wikidata_web: official_website: http://library.city.fuchu.tokyo.jp/about/map09.html wikidata_official_website: http://library.city.fuchu.tokyo.jp/about/map09.html +logo_enrichment: + enrichment_timestamp: '2025-12-25T14:04:12.447683+00:00' + source_url: https://library.city.fuchu.tokyo.jp/lib_info/yotsuya.html + extraction_method: crawl4ai + claims: + - claim_type: logo_url + claim_value: https://library.city.fuchu.tokyo.jp/themes/lib_theme/images/logo.png + source_url: https://library.city.fuchu.tokyo.jp/lib_info/yotsuya.html + css_selector: '#header_logo > a.active > img' + retrieved_on: '2025-12-25T14:04:12.447683+00:00' + extraction_method: crawl4ai_header_logo + detection_confidence: high + alt_text: 府中市立図書館 + - claim_type: favicon_url + claim_value: https://library.city.fuchu.tokyo.jp/themes/lib_theme/favicon.ico + source_url: https://library.city.fuchu.tokyo.jp/lib_info/yotsuya.html + css_selector: '[document] > html > head.notranslate > link' + retrieved_on: '2025-12-25T14:04:12.447683+00:00' + extraction_method: crawl4ai_link_rel + favicon_type: '' + favicon_sizes: '' + summary: + total_claims: 2 + has_primary_logo: true + has_favicon: true + has_og_image: false + favicon_count: 1 diff --git a/data/custodian/JP-13-FUC-L-FL.yaml b/data/custodian/JP-13-FUC-L-FL.yaml index abeee552fb..50c7bc3cc7 100644 --- a/data/custodian/JP-13-FUC-L-FL.yaml +++ b/data/custodian/JP-13-FUC-L-FL.yaml @@ -205,3 +205,30 @@ wikidata_enrichment: wikidata_web: official_website: http://library.city.fuchu.tokyo.jp/ wikidata_official_website: http://library.city.fuchu.tokyo.jp/ +logo_enrichment: + enrichment_timestamp: '2025-12-25T14:04:22.535021+00:00' + source_url: https://library.city.fuchu.tokyo.jp + extraction_method: crawl4ai + claims: + - claim_type: logo_url + claim_value: https://library.city.fuchu.tokyo.jp/themes/lib_theme/images/logo.png + source_url: https://library.city.fuchu.tokyo.jp + css_selector: '#header_logo > a.active > img' + retrieved_on: '2025-12-25T14:04:22.535021+00:00' + extraction_method: crawl4ai_header_logo + detection_confidence: high + alt_text: 府中市立図書館 + - claim_type: favicon_url + claim_value: https://library.city.fuchu.tokyo.jp/themes/lib_theme/favicon.ico + source_url: https://library.city.fuchu.tokyo.jp + css_selector: '[document] > html > head.notranslate > link' + retrieved_on: '2025-12-25T14:04:22.535021+00:00' + extraction_method: crawl4ai_link_rel + favicon_type: '' + favicon_sizes: '' + summary: + total_claims: 2 + has_primary_logo: true + has_favicon: true + has_og_image: false + favicon_count: 1 diff --git a/data/custodian/JP-13-FUC-L-ITMRTPSSL.yaml b/data/custodian/JP-13-FUC-L-ITMRTPSSL.yaml index 86847e0a0d..e3225a3831 100644 --- a/data/custodian/JP-13-FUC-L-ITMRTPSSL.yaml +++ b/data/custodian/JP-13-FUC-L-ITMRTPSSL.yaml @@ -152,3 +152,28 @@ location: geonames_id: 11611632 geonames_name: Fuchū feature_code: PPLA2 +logo_enrichment: + enrichment_timestamp: '2025-12-25T14:04:31.795986+00:00' + source_url: https://www.tama-100.or.jp/category_list.php?frmCd=5-0-0-0-0 + extraction_method: crawl4ai + claims: + - claim_type: favicon_url + claim_value: https://www.tama-100.or.jp/css/img/apple-touch-icon.png + source_url: https://www.tama-100.or.jp/category_list.php?frmCd=5-0-0-0-0 + css_selector: '[document] > html > head > link:nth-of-type(6)' + retrieved_on: '2025-12-25T14:04:31.795986+00:00' + extraction_method: crawl4ai_link_rel + favicon_type: '' + favicon_sizes: 180x180 + - claim_type: og_image_url + claim_value: https://www.tama-100.or.jp/design_img/og_image.png + source_url: https://www.tama-100.or.jp/category_list.php?frmCd=5-0-0-0-0 + css_selector: '[document] > html > head > meta:nth-of-type(6)' + retrieved_on: '2025-12-25T14:04:31.795986+00:00' + extraction_method: crawl4ai_meta_og + summary: + total_claims: 2 + has_primary_logo: false + has_favicon: true + has_og_image: true + favicon_count: 2 diff --git a/data/custodian/JP-13-FUC-L-TUFSL.yaml b/data/custodian/JP-13-FUC-L-TUFSL.yaml index e80d208d47..2d4f6183c2 100644 --- a/data/custodian/JP-13-FUC-L-TUFSL.yaml +++ b/data/custodian/JP-13-FUC-L-TUFSL.yaml @@ -41,13 +41,14 @@ ghcid: method: CH_ANNOTATOR_SOURCE ghcid_history: - ghcid: JP-13-FUC-L-TUFSL - valid_from: "2025-12-10T09:44:02Z" + valid_from: '2025-12-10T09:44:02Z' valid_to: null - reason: "Corrected region code from JP-TO (abbreviation) to JP-13 (Tokyo) per ISO 3166-2:JP" + reason: Corrected region code from JP-TO (abbreviation) to JP-13 (Tokyo) per ISO + 3166-2:JP - ghcid: JP-TO-FUC-L-TUFSL valid_from: null - valid_to: "2025-12-10T09:44:02Z" - reason: "Previous GHCID with incorrect region code" + valid_to: '2025-12-10T09:44:02Z' + reason: Previous GHCID with incorrect region code - ghcid: JP-TO-FUC-L-TUFSL ghcid_numeric: 535539741010551052 valid_from: '2025-12-06T23:38:53.346778+00:00' @@ -106,8 +107,8 @@ ch_annotator: annotation_metadata: confidence_score: 0.98 verified: false - verification_date: - verified_by: + verification_date: null + verified_by: null entity_claims: - claim_type: full_name claim_value: Tokyo University of Foreign Studies Library @@ -195,7 +196,8 @@ wikidata_enrichment: member_of: - id: Q56056912 label: Japan Consortium for Open Access Repository - description: promotes open access and open science in Japan with knowledge dissemination via digital repositories + description: promotes open access and open science in Japan with knowledge dissemination + via digital repositories wikidata_web: official_website: http://www.tufs.ac.jp/common/library/index-j.html wikidata_official_website: http://www.tufs.ac.jp/common/library/index-j.html @@ -217,3 +219,37 @@ location: geonames_id: 11611632 geonames_name: Fuchū feature_code: PPLA2 +logo_enrichment: + enrichment_timestamp: '2025-12-25T14:05:12.415903+00:00' + source_url: http://www.tufs.ac.jp/common/library/index-j.html + extraction_method: crawl4ai + claims: + - claim_type: logo_url + claim_value: https://www.tufs.ac.jp/library/wp-content/uploads/sites/5/2023/09/title-1.png + source_url: http://www.tufs.ac.jp/common/library/index-j.html + css_selector: '#header-in > div.logo.logo-header > a.site-name.site-name-text-link + > span.site-name-text > img.site-logo-image.header-site-logo-image' + retrieved_on: '2025-12-25T14:05:12.415903+00:00' + extraction_method: crawl4ai_header_logo + detection_confidence: high + alt_text: 東京外国語大学附属図書館 + - claim_type: favicon_url + claim_value: https://www.tufs.ac.jp/library/wp-content/uploads/sites/5/2023/09/cropped-TUFS_SM-p-180x180.png + source_url: http://www.tufs.ac.jp/common/library/index-j.html + css_selector: '[document] > html > head > link:nth-of-type(47)' + retrieved_on: '2025-12-25T14:05:12.415903+00:00' + extraction_method: crawl4ai_link_rel + favicon_type: '' + favicon_sizes: '' + - claim_type: og_image_url + claim_value: https://www.tufs.ac.jp/library/wp-content/uploads/sites/5/2021/04/homeimage.jpg + source_url: http://www.tufs.ac.jp/common/library/index-j.html + css_selector: '[document] > html > head > meta:nth-of-type(10)' + retrieved_on: '2025-12-25T14:05:12.415903+00:00' + extraction_method: crawl4ai_meta_og + summary: + total_claims: 3 + has_primary_logo: true + has_favicon: true + has_og_image: true + favicon_count: 3 diff --git a/data/custodian/JP-13-FUC-M-FAM.yaml b/data/custodian/JP-13-FUC-M-FAM.yaml index 6b9adf90e1..2ef3a03176 100644 --- a/data/custodian/JP-13-FUC-M-FAM.yaml +++ b/data/custodian/JP-13-FUC-M-FAM.yaml @@ -1283,3 +1283,28 @@ youtube_enrichment: comments: [] thumbnail_url: https://i.ytimg.com/vi/GeJgP9ic8Ws/hqdefault_live.jpg status: SUCCESS +logo_enrichment: + enrichment_timestamp: '2025-12-25T14:05:20.447090+00:00' + source_url: http://www.city.fuchu.tokyo.jp/art + extraction_method: crawl4ai + claims: + - claim_type: favicon_url + claim_value: http://www.city.fuchu.tokyo.jp/images/apple-touch-icon.png + source_url: http://www.city.fuchu.tokyo.jp/art + css_selector: '[document] > html > head > link:nth-of-type(2)' + retrieved_on: '2025-12-25T14:05:20.447090+00:00' + extraction_method: crawl4ai_link_rel + favicon_type: '' + favicon_sizes: '' + - claim_type: og_image_url + claim_value: https://www.city.fuchu.tokyo.jp/images/ogp.png + source_url: http://www.city.fuchu.tokyo.jp/art + css_selector: '[document] > html > head > meta:nth-of-type(9)' + retrieved_on: '2025-12-25T14:05:20.447090+00:00' + extraction_method: crawl4ai_meta_og + summary: + total_claims: 2 + has_primary_logo: false + has_favicon: true + has_og_image: true + favicon_count: 2 diff --git a/data/custodian/JP-13-FUS-M-FMLH.yaml b/data/custodian/JP-13-FUS-M-FMLH.yaml index 2c640b0df0..f6fd096add 100644 --- a/data/custodian/JP-13-FUS-M-FMLH.yaml +++ b/data/custodian/JP-13-FUS-M-FMLH.yaml @@ -39,13 +39,14 @@ ghcid: method: CH_ANNOTATOR_SOURCE ghcid_history: - ghcid: JP-13-FUS-M-FMLH - valid_from: "2025-12-10T09:44:02Z" + valid_from: '2025-12-10T09:44:02Z' valid_to: null - reason: "Corrected region code from JP-TO (abbreviation) to JP-13 (Tokyo) per ISO 3166-2:JP" + reason: Corrected region code from JP-TO (abbreviation) to JP-13 (Tokyo) per ISO + 3166-2:JP - ghcid: JP-TO-FUS-M-FMLH valid_from: null - valid_to: "2025-12-10T09:44:02Z" - reason: "Previous GHCID with incorrect region code" + valid_to: '2025-12-10T09:44:02Z' + reason: Previous GHCID with incorrect region code - ghcid: JP-TO-FUS-M-FMLH ghcid_numeric: 2304751066352204324 valid_from: '2025-12-06T23:38:33.706761+00:00' @@ -103,8 +104,8 @@ ch_annotator: annotation_metadata: confidence_score: 0.98 verified: false - verification_date: - verified_by: + verification_date: null + verified_by: null entity_claims: - claim_type: full_name claim_value: FUSSA MUSEUM OF LOCAL HISTORY @@ -175,8 +176,8 @@ wikidata_enrichment: instance_of: &id004 - id: Q33506 label: museum - description: institution that holds artifacts and other objects of scientific, artistic, cultural, historical, or other - importance + description: institution that holds artifacts and other objects of scientific, + artistic, cultural, historical, or other importance wikidata_instance_of: *id004 wikidata_location: coordinates: &id007 @@ -218,3 +219,22 @@ location: postal_code: 197-0003 street_address: KUMAGAWA, Fussa Shi, Tokyo To, 197-0003 normalization_timestamp: '2025-12-09T12:21:32.142080+00:00' +logo_enrichment: + enrichment_timestamp: '2025-12-25T14:29:25.890440+00:00' + source_url: https://www.museum.fussa.tokyo.jp + extraction_method: crawl4ai + claims: + - claim_type: favicon_url + claim_value: https://www.museum.fussa.tokyo.jp/cms/wp-content/themes/fussa/images/favicon.ico + source_url: https://www.museum.fussa.tokyo.jp + css_selector: '[document] > html > head > link' + retrieved_on: '2025-12-25T14:29:25.890440+00:00' + extraction_method: crawl4ai_link_rel + favicon_type: '' + favicon_sizes: '' + summary: + total_claims: 1 + has_primary_logo: false + has_favicon: true + has_og_image: false + favicon_count: 1 diff --git a/data/custodian/JP-13-HAC-L-C-chuodaigakuhogakubugakuseitoshoshitsu.yaml b/data/custodian/JP-13-HAC-L-C-chuodaigakuhogakubugakuseitoshoshitsu.yaml index daf21a7f13..a228a526ef 100644 --- a/data/custodian/JP-13-HAC-L-C-chuodaigakuhogakubugakuseitoshoshitsu.yaml +++ b/data/custodian/JP-13-HAC-L-C-chuodaigakuhogakubugakuseitoshoshitsu.yaml @@ -205,3 +205,28 @@ location: geonames_id: 1863440 geonames_name: Hachiōji feature_code: PPLA2 +logo_enrichment: + enrichment_timestamp: '2025-12-25T14:29:33.240002+00:00' + source_url: http://www.chuo-u.ac.jp/library/library_service/tamacampus/law_library + extraction_method: crawl4ai + claims: + - claim_type: favicon_url + claim_value: http://www.chuo-u.ac.jp/favicon-16x16.ico + source_url: http://www.chuo-u.ac.jp/library/library_service/tamacampus/law_library + css_selector: '[document] > html > head > link' + retrieved_on: '2025-12-25T14:29:33.240002+00:00' + extraction_method: crawl4ai_link_rel + favicon_type: '' + favicon_sizes: 16x16 + - claim_type: og_image_url + claim_value: https://www.chuo-u.ac.jp/media/images/common/ogp.jpg + source_url: http://www.chuo-u.ac.jp/library/library_service/tamacampus/law_library + css_selector: '[document] > html > head > meta:nth-of-type(9)' + retrieved_on: '2025-12-25T14:29:33.240002+00:00' + extraction_method: crawl4ai_meta_og + summary: + total_claims: 2 + has_primary_logo: false + has_favicon: true + has_og_image: true + favicon_count: 3 diff --git a/data/custodian/JP-13-HAC-L-C-chuodaigakujimbunkagakukenkyusho.yaml b/data/custodian/JP-13-HAC-L-C-chuodaigakujimbunkagakukenkyusho.yaml index 615ab6a788..e9386d910c 100644 --- a/data/custodian/JP-13-HAC-L-C-chuodaigakujimbunkagakukenkyusho.yaml +++ b/data/custodian/JP-13-HAC-L-C-chuodaigakujimbunkagakukenkyusho.yaml @@ -41,13 +41,14 @@ ghcid: method: CH_ANNOTATOR_SOURCE ghcid_history: - ghcid: JP-13-HAC-L-C-chuodaigakujimbunkagakukenkyusho - valid_from: "2025-12-10T09:44:03Z" + valid_from: '2025-12-10T09:44:03Z' valid_to: null - reason: "Corrected region code from JP-TO (abbreviation) to JP-13 (Tokyo) per ISO 3166-2:JP" + reason: Corrected region code from JP-TO (abbreviation) to JP-13 (Tokyo) per ISO + 3166-2:JP - ghcid: JP-TO-HAC-L-C-chuodaigakujimbunkagakukenkyusho valid_from: null - valid_to: "2025-12-10T09:44:03Z" - reason: "Previous GHCID with incorrect region code" + valid_to: '2025-12-10T09:44:03Z' + reason: Previous GHCID with incorrect region code - ghcid: JP-TO-HAC-L-C-chuodaigakujimbunkagakukenkyusho ghcid_numeric: 7548581585069259310 valid_from: '2025-12-06T23:38:55.046050+00:00' @@ -106,8 +107,8 @@ ch_annotator: annotation_metadata: confidence_score: 0.98 verified: false - verification_date: - verified_by: + verification_date: null + verified_by: null entity_claims: - claim_type: full_name claim_value: CHUODAIGAKUJIMBUNKAGAKUKENKYUSHO @@ -215,3 +216,28 @@ location: geonames_id: 1863440 geonames_name: Hachiōji feature_code: PPLA2 +logo_enrichment: + enrichment_timestamp: '2025-12-25T14:29:40.973116+00:00' + source_url: http://www.chuo-u.ac.jp/research/institutes/culturalscience + extraction_method: crawl4ai + claims: + - claim_type: favicon_url + claim_value: http://www.chuo-u.ac.jp/favicon-16x16.ico + source_url: http://www.chuo-u.ac.jp/research/institutes/culturalscience + css_selector: '[document] > html > head > link' + retrieved_on: '2025-12-25T14:29:40.973116+00:00' + extraction_method: crawl4ai_link_rel + favicon_type: '' + favicon_sizes: 16x16 + - claim_type: og_image_url + claim_value: https://www.chuo-u.ac.jp/media/images/common/ogp.jpg + source_url: http://www.chuo-u.ac.jp/research/institutes/culturalscience + css_selector: '[document] > html > head > meta:nth-of-type(9)' + retrieved_on: '2025-12-25T14:29:40.973116+00:00' + extraction_method: crawl4ai_meta_og + summary: + total_claims: 2 + has_primary_logo: false + has_favicon: true + has_og_image: true + favicon_count: 3 diff --git a/data/custodian/JP-13-HAC-L-C-chuodaigakukeizaikenkyujo.yaml b/data/custodian/JP-13-HAC-L-C-chuodaigakukeizaikenkyujo.yaml index 3074b3e803..4ac7cbb06f 100644 --- a/data/custodian/JP-13-HAC-L-C-chuodaigakukeizaikenkyujo.yaml +++ b/data/custodian/JP-13-HAC-L-C-chuodaigakukeizaikenkyujo.yaml @@ -37,13 +37,14 @@ ghcid: method: CH_ANNOTATOR_SOURCE ghcid_history: - ghcid: JP-13-HAC-L-C-chuodaigakukeizaikenkyujo - valid_from: "2025-12-10T09:44:03Z" + valid_from: '2025-12-10T09:44:03Z' valid_to: null - reason: "Corrected region code from JP-TO (abbreviation) to JP-13 (Tokyo) per ISO 3166-2:JP" + reason: Corrected region code from JP-TO (abbreviation) to JP-13 (Tokyo) per ISO + 3166-2:JP - ghcid: JP-TO-HAC-L-C-chuodaigakukeizaikenkyujo valid_from: null - valid_to: "2025-12-10T09:44:03Z" - reason: "Previous GHCID with incorrect region code" + valid_to: '2025-12-10T09:44:03Z' + reason: Previous GHCID with incorrect region code - ghcid: JP-TO-HAC-L-C-chuodaigakukeizaikenkyujo ghcid_numeric: 4810812187606637727 valid_from: '2025-12-06T23:38:55.041002+00:00' @@ -101,8 +102,8 @@ ch_annotator: annotation_metadata: confidence_score: 0.98 verified: false - verification_date: - verified_by: + verification_date: null + verified_by: null entity_claims: - claim_type: full_name claim_value: CHUODAIGAKUKEIZAIKENKYUJO @@ -205,3 +206,28 @@ location: geonames_id: 1863440 geonames_name: Hachiōji feature_code: PPLA2 +logo_enrichment: + enrichment_timestamp: '2025-12-25T14:30:20.735321+00:00' + source_url: http://www.chuo-u.ac.jp/research/institutes/economic + extraction_method: crawl4ai + claims: + - claim_type: favicon_url + claim_value: http://www.chuo-u.ac.jp/favicon-16x16.ico + source_url: http://www.chuo-u.ac.jp/research/institutes/economic + css_selector: '[document] > html > head > link' + retrieved_on: '2025-12-25T14:30:20.735321+00:00' + extraction_method: crawl4ai_link_rel + favicon_type: '' + favicon_sizes: 16x16 + - claim_type: og_image_url + claim_value: https://www.chuo-u.ac.jp/media/images/common/ogp.jpg + source_url: http://www.chuo-u.ac.jp/research/institutes/economic + css_selector: '[document] > html > head > meta:nth-of-type(9)' + retrieved_on: '2025-12-25T14:30:20.735321+00:00' + extraction_method: crawl4ai_meta_og + summary: + total_claims: 2 + has_primary_logo: false + has_favicon: true + has_og_image: true + favicon_count: 3 diff --git a/data/custodian/JP-13-HAC-L-C-chuodaigakukigyokenkyujo.yaml b/data/custodian/JP-13-HAC-L-C-chuodaigakukigyokenkyujo.yaml index 6a138cf88d..1b6f8d8329 100644 --- a/data/custodian/JP-13-HAC-L-C-chuodaigakukigyokenkyujo.yaml +++ b/data/custodian/JP-13-HAC-L-C-chuodaigakukigyokenkyujo.yaml @@ -37,13 +37,14 @@ ghcid: method: CH_ANNOTATOR_SOURCE ghcid_history: - ghcid: JP-13-HAC-L-C-chuodaigakukigyokenkyujo - valid_from: "2025-12-10T09:44:03Z" + valid_from: '2025-12-10T09:44:03Z' valid_to: null - reason: "Corrected region code from JP-TO (abbreviation) to JP-13 (Tokyo) per ISO 3166-2:JP" + reason: Corrected region code from JP-TO (abbreviation) to JP-13 (Tokyo) per ISO + 3166-2:JP - ghcid: JP-TO-HAC-L-C-chuodaigakukigyokenkyujo valid_from: null - valid_to: "2025-12-10T09:44:03Z" - reason: "Previous GHCID with incorrect region code" + valid_to: '2025-12-10T09:44:03Z' + reason: Previous GHCID with incorrect region code - ghcid: JP-TO-HAC-L-C-chuodaigakukigyokenkyujo ghcid_numeric: 3961943790049198653 valid_from: '2025-12-06T23:38:55.043537+00:00' @@ -101,8 +102,8 @@ ch_annotator: annotation_metadata: confidence_score: 0.98 verified: false - verification_date: - verified_by: + verification_date: null + verified_by: null entity_claims: - claim_type: full_name claim_value: CHUODAIGAKUKIGYOKENKYUJO @@ -204,3 +205,28 @@ location: geonames_id: 1863440 geonames_name: Hachiōji feature_code: PPLA2 +logo_enrichment: + enrichment_timestamp: '2025-12-25T14:30:32.095556+00:00' + source_url: http://www.chuo-u.ac.jp/research/institutes/business + extraction_method: crawl4ai + claims: + - claim_type: favicon_url + claim_value: http://www.chuo-u.ac.jp/favicon-16x16.ico + source_url: http://www.chuo-u.ac.jp/research/institutes/business + css_selector: '[document] > html > head > link' + retrieved_on: '2025-12-25T14:30:32.095556+00:00' + extraction_method: crawl4ai_link_rel + favicon_type: '' + favicon_sizes: 16x16 + - claim_type: og_image_url + claim_value: https://www.chuo-u.ac.jp/media/images/common/ogp.jpg + source_url: http://www.chuo-u.ac.jp/research/institutes/business + css_selector: '[document] > html > head > meta:nth-of-type(9)' + retrieved_on: '2025-12-25T14:30:32.095556+00:00' + extraction_method: crawl4ai_meta_og + summary: + total_claims: 2 + has_primary_logo: false + has_favicon: true + has_og_image: true + favicon_count: 3 diff --git a/data/custodian/JP-13-HAC-L-C-chuodaigakuseisakubunkasogokenkyujo.yaml b/data/custodian/JP-13-HAC-L-C-chuodaigakuseisakubunkasogokenkyujo.yaml index 06b7420c20..ae950585df 100644 --- a/data/custodian/JP-13-HAC-L-C-chuodaigakuseisakubunkasogokenkyujo.yaml +++ b/data/custodian/JP-13-HAC-L-C-chuodaigakuseisakubunkasogokenkyujo.yaml @@ -37,13 +37,14 @@ ghcid: method: CH_ANNOTATOR_SOURCE ghcid_history: - ghcid: JP-13-HAC-L-C-chuodaigakuseisakubunkasogokenkyujo - valid_from: "2025-12-10T09:44:03Z" + valid_from: '2025-12-10T09:44:03Z' valid_to: null - reason: "Corrected region code from JP-TO (abbreviation) to JP-13 (Tokyo) per ISO 3166-2:JP" + reason: Corrected region code from JP-TO (abbreviation) to JP-13 (Tokyo) per ISO + 3166-2:JP - ghcid: JP-TO-HAC-L-C-chuodaigakuseisakubunkasogokenkyujo valid_from: null - valid_to: "2025-12-10T09:44:03Z" - reason: "Previous GHCID with incorrect region code" + valid_to: '2025-12-10T09:44:03Z' + reason: Previous GHCID with incorrect region code - ghcid: JP-TO-HAC-L-C-chuodaigakuseisakubunkasogokenkyujo ghcid_numeric: 16479389462139040776 valid_from: '2025-12-06T23:38:55.054384+00:00' @@ -101,8 +102,8 @@ ch_annotator: annotation_metadata: confidence_score: 0.98 verified: false - verification_date: - verified_by: + verification_date: null + verified_by: null entity_claims: - claim_type: full_name claim_value: CHUODAIGAKUSEISAKUBUNKASOGOKENKYUJO @@ -204,3 +205,28 @@ location: geonames_id: 1863440 geonames_name: Hachiōji feature_code: PPLA2 +logo_enrichment: + enrichment_timestamp: '2025-12-25T14:30:39.722696+00:00' + source_url: http://www.chuo-u.ac.jp/research/institutes/policystudies + extraction_method: crawl4ai + claims: + - claim_type: favicon_url + claim_value: http://www.chuo-u.ac.jp/favicon-16x16.ico + source_url: http://www.chuo-u.ac.jp/research/institutes/policystudies + css_selector: '[document] > html > head > link' + retrieved_on: '2025-12-25T14:30:39.722696+00:00' + extraction_method: crawl4ai_link_rel + favicon_type: '' + favicon_sizes: 16x16 + - claim_type: og_image_url + claim_value: https://www.chuo-u.ac.jp/media/images/common/ogp.jpg + source_url: http://www.chuo-u.ac.jp/research/institutes/policystudies + css_selector: '[document] > html > head > meta:nth-of-type(9)' + retrieved_on: '2025-12-25T14:30:39.722696+00:00' + extraction_method: crawl4ai_meta_og + summary: + total_claims: 2 + has_primary_logo: false + has_favicon: true + has_og_image: true + favicon_count: 3 diff --git a/data/custodian/JP-13-HAC-L-C-chuodaigakushakaikagakukenkyujo.yaml b/data/custodian/JP-13-HAC-L-C-chuodaigakushakaikagakukenkyujo.yaml index 483ada97a0..ffdbee02c4 100644 --- a/data/custodian/JP-13-HAC-L-C-chuodaigakushakaikagakukenkyujo.yaml +++ b/data/custodian/JP-13-HAC-L-C-chuodaigakushakaikagakukenkyujo.yaml @@ -37,13 +37,14 @@ ghcid: method: CH_ANNOTATOR_SOURCE ghcid_history: - ghcid: JP-13-HAC-L-C-chuodaigakushakaikagakukenkyujo - valid_from: "2025-12-10T09:44:03Z" + valid_from: '2025-12-10T09:44:03Z' valid_to: null - reason: "Corrected region code from JP-TO (abbreviation) to JP-13 (Tokyo) per ISO 3166-2:JP" + reason: Corrected region code from JP-TO (abbreviation) to JP-13 (Tokyo) per ISO + 3166-2:JP - ghcid: JP-TO-HAC-L-C-chuodaigakushakaikagakukenkyujo valid_from: null - valid_to: "2025-12-10T09:44:03Z" - reason: "Previous GHCID with incorrect region code" + valid_to: '2025-12-10T09:44:03Z' + reason: Previous GHCID with incorrect region code - ghcid: JP-TO-HAC-L-C-chuodaigakushakaikagakukenkyujo ghcid_numeric: 13572919211061991325 valid_from: '2025-12-06T23:38:55.048987+00:00' @@ -101,8 +102,8 @@ ch_annotator: annotation_metadata: confidence_score: 0.98 verified: false - verification_date: - verified_by: + verification_date: null + verified_by: null entity_claims: - claim_type: full_name claim_value: CHUODAIGAKUSHAKAIKAGAKUKENKYUJO @@ -204,3 +205,28 @@ location: geonames_id: 1863440 geonames_name: Hachiōji feature_code: PPLA2 +logo_enrichment: + enrichment_timestamp: '2025-12-25T14:30:50.025271+00:00' + source_url: http://www.chuo-u.ac.jp/research/institutes/socialsciences + extraction_method: crawl4ai + claims: + - claim_type: favicon_url + claim_value: http://www.chuo-u.ac.jp/favicon-16x16.ico + source_url: http://www.chuo-u.ac.jp/research/institutes/socialsciences + css_selector: '[document] > html > head > link' + retrieved_on: '2025-12-25T14:30:50.025271+00:00' + extraction_method: crawl4ai_link_rel + favicon_type: '' + favicon_sizes: 16x16 + - claim_type: og_image_url + claim_value: https://www.chuo-u.ac.jp/media/images/common/ogp.jpg + source_url: http://www.chuo-u.ac.jp/research/institutes/socialsciences + css_selector: '[document] > html > head > meta:nth-of-type(9)' + retrieved_on: '2025-12-25T14:30:50.025271+00:00' + extraction_method: crawl4ai_meta_og + summary: + total_claims: 2 + has_primary_logo: false + has_favicon: true + has_og_image: true + favicon_count: 3 diff --git a/data/custodian/JP-13-HAC-L-C.yaml b/data/custodian/JP-13-HAC-L-C.yaml index 71d01044ae..0a2d50888c 100644 --- a/data/custodian/JP-13-HAC-L-C.yaml +++ b/data/custodian/JP-13-HAC-L-C.yaml @@ -205,3 +205,28 @@ location: geonames_id: 1863440 geonames_name: Hachiōji feature_code: PPLA2 +logo_enrichment: + enrichment_timestamp: '2025-12-25T14:31:02.271847+00:00' + source_url: http://www.chuo-u.ac.jp/library/library_service/tamacampus + extraction_method: crawl4ai + claims: + - claim_type: favicon_url + claim_value: http://www.chuo-u.ac.jp/favicon-16x16.ico + source_url: http://www.chuo-u.ac.jp/library/library_service/tamacampus + css_selector: '[document] > html > head > link:nth-of-type(10)' + retrieved_on: '2025-12-25T14:31:02.271847+00:00' + extraction_method: crawl4ai_link_rel + favicon_type: '' + favicon_sizes: 16x16 + - claim_type: og_image_url + claim_value: https://www.chuo-u.ac.jp/media/images/common/ogp.png + source_url: http://www.chuo-u.ac.jp/library/library_service/tamacampus + css_selector: '[document] > html > head > meta:nth-of-type(9)' + retrieved_on: '2025-12-25T14:31:02.271847+00:00' + extraction_method: crawl4ai_meta_og + summary: + total_claims: 2 + has_primary_logo: false + has_favicon: true + has_og_image: true + favicon_count: 3 diff --git a/data/custodian/JP-13-HAC-L-CL.yaml b/data/custodian/JP-13-HAC-L-CL.yaml index 7afaba4082..ae5a9659ce 100644 --- a/data/custodian/JP-13-HAC-L-CL.yaml +++ b/data/custodian/JP-13-HAC-L-CL.yaml @@ -228,3 +228,28 @@ location: postal_code: 192-0393 street_address: 742-1 HIGASHINAKANO 742-1, Hachioji Shi, Tokyo To, 192-0393 normalization_timestamp: '2025-12-09T12:21:32.589862+00:00' +logo_enrichment: + enrichment_timestamp: '2025-12-25T14:31:12.652378+00:00' + source_url: http://www.chuo-u.ac.jp/chuo-u/library + extraction_method: crawl4ai + claims: + - claim_type: favicon_url + claim_value: http://www.chuo-u.ac.jp/favicon-16x16.ico + source_url: http://www.chuo-u.ac.jp/chuo-u/library + css_selector: '[document] > html > head > link' + retrieved_on: '2025-12-25T14:31:12.652378+00:00' + extraction_method: crawl4ai_link_rel + favicon_type: '' + favicon_sizes: 16x16 + - claim_type: og_image_url + claim_value: https://www.chuo-u.ac.jp/media/images/common/ogp.jpg + source_url: http://www.chuo-u.ac.jp/chuo-u/library + css_selector: '[document] > html > head > meta:nth-of-type(9)' + retrieved_on: '2025-12-25T14:31:12.652378+00:00' + extraction_method: crawl4ai_meta_og + summary: + total_claims: 2 + has_primary_logo: false + has_favicon: true + has_og_image: true + favicon_count: 3 diff --git a/data/custodian/JP-13-HAC-L-HL-hachijochoritsu_library.yaml b/data/custodian/JP-13-HAC-L-HL-hachijochoritsu_library.yaml index 74eb47d954..265876eb6a 100644 --- a/data/custodian/JP-13-HAC-L-HL-hachijochoritsu_library.yaml +++ b/data/custodian/JP-13-HAC-L-HL-hachijochoritsu_library.yaml @@ -201,3 +201,22 @@ wikidata_enrichment: wikidata_web: official_website: http://www.town.hachijo.tokyo.jp/kakuka/kyouiku/library/tosyo-top.html wikidata_official_website: http://www.town.hachijo.tokyo.jp/kakuka/kyouiku/library/tosyo-top.html +logo_enrichment: + enrichment_timestamp: '2025-12-25T14:31:22.610786+00:00' + source_url: https://www.town.hachijo.tokyo.jp/kakuka/kyouiku/library/tosyo-top.html + extraction_method: crawl4ai + claims: + - claim_type: logo_url + claim_value: https://www.town.hachijo.tokyo.jp/img/logo.png + source_url: https://www.town.hachijo.tokyo.jp/kakuka/kyouiku/library/tosyo-top.html + css_selector: '#header > header > hgroup > a > img' + retrieved_on: '2025-12-25T14:31:22.610786+00:00' + extraction_method: crawl4ai_header_logo + detection_confidence: high + alt_text: 八丈町 + summary: + total_claims: 1 + has_primary_logo: true + has_favicon: false + has_og_image: false + favicon_count: 0 diff --git a/data/custodian/JP-13-HAC-L-HL-hachiojishiikoi_library.yaml b/data/custodian/JP-13-HAC-L-HL-hachiojishiikoi_library.yaml index f41436b5fa..3c6df33707 100644 --- a/data/custodian/JP-13-HAC-L-HL-hachiojishiikoi_library.yaml +++ b/data/custodian/JP-13-HAC-L-HL-hachiojishiikoi_library.yaml @@ -32,13 +32,14 @@ ghcid: method: CH_ANNOTATOR_SOURCE ghcid_history: - ghcid: JP-13-HAC-L-HL-hachiojishiikoi_library - valid_from: "2025-12-10T09:44:03Z" + valid_from: '2025-12-10T09:44:03Z' valid_to: null - reason: "Corrected region code from JP-TO (abbreviation) to JP-13 (Tokyo) per ISO 3166-2:JP" + reason: Corrected region code from JP-TO (abbreviation) to JP-13 (Tokyo) per ISO + 3166-2:JP - ghcid: JP-TO-HAC-L-HL-hachiojishiikoi_library valid_from: null - valid_to: "2025-12-10T09:44:03Z" - reason: "Previous GHCID with incorrect region code" + valid_to: '2025-12-10T09:44:03Z' + reason: Previous GHCID with incorrect region code - ghcid: JP-TO-HAC-L-HL-hachiojishiikoi_library ghcid_numeric: 10998013155664456394 valid_from: '2025-12-06T23:38:52.989861+00:00' @@ -96,8 +97,8 @@ ch_annotator: annotation_metadata: confidence_score: 0.98 verified: false - verification_date: - verified_by: + verification_date: null + verified_by: null entity_claims: - claim_type: full_name claim_value: HACHIOJISHIIKOI Library @@ -151,3 +152,22 @@ location: geonames_id: 1863440 geonames_name: Hachiōji feature_code: PPLA2 +logo_enrichment: + enrichment_timestamp: '2025-12-25T14:31:30.536633+00:00' + source_url: https://www.library.city.hachioji.tokyo.jp/library.html + extraction_method: crawl4ai + claims: + - claim_type: favicon_url + claim_value: https://www.library.city.hachioji.tokyo.jp/img/ruri180.png + source_url: https://www.library.city.hachioji.tokyo.jp/library.html + css_selector: '[document] > html > head > link' + retrieved_on: '2025-12-25T14:31:30.536633+00:00' + extraction_method: crawl4ai_link_rel + favicon_type: '' + favicon_sizes: 180x180 + summary: + total_claims: 1 + has_primary_logo: false + has_favicon: true + has_og_image: false + favicon_count: 1 diff --git a/data/custodian/JP-13-HAC-L-HL-hachiojishiishikawashiminsenta_library.yaml b/data/custodian/JP-13-HAC-L-HL-hachiojishiishikawashiminsenta_library.yaml index eac891db1a..d100e336cc 100644 --- a/data/custodian/JP-13-HAC-L-HL-hachiojishiishikawashiminsenta_library.yaml +++ b/data/custodian/JP-13-HAC-L-HL-hachiojishiishikawashiminsenta_library.yaml @@ -32,13 +32,14 @@ ghcid: method: CH_ANNOTATOR_SOURCE ghcid_history: - ghcid: JP-13-HAC-L-HL-hachiojishiishikawashiminsenta_library - valid_from: "2025-12-10T09:44:03Z" + valid_from: '2025-12-10T09:44:03Z' valid_to: null - reason: "Corrected region code from JP-TO (abbreviation) to JP-13 (Tokyo) per ISO 3166-2:JP" + reason: Corrected region code from JP-TO (abbreviation) to JP-13 (Tokyo) per ISO + 3166-2:JP - ghcid: JP-TO-HAC-L-HL-hachiojishiishikawashiminsenta_library valid_from: null - valid_to: "2025-12-10T09:44:03Z" - reason: "Previous GHCID with incorrect region code" + valid_to: '2025-12-10T09:44:03Z' + reason: Previous GHCID with incorrect region code - ghcid: JP-TO-HAC-L-HL-hachiojishiishikawashiminsenta_library ghcid_numeric: 14077976813549689953 valid_from: '2025-12-06T23:38:52.985114+00:00' @@ -96,8 +97,8 @@ ch_annotator: annotation_metadata: confidence_score: 0.98 verified: false - verification_date: - verified_by: + verification_date: null + verified_by: null entity_claims: - claim_type: full_name claim_value: HACHIOJISHIISHIKAWASHIMINSENTA Library @@ -151,3 +152,22 @@ location: geonames_id: 1863440 geonames_name: Hachiōji feature_code: PPLA2 +logo_enrichment: + enrichment_timestamp: '2025-12-25T14:31:36.829029+00:00' + source_url: https://www.library.city.hachioji.tokyo.jp/library/lib08.html + extraction_method: crawl4ai + claims: + - claim_type: favicon_url + claim_value: https://www.library.city.hachioji.tokyo.jp/img/ruri180.png + source_url: https://www.library.city.hachioji.tokyo.jp/library/lib08.html + css_selector: '[document] > html > head > link' + retrieved_on: '2025-12-25T14:31:36.829029+00:00' + extraction_method: crawl4ai_link_rel + favicon_type: '' + favicon_sizes: 180x180 + summary: + total_claims: 1 + has_primary_logo: false + has_favicon: true + has_og_image: false + favicon_count: 1 diff --git a/data/custodian/JP-13-HAC-L-HL-hachiojishikawaguchi_library.yaml b/data/custodian/JP-13-HAC-L-HL-hachiojishikawaguchi_library.yaml index 1967fada69..49e290b14b 100644 --- a/data/custodian/JP-13-HAC-L-HL-hachiojishikawaguchi_library.yaml +++ b/data/custodian/JP-13-HAC-L-HL-hachiojishikawaguchi_library.yaml @@ -211,3 +211,22 @@ wikidata_enrichment: wikidata_web: official_website: http://www.library.city.hachioji.tokyo.jp/lib04.html wikidata_official_website: http://www.library.city.hachioji.tokyo.jp/lib04.html +logo_enrichment: + enrichment_timestamp: '2025-12-25T14:31:43.820062+00:00' + source_url: https://www.library.city.hachioji.tokyo.jp/index.html + extraction_method: crawl4ai + claims: + - claim_type: favicon_url + claim_value: https://www.library.city.hachioji.tokyo.jp/img/ruri180.png + source_url: https://www.library.city.hachioji.tokyo.jp/index.html + css_selector: '[document] > html > head > link' + retrieved_on: '2025-12-25T14:31:43.820062+00:00' + extraction_method: crawl4ai_link_rel + favicon_type: '' + favicon_sizes: 180x180 + summary: + total_claims: 1 + has_primary_logo: false + has_favicon: true + has_og_image: false + favicon_count: 1 diff --git a/data/custodian/JP-13-HAC-L-HL-hachiojishikitanoshiminsenta_library.yaml b/data/custodian/JP-13-HAC-L-HL-hachiojishikitanoshiminsenta_library.yaml index a3c7f66852..3bf3c47208 100644 --- a/data/custodian/JP-13-HAC-L-HL-hachiojishikitanoshiminsenta_library.yaml +++ b/data/custodian/JP-13-HAC-L-HL-hachiojishikitanoshiminsenta_library.yaml @@ -210,3 +210,22 @@ wikidata_enrichment: wikidata_web: official_website: http://www.library.city.hachioji.tokyo.jp/lib05.html wikidata_official_website: http://www.library.city.hachioji.tokyo.jp/lib05.html +logo_enrichment: + enrichment_timestamp: '2025-12-25T14:31:50.854794+00:00' + source_url: https://www.library.city.hachioji.tokyo.jp/library/lib05.html + extraction_method: crawl4ai + claims: + - claim_type: favicon_url + claim_value: https://www.library.city.hachioji.tokyo.jp/img/ruri180.png + source_url: https://www.library.city.hachioji.tokyo.jp/library/lib05.html + css_selector: '[document] > html > head > link' + retrieved_on: '2025-12-25T14:31:50.854794+00:00' + extraction_method: crawl4ai_link_rel + favicon_type: '' + favicon_sizes: 180x180 + summary: + total_claims: 1 + has_primary_logo: false + has_favicon: true + has_og_image: false + favicon_count: 1 diff --git a/data/custodian/JP-13-HAC-L-HL-hachiojishiminamiosawa_library.yaml b/data/custodian/JP-13-HAC-L-HL-hachiojishiminamiosawa_library.yaml index 6601c754ff..1d7e03c322 100644 --- a/data/custodian/JP-13-HAC-L-HL-hachiojishiminamiosawa_library.yaml +++ b/data/custodian/JP-13-HAC-L-HL-hachiojishiminamiosawa_library.yaml @@ -211,3 +211,22 @@ wikidata_enrichment: wikidata_web: official_website: http://www.library.city.hachioji.tokyo.jp/lib03.html wikidata_official_website: http://www.library.city.hachioji.tokyo.jp/lib03.html +logo_enrichment: + enrichment_timestamp: '2025-12-25T14:31:58.091981+00:00' + source_url: https://www.library.city.hachioji.tokyo.jp/index.html + extraction_method: crawl4ai + claims: + - claim_type: favicon_url + claim_value: https://www.library.city.hachioji.tokyo.jp/img/ruri180.png + source_url: https://www.library.city.hachioji.tokyo.jp/index.html + css_selector: '[document] > html > head > link' + retrieved_on: '2025-12-25T14:31:58.091981+00:00' + extraction_method: crawl4ai_link_rel + favicon_type: '' + favicon_sizes: 180x180 + summary: + total_claims: 1 + has_primary_logo: false + has_favicon: true + has_og_image: false + favicon_count: 1 diff --git a/data/custodian/JP-13-HAC-L-HL-hachiojishiongatashiminsenta_library.yaml b/data/custodian/JP-13-HAC-L-HL-hachiojishiongatashiminsenta_library.yaml index cbcbdc805b..5aebe41b61 100644 --- a/data/custodian/JP-13-HAC-L-HL-hachiojishiongatashiminsenta_library.yaml +++ b/data/custodian/JP-13-HAC-L-HL-hachiojishiongatashiminsenta_library.yaml @@ -152,3 +152,22 @@ location: geonames_id: 1863440 geonames_name: Hachiōji feature_code: PPLA2 +logo_enrichment: + enrichment_timestamp: '2025-12-25T14:32:05.451707+00:00' + source_url: https://www.library.city.hachioji.tokyo.jp/library/lib07.html + extraction_method: crawl4ai + claims: + - claim_type: favicon_url + claim_value: https://www.library.city.hachioji.tokyo.jp/img/ruri180.png + source_url: https://www.library.city.hachioji.tokyo.jp/library/lib07.html + css_selector: '[document] > html > head > link' + retrieved_on: '2025-12-25T14:32:05.451707+00:00' + extraction_method: crawl4ai_link_rel + favicon_type: '' + favicon_sizes: 180x180 + summary: + total_claims: 1 + has_primary_logo: false + has_favicon: true + has_og_image: false + favicon_count: 1 diff --git a/data/custodian/JP-13-HAC-L-HL-hachiojishishogaigakushusenta_library.yaml b/data/custodian/JP-13-HAC-L-HL-hachiojishishogaigakushusenta_library.yaml index 1377d29a42..25a4b04f98 100644 --- a/data/custodian/JP-13-HAC-L-HL-hachiojishishogaigakushusenta_library.yaml +++ b/data/custodian/JP-13-HAC-L-HL-hachiojishishogaigakushusenta_library.yaml @@ -211,3 +211,22 @@ wikidata_enrichment: wikidata_web: official_website: http://www.library.city.hachioji.tokyo.jp/lib02.html wikidata_official_website: http://www.library.city.hachioji.tokyo.jp/lib02.html +logo_enrichment: + enrichment_timestamp: '2025-12-25T14:32:12.143300+00:00' + source_url: https://www.library.city.hachioji.tokyo.jp/index.html + extraction_method: crawl4ai + claims: + - claim_type: favicon_url + claim_value: https://www.library.city.hachioji.tokyo.jp/img/ruri180.png + source_url: https://www.library.city.hachioji.tokyo.jp/index.html + css_selector: '[document] > html > head > link' + retrieved_on: '2025-12-25T14:32:12.143300+00:00' + extraction_method: crawl4ai_link_rel + favicon_type: '' + favicon_sizes: 180x180 + summary: + total_claims: 1 + has_primary_logo: false + has_favicon: true + has_og_image: false + favicon_count: 1 diff --git a/data/custodian/JP-13-HAC-L-HL-hachiojishiyugichuoshiminsenta_library.yaml b/data/custodian/JP-13-HAC-L-HL-hachiojishiyugichuoshiminsenta_library.yaml index 59891396b2..dfd1dc4ed6 100644 --- a/data/custodian/JP-13-HAC-L-HL-hachiojishiyugichuoshiminsenta_library.yaml +++ b/data/custodian/JP-13-HAC-L-HL-hachiojishiyugichuoshiminsenta_library.yaml @@ -32,13 +32,14 @@ ghcid: method: CH_ANNOTATOR_SOURCE ghcid_history: - ghcid: JP-13-HAC-L-HL-hachiojishiyugichuoshiminsenta_library - valid_from: "2025-12-10T09:44:03Z" + valid_from: '2025-12-10T09:44:03Z' valid_to: null - reason: "Corrected region code from JP-TO (abbreviation) to JP-13 (Tokyo) per ISO 3166-2:JP" + reason: Corrected region code from JP-TO (abbreviation) to JP-13 (Tokyo) per ISO + 3166-2:JP - ghcid: JP-TO-HAC-L-HL-hachiojishiyugichuoshiminsenta_library valid_from: null - valid_to: "2025-12-10T09:44:03Z" - reason: "Previous GHCID with incorrect region code" + valid_to: '2025-12-10T09:44:03Z' + reason: Previous GHCID with incorrect region code - ghcid: JP-TO-HAC-L-HL-hachiojishiyugichuoshiminsenta_library ghcid_numeric: 890668732079418372 valid_from: '2025-12-06T23:38:52.987444+00:00' @@ -96,8 +97,8 @@ ch_annotator: annotation_metadata: confidence_score: 0.98 verified: false - verification_date: - verified_by: + verification_date: null + verified_by: null entity_claims: - claim_type: full_name claim_value: HACHIOJISHIYUGICHUOSHIMINSENTA Library @@ -151,3 +152,22 @@ location: geonames_id: 1863440 geonames_name: Hachiōji feature_code: PPLA2 +logo_enrichment: + enrichment_timestamp: '2025-12-25T14:32:18.879656+00:00' + source_url: https://www.library.city.hachioji.tokyo.jp/library/lib09.html + extraction_method: crawl4ai + claims: + - claim_type: favicon_url + claim_value: https://www.library.city.hachioji.tokyo.jp/img/ruri180.png + source_url: https://www.library.city.hachioji.tokyo.jp/library/lib09.html + css_selector: '[document] > html > head > link' + retrieved_on: '2025-12-25T14:32:18.879656+00:00' + extraction_method: crawl4ai_link_rel + favicon_type: '' + favicon_sizes: 180x180 + summary: + total_claims: 1 + has_primary_logo: false + has_favicon: true + has_og_image: false + favicon_count: 1 diff --git a/data/custodian/JP-13-HAC-L-HL-hachiojishiyuishiminsentaminamino_library.yaml b/data/custodian/JP-13-HAC-L-HL-hachiojishiyuishiminsentaminamino_library.yaml index bc105d8edb..85873dc27b 100644 --- a/data/custodian/JP-13-HAC-L-HL-hachiojishiyuishiminsentaminamino_library.yaml +++ b/data/custodian/JP-13-HAC-L-HL-hachiojishiyuishiminsentaminamino_library.yaml @@ -32,13 +32,14 @@ ghcid: method: CH_ANNOTATOR_SOURCE ghcid_history: - ghcid: JP-13-HAC-L-HL-hachiojishiyuishiminsentaminamino_library - valid_from: "2025-12-10T09:44:03Z" + valid_from: '2025-12-10T09:44:03Z' valid_to: null - reason: "Corrected region code from JP-TO (abbreviation) to JP-13 (Tokyo) per ISO 3166-2:JP" + reason: Corrected region code from JP-TO (abbreviation) to JP-13 (Tokyo) per ISO + 3166-2:JP - ghcid: JP-TO-HAC-L-HL-hachiojishiyuishiminsentaminamino_library valid_from: null - valid_to: "2025-12-10T09:44:03Z" - reason: "Previous GHCID with incorrect region code" + valid_to: '2025-12-10T09:44:03Z' + reason: Previous GHCID with incorrect region code - ghcid: JP-TO-HAC-L-HL-hachiojishiyuishiminsentaminamino_library ghcid_numeric: 11038619215475146268 valid_from: '2025-12-06T23:38:52.980072+00:00' @@ -96,8 +97,8 @@ ch_annotator: annotation_metadata: confidence_score: 0.98 verified: false - verification_date: - verified_by: + verification_date: null + verified_by: null entity_claims: - claim_type: full_name claim_value: HACHIOJISHIYUISHIMINSENTAMINAMINO Library @@ -151,3 +152,22 @@ location: geonames_id: 1863440 geonames_name: Hachiōji feature_code: PPLA2 +logo_enrichment: + enrichment_timestamp: '2025-12-25T14:32:25.119659+00:00' + source_url: https://www.library.city.hachioji.tokyo.jp/library/lib06.html + extraction_method: crawl4ai + claims: + - claim_type: favicon_url + claim_value: https://www.library.city.hachioji.tokyo.jp/img/ruri180.png + source_url: https://www.library.city.hachioji.tokyo.jp/library/lib06.html + css_selector: '[document] > html > head > link' + retrieved_on: '2025-12-25T14:32:25.119659+00:00' + extraction_method: crawl4ai_link_rel + favicon_type: '' + favicon_sizes: 180x180 + summary: + total_claims: 1 + has_primary_logo: false + has_favicon: true + has_og_image: false + favicon_count: 1 diff --git a/data/custodian/JP-13-HAC-L-HL.yaml b/data/custodian/JP-13-HAC-L-HL.yaml index 14d95e6b98..9045dc1030 100644 --- a/data/custodian/JP-13-HAC-L-HL.yaml +++ b/data/custodian/JP-13-HAC-L-HL.yaml @@ -213,3 +213,22 @@ wikidata_enrichment: wikidata_web: official_website: http://www.library.city.hachioji.tokyo.jp/lib01.html wikidata_official_website: http://www.library.city.hachioji.tokyo.jp/lib01.html +logo_enrichment: + enrichment_timestamp: '2025-12-25T14:32:32.162036+00:00' + source_url: https://www.library.city.hachioji.tokyo.jp/index.html + extraction_method: crawl4ai + claims: + - claim_type: favicon_url + claim_value: https://www.library.city.hachioji.tokyo.jp/img/ruri180.png + source_url: https://www.library.city.hachioji.tokyo.jp/index.html + css_selector: '[document] > html > head > link' + retrieved_on: '2025-12-25T14:32:32.162036+00:00' + extraction_method: crawl4ai_link_rel + favicon_type: '' + favicon_sizes: 180x180 + summary: + total_claims: 1 + has_primary_logo: false + has_favicon: true + has_og_image: false + favicon_count: 1 diff --git a/data/custodian/JP-13-HAC-L-ICLJCU.yaml b/data/custodian/JP-13-HAC-L-ICLJCU.yaml index 2fe11100a8..f7c3dc0426 100644 --- a/data/custodian/JP-13-HAC-L-ICLJCU.yaml +++ b/data/custodian/JP-13-HAC-L-ICLJCU.yaml @@ -211,3 +211,28 @@ location: geonames_id: 1863440 geonames_name: Hachiōji feature_code: PPLA2 +logo_enrichment: + enrichment_timestamp: '2025-12-25T14:32:41.441274+00:00' + source_url: http://www.chuo-u.ac.jp/chuo-u/ins_law/index_j.html + extraction_method: crawl4ai + claims: + - claim_type: favicon_url + claim_value: http://www.chuo-u.ac.jp/favicon-16x16.ico + source_url: http://www.chuo-u.ac.jp/chuo-u/ins_law/index_j.html + css_selector: '[document] > html > head > link' + retrieved_on: '2025-12-25T14:32:41.441274+00:00' + extraction_method: crawl4ai_link_rel + favicon_type: '' + favicon_sizes: 16x16 + - claim_type: og_image_url + claim_value: https://www.chuo-u.ac.jp/media/images/common/ogp.jpg + source_url: http://www.chuo-u.ac.jp/chuo-u/ins_law/index_j.html + css_selector: '[document] > html > head > meta:nth-of-type(9)' + retrieved_on: '2025-12-25T14:32:41.441274+00:00' + extraction_method: crawl4ai_meta_og + summary: + total_claims: 2 + has_primary_logo: false + has_favicon: true + has_og_image: true + favicon_count: 3 diff --git a/data/custodian/JP-13-HAC-L-IHSSCU.yaml b/data/custodian/JP-13-HAC-L-IHSSCU.yaml index 7a905fec71..3c75b5371e 100644 --- a/data/custodian/JP-13-HAC-L-IHSSCU.yaml +++ b/data/custodian/JP-13-HAC-L-IHSSCU.yaml @@ -37,13 +37,14 @@ ghcid: method: CH_ANNOTATOR_SOURCE ghcid_history: - ghcid: JP-13-HAC-L-IHSSCU - valid_from: "2025-12-10T09:44:03Z" + valid_from: '2025-12-10T09:44:03Z' valid_to: null - reason: "Corrected region code from JP-TO (abbreviation) to JP-13 (Tokyo) per ISO 3166-2:JP" + reason: Corrected region code from JP-TO (abbreviation) to JP-13 (Tokyo) per ISO + 3166-2:JP - ghcid: JP-TO-HAC-L-IHSSCU valid_from: null - valid_to: "2025-12-10T09:44:03Z" - reason: "Previous GHCID with incorrect region code" + valid_to: '2025-12-10T09:44:03Z' + reason: Previous GHCID with incorrect region code - ghcid: JP-TO-HAC-L-IHSSCU ghcid_numeric: 16869296380046832118 valid_from: '2025-12-06T23:38:55.051703+00:00' @@ -101,8 +102,8 @@ ch_annotator: annotation_metadata: confidence_score: 0.98 verified: false - verification_date: - verified_by: + verification_date: null + verified_by: null entity_claims: - claim_type: full_name claim_value: Institute of Health and Sports Science, Chuo University @@ -204,3 +205,28 @@ location: geonames_id: 1863440 geonames_name: Hachiōji feature_code: PPLA2 +logo_enrichment: + enrichment_timestamp: '2025-12-25T14:32:53.671522+00:00' + source_url: http://www.chuo-u.ac.jp/research/institutes/hsscience + extraction_method: crawl4ai + claims: + - claim_type: favicon_url + claim_value: http://www.chuo-u.ac.jp/favicon-16x16.ico + source_url: http://www.chuo-u.ac.jp/research/institutes/hsscience + css_selector: '[document] > html > head > link' + retrieved_on: '2025-12-25T14:32:53.671522+00:00' + extraction_method: crawl4ai_link_rel + favicon_type: '' + favicon_sizes: 16x16 + - claim_type: og_image_url + claim_value: https://www.chuo-u.ac.jp/media/images/common/ogp.jpg + source_url: http://www.chuo-u.ac.jp/research/institutes/hsscience + css_selector: '[document] > html > head > meta:nth-of-type(9)' + retrieved_on: '2025-12-25T14:32:53.671522+00:00' + extraction_method: crawl4ai_meta_og + summary: + total_claims: 2 + has_primary_logo: false + has_favicon: true + has_og_image: true + favicon_count: 3 diff --git a/data/custodian/JP-13-HAC-L-NL.yaml b/data/custodian/JP-13-HAC-L-NL.yaml index 74b08772fb..6755eaa1a1 100644 --- a/data/custodian/JP-13-HAC-L-NL.yaml +++ b/data/custodian/JP-13-HAC-L-NL.yaml @@ -37,13 +37,14 @@ ghcid: method: CH_ANNOTATOR_SOURCE ghcid_history: - ghcid: JP-13-HAC-L-NL - valid_from: "2025-12-10T09:44:03Z" + valid_from: '2025-12-10T09:44:03Z' valid_to: null - reason: "Corrected region code from JP-TO (abbreviation) to JP-13 (Tokyo) per ISO 3166-2:JP" + reason: Corrected region code from JP-TO (abbreviation) to JP-13 (Tokyo) per ISO + 3166-2:JP - ghcid: JP-TO-HAC-L-NL valid_from: null - valid_to: "2025-12-10T09:44:03Z" - reason: "Previous GHCID with incorrect region code" + valid_to: '2025-12-10T09:44:03Z' + reason: Previous GHCID with incorrect region code - ghcid: JP-TO-HAC-L-NL ghcid_numeric: 16809677814190662144 valid_from: '2025-12-06T23:38:55.391353+00:00' @@ -101,8 +102,8 @@ ch_annotator: annotation_metadata: confidence_score: 0.98 verified: false - verification_date: - verified_by: + verification_date: null + verified_by: null entity_claims: - claim_type: full_name claim_value: NIHOMBUNKADAIGAKU Library @@ -204,3 +205,22 @@ location: geonames_id: 1863440 geonames_name: Hachiōji feature_code: PPLA2 +logo_enrichment: + enrichment_timestamp: '2025-12-25T14:33:09.497942+00:00' + source_url: http://www.nihonbunka-u.ac.jp + extraction_method: crawl4ai + claims: + - claim_type: favicon_url + claim_value: https://nihonbunka-u.ac.jp/university_2022/wp-content/themes/nbu/assets/img/favicon.ico + source_url: http://www.nihonbunka-u.ac.jp + css_selector: '[document] > html.chrome > head > link' + retrieved_on: '2025-12-25T14:33:09.497942+00:00' + extraction_method: crawl4ai_link_rel + favicon_type: '' + favicon_sizes: '' + summary: + total_claims: 1 + has_primary_logo: false + has_favicon: true + has_og_image: false + favicon_count: 1 diff --git a/data/custodian/JP-13-HAC-L-OC.yaml b/data/custodian/JP-13-HAC-L-OC.yaml index bf44b36026..b2a4462665 100644 --- a/data/custodian/JP-13-HAC-L-OC.yaml +++ b/data/custodian/JP-13-HAC-L-OC.yaml @@ -281,3 +281,31 @@ location: postal_code: 192-8512 street_address: 2-3 KUBOYAMACHO, Hachioji Shi, Tokyo To, 192-8512 normalization_timestamp: '2025-12-09T12:21:33.326401+00:00' +logo_enrichment: + enrichment_timestamp: '2025-12-25T14:33:18.220942+00:00' + source_url: http://www.olympus.co.jp + extraction_method: crawl4ai + claims: + - claim_type: logo_url + claim_value: http://www.olympus.co.jp/shared/images/ci-logo-01.png + source_url: http://www.olympus.co.jp + css_selector: '#header > div.header-inner:nth-of-type(2) > h1.header-logo > a + > img' + retrieved_on: '2025-12-25T14:33:18.220942+00:00' + extraction_method: crawl4ai_header_logo + detection_confidence: high + alt_text: オリンパスコーポレートロゴ + - claim_type: favicon_url + claim_value: http://www.olympus.co.jp/shared/images/icon-webclip-01.png + source_url: http://www.olympus.co.jp + css_selector: '[document] > html.js.flexbox > head > link' + retrieved_on: '2025-12-25T14:33:18.220942+00:00' + extraction_method: crawl4ai_link_rel + favicon_type: '' + favicon_sizes: '' + summary: + total_claims: 2 + has_primary_logo: true + has_favicon: true + has_og_image: false + favicon_count: 1 diff --git a/data/custodian/JP-13-HAC-L-SUFLFSEA.yaml b/data/custodian/JP-13-HAC-L-SUFLFSEA.yaml index b91536427e..c0944c02fd 100644 --- a/data/custodian/JP-13-HAC-L-SUFLFSEA.yaml +++ b/data/custodian/JP-13-HAC-L-SUFLFSEA.yaml @@ -37,13 +37,14 @@ ghcid: method: CH_ANNOTATOR_SOURCE ghcid_history: - ghcid: JP-13-HAC-L-SUFLFSEA - valid_from: "2025-12-10T09:44:03Z" + valid_from: '2025-12-10T09:44:03Z' valid_to: null - reason: "Corrected region code from JP-TO (abbreviation) to JP-13 (Tokyo) per ISO 3166-2:JP" + reason: Corrected region code from JP-TO (abbreviation) to JP-13 (Tokyo) per ISO + 3166-2:JP - ghcid: JP-TO-HAC-L-SUFLFSEA valid_from: null - valid_to: "2025-12-10T09:44:03Z" - reason: "Previous GHCID with incorrect region code" + valid_to: '2025-12-10T09:44:03Z' + reason: Previous GHCID with incorrect region code - ghcid: JP-TO-HAC-L-SUFLFSEA ghcid_numeric: 12358771442224844367 valid_from: '2025-12-06T23:38:54.922652+00:00' @@ -101,11 +102,12 @@ ch_annotator: annotation_metadata: confidence_score: 0.98 verified: false - verification_date: - verified_by: + verification_date: null + verified_by: null entity_claims: - claim_type: full_name - claim_value: Soka University Fraser Library(Faculty of Science and Engineering Annex) + claim_value: Soka University Fraser Library(Faculty of Science and Engineering + Annex) property_uri: skos:prefLabel provenance: namespace: glam @@ -164,7 +166,8 @@ wikidata_enrichment: wikidata_labels: en: Soka University Fraser Library(Faculty of Science and Engineering Annex) ja: 創価大学フレイザー図書館(理工学部分館) - wikidata_label_en: Soka University Fraser Library(Faculty of Science and Engineering Annex) + wikidata_label_en: Soka University Fraser Library(Faculty of Science and Engineering + Annex) wikidata_label_ja: 創価大学フレイザー図書館(理工学部分館) wikidata_classification: instance_of: &id004 @@ -204,3 +207,22 @@ location: geonames_id: 1863440 geonames_name: Hachiōji feature_code: PPLA2 +logo_enrichment: + enrichment_timestamp: '2025-12-25T14:33:26.796518+00:00' + source_url: http://lib.soka.ac.jp + extraction_method: crawl4ai + claims: + - claim_type: favicon_url + claim_value: http://lib.soka.ac.jp/images/common/favicon.png + source_url: http://lib.soka.ac.jp + css_selector: '[document] > html > head > link' + retrieved_on: '2025-12-25T14:33:26.796518+00:00' + extraction_method: crawl4ai_link_rel + favicon_type: image/x-icon + favicon_sizes: '' + summary: + total_claims: 1 + has_primary_logo: false + has_favicon: true + has_og_image: false + favicon_count: 1 diff --git a/data/custodian/JP-13-HAC-L-SUL.yaml b/data/custodian/JP-13-HAC-L-SUL.yaml index 3ed76fac21..98a6113be1 100644 --- a/data/custodian/JP-13-HAC-L-SUL.yaml +++ b/data/custodian/JP-13-HAC-L-SUL.yaml @@ -37,13 +37,14 @@ ghcid: method: CH_ANNOTATOR_SOURCE ghcid_history: - ghcid: JP-13-HAC-L-SUL - valid_from: "2025-12-10T09:44:03Z" + valid_from: '2025-12-10T09:44:03Z' valid_to: null - reason: "Corrected region code from JP-TO (abbreviation) to JP-13 (Tokyo) per ISO 3166-2:JP" + reason: Corrected region code from JP-TO (abbreviation) to JP-13 (Tokyo) per ISO + 3166-2:JP - ghcid: JP-TO-HAC-L-SUL valid_from: null - valid_to: "2025-12-10T09:44:03Z" - reason: "Previous GHCID with incorrect region code" + valid_to: '2025-12-10T09:44:03Z' + reason: Previous GHCID with incorrect region code - ghcid: JP-TO-HAC-L-SUL ghcid_numeric: 4066965078261491998 valid_from: '2025-12-06T23:38:54.919834+00:00' @@ -101,8 +102,8 @@ ch_annotator: annotation_metadata: confidence_score: 0.98 verified: false - verification_date: - verified_by: + verification_date: null + verified_by: null entity_claims: - claim_type: full_name claim_value: Soka University Library @@ -196,7 +197,8 @@ wikidata_enrichment: description: organisatie uit Japan - id: Q56056912 label: Japan Consortium for Open Access Repository - description: promotes open access and open science in Japan with knowledge dissemination via digital repositories + description: promotes open access and open science in Japan with knowledge dissemination + via digital repositories wikidata_web: official_website: http://lib.soka.ac.jp/ wikidata_official_website: http://lib.soka.ac.jp/ @@ -218,3 +220,22 @@ location: geonames_id: 1863440 geonames_name: Hachiōji feature_code: PPLA2 +logo_enrichment: + enrichment_timestamp: '2025-12-25T14:33:35.263462+00:00' + source_url: http://lib.soka.ac.jp + extraction_method: crawl4ai + claims: + - claim_type: favicon_url + claim_value: http://lib.soka.ac.jp/images/common/favicon.png + source_url: http://lib.soka.ac.jp + css_selector: '[document] > html > head > link' + retrieved_on: '2025-12-25T14:33:35.263462+00:00' + extraction_method: crawl4ai_link_rel + favicon_type: image/x-icon + favicon_sizes: '' + summary: + total_claims: 1 + has_primary_logo: false + has_favicon: true + has_og_image: false + favicon_count: 1 diff --git a/data/custodian/JP-13-HAC-L-SULSL.yaml b/data/custodian/JP-13-HAC-L-SULSL.yaml index f669057883..c2529a3822 100644 --- a/data/custodian/JP-13-HAC-L-SULSL.yaml +++ b/data/custodian/JP-13-HAC-L-SULSL.yaml @@ -37,13 +37,14 @@ ghcid: method: CH_ANNOTATOR_SOURCE ghcid_history: - ghcid: JP-13-HAC-L-SULSL - valid_from: "2025-12-10T09:44:03Z" + valid_from: '2025-12-10T09:44:03Z' valid_to: null - reason: "Corrected region code from JP-TO (abbreviation) to JP-13 (Tokyo) per ISO 3166-2:JP" + reason: Corrected region code from JP-TO (abbreviation) to JP-13 (Tokyo) per ISO + 3166-2:JP - ghcid: JP-TO-HAC-L-SULSL valid_from: null - valid_to: "2025-12-10T09:44:03Z" - reason: "Previous GHCID with incorrect region code" + valid_to: '2025-12-10T09:44:03Z' + reason: Previous GHCID with incorrect region code - ghcid: JP-TO-HAC-L-SULSL ghcid_numeric: 8607275504862694189 valid_from: '2025-12-06T23:38:54.926025+00:00' @@ -101,8 +102,8 @@ ch_annotator: annotation_metadata: confidence_score: 0.98 verified: false - verification_date: - verified_by: + verification_date: null + verified_by: null entity_claims: - claim_type: full_name claim_value: Soka University Law School Library @@ -204,3 +205,22 @@ location: geonames_id: 1863440 geonames_name: Hachiōji feature_code: PPLA2 +logo_enrichment: + enrichment_timestamp: '2025-12-25T14:33:43.973027+00:00' + source_url: http://lib.soka.ac.jp + extraction_method: crawl4ai + claims: + - claim_type: favicon_url + claim_value: http://lib.soka.ac.jp/images/common/favicon.png + source_url: http://lib.soka.ac.jp + css_selector: '[document] > html > head > link' + retrieved_on: '2025-12-25T14:33:43.973027+00:00' + extraction_method: crawl4ai_link_rel + favicon_type: image/x-icon + favicon_sizes: '' + summary: + total_claims: 1 + has_primary_logo: false + has_favicon: true + has_og_image: false + favicon_count: 1 diff --git a/data/custodian/JP-13-HAC-L-SUSL.yaml b/data/custodian/JP-13-HAC-L-SUSL.yaml index 7882a4323e..a2364b57c0 100644 --- a/data/custodian/JP-13-HAC-L-SUSL.yaml +++ b/data/custodian/JP-13-HAC-L-SUSL.yaml @@ -37,13 +37,14 @@ ghcid: method: CH_ANNOTATOR_SOURCE ghcid_history: - ghcid: JP-13-HAC-L-SUSL - valid_from: "2025-12-10T09:44:03Z" + valid_from: '2025-12-10T09:44:03Z' valid_to: null - reason: "Corrected region code from JP-TO (abbreviation) to JP-13 (Tokyo) per ISO 3166-2:JP" + reason: Corrected region code from JP-TO (abbreviation) to JP-13 (Tokyo) per ISO + 3166-2:JP - ghcid: JP-TO-HAC-L-SUSL valid_from: null - valid_to: "2025-12-10T09:44:03Z" - reason: "Previous GHCID with incorrect region code" + valid_to: '2025-12-10T09:44:03Z' + reason: Previous GHCID with incorrect region code - ghcid: JP-TO-HAC-L-SUSL ghcid_numeric: 14973580792834017221 valid_from: '2025-12-06T23:38:59.735891+00:00' @@ -101,8 +102,8 @@ ch_annotator: annotation_metadata: confidence_score: 0.98 verified: false - verification_date: - verified_by: + verification_date: null + verified_by: null entity_claims: - claim_type: full_name claim_value: Soka University Shirakaba Library @@ -204,3 +205,22 @@ location: geonames_id: 1863440 geonames_name: Hachiōji feature_code: PPLA2 +logo_enrichment: + enrichment_timestamp: '2025-12-25T14:33:53.316870+00:00' + source_url: http://lib.soka.ac.jp/kango + extraction_method: crawl4ai + claims: + - claim_type: favicon_url + claim_value: http://lib.soka.ac.jp/images/common/favicon.png + source_url: http://lib.soka.ac.jp/kango + css_selector: '[document] > html > head > link' + retrieved_on: '2025-12-25T14:33:53.316870+00:00' + extraction_method: crawl4ai_link_rel + favicon_type: image/x-icon + favicon_sizes: '' + summary: + total_claims: 1 + has_primary_logo: false + has_favicon: true + has_og_image: false + favicon_count: 1 diff --git a/data/custodian/JP-13-HAC-L-SWSCL.yaml b/data/custodian/JP-13-HAC-L-SWSCL.yaml index 3e0bc6ff63..7a730dc43d 100644 --- a/data/custodian/JP-13-HAC-L-SWSCL.yaml +++ b/data/custodian/JP-13-HAC-L-SWSCL.yaml @@ -37,13 +37,14 @@ ghcid: method: CH_ANNOTATOR_SOURCE ghcid_history: - ghcid: JP-13-HAC-L-SWSCL - valid_from: "2025-12-10T09:44:03Z" + valid_from: '2025-12-10T09:44:03Z' valid_to: null - reason: "Corrected region code from JP-TO (abbreviation) to JP-13 (Tokyo) per ISO 3166-2:JP" + reason: Corrected region code from JP-TO (abbreviation) to JP-13 (Tokyo) per ISO + 3166-2:JP - ghcid: JP-TO-HAC-L-SWSCL valid_from: null - valid_to: "2025-12-10T09:44:03Z" - reason: "Previous GHCID with incorrect region code" + valid_to: '2025-12-10T09:44:03Z' + reason: Previous GHCID with incorrect region code - ghcid: JP-TO-HAC-L-SWSCL ghcid_numeric: 17472482588682182680 valid_from: '2025-12-06T23:38:56.929585+00:00' @@ -101,8 +102,8 @@ ch_annotator: annotation_metadata: confidence_score: 0.98 verified: false - verification_date: - verified_by: + verification_date: null + verified_by: null entity_claims: - claim_type: full_name claim_value: Soka Woman's College Library @@ -204,3 +205,22 @@ location: geonames_id: 1863440 geonames_name: Hachiōji feature_code: PPLA2 +logo_enrichment: + enrichment_timestamp: '2025-12-25T14:34:02.652657+00:00' + source_url: http://lib.soka.ac.jp/kahou + extraction_method: crawl4ai + claims: + - claim_type: favicon_url + claim_value: http://lib.soka.ac.jp/img/common/favicon.png + source_url: http://lib.soka.ac.jp/kahou + css_selector: '[document] > html > head > link' + retrieved_on: '2025-12-25T14:34:02.652657+00:00' + extraction_method: crawl4ai_link_rel + favicon_type: image/x-icon + favicon_sizes: '' + summary: + total_claims: 1 + has_primary_logo: false + has_favicon: true + has_og_image: false + favicon_count: 1 diff --git a/data/custodian/JP-13-HAC-L-TL-tokyojunshindaigaku_library.yaml b/data/custodian/JP-13-HAC-L-TL-tokyojunshindaigaku_library.yaml index c18efae411..17e4c66583 100644 --- a/data/custodian/JP-13-HAC-L-TL-tokyojunshindaigaku_library.yaml +++ b/data/custodian/JP-13-HAC-L-TL-tokyojunshindaigaku_library.yaml @@ -37,13 +37,14 @@ ghcid: method: CH_ANNOTATOR_SOURCE ghcid_history: - ghcid: JP-13-HAC-L-TL-tokyojunshindaigaku_library - valid_from: "2025-12-10T09:44:03Z" + valid_from: '2025-12-10T09:44:03Z' valid_to: null - reason: "Corrected region code from JP-TO (abbreviation) to JP-13 (Tokyo) per ISO 3166-2:JP" + reason: Corrected region code from JP-TO (abbreviation) to JP-13 (Tokyo) per ISO + 3166-2:JP - ghcid: JP-TO-HAC-L-TL-tokyojunshindaigaku_library valid_from: null - valid_to: "2025-12-10T09:44:03Z" - reason: "Previous GHCID with incorrect region code" + valid_to: '2025-12-10T09:44:03Z' + reason: Previous GHCID with incorrect region code - ghcid: JP-TO-HAC-L-TL-tokyojunshindaigaku_library ghcid_numeric: 9988006338368822697 valid_from: '2025-12-06T23:38:55.417938+00:00' @@ -101,8 +102,8 @@ ch_annotator: annotation_metadata: confidence_score: 0.98 verified: false - verification_date: - verified_by: + verification_date: null + verified_by: null entity_claims: - claim_type: full_name claim_value: TOKYOJUNSHINDAIGAKU Library @@ -196,7 +197,8 @@ wikidata_enrichment: description: organisatie uit Japan - id: Q56056912 label: Japan Consortium for Open Access Repository - description: promotes open access and open science in Japan with knowledge dissemination via digital repositories + description: promotes open access and open science in Japan with knowledge dissemination + via digital repositories wikidata_web: official_website: http://www.t-junshin.ac.jp/univ/gar wikidata_official_website: http://www.t-junshin.ac.jp/univ/gar @@ -218,3 +220,28 @@ location: geonames_id: 1863440 geonames_name: Hachiōji feature_code: PPLA2 +logo_enrichment: + enrichment_timestamp: '2025-12-25T14:34:10.531393+00:00' + source_url: http://www.t-junshin.ac.jp/univ/gar + extraction_method: crawl4ai + claims: + - claim_type: favicon_url + claim_value: http://www.t-junshin.ac.jp/univ/wp-content/uploads/cropped-favicon-180x180.png + source_url: http://www.t-junshin.ac.jp/univ/gar + css_selector: '[document] > html > head > link:nth-of-type(40)' + retrieved_on: '2025-12-25T14:34:10.531393+00:00' + extraction_method: crawl4ai_link_rel + favicon_type: '' + favicon_sizes: '' + - claim_type: og_image_url + claim_value: http://www.t-junshin.ac.jp/univ/wp-content/uploads/null_img.jpg + source_url: http://www.t-junshin.ac.jp/univ/gar + css_selector: '[document] > html > head > meta:nth-of-type(10)' + retrieved_on: '2025-12-25T14:34:10.531393+00:00' + extraction_method: crawl4ai_meta_og + summary: + total_claims: 2 + has_primary_logo: false + has_favicon: true + has_og_image: true + favicon_count: 3 diff --git a/data/custodian/JP-13-HAC-L-TL-tokyozokeidaigakufuzoku_library.yaml b/data/custodian/JP-13-HAC-L-TL-tokyozokeidaigakufuzoku_library.yaml index 2b836febc2..8eca9285f4 100644 --- a/data/custodian/JP-13-HAC-L-TL-tokyozokeidaigakufuzoku_library.yaml +++ b/data/custodian/JP-13-HAC-L-TL-tokyozokeidaigakufuzoku_library.yaml @@ -37,13 +37,14 @@ ghcid: method: CH_ANNOTATOR_SOURCE ghcid_history: - ghcid: JP-13-HAC-L-TL-tokyozokeidaigakufuzoku_library - valid_from: "2025-12-10T09:44:03Z" + valid_from: '2025-12-10T09:44:03Z' valid_to: null - reason: "Corrected region code from JP-TO (abbreviation) to JP-13 (Tokyo) per ISO 3166-2:JP" + reason: Corrected region code from JP-TO (abbreviation) to JP-13 (Tokyo) per ISO + 3166-2:JP - ghcid: JP-TO-HAC-L-TL-tokyozokeidaigakufuzoku_library valid_from: null - valid_to: "2025-12-10T09:44:03Z" - reason: "Previous GHCID with incorrect region code" + valid_to: '2025-12-10T09:44:03Z' + reason: Previous GHCID with incorrect region code - ghcid: JP-TO-HAC-L-TL-tokyozokeidaigakufuzoku_library ghcid_numeric: 1565219728940050495 valid_from: '2025-12-06T23:38:55.117520+00:00' @@ -101,8 +102,8 @@ ch_annotator: annotation_metadata: confidence_score: 0.98 verified: false - verification_date: - verified_by: + verification_date: null + verified_by: null entity_claims: - claim_type: full_name claim_value: TOKYOZOKEIDAIGAKUFUZOKU Library @@ -215,3 +216,22 @@ location: geonames_id: 1863440 geonames_name: Hachiōji feature_code: PPLA2 +logo_enrichment: + enrichment_timestamp: '2025-12-25T14:34:35.462645+00:00' + source_url: http://www.zokei.ac.jp/library + extraction_method: crawl4ai + claims: + - claim_type: favicon_url + claim_value: https://www.zokei.ac.jp/wp-content/themes/zokeiweb/favicon.ico + source_url: http://www.zokei.ac.jp/library + css_selector: '[document] > html > head > link:nth-of-type(13)' + retrieved_on: '2025-12-25T14:34:35.462645+00:00' + extraction_method: crawl4ai_link_rel + favicon_type: '' + favicon_sizes: '' + summary: + total_claims: 1 + has_primary_logo: false + has_favicon: true + has_og_image: false + favicon_count: 1 diff --git a/data/custodian/JP-13-HAC-L-TL.yaml b/data/custodian/JP-13-HAC-L-TL.yaml index 8a36b1ef0a..6e6d7339b2 100644 --- a/data/custodian/JP-13-HAC-L-TL.yaml +++ b/data/custodian/JP-13-HAC-L-TL.yaml @@ -39,13 +39,14 @@ ghcid: method: CH_ANNOTATOR_SOURCE ghcid_history: - ghcid: JP-13-HAC-L-TL - valid_from: "2025-12-10T09:44:03Z" + valid_from: '2025-12-10T09:44:03Z' valid_to: null - reason: "Corrected region code from JP-TO (abbreviation) to JP-13 (Tokyo) per ISO 3166-2:JP" + reason: Corrected region code from JP-TO (abbreviation) to JP-13 (Tokyo) per ISO + 3166-2:JP - ghcid: JP-TO-HAC-L-TL valid_from: null - valid_to: "2025-12-10T09:44:03Z" - reason: "Previous GHCID with incorrect region code" + valid_to: '2025-12-10T09:44:03Z' + reason: Previous GHCID with incorrect region code - ghcid: JP-TO-HAC-L-TL ghcid_numeric: 16823901011793290075 valid_from: '2025-12-06T23:38:55.017545+00:00' @@ -103,8 +104,8 @@ ch_annotator: annotation_metadata: confidence_score: 0.98 verified: false - verification_date: - verified_by: + verification_date: null + verified_by: null entity_claims: - claim_type: full_name claim_value: TAMABIJUTSUDAIGAKU Library @@ -250,3 +251,22 @@ location: postal_code: 192-0394 street_address: 2-1723 YARIMIZU, Hachioji Shi, Tokyo To, 192-0394 normalization_timestamp: '2025-12-09T12:21:33.759165+00:00' +logo_enrichment: + enrichment_timestamp: '2025-12-25T14:34:41.215907+00:00' + source_url: http://library.tamabi.ac.jp + extraction_method: crawl4ai + claims: + - claim_type: favicon_url + claim_value: http://library.tamabi.ac.jp/opac/images/cyan/favicon.ico + source_url: http://library.tamabi.ac.jp + css_selector: '[document] > html > head > link:nth-of-type(9)' + retrieved_on: '2025-12-25T14:34:41.215907+00:00' + extraction_method: crawl4ai_link_rel + favicon_type: image/x-icon + favicon_sizes: '' + summary: + total_claims: 1 + has_primary_logo: false + has_favicon: true + has_og_image: false + favicon_count: 1 diff --git a/data/custodian/JP-13-HAC-L-TUHL.yaml b/data/custodian/JP-13-HAC-L-TUHL.yaml index 202083ddba..d02158b237 100644 --- a/data/custodian/JP-13-HAC-L-TUHL.yaml +++ b/data/custodian/JP-13-HAC-L-TUHL.yaml @@ -37,13 +37,14 @@ ghcid: method: CH_ANNOTATOR_SOURCE ghcid_history: - ghcid: JP-13-HAC-L-TUHL - valid_from: "2025-12-10T09:44:03Z" + valid_from: '2025-12-10T09:44:03Z' valid_to: null - reason: "Corrected region code from JP-TO (abbreviation) to JP-13 (Tokyo) per ISO 3166-2:JP" + reason: Corrected region code from JP-TO (abbreviation) to JP-13 (Tokyo) per ISO + 3166-2:JP - ghcid: JP-TO-HAC-L-TUHL valid_from: null - valid_to: "2025-12-10T09:44:03Z" - reason: "Previous GHCID with incorrect region code" + valid_to: '2025-12-10T09:44:03Z' + reason: Previous GHCID with incorrect region code - ghcid: JP-TO-HAC-L-TUHL ghcid_numeric: 7628512807518341674 valid_from: '2025-12-06T23:38:55.009876+00:00' @@ -101,8 +102,8 @@ ch_annotator: annotation_metadata: confidence_score: 0.98 verified: false - verification_date: - verified_by: + verification_date: null + verified_by: null entity_claims: - claim_type: full_name claim_value: Takushoku University Hachioji Library @@ -204,3 +205,20 @@ location: geonames_id: 1863440 geonames_name: Hachiōji feature_code: PPLA2 +logo_enrichment: + enrichment_timestamp: '2025-12-25T14:34:57.604015+00:00' + source_url: http://www.takushoku-u.ac.jp/library + extraction_method: crawl4ai + claims: + - claim_type: og_image_url + claim_value: https://www.takushoku-u.ac.jp/images/standard_photo_takudai_logo.gif + source_url: http://www.takushoku-u.ac.jp/library + css_selector: '[document] > html > head > meta:nth-of-type(15)' + retrieved_on: '2025-12-25T14:34:57.604015+00:00' + extraction_method: crawl4ai_meta_og + summary: + total_claims: 1 + has_primary_logo: false + has_favicon: false + has_og_image: true + favicon_count: 0 diff --git a/data/custodian/JP-13-HAC-L-YL.yaml b/data/custodian/JP-13-HAC-L-YL.yaml index 3632e10af6..1bb6905710 100644 --- a/data/custodian/JP-13-HAC-L-YL.yaml +++ b/data/custodian/JP-13-HAC-L-YL.yaml @@ -37,13 +37,14 @@ ghcid: method: CH_ANNOTATOR_SOURCE ghcid_history: - ghcid: JP-13-HAC-L-YL - valid_from: "2025-12-10T09:44:03Z" + valid_from: '2025-12-10T09:44:03Z' valid_to: null - reason: "Corrected region code from JP-TO (abbreviation) to JP-13 (Tokyo) per ISO 3166-2:JP" + reason: Corrected region code from JP-TO (abbreviation) to JP-13 (Tokyo) per ISO + 3166-2:JP - ghcid: JP-TO-HAC-L-YL valid_from: null - valid_to: "2025-12-10T09:44:03Z" - reason: "Previous GHCID with incorrect region code" + valid_to: '2025-12-10T09:44:03Z' + reason: Previous GHCID with incorrect region code - ghcid: JP-TO-HAC-L-YL ghcid_numeric: 17924990199130339682 valid_from: '2025-12-06T23:38:56.932170+00:00' @@ -101,8 +102,8 @@ ch_annotator: annotation_metadata: confidence_score: 0.98 verified: false - verification_date: - verified_by: + verification_date: null + verified_by: null entity_claims: - claim_type: full_name claim_value: YAMANOBIYOGEIJUTSUTANKIDAIGAKU Library @@ -204,3 +205,37 @@ location: geonames_id: 1863440 geonames_name: Hachiōji feature_code: PPLA2 +logo_enrichment: + enrichment_timestamp: '2025-12-25T14:35:31.607860+00:00' + source_url: http://www.yamano.ac.jp/about/facilities/library.html + extraction_method: crawl4ai + claims: + - claim_type: logo_url + claim_value: http://www.yamano.ac.jp/about/facilities/image/logo_pc.png + source_url: http://www.yamano.ac.jp/about/facilities/library.html + css_selector: '[document] > html > body.home.home-404 > header.l-header > div.l-header__logo + > div.l-header__logo__wrap > a.u-hidden-sp > img' + retrieved_on: '2025-12-25T14:35:31.607860+00:00' + extraction_method: crawl4ai_header_logo + detection_confidence: high + alt_text: '' + - claim_type: favicon_url + claim_value: http://www.yamano.ac.jp/about/facilities/lib/safari-pinned-tab.svg + source_url: http://www.yamano.ac.jp/about/facilities/library.html + css_selector: '[document] > html > head > link:nth-of-type(6)' + retrieved_on: '2025-12-25T14:35:31.607860+00:00' + extraction_method: crawl4ai_link_rel + favicon_type: '' + favicon_sizes: '' + - claim_type: og_image_url + claim_value: https://www.yamano.ac.jp/image/ogp.png + source_url: http://www.yamano.ac.jp/about/facilities/library.html + css_selector: '[document] > html > head > meta:nth-of-type(10)' + retrieved_on: '2025-12-25T14:35:31.607860+00:00' + extraction_method: crawl4ai_meta_og + summary: + total_claims: 3 + has_primary_logo: true + has_favicon: true + has_og_image: true + favicon_count: 5 diff --git a/data/custodian/JP-13-HAC-L-YUANL.yaml b/data/custodian/JP-13-HAC-L-YUANL.yaml index fe64dd149f..ddec00a6fa 100644 --- a/data/custodian/JP-13-HAC-L-YUANL.yaml +++ b/data/custodian/JP-13-HAC-L-YUANL.yaml @@ -37,13 +37,14 @@ ghcid: method: CH_ANNOTATOR_SOURCE ghcid_history: - ghcid: JP-13-HAC-L-YUANL - valid_from: "2025-12-10T09:44:03Z" + valid_from: '2025-12-10T09:44:03Z' valid_to: null - reason: "Corrected region code from JP-TO (abbreviation) to JP-13 (Tokyo) per ISO 3166-2:JP" + reason: Corrected region code from JP-TO (abbreviation) to JP-13 (Tokyo) per ISO + 3166-2:JP - ghcid: JP-TO-HAC-L-YUANL valid_from: null - valid_to: "2025-12-10T09:44:03Z" - reason: "Previous GHCID with incorrect region code" + valid_to: '2025-12-10T09:44:03Z' + reason: Previous GHCID with incorrect region code - ghcid: JP-TO-HAC-L-YUANL ghcid_numeric: 11857807885685771110 valid_from: '2025-12-06T23:38:55.470295+00:00' @@ -101,8 +102,8 @@ ch_annotator: annotation_metadata: confidence_score: 0.98 verified: false - verification_date: - verified_by: + verification_date: null + verified_by: null entity_claims: - claim_type: full_name claim_value: Yamazaki University of Animal Nursing Library @@ -190,7 +191,8 @@ wikidata_enrichment: description: organisatie uit Japan - id: Q56056912 label: Japan Consortium for Open Access Repository - description: promotes open access and open science in Japan with knowledge dissemination via digital repositories + description: promotes open access and open science in Japan with knowledge dissemination + via digital repositories wikidata_web: official_website: http://univ.yamazaki.ac.jp/univ/about/library/ wikidata_official_website: http://univ.yamazaki.ac.jp/univ/about/library/ @@ -212,3 +214,22 @@ location: geonames_id: 1863440 geonames_name: Hachiōji feature_code: PPLA2 +logo_enrichment: + enrichment_timestamp: '2025-12-25T14:35:44.410851+00:00' + source_url: http://univ.yamazaki.ac.jp/univ/about/library + extraction_method: crawl4ai + claims: + - claim_type: logo_url + claim_value: http://univ.yamazaki.ac.jp/Portals/0/images/univ/common/logo_univ.png?11826121542876 + source_url: http://univ.yamazaki.ac.jp/univ/about/library + css_selector: '#dnn_ctr753_HtmlModule_HtmlModule_lblContent > div.logo > a > img' + retrieved_on: '2025-12-25T14:35:44.410851+00:00' + extraction_method: crawl4ai_header_logo + detection_confidence: high + alt_text: '' + summary: + total_claims: 1 + has_primary_logo: true + has_favicon: false + has_og_image: false + favicon_count: 0 diff --git a/data/custodian/JP-13-HAC-M-HCHM.yaml b/data/custodian/JP-13-HAC-M-HCHM.yaml index 9c7c07cddd..5c0ca10532 100644 --- a/data/custodian/JP-13-HAC-M-HCHM.yaml +++ b/data/custodian/JP-13-HAC-M-HCHM.yaml @@ -214,3 +214,22 @@ location: geonames_id: 1863440 geonames_name: Hachiōji feature_code: PPLA2 +logo_enrichment: + enrichment_timestamp: '2025-12-25T14:35:50.863327+00:00' + source_url: https://www.city.hachioji.tokyo.jp/kankobunka/003/005/p005312.html + extraction_method: crawl4ai + claims: + - claim_type: favicon_url + claim_value: https://www.city.hachioji.tokyo.jp/share/imgs/main-favicon.ico + source_url: https://www.city.hachioji.tokyo.jp/kankobunka/003/005/p005312.html + css_selector: '[document] > html > head > link' + retrieved_on: '2025-12-25T14:35:50.863327+00:00' + extraction_method: crawl4ai_link_rel + favicon_type: image/vnd.microsoft.icon + favicon_sizes: '' + summary: + total_claims: 1 + has_primary_logo: false + has_favicon: true + has_og_image: false + favicon_count: 1 diff --git a/data/custodian/JP-13-HAC-M-HSC.yaml b/data/custodian/JP-13-HAC-M-HSC.yaml index 6a5e18fecc..c02584cb1c 100644 --- a/data/custodian/JP-13-HAC-M-HSC.yaml +++ b/data/custodian/JP-13-HAC-M-HSC.yaml @@ -39,13 +39,14 @@ ghcid: method: CH_ANNOTATOR_SOURCE ghcid_history: - ghcid: JP-13-HAC-M-HSC - valid_from: "2025-12-10T09:44:03Z" + valid_from: '2025-12-10T09:44:03Z' valid_to: null - reason: "Corrected region code from JP-TO (abbreviation) to JP-13 (Tokyo) per ISO 3166-2:JP" + reason: Corrected region code from JP-TO (abbreviation) to JP-13 (Tokyo) per ISO + 3166-2:JP - ghcid: JP-TO-HAC-M-HSC valid_from: null - valid_to: "2025-12-10T09:44:03Z" - reason: "Previous GHCID with incorrect region code" + valid_to: '2025-12-10T09:44:03Z' + reason: Previous GHCID with incorrect region code - ghcid: JP-TO-HAC-M-HSC ghcid_numeric: 9848006179648696697 valid_from: '2025-12-06T23:38:33.547319+00:00' @@ -103,8 +104,8 @@ ch_annotator: annotation_metadata: confidence_score: 0.98 verified: false - verification_date: - verified_by: + verification_date: null + verified_by: null entity_claims: - claim_type: full_name claim_value: HACHIOJI SCIENCE CENTER @@ -195,8 +196,8 @@ wikidata_enrichment: description: museum devoted primarily to science - id: Q148319 label: planetarium - description: theatre built primarily for presenting educational and entertaining shows about astronomy and the night - sky + description: theatre built primarily for presenting educational and entertaining + shows about astronomy and the night sky - id: Q842478 label: children's museum description: type of museum geared to children @@ -240,3 +241,22 @@ location: postal_code: 192-0062 street_address: OYOKOCHO, Hachioji Shi, Tokyo To, 192-0062 normalization_timestamp: '2025-12-09T12:21:34.524554+00:00' +logo_enrichment: + enrichment_timestamp: '2025-12-25T14:35:55.684371+00:00' + source_url: https://www.city.hachioji.tokyo.jp/shisetsu/003/p011705.html + extraction_method: crawl4ai + claims: + - claim_type: favicon_url + claim_value: https://www.city.hachioji.tokyo.jp/share/imgs/main-favicon.ico + source_url: https://www.city.hachioji.tokyo.jp/shisetsu/003/p011705.html + css_selector: '[document] > html > head > link' + retrieved_on: '2025-12-25T14:35:55.684371+00:00' + extraction_method: crawl4ai_link_rel + favicon_type: image/vnd.microsoft.icon + favicon_sizes: '' + summary: + total_claims: 1 + has_primary_logo: false + has_favicon: true + has_og_image: false + favicon_count: 1 diff --git a/data/custodian/JP-13-HAC-M-MPGTUPLS.yaml b/data/custodian/JP-13-HAC-M-MPGTUPLS.yaml index d108f89da2..bc9fc2e845 100644 --- a/data/custodian/JP-13-HAC-M-MPGTUPLS.yaml +++ b/data/custodian/JP-13-HAC-M-MPGTUPLS.yaml @@ -211,3 +211,28 @@ wikidata_enrichment: wikidata_official_website: https://www.toyaku.ac.jp/campus/hachioji/plant/ wikidata_social_media: instagram_username: medicinalplantgardentupls +logo_enrichment: + enrichment_timestamp: '2025-12-25T14:36:13.148358+00:00' + source_url: https://www.toyaku.ac.jp/campus/hachioji/plant + extraction_method: crawl4ai + claims: + - claim_type: favicon_url + claim_value: https://www.toyaku.ac.jp/apple-touch-icon.jpg + source_url: https://www.toyaku.ac.jp/campus/hachioji/plant + css_selector: '[document] > html > head > link:nth-of-type(3)' + retrieved_on: '2025-12-25T14:36:13.148358+00:00' + extraction_method: crawl4ai_link_rel + favicon_type: '' + favicon_sizes: '' + - claim_type: og_image_url + claim_value: https://www.toyaku.ac.jp/common/images/img-ogp-01.jpg + source_url: https://www.toyaku.ac.jp/campus/hachioji/plant + css_selector: '[document] > html > head > meta:nth-of-type(10)' + retrieved_on: '2025-12-25T14:36:13.148358+00:00' + extraction_method: crawl4ai_meta_og + summary: + total_claims: 2 + has_primary_logo: false + has_favicon: true + has_og_image: true + favicon_count: 2 diff --git a/data/custodian/JP-13-HAC-M-TFAM.yaml b/data/custodian/JP-13-HAC-M-TFAM.yaml index 8c8f3f4f90..d944842e79 100644 --- a/data/custodian/JP-13-HAC-M-TFAM.yaml +++ b/data/custodian/JP-13-HAC-M-TFAM.yaml @@ -1245,3 +1245,28 @@ youtube_enrichment: comments: [] thumbnail_url: https://i.ytimg.com/vi/cWJtBc9gc4g/hqdefault.jpg status: SUCCESS +logo_enrichment: + enrichment_timestamp: '2025-12-25T14:36:22.927970+00:00' + source_url: https://www.fujibi.or.jp + extraction_method: crawl4ai + claims: + - claim_type: favicon_url + claim_value: https://www.fujibi.or.jp/wp-content/themes/fam/icon.svg + source_url: https://www.fujibi.or.jp + css_selector: '[document] > html > head > link:nth-of-type(3)' + retrieved_on: '2025-12-25T14:36:22.927970+00:00' + extraction_method: crawl4ai_link_rel + favicon_type: image/svg+xml + favicon_sizes: '' + - claim_type: og_image_url + claim_value: https://www.fujibi.or.jp/wp-content/themes/fam/ogimage.png + source_url: https://www.fujibi.or.jp + css_selector: '[document] > html > head > meta:nth-of-type(14)' + retrieved_on: '2025-12-25T14:36:22.927970+00:00' + extraction_method: crawl4ai_meta_og + summary: + total_claims: 2 + has_primary_logo: false + has_favicon: true + has_og_image: true + favicon_count: 3 diff --git a/data/custodian/JP-13-HAC-M-TFSG.yaml b/data/custodian/JP-13-HAC-M-TFSG.yaml index c1ea1c1d50..e802266a61 100644 --- a/data/custodian/JP-13-HAC-M-TFSG.yaml +++ b/data/custodian/JP-13-HAC-M-TFSG.yaml @@ -232,3 +232,22 @@ wikidata_enrichment: commons_category: Tama Forest Science Garden image: Tama Forest Science Garden 2012.4.jpg wikidata_image: Tama Forest Science Garden 2012.4.jpg +logo_enrichment: + enrichment_timestamp: '2025-12-25T14:36:34.172503+00:00' + source_url: https://www.ffpri.affrc.go.jp/tmk + extraction_method: crawl4ai + claims: + - claim_type: favicon_url + claim_value: https://www.ffpri.affrc.go.jp/shared/images/favicon/apple-touch-icon-precomposed.png + source_url: https://www.ffpri.affrc.go.jp/tmk + css_selector: '[document] > html > head > link:nth-of-type(14)' + retrieved_on: '2025-12-25T14:36:34.172503+00:00' + extraction_method: crawl4ai_link_rel + favicon_type: '' + favicon_sizes: '' + summary: + total_claims: 1 + has_primary_logo: false + has_favicon: true + has_og_image: false + favicon_count: 2 diff --git a/data/custodian/JP-13-HAC-M-TM.yaml b/data/custodian/JP-13-HAC-M-TM.yaml index c5cb65530a..235ccd0f5f 100644 --- a/data/custodian/JP-13-HAC-M-TM.yaml +++ b/data/custodian/JP-13-HAC-M-TM.yaml @@ -248,3 +248,22 @@ wikidata_enrichment: - id: Q11528100 label: Tohata Architects & Engineers description: '' +logo_enrichment: + enrichment_timestamp: '2025-12-25T14:36:44.512279+00:00' + source_url: https://www.takao599museum.jp + extraction_method: crawl4ai + claims: + - claim_type: favicon_url + claim_value: https://www.takao599museum.jp/apple-touch-icon-precomposed.png + source_url: https://www.takao599museum.jp + css_selector: '[document] > html.fac-js-enabled.fac-dom-loaded > head > link:nth-of-type(3)' + retrieved_on: '2025-12-25T14:36:44.512279+00:00' + extraction_method: crawl4ai_link_rel + favicon_type: '' + favicon_sizes: '' + summary: + total_claims: 1 + has_primary_logo: false + has_favicon: true + has_og_image: false + favicon_count: 1 diff --git a/data/custodian/JP-13-HAC-M-TUM.yaml b/data/custodian/JP-13-HAC-M-TUM.yaml index 7763c4c26f..1b51ec790f 100644 --- a/data/custodian/JP-13-HAC-M-TUM.yaml +++ b/data/custodian/JP-13-HAC-M-TUM.yaml @@ -152,3 +152,28 @@ location: geonames_id: 1863440 geonames_name: Hachiōji feature_code: PPLA2 +logo_enrichment: + enrichment_timestamp: '2025-12-25T14:36:54.077648+00:00' + source_url: http://teikyo.jp/museum + extraction_method: crawl4ai + claims: + - claim_type: favicon_url + claim_value: https://teikyo.jp/museum/wp-content/uploads/2022/04/favicon-1.png + source_url: http://teikyo.jp/museum + css_selector: '[document] > html > head > link:nth-of-type(17)' + retrieved_on: '2025-12-25T14:36:54.077648+00:00' + extraction_method: crawl4ai_link_rel + favicon_type: '' + favicon_sizes: 32x32 + - claim_type: og_image_url + claim_value: https://teikyo.jp/museum/wp-content/uploads/2025/04/eyecatch_2025_seminar_sai-scaled.jpg + source_url: http://teikyo.jp/museum + css_selector: '[document] > html > head > meta:nth-of-type(17)' + retrieved_on: '2025-12-25T14:36:54.077648+00:00' + extraction_method: crawl4ai_meta_og + summary: + total_claims: 2 + has_primary_logo: false + has_favicon: true + has_og_image: true + favicon_count: 1 diff --git a/data/custodian/JP-13-HAG-A-HTA-haga_town_archives.yaml b/data/custodian/JP-13-HAG-A-HTA-haga_town_archives.yaml index b1178a0d44..f0367b18b9 100644 --- a/data/custodian/JP-13-HAG-A-HTA-haga_town_archives.yaml +++ b/data/custodian/JP-13-HAG-A-HTA-haga_town_archives.yaml @@ -32,13 +32,14 @@ ghcid: method: CH_ANNOTATOR_SOURCE ghcid_history: - ghcid: JP-13-HAG-A-HTA-haga_town_archives - valid_from: "2025-12-10T09:44:03Z" + valid_from: '2025-12-10T09:44:03Z' valid_to: null - reason: "Corrected region code from JP-TO (abbreviation) to JP-13 (Tokyo) per ISO 3166-2:JP" + reason: Corrected region code from JP-TO (abbreviation) to JP-13 (Tokyo) per ISO + 3166-2:JP - ghcid: JP-TO-HAG-A-HTA-haga_town_archives valid_from: null - valid_to: "2025-12-10T09:44:03Z" - reason: "Previous GHCID with incorrect region code" + valid_to: '2025-12-10T09:44:03Z' + reason: Previous GHCID with incorrect region code - ghcid: JP-TO-HAG-A-HTA-haga_town_archives ghcid_numeric: 15893078129013026606 valid_from: '2025-12-06T23:38:29.533372+00:00' @@ -96,8 +97,8 @@ ch_annotator: annotation_metadata: confidence_score: 0.98 verified: false - verification_date: - verified_by: + verification_date: null + verified_by: null entity_claims: - claim_type: full_name claim_value: Haga Town Archives @@ -153,3 +154,22 @@ location: geonames_id: 11112495 geonames_name: Haga feature_code: PPL +logo_enrichment: + enrichment_timestamp: '2025-12-25T14:37:54.928146+00:00' + source_url: https://www.town.tochigi-haga.lg.jp/menu/kurashi/sports/shogai/johokan/index.html + extraction_method: crawl4ai + claims: + - claim_type: favicon_url + claim_value: https://www.town.tochigi-haga.lg.jp/shared/images/favicon/apple-touch-icon-precomposed.png + source_url: https://www.town.tochigi-haga.lg.jp/menu/kurashi/sports/shogai/johokan/index.html + css_selector: '[document] > html > head > link:nth-of-type(14)' + retrieved_on: '2025-12-25T14:37:54.928146+00:00' + extraction_method: crawl4ai_link_rel + favicon_type: '' + favicon_sizes: '' + summary: + total_claims: 1 + has_primary_logo: false + has_favicon: true + has_og_image: false + favicon_count: 2 diff --git a/data/custodian/JP-13-HAG-A-HTA.yaml b/data/custodian/JP-13-HAG-A-HTA.yaml index 1be6e0cfeb..2d1330660e 100644 --- a/data/custodian/JP-13-HAG-A-HTA.yaml +++ b/data/custodian/JP-13-HAG-A-HTA.yaml @@ -32,13 +32,14 @@ ghcid: method: CH_ANNOTATOR_SOURCE ghcid_history: - ghcid: JP-13-HAG-A-HTA - valid_from: "2025-12-10T09:44:03Z" + valid_from: '2025-12-10T09:44:03Z' valid_to: null - reason: "Corrected region code from JP-TO (abbreviation) to JP-13 (Tokyo) per ISO 3166-2:JP" + reason: Corrected region code from JP-TO (abbreviation) to JP-13 (Tokyo) per ISO + 3166-2:JP - ghcid: JP-TO-HAG-A-HTA valid_from: null - valid_to: "2025-12-10T09:44:03Z" - reason: "Previous GHCID with incorrect region code" + valid_to: '2025-12-10T09:44:03Z' + reason: Previous GHCID with incorrect region code - ghcid: JP-TO-HAG-A-HTA ghcid_numeric: 13007848696833093898 valid_from: '2025-12-06T23:35:50.087366+00:00' @@ -96,8 +97,8 @@ ch_annotator: annotation_metadata: confidence_score: 0.98 verified: false - verification_date: - verified_by: + verification_date: null + verified_by: null entity_claims: - claim_type: full_name claim_value: Haga Town Archives @@ -153,3 +154,22 @@ location: geonames_id: 11112495 geonames_name: Haga feature_code: PPL +logo_enrichment: + enrichment_timestamp: '2025-12-25T14:52:28.786668+00:00' + source_url: https://www.town.tochigi-haga.lg.jp/menu/kurashi/sports/shogai/johokan/index.html + extraction_method: crawl4ai + claims: + - claim_type: favicon_url + claim_value: https://www.town.tochigi-haga.lg.jp/shared/images/favicon/apple-touch-icon-precomposed.png + source_url: https://www.town.tochigi-haga.lg.jp/menu/kurashi/sports/shogai/johokan/index.html + css_selector: '[document] > html > head > link:nth-of-type(14)' + retrieved_on: '2025-12-25T14:52:28.786668+00:00' + extraction_method: crawl4ai_link_rel + favicon_type: '' + favicon_sizes: '' + summary: + total_claims: 1 + has_primary_logo: false + has_favicon: true + has_og_image: false + favicon_count: 2 diff --git a/data/custodian/JP-13-HAG-L-IPL.yaml b/data/custodian/JP-13-HAG-L-IPL.yaml index 1886afd9aa..22a8c5c560 100644 --- a/data/custodian/JP-13-HAG-L-IPL.yaml +++ b/data/custodian/JP-13-HAG-L-IPL.yaml @@ -218,3 +218,22 @@ wikidata_enrichment: wikidata_media: image: Ichikai Town Library & Museum of History and Folklore.jpg wikidata_image: Ichikai Town Library & Museum of History and Folklore.jpg +logo_enrichment: + enrichment_timestamp: '2025-12-25T14:56:22.629763+00:00' + source_url: https://www.library.ichikai.tochigi.jp + extraction_method: crawl4ai + claims: + - claim_type: logo_url + claim_value: https://www.library.ichikai.tochigi.jp/images/header_logo.png + source_url: https://www.library.ichikai.tochigi.jp + css_selector: '#index > header > div.block.clearfix > h1 > a > img' + retrieved_on: '2025-12-25T14:56:22.629763+00:00' + extraction_method: crawl4ai_header_logo + detection_confidence: high + alt_text: 市貝町立図書館・歴史民俗資料館 + summary: + total_claims: 1 + has_primary_logo: true + has_favicon: false + has_og_image: false + favicon_count: 0 diff --git a/data/custodian/JP-13-HAG-L-M.yaml b/data/custodian/JP-13-HAG-L-M.yaml index ddf52f8dbd..f56acc437b 100644 --- a/data/custodian/JP-13-HAG-L-M.yaml +++ b/data/custodian/JP-13-HAG-L-M.yaml @@ -201,3 +201,22 @@ wikidata_enrichment: wikidata_web: official_website: http://www.town.mashiko.tochigi.jp/page/page000173.html wikidata_official_website: http://www.town.mashiko.tochigi.jp/page/page000173.html +logo_enrichment: + enrichment_timestamp: '2025-12-25T14:56:31.565829+00:00' + source_url: http://www.town.mashiko.tochigi.jp/page/page000173.html + extraction_method: crawl4ai + claims: + - claim_type: favicon_url + claim_value: http://www.town.mashiko.tochigi.jp/page/web_clip_icon.png + source_url: http://www.town.mashiko.tochigi.jp/page/page000173.html + css_selector: '[document] > html > body > link:nth-of-type(2)' + retrieved_on: '2025-12-25T14:56:31.565829+00:00' + extraction_method: crawl4ai_link_rel + favicon_type: '' + favicon_sizes: '' + summary: + total_claims: 1 + has_primary_logo: false + has_favicon: true + has_og_image: false + favicon_count: 2 diff --git a/data/custodian/JP-13-HAG-L-ML.yaml b/data/custodian/JP-13-HAG-L-ML.yaml index 398b57f785..9c442985db 100644 --- a/data/custodian/JP-13-HAG-L-ML.yaml +++ b/data/custodian/JP-13-HAG-L-ML.yaml @@ -201,3 +201,23 @@ wikidata_enrichment: wikidata_web: official_website: http://www.town.motegi.tochigi.jp/motegi/nextpage.php?cd=000000381&syurui=2&lev=2&hidchangemoji=2 wikidata_official_website: http://www.town.motegi.tochigi.jp/motegi/nextpage.php?cd=000000381&syurui=2&lev=2&hidchangemoji=2 +logo_enrichment: + enrichment_timestamp: '2025-12-25T14:56:42.473308+00:00' + source_url: http://www.town.motegi.tochigi.jp/motegi/nextpage.php?cd=000000381&syurui=2&lev=2&hidchangemoji=2 + extraction_method: crawl4ai + claims: + - claim_type: logo_url + claim_value: http://www.town.motegi.tochigi.jp/motegi/image/symbol.png + source_url: http://www.town.motegi.tochigi.jp/motegi/nextpage.php?cd=000000381&syurui=2&lev=2&hidchangemoji=2 + css_selector: '#header > a.navbar-brand > div.d-flex.align-items-center > div.mr-3 + > img.mt-logo-image' + retrieved_on: '2025-12-25T14:56:42.473308+00:00' + extraction_method: crawl4ai_header_logo + detection_confidence: high + alt_text: 茂木町町章 + summary: + total_claims: 1 + has_primary_logo: true + has_favicon: false + has_og_image: false + favicon_count: 0 diff --git a/data/custodian/JP-13-HAG-M-HTM.yaml b/data/custodian/JP-13-HAG-M-HTM.yaml index 00bd8f14ac..a454517178 100644 --- a/data/custodian/JP-13-HAG-M-HTM.yaml +++ b/data/custodian/JP-13-HAG-M-HTM.yaml @@ -256,3 +256,22 @@ wikidata_enrichment: wikidata_official_website: *id007 wikidata_social_media: twitter_username: hagamachisogoj1 +logo_enrichment: + enrichment_timestamp: '2025-12-25T14:56:48.192011+00:00' + source_url: https://www.town.tochigi-haga.lg.jp/menu/kurashi/sports/shogai/johokan/index.html + extraction_method: crawl4ai + claims: + - claim_type: favicon_url + claim_value: https://www.town.tochigi-haga.lg.jp/shared/images/favicon/apple-touch-icon-precomposed.png + source_url: https://www.town.tochigi-haga.lg.jp/menu/kurashi/sports/shogai/johokan/index.html + css_selector: '[document] > html > head > link:nth-of-type(14)' + retrieved_on: '2025-12-25T14:56:48.192011+00:00' + extraction_method: crawl4ai_link_rel + favicon_type: '' + favicon_sizes: '' + summary: + total_claims: 1 + has_primary_logo: false + has_favicon: true + has_og_image: false + favicon_count: 2 diff --git a/data/custodian/JP-13-HAG-M-IHFM.yaml b/data/custodian/JP-13-HAG-M-IHFM.yaml index 430b2feec4..38161e7228 100644 --- a/data/custodian/JP-13-HAG-M-IHFM.yaml +++ b/data/custodian/JP-13-HAG-M-IHFM.yaml @@ -32,13 +32,14 @@ ghcid: method: CH_ANNOTATOR_SOURCE ghcid_history: - ghcid: JP-13-HAG-M-IHFM - valid_from: "2025-12-10T09:44:04Z" + valid_from: '2025-12-10T09:44:04Z' valid_to: null - reason: "Corrected region code from JP-TO (abbreviation) to JP-13 (Tokyo) per ISO 3166-2:JP" + reason: Corrected region code from JP-TO (abbreviation) to JP-13 (Tokyo) per ISO + 3166-2:JP - ghcid: JP-TO-HAG-M-IHFM valid_from: null - valid_to: "2025-12-10T09:44:04Z" - reason: "Previous GHCID with incorrect region code" + valid_to: '2025-12-10T09:44:04Z' + reason: Previous GHCID with incorrect region code - ghcid: JP-TO-HAG-M-IHFM ghcid_numeric: 13648974713677583673 valid_from: '2025-12-06T23:38:31.926481+00:00' @@ -96,8 +97,8 @@ ch_annotator: annotation_metadata: confidence_score: 0.98 verified: false - verification_date: - verified_by: + verification_date: null + verified_by: null entity_claims: - claim_type: full_name claim_value: ICHIKAI HISTORICAL AND FOLK MUSEUM @@ -153,3 +154,22 @@ location: geonames_id: 13156713 geonames_name: Ichikai feature_code: PPL +logo_enrichment: + enrichment_timestamp: '2025-12-25T14:56:55.786042+00:00' + source_url: http://www.library.ichikai.tochigi.jp + extraction_method: crawl4ai + claims: + - claim_type: logo_url + claim_value: http://www.library.ichikai.tochigi.jp/images/header_logo.png + source_url: http://www.library.ichikai.tochigi.jp + css_selector: '#index > header > div.block.clearfix > h1 > a > img' + retrieved_on: '2025-12-25T14:56:55.786042+00:00' + extraction_method: crawl4ai_header_logo + detection_confidence: high + alt_text: 市貝町立図書館・歴史民俗資料館 + summary: + total_claims: 1 + has_primary_logo: true + has_favicon: false + has_og_image: false + favicon_count: 0 diff --git a/data/custodian/JP-13-HAG-M-MMCA.yaml b/data/custodian/JP-13-HAG-M-MMCA.yaml index ef219b9c8c..09bb30c7b0 100644 --- a/data/custodian/JP-13-HAG-M-MMCA.yaml +++ b/data/custodian/JP-13-HAG-M-MMCA.yaml @@ -871,3 +871,22 @@ youtube_enrichment: comments: [] thumbnail_url: https://i.ytimg.com/vi/x_q8bbUYgeU/hqdefault.jpg status: SUCCESS +logo_enrichment: + enrichment_timestamp: '2025-12-25T14:57:04.020537+00:00' + source_url: http://www.mashiko-museum.jp + extraction_method: crawl4ai + claims: + - claim_type: favicon_url + claim_value: http://www.mashiko-museum.jp/icon_images/iphoneicon.png + source_url: http://www.mashiko-museum.jp + css_selector: '[document] > html > head > link:nth-of-type(2)' + retrieved_on: '2025-12-25T14:57:04.020537+00:00' + extraction_method: crawl4ai_link_rel + favicon_type: '' + favicon_sizes: '' + summary: + total_claims: 1 + has_primary_logo: false + has_favicon: true + has_og_image: false + favicon_count: 2 diff --git a/data/custodian/JP-13-HAG-M-MMF.yaml b/data/custodian/JP-13-HAG-M-MMF.yaml index c16334df21..c49d59b24b 100644 --- a/data/custodian/JP-13-HAG-M-MMF.yaml +++ b/data/custodian/JP-13-HAG-M-MMF.yaml @@ -154,3 +154,22 @@ location: geonames_id: 2111827 geonames_name: Motegi feature_code: PPL +logo_enrichment: + enrichment_timestamp: '2025-12-25T14:57:13.583438+00:00' + source_url: https://fuminomori.jp + extraction_method: crawl4ai + claims: + - claim_type: favicon_url + claim_value: https://fuminomori.jp/templates/motegilibrary/favicon.ico + source_url: https://fuminomori.jp + css_selector: '[document] > html > head > link' + retrieved_on: '2025-12-25T14:57:13.583438+00:00' + extraction_method: crawl4ai_link_rel + favicon_type: image/vnd.microsoft.icon + favicon_sizes: '' + summary: + total_claims: 1 + has_primary_logo: false + has_favicon: true + has_og_image: false + favicon_count: 1 diff --git a/data/custodian/JP-13-HAM-L-H.yaml b/data/custodian/JP-13-HAM-L-H.yaml index 4a9e19cd4a..97cfd17303 100644 --- a/data/custodian/JP-13-HAM-L-H.yaml +++ b/data/custodian/JP-13-HAM-L-H.yaml @@ -204,3 +204,28 @@ wikidata_enrichment: wikidata_web: official_website: http://www.city.hamura.tokyo.jp/0000002123.html wikidata_official_website: http://www.city.hamura.tokyo.jp/0000002123.html +logo_enrichment: + enrichment_timestamp: '2025-12-25T14:57:43.203033+00:00' + source_url: http://www.city.hamura.tokyo.jp/0000002123.html + extraction_method: crawl4ai + claims: + - claim_type: favicon_url + claim_value: http://www.city.hamura.tokyo.jp/design_img/favicon.ico + source_url: http://www.city.hamura.tokyo.jp/0000002123.html + css_selector: '[document] > html > head > link:nth-of-type(6)' + retrieved_on: '2025-12-25T14:57:43.203033+00:00' + extraction_method: crawl4ai_link_rel + favicon_type: '' + favicon_sizes: '' + - claim_type: og_image_url + claim_value: https://www.city.hamura.tokyo.jp/design_img/og_image.png + source_url: http://www.city.hamura.tokyo.jp/0000002123.html + css_selector: '[document] > html > head > meta:nth-of-type(6)' + retrieved_on: '2025-12-25T14:57:43.203033+00:00' + extraction_method: crawl4ai_meta_og + summary: + total_claims: 2 + has_primary_logo: false + has_favicon: true + has_og_image: true + favicon_count: 1 diff --git a/data/custodian/JP-13-HAM-L-HCL.yaml b/data/custodian/JP-13-HAM-L-HCL.yaml index 9382358599..7214bdc0b7 100644 --- a/data/custodian/JP-13-HAM-L-HCL.yaml +++ b/data/custodian/JP-13-HAM-L-HCL.yaml @@ -204,3 +204,22 @@ wikidata_enrichment: wikidata_web: official_website: http://www.hamura-library.tokyo.jp/ wikidata_official_website: http://www.hamura-library.tokyo.jp/ +logo_enrichment: + enrichment_timestamp: '2025-12-25T14:57:54.794087+00:00' + source_url: https://www.hamura-library.tokyo.jp + extraction_method: crawl4ai + claims: + - claim_type: favicon_url + claim_value: https://www.hamura-library.tokyo.jp/themes/lib_theme/favicon.ico + source_url: https://www.hamura-library.tokyo.jp + css_selector: '[document] > html > head.notranslate > link' + retrieved_on: '2025-12-25T14:57:54.794087+00:00' + extraction_method: crawl4ai_link_rel + favicon_type: '' + favicon_sizes: '' + summary: + total_claims: 1 + has_primary_logo: false + has_favicon: true + has_og_image: false + favicon_count: 1 diff --git a/data/custodian/JP-13-HAM-M-HM.yaml b/data/custodian/JP-13-HAM-M-HM.yaml index a3785d3621..d50e2767cb 100644 --- a/data/custodian/JP-13-HAM-M-HM.yaml +++ b/data/custodian/JP-13-HAM-M-HM.yaml @@ -32,13 +32,14 @@ ghcid: method: CH_ANNOTATOR_SOURCE ghcid_history: - ghcid: JP-13-HAM-M-HM - valid_from: "2025-12-10T09:44:04Z" + valid_from: '2025-12-10T09:44:04Z' valid_to: null - reason: "Corrected region code from JP-TO (abbreviation) to JP-13 (Tokyo) per ISO 3166-2:JP" + reason: Corrected region code from JP-TO (abbreviation) to JP-13 (Tokyo) per ISO + 3166-2:JP - ghcid: JP-TO-HAM-M-HM valid_from: null - valid_to: "2025-12-10T09:44:04Z" - reason: "Previous GHCID with incorrect region code" + valid_to: '2025-12-10T09:44:04Z' + reason: Previous GHCID with incorrect region code - ghcid: JP-TO-HAM-M-HM ghcid_numeric: 14228598473420585810 valid_from: '2025-12-06T23:38:33.728753+00:00' @@ -96,8 +97,8 @@ ch_annotator: annotation_metadata: confidence_score: 0.98 verified: false - verification_date: - verified_by: + verification_date: null + verified_by: null entity_claims: - claim_type: full_name claim_value: HAMURA MUSEUM @@ -151,3 +152,28 @@ location: geonames_id: 11611629 geonames_name: Hamura feature_code: PPLA2 +logo_enrichment: + enrichment_timestamp: '2025-12-25T14:58:01.164034+00:00' + source_url: https://www.city.hamura.tokyo.jp/0000005474.html + extraction_method: crawl4ai + claims: + - claim_type: favicon_url + claim_value: https://www.city.hamura.tokyo.jp/design_img/favicon.ico + source_url: https://www.city.hamura.tokyo.jp/0000005474.html + css_selector: '[document] > html > head > link:nth-of-type(6)' + retrieved_on: '2025-12-25T14:58:01.164034+00:00' + extraction_method: crawl4ai_link_rel + favicon_type: '' + favicon_sizes: '' + - claim_type: og_image_url + claim_value: https://www.city.hamura.tokyo.jp/design_img/og_image.png + source_url: https://www.city.hamura.tokyo.jp/0000005474.html + css_selector: '[document] > html > head > meta:nth-of-type(6)' + retrieved_on: '2025-12-25T14:58:01.164034+00:00' + extraction_method: crawl4ai_meta_og + summary: + total_claims: 2 + has_primary_logo: false + has_favicon: true + has_og_image: true + favicon_count: 1 diff --git a/data/custodian/JP-13-HAM-M-HZP.yaml b/data/custodian/JP-13-HAM-M-HZP.yaml index 19d1e20cc7..ef56d8291a 100644 --- a/data/custodian/JP-13-HAM-M-HZP.yaml +++ b/data/custodian/JP-13-HAM-M-HZP.yaml @@ -39,13 +39,14 @@ ghcid: method: CH_ANNOTATOR_SOURCE ghcid_history: - ghcid: JP-13-HAM-M-HZP - valid_from: "2025-12-10T09:44:04Z" + valid_from: '2025-12-10T09:44:04Z' valid_to: null - reason: "Corrected region code from JP-TO (abbreviation) to JP-13 (Tokyo) per ISO 3166-2:JP" + reason: Corrected region code from JP-TO (abbreviation) to JP-13 (Tokyo) per ISO + 3166-2:JP - ghcid: JP-TO-HAM-M-HZP valid_from: null - valid_to: "2025-12-10T09:44:04Z" - reason: "Previous GHCID with incorrect region code" + valid_to: '2025-12-10T09:44:04Z' + reason: Previous GHCID with incorrect region code - ghcid: JP-TO-HAM-M-HZP ghcid_numeric: 8960255251096834969 valid_from: '2025-12-06T23:38:33.730945+00:00' @@ -103,8 +104,8 @@ ch_annotator: annotation_metadata: confidence_score: 0.98 verified: false - verification_date: - verified_by: + verification_date: null + verified_by: null entity_claims: - claim_type: full_name claim_value: HAMURA ZOOLOGICAL PARK @@ -202,8 +203,8 @@ wikidata_enrichment: instance_of: &id004 - id: Q43501 label: zoo - description: 'collection of assorted wild animal species kept for purposes like: study, conservation and, or, commercial - exhibition' + description: 'collection of assorted wild animal species kept for purposes like: + study, conservation and, or, commercial exhibition' wikidata_instance_of: *id004 wikidata_location: country: &id005 @@ -250,3 +251,28 @@ location: postal_code: 205-0012 street_address: HANE, Hamura Shi, Tokyo To, 205-0012 normalization_timestamp: '2025-12-09T12:21:35.565489+00:00' +logo_enrichment: + enrichment_timestamp: '2025-12-25T14:58:10.100083+00:00' + source_url: http://www.t-net.ne.jp/~hamura-z + extraction_method: crawl4ai + claims: + - claim_type: favicon_url + claim_value: http://hamurazoo.jp/icon.png + source_url: http://www.t-net.ne.jp/~hamura-z + css_selector: '[document] > html > head > link:nth-of-type(3)' + retrieved_on: '2025-12-25T14:58:10.100083+00:00' + extraction_method: crawl4ai_link_rel + favicon_type: '' + favicon_sizes: '' + - claim_type: og_image_url + claim_value: http://hamurazoo.jp/ogimg.jpg + source_url: http://www.t-net.ne.jp/~hamura-z + css_selector: '[document] > html > head > meta:nth-of-type(13)' + retrieved_on: '2025-12-25T14:58:10.100083+00:00' + extraction_method: crawl4ai_meta_og + summary: + total_claims: 2 + has_primary_logo: false + has_favicon: true + has_og_image: true + favicon_count: 3 diff --git a/data/custodian/JP-13-HIE-M-NESMTD.yaml b/data/custodian/JP-13-HIE-M-NESMTD.yaml index c38201a8eb..e859fc97d5 100644 --- a/data/custodian/JP-13-HIE-M-NESMTD.yaml +++ b/data/custodian/JP-13-HIE-M-NESMTD.yaml @@ -253,3 +253,22 @@ location: geonames_id: 9290610 feature_code: PPL normalization_timestamp: '2025-12-09T06:53:34.141451+00:00' +logo_enrichment: + enrichment_timestamp: '2025-12-25T14:58:17.872556+00:00' + source_url: http://www.nishiwaki-cs.or.jp/terra + extraction_method: crawl4ai + claims: + - claim_type: favicon_url + claim_value: http://www.nishiwaki-cs.or.jp/image/animated_favicon2.gif + source_url: http://www.nishiwaki-cs.or.jp/terra + css_selector: '[document] > html > head > link' + retrieved_on: '2025-12-25T14:58:17.872556+00:00' + extraction_method: crawl4ai_link_rel + favicon_type: image/gif + favicon_sizes: '' + summary: + total_claims: 1 + has_primary_logo: false + has_favicon: true + has_og_image: false + favicon_count: 1 diff --git a/data/custodian/JP-13-HIG-L-HL-higashiyamatoshiritsukiyohara_library.yaml b/data/custodian/JP-13-HIG-L-HL-higashiyamatoshiritsukiyohara_library.yaml index ef4ca92a94..4440c9166f 100644 --- a/data/custodian/JP-13-HIG-L-HL-higashiyamatoshiritsukiyohara_library.yaml +++ b/data/custodian/JP-13-HIG-L-HL-higashiyamatoshiritsukiyohara_library.yaml @@ -204,3 +204,20 @@ wikidata_enrichment: wikidata_web: official_website: http://www.lib.higashiyamato.tokyo.jp/index.html wikidata_official_website: http://www.lib.higashiyamato.tokyo.jp/index.html +logo_enrichment: + enrichment_timestamp: '2025-12-25T14:59:47.640682+00:00' + source_url: https://www.lib.higashiyamato.tokyo.jp + extraction_method: crawl4ai + claims: + - claim_type: og_image_url + claim_value: http://localhost/TOSHOW/asp/shared/img/snsThumbnail.png + source_url: https://www.lib.higashiyamato.tokyo.jp + css_selector: '[document] > html > head > meta:nth-of-type(15)' + retrieved_on: '2025-12-25T14:59:47.640682+00:00' + extraction_method: crawl4ai_meta_og + summary: + total_claims: 1 + has_primary_logo: false + has_favicon: false + has_og_image: true + favicon_count: 0 diff --git a/data/custodian/JP-13-HIG-L-HL-higashiyamatoshiritsusakuragaoka_library.yaml b/data/custodian/JP-13-HIG-L-HL-higashiyamatoshiritsusakuragaoka_library.yaml index 498ee1f016..b3f447480e 100644 --- a/data/custodian/JP-13-HIG-L-HL-higashiyamatoshiritsusakuragaoka_library.yaml +++ b/data/custodian/JP-13-HIG-L-HL-higashiyamatoshiritsusakuragaoka_library.yaml @@ -204,3 +204,20 @@ wikidata_enrichment: wikidata_web: official_website: http://www.lib.higashiyamato.tokyo.jp/index.html wikidata_official_website: http://www.lib.higashiyamato.tokyo.jp/index.html +logo_enrichment: + enrichment_timestamp: '2025-12-25T14:59:59.088263+00:00' + source_url: https://www.lib.higashiyamato.tokyo.jp + extraction_method: crawl4ai + claims: + - claim_type: og_image_url + claim_value: http://localhost/TOSHOW/asp/shared/img/snsThumbnail.png + source_url: https://www.lib.higashiyamato.tokyo.jp + css_selector: '[document] > html > head > meta:nth-of-type(15)' + retrieved_on: '2025-12-25T14:59:59.088263+00:00' + extraction_method: crawl4ai_meta_og + summary: + total_claims: 1 + has_primary_logo: false + has_favicon: false + has_og_image: true + favicon_count: 0 diff --git a/data/custodian/JP-13-HIG-L-HL.yaml b/data/custodian/JP-13-HIG-L-HL.yaml index 47187fec8c..b501be9065 100644 --- a/data/custodian/JP-13-HIG-L-HL.yaml +++ b/data/custodian/JP-13-HIG-L-HL.yaml @@ -205,3 +205,20 @@ wikidata_enrichment: wikidata_web: official_website: http://www.lib.higashiyamato.tokyo.jp/ wikidata_official_website: http://www.lib.higashiyamato.tokyo.jp/ +logo_enrichment: + enrichment_timestamp: '2025-12-25T15:00:08.551604+00:00' + source_url: https://www.lib.higashiyamato.tokyo.jp + extraction_method: crawl4ai + claims: + - claim_type: og_image_url + claim_value: http://localhost/TOSHOW/asp/shared/img/snsThumbnail.png + source_url: https://www.lib.higashiyamato.tokyo.jp + css_selector: '[document] > html > head > meta:nth-of-type(15)' + retrieved_on: '2025-12-25T15:00:08.551604+00:00' + extraction_method: crawl4ai_meta_og + summary: + total_claims: 1 + has_primary_logo: false + has_favicon: false + has_og_image: true + favicon_count: 0 diff --git a/data/custodian/JP-13-HIG-L-TBSL.yaml b/data/custodian/JP-13-HIG-L-TBSL.yaml index e9acedfe10..0c386df173 100644 --- a/data/custodian/JP-13-HIG-L-TBSL.yaml +++ b/data/custodian/JP-13-HIG-L-TBSL.yaml @@ -32,13 +32,14 @@ ghcid: method: CH_ANNOTATOR_SOURCE ghcid_history: - ghcid: JP-13-HIG-L-TBSL - valid_from: "2025-12-10T09:44:04Z" + valid_from: '2025-12-10T09:44:04Z' valid_to: null - reason: "Corrected region code from JP-TO (abbreviation) to JP-13 (Tokyo) per ISO 3166-2:JP" + reason: Corrected region code from JP-TO (abbreviation) to JP-13 (Tokyo) per ISO + 3166-2:JP - ghcid: JP-TO-HIG-L-TBSL valid_from: null - valid_to: "2025-12-10T09:44:04Z" - reason: "Previous GHCID with incorrect region code" + valid_to: '2025-12-10T09:44:04Z' + reason: Previous GHCID with incorrect region code - ghcid: JP-TO-HIG-L-TBSL ghcid_numeric: 2864808006818620837 valid_from: '2025-12-06T23:38:58.866015+00:00' @@ -96,8 +97,8 @@ ch_annotator: annotation_metadata: confidence_score: 0.98 verified: false - verification_date: - verified_by: + verification_date: null + verified_by: null entity_claims: - claim_type: full_name claim_value: Tokyo Biblical Seminary Library @@ -153,3 +154,20 @@ location: geonames_id: 7279570 geonames_name: Higashimurayama feature_code: PPLA2 +logo_enrichment: + enrichment_timestamp: '2025-12-25T15:00:46.589646+00:00' + source_url: http://www.jhc.or.jp/tbs/library/index.html + extraction_method: crawl4ai + claims: + - claim_type: og_image_url + claim_value: https://www.jhc.or.jp/tbs//bdflashinfo/thumbnail.png + source_url: http://www.jhc.or.jp/tbs/library/index.html + css_selector: '[document] > html > head > meta:nth-of-type(8)' + retrieved_on: '2025-12-25T15:00:46.589646+00:00' + extraction_method: crawl4ai_meta_og + summary: + total_claims: 1 + has_primary_logo: false + has_favicon: false + has_og_image: true + favicon_count: 0 diff --git a/data/custodian/JP-13-HIG-M-FMH.yaml b/data/custodian/JP-13-HIG-M-FMH.yaml index 66670ec3b6..f91e9bb157 100644 --- a/data/custodian/JP-13-HIG-M-FMH.yaml +++ b/data/custodian/JP-13-HIG-M-FMH.yaml @@ -39,13 +39,14 @@ ghcid: method: CH_ANNOTATOR_SOURCE ghcid_history: - ghcid: JP-13-HIG-M-FMH - valid_from: "2025-12-10T09:44:04Z" + valid_from: '2025-12-10T09:44:04Z' valid_to: null - reason: "Corrected region code from JP-TO (abbreviation) to JP-13 (Tokyo) per ISO 3166-2:JP" + reason: Corrected region code from JP-TO (abbreviation) to JP-13 (Tokyo) per ISO + 3166-2:JP - ghcid: JP-TO-HIG-M-FMH valid_from: null - valid_to: "2025-12-10T09:44:04Z" - reason: "Previous GHCID with incorrect region code" + valid_to: '2025-12-10T09:44:04Z' + reason: Previous GHCID with incorrect region code - ghcid: JP-TO-HIG-M-FMH ghcid_numeric: 9770563110900817089 valid_from: '2025-12-06T23:38:33.691688+00:00' @@ -103,8 +104,8 @@ ch_annotator: annotation_metadata: confidence_score: 0.98 verified: false - verification_date: - verified_by: + verification_date: null + verified_by: null entity_claims: - claim_type: full_name claim_value: THE FOLK MUSEUM OF HIGASHIMURAYAMA @@ -219,3 +220,23 @@ location: postal_code: 189-0021 street_address: SUWACHO, Higashimurayama Shi, Tokyo To, 189-0021 normalization_timestamp: '2025-12-09T12:21:36.167270+00:00' +logo_enrichment: + enrichment_timestamp: '2025-12-25T15:01:01.438946+00:00' + source_url: https://www.city.higashimurayama.tokyo.jp/tanoshimi/rekishi/furusato + extraction_method: crawl4ai + claims: + - claim_type: logo_url + claim_value: https://www.city.higashimurayama.tokyo.jp/images/header_logo.png + source_url: https://www.city.higashimurayama.tokyo.jp/tanoshimi/rekishi/furusato + css_selector: '#header_block > header.header_area > div.l_container > div.header_upper.fixed + > div.header_box_left > div.header_logo > a > img' + retrieved_on: '2025-12-25T15:01:01.438946+00:00' + extraction_method: crawl4ai_header_logo + detection_confidence: high + alt_text: 東村山市 Higashimurayama City + summary: + total_claims: 1 + has_primary_logo: true + has_favicon: false + has_og_image: false + favicon_count: 0 diff --git a/data/custodian/JP-13-HIG-M-HCM.yaml b/data/custodian/JP-13-HIG-M-HCM.yaml index 7cf2f41a2b..ac119d3475 100644 --- a/data/custodian/JP-13-HIG-M-HCM.yaml +++ b/data/custodian/JP-13-HIG-M-HCM.yaml @@ -32,13 +32,14 @@ ghcid: method: CH_ANNOTATOR_SOURCE ghcid_history: - ghcid: JP-13-HIG-M-HCM - valid_from: "2025-12-10T09:44:04Z" + valid_from: '2025-12-10T09:44:04Z' valid_to: null - reason: "Corrected region code from JP-TO (abbreviation) to JP-13 (Tokyo) per ISO 3166-2:JP" + reason: Corrected region code from JP-TO (abbreviation) to JP-13 (Tokyo) per ISO + 3166-2:JP - ghcid: JP-TO-HIG-M-HCM valid_from: null - valid_to: "2025-12-10T09:44:04Z" - reason: "Previous GHCID with incorrect region code" + valid_to: '2025-12-10T09:44:04Z' + reason: Previous GHCID with incorrect region code - ghcid: JP-TO-HIG-M-HCM ghcid_numeric: 5777366010648073427 valid_from: '2025-12-06T23:38:33.709577+00:00' @@ -96,8 +97,8 @@ ch_annotator: annotation_metadata: confidence_score: 0.98 verified: false - verification_date: - verified_by: + verification_date: null + verified_by: null entity_claims: - claim_type: full_name claim_value: HIGASHIYAMATO CITY MUSEUM @@ -151,3 +152,28 @@ location: geonames_id: 6822136 geonames_name: Higashiyamato feature_code: PPLA2 +logo_enrichment: + enrichment_timestamp: '2025-12-25T15:01:10.418014+00:00' + source_url: https://www.city.higashiyamato.lg.jp/index.cfm/35,0,366,html + extraction_method: crawl4ai + claims: + - claim_type: favicon_url + claim_value: https://www.city.higashiyamato.lg.jp/index.cfm/_template_/_site_/_default_/_res/images/apple-touch-icon-precomposed.png + source_url: https://www.city.higashiyamato.lg.jp/index.cfm/35,0,366,html + css_selector: '[document] > html > head > link:nth-of-type(6)' + retrieved_on: '2025-12-25T15:01:10.418014+00:00' + extraction_method: crawl4ai_link_rel + favicon_type: '' + favicon_sizes: '' + - claim_type: og_image_url + claim_value: https://www.city.higashiyamato.lg.jp/_template_/_site_/_default_/_res/images/sns/ogimage.png + source_url: https://www.city.higashiyamato.lg.jp/index.cfm/35,0,366,html + css_selector: '[document] > html > head > meta:nth-of-type(10)' + retrieved_on: '2025-12-25T15:01:10.418014+00:00' + extraction_method: crawl4ai_meta_og + summary: + total_claims: 2 + has_primary_logo: false + has_favicon: true + has_og_image: true + favicon_count: 2 diff --git a/data/custodian/JP-13-HIG-M-NHSDM.yaml b/data/custodian/JP-13-HIG-M-NHSDM.yaml index e05813c07f..c836fa0c2d 100644 --- a/data/custodian/JP-13-HIG-M-NHSDM.yaml +++ b/data/custodian/JP-13-HIG-M-NHSDM.yaml @@ -273,3 +273,39 @@ wikidata_enrichment: - id: Q724647 label: Good Design Award description: Japanese design award +logo_enrichment: + enrichment_timestamp: '2025-12-25T15:01:36.341133+00:00' + source_url: https://www.nhdm.jp + extraction_method: crawl4ai + claims: + - claim_type: logo_url + claim_value: https://www.nhdm.jp/hansen/wp-content/themes/hansen/_assets/images/top/logo_title.png + source_url: https://www.nhdm.jp + css_selector: '#top > header.siteHeader > div.siteHeader__inner.u-siteHeaderNav:nth-of-type(2) + > div.siteHeader__title > a.siteHeader__titleLogo > img.siteHeader__titleLogoImg' + retrieved_on: '2025-12-25T15:01:36.341133+00:00' + extraction_method: crawl4ai_header_logo + detection_confidence: high + alt_text: logo + - claim_type: favicon_url + claim_value: https://www.nhdm.jp/hansen/wp-content/themes/hansen/_assets/images/_etc/custom-icon.png + source_url: https://www.nhdm.jp + css_selector: '[document] > html.no-js.wf-noto-sans-cjk-jp-n4-active > head > + link:nth-of-type(9)' + retrieved_on: '2025-12-25T15:01:36.341133+00:00' + extraction_method: crawl4ai_link_rel + favicon_type: image/png + favicon_sizes: '' + - claim_type: og_image_url + claim_value: https://www.nhdm.jp/hansen/wp-content/themes/hansen/_assets/images/_etc/ogp.jpg + source_url: https://www.nhdm.jp + css_selector: '[document] > html.no-js.wf-noto-sans-cjk-jp-n4-active > head > + meta:nth-of-type(4)' + retrieved_on: '2025-12-25T15:01:36.341133+00:00' + extraction_method: crawl4ai_meta_og + summary: + total_claims: 3 + has_primary_logo: true + has_favicon: true + has_og_image: true + favicon_count: 3 diff --git a/data/custodian/JP-13-HIG-M-TCBM.yaml b/data/custodian/JP-13-HIG-M-TCBM.yaml index 4604927c9a..9e7efc9c8e 100644 --- a/data/custodian/JP-13-HIG-M-TCBM.yaml +++ b/data/custodian/JP-13-HIG-M-TCBM.yaml @@ -32,13 +32,14 @@ ghcid: method: CH_ANNOTATOR_SOURCE ghcid_history: - ghcid: JP-13-HIG-M-TCBM - valid_from: "2025-12-10T09:44:04Z" + valid_from: '2025-12-10T09:44:04Z' valid_to: null - reason: "Corrected region code from JP-TO (abbreviation) to JP-13 (Tokyo) per ISO 3166-2:JP" + reason: Corrected region code from JP-TO (abbreviation) to JP-13 (Tokyo) per ISO + 3166-2:JP - ghcid: JP-TO-HIG-M-TCBM valid_from: null - valid_to: "2025-12-10T09:44:04Z" - reason: "Previous GHCID with incorrect region code" + valid_to: '2025-12-10T09:44:04Z' + reason: Previous GHCID with incorrect region code - ghcid: JP-TO-HIG-M-TCBM ghcid_numeric: 14985891489123884639 valid_from: '2025-12-06T23:38:33.689342+00:00' @@ -96,8 +97,8 @@ ch_annotator: annotation_metadata: confidence_score: 0.98 verified: false - verification_date: - verified_by: + verification_date: null + verified_by: null entity_claims: - claim_type: full_name claim_value: TOKUZOJI CONSERVATION OF BOARD MONUMENT @@ -151,3 +152,20 @@ location: geonames_id: 7279570 geonames_name: Higashimurayama feature_code: PPLA2 +logo_enrichment: + enrichment_timestamp: '2025-12-25T15:01:46.267227+00:00' + source_url: http://www.tokuzo-ji.com + extraction_method: crawl4ai + claims: + - claim_type: og_image_url + claim_value: http://www.tokuzo-ji.com/images/common/ogp_logo.jpg + source_url: http://www.tokuzo-ji.com + css_selector: '[document] > html > head > meta:nth-of-type(13)' + retrieved_on: '2025-12-25T15:01:46.267227+00:00' + extraction_method: crawl4ai_meta_og + summary: + total_claims: 1 + has_primary_logo: false + has_favicon: false + has_og_image: true + favicon_count: 0 diff --git a/data/custodian/JP-13-HIM-M-HSBG.yaml b/data/custodian/JP-13-HIM-M-HSBG.yaml index b515b71363..1b6414af16 100644 --- a/data/custodian/JP-13-HIM-M-HSBG.yaml +++ b/data/custodian/JP-13-HIM-M-HSBG.yaml @@ -237,3 +237,28 @@ wikidata_enrichment: - id: Q445298 label: Itsuko Hasegawa description: Japanese architect +logo_enrichment: + enrichment_timestamp: '2025-12-25T15:02:19.147692+00:00' + source_url: https://www.himi-kaihin.com + extraction_method: crawl4ai + claims: + - claim_type: favicon_url + claim_value: https://www.himi-kaihin.com/common/images/parts/favicon.png + source_url: https://www.himi-kaihin.com + css_selector: '[document] > html > head > link:nth-of-type(5)' + retrieved_on: '2025-12-25T15:02:19.147692+00:00' + extraction_method: crawl4ai_link_rel + favicon_type: '' + favicon_sizes: '' + - claim_type: og_image_url + claim_value: https://www.himi-kaihin.com/common/images/parts/favicon.png + source_url: https://www.himi-kaihin.com + css_selector: '[document] > html > head > meta:nth-of-type(5)' + retrieved_on: '2025-12-25T15:02:19.147692+00:00' + extraction_method: crawl4ai_meta_og + summary: + total_claims: 2 + has_primary_logo: false + has_favicon: true + has_og_image: true + favicon_count: 1 diff --git a/data/custodian/JP-13-HIN-L-HL-hinocho_library.yaml b/data/custodian/JP-13-HIN-L-HL-hinocho_library.yaml index bcff892ea8..64a9344c27 100644 --- a/data/custodian/JP-13-HIN-L-HL-hinocho_library.yaml +++ b/data/custodian/JP-13-HIN-L-HL-hinocho_library.yaml @@ -201,3 +201,22 @@ wikidata_enrichment: wikidata_web: official_website: http://tosyo.town.hino.tottori.jp wikidata_official_website: http://tosyo.town.hino.tottori.jp +logo_enrichment: + enrichment_timestamp: '2025-12-25T15:02:33.976740+00:00' + source_url: http://tosyo.town.hino.tottori.jp + extraction_method: crawl4ai + claims: + - claim_type: favicon_url + claim_value: http://tosyo.town.hino.tottori.jp/img/favicon.ico + source_url: http://tosyo.town.hino.tottori.jp + css_selector: '[document] > html > head > link' + retrieved_on: '2025-12-25T15:02:33.976740+00:00' + extraction_method: crawl4ai_link_rel + favicon_type: '' + favicon_sizes: '' + summary: + total_claims: 1 + has_primary_logo: false + has_favicon: true + has_og_image: false + favicon_count: 1 diff --git a/data/custodian/JP-13-HIN-L-JWSUL.yaml b/data/custodian/JP-13-HIN-L-JWSUL.yaml index 7a0eefa733..9dccd8d94f 100644 --- a/data/custodian/JP-13-HIN-L-JWSUL.yaml +++ b/data/custodian/JP-13-HIN-L-JWSUL.yaml @@ -37,13 +37,14 @@ ghcid: method: CH_ANNOTATOR_SOURCE ghcid_history: - ghcid: JP-13-HIN-L-JWSUL - valid_from: "2025-12-10T09:44:04Z" + valid_from: '2025-12-10T09:44:04Z' valid_to: null - reason: "Corrected region code from JP-TO (abbreviation) to JP-13 (Tokyo) per ISO 3166-2:JP" + reason: Corrected region code from JP-TO (abbreviation) to JP-13 (Tokyo) per ISO + 3166-2:JP - ghcid: JP-TO-HIN-L-JWSUL valid_from: null - valid_to: "2025-12-10T09:44:04Z" - reason: "Previous GHCID with incorrect region code" + valid_to: '2025-12-10T09:44:04Z' + reason: Previous GHCID with incorrect region code - ghcid: JP-TO-HIN-L-JWSUL ghcid_numeric: 8113316008130357374 valid_from: '2025-12-06T23:38:54.901681+00:00' @@ -101,8 +102,8 @@ ch_annotator: annotation_metadata: confidence_score: 0.98 verified: false - verification_date: - verified_by: + verification_date: null + verified_by: null entity_claims: - claim_type: full_name claim_value: Jissen Women's University Library @@ -190,7 +191,8 @@ wikidata_enrichment: description: organisatie uit Japan - id: Q56056912 label: Japan Consortium for Open Access Repository - description: promotes open access and open science in Japan with knowledge dissemination via digital repositories + description: promotes open access and open science in Japan with knowledge dissemination + via digital repositories wikidata_web: official_website: http://www.jissen.ac.jp/library wikidata_official_website: http://www.jissen.ac.jp/library @@ -212,3 +214,22 @@ location: geonames_id: 1862599 geonames_name: Hino feature_code: PPLA2 +logo_enrichment: + enrichment_timestamp: '2025-12-25T15:03:14.754827+00:00' + source_url: http://www.jissen.ac.jp/library + extraction_method: crawl4ai + claims: + - claim_type: favicon_url + claim_value: http://www.jissen.ac.jp/favicon.ico + source_url: http://www.jissen.ac.jp/library + css_selector: '[document] > html > head > link' + retrieved_on: '2025-12-25T15:03:14.754827+00:00' + extraction_method: crawl4ai_link_rel + favicon_type: '' + favicon_sizes: '' + summary: + total_claims: 1 + has_primary_logo: false + has_favicon: true + has_og_image: false + favicon_count: 1 diff --git a/data/custodian/JP-13-HIN-L-KL.yaml b/data/custodian/JP-13-HIN-L-KL.yaml index e0716e68f7..4fe421809a 100644 --- a/data/custodian/JP-13-HIN-L-KL.yaml +++ b/data/custodian/JP-13-HIN-L-KL.yaml @@ -32,13 +32,14 @@ ghcid: method: CH_ANNOTATOR_SOURCE ghcid_history: - ghcid: JP-13-HIN-L-KL - valid_from: "2025-12-10T09:44:04Z" + valid_from: '2025-12-10T09:44:04Z' valid_to: null - reason: "Corrected region code from JP-TO (abbreviation) to JP-13 (Tokyo) per ISO 3166-2:JP" + reason: Corrected region code from JP-TO (abbreviation) to JP-13 (Tokyo) per ISO + 3166-2:JP - ghcid: JP-TO-HIN-L-KL valid_from: null - valid_to: "2025-12-10T09:44:04Z" - reason: "Previous GHCID with incorrect region code" + valid_to: '2025-12-10T09:44:04Z' + reason: Previous GHCID with incorrect region code - ghcid: JP-TO-HIN-L-KL ghcid_numeric: 8947973121639993294 valid_from: '2025-12-06T23:38:46.786916+00:00' @@ -96,8 +97,8 @@ ch_annotator: annotation_metadata: confidence_score: 0.98 verified: false - verification_date: - verified_by: + verification_date: null + verified_by: null entity_claims: - claim_type: full_name claim_value: KOFUCHORITSU Library @@ -153,3 +154,36 @@ location: geonames_id: 1859100 geonames_name: Kofu feature_code: PPLA +logo_enrichment: + enrichment_timestamp: '2025-12-25T15:03:30.027203+00:00' + source_url: http://lib.town-kofu.jp + extraction_method: crawl4ai + claims: + - claim_type: logo_url + claim_value: http://lib.town-kofu.jp/user/lib/images/logo.png + source_url: http://lib.town-kofu.jp + css_selector: '#site-logo > a > img' + retrieved_on: '2025-12-25T15:03:30.027203+00:00' + extraction_method: crawl4ai_header_logo + detection_confidence: high + alt_text: 江府町立図書館 + - claim_type: favicon_url + claim_value: http://lib.town-kofu.jp/user/lib/images/apple-touch-icon.png + source_url: http://lib.town-kofu.jp + css_selector: '[document] > html > head > link:nth-of-type(3)' + retrieved_on: '2025-12-25T15:03:30.027203+00:00' + extraction_method: crawl4ai_link_rel + favicon_type: '' + favicon_sizes: '' + - claim_type: og_image_url + claim_value: http://www.town-kofu.jp/user/lib/images/ogp_image.jpg + source_url: http://lib.town-kofu.jp + css_selector: '[document] > html > head > meta:nth-of-type(6)' + retrieved_on: '2025-12-25T15:03:30.027203+00:00' + extraction_method: crawl4ai_meta_og + summary: + total_claims: 3 + has_primary_logo: true + has_favicon: true + has_og_image: true + favicon_count: 2 diff --git a/data/custodian/JP-13-HIN-L-NL.yaml b/data/custodian/JP-13-HIN-L-NL.yaml index 378580a87a..ff90d7dcb2 100644 --- a/data/custodian/JP-13-HIN-L-NL.yaml +++ b/data/custodian/JP-13-HIN-L-NL.yaml @@ -32,13 +32,14 @@ ghcid: method: CH_ANNOTATOR_SOURCE ghcid_history: - ghcid: JP-13-HIN-L-NL - valid_from: "2025-12-10T09:44:04Z" + valid_from: '2025-12-10T09:44:04Z' valid_to: null - reason: "Corrected region code from JP-TO (abbreviation) to JP-13 (Tokyo) per ISO 3166-2:JP" + reason: Corrected region code from JP-TO (abbreviation) to JP-13 (Tokyo) per ISO + 3166-2:JP - ghcid: JP-TO-HIN-L-NL valid_from: null - valid_to: "2025-12-10T09:44:04Z" - reason: "Previous GHCID with incorrect region code" + valid_to: '2025-12-10T09:44:04Z' + reason: Previous GHCID with incorrect region code - ghcid: JP-TO-HIN-L-NL ghcid_numeric: 17157452172621245797 valid_from: '2025-12-06T23:38:46.782351+00:00' @@ -96,8 +97,8 @@ ch_annotator: annotation_metadata: confidence_score: 0.98 verified: false - verification_date: - verified_by: + verification_date: null + verified_by: null entity_claims: - claim_type: full_name claim_value: NICHINANCHO Library @@ -153,3 +154,37 @@ location: geonames_id: 1855476 geonames_name: Nichinan feature_code: PPLA2 +logo_enrichment: + enrichment_timestamp: '2025-12-25T15:04:11.824810+00:00' + source_url: http://www2.town.nichinan.lg.jp + extraction_method: crawl4ai + claims: + - claim_type: logo_url + claim_value: https://www2.town.nichinan.lg.jp/wp-content/themes/nichinan/assets/img/common/logo_main.svg + source_url: http://www2.town.nichinan.lg.jp + css_selector: '#header > div.gHeaderTop > div.modContainer > div.gHeaderTop-inner + > h1.gHeaderTop-logo > a > img' + retrieved_on: '2025-12-25T15:04:11.824810+00:00' + extraction_method: crawl4ai_header_logo + detection_confidence: high + alt_text: '' + - claim_type: favicon_url + claim_value: https://www2.town.nichinan.lg.jp/wp-content/themes/nichinan/assets/favicon/apple-touch-icon.png + source_url: http://www2.town.nichinan.lg.jp + css_selector: '[document] > html > head > link:nth-of-type(4)' + retrieved_on: '2025-12-25T15:04:11.824810+00:00' + extraction_method: crawl4ai_link_rel + favicon_type: '' + favicon_sizes: 180x180 + - claim_type: og_image_url + claim_value: https://www2.town.nichinan.lg.jp/ogimage.png + source_url: http://www2.town.nichinan.lg.jp + css_selector: '[document] > html > head > meta:nth-of-type(9)' + retrieved_on: '2025-12-25T15:04:11.824810+00:00' + extraction_method: crawl4ai_meta_og + summary: + total_claims: 3 + has_primary_logo: true + has_favicon: true + has_og_image: true + favicon_count: 3 diff --git a/data/custodian/JP-13-IMI-L-TL.yaml b/data/custodian/JP-13-IMI-L-TL.yaml index 2300fcccc9..2875dae805 100644 --- a/data/custodian/JP-13-IMI-L-TL.yaml +++ b/data/custodian/JP-13-IMI-L-TL.yaml @@ -37,13 +37,14 @@ ghcid: method: CH_ANNOTATOR_SOURCE ghcid_history: - ghcid: JP-13-IMI-L-TL - valid_from: "2025-12-10T09:44:04Z" + valid_from: '2025-12-10T09:44:04Z' valid_to: null - reason: "Corrected region code from JP-TO (abbreviation) to JP-13 (Tokyo) per ISO 3166-2:JP" + reason: Corrected region code from JP-TO (abbreviation) to JP-13 (Tokyo) per ISO + 3166-2:JP - ghcid: JP-TO-IMI-L-TL valid_from: null - valid_to: "2025-12-10T09:44:04Z" - reason: "Previous GHCID with incorrect region code" + valid_to: '2025-12-10T09:44:04Z' + reason: Previous GHCID with incorrect region code - ghcid: JP-TO-IMI-L-TL ghcid_numeric: 14260108011059627071 valid_from: '2025-12-06T23:38:57.094616+00:00' @@ -101,8 +102,8 @@ ch_annotator: annotation_metadata: confidence_score: 0.98 verified: false - verification_date: - verified_by: + verification_date: null + verified_by: null entity_claims: - claim_type: full_name claim_value: TOYAMAFUKUSHITANKIDAIGAKU Library @@ -204,3 +205,28 @@ location: geonames_id: 6822125 geonames_name: Imizu feature_code: PPLA2 +logo_enrichment: + enrichment_timestamp: '2025-12-25T15:05:56.334592+00:00' + source_url: http://www.t-fukushi.urayama.ac.jp/visitor/library.html + extraction_method: crawl4ai + claims: + - claim_type: favicon_url + claim_value: http://www.t-fukushi.urayama.ac.jp/uploads/f0/1c/f01c5253b1b630579d1be7c110a313df.ico + source_url: http://www.t-fukushi.urayama.ac.jp/visitor/library.html + css_selector: '[document] > html > head > link' + retrieved_on: '2025-12-25T15:05:56.334592+00:00' + extraction_method: crawl4ai_link_rel + favicon_type: image/vnd.microsoft.icon + favicon_sizes: '' + - claim_type: og_image_url + claim_value: https://www.t-fukushi.urayama.ac.jp + source_url: http://www.t-fukushi.urayama.ac.jp/visitor/library.html + css_selector: '[document] > html > head > meta:nth-of-type(13)' + retrieved_on: '2025-12-25T15:05:56.334592+00:00' + extraction_method: crawl4ai_meta_og + summary: + total_claims: 2 + has_primary_logo: false + has_favicon: true + has_og_image: true + favicon_count: 1 diff --git a/data/custodian/JP-13-IMI-L-TLJL.yaml b/data/custodian/JP-13-IMI-L-TLJL.yaml index c617f23ee4..b9cfaa579f 100644 --- a/data/custodian/JP-13-IMI-L-TLJL.yaml +++ b/data/custodian/JP-13-IMI-L-TLJL.yaml @@ -152,3 +152,28 @@ location: geonames_id: 6822125 geonames_name: Imizu feature_code: PPLA2 +logo_enrichment: + enrichment_timestamp: '2025-12-25T15:06:24.818889+00:00' + source_url: http://www.nc-toyama.ac.jp/c5/index.php/mcon/campus/lib_info + extraction_method: crawl4ai + claims: + - claim_type: favicon_url + claim_value: https://www.nc-toyama.ac.jp/wp/wp-content/themes/kosen/icon/apple-touch-icon-152x152.png + source_url: http://www.nc-toyama.ac.jp/c5/index.php/mcon/campus/lib_info + css_selector: '[document] > html.mac.win > head > link:nth-of-type(9)' + retrieved_on: '2025-12-25T15:06:24.818889+00:00' + extraction_method: crawl4ai_link_rel + favicon_type: '' + favicon_sizes: 152x152 + - claim_type: og_image_url + claim_value: https://www.nc-toyama.ac.jp/wp/wp-content/themes/kosen/images/opg.jpg + source_url: http://www.nc-toyama.ac.jp/c5/index.php/mcon/campus/lib_info + css_selector: '[document] > html.mac.win > head > meta:nth-of-type(15)' + retrieved_on: '2025-12-25T15:06:24.818889+00:00' + extraction_method: crawl4ai_meta_og + summary: + total_claims: 2 + has_primary_logo: false + has_favicon: true + has_og_image: true + favicon_count: 9 diff --git a/data/custodian/JP-13-IMI-L-TPUL.yaml b/data/custodian/JP-13-IMI-L-TPUL.yaml index 42b62e1c15..77ad1838fa 100644 --- a/data/custodian/JP-13-IMI-L-TPUL.yaml +++ b/data/custodian/JP-13-IMI-L-TPUL.yaml @@ -37,13 +37,14 @@ ghcid: method: CH_ANNOTATOR_SOURCE ghcid_history: - ghcid: JP-13-IMI-L-TPUL - valid_from: "2025-12-10T09:44:04Z" + valid_from: '2025-12-10T09:44:04Z' valid_to: null - reason: "Corrected region code from JP-TO (abbreviation) to JP-13 (Tokyo) per ISO 3166-2:JP" + reason: Corrected region code from JP-TO (abbreviation) to JP-13 (Tokyo) per ISO + 3166-2:JP - ghcid: JP-TO-IMI-L-TPUL valid_from: null - valid_to: "2025-12-10T09:44:04Z" - reason: "Previous GHCID with incorrect region code" + valid_to: '2025-12-10T09:44:04Z' + reason: Previous GHCID with incorrect region code - ghcid: JP-TO-IMI-L-TPUL ghcid_numeric: 13368037705863780146 valid_from: '2025-12-06T23:38:53.976302+00:00' @@ -101,8 +102,8 @@ ch_annotator: annotation_metadata: confidence_score: 0.98 verified: false - verification_date: - verified_by: + verification_date: null + verified_by: null entity_claims: - claim_type: full_name claim_value: Toyama Prefectural University Library @@ -187,7 +188,8 @@ wikidata_enrichment: member_of: - id: Q56056912 label: Japan Consortium for Open Access Repository - description: promotes open access and open science in Japan with knowledge dissemination via digital repositories + description: promotes open access and open science in Japan with knowledge dissemination + via digital repositories wikidata_web: official_website: http://www.pu-toyama.ac.jp/library wikidata_official_website: http://www.pu-toyama.ac.jp/library @@ -209,3 +211,31 @@ location: geonames_id: 6822125 geonames_name: Imizu feature_code: PPLA2 +logo_enrichment: + enrichment_timestamp: '2025-12-25T15:06:30.769681+00:00' + source_url: http://www.pu-toyama.ac.jp/library + extraction_method: crawl4ai + claims: + - claim_type: logo_url + claim_value: http://www.pu-toyama.ac.jp/assets/img/tpu-logo.svg + source_url: http://www.pu-toyama.ac.jp/library + css_selector: '[document] > html > body > header.header > div.header-inner > h1.header-title + > a > img.tpu-logo' + retrieved_on: '2025-12-25T15:06:30.769681+00:00' + extraction_method: crawl4ai_header_logo + detection_confidence: high + alt_text: 富山県立大学 + - claim_type: favicon_url + claim_value: http://www.pu-toyama.ac.jp/assets/icon/favicon.ico + source_url: http://www.pu-toyama.ac.jp/library + css_selector: '[document] > html > head > link' + retrieved_on: '2025-12-25T15:06:30.769681+00:00' + extraction_method: crawl4ai_link_rel + favicon_type: '' + favicon_sizes: '' + summary: + total_claims: 2 + has_primary_logo: true + has_favicon: true + has_og_image: false + favicon_count: 1 diff --git a/data/custodian/JP-13-IMI-M-ICSM.yaml b/data/custodian/JP-13-IMI-M-ICSM.yaml index 52bba4bb37..e5907da161 100644 --- a/data/custodian/JP-13-IMI-M-ICSM.yaml +++ b/data/custodian/JP-13-IMI-M-ICSM.yaml @@ -32,13 +32,14 @@ ghcid: method: CH_ANNOTATOR_SOURCE ghcid_history: - ghcid: JP-13-IMI-M-ICSM - valid_from: "2025-12-10T09:44:04Z" + valid_from: '2025-12-10T09:44:04Z' valid_to: null - reason: "Corrected region code from JP-TO (abbreviation) to JP-13 (Tokyo) per ISO 3166-2:JP" + reason: Corrected region code from JP-TO (abbreviation) to JP-13 (Tokyo) per ISO + 3166-2:JP - ghcid: JP-TO-IMI-M-ICSM valid_from: null - valid_to: "2025-12-10T09:44:04Z" - reason: "Previous GHCID with incorrect region code" + valid_to: '2025-12-10T09:44:04Z' + reason: Previous GHCID with incorrect region code - ghcid: JP-TO-IMI-M-ICSM ghcid_numeric: 8303398810938296277 valid_from: '2025-12-06T23:38:34.767550+00:00' @@ -96,8 +97,8 @@ ch_annotator: annotation_metadata: confidence_score: 0.98 verified: false - verification_date: - verified_by: + verification_date: null + verified_by: null entity_claims: - claim_type: full_name claim_value: IMIZU CITY SHINMINATO MUSEUM @@ -151,3 +152,28 @@ location: geonames_id: 6822125 geonames_name: Imizu feature_code: PPLA2 +logo_enrichment: + enrichment_timestamp: '2025-12-25T15:07:12.832473+00:00' + source_url: https://www.city.imizu.toyama.jp/museum + extraction_method: crawl4ai + claims: + - claim_type: favicon_url + claim_value: https://www.city.imizu.toyama.jp/designs/icon/apple-touch-icon-152x152.png + source_url: https://www.city.imizu.toyama.jp/museum + css_selector: '[document] > html.mac.win > head > link:nth-of-type(9)' + retrieved_on: '2025-12-25T15:07:12.832473+00:00' + extraction_method: crawl4ai_link_rel + favicon_type: '' + favicon_sizes: 152x152 + - claim_type: og_image_url + claim_value: https://www.city.imizu.toyama.jp/designs/external/image/symbol.jpg + source_url: https://www.city.imizu.toyama.jp/museum + css_selector: '[document] > html.mac.win > head > meta:nth-of-type(5)' + retrieved_on: '2025-12-25T15:07:12.832473+00:00' + extraction_method: crawl4ai_meta_og + summary: + total_claims: 2 + has_primary_logo: false + has_favicon: true + has_og_image: true + favicon_count: 9 diff --git a/data/custodian/JP-13-INA-L-ICCL.yaml b/data/custodian/JP-13-INA-L-ICCL.yaml index 03204d3c84..db26263e8d 100644 --- a/data/custodian/JP-13-INA-L-ICCL.yaml +++ b/data/custodian/JP-13-INA-L-ICCL.yaml @@ -32,13 +32,14 @@ ghcid: method: CH_ANNOTATOR_SOURCE ghcid_history: - ghcid: JP-13-INA-L-ICCL - valid_from: "2025-12-10T09:44:04Z" + valid_from: '2025-12-10T09:44:04Z' valid_to: null - reason: "Corrected region code from JP-TO (abbreviation) to JP-13 (Tokyo) per ISO 3166-2:JP" + reason: Corrected region code from JP-TO (abbreviation) to JP-13 (Tokyo) per ISO + 3166-2:JP - ghcid: JP-TO-INA-L-ICCL valid_from: null - valid_to: "2025-12-10T09:44:04Z" - reason: "Previous GHCID with incorrect region code" + valid_to: '2025-12-10T09:44:04Z' + reason: Previous GHCID with incorrect region code - ghcid: JP-TO-INA-L-ICCL ghcid_numeric: 16771263550042850877 valid_from: '2025-12-06T23:38:43.942581+00:00' @@ -96,8 +97,8 @@ ch_annotator: annotation_metadata: confidence_score: 0.98 verified: false - verification_date: - verified_by: + verification_date: null + verified_by: null entity_claims: - claim_type: full_name claim_value: Inagi City Chuo Library @@ -151,3 +152,30 @@ location: geonames_id: 11612578 geonames_name: Inagi feature_code: PPLA2 +logo_enrichment: + enrichment_timestamp: '2025-12-25T15:07:25.086976+00:00' + source_url: https://www.city.inagi.tokyo.jp/shisetsu/bunka/toshokan/chuuou.html + extraction_method: crawl4ai + claims: + - claim_type: logo_url + claim_value: https://www.city.inagi.tokyo.jp/_template_/_site_/_default_/_res/design/images/header/tlogo.png + source_url: https://www.city.inagi.tokyo.jp/shisetsu/bunka/toshokan/chuuou.html + css_selector: '#tlogo > p > a > img' + retrieved_on: '2025-12-25T15:07:25.086976+00:00' + extraction_method: crawl4ai_header_logo + detection_confidence: high + alt_text: 稲城市公式ホームページトップページ + - claim_type: favicon_url + claim_value: https://www.city.inagi.tokyo.jp/_template_/_site_/_default_/_res/images/apple-touch-icon-precomposed.png + source_url: https://www.city.inagi.tokyo.jp/shisetsu/bunka/toshokan/chuuou.html + css_selector: '[document] > html > head > link:nth-of-type(7)' + retrieved_on: '2025-12-25T15:07:25.086976+00:00' + extraction_method: crawl4ai_link_rel + favicon_type: '' + favicon_sizes: '' + summary: + total_claims: 2 + has_primary_logo: true + has_favicon: true + has_og_image: false + favicon_count: 2 diff --git a/data/custodian/JP-13-INA-L-ICDIL.yaml b/data/custodian/JP-13-INA-L-ICDIL.yaml index 1f3ed6e784..db569a9d6f 100644 --- a/data/custodian/JP-13-INA-L-ICDIL.yaml +++ b/data/custodian/JP-13-INA-L-ICDIL.yaml @@ -32,13 +32,14 @@ ghcid: method: CH_ANNOTATOR_SOURCE ghcid_history: - ghcid: JP-13-INA-L-ICDIL - valid_from: "2025-12-10T09:44:04Z" + valid_from: '2025-12-10T09:44:04Z' valid_to: null - reason: "Corrected region code from JP-TO (abbreviation) to JP-13 (Tokyo) per ISO 3166-2:JP" + reason: Corrected region code from JP-TO (abbreviation) to JP-13 (Tokyo) per ISO + 3166-2:JP - ghcid: JP-TO-INA-L-ICDIL valid_from: null - valid_to: "2025-12-10T09:44:04Z" - reason: "Previous GHCID with incorrect region code" + valid_to: '2025-12-10T09:44:04Z' + reason: Previous GHCID with incorrect region code - ghcid: JP-TO-INA-L-ICDIL ghcid_numeric: 14772634650256149373 valid_from: '2025-12-06T23:38:43.933354+00:00' @@ -96,8 +97,8 @@ ch_annotator: annotation_metadata: confidence_score: 0.98 verified: false - verification_date: - verified_by: + verification_date: null + verified_by: null entity_claims: - claim_type: full_name claim_value: Inagi City Dai-Ichi Library @@ -151,3 +152,30 @@ location: geonames_id: 11612578 geonames_name: Inagi feature_code: PPLA2 +logo_enrichment: + enrichment_timestamp: '2025-12-25T15:07:30.169548+00:00' + source_url: https://www.city.inagi.tokyo.jp/shisetsu/bunka/toshokan/dai1.html + extraction_method: crawl4ai + claims: + - claim_type: logo_url + claim_value: https://www.city.inagi.tokyo.jp/_template_/_site_/_default_/_res/design/images/header/tlogo.png + source_url: https://www.city.inagi.tokyo.jp/shisetsu/bunka/toshokan/dai1.html + css_selector: '#tlogo > p > a > img' + retrieved_on: '2025-12-25T15:07:30.169548+00:00' + extraction_method: crawl4ai_header_logo + detection_confidence: high + alt_text: 稲城市公式ホームページトップページ + - claim_type: favicon_url + claim_value: https://www.city.inagi.tokyo.jp/_template_/_site_/_default_/_res/images/apple-touch-icon-precomposed.png + source_url: https://www.city.inagi.tokyo.jp/shisetsu/bunka/toshokan/dai1.html + css_selector: '[document] > html > head > link:nth-of-type(7)' + retrieved_on: '2025-12-25T15:07:30.169548+00:00' + extraction_method: crawl4ai_link_rel + favicon_type: '' + favicon_sizes: '' + summary: + total_claims: 2 + has_primary_logo: true + has_favicon: true + has_og_image: false + favicon_count: 2 diff --git a/data/custodian/JP-13-INA-L-ICDNL.yaml b/data/custodian/JP-13-INA-L-ICDNL.yaml index 56bb456b58..af72c6e2c1 100644 --- a/data/custodian/JP-13-INA-L-ICDNL.yaml +++ b/data/custodian/JP-13-INA-L-ICDNL.yaml @@ -152,3 +152,30 @@ location: geonames_id: 11612578 geonames_name: Inagi feature_code: PPLA2 +logo_enrichment: + enrichment_timestamp: '2025-12-25T15:07:34.999492+00:00' + source_url: https://www.city.inagi.tokyo.jp/shisetsu/bunka/toshokan/dai2.html + extraction_method: crawl4ai + claims: + - claim_type: logo_url + claim_value: https://www.city.inagi.tokyo.jp/_template_/_site_/_default_/_res/design/images/header/tlogo.png + source_url: https://www.city.inagi.tokyo.jp/shisetsu/bunka/toshokan/dai2.html + css_selector: '#tlogo > p > a > img' + retrieved_on: '2025-12-25T15:07:34.999492+00:00' + extraction_method: crawl4ai_header_logo + detection_confidence: high + alt_text: 稲城市公式ホームページトップページ + - claim_type: favicon_url + claim_value: https://www.city.inagi.tokyo.jp/_template_/_site_/_default_/_res/images/apple-touch-icon-precomposed.png + source_url: https://www.city.inagi.tokyo.jp/shisetsu/bunka/toshokan/dai2.html + css_selector: '[document] > html > head > link:nth-of-type(7)' + retrieved_on: '2025-12-25T15:07:34.999492+00:00' + extraction_method: crawl4ai_link_rel + favicon_type: '' + favicon_sizes: '' + summary: + total_claims: 2 + has_primary_logo: true + has_favicon: true + has_og_image: false + favicon_count: 2 diff --git a/data/custodian/JP-13-INA-L-ICDSL.yaml b/data/custodian/JP-13-INA-L-ICDSL.yaml index a9500a9922..5e3efe7d12 100644 --- a/data/custodian/JP-13-INA-L-ICDSL.yaml +++ b/data/custodian/JP-13-INA-L-ICDSL.yaml @@ -152,3 +152,30 @@ location: geonames_id: 11612578 geonames_name: Inagi feature_code: PPLA2 +logo_enrichment: + enrichment_timestamp: '2025-12-25T15:07:39.985593+00:00' + source_url: https://www.city.inagi.tokyo.jp/shisetsu/bunka/toshokan/dai3.html + extraction_method: crawl4ai + claims: + - claim_type: logo_url + claim_value: https://www.city.inagi.tokyo.jp/_template_/_site_/_default_/_res/design/images/header/tlogo.png + source_url: https://www.city.inagi.tokyo.jp/shisetsu/bunka/toshokan/dai3.html + css_selector: '#tlogo > p > a > img' + retrieved_on: '2025-12-25T15:07:39.985593+00:00' + extraction_method: crawl4ai_header_logo + detection_confidence: high + alt_text: 稲城市公式ホームページトップページ + - claim_type: favicon_url + claim_value: https://www.city.inagi.tokyo.jp/_template_/_site_/_default_/_res/images/apple-touch-icon-precomposed.png + source_url: https://www.city.inagi.tokyo.jp/shisetsu/bunka/toshokan/dai3.html + css_selector: '[document] > html > head > link:nth-of-type(7)' + retrieved_on: '2025-12-25T15:07:39.985593+00:00' + extraction_method: crawl4ai_link_rel + favicon_type: '' + favicon_sizes: '' + summary: + total_claims: 2 + has_primary_logo: true + has_favicon: true + has_og_image: false + favicon_count: 2 diff --git a/data/custodian/JP-13-INA-L-ICDYL.yaml b/data/custodian/JP-13-INA-L-ICDYL.yaml index ba44e617d6..e8adba3485 100644 --- a/data/custodian/JP-13-INA-L-ICDYL.yaml +++ b/data/custodian/JP-13-INA-L-ICDYL.yaml @@ -32,13 +32,14 @@ ghcid: method: CH_ANNOTATOR_SOURCE ghcid_history: - ghcid: JP-13-INA-L-ICDYL - valid_from: "2025-12-10T09:44:04Z" + valid_from: '2025-12-10T09:44:04Z' valid_to: null - reason: "Corrected region code from JP-TO (abbreviation) to JP-13 (Tokyo) per ISO 3166-2:JP" + reason: Corrected region code from JP-TO (abbreviation) to JP-13 (Tokyo) per ISO + 3166-2:JP - ghcid: JP-TO-INA-L-ICDYL valid_from: null - valid_to: "2025-12-10T09:44:04Z" - reason: "Previous GHCID with incorrect region code" + valid_to: '2025-12-10T09:44:04Z' + reason: Previous GHCID with incorrect region code - ghcid: JP-TO-INA-L-ICDYL ghcid_numeric: 13882009762647486184 valid_from: '2025-12-06T23:38:43.940302+00:00' @@ -96,8 +97,8 @@ ch_annotator: annotation_metadata: confidence_score: 0.98 verified: false - verification_date: - verified_by: + verification_date: null + verified_by: null entity_claims: - claim_type: full_name claim_value: Inagi City Dai-Yon Library @@ -151,3 +152,30 @@ location: geonames_id: 11612578 geonames_name: Inagi feature_code: PPLA2 +logo_enrichment: + enrichment_timestamp: '2025-12-25T15:07:45.039326+00:00' + source_url: https://www.city.inagi.tokyo.jp/shisetsu/bunka/toshokan/dai4.html + extraction_method: crawl4ai + claims: + - claim_type: logo_url + claim_value: https://www.city.inagi.tokyo.jp/_template_/_site_/_default_/_res/design/images/header/tlogo.png + source_url: https://www.city.inagi.tokyo.jp/shisetsu/bunka/toshokan/dai4.html + css_selector: '#tlogo > p > a > img' + retrieved_on: '2025-12-25T15:07:45.039326+00:00' + extraction_method: crawl4ai_header_logo + detection_confidence: high + alt_text: 稲城市公式ホームページトップページ + - claim_type: favicon_url + claim_value: https://www.city.inagi.tokyo.jp/_template_/_site_/_default_/_res/images/apple-touch-icon-precomposed.png + source_url: https://www.city.inagi.tokyo.jp/shisetsu/bunka/toshokan/dai4.html + css_selector: '[document] > html > head > link:nth-of-type(7)' + retrieved_on: '2025-12-25T15:07:45.039326+00:00' + extraction_method: crawl4ai_link_rel + favicon_type: '' + favicon_sizes: '' + summary: + total_claims: 2 + has_primary_logo: true + has_favicon: true + has_og_image: false + favicon_count: 2 diff --git a/data/custodian/JP-13-INA-L-KTL.yaml b/data/custodian/JP-13-INA-L-KTL.yaml index 1a17cbc362..2591fc4083 100644 --- a/data/custodian/JP-13-INA-L-KTL.yaml +++ b/data/custodian/JP-13-INA-L-KTL.yaml @@ -37,13 +37,14 @@ ghcid: method: CH_ANNOTATOR_SOURCE ghcid_history: - ghcid: JP-13-INA-L-KTL - valid_from: "2025-12-10T09:44:04Z" + valid_from: '2025-12-10T09:44:04Z' valid_to: null - reason: "Corrected region code from JP-TO (abbreviation) to JP-13 (Tokyo) per ISO 3166-2:JP" + reason: Corrected region code from JP-TO (abbreviation) to JP-13 (Tokyo) per ISO + 3166-2:JP - ghcid: JP-TO-INA-L-KTL valid_from: null - valid_to: "2025-12-10T09:44:04Z" - reason: "Previous GHCID with incorrect region code" + valid_to: '2025-12-10T09:44:04Z' + reason: Previous GHCID with incorrect region code - ghcid: JP-TO-INA-L-KTL ghcid_numeric: 14868447424754719232 valid_from: '2025-12-06T23:38:55.407349+00:00' @@ -101,8 +102,8 @@ ch_annotator: annotation_metadata: confidence_score: 0.98 verified: false - verification_date: - verified_by: + verification_date: null + verified_by: null entity_claims: - claim_type: full_name claim_value: KOMAZAWAJOSHIDAIGAKU・TANKIDAIGAKU Library @@ -204,3 +205,22 @@ location: geonames_id: 11612578 geonames_name: Inagi feature_code: PPLA2 +logo_enrichment: + enrichment_timestamp: '2025-12-25T15:08:26.355712+00:00' + source_url: http://www.komajo.ac.jp/uni/place/library.html + extraction_method: crawl4ai + claims: + - claim_type: favicon_url + claim_value: http://www.komajo.ac.jp/uni/common/images/apple-touch-icon.png + source_url: http://www.komajo.ac.jp/uni/place/library.html + css_selector: '[document] > html > head > link:nth-of-type(5)' + retrieved_on: '2025-12-25T15:08:26.355712+00:00' + extraction_method: crawl4ai_link_rel + favicon_type: '' + favicon_sizes: 152x152 + summary: + total_claims: 1 + has_primary_logo: false + has_favicon: true + has_og_image: false + favicon_count: 2 diff --git a/data/custodian/JP-13-ITA-L-DBUL.yaml b/data/custodian/JP-13-ITA-L-DBUL.yaml index dbfb8c567a..bdac23b446 100644 --- a/data/custodian/JP-13-ITA-L-DBUL.yaml +++ b/data/custodian/JP-13-ITA-L-DBUL.yaml @@ -37,13 +37,14 @@ ghcid: method: CH_ANNOTATOR_SOURCE ghcid_history: - ghcid: JP-13-ITA-L-DBUL - valid_from: "2025-12-10T09:44:05Z" + valid_from: '2025-12-10T09:44:05Z' valid_to: null - reason: "Corrected region code from JP-TO (abbreviation) to JP-13 (Tokyo) per ISO 3166-2:JP" + reason: Corrected region code from JP-TO (abbreviation) to JP-13 (Tokyo) per ISO + 3166-2:JP - ghcid: JP-TO-ITA-L-DBUL valid_from: null - valid_to: "2025-12-10T09:44:05Z" - reason: "Previous GHCID with incorrect region code" + valid_to: '2025-12-10T09:44:05Z' + reason: Previous GHCID with incorrect region code - ghcid: JP-TO-ITA-L-DBUL ghcid_numeric: 11740726727602387973 valid_from: '2025-12-06T23:38:54.999513+00:00' @@ -101,8 +102,8 @@ ch_annotator: annotation_metadata: confidence_score: 0.98 verified: false - verification_date: - verified_by: + verification_date: null + verified_by: null entity_claims: - claim_type: full_name claim_value: Daito Bunka University Library @@ -209,3 +210,28 @@ location: geonames_id: 1861321 geonames_name: Itabashi feature_code: PPLX +logo_enrichment: + enrichment_timestamp: '2025-12-25T15:08:52.967222+00:00' + source_url: http://www.daito.ac.jp/research/library + extraction_method: crawl4ai + claims: + - claim_type: favicon_url + claim_value: http://www.daito.ac.jp/assets/img/apple-touch-icon.png + source_url: http://www.daito.ac.jp/research/library + css_selector: '[document] > html > head > link:nth-of-type(2)' + retrieved_on: '2025-12-25T15:08:52.967222+00:00' + extraction_method: crawl4ai_link_rel + favicon_type: '' + favicon_sizes: '' + - claim_type: og_image_url + claim_value: https://www.daito.ac.jp/assets/img/img_logo_ogp.jpg + source_url: http://www.daito.ac.jp/research/library + css_selector: '[document] > html > head > meta:nth-of-type(10)' + retrieved_on: '2025-12-25T15:08:52.967222+00:00' + extraction_method: crawl4ai_meta_og + summary: + total_claims: 2 + has_primary_logo: false + has_favicon: true + has_og_image: true + favicon_count: 2 diff --git a/data/custodian/JP-13-ITA-L-IBCSBH.yaml b/data/custodian/JP-13-ITA-L-IBCSBH.yaml index 5ecc1d89f6..06cf58a364 100644 --- a/data/custodian/JP-13-ITA-L-IBCSBH.yaml +++ b/data/custodian/JP-13-ITA-L-IBCSBH.yaml @@ -32,13 +32,14 @@ ghcid: method: CH_ANNOTATOR_SOURCE ghcid_history: - ghcid: JP-13-ITA-L-IBCSBH - valid_from: "2025-12-10T09:44:05Z" + valid_from: '2025-12-10T09:44:05Z' valid_to: null - reason: "Corrected region code from JP-TO (abbreviation) to JP-13 (Tokyo) per ISO 3166-2:JP" + reason: Corrected region code from JP-TO (abbreviation) to JP-13 (Tokyo) per ISO + 3166-2:JP - ghcid: JP-TO-ITA-L-IBCSBH valid_from: null - valid_to: "2025-12-10T09:44:05Z" - reason: "Previous GHCID with incorrect region code" + valid_to: '2025-12-10T09:44:05Z' + reason: Previous GHCID with incorrect region code - ghcid: JP-TO-ITA-L-IBCSBH ghcid_numeric: 13534738045838770369 valid_from: '2025-12-06T23:38:48.658686+00:00' @@ -96,8 +97,8 @@ ch_annotator: annotation_metadata: confidence_score: 0.98 verified: false - verification_date: - verified_by: + verification_date: null + verified_by: null entity_claims: - claim_type: full_name claim_value: Itabashi-Bologna Children's Book Hall @@ -151,3 +152,36 @@ location: geonames_id: 1861321 geonames_name: Itabashi feature_code: PPLX +logo_enrichment: + enrichment_timestamp: '2025-12-25T15:08:59.535141+00:00' + source_url: https://www.city.itabashi.tokyo.jp/library/bologna/index.html + extraction_method: crawl4ai + claims: + - claim_type: logo_url + claim_value: https://www.city.itabashi.tokyo.jp/library/_template_/_site_/project_lib/_res/design/images/header/tlogo.png + source_url: https://www.city.itabashi.tokyo.jp/library/bologna/index.html + css_selector: '#tlogo > p > a > img' + retrieved_on: '2025-12-25T15:08:59.535141+00:00' + extraction_method: crawl4ai_header_logo + detection_confidence: high + alt_text: 板橋区立図書館 + - claim_type: favicon_url + claim_value: https://www.city.itabashi.tokyo.jp/library/_template_/_site_/project_lib/_res/images/apple-touch-icon-precomposed.png + source_url: https://www.city.itabashi.tokyo.jp/library/bologna/index.html + css_selector: '[document] > html > head > link:nth-of-type(4)' + retrieved_on: '2025-12-25T15:08:59.535141+00:00' + extraction_method: crawl4ai_link_rel + favicon_type: '' + favicon_sizes: '' + - claim_type: og_image_url + claim_value: https://www.city.itabashi.tokyo.jp/_template_/_site_/_default_/_res/images/sns/ogimage.png + source_url: https://www.city.itabashi.tokyo.jp/library/bologna/index.html + css_selector: '[document] > html > head > meta:nth-of-type(8)' + retrieved_on: '2025-12-25T15:08:59.535141+00:00' + extraction_method: crawl4ai_meta_og + summary: + total_claims: 3 + has_primary_logo: true + has_favicon: true + has_og_image: true + favicon_count: 2 diff --git a/data/custodian/JP-13-ITA-L-ICAL.yaml b/data/custodian/JP-13-ITA-L-ICAL.yaml index 6a79b5cc80..10567a621b 100644 --- a/data/custodian/JP-13-ITA-L-ICAL.yaml +++ b/data/custodian/JP-13-ITA-L-ICAL.yaml @@ -32,13 +32,14 @@ ghcid: method: CH_ANNOTATOR_SOURCE ghcid_history: - ghcid: JP-13-ITA-L-ICAL - valid_from: "2025-12-10T09:44:05Z" + valid_from: '2025-12-10T09:44:05Z' valid_to: null - reason: "Corrected region code from JP-TO (abbreviation) to JP-13 (Tokyo) per ISO 3166-2:JP" + reason: Corrected region code from JP-TO (abbreviation) to JP-13 (Tokyo) per ISO + 3166-2:JP - ghcid: JP-TO-ITA-L-ICAL valid_from: null - valid_to: "2025-12-10T09:44:05Z" - reason: "Previous GHCID with incorrect region code" + valid_to: '2025-12-10T09:44:05Z' + reason: Previous GHCID with incorrect region code - ghcid: JP-TO-ITA-L-ICAL ghcid_numeric: 12653340971048199919 valid_from: '2025-12-06T23:38:43.471601+00:00' @@ -96,8 +97,8 @@ ch_annotator: annotation_metadata: confidence_score: 0.98 verified: false - verification_date: - verified_by: + verification_date: null + verified_by: null entity_claims: - claim_type: full_name claim_value: Itabashi City Akatsuka Library @@ -151,3 +152,28 @@ location: geonames_id: 1861321 geonames_name: Itabashi feature_code: PPLX +logo_enrichment: + enrichment_timestamp: '2025-12-25T15:09:08.218834+00:00' + source_url: https://www.trc-itabashi.jp + extraction_method: crawl4ai + claims: + - claim_type: logo_url + claim_value: https://www.trc-itabashi.jp/_src/4268401/trc_logo.gif?v=1762061584632 + source_url: https://www.trc-itabashi.jp + css_selector: '#imgsrc4268401_1' + retrieved_on: '2025-12-25T15:09:08.218834+00:00' + extraction_method: crawl4ai_header_logo + detection_confidence: high + alt_text: '' + - claim_type: og_image_url + claim_value: https://www.trc-itabashi.jp/index.html + source_url: https://www.trc-itabashi.jp + css_selector: '[document] > html > head > meta:nth-of-type(8)' + retrieved_on: '2025-12-25T15:09:08.218834+00:00' + extraction_method: crawl4ai_meta_og + summary: + total_claims: 2 + has_primary_logo: true + has_favicon: false + has_og_image: true + favicon_count: 0 diff --git a/data/custodian/JP-13-ITA-L-ICCL.yaml b/data/custodian/JP-13-ITA-L-ICCL.yaml index 7ba7a6cc1c..48c885a3e4 100644 --- a/data/custodian/JP-13-ITA-L-ICCL.yaml +++ b/data/custodian/JP-13-ITA-L-ICCL.yaml @@ -32,13 +32,14 @@ ghcid: method: CH_ANNOTATOR_SOURCE ghcid_history: - ghcid: JP-13-ITA-L-ICCL - valid_from: "2025-12-10T09:44:05Z" + valid_from: '2025-12-10T09:44:05Z' valid_to: null - reason: "Corrected region code from JP-TO (abbreviation) to JP-13 (Tokyo) per ISO 3166-2:JP" + reason: Corrected region code from JP-TO (abbreviation) to JP-13 (Tokyo) per ISO + 3166-2:JP - ghcid: JP-TO-ITA-L-ICCL valid_from: null - valid_to: "2025-12-10T09:44:05Z" - reason: "Previous GHCID with incorrect region code" + valid_to: '2025-12-10T09:44:05Z' + reason: Previous GHCID with incorrect region code - ghcid: JP-TO-ITA-L-ICCL ghcid_numeric: 9690399356711150975 valid_from: '2025-12-06T23:38:43.469352+00:00' @@ -96,8 +97,8 @@ ch_annotator: annotation_metadata: confidence_score: 0.98 verified: false - verification_date: - verified_by: + verification_date: null + verified_by: null entity_claims: - claim_type: full_name claim_value: Itabashi City Chuo Library @@ -151,3 +152,36 @@ location: geonames_id: 1861321 geonames_name: Itabashi feature_code: PPLX +logo_enrichment: + enrichment_timestamp: '2025-12-25T15:09:15.737930+00:00' + source_url: https://www.city.itabashi.tokyo.jp/library + extraction_method: crawl4ai + claims: + - claim_type: logo_url + claim_value: https://www.city.itabashi.tokyo.jp/_template_/_site_/project_lib/_res/design/images/header/tlogo.png + source_url: https://www.city.itabashi.tokyo.jp/library + css_selector: '#tlogo > h1 > a > img' + retrieved_on: '2025-12-25T15:09:15.737930+00:00' + extraction_method: crawl4ai_header_logo + detection_confidence: high + alt_text: 板橋区立図書館 + - claim_type: favicon_url + claim_value: https://www.city.itabashi.tokyo.jp/_template_/_site_/project_lib/_res/images/apple-touch-icon-precomposed.png + source_url: https://www.city.itabashi.tokyo.jp/library + css_selector: '[document] > html > head > link:nth-of-type(6)' + retrieved_on: '2025-12-25T15:09:15.737930+00:00' + extraction_method: crawl4ai_link_rel + favicon_type: '' + favicon_sizes: '' + - claim_type: og_image_url + claim_value: https://www.city.itabashi.tokyo.jp/_template_/_site_/_default_/_res/images/sns/ogimage.png + source_url: https://www.city.itabashi.tokyo.jp/library + css_selector: '[document] > html > head > meta:nth-of-type(8)' + retrieved_on: '2025-12-25T15:09:15.737930+00:00' + extraction_method: crawl4ai_meta_og + summary: + total_claims: 3 + has_primary_logo: true + has_favicon: true + has_og_image: true + favicon_count: 3 diff --git a/data/custodian/JP-13-ITA-L-ICHIL.yaml b/data/custodian/JP-13-ITA-L-ICHIL.yaml index 998005c841..372d843f3c 100644 --- a/data/custodian/JP-13-ITA-L-ICHIL.yaml +++ b/data/custodian/JP-13-ITA-L-ICHIL.yaml @@ -32,13 +32,14 @@ ghcid: method: CH_ANNOTATOR_SOURCE ghcid_history: - ghcid: JP-13-ITA-L-ICHIL - valid_from: "2025-12-10T09:44:05Z" + valid_from: '2025-12-10T09:44:05Z' valid_to: null - reason: "Corrected region code from JP-TO (abbreviation) to JP-13 (Tokyo) per ISO 3166-2:JP" + reason: Corrected region code from JP-TO (abbreviation) to JP-13 (Tokyo) per ISO + 3166-2:JP - ghcid: JP-TO-ITA-L-ICHIL valid_from: null - valid_to: "2025-12-10T09:44:05Z" - reason: "Previous GHCID with incorrect region code" + valid_to: '2025-12-10T09:44:05Z' + reason: Previous GHCID with incorrect region code - ghcid: JP-TO-ITA-L-ICHIL ghcid_numeric: 5765949531043964042 valid_from: '2025-12-06T23:38:43.482802+00:00' @@ -96,8 +97,8 @@ ch_annotator: annotation_metadata: confidence_score: 0.98 verified: false - verification_date: - verified_by: + verification_date: null + verified_by: null entity_claims: - claim_type: full_name claim_value: Itabashi City Higashi-itabashi Library @@ -151,3 +152,22 @@ location: geonames_id: 1861321 geonames_name: Itabashi feature_code: PPLX +logo_enrichment: + enrichment_timestamp: '2025-12-25T15:09:23.543915+00:00' + source_url: https://itabashi-lib-higashiitabashi.jp + extraction_method: crawl4ai + claims: + - claim_type: favicon_url + claim_value: https://itabashi-lib-higashiitabashi.jp/wp-content/uploads/2023/02/fvc02.png + source_url: https://itabashi-lib-higashiitabashi.jp + css_selector: '[document] > html.no-js.js_active > head > link:nth-of-type(26)' + retrieved_on: '2025-12-25T15:09:23.543915+00:00' + extraction_method: crawl4ai_link_rel + favicon_type: '' + favicon_sizes: '' + summary: + total_claims: 1 + has_primary_logo: false + has_favicon: true + has_og_image: false + favicon_count: 2 diff --git a/data/custodian/JP-13-ITA-L-ICHL-itabashi_city_hikawa_library.yaml b/data/custodian/JP-13-ITA-L-ICHL-itabashi_city_hikawa_library.yaml index cfc20123cf..b82a270c07 100644 --- a/data/custodian/JP-13-ITA-L-ICHL-itabashi_city_hikawa_library.yaml +++ b/data/custodian/JP-13-ITA-L-ICHL-itabashi_city_hikawa_library.yaml @@ -32,13 +32,14 @@ ghcid: method: CH_ANNOTATOR_SOURCE ghcid_history: - ghcid: JP-13-ITA-L-ICHL-itabashi_city_hikawa_library - valid_from: "2025-12-10T09:44:05Z" + valid_from: '2025-12-10T09:44:05Z' valid_to: null - reason: "Corrected region code from JP-TO (abbreviation) to JP-13 (Tokyo) per ISO 3166-2:JP" + reason: Corrected region code from JP-TO (abbreviation) to JP-13 (Tokyo) per ISO + 3166-2:JP - ghcid: JP-TO-ITA-L-ICHL-itabashi_city_hikawa_library valid_from: null - valid_to: "2025-12-10T09:44:05Z" - reason: "Previous GHCID with incorrect region code" + valid_to: '2025-12-10T09:44:05Z' + reason: Previous GHCID with incorrect region code - ghcid: JP-TO-ITA-L-ICHL-itabashi_city_hikawa_library ghcid_numeric: 17291739435236158377 valid_from: '2025-12-06T23:38:43.478342+00:00' @@ -96,8 +97,8 @@ ch_annotator: annotation_metadata: confidence_score: 0.98 verified: false - verification_date: - verified_by: + verification_date: null + verified_by: null entity_claims: - claim_type: full_name claim_value: Itabashi City Hikawa Library @@ -151,3 +152,22 @@ location: geonames_id: 1861321 geonames_name: Itabashi feature_code: PPLX +logo_enrichment: + enrichment_timestamp: '2025-12-25T15:09:32.551498+00:00' + source_url: https://itabashi-lib-hikawa.jp + extraction_method: crawl4ai + claims: + - claim_type: favicon_url + claim_value: https://itabashi-lib-hikawa.jp/wp-content/uploads/2023/02/fvc02.png + source_url: https://itabashi-lib-hikawa.jp + css_selector: '[document] > html.no-js.js_active > head > link:nth-of-type(27)' + retrieved_on: '2025-12-25T15:09:32.551498+00:00' + extraction_method: crawl4ai_link_rel + favicon_type: '' + favicon_sizes: '' + summary: + total_claims: 1 + has_primary_logo: false + has_favicon: true + has_og_image: false + favicon_count: 2 diff --git a/data/custodian/JP-13-ITA-L-ICHL.yaml b/data/custodian/JP-13-ITA-L-ICHL.yaml index a8a7e1902f..53c38aacc0 100644 --- a/data/custodian/JP-13-ITA-L-ICHL.yaml +++ b/data/custodian/JP-13-ITA-L-ICHL.yaml @@ -152,3 +152,20 @@ location: geonames_id: 1861321 geonames_name: Itabashi feature_code: PPLX +logo_enrichment: + enrichment_timestamp: '2025-12-25T15:09:40.987638+00:00' + source_url: https://hasune-lib.jp + extraction_method: crawl4ai + claims: + - claim_type: og_image_url + claim_value: https://hasune-lib.jp/wp-content/themes/commonlibrary/img/common/default_2.jpg + source_url: https://hasune-lib.jp + css_selector: '[document] > html > head > meta:nth-of-type(10)' + retrieved_on: '2025-12-25T15:09:40.987638+00:00' + extraction_method: crawl4ai_meta_og + summary: + total_claims: 1 + has_primary_logo: false + has_favicon: false + has_og_image: true + favicon_count: 0 diff --git a/data/custodian/JP-13-ITA-L-ICKL.yaml b/data/custodian/JP-13-ITA-L-ICKL.yaml index e549dbc077..03872fb27d 100644 --- a/data/custodian/JP-13-ITA-L-ICKL.yaml +++ b/data/custodian/JP-13-ITA-L-ICKL.yaml @@ -32,13 +32,14 @@ ghcid: method: CH_ANNOTATOR_SOURCE ghcid_history: - ghcid: JP-13-ITA-L-ICKL - valid_from: "2025-12-10T09:44:05Z" + valid_from: '2025-12-10T09:44:05Z' valid_to: null - reason: "Corrected region code from JP-TO (abbreviation) to JP-13 (Tokyo) per ISO 3166-2:JP" + reason: Corrected region code from JP-TO (abbreviation) to JP-13 (Tokyo) per ISO + 3166-2:JP - ghcid: JP-TO-ITA-L-ICKL valid_from: null - valid_to: "2025-12-10T09:44:05Z" - reason: "Previous GHCID with incorrect region code" + valid_to: '2025-12-10T09:44:05Z' + reason: Previous GHCID with incorrect region code - ghcid: JP-TO-ITA-L-ICKL ghcid_numeric: 17728104605708031769 valid_from: '2025-12-06T23:38:43.485035+00:00' @@ -96,8 +97,8 @@ ch_annotator: annotation_metadata: confidence_score: 0.98 verified: false - verification_date: - verified_by: + verification_date: null + verified_by: null entity_claims: - claim_type: full_name claim_value: Itabashi City Komone Library @@ -151,3 +152,22 @@ location: geonames_id: 1861321 geonames_name: Itabashi feature_code: PPLX +logo_enrichment: + enrichment_timestamp: '2025-12-25T15:09:49.251983+00:00' + source_url: https://itabashi-lib-komone.jp + extraction_method: crawl4ai + claims: + - claim_type: favicon_url + claim_value: https://itabashi-lib-komone.jp/wp-content/uploads/2023/03/fvc02-2.png + source_url: https://itabashi-lib-komone.jp + css_selector: '[document] > html.no-js.js_active > head > link:nth-of-type(26)' + retrieved_on: '2025-12-25T15:09:49.251983+00:00' + extraction_method: crawl4ai_link_rel + favicon_type: '' + favicon_sizes: '' + summary: + total_claims: 1 + has_primary_logo: false + has_favicon: true + has_og_image: false + favicon_count: 2 diff --git a/data/custodian/JP-13-ITA-L-ICNL-itabashi_city_narimasu_library.yaml b/data/custodian/JP-13-ITA-L-ICNL-itabashi_city_narimasu_library.yaml index 1c7b8721ed..fdc43f808b 100644 --- a/data/custodian/JP-13-ITA-L-ICNL-itabashi_city_narimasu_library.yaml +++ b/data/custodian/JP-13-ITA-L-ICNL-itabashi_city_narimasu_library.yaml @@ -32,13 +32,14 @@ ghcid: method: CH_ANNOTATOR_SOURCE ghcid_history: - ghcid: JP-13-ITA-L-ICNL-itabashi_city_narimasu_library - valid_from: "2025-12-10T09:44:05Z" + valid_from: '2025-12-10T09:44:05Z' valid_to: null - reason: "Corrected region code from JP-TO (abbreviation) to JP-13 (Tokyo) per ISO 3166-2:JP" + reason: Corrected region code from JP-TO (abbreviation) to JP-13 (Tokyo) per ISO + 3166-2:JP - ghcid: JP-TO-ITA-L-ICNL-itabashi_city_narimasu_library valid_from: null - valid_to: "2025-12-10T09:44:05Z" - reason: "Previous GHCID with incorrect region code" + valid_to: '2025-12-10T09:44:05Z' + reason: Previous GHCID with incorrect region code - ghcid: JP-TO-ITA-L-ICNL-itabashi_city_narimasu_library ghcid_numeric: 4288872939540727034 valid_from: '2025-12-06T23:38:43.491950+00:00' @@ -96,8 +97,8 @@ ch_annotator: annotation_metadata: confidence_score: 0.98 verified: false - verification_date: - verified_by: + verification_date: null + verified_by: null entity_claims: - claim_type: full_name claim_value: Itabashi City Narimasu Library @@ -151,3 +152,28 @@ location: geonames_id: 1861321 geonames_name: Itabashi feature_code: PPLX +logo_enrichment: + enrichment_timestamp: '2025-12-25T15:09:58.098115+00:00' + source_url: https://lib.trc-itabashi.jp + extraction_method: crawl4ai + claims: + - claim_type: logo_url + claim_value: https://lib.trc-itabashi.jp/_src/4268401/trc_logo.gif?v=1762061584632 + source_url: https://lib.trc-itabashi.jp + css_selector: '#imgsrc4268401_1' + retrieved_on: '2025-12-25T15:09:58.098115+00:00' + extraction_method: crawl4ai_header_logo + detection_confidence: high + alt_text: '' + - claim_type: og_image_url + claim_value: https://www.trc-itabashi.jp/index.html + source_url: https://lib.trc-itabashi.jp + css_selector: '[document] > html > head > meta:nth-of-type(8)' + retrieved_on: '2025-12-25T15:09:58.098115+00:00' + extraction_method: crawl4ai_meta_og + summary: + total_claims: 2 + has_primary_logo: true + has_favicon: false + has_og_image: true + favicon_count: 0 diff --git a/data/custodian/JP-13-ITA-L-ICNL.yaml b/data/custodian/JP-13-ITA-L-ICNL.yaml index 9b3816b93c..a6e5cd6bb5 100644 --- a/data/custodian/JP-13-ITA-L-ICNL.yaml +++ b/data/custodian/JP-13-ITA-L-ICNL.yaml @@ -152,3 +152,20 @@ location: geonames_id: 1861321 geonames_name: Itabashi feature_code: PPLX +logo_enrichment: + enrichment_timestamp: '2025-12-25T15:10:05.605904+00:00' + source_url: https://nishidai-lib.jp + extraction_method: crawl4ai + claims: + - claim_type: og_image_url + claim_value: https://nishidai-lib.jp/wp-content/themes/commonlibrary/img/common/default_2.jpg + source_url: https://nishidai-lib.jp + css_selector: '[document] > html > head > meta:nth-of-type(10)' + retrieved_on: '2025-12-25T15:10:05.605904+00:00' + extraction_method: crawl4ai_meta_og + summary: + total_claims: 1 + has_primary_logo: false + has_favicon: false + has_og_image: true + favicon_count: 0 diff --git a/data/custodian/JP-13-ITA-L-ICSL-itabashi_city_shimura_library.yaml b/data/custodian/JP-13-ITA-L-ICSL-itabashi_city_shimura_library.yaml index a21b11704f..68b776b94c 100644 --- a/data/custodian/JP-13-ITA-L-ICSL-itabashi_city_shimura_library.yaml +++ b/data/custodian/JP-13-ITA-L-ICSL-itabashi_city_shimura_library.yaml @@ -32,13 +32,14 @@ ghcid: method: CH_ANNOTATOR_SOURCE ghcid_history: - ghcid: JP-13-ITA-L-ICSL-itabashi_city_shimura_library - valid_from: "2025-12-10T09:44:05Z" + valid_from: '2025-12-10T09:44:05Z' valid_to: null - reason: "Corrected region code from JP-TO (abbreviation) to JP-13 (Tokyo) per ISO 3166-2:JP" + reason: Corrected region code from JP-TO (abbreviation) to JP-13 (Tokyo) per ISO + 3166-2:JP - ghcid: JP-TO-ITA-L-ICSL-itabashi_city_shimura_library valid_from: null - valid_to: "2025-12-10T09:44:05Z" - reason: "Previous GHCID with incorrect region code" + valid_to: '2025-12-10T09:44:05Z' + reason: Previous GHCID with incorrect region code - ghcid: JP-TO-ITA-L-ICSL-itabashi_city_shimura_library ghcid_numeric: 11165399925052889103 valid_from: '2025-12-06T23:38:43.489463+00:00' @@ -96,8 +97,8 @@ ch_annotator: annotation_metadata: confidence_score: 0.98 verified: false - verification_date: - verified_by: + verification_date: null + verified_by: null entity_claims: - claim_type: full_name claim_value: Itabashi City Shimura Library @@ -151,3 +152,20 @@ location: geonames_id: 1861321 geonames_name: Itabashi feature_code: PPLX +logo_enrichment: + enrichment_timestamp: '2025-12-25T15:10:15.039906+00:00' + source_url: https://www.shimura-lib.jp + extraction_method: crawl4ai + claims: + - claim_type: og_image_url + claim_value: https://www.shimura-lib.jp/wp-content/themes/shimura/img/common/default_2.jpg + source_url: https://www.shimura-lib.jp + css_selector: '[document] > html > head > meta:nth-of-type(10)' + retrieved_on: '2025-12-25T15:10:15.039906+00:00' + extraction_method: crawl4ai_meta_og + summary: + total_claims: 1 + has_primary_logo: false + has_favicon: false + has_og_image: true + favicon_count: 0 diff --git a/data/custodian/JP-13-ITA-L-ICSL.yaml b/data/custodian/JP-13-ITA-L-ICSL.yaml index bc46895619..e8e7383ded 100644 --- a/data/custodian/JP-13-ITA-L-ICSL.yaml +++ b/data/custodian/JP-13-ITA-L-ICSL.yaml @@ -152,3 +152,20 @@ location: geonames_id: 1861321 geonames_name: Itabashi feature_code: PPLX +logo_enrichment: + enrichment_timestamp: '2025-12-25T15:10:22.603241+00:00' + source_url: https://shimizu-lib.jp + extraction_method: crawl4ai + claims: + - claim_type: og_image_url + claim_value: https://shimizu-lib.jp/wp-content/themes/commonlibrary/img/common/default_2.jpg + source_url: https://shimizu-lib.jp + css_selector: '[document] > html > head > meta:nth-of-type(10)' + retrieved_on: '2025-12-25T15:10:22.603241+00:00' + extraction_method: crawl4ai_meta_og + summary: + total_claims: 1 + has_primary_logo: false + has_favicon: false + has_og_image: true + favicon_count: 0 diff --git a/data/custodian/JP-13-ITA-L-NUSM.yaml b/data/custodian/JP-13-ITA-L-NUSM.yaml index dd2759db44..27b79b7700 100644 --- a/data/custodian/JP-13-ITA-L-NUSM.yaml +++ b/data/custodian/JP-13-ITA-L-NUSM.yaml @@ -37,13 +37,14 @@ ghcid: method: CH_ANNOTATOR_SOURCE ghcid_history: - ghcid: JP-13-ITA-L-NUSM - valid_from: "2025-12-10T09:44:05Z" + valid_from: '2025-12-10T09:44:05Z' valid_to: null - reason: "Corrected region code from JP-TO (abbreviation) to JP-13 (Tokyo) per ISO 3166-2:JP" + reason: Corrected region code from JP-TO (abbreviation) to JP-13 (Tokyo) per ISO + 3166-2:JP - ghcid: JP-TO-ITA-L-NUSM valid_from: null - valid_to: "2025-12-10T09:44:05Z" - reason: "Previous GHCID with incorrect region code" + valid_to: '2025-12-10T09:44:05Z' + reason: Previous GHCID with incorrect region code - ghcid: JP-TO-ITA-L-NUSM ghcid_numeric: 3084361680596267918 valid_from: '2025-12-06T23:38:54.701650+00:00' @@ -101,8 +102,8 @@ ch_annotator: annotation_metadata: confidence_score: 0.98 verified: false - verification_date: - verified_by: + verification_date: null + verified_by: null entity_claims: - claim_type: full_name claim_value: Nihon University School of Medicine @@ -204,3 +205,22 @@ location: geonames_id: 1861321 geonames_name: Itabashi feature_code: PPLX +logo_enrichment: + enrichment_timestamp: '2025-12-25T15:43:55.917150+00:00' + source_url: http://www.med.nihon-u.ac.jp/library + extraction_method: crawl4ai + claims: + - claim_type: favicon_url + claim_value: http://www.med.nihon-u.ac.jp/image/favicon.ico + source_url: http://www.med.nihon-u.ac.jp/library + css_selector: '[document] > html > head > link:nth-of-type(2)' + retrieved_on: '2025-12-25T15:43:55.917150+00:00' + extraction_method: crawl4ai_link_rel + favicon_type: image/vnd.microsoft.icon + favicon_sizes: '' + summary: + total_claims: 1 + has_primary_logo: false + has_favicon: true + has_og_image: false + favicon_count: 1 diff --git a/data/custodian/JP-13-ITA-L-SL.yaml b/data/custodian/JP-13-ITA-L-SL.yaml index df6e7d4d21..2c43e64905 100644 --- a/data/custodian/JP-13-ITA-L-SL.yaml +++ b/data/custodian/JP-13-ITA-L-SL.yaml @@ -37,13 +37,14 @@ ghcid: method: CH_ANNOTATOR_SOURCE ghcid_history: - ghcid: JP-13-ITA-L-SL - valid_from: "2025-12-10T09:44:05Z" + valid_from: '2025-12-10T09:44:05Z' valid_to: null - reason: "Corrected region code from JP-TO (abbreviation) to JP-13 (Tokyo) per ISO 3166-2:JP" + reason: Corrected region code from JP-TO (abbreviation) to JP-13 (Tokyo) per ISO + 3166-2:JP - ghcid: JP-TO-ITA-L-SL valid_from: null - valid_to: "2025-12-10T09:44:05Z" - reason: "Previous GHCID with incorrect region code" + valid_to: '2025-12-10T09:44:05Z' + reason: Previous GHCID with incorrect region code - ghcid: JP-TO-ITA-L-SL ghcid_numeric: 9557422405834936949 valid_from: '2025-12-06T23:38:56.944850+00:00' @@ -101,8 +102,8 @@ ch_annotator: annotation_metadata: confidence_score: 0.98 verified: false - verification_date: - verified_by: + verification_date: null + verified_by: null entity_claims: - claim_type: full_name claim_value: SHUKUTOKUDAIGAKUTOKYO Library @@ -204,3 +205,22 @@ location: geonames_id: 1861321 geonames_name: Itabashi feature_code: PPLX +logo_enrichment: + enrichment_timestamp: '2025-12-25T15:44:14.839927+00:00' + source_url: http://www.shukutoku.ac.jp/campuslife/library/tokyo + extraction_method: crawl4ai + claims: + - claim_type: favicon_url + claim_value: http://www.shukutoku.ac.jp/favicon.ico + source_url: http://www.shukutoku.ac.jp/campuslife/library/tokyo + css_selector: '[document] > html > body > link' + retrieved_on: '2025-12-25T15:44:14.839927+00:00' + extraction_method: crawl4ai_link_rel + favicon_type: '' + favicon_sizes: '' + summary: + total_claims: 1 + has_primary_logo: false + has_favicon: true + has_og_image: false + favicon_count: 1 diff --git a/data/custodian/JP-13-ITA-L-TL-tokushimakogyotankidaigaku_library.yaml b/data/custodian/JP-13-ITA-L-TL-tokushimakogyotankidaigaku_library.yaml index b7f24d1673..21fabb32ab 100644 --- a/data/custodian/JP-13-ITA-L-TL-tokushimakogyotankidaigaku_library.yaml +++ b/data/custodian/JP-13-ITA-L-TL-tokushimakogyotankidaigaku_library.yaml @@ -37,13 +37,14 @@ ghcid: method: CH_ANNOTATOR_SOURCE ghcid_history: - ghcid: JP-13-ITA-L-TL-tokushimakogyotankidaigaku_library - valid_from: "2025-12-10T09:44:05Z" + valid_from: '2025-12-10T09:44:05Z' valid_to: null - reason: "Corrected region code from JP-TO (abbreviation) to JP-13 (Tokyo) per ISO 3166-2:JP" + reason: Corrected region code from JP-TO (abbreviation) to JP-13 (Tokyo) per ISO + 3166-2:JP - ghcid: JP-TO-ITA-L-TL-tokushimakogyotankidaigaku_library valid_from: null - valid_to: "2025-12-10T09:44:05Z" - reason: "Previous GHCID with incorrect region code" + valid_to: '2025-12-10T09:44:05Z' + reason: Previous GHCID with incorrect region code - ghcid: JP-TO-ITA-L-TL-tokushimakogyotankidaigaku_library ghcid_numeric: 16587535559392313608 valid_from: '2025-12-06T23:38:57.282030+00:00' @@ -101,8 +102,8 @@ ch_annotator: annotation_metadata: confidence_score: 0.98 verified: false - verification_date: - verified_by: + verification_date: null + verified_by: null entity_claims: - claim_type: full_name claim_value: TOKUSHIMAKOGYOTANKIDAIGAKU Library @@ -206,3 +207,28 @@ location: geonames_id: 1861302 geonames_name: Itanoura feature_code: PPL +logo_enrichment: + enrichment_timestamp: '2025-12-25T15:44:24.873408+00:00' + source_url: http://www.tokuco.ac.jp/daigaku/library.php + extraction_method: crawl4ai + claims: + - claim_type: favicon_url + claim_value: https://www.tokuco.ac.jp/wordpress/wp-content/uploads/2023/06/cropped-favicon_180px-180x180.png + source_url: http://www.tokuco.ac.jp/daigaku/library.php + css_selector: '[document] > html > head > link:nth-of-type(14)' + retrieved_on: '2025-12-25T15:44:24.873408+00:00' + extraction_method: crawl4ai_link_rel + favicon_type: '' + favicon_sizes: '' + - claim_type: og_image_url + claim_value: https://www.tokuco.ac.jp/shared/img/common/OGP.jpg + source_url: http://www.tokuco.ac.jp/daigaku/library.php + css_selector: '[document] > html > head > meta:nth-of-type(6)' + retrieved_on: '2025-12-25T15:44:24.873408+00:00' + extraction_method: crawl4ai_meta_og + summary: + total_claims: 2 + has_primary_logo: false + has_favicon: true + has_og_image: true + favicon_count: 3 diff --git a/data/custodian/JP-13-ITA-L-TL.yaml b/data/custodian/JP-13-ITA-L-TL.yaml index fc37580f79..91930f2afc 100644 --- a/data/custodian/JP-13-ITA-L-TL.yaml +++ b/data/custodian/JP-13-ITA-L-TL.yaml @@ -205,3 +205,38 @@ location: geonames_id: 1861321 geonames_name: Itabashi feature_code: PPLX +logo_enrichment: + enrichment_timestamp: '2025-12-25T15:44:33.045363+00:00' + source_url: http://www.tokyo-kasei.ac.jp/library + extraction_method: crawl4ai + claims: + - claim_type: logo_url + claim_value: http://www.tokyo-kasei.ac.jp/common/image/logo.png + source_url: http://www.tokyo-kasei.ac.jp/library + css_selector: '[document] > html > body.isPC.is-scrolling > div.wrapper-new:nth-of-type(4) + > nav.global-nav-new > div.global-nav-new__header > div.global-nav-new__logo + > a > img' + retrieved_on: '2025-12-25T15:44:33.045363+00:00' + extraction_method: crawl4ai_header_logo + detection_confidence: high + alt_text: 東京家政大学 + - claim_type: favicon_url + claim_value: http://www.tokyo-kasei.ac.jp/common/image/touch-icon.png + source_url: http://www.tokyo-kasei.ac.jp/library + css_selector: '[document] > html > head > link:nth-of-type(5)' + retrieved_on: '2025-12-25T15:44:33.045363+00:00' + extraction_method: crawl4ai_link_rel + favicon_type: '' + favicon_sizes: '' + - claim_type: og_image_url + claim_value: http://www.tokyo-kasei.ac.jp/common/image/og_image.jpg + source_url: http://www.tokyo-kasei.ac.jp/library + css_selector: '[document] > html > head > meta:nth-of-type(7)' + retrieved_on: '2025-12-25T15:44:33.045363+00:00' + extraction_method: crawl4ai_meta_og + summary: + total_claims: 3 + has_primary_logo: true + has_favicon: true + has_og_image: true + favicon_count: 2 diff --git a/data/custodian/JP-13-ITA-M-IAM.yaml b/data/custodian/JP-13-ITA-M-IAM.yaml index 99a5d4b63b..8789042b69 100644 --- a/data/custodian/JP-13-ITA-M-IAM.yaml +++ b/data/custodian/JP-13-ITA-M-IAM.yaml @@ -43,13 +43,14 @@ ghcid: method: CH_ANNOTATOR_SOURCE ghcid_history: - ghcid: JP-13-ITA-M-IAM - valid_from: "2025-12-10T09:44:05Z" + valid_from: '2025-12-10T09:44:05Z' valid_to: null - reason: "Corrected region code from JP-TO (abbreviation) to JP-13 (Tokyo) per ISO 3166-2:JP" + reason: Corrected region code from JP-TO (abbreviation) to JP-13 (Tokyo) per ISO + 3166-2:JP - ghcid: JP-TO-ITA-M-IAM valid_from: null - valid_to: "2025-12-10T09:44:05Z" - reason: "Previous GHCID with incorrect region code" + valid_to: '2025-12-10T09:44:05Z' + reason: Previous GHCID with incorrect region code - ghcid: JP-TO-ITA-M-IAM ghcid_numeric: 6051803860935817613 valid_from: '2025-12-06T23:38:33.500746+00:00' @@ -108,8 +109,8 @@ ch_annotator: annotation_metadata: confidence_score: 0.98 verified: false - verification_date: - verified_by: + verification_date: null + verified_by: null entity_claims: - claim_type: full_name claim_value: ITABASHI ART MUSEUM @@ -211,7 +212,8 @@ wikidata_enrichment: instance_of: &id005 - id: Q207694 label: art museum - description: building or space for the exhibition of art (for institution, use Q3196771) + description: building or space for the exhibition of art (for institution, use + Q3196771) wikidata_instance_of: *id005 wikidata_location: country: &id006 @@ -263,3 +265,36 @@ location: postal_code: 175-0092 street_address: AKATSUKA, Itabashi Ku, Tokyo To, 175-0092 normalization_timestamp: '2025-12-09T12:21:38.963724+00:00' +logo_enrichment: + enrichment_timestamp: '2025-12-25T15:44:50.731319+00:00' + source_url: https://www.city.itabashi.tokyo.jp/artmuseum + extraction_method: crawl4ai + claims: + - claim_type: logo_url + claim_value: https://www.city.itabashi.tokyo.jp/_template_/_site_/project_artmuseum/_res/design/images/header/tlogo.png + source_url: https://www.city.itabashi.tokyo.jp/artmuseum + css_selector: '#tlogo > h1 > a > img' + retrieved_on: '2025-12-25T15:44:50.731319+00:00' + extraction_method: crawl4ai_header_logo + detection_confidence: high + alt_text: 板橋区立美術館 ITABASHI ART MUSEUM + - claim_type: favicon_url + claim_value: https://www.city.itabashi.tokyo.jp/_template_/_site_/project_artmuseum/_res/images/apple-touch-icon-precomposed.png + source_url: https://www.city.itabashi.tokyo.jp/artmuseum + css_selector: '[document] > html > head > link:nth-of-type(5)' + retrieved_on: '2025-12-25T15:44:50.731319+00:00' + extraction_method: crawl4ai_link_rel + favicon_type: '' + favicon_sizes: '' + - claim_type: og_image_url + claim_value: https://www.city.itabashi.tokyo.jp/_template_/_site_/_default_/_res/images/sns/ogimage.png + source_url: https://www.city.itabashi.tokyo.jp/artmuseum + css_selector: '[document] > html > head > meta:nth-of-type(8)' + retrieved_on: '2025-12-25T15:44:50.731319+00:00' + extraction_method: crawl4ai_meta_og + summary: + total_claims: 3 + has_primary_logo: true + has_favicon: true + has_og_image: true + favicon_count: 2 diff --git a/data/custodian/JP-13-ITA-M-IBG.yaml b/data/custodian/JP-13-ITA-M-IBG.yaml index 17ff102d1c..350de18afa 100644 --- a/data/custodian/JP-13-ITA-M-IBG.yaml +++ b/data/custodian/JP-13-ITA-M-IBG.yaml @@ -32,13 +32,14 @@ ghcid: method: CH_ANNOTATOR_SOURCE ghcid_history: - ghcid: JP-13-ITA-M-IBG - valid_from: "2025-12-10T09:44:05Z" + valid_from: '2025-12-10T09:44:05Z' valid_to: null - reason: "Corrected region code from JP-TO (abbreviation) to JP-13 (Tokyo) per ISO 3166-2:JP" + reason: Corrected region code from JP-TO (abbreviation) to JP-13 (Tokyo) per ISO + 3166-2:JP - ghcid: JP-TO-ITA-M-IBG valid_from: null - valid_to: "2025-12-10T09:44:05Z" - reason: "Previous GHCID with incorrect region code" + valid_to: '2025-12-10T09:44:05Z' + reason: Previous GHCID with incorrect region code - ghcid: JP-TO-ITA-M-IBG ghcid_numeric: 10994599943769151975 valid_from: '2025-12-06T23:38:33.495766+00:00' @@ -96,8 +97,8 @@ ch_annotator: annotation_metadata: confidence_score: 0.98 verified: false - verification_date: - verified_by: + verification_date: null + verified_by: null entity_claims: - claim_type: full_name claim_value: ITABASHI BOTANICAL GARDENS @@ -151,3 +152,28 @@ location: geonames_id: 1861321 geonames_name: Itabashi feature_code: PPLX +logo_enrichment: + enrichment_timestamp: '2025-12-25T15:45:01.091956+00:00' + source_url: https://www.seibu-la.co.jp/nettaikan + extraction_method: crawl4ai + claims: + - claim_type: favicon_url + claim_value: https://www.seibu-la.co.jp/nettaikan/files/apple-touch-icon.png + source_url: https://www.seibu-la.co.jp/nettaikan + css_selector: '#nettaikan > head > link:nth-of-type(5)' + retrieved_on: '2025-12-25T15:45:01.091956+00:00' + extraction_method: crawl4ai_link_rel + favicon_type: '' + favicon_sizes: '' + - claim_type: og_image_url + claim_value: https://www.seibu-la.co.jp/nettaikan//files/og-image.jpg + source_url: https://www.seibu-la.co.jp/nettaikan + css_selector: '#nettaikan > head > meta:nth-of-type(14)' + retrieved_on: '2025-12-25T15:45:01.091956+00:00' + extraction_method: crawl4ai_meta_og + summary: + total_claims: 2 + has_primary_logo: false + has_favicon: true + has_og_image: true + favicon_count: 2 diff --git a/data/custodian/JP-13-ITA-M-IHM.yaml b/data/custodian/JP-13-ITA-M-IHM.yaml index 02b82d1bd6..5c0fddf54b 100644 --- a/data/custodian/JP-13-ITA-M-IHM.yaml +++ b/data/custodian/JP-13-ITA-M-IHM.yaml @@ -828,3 +828,36 @@ youtube_enrichment: comments: [] thumbnail_url: https://i.ytimg.com/vi/w6iY87pke0I/hqdefault.jpg status: SUCCESS +logo_enrichment: + enrichment_timestamp: '2025-12-25T15:45:08.591037+00:00' + source_url: https://www.city.itabashi.tokyo.jp/kyodoshiryokan + extraction_method: crawl4ai + claims: + - claim_type: logo_url + claim_value: https://www.city.itabashi.tokyo.jp/_template_/_site_/project_kyoudo/_res/design/images/header/tlogo.png + source_url: https://www.city.itabashi.tokyo.jp/kyodoshiryokan + css_selector: '#tlogo > h1 > a > img' + retrieved_on: '2025-12-25T15:45:08.591037+00:00' + extraction_method: crawl4ai_header_logo + detection_confidence: high + alt_text: 板橋区立郷土資料館 ITABASHI HISTORICAL MUSEUM + - claim_type: favicon_url + claim_value: https://www.city.itabashi.tokyo.jp/_template_/_site_/project_kyoudo/_res/images/apple-touch-icon-precomposed.png + source_url: https://www.city.itabashi.tokyo.jp/kyodoshiryokan + css_selector: '[document] > html > head > link:nth-of-type(5)' + retrieved_on: '2025-12-25T15:45:08.591037+00:00' + extraction_method: crawl4ai_link_rel + favicon_type: '' + favicon_sizes: '' + - claim_type: og_image_url + claim_value: https://www.city.itabashi.tokyo.jp/_template_/_site_/_default_/_res/images/sns/ogimage.png + source_url: https://www.city.itabashi.tokyo.jp/kyodoshiryokan + css_selector: '[document] > html > head > meta:nth-of-type(8)' + retrieved_on: '2025-12-25T15:45:08.591037+00:00' + extraction_method: crawl4ai_meta_og + summary: + total_claims: 3 + has_primary_logo: true + has_favicon: true + has_og_image: true + favicon_count: 2 diff --git a/data/custodian/JP-13-ITA-M-JCM.yaml b/data/custodian/JP-13-ITA-M-JCM.yaml index 660ea71098..0b088fd337 100644 --- a/data/custodian/JP-13-ITA-M-JCM.yaml +++ b/data/custodian/JP-13-ITA-M-JCM.yaml @@ -32,13 +32,14 @@ ghcid: method: CH_ANNOTATOR_SOURCE ghcid_history: - ghcid: JP-13-ITA-M-JCM - valid_from: "2025-12-10T09:44:05Z" + valid_from: '2025-12-10T09:44:05Z' valid_to: null - reason: "Corrected region code from JP-TO (abbreviation) to JP-13 (Tokyo) per ISO 3166-2:JP" + reason: Corrected region code from JP-TO (abbreviation) to JP-13 (Tokyo) per ISO + 3166-2:JP - ghcid: JP-TO-ITA-M-JCM valid_from: null - valid_to: "2025-12-10T09:44:05Z" - reason: "Previous GHCID with incorrect region code" + valid_to: '2025-12-10T09:44:05Z' + reason: Previous GHCID with incorrect region code - ghcid: JP-TO-ITA-M-JCM ghcid_numeric: 3039065895030684085 valid_from: '2025-12-06T23:38:33.493555+00:00' @@ -96,8 +97,8 @@ ch_annotator: annotation_metadata: confidence_score: 0.98 verified: false - verification_date: - verified_by: + verification_date: null + verified_by: null entity_claims: - claim_type: full_name claim_value: JAPAN CALLIGRAPHY MUSEUM @@ -151,3 +152,22 @@ location: geonames_id: 1861321 geonames_name: Itabashi feature_code: PPLX +logo_enrichment: + enrichment_timestamp: '2025-12-25T15:45:47.206043+00:00' + source_url: http://www.shodo-bijutsukan.or.jp + extraction_method: crawl4ai + claims: + - claim_type: favicon_url + claim_value: http://www.shodo-bijutsukan.or.jp/img/common/favicon.ico + source_url: http://www.shodo-bijutsukan.or.jp + css_selector: '[document] > html > head > link:nth-of-type(2)' + retrieved_on: '2025-12-25T15:45:47.206043+00:00' + extraction_method: crawl4ai_link_rel + favicon_type: '' + favicon_sizes: '' + summary: + total_claims: 1 + has_primary_logo: false + has_favicon: true + has_og_image: false + favicon_count: 1 diff --git a/data/custodian/JP-13-ITA-M-MB.yaml b/data/custodian/JP-13-ITA-M-MB.yaml index 7f2159a96e..54cad5cc76 100644 --- a/data/custodian/JP-13-ITA-M-MB.yaml +++ b/data/custodian/JP-13-ITA-M-MB.yaml @@ -43,13 +43,14 @@ ghcid: method: CH_ANNOTATOR_SOURCE ghcid_history: - ghcid: JP-13-ITA-M-MB - valid_from: "2025-12-10T09:44:05Z" + valid_from: '2025-12-10T09:44:05Z' valid_to: null - reason: "Corrected region code from JP-TO (abbreviation) to JP-13 (Tokyo) per ISO 3166-2:JP" + reason: Corrected region code from JP-TO (abbreviation) to JP-13 (Tokyo) per ISO + 3166-2:JP - ghcid: JP-TO-ITA-M-MB valid_from: null - valid_to: "2025-12-10T09:44:05Z" - reason: "Previous GHCID with incorrect region code" + valid_to: '2025-12-10T09:44:05Z' + reason: Previous GHCID with incorrect region code - ghcid: JP-TO-ITA-M-MB ghcid_numeric: 3689810229605177396 valid_from: '2025-12-06T23:38:39.322806+00:00' @@ -108,8 +109,8 @@ ch_annotator: annotation_metadata: confidence_score: 0.98 verified: false - verification_date: - verified_by: + verification_date: null + verified_by: null entity_claims: - claim_type: full_name claim_value: Miki Bunko @@ -234,3 +235,28 @@ location: postal_code: 771-0212 street_address: NAKAGIRAI, Itano Gun Matsushige Cho, Tokushima Ken, 771-0212 normalization_timestamp: '2025-12-09T12:21:39.254461+00:00' +logo_enrichment: + enrichment_timestamp: '2025-12-25T15:46:05.964284+00:00' + source_url: http://www.mikibunko.jp + extraction_method: crawl4ai + claims: + - claim_type: favicon_url + claim_value: http://www.mikibunko.jp/images/head/safari-pinned-tab.svg + source_url: http://www.mikibunko.jp + css_selector: '[document] > html > head > link:nth-of-type(9)' + retrieved_on: '2025-12-25T15:46:05.964284+00:00' + extraction_method: crawl4ai_link_rel + favicon_type: '' + favicon_sizes: '' + - claim_type: og_image_url + claim_value: http://www.mikibunko.jp/images/head/og-image.jpg + source_url: http://www.mikibunko.jp + css_selector: '[document] > html > head > meta:nth-of-type(11)' + retrieved_on: '2025-12-25T15:46:05.964284+00:00' + extraction_method: crawl4ai_meta_og + summary: + total_claims: 2 + has_primary_logo: false + has_favicon: true + has_og_image: true + favicon_count: 4 diff --git a/data/custodian/JP-13-ITA-M-MHFMJPM.yaml b/data/custodian/JP-13-ITA-M-MHFMJPM.yaml index f639e78db2..16c2ae11cc 100644 --- a/data/custodian/JP-13-ITA-M-MHFMJPM.yaml +++ b/data/custodian/JP-13-ITA-M-MHFMJPM.yaml @@ -256,3 +256,28 @@ location: postal_code: 771-0220 street_address: HIROSHIMA, Itano Gun Matsushige Cho, Tokushima Ken, 771-0220 normalization_timestamp: '2025-12-09T12:21:39.312002+00:00' +logo_enrichment: + enrichment_timestamp: '2025-12-25T15:46:38.699177+00:00' + source_url: http://www.joruri.jp + extraction_method: crawl4ai + claims: + - claim_type: favicon_url + claim_value: http://www.joruri.jp/apple-touch-icon.png + source_url: http://www.joruri.jp + css_selector: '[document] > html.js > head > link:nth-of-type(16)' + retrieved_on: '2025-12-25T15:46:38.699177+00:00' + extraction_method: crawl4ai_link_rel + favicon_type: '' + favicon_sizes: '' + - claim_type: og_image_url + claim_value: http://www.joruri.jp/og-img.jpg + source_url: http://www.joruri.jp + css_selector: '[document] > html.js > head > meta:nth-of-type(14)' + retrieved_on: '2025-12-25T15:46:38.699177+00:00' + extraction_method: crawl4ai_meta_og + summary: + total_claims: 2 + has_primary_logo: false + has_favicon: true + has_og_image: true + favicon_count: 1 diff --git a/data/custodian/JP-13-ITA-M-TKUM.yaml b/data/custodian/JP-13-ITA-M-TKUM.yaml index b45732d1ec..52fc94cf54 100644 --- a/data/custodian/JP-13-ITA-M-TKUM.yaml +++ b/data/custodian/JP-13-ITA-M-TKUM.yaml @@ -231,3 +231,38 @@ location: postal_code: 173-8602 street_address: KAGA, Itabashi Ku, Tokyo To, 173-8602 normalization_timestamp: '2025-12-09T12:21:39.367632+00:00' +logo_enrichment: + enrichment_timestamp: '2025-12-25T15:46:45.567511+00:00' + source_url: https://www.tokyo-kasei.ac.jp/academics/museum + extraction_method: crawl4ai + claims: + - claim_type: logo_url + claim_value: https://www.tokyo-kasei.ac.jp/common/image/logo.png + source_url: https://www.tokyo-kasei.ac.jp/academics/museum + css_selector: '[document] > html > body.museum.isPC > div.wrapper-new:nth-of-type(4) + > nav.global-nav-new > div.global-nav-new__header > div.global-nav-new__logo + > a > img' + retrieved_on: '2025-12-25T15:46:45.567511+00:00' + extraction_method: crawl4ai_header_logo + detection_confidence: high + alt_text: 東京家政大学 + - claim_type: favicon_url + claim_value: https://www.tokyo-kasei.ac.jp/common/image/touch-icon.png + source_url: https://www.tokyo-kasei.ac.jp/academics/museum + css_selector: '[document] > html > head > link:nth-of-type(5)' + retrieved_on: '2025-12-25T15:46:45.567511+00:00' + extraction_method: crawl4ai_link_rel + favicon_type: '' + favicon_sizes: '' + - claim_type: og_image_url + claim_value: https://www.tokyo-kasei.ac.jp/common/image/og_image.jpg + source_url: https://www.tokyo-kasei.ac.jp/academics/museum + css_selector: '[document] > html > head > meta:nth-of-type(7)' + retrieved_on: '2025-12-25T15:46:45.567511+00:00' + extraction_method: crawl4ai_meta_og + summary: + total_claims: 3 + has_primary_logo: true + has_favicon: true + has_og_image: true + favicon_count: 2 diff --git a/data/custodian/JP-13-ITA-M-TPCBCP.yaml b/data/custodian/JP-13-ITA-M-TPCBCP.yaml index a61f0b001d..bfd8225295 100644 --- a/data/custodian/JP-13-ITA-M-TPCBCP.yaml +++ b/data/custodian/JP-13-ITA-M-TPCBCP.yaml @@ -265,3 +265,28 @@ location: postal_code: 779-0108 street_address: INUBUSHI, Itano Gun Itano Cho, Tokushima Ken, 779-0108 normalization_timestamp: '2025-12-09T12:21:39.425468+00:00' +logo_enrichment: + enrichment_timestamp: '2025-12-25T15:46:54.365338+00:00' + source_url: https://www.pref.tokushima.lg.jp/rekishiru + extraction_method: crawl4ai + claims: + - claim_type: favicon_url + claim_value: https://www.pref.tokushima.lg.jp/favicon.ico + source_url: https://www.pref.tokushima.lg.jp/rekishiru + css_selector: '[document] > html > head > link' + retrieved_on: '2025-12-25T15:46:54.365338+00:00' + extraction_method: crawl4ai_link_rel + favicon_type: image/x-icon + favicon_sizes: '' + - claim_type: og_image_url + claim_value: https://www.pref.tokushima.lg.jp/file/cooperation/banner_white.png + source_url: https://www.pref.tokushima.lg.jp/rekishiru + css_selector: '[document] > html > head > meta:nth-of-type(4)' + retrieved_on: '2025-12-25T15:46:54.365338+00:00' + extraction_method: crawl4ai_meta_og + summary: + total_claims: 2 + has_primary_logo: false + has_favicon: true + has_og_image: true + favicon_count: 1 diff --git a/data/custodian/JP-13-IWA-L-IL.yaml b/data/custodian/JP-13-IWA-L-IL.yaml index b0b4b39fff..22761a47e8 100644 --- a/data/custodian/JP-13-IWA-L-IL.yaml +++ b/data/custodian/JP-13-IWA-L-IL.yaml @@ -32,13 +32,14 @@ ghcid: method: CH_ANNOTATOR_SOURCE ghcid_history: - ghcid: JP-13-IWA-L-IL - valid_from: "2025-12-10T09:44:05Z" + valid_from: '2025-12-10T09:44:05Z' valid_to: null - reason: "Corrected region code from JP-TO (abbreviation) to JP-13 (Tokyo) per ISO 3166-2:JP" + reason: Corrected region code from JP-TO (abbreviation) to JP-13 (Tokyo) per ISO + 3166-2:JP - ghcid: JP-TO-IWA-L-IL valid_from: null - valid_to: "2025-12-10T09:44:05Z" - reason: "Previous GHCID with incorrect region code" + valid_to: '2025-12-10T09:44:05Z' + reason: Previous GHCID with incorrect region code - ghcid: JP-TO-IWA-L-IL ghcid_numeric: 4654274690900483203 valid_from: '2025-12-06T23:38:46.748001+00:00' @@ -96,8 +97,8 @@ ch_annotator: annotation_metadata: confidence_score: 0.98 verified: false - verification_date: - verified_by: + verification_date: null + verified_by: null entity_claims: - claim_type: full_name claim_value: IWAMICHORITSU Library @@ -153,3 +154,22 @@ location: geonames_id: 9633050 geonames_name: Iwami feature_code: PPL +logo_enrichment: + enrichment_timestamp: '2025-12-25T15:47:01.982908+00:00' + source_url: http://www.iwami.gr.jp/library + extraction_method: crawl4ai + claims: + - claim_type: favicon_url + claim_value: http://www.iwami.gr.jp/apple-touch-icon.png + source_url: http://www.iwami.gr.jp/library + css_selector: '[document] > html > head > link' + retrieved_on: '2025-12-25T15:47:01.982908+00:00' + extraction_method: crawl4ai_link_rel + favicon_type: '' + favicon_sizes: '' + summary: + total_claims: 1 + has_primary_logo: false + has_favicon: true + has_og_image: false + favicon_count: 1 diff --git a/data/custodian/JP-13-IZU-M-TCMAIKMH.yaml b/data/custodian/JP-13-IZU-M-TCMAIKMH.yaml index f2b945d20d..ee8cd2dff2 100644 --- a/data/custodian/JP-13-IZU-M-TCMAIKMH.yaml +++ b/data/custodian/JP-13-IZU-M-TCMAIKMH.yaml @@ -286,3 +286,28 @@ location: geonames_id: 1861074 feature_code: PPL normalization_timestamp: '2025-12-09T06:53:34.325553+00:00' +logo_enrichment: + enrichment_timestamp: '2025-12-25T15:47:45.231885+00:00' + source_url: https://www.city.toyooka.lg.jp/1019810/1019847/itoh-museum + extraction_method: crawl4ai + claims: + - claim_type: favicon_url + claim_value: https://www.city.toyooka.lg.jp/_template_/_site_/_default_/_res/images/apple-touch-icon-precomposed.png + source_url: https://www.city.toyooka.lg.jp/1019810/1019847/itoh-museum + css_selector: '[document] > html > head > link:nth-of-type(4)' + retrieved_on: '2025-12-25T15:47:45.231885+00:00' + extraction_method: crawl4ai_link_rel + favicon_type: '' + favicon_sizes: '' + - claim_type: og_image_url + claim_value: https://www.city.toyooka.lg.jp/_template_/_site_/_default_/_res/images/sns/ogimage.png + source_url: https://www.city.toyooka.lg.jp/1019810/1019847/itoh-museum + css_selector: '[document] > html > head > meta:nth-of-type(8)' + retrieved_on: '2025-12-25T15:47:45.231885+00:00' + extraction_method: crawl4ai_meta_og + summary: + total_claims: 2 + has_primary_logo: false + has_favicon: true + has_og_image: true + favicon_count: 2 diff --git a/data/custodian/JP-13-KAI-L-KL-kaiyochoritsushishikui_library.yaml b/data/custodian/JP-13-KAI-L-KL-kaiyochoritsushishikui_library.yaml index dd86110cca..0fc3108b45 100644 --- a/data/custodian/JP-13-KAI-L-KL-kaiyochoritsushishikui_library.yaml +++ b/data/custodian/JP-13-KAI-L-KL-kaiyochoritsushishikui_library.yaml @@ -15,7 +15,8 @@ original_entry: city: Kaifu Gun Kaiyo Cho region: Tokushima Ken postal_code: 775-0501 - street_address: 375 SHISHIKUIURA SHISHIKUI, Kaifu Gun Kaiyo Cho, Tokushima Ken, 775-0501 + street_address: 375 SHISHIKUIURA SHISHIKUI, Kaifu Gun Kaiyo Cho, Tokushima Ken, + 775-0501 processing_timestamp: '2025-12-06T23:38:47.391846+00:00' ghcid: ghcid_current: JP-13-KAI-L-KL-kaiyochoritsushishikui_library @@ -32,13 +33,14 @@ ghcid: method: CH_ANNOTATOR_SOURCE ghcid_history: - ghcid: JP-13-KAI-L-KL-kaiyochoritsushishikui_library - valid_from: "2025-12-10T09:44:05Z" + valid_from: '2025-12-10T09:44:05Z' valid_to: null - reason: "Corrected region code from JP-TO (abbreviation) to JP-13 (Tokyo) per ISO 3166-2:JP" + reason: Corrected region code from JP-TO (abbreviation) to JP-13 (Tokyo) per ISO + 3166-2:JP - ghcid: JP-TO-KAI-L-KL-kaiyochoritsushishikui_library valid_from: null - valid_to: "2025-12-10T09:44:05Z" - reason: "Previous GHCID with incorrect region code" + valid_to: '2025-12-10T09:44:05Z' + reason: Previous GHCID with incorrect region code - ghcid: JP-TO-KAI-L-KL-kaiyochoritsushishikui_library ghcid_numeric: 18196068420552679977 valid_from: '2025-12-06T23:38:47.391846+00:00' @@ -96,8 +98,8 @@ ch_annotator: annotation_metadata: confidence_score: 0.98 verified: false - verification_date: - verified_by: + verification_date: null + verified_by: null entity_claims: - claim_type: full_name claim_value: KAIYOCHORITSUSHISHIKUI Library @@ -139,7 +141,8 @@ location: region_code: 13 country: JP postal_code: 775-0501 - street_address: 375 SHISHIKUIURA SHISHIKUI, Kaifu Gun Kaiyo Cho, Tokushima Ken, 775-0501 + street_address: 375 SHISHIKUIURA SHISHIKUI, Kaifu Gun Kaiyo Cho, Tokushima Ken, + 775-0501 normalization_timestamp: '2025-12-09T20:21:47.215834+00:00' latitude: 43.57758 longitude: 144.92274 @@ -153,3 +156,20 @@ location: geonames_id: 2129791 geonames_name: Kaiyō feature_code: PPL +logo_enrichment: + enrichment_timestamp: '2025-12-25T15:47:55.701522+00:00' + source_url: http://www.mmpt.town.kainan.tokushima.jp/TOSHO/tosho_top.asp + extraction_method: crawl4ai + claims: + - claim_type: og_image_url + claim_value: http://localhost/TOSHOW/asp/shared/img/snsThumbnail.png + source_url: http://www.mmpt.town.kainan.tokushima.jp/TOSHO/tosho_top.asp + css_selector: '[document] > html > head > meta:nth-of-type(15)' + retrieved_on: '2025-12-25T15:47:55.701522+00:00' + extraction_method: crawl4ai_meta_og + summary: + total_claims: 1 + has_primary_logo: false + has_favicon: false + has_og_image: true + favicon_count: 0 diff --git a/data/custodian/JP-13-KAN-L-KCL.yaml b/data/custodian/JP-13-KAN-L-KCL.yaml index d1ad51308b..5658bf8d15 100644 --- a/data/custodian/JP-13-KAN-L-KCL.yaml +++ b/data/custodian/JP-13-KAN-L-KCL.yaml @@ -32,13 +32,14 @@ ghcid: method: CH_ANNOTATOR_SOURCE ghcid_history: - ghcid: JP-13-KAN-L-KCL - valid_from: "2025-12-10T09:44:05Z" + valid_from: '2025-12-10T09:44:05Z' valid_to: null - reason: "Corrected region code from JP-TO (abbreviation) to JP-13 (Tokyo) per ISO 3166-2:JP" + reason: Corrected region code from JP-TO (abbreviation) to JP-13 (Tokyo) per ISO + 3166-2:JP - ghcid: JP-TO-KAN-L-KCL valid_from: null - valid_to: "2025-12-10T09:44:05Z" - reason: "Previous GHCID with incorrect region code" + valid_to: '2025-12-10T09:44:05Z' + reason: Previous GHCID with incorrect region code - ghcid: JP-TO-KAN-L-KCL ghcid_numeric: 8766406421363021505 valid_from: '2025-12-06T23:38:42.189059+00:00' @@ -96,8 +97,8 @@ ch_annotator: annotation_metadata: confidence_score: 0.98 verified: false - verification_date: - verified_by: + verification_date: null + verified_by: null entity_claims: - claim_type: full_name claim_value: Kanuma City Library @@ -151,3 +152,28 @@ location: geonames_id: 1860098 geonames_name: Kanuma feature_code: PPLA2 +logo_enrichment: + enrichment_timestamp: '2025-12-25T15:50:34.290042+00:00' + source_url: https://www.lib-kanuma.jp + extraction_method: crawl4ai + claims: + - claim_type: favicon_url + claim_value: https://www.lib-kanuma.jp/favicon.ico?v=4a3cd1ede3d498ecea00dc95a0528588 + source_url: https://www.lib-kanuma.jp + css_selector: '[document] > html > head > link:nth-of-type(5)' + retrieved_on: '2025-12-25T15:50:34.290042+00:00' + extraction_method: crawl4ai_link_rel + favicon_type: '' + favicon_sizes: '' + - claim_type: og_image_url + claim_value: https://lib-kanuma.jp/ogp.png + source_url: https://www.lib-kanuma.jp + css_selector: '[document] > html > head > meta:nth-of-type(10)' + retrieved_on: '2025-12-25T15:50:34.290042+00:00' + extraction_method: crawl4ai_meta_og + summary: + total_claims: 2 + has_primary_logo: false + has_favicon: true + has_og_image: true + favicon_count: 1 diff --git a/data/custodian/JP-13-KAN-L-KLA.yaml b/data/custodian/JP-13-KAN-L-KLA.yaml index e5192f4bbb..a74f193833 100644 --- a/data/custodian/JP-13-KAN-L-KLA.yaml +++ b/data/custodian/JP-13-KAN-L-KLA.yaml @@ -152,3 +152,28 @@ location: geonames_id: 1860098 geonames_name: Kanuma feature_code: PPLA2 +logo_enrichment: + enrichment_timestamp: '2025-12-25T15:50:43.338427+00:00' + source_url: https://www.lib-kanuma.jp + extraction_method: crawl4ai + claims: + - claim_type: favicon_url + claim_value: https://www.lib-kanuma.jp/favicon.ico?v=4a3cd1ede3d498ecea00dc95a0528588 + source_url: https://www.lib-kanuma.jp + css_selector: '[document] > html > head > link:nth-of-type(5)' + retrieved_on: '2025-12-25T15:50:43.338427+00:00' + extraction_method: crawl4ai_link_rel + favicon_type: '' + favicon_sizes: '' + - claim_type: og_image_url + claim_value: https://lib-kanuma.jp/ogp.png + source_url: https://www.lib-kanuma.jp + css_selector: '[document] > html > head > meta:nth-of-type(10)' + retrieved_on: '2025-12-25T15:50:43.338427+00:00' + extraction_method: crawl4ai_meta_og + summary: + total_claims: 2 + has_primary_logo: false + has_favicon: true + has_og_image: true + favicon_count: 1 diff --git a/data/custodian/JP-13-KAN-L-KLH.yaml b/data/custodian/JP-13-KAN-L-KLH.yaml index b7475af6cc..e74c1e9039 100644 --- a/data/custodian/JP-13-KAN-L-KLH.yaml +++ b/data/custodian/JP-13-KAN-L-KLH.yaml @@ -32,13 +32,14 @@ ghcid: method: CH_ANNOTATOR_SOURCE ghcid_history: - ghcid: JP-13-KAN-L-KLH - valid_from: "2025-12-10T09:44:05Z" + valid_from: '2025-12-10T09:44:05Z' valid_to: null - reason: "Corrected region code from JP-TO (abbreviation) to JP-13 (Tokyo) per ISO 3166-2:JP" + reason: Corrected region code from JP-TO (abbreviation) to JP-13 (Tokyo) per ISO + 3166-2:JP - ghcid: JP-TO-KAN-L-KLH valid_from: null - valid_to: "2025-12-10T09:44:05Z" - reason: "Previous GHCID with incorrect region code" + valid_to: '2025-12-10T09:44:05Z' + reason: Previous GHCID with incorrect region code - ghcid: JP-TO-KAN-L-KLH ghcid_numeric: 18101461760908513476 valid_from: '2025-12-06T23:38:42.191428+00:00' @@ -96,8 +97,8 @@ ch_annotator: annotation_metadata: confidence_score: 0.98 verified: false - verification_date: - verified_by: + verification_date: null + verified_by: null entity_claims: - claim_type: full_name claim_value: KANUMASHIRITSU Library HIGASHIBUNKAN @@ -151,3 +152,28 @@ location: geonames_id: 1860098 geonames_name: Kanuma feature_code: PPLA2 +logo_enrichment: + enrichment_timestamp: '2025-12-25T15:50:52.070313+00:00' + source_url: https://www.lib-kanuma.jp + extraction_method: crawl4ai + claims: + - claim_type: favicon_url + claim_value: https://www.lib-kanuma.jp/favicon.ico?v=4a3cd1ede3d498ecea00dc95a0528588 + source_url: https://www.lib-kanuma.jp + css_selector: '[document] > html > head > link:nth-of-type(5)' + retrieved_on: '2025-12-25T15:50:52.070313+00:00' + extraction_method: crawl4ai_link_rel + favicon_type: '' + favicon_sizes: '' + - claim_type: og_image_url + claim_value: https://lib-kanuma.jp/ogp.png + source_url: https://www.lib-kanuma.jp + css_selector: '[document] > html > head > meta:nth-of-type(10)' + retrieved_on: '2025-12-25T15:50:52.070313+00:00' + extraction_method: crawl4ai_meta_og + summary: + total_claims: 2 + has_primary_logo: false + has_favicon: true + has_og_image: true + favicon_count: 1 diff --git a/data/custodian/JP-13-KAN-M-KMAMKS.yaml b/data/custodian/JP-13-KAN-M-KMAMKS.yaml index 66036a5a44..394fd1a420 100644 --- a/data/custodian/JP-13-KAN-M-KMAMKS.yaml +++ b/data/custodian/JP-13-KAN-M-KMAMKS.yaml @@ -43,13 +43,14 @@ ghcid: method: CH_ANNOTATOR_SOURCE ghcid_history: - ghcid: JP-13-KAN-M-KMAMKS - valid_from: "2025-12-10T09:44:05Z" + valid_from: '2025-12-10T09:44:05Z' valid_to: null - reason: "Corrected region code from JP-TO (abbreviation) to JP-13 (Tokyo) per ISO 3166-2:JP" + reason: Corrected region code from JP-TO (abbreviation) to JP-13 (Tokyo) per ISO + 3166-2:JP - ghcid: JP-TO-KAN-M-KMAMKS valid_from: null - valid_to: "2025-12-10T09:44:05Z" - reason: "Previous GHCID with incorrect region code" + valid_to: '2025-12-10T09:44:05Z' + reason: Previous GHCID with incorrect region code - ghcid: JP-TO-KAN-M-KMAMKS ghcid_numeric: 13529926214997756070 valid_from: '2025-12-06T23:38:31.840757+00:00' @@ -108,8 +109,8 @@ ch_annotator: annotation_metadata: confidence_score: 0.98 verified: false - verification_date: - verified_by: + verification_date: null + verified_by: null entity_claims: - claim_type: full_name claim_value: KANUMA MUNICIPAL ART MUSEUM OF KAWAKAMI SUMIO @@ -215,7 +216,8 @@ wikidata_enrichment: instance_of: &id005 - id: Q207694 label: art museum - description: building or space for the exhibition of art (for institution, use Q3196771) + description: building or space for the exhibition of art (for institution, use + Q3196771) - id: Q10624527 label: biographical museum description: museum dedicated to the life and works of a specific person @@ -275,3 +277,20 @@ location: postal_code: 322-0031 street_address: MUTSUMICHO, Kanuma Shi, Tochigi Ken, 322-0031 normalization_timestamp: '2025-12-09T12:21:39.824966+00:00' +logo_enrichment: + enrichment_timestamp: '2025-12-25T15:51:04.774568+00:00' + source_url: https://kawakamisumio-bijutsukan.jp + extraction_method: crawl4ai + claims: + - claim_type: og_image_url + claim_value: https://kawakamisumio-bijutsukan.jp/files/libs/637/202101111233232246.jpg?1766677856 + source_url: https://kawakamisumio-bijutsukan.jp + css_selector: '[document] > html > head > meta:nth-of-type(15)' + retrieved_on: '2025-12-25T15:51:04.774568+00:00' + extraction_method: crawl4ai_meta_og + summary: + total_claims: 1 + has_primary_logo: false + has_favicon: false + has_og_image: true + favicon_count: 0 diff --git a/data/custodian/JP-13-KAT-L-KTL.yaml b/data/custodian/JP-13-KAT-L-KTL.yaml index 64787607f9..253a6c0213 100644 --- a/data/custodian/JP-13-KAT-L-KTL.yaml +++ b/data/custodian/JP-13-KAT-L-KTL.yaml @@ -32,13 +32,14 @@ ghcid: method: CH_ANNOTATOR_SOURCE ghcid_history: - ghcid: JP-13-KAT-L-KTL - valid_from: "2025-12-10T09:44:05Z" + valid_from: '2025-12-10T09:44:05Z' valid_to: null - reason: "Corrected region code from JP-TO (abbreviation) to JP-13 (Tokyo) per ISO 3166-2:JP" + reason: Corrected region code from JP-TO (abbreviation) to JP-13 (Tokyo) per ISO + 3166-2:JP - ghcid: JP-TO-KAT-L-KTL valid_from: null - valid_to: "2025-12-10T09:44:05Z" - reason: "Previous GHCID with incorrect region code" + valid_to: '2025-12-10T09:44:05Z' + reason: Previous GHCID with incorrect region code - ghcid: JP-TO-KAT-L-KTL ghcid_numeric: 15521640390366452160 valid_from: '2025-12-06T23:38:47.376999+00:00' @@ -96,8 +97,8 @@ ch_annotator: annotation_metadata: confidence_score: 0.98 verified: false - verification_date: - verified_by: + verification_date: null + verified_by: null entity_claims: - claim_type: full_name claim_value: Katsuura Town Library @@ -153,3 +154,22 @@ location: geonames_id: 1859797 geonames_name: Katsura feature_code: PPL +logo_enrichment: + enrichment_timestamp: '2025-12-25T15:52:27.634608+00:00' + source_url: http://www.town.katsuura.lg.jp/docs/2016092100045 + extraction_method: crawl4ai + claims: + - claim_type: logo_url + claim_value: http://www.town.katsuura.lg.jp/_themes/joruri/sogo/img/logo2.png + source_url: http://www.town.katsuura.lg.jp/docs/2016092100045 + css_selector: '#sogoHeader > div.pieceContainer > div.pieceBody > h1 > img' + retrieved_on: '2025-12-25T15:52:27.634608+00:00' + extraction_method: crawl4ai_header_logo + detection_confidence: high + alt_text: 勝浦町 + summary: + total_claims: 1 + has_primary_logo: true + has_favicon: false + has_og_image: false + favicon_count: 0 diff --git a/data/custodian/JP-13-KAT-L-TL.yaml b/data/custodian/JP-13-KAT-L-TL.yaml index 1e5ae9e714..648c4c6d62 100644 --- a/data/custodian/JP-13-KAT-L-TL.yaml +++ b/data/custodian/JP-13-KAT-L-TL.yaml @@ -220,3 +220,22 @@ location: geonames_id: 8469284 geonames_name: Katsushika feature_code: PPLA2 +logo_enrichment: + enrichment_timestamp: '2025-12-25T15:52:47.742553+00:00' + source_url: http://www.tsc-05.ac.jp/about_us/library + extraction_method: crawl4ai + claims: + - claim_type: logo_url + claim_value: https://www.tsc-05.ac.jp/25/wp-content/themes/tsc2025/images/logo.svg + source_url: http://www.tsc-05.ac.jp/about_us/library + css_selector: '#header > p.logo > a > img' + retrieved_on: '2025-12-25T15:52:47.742553+00:00' + extraction_method: crawl4ai_header_logo + detection_confidence: high + alt_text: '' + summary: + total_claims: 1 + has_primary_logo: true + has_favicon: false + has_og_image: false + favicon_count: 0 diff --git a/data/custodian/JP-13-KAT-M-PG.yaml b/data/custodian/JP-13-KAT-M-PG.yaml index 3555b19c4c..ce8d432b1c 100644 --- a/data/custodian/JP-13-KAT-M-PG.yaml +++ b/data/custodian/JP-13-KAT-M-PG.yaml @@ -37,13 +37,14 @@ ghcid: method: CH_ANNOTATOR_SOURCE ghcid_history: - ghcid: JP-13-KAT-M-PG - valid_from: "2025-12-10T09:44:05Z" + valid_from: '2025-12-10T09:44:05Z' valid_to: null - reason: "Corrected region code from JP-TO (abbreviation) to JP-13 (Tokyo) per ISO 3166-2:JP" + reason: Corrected region code from JP-TO (abbreviation) to JP-13 (Tokyo) per ISO + 3166-2:JP - ghcid: JP-TO-KAT-M-PG valid_from: null - valid_to: "2025-12-10T09:44:05Z" - reason: "Previous GHCID with incorrect region code" + valid_to: '2025-12-10T09:44:05Z' + reason: Previous GHCID with incorrect region code - ghcid: JP-TO-KAT-M-PG ghcid_numeric: 4850448611769158582 valid_from: '2025-12-06T23:38:33.529816+00:00' @@ -101,8 +102,8 @@ ch_annotator: annotation_metadata: confidence_score: 0.98 verified: false - verification_date: - verified_by: + verification_date: null + verified_by: null entity_claims: - claim_type: full_name claim_value: The planetarium Galaxy @@ -207,3 +208,28 @@ location: geonames_id: 8469284 geonames_name: Katsushika feature_code: PPLA2 +logo_enrichment: + enrichment_timestamp: '2025-12-25T15:52:57.928002+00:00' + source_url: https://gingaza-2019.amebaownd.com + extraction_method: crawl4ai + claims: + - claim_type: favicon_url + claim_value: https://cdn.amebaowndme.com/madrid-prd/madrid-web/images/sites/623074/41f54b70178fee4cb98f0ab314831918_0ffb2d5bdf3f4347583dab99bd90171b.png?width=180&height=180 + source_url: https://gingaza-2019.amebaownd.com + css_selector: '[document] > html > head > link:nth-of-type(8)' + retrieved_on: '2025-12-25T15:52:57.928002+00:00' + extraction_method: crawl4ai_link_rel + favicon_type: '' + favicon_sizes: '' + - claim_type: og_image_url + claim_value: https://cdn.amebaowndme.com/madrid-prd/madrid-web/images/sites/623074/a410b3f405b05f59b55f9ac5dfdc2c79_8dc0150bf2276c5c5f65d16e6b97ccde.jpg + source_url: https://gingaza-2019.amebaownd.com + css_selector: '[document] > html > head > meta:nth-of-type(11)' + retrieved_on: '2025-12-25T15:52:57.928002+00:00' + extraction_method: crawl4ai_meta_og + summary: + total_claims: 2 + has_primary_logo: false + has_favicon: true + has_og_image: true + favicon_count: 2 diff --git a/data/custodian/JP-13-KIN-M-KBK.yaml b/data/custodian/JP-13-KIN-M-KBK.yaml index b4e7e56af2..c538426b4b 100644 --- a/data/custodian/JP-13-KIN-M-KBK.yaml +++ b/data/custodian/JP-13-KIN-M-KBK.yaml @@ -251,3 +251,28 @@ location: geonames_id: 1859439 feature_code: PPL normalization_timestamp: '2025-12-09T06:53:34.367903+00:00' +logo_enrichment: + enrichment_timestamp: '2025-12-25T15:53:19.743873+00:00' + source_url: http://kinobun.jp + extraction_method: crawl4ai + claims: + - claim_type: favicon_url + claim_value: http://kinobun.jp/apple-touch-icon.png + source_url: http://kinobun.jp + css_selector: '[document] > html > head > link:nth-of-type(4)' + retrieved_on: '2025-12-25T15:53:19.743873+00:00' + extraction_method: crawl4ai_link_rel + favicon_type: '' + favicon_sizes: '' + - claim_type: og_image_url + claim_value: https://kinobun.jp/images/og.png + source_url: http://kinobun.jp + css_selector: '[document] > html > head > meta:nth-of-type(12)' + retrieved_on: '2025-12-25T15:53:19.743873+00:00' + extraction_method: crawl4ai_meta_og + summary: + total_claims: 2 + has_primary_logo: false + has_favicon: true + has_og_image: true + favicon_count: 2 diff --git a/data/custodian/JP-13-KIO-L-KL.yaml b/data/custodian/JP-13-KIO-L-KL.yaml index d8674c9a4a..bcc7b30650 100644 --- a/data/custodian/JP-13-KIO-L-KL.yaml +++ b/data/custodian/JP-13-KIO-L-KL.yaml @@ -41,13 +41,14 @@ ghcid: resolution_date: '2025-12-07T12:05:13.106921+00:00' ghcid_history: - ghcid: JP-13-KIO-L-KL - valid_from: "2025-12-10T09:44:00Z" + valid_from: '2025-12-10T09:44:00Z' valid_to: null - reason: "Corrected region code from JP-TK (abbreviation) to JP-13 (Tokyo) per ISO 3166-2:JP" + reason: Corrected region code from JP-TK (abbreviation) to JP-13 (Tokyo) per ISO + 3166-2:JP - ghcid: JP-TK-KIO-L-KL valid_from: null - valid_to: "2025-12-10T09:44:00Z" - reason: "Previous GHCID with incorrect region code" + valid_to: '2025-12-10T09:44:00Z' + reason: Previous GHCID with incorrect region code - ghcid: JP-XX-XXX-L-KL ghcid_numeric: 621686996941250752 valid_from: '2025-12-06T23:38:55.488528+00:00' @@ -109,8 +110,8 @@ ch_annotator: annotation_metadata: confidence_score: 0.98 verified: false - verification_date: - verified_by: + verification_date: null + verified_by: null entity_claims: - claim_type: full_name claim_value: KITASATODAIGAKUKAIYOSEIMEIKAGAKUBU Library @@ -204,3 +205,39 @@ location: geonames_id: 10902806 feature_code: PPL normalization_timestamp: '2025-12-09T12:21:15.504021+00:00' +logo_enrichment: + enrichment_timestamp: '2025-12-25T15:53:26.583513+00:00' + source_url: https://www.ndl.go.jp/jp/tokyo/index.html + extraction_method: crawl4ai + claims: + - claim_type: logo_url + claim_value: '[inline-svg]' + source_url: https://www.ndl.go.jp/jp/tokyo/index.html + css_selector: '#__nuxt > div.layouts-global.is-light > header.global-header > + div.base-layout-row.is-hidden-mobile > div.global-header-left > a.lang-link + > p.base-heading.is-image > svg.ui-parts-logo-service.global-header-brand' + retrieved_on: '2025-12-25T15:53:26.583513+00:00' + extraction_method: crawl4ai_svg_detection + detection_confidence: high + is_inline_svg: true + aria_label: '' + - claim_type: favicon_url + claim_value: https://www.ndl.go.jp/assets/hp/favicon/favicon.ico + source_url: https://www.ndl.go.jp/jp/tokyo/index.html + css_selector: '[document] > html > head > link:nth-of-type(13)' + retrieved_on: '2025-12-25T15:53:26.583513+00:00' + extraction_method: crawl4ai_link_rel + favicon_type: '' + favicon_sizes: '' + - claim_type: og_image_url + claim_value: https://www.ndl.go.jp/assets/hp/og.png + source_url: https://www.ndl.go.jp/jp/tokyo/index.html + css_selector: '[document] > html > head > meta:nth-of-type(10)' + retrieved_on: '2025-12-25T15:53:26.583513+00:00' + extraction_method: crawl4ai_meta_og + summary: + total_claims: 3 + has_primary_logo: true + has_favicon: true + has_og_image: true + favicon_count: 1 diff --git a/data/custodian/JP-13-KIO-L-OL.yaml b/data/custodian/JP-13-KIO-L-OL.yaml index e0062ca501..0adce740bb 100644 --- a/data/custodian/JP-13-KIO-L-OL.yaml +++ b/data/custodian/JP-13-KIO-L-OL.yaml @@ -36,13 +36,14 @@ ghcid: resolution_date: '2025-12-07T12:05:17.818935+00:00' ghcid_history: - ghcid: JP-13-KIO-L-OL - valid_from: "2025-12-10T09:44:00Z" + valid_from: '2025-12-10T09:44:00Z' valid_to: null - reason: "Corrected region code from JP-TK (abbreviation) to JP-13 (Tokyo) per ISO 3166-2:JP" + reason: Corrected region code from JP-TK (abbreviation) to JP-13 (Tokyo) per ISO + 3166-2:JP - ghcid: JP-TK-KIO-L-OL valid_from: null - valid_to: "2025-12-10T09:44:00Z" - reason: "Previous GHCID with incorrect region code" + valid_to: '2025-12-10T09:44:00Z' + reason: Previous GHCID with incorrect region code - ghcid: JP-XX-XXX-L-OL ghcid_numeric: 18051611345511232564 valid_from: '2025-12-06T23:38:41.560162+00:00' @@ -155,3 +156,39 @@ location: geonames_id: 10902806 feature_code: PPL normalization_timestamp: '2025-12-09T06:57:24.281565+00:00' +logo_enrichment: + enrichment_timestamp: '2025-12-25T15:53:32.745961+00:00' + source_url: https://www.ndl.go.jp/jp/tokyo/index.html + extraction_method: crawl4ai + claims: + - claim_type: logo_url + claim_value: '[inline-svg]' + source_url: https://www.ndl.go.jp/jp/tokyo/index.html + css_selector: '#__nuxt > div.layouts-global.is-light > header.global-header > + div.base-layout-row.is-hidden-mobile > div.global-header-left > a.lang-link + > p.base-heading.is-image > svg.ui-parts-logo-service.global-header-brand' + retrieved_on: '2025-12-25T15:53:32.745961+00:00' + extraction_method: crawl4ai_svg_detection + detection_confidence: high + is_inline_svg: true + aria_label: '' + - claim_type: favicon_url + claim_value: https://www.ndl.go.jp/assets/hp/favicon/favicon.ico + source_url: https://www.ndl.go.jp/jp/tokyo/index.html + css_selector: '[document] > html > head > link:nth-of-type(13)' + retrieved_on: '2025-12-25T15:53:32.745961+00:00' + extraction_method: crawl4ai_link_rel + favicon_type: '' + favicon_sizes: '' + - claim_type: og_image_url + claim_value: https://www.ndl.go.jp/assets/hp/og.png + source_url: https://www.ndl.go.jp/jp/tokyo/index.html + css_selector: '[document] > html > head > meta:nth-of-type(10)' + retrieved_on: '2025-12-25T15:53:32.745961+00:00' + extraction_method: crawl4ai_meta_og + summary: + total_claims: 3 + has_primary_logo: true + has_favicon: true + has_og_image: true + favicon_count: 1 diff --git a/data/custodian/JP-13-KIT-L-IRCSEMF.yaml b/data/custodian/JP-13-KIT-L-IRCSEMF.yaml index df7ce0a7fa..cc49129220 100644 --- a/data/custodian/JP-13-KIT-L-IRCSEMF.yaml +++ b/data/custodian/JP-13-KIT-L-IRCSEMF.yaml @@ -152,3 +152,22 @@ location: geonames_id: 8469285 geonames_name: Kita feature_code: PPLA2 +logo_enrichment: + enrichment_timestamp: '2025-12-25T15:53:39.722189+00:00' + source_url: http://www.shibusawa.or.jp/center/index.html + extraction_method: crawl4ai + claims: + - claim_type: favicon_url + claim_value: https://www.shibusawa.or.jp/favicon.ico + source_url: http://www.shibusawa.or.jp/center/index.html + css_selector: '[document] > html > head > link' + retrieved_on: '2025-12-25T15:53:39.722189+00:00' + extraction_method: crawl4ai_link_rel + favicon_type: image/vnd.microsoft.icon + favicon_sizes: '' + summary: + total_claims: 1 + has_primary_logo: false + has_favicon: true + has_og_image: false + favicon_count: 1 diff --git a/data/custodian/JP-13-KIT-L-KCCLB.yaml b/data/custodian/JP-13-KIT-L-KCCLB.yaml index 90f3427002..519c9b9a71 100644 --- a/data/custodian/JP-13-KIT-L-KCCLB.yaml +++ b/data/custodian/JP-13-KIT-L-KCCLB.yaml @@ -32,13 +32,14 @@ ghcid: method: CH_ANNOTATOR_SOURCE ghcid_history: - ghcid: JP-13-KIT-L-KCCLB - valid_from: "2025-12-10T09:44:05Z" + valid_from: '2025-12-10T09:44:05Z' valid_to: null - reason: "Corrected region code from JP-TO (abbreviation) to JP-13 (Tokyo) per ISO 3166-2:JP" + reason: Corrected region code from JP-TO (abbreviation) to JP-13 (Tokyo) per ISO + 3166-2:JP - ghcid: JP-TO-KIT-L-KCCLB valid_from: null - valid_to: "2025-12-10T09:44:05Z" - reason: "Previous GHCID with incorrect region code" + valid_to: '2025-12-10T09:44:05Z' + reason: Previous GHCID with incorrect region code - ghcid: JP-TO-KIT-L-KCCLB ghcid_numeric: 6422816410921665288 valid_from: '2025-12-06T23:38:48.546230+00:00' @@ -96,8 +97,8 @@ ch_annotator: annotation_metadata: confidence_score: 0.98 verified: false - verification_date: - verified_by: + verification_date: null + verified_by: null entity_claims: - claim_type: full_name claim_value: Kita City Central Library Branch @@ -151,3 +152,22 @@ location: geonames_id: 8469285 geonames_name: Kita feature_code: PPLA2 +logo_enrichment: + enrichment_timestamp: '2025-12-25T15:53:55.077770+00:00' + source_url: https://www.library.city.kita.tokyo.jp/viewer/info.html?id=15 + extraction_method: crawl4ai + claims: + - claim_type: favicon_url + claim_value: https://www.library.city.kita.tokyo.jp/apple-touch-icon.png + source_url: https://www.library.city.kita.tokyo.jp/viewer/info.html?id=15 + css_selector: '[document] > html > head > link:nth-of-type(7)' + retrieved_on: '2025-12-25T15:53:55.077770+00:00' + extraction_method: crawl4ai_link_rel + favicon_type: '' + favicon_sizes: 180x180 + summary: + total_claims: 1 + has_primary_logo: false + has_favicon: true + has_og_image: false + favicon_count: 3 diff --git a/data/custodian/JP-13-KIT-L-KJL.yaml b/data/custodian/JP-13-KIT-L-KJL.yaml index b7bd98157a..f7fce7304e 100644 --- a/data/custodian/JP-13-KIT-L-KJL.yaml +++ b/data/custodian/JP-13-KIT-L-KJL.yaml @@ -32,13 +32,14 @@ ghcid: method: CH_ANNOTATOR_SOURCE ghcid_history: - ghcid: JP-13-KIT-L-KJL - valid_from: "2025-12-10T09:44:05Z" + valid_from: '2025-12-10T09:44:05Z' valid_to: null - reason: "Corrected region code from JP-TO (abbreviation) to JP-13 (Tokyo) per ISO 3166-2:JP" + reason: Corrected region code from JP-TO (abbreviation) to JP-13 (Tokyo) per ISO + 3166-2:JP - ghcid: JP-TO-KIT-L-KJL valid_from: null - valid_to: "2025-12-10T09:44:05Z" - reason: "Previous GHCID with incorrect region code" + valid_to: '2025-12-10T09:44:05Z' + reason: Previous GHCID with incorrect region code - ghcid: JP-TO-KIT-L-KJL ghcid_numeric: 3777669680353300334 valid_from: '2025-12-06T23:38:52.975563+00:00' @@ -96,8 +97,8 @@ ch_annotator: annotation_metadata: confidence_score: 0.98 verified: false - verification_date: - verified_by: + verification_date: null + verified_by: null entity_claims: - claim_type: full_name claim_value: KITAKURITSU J&L @@ -151,3 +152,28 @@ location: geonames_id: 8469285 geonames_name: Kita feature_code: PPLA2 +logo_enrichment: + enrichment_timestamp: '2025-12-25T15:54:01.860909+00:00' + source_url: https://jtol.tokyo.jp + extraction_method: crawl4ai + claims: + - claim_type: favicon_url + claim_value: https://storage.googleapis.com/production-os-assets/assets/80ec5925-eb12-411b-a76c-31f82c6f1338 + source_url: https://jtol.tokyo.jp + css_selector: '[document] > html > head > link:nth-of-type(2)' + retrieved_on: '2025-12-25T15:54:01.860909+00:00' + extraction_method: crawl4ai_link_rel + favicon_type: image/png + favicon_sizes: '' + - claim_type: og_image_url + claim_value: https://storage.googleapis.com/production-os-assets/assets/2c3ae752-a56f-468b-9565-dda405e83b0f + source_url: https://jtol.tokyo.jp + css_selector: '[document] > html > head > meta:nth-of-type(7)' + retrieved_on: '2025-12-25T15:54:01.860909+00:00' + extraction_method: crawl4ai_meta_og + summary: + total_claims: 2 + has_primary_logo: false + has_favicon: true + has_og_image: true + favicon_count: 1 diff --git a/data/custodian/JP-13-KIT-L-KL-kitakuritsuakabane_library.yaml b/data/custodian/JP-13-KIT-L-KL-kitakuritsuakabane_library.yaml index 713685e2b9..f57cd02341 100644 --- a/data/custodian/JP-13-KIT-L-KL-kitakuritsuakabane_library.yaml +++ b/data/custodian/JP-13-KIT-L-KL-kitakuritsuakabane_library.yaml @@ -32,13 +32,14 @@ ghcid: method: CH_ANNOTATOR_SOURCE ghcid_history: - ghcid: JP-13-KIT-L-KL-kitakuritsuakabane_library - valid_from: "2025-12-10T09:44:05Z" + valid_from: '2025-12-10T09:44:05Z' valid_to: null - reason: "Corrected region code from JP-TO (abbreviation) to JP-13 (Tokyo) per ISO 3166-2:JP" + reason: Corrected region code from JP-TO (abbreviation) to JP-13 (Tokyo) per ISO + 3166-2:JP - ghcid: JP-TO-KIT-L-KL-kitakuritsuakabane_library valid_from: null - valid_to: "2025-12-10T09:44:05Z" - reason: "Previous GHCID with incorrect region code" + valid_to: '2025-12-10T09:44:05Z' + reason: Previous GHCID with incorrect region code - ghcid: JP-TO-KIT-L-KL-kitakuritsuakabane_library ghcid_numeric: 9146600354555233288 valid_from: '2025-12-06T23:38:43.429925+00:00' @@ -96,8 +97,8 @@ ch_annotator: annotation_metadata: confidence_score: 0.98 verified: false - verification_date: - verified_by: + verification_date: null + verified_by: null entity_claims: - claim_type: full_name claim_value: KITAKURITSUAKABANE Library @@ -151,3 +152,22 @@ location: geonames_id: 8469285 geonames_name: Kita feature_code: PPLA2 +logo_enrichment: + enrichment_timestamp: '2025-12-25T15:54:10.275429+00:00' + source_url: https://www.library.city.kita.tokyo.jp/index.html + extraction_method: crawl4ai + claims: + - claim_type: favicon_url + claim_value: https://www.library.city.kita.tokyo.jp/apple-touch-icon.png + source_url: https://www.library.city.kita.tokyo.jp/index.html + css_selector: '[document] > html > head > link:nth-of-type(8)' + retrieved_on: '2025-12-25T15:54:10.275429+00:00' + extraction_method: crawl4ai_link_rel + favicon_type: '' + favicon_sizes: 180x180 + summary: + total_claims: 1 + has_primary_logo: false + has_favicon: true + has_og_image: false + favicon_count: 3 diff --git a/data/custodian/JP-13-KIT-L-KL-kitakuritsuakabanekita_library.yaml b/data/custodian/JP-13-KIT-L-KL-kitakuritsuakabanekita_library.yaml index ebda2c1fae..8ac37a595f 100644 --- a/data/custodian/JP-13-KIT-L-KL-kitakuritsuakabanekita_library.yaml +++ b/data/custodian/JP-13-KIT-L-KL-kitakuritsuakabanekita_library.yaml @@ -152,3 +152,22 @@ location: geonames_id: 8469285 geonames_name: Kita feature_code: PPLA2 +logo_enrichment: + enrichment_timestamp: '2025-12-25T15:54:20.176256+00:00' + source_url: https://www.library.city.kita.tokyo.jp/index.html + extraction_method: crawl4ai + claims: + - claim_type: favicon_url + claim_value: https://www.library.city.kita.tokyo.jp/apple-touch-icon.png + source_url: https://www.library.city.kita.tokyo.jp/index.html + css_selector: '[document] > html > head > link:nth-of-type(8)' + retrieved_on: '2025-12-25T15:54:20.176256+00:00' + extraction_method: crawl4ai_link_rel + favicon_type: '' + favicon_sizes: 180x180 + summary: + total_claims: 1 + has_primary_logo: false + has_favicon: true + has_og_image: false + favicon_count: 3 diff --git a/data/custodian/JP-13-KIT-L-KL-kitakuritsuakabanenishi_library.yaml b/data/custodian/JP-13-KIT-L-KL-kitakuritsuakabanenishi_library.yaml index ab398d235f..f6dec31312 100644 --- a/data/custodian/JP-13-KIT-L-KL-kitakuritsuakabanenishi_library.yaml +++ b/data/custodian/JP-13-KIT-L-KL-kitakuritsuakabanenishi_library.yaml @@ -32,13 +32,14 @@ ghcid: method: CH_ANNOTATOR_SOURCE ghcid_history: - ghcid: JP-13-KIT-L-KL-kitakuritsuakabanenishi_library - valid_from: "2025-12-10T09:44:05Z" + valid_from: '2025-12-10T09:44:05Z' valid_to: null - reason: "Corrected region code from JP-TO (abbreviation) to JP-13 (Tokyo) per ISO 3166-2:JP" + reason: Corrected region code from JP-TO (abbreviation) to JP-13 (Tokyo) per ISO + 3166-2:JP - ghcid: JP-TO-KIT-L-KL-kitakuritsuakabanenishi_library valid_from: null - valid_to: "2025-12-10T09:44:05Z" - reason: "Previous GHCID with incorrect region code" + valid_to: '2025-12-10T09:44:05Z' + reason: Previous GHCID with incorrect region code - ghcid: JP-TO-KIT-L-KL-kitakuritsuakabanenishi_library ghcid_numeric: 8635264261108809334 valid_from: '2025-12-06T23:38:43.432195+00:00' @@ -96,8 +97,8 @@ ch_annotator: annotation_metadata: confidence_score: 0.98 verified: false - verification_date: - verified_by: + verification_date: null + verified_by: null entity_claims: - claim_type: full_name claim_value: KITAKURITSUAKABANENISHI Library @@ -151,3 +152,22 @@ location: geonames_id: 8469285 geonames_name: Kita feature_code: PPLA2 +logo_enrichment: + enrichment_timestamp: '2025-12-25T15:54:30.454677+00:00' + source_url: https://www.library.city.kita.tokyo.jp/index.html + extraction_method: crawl4ai + claims: + - claim_type: favicon_url + claim_value: https://www.library.city.kita.tokyo.jp/apple-touch-icon.png + source_url: https://www.library.city.kita.tokyo.jp/index.html + css_selector: '[document] > html > head > link:nth-of-type(8)' + retrieved_on: '2025-12-25T15:54:30.454677+00:00' + extraction_method: crawl4ai_link_rel + favicon_type: '' + favicon_sizes: 180x180 + summary: + total_claims: 1 + has_primary_logo: false + has_favicon: true + has_og_image: false + favicon_count: 3 diff --git a/data/custodian/JP-13-KIT-L-KL-kitakuritsuhigashijujo_library.yaml b/data/custodian/JP-13-KIT-L-KL-kitakuritsuhigashijujo_library.yaml index 0a33f8a194..e66e36f9e8 100644 --- a/data/custodian/JP-13-KIT-L-KL-kitakuritsuhigashijujo_library.yaml +++ b/data/custodian/JP-13-KIT-L-KL-kitakuritsuhigashijujo_library.yaml @@ -32,13 +32,14 @@ ghcid: method: CH_ANNOTATOR_SOURCE ghcid_history: - ghcid: JP-13-KIT-L-KL-kitakuritsuhigashijujo_library - valid_from: "2025-12-10T09:44:05Z" + valid_from: '2025-12-10T09:44:05Z' valid_to: null - reason: "Corrected region code from JP-TO (abbreviation) to JP-13 (Tokyo) per ISO 3166-2:JP" + reason: Corrected region code from JP-TO (abbreviation) to JP-13 (Tokyo) per ISO + 3166-2:JP - ghcid: JP-TO-KIT-L-KL-kitakuritsuhigashijujo_library valid_from: null - valid_to: "2025-12-10T09:44:05Z" - reason: "Previous GHCID with incorrect region code" + valid_to: '2025-12-10T09:44:05Z' + reason: Previous GHCID with incorrect region code - ghcid: JP-TO-KIT-L-KL-kitakuritsuhigashijujo_library ghcid_numeric: 7649222176705503614 valid_from: '2025-12-06T23:38:43.455427+00:00' @@ -96,8 +97,8 @@ ch_annotator: annotation_metadata: confidence_score: 0.98 verified: false - verification_date: - verified_by: + verification_date: null + verified_by: null entity_claims: - claim_type: full_name claim_value: KITAKURITSUHIGASHIJUJO Library @@ -151,3 +152,22 @@ location: geonames_id: 8469285 geonames_name: Kita feature_code: PPLA2 +logo_enrichment: + enrichment_timestamp: '2025-12-25T15:54:38.953184+00:00' + source_url: https://www.library.city.kita.tokyo.jp/index.html + extraction_method: crawl4ai + claims: + - claim_type: favicon_url + claim_value: https://www.library.city.kita.tokyo.jp/apple-touch-icon.png + source_url: https://www.library.city.kita.tokyo.jp/index.html + css_selector: '[document] > html > head > link:nth-of-type(8)' + retrieved_on: '2025-12-25T15:54:38.953184+00:00' + extraction_method: crawl4ai_link_rel + favicon_type: '' + favicon_sizes: 180x180 + summary: + total_claims: 1 + has_primary_logo: false + has_favicon: true + has_og_image: false + favicon_count: 3 diff --git a/data/custodian/JP-13-KIT-L-KL-kitakuritsuhigashitabata_library.yaml b/data/custodian/JP-13-KIT-L-KL-kitakuritsuhigashitabata_library.yaml index ed46889b1b..d5134e3be7 100644 --- a/data/custodian/JP-13-KIT-L-KL-kitakuritsuhigashitabata_library.yaml +++ b/data/custodian/JP-13-KIT-L-KL-kitakuritsuhigashitabata_library.yaml @@ -32,13 +32,14 @@ ghcid: method: CH_ANNOTATOR_SOURCE ghcid_history: - ghcid: JP-13-KIT-L-KL-kitakuritsuhigashitabata_library - valid_from: "2025-12-10T09:44:05Z" + valid_from: '2025-12-10T09:44:05Z' valid_to: null - reason: "Corrected region code from JP-TO (abbreviation) to JP-13 (Tokyo) per ISO 3166-2:JP" + reason: Corrected region code from JP-TO (abbreviation) to JP-13 (Tokyo) per ISO + 3166-2:JP - ghcid: JP-TO-KIT-L-KL-kitakuritsuhigashitabata_library valid_from: null - valid_to: "2025-12-10T09:44:05Z" - reason: "Previous GHCID with incorrect region code" + valid_to: '2025-12-10T09:44:05Z' + reason: Previous GHCID with incorrect region code - ghcid: JP-TO-KIT-L-KL-kitakuritsuhigashitabata_library ghcid_numeric: 11982519464307566160 valid_from: '2025-12-06T23:38:43.446122+00:00' @@ -96,8 +97,8 @@ ch_annotator: annotation_metadata: confidence_score: 0.98 verified: false - verification_date: - verified_by: + verification_date: null + verified_by: null entity_claims: - claim_type: full_name claim_value: KITAKURITSUHIGASHITABATA Library @@ -151,3 +152,22 @@ location: geonames_id: 8469285 geonames_name: Kita feature_code: PPLA2 +logo_enrichment: + enrichment_timestamp: '2025-12-25T15:54:48.883704+00:00' + source_url: https://www.library.city.kita.tokyo.jp/index.html + extraction_method: crawl4ai + claims: + - claim_type: favicon_url + claim_value: https://www.library.city.kita.tokyo.jp/apple-touch-icon.png + source_url: https://www.library.city.kita.tokyo.jp/index.html + css_selector: '[document] > html > head > link:nth-of-type(8)' + retrieved_on: '2025-12-25T15:54:48.883704+00:00' + extraction_method: crawl4ai_link_rel + favicon_type: '' + favicon_sizes: 180x180 + summary: + total_claims: 1 + has_primary_logo: false + has_favicon: true + has_og_image: false + favicon_count: 3 diff --git a/data/custodian/JP-13-KIT-L-KL-kitakuritsukamijujo_library.yaml b/data/custodian/JP-13-KIT-L-KL-kitakuritsukamijujo_library.yaml index 7c64c9563c..b3b6768456 100644 --- a/data/custodian/JP-13-KIT-L-KL-kitakuritsukamijujo_library.yaml +++ b/data/custodian/JP-13-KIT-L-KL-kitakuritsukamijujo_library.yaml @@ -32,13 +32,14 @@ ghcid: method: CH_ANNOTATOR_SOURCE ghcid_history: - ghcid: JP-13-KIT-L-KL-kitakuritsukamijujo_library - valid_from: "2025-12-10T09:44:05Z" + valid_from: '2025-12-10T09:44:05Z' valid_to: null - reason: "Corrected region code from JP-TO (abbreviation) to JP-13 (Tokyo) per ISO 3166-2:JP" + reason: Corrected region code from JP-TO (abbreviation) to JP-13 (Tokyo) per ISO + 3166-2:JP - ghcid: JP-TO-KIT-L-KL-kitakuritsukamijujo_library valid_from: null - valid_to: "2025-12-10T09:44:05Z" - reason: "Previous GHCID with incorrect region code" + valid_to: '2025-12-10T09:44:05Z' + reason: Previous GHCID with incorrect region code - ghcid: JP-TO-KIT-L-KL-kitakuritsukamijujo_library ghcid_numeric: 16482349622497987151 valid_from: '2025-12-06T23:38:43.443763+00:00' @@ -96,8 +97,8 @@ ch_annotator: annotation_metadata: confidence_score: 0.98 verified: false - verification_date: - verified_by: + verification_date: null + verified_by: null entity_claims: - claim_type: full_name claim_value: KITAKURITSUKAMIJUJO Library @@ -151,3 +152,22 @@ location: geonames_id: 8469285 geonames_name: Kita feature_code: PPLA2 +logo_enrichment: + enrichment_timestamp: '2025-12-25T15:54:58.831840+00:00' + source_url: https://www.library.city.kita.tokyo.jp/index.html + extraction_method: crawl4ai + claims: + - claim_type: favicon_url + claim_value: https://www.library.city.kita.tokyo.jp/apple-touch-icon.png + source_url: https://www.library.city.kita.tokyo.jp/index.html + css_selector: '[document] > html > head > link:nth-of-type(8)' + retrieved_on: '2025-12-25T15:54:58.831840+00:00' + extraction_method: crawl4ai_link_rel + favicon_type: '' + favicon_sizes: 180x180 + summary: + total_claims: 1 + has_primary_logo: false + has_favicon: true + has_og_image: false + favicon_count: 3 diff --git a/data/custodian/JP-13-KIT-L-KL-kitakuritsukamiya_library.yaml b/data/custodian/JP-13-KIT-L-KL-kitakuritsukamiya_library.yaml index 2f8cdd2d6d..3778b248fc 100644 --- a/data/custodian/JP-13-KIT-L-KL-kitakuritsukamiya_library.yaml +++ b/data/custodian/JP-13-KIT-L-KL-kitakuritsukamiya_library.yaml @@ -152,3 +152,22 @@ location: geonames_id: 8469285 geonames_name: Kita feature_code: PPLA2 +logo_enrichment: + enrichment_timestamp: '2025-12-25T15:55:08.252734+00:00' + source_url: https://www.library.city.kita.tokyo.jp/index.html + extraction_method: crawl4ai + claims: + - claim_type: favicon_url + claim_value: https://www.library.city.kita.tokyo.jp/apple-touch-icon.png + source_url: https://www.library.city.kita.tokyo.jp/index.html + css_selector: '[document] > html > head > link:nth-of-type(8)' + retrieved_on: '2025-12-25T15:55:08.252734+00:00' + extraction_method: crawl4ai_link_rel + favicon_type: '' + favicon_sizes: 180x180 + summary: + total_claims: 1 + has_primary_logo: false + has_favicon: true + has_og_image: false + favicon_count: 3 diff --git a/data/custodian/JP-13-KIT-L-KL-kitakuritsukima_library.yaml b/data/custodian/JP-13-KIT-L-KL-kitakuritsukima_library.yaml index 38cb46ba19..dd32000b44 100644 --- a/data/custodian/JP-13-KIT-L-KL-kitakuritsukima_library.yaml +++ b/data/custodian/JP-13-KIT-L-KL-kitakuritsukima_library.yaml @@ -32,13 +32,14 @@ ghcid: method: CH_ANNOTATOR_SOURCE ghcid_history: - ghcid: JP-13-KIT-L-KL-kitakuritsukima_library - valid_from: "2025-12-10T09:44:05Z" + valid_from: '2025-12-10T09:44:05Z' valid_to: null - reason: "Corrected region code from JP-TO (abbreviation) to JP-13 (Tokyo) per ISO 3166-2:JP" + reason: Corrected region code from JP-TO (abbreviation) to JP-13 (Tokyo) per ISO + 3166-2:JP - ghcid: JP-TO-KIT-L-KL-kitakuritsukima_library valid_from: null - valid_to: "2025-12-10T09:44:05Z" - reason: "Previous GHCID with incorrect region code" + valid_to: '2025-12-10T09:44:05Z' + reason: Previous GHCID with incorrect region code - ghcid: JP-TO-KIT-L-KL-kitakuritsukima_library ghcid_numeric: 6354156278038398548 valid_from: '2025-12-06T23:38:43.434493+00:00' @@ -96,8 +97,8 @@ ch_annotator: annotation_metadata: confidence_score: 0.98 verified: false - verification_date: - verified_by: + verification_date: null + verified_by: null entity_claims: - claim_type: full_name claim_value: KITAKURITSUKIMA Library @@ -151,3 +152,22 @@ location: geonames_id: 8469285 geonames_name: Kita feature_code: PPLA2 +logo_enrichment: + enrichment_timestamp: '2025-12-25T15:55:16.672484+00:00' + source_url: https://www.library.city.kita.tokyo.jp/index.html + extraction_method: crawl4ai + claims: + - claim_type: favicon_url + claim_value: https://www.library.city.kita.tokyo.jp/apple-touch-icon.png + source_url: https://www.library.city.kita.tokyo.jp/index.html + css_selector: '[document] > html > head > link:nth-of-type(8)' + retrieved_on: '2025-12-25T15:55:16.672484+00:00' + extraction_method: crawl4ai_link_rel + favicon_type: '' + favicon_sizes: 180x180 + summary: + total_claims: 1 + has_primary_logo: false + has_favicon: true + has_og_image: false + favicon_count: 3 diff --git a/data/custodian/JP-13-KIT-L-KL-kitakuritsushowamachi_library.yaml b/data/custodian/JP-13-KIT-L-KL-kitakuritsushowamachi_library.yaml index b16f218a3c..ccef90c282 100644 --- a/data/custodian/JP-13-KIT-L-KL-kitakuritsushowamachi_library.yaml +++ b/data/custodian/JP-13-KIT-L-KL-kitakuritsushowamachi_library.yaml @@ -152,3 +152,22 @@ location: geonames_id: 8469285 geonames_name: Kita feature_code: PPLA2 +logo_enrichment: + enrichment_timestamp: '2025-12-25T15:55:26.739150+00:00' + source_url: https://www.library.city.kita.tokyo.jp/index.html + extraction_method: crawl4ai + claims: + - claim_type: favicon_url + claim_value: https://www.library.city.kita.tokyo.jp/apple-touch-icon.png + source_url: https://www.library.city.kita.tokyo.jp/index.html + css_selector: '[document] > html > head > link:nth-of-type(8)' + retrieved_on: '2025-12-25T15:55:26.739150+00:00' + extraction_method: crawl4ai_link_rel + favicon_type: '' + favicon_sizes: 180x180 + summary: + total_claims: 1 + has_primary_logo: false + has_favicon: true + has_og_image: false + favicon_count: 3 diff --git a/data/custodian/JP-13-KIT-L-KL-kitakuritsutabata_library.yaml b/data/custodian/JP-13-KIT-L-KL-kitakuritsutabata_library.yaml index efaedddffb..c78b065196 100644 --- a/data/custodian/JP-13-KIT-L-KL-kitakuritsutabata_library.yaml +++ b/data/custodian/JP-13-KIT-L-KL-kitakuritsutabata_library.yaml @@ -32,13 +32,14 @@ ghcid: method: CH_ANNOTATOR_SOURCE ghcid_history: - ghcid: JP-13-KIT-L-KL-kitakuritsutabata_library - valid_from: "2025-12-10T09:44:05Z" + valid_from: '2025-12-10T09:44:05Z' valid_to: null - reason: "Corrected region code from JP-TO (abbreviation) to JP-13 (Tokyo) per ISO 3166-2:JP" + reason: Corrected region code from JP-TO (abbreviation) to JP-13 (Tokyo) per ISO + 3166-2:JP - ghcid: JP-TO-KIT-L-KL-kitakuritsutabata_library valid_from: null - valid_to: "2025-12-10T09:44:05Z" - reason: "Previous GHCID with incorrect region code" + valid_to: '2025-12-10T09:44:05Z' + reason: Previous GHCID with incorrect region code - ghcid: JP-TO-KIT-L-KL-kitakuritsutabata_library ghcid_numeric: 12817896301577154074 valid_from: '2025-12-06T23:38:43.441369+00:00' @@ -96,8 +97,8 @@ ch_annotator: annotation_metadata: confidence_score: 0.98 verified: false - verification_date: - verified_by: + verification_date: null + verified_by: null entity_claims: - claim_type: full_name claim_value: KITAKURITSUTABATA Library @@ -151,3 +152,22 @@ location: geonames_id: 8469285 geonames_name: Kita feature_code: PPLA2 +logo_enrichment: + enrichment_timestamp: '2025-12-25T15:55:35.374162+00:00' + source_url: https://www.library.city.kita.tokyo.jp/index.html + extraction_method: crawl4ai + claims: + - claim_type: favicon_url + claim_value: https://www.library.city.kita.tokyo.jp/apple-touch-icon.png + source_url: https://www.library.city.kita.tokyo.jp/index.html + css_selector: '[document] > html > head > link:nth-of-type(8)' + retrieved_on: '2025-12-25T15:55:35.374162+00:00' + extraction_method: crawl4ai_link_rel + favicon_type: '' + favicon_sizes: 180x180 + summary: + total_claims: 1 + has_primary_logo: false + has_favicon: true + has_og_image: false + favicon_count: 3 diff --git a/data/custodian/JP-13-KIT-L-KL-kitakuritsutakinogawa_library.yaml b/data/custodian/JP-13-KIT-L-KL-kitakuritsutakinogawa_library.yaml index d341a8da50..d0682824a0 100644 --- a/data/custodian/JP-13-KIT-L-KL-kitakuritsutakinogawa_library.yaml +++ b/data/custodian/JP-13-KIT-L-KL-kitakuritsutakinogawa_library.yaml @@ -32,13 +32,14 @@ ghcid: method: CH_ANNOTATOR_SOURCE ghcid_history: - ghcid: JP-13-KIT-L-KL-kitakuritsutakinogawa_library - valid_from: "2025-12-10T09:44:05Z" + valid_from: '2025-12-10T09:44:05Z' valid_to: null - reason: "Corrected region code from JP-TO (abbreviation) to JP-13 (Tokyo) per ISO 3166-2:JP" + reason: Corrected region code from JP-TO (abbreviation) to JP-13 (Tokyo) per ISO + 3166-2:JP - ghcid: JP-TO-KIT-L-KL-kitakuritsutakinogawa_library valid_from: null - valid_to: "2025-12-10T09:44:05Z" - reason: "Previous GHCID with incorrect region code" + valid_to: '2025-12-10T09:44:05Z' + reason: Previous GHCID with incorrect region code - ghcid: JP-TO-KIT-L-KL-kitakuritsutakinogawa_library ghcid_numeric: 8340478296680581700 valid_from: '2025-12-06T23:38:43.436767+00:00' @@ -96,8 +97,8 @@ ch_annotator: annotation_metadata: confidence_score: 0.98 verified: false - verification_date: - verified_by: + verification_date: null + verified_by: null entity_claims: - claim_type: full_name claim_value: KITAKURITSUTAKINOGAWA Library @@ -151,3 +152,22 @@ location: geonames_id: 8469285 geonames_name: Kita feature_code: PPLA2 +logo_enrichment: + enrichment_timestamp: '2025-12-25T15:55:45.170687+00:00' + source_url: https://www.library.city.kita.tokyo.jp/index.html + extraction_method: crawl4ai + claims: + - claim_type: favicon_url + claim_value: https://www.library.city.kita.tokyo.jp/apple-touch-icon.png + source_url: https://www.library.city.kita.tokyo.jp/index.html + css_selector: '[document] > html > head > link:nth-of-type(8)' + retrieved_on: '2025-12-25T15:55:45.170687+00:00' + extraction_method: crawl4ai_link_rel + favicon_type: '' + favicon_sizes: 180x180 + summary: + total_claims: 1 + has_primary_logo: false + has_favicon: true + has_og_image: false + favicon_count: 3 diff --git a/data/custodian/JP-13-KIT-L-KL-kitakuritsutakinogawanishi_library.yaml b/data/custodian/JP-13-KIT-L-KL-kitakuritsutakinogawanishi_library.yaml index 49e7a3dde6..1c3930abe3 100644 --- a/data/custodian/JP-13-KIT-L-KL-kitakuritsutakinogawanishi_library.yaml +++ b/data/custodian/JP-13-KIT-L-KL-kitakuritsutakinogawanishi_library.yaml @@ -32,13 +32,14 @@ ghcid: method: CH_ANNOTATOR_SOURCE ghcid_history: - ghcid: JP-13-KIT-L-KL-kitakuritsutakinogawanishi_library - valid_from: "2025-12-10T09:44:05Z" + valid_from: '2025-12-10T09:44:05Z' valid_to: null - reason: "Corrected region code from JP-TO (abbreviation) to JP-13 (Tokyo) per ISO 3166-2:JP" + reason: Corrected region code from JP-TO (abbreviation) to JP-13 (Tokyo) per ISO + 3166-2:JP - ghcid: JP-TO-KIT-L-KL-kitakuritsutakinogawanishi_library valid_from: null - valid_to: "2025-12-10T09:44:05Z" - reason: "Previous GHCID with incorrect region code" + valid_to: '2025-12-10T09:44:05Z' + reason: Previous GHCID with incorrect region code - ghcid: JP-TO-KIT-L-KL-kitakuritsutakinogawanishi_library ghcid_numeric: 12461388516402954630 valid_from: '2025-12-06T23:38:43.450825+00:00' @@ -96,8 +97,8 @@ ch_annotator: annotation_metadata: confidence_score: 0.98 verified: false - verification_date: - verified_by: + verification_date: null + verified_by: null entity_claims: - claim_type: full_name claim_value: KITAKURITSUTAKINOGAWANISHI Library @@ -151,3 +152,22 @@ location: geonames_id: 8469285 geonames_name: Kita feature_code: PPLA2 +logo_enrichment: + enrichment_timestamp: '2025-12-25T15:55:57.706661+00:00' + source_url: https://www.library.city.kita.tokyo.jp/index.html + extraction_method: crawl4ai + claims: + - claim_type: favicon_url + claim_value: https://www.library.city.kita.tokyo.jp/apple-touch-icon.png + source_url: https://www.library.city.kita.tokyo.jp/index.html + css_selector: '[document] > html > head > link:nth-of-type(8)' + retrieved_on: '2025-12-25T15:55:57.706661+00:00' + extraction_method: crawl4ai_link_rel + favicon_type: '' + favicon_sizes: 180x180 + summary: + total_claims: 1 + has_primary_logo: false + has_favicon: true + has_og_image: false + favicon_count: 3 diff --git a/data/custodian/JP-13-KIT-L-KL-kitakuritsutoshima_library.yaml b/data/custodian/JP-13-KIT-L-KL-kitakuritsutoshima_library.yaml index 3cc38d8a16..9a9069b218 100644 --- a/data/custodian/JP-13-KIT-L-KL-kitakuritsutoshima_library.yaml +++ b/data/custodian/JP-13-KIT-L-KL-kitakuritsutoshima_library.yaml @@ -32,13 +32,14 @@ ghcid: method: CH_ANNOTATOR_SOURCE ghcid_history: - ghcid: JP-13-KIT-L-KL-kitakuritsutoshima_library - valid_from: "2025-12-10T09:44:05Z" + valid_from: '2025-12-10T09:44:05Z' valid_to: null - reason: "Corrected region code from JP-TO (abbreviation) to JP-13 (Tokyo) per ISO 3166-2:JP" + reason: Corrected region code from JP-TO (abbreviation) to JP-13 (Tokyo) per ISO + 3166-2:JP - ghcid: JP-TO-KIT-L-KL-kitakuritsutoshima_library valid_from: null - valid_to: "2025-12-10T09:44:05Z" - reason: "Previous GHCID with incorrect region code" + valid_to: '2025-12-10T09:44:05Z' + reason: Previous GHCID with incorrect region code - ghcid: JP-TO-KIT-L-KL-kitakuritsutoshima_library ghcid_numeric: 16826272790973670561 valid_from: '2025-12-06T23:38:43.453145+00:00' @@ -96,8 +97,8 @@ ch_annotator: annotation_metadata: confidence_score: 0.98 verified: false - verification_date: - verified_by: + verification_date: null + verified_by: null entity_claims: - claim_type: full_name claim_value: KITAKURITSUTOSHIMA Library @@ -151,3 +152,22 @@ location: geonames_id: 8469285 geonames_name: Kita feature_code: PPLA2 +logo_enrichment: + enrichment_timestamp: '2025-12-25T15:56:05.958727+00:00' + source_url: https://www.library.city.kita.tokyo.jp/index.html + extraction_method: crawl4ai + claims: + - claim_type: favicon_url + claim_value: https://www.library.city.kita.tokyo.jp/apple-touch-icon.png + source_url: https://www.library.city.kita.tokyo.jp/index.html + css_selector: '[document] > html > head > link:nth-of-type(8)' + retrieved_on: '2025-12-25T15:56:05.958727+00:00' + extraction_method: crawl4ai_link_rel + favicon_type: '' + favicon_sizes: 180x180 + summary: + total_claims: 1 + has_primary_logo: false + has_favicon: true + has_og_image: false + favicon_count: 3 diff --git a/data/custodian/JP-13-KIT-L-KL.yaml b/data/custodian/JP-13-KIT-L-KL.yaml index 88fe44d152..3331924011 100644 --- a/data/custodian/JP-13-KIT-L-KL.yaml +++ b/data/custodian/JP-13-KIT-L-KL.yaml @@ -243,3 +243,22 @@ location: geonames_id: 8469285 geonames_name: Kita feature_code: PPLA2 +logo_enrichment: + enrichment_timestamp: '2025-12-25T15:56:14.177039+00:00' + source_url: https://www.library.city.kita.tokyo.jp/index.html + extraction_method: crawl4ai + claims: + - claim_type: favicon_url + claim_value: https://www.library.city.kita.tokyo.jp/apple-touch-icon.png + source_url: https://www.library.city.kita.tokyo.jp/index.html + css_selector: '[document] > html > head > link:nth-of-type(8)' + retrieved_on: '2025-12-25T15:56:14.177039+00:00' + extraction_method: crawl4ai_link_rel + favicon_type: '' + favicon_sizes: 180x180 + summary: + total_claims: 1 + has_primary_logo: false + has_favicon: true + has_og_image: false + favicon_count: 3 diff --git a/data/custodian/JP-13-KIT-L-PML.yaml b/data/custodian/JP-13-KIT-L-PML.yaml index 4b32dc6b8e..75303f7023 100644 --- a/data/custodian/JP-13-KIT-L-PML.yaml +++ b/data/custodian/JP-13-KIT-L-PML.yaml @@ -32,13 +32,14 @@ ghcid: method: CH_ANNOTATOR_SOURCE ghcid_history: - ghcid: JP-13-KIT-L-PML - valid_from: "2025-12-10T09:44:05Z" + valid_from: '2025-12-10T09:44:05Z' valid_to: null - reason: "Corrected region code from JP-TO (abbreviation) to JP-13 (Tokyo) per ISO 3166-2:JP" + reason: Corrected region code from JP-TO (abbreviation) to JP-13 (Tokyo) per ISO + 3166-2:JP - ghcid: JP-TO-KIT-L-PML valid_from: null - valid_to: "2025-12-10T09:44:05Z" - reason: "Previous GHCID with incorrect region code" + valid_to: '2025-12-10T09:44:05Z' + reason: Previous GHCID with incorrect region code - ghcid: JP-TO-KIT-L-PML ghcid_numeric: 5859383514047773791 valid_from: '2025-12-06T23:38:57.660762+00:00' @@ -96,8 +97,8 @@ ch_annotator: annotation_metadata: confidence_score: 0.98 verified: false - verification_date: - verified_by: + verification_date: null + verified_by: null entity_claims: - claim_type: full_name claim_value: Paper Museum Library @@ -151,3 +152,28 @@ location: geonames_id: 8469285 geonames_name: Kita feature_code: PPLA2 +logo_enrichment: + enrichment_timestamp: '2025-12-25T15:56:34.122697+00:00' + source_url: http://www.papermuseum.jp/library + extraction_method: crawl4ai + claims: + - claim_type: favicon_url + claim_value: https://papermuseum.jp/wp-content/uploads/2025/07/cropped-kamihaku-logo-180x180.jpg + source_url: http://www.papermuseum.jp/library + css_selector: '[document] > html.js.flexbox > body > link:nth-of-type(44)' + retrieved_on: '2025-12-25T15:56:34.122697+00:00' + extraction_method: crawl4ai_link_rel + favicon_type: '' + favicon_sizes: '' + - claim_type: og_image_url + claim_value: https://papermuseum.jp/wp-content/uploads/2015/05/cec6fff5aa480f31eb9533842075cd1e.jpg + source_url: http://www.papermuseum.jp/library + css_selector: '[document] > html.js.flexbox > body > meta:nth-of-type(13)' + retrieved_on: '2025-12-25T15:56:34.122697+00:00' + extraction_method: crawl4ai_meta_og + summary: + total_claims: 2 + has_primary_logo: false + has_favicon: true + has_og_image: true + favicon_count: 4 diff --git a/data/custodian/JP-13-KIT-L-SL.yaml b/data/custodian/JP-13-KIT-L-SL.yaml index 6bbf7c10f5..97c4cf3860 100644 --- a/data/custodian/JP-13-KIT-L-SL.yaml +++ b/data/custodian/JP-13-KIT-L-SL.yaml @@ -37,13 +37,14 @@ ghcid: method: CH_ANNOTATOR_SOURCE ghcid_history: - ghcid: JP-13-KIT-L-SL - valid_from: "2025-12-10T09:44:05Z" + valid_from: '2025-12-10T09:44:05Z' valid_to: null - reason: "Corrected region code from JP-TO (abbreviation) to JP-13 (Tokyo) per ISO 3166-2:JP" + reason: Corrected region code from JP-TO (abbreviation) to JP-13 (Tokyo) per ISO + 3166-2:JP - ghcid: JP-TO-KIT-L-SL valid_from: null - valid_to: "2025-12-10T09:44:05Z" - reason: "Previous GHCID with incorrect region code" + valid_to: '2025-12-10T09:44:05Z' + reason: Previous GHCID with incorrect region code - ghcid: JP-TO-KIT-L-SL ghcid_numeric: 10404876112591137316 valid_from: '2025-12-06T23:38:57.045915+00:00' @@ -101,8 +102,8 @@ ch_annotator: annotation_metadata: confidence_score: 0.98 verified: false - verification_date: - verified_by: + verification_date: null + verified_by: null entity_claims: - claim_type: full_name claim_value: SEIBIGAKUENTANKIDAIGAKU Library @@ -204,3 +205,22 @@ location: geonames_id: 8469285 geonames_name: Kita feature_code: PPLA2 +logo_enrichment: + enrichment_timestamp: '2025-12-25T15:56:45.119326+00:00' + source_url: http://www.seibi.ac.jp/college/library + extraction_method: crawl4ai + claims: + - claim_type: favicon_url + claim_value: http://www.seibi.ac.jp/favicon.ico + source_url: http://www.seibi.ac.jp/college/library + css_selector: '[document] > html.js.flexbox > head > link' + retrieved_on: '2025-12-25T15:56:45.119326+00:00' + extraction_method: crawl4ai_link_rel + favicon_type: '' + favicon_sizes: '' + summary: + total_claims: 1 + has_primary_logo: false + has_favicon: true + has_og_image: false + favicon_count: 1 diff --git a/data/custodian/JP-13-KIT-L-TLO.yaml b/data/custodian/JP-13-KIT-L-TLO.yaml index a022408b0d..9d9d3eddd5 100644 --- a/data/custodian/JP-13-KIT-L-TLO.yaml +++ b/data/custodian/JP-13-KIT-L-TLO.yaml @@ -205,3 +205,28 @@ location: geonames_id: 8469285 geonames_name: Kita feature_code: PPLA2 +logo_enrichment: + enrichment_timestamp: '2025-12-25T15:56:50.511030+00:00' + source_url: http://www.tokyo-fukushi.ac.jp/library/oji-library/index.html + extraction_method: crawl4ai + claims: + - claim_type: favicon_url + claim_value: https://liboji-tokyo-fukushi.opac.jp/common/images/op4-favicon.ico + source_url: http://www.tokyo-fukushi.ac.jp/library/oji-library/index.html + css_selector: '[document] > html > head > link' + retrieved_on: '2025-12-25T15:56:50.511030+00:00' + extraction_method: crawl4ai_link_rel + favicon_type: image/vnd.microsoft.icon + favicon_sizes: '' + - claim_type: og_image_url + claim_value: https://liboji-tokyo-fukushi.opac.jp/common/images/ogp-image.jpg + source_url: http://www.tokyo-fukushi.ac.jp/library/oji-library/index.html + css_selector: '[document] > html > head > meta:nth-of-type(12)' + retrieved_on: '2025-12-25T15:56:50.511030+00:00' + extraction_method: crawl4ai_meta_og + summary: + total_claims: 2 + has_primary_logo: false + has_favicon: true + has_og_image: true + favicon_count: 1 diff --git a/data/custodian/JP-13-KIT-L-TSU.yaml b/data/custodian/JP-13-KIT-L-TSU.yaml index 0ec6d7a51f..26296fb1a7 100644 --- a/data/custodian/JP-13-KIT-L-TSU.yaml +++ b/data/custodian/JP-13-KIT-L-TSU.yaml @@ -37,13 +37,14 @@ ghcid: method: CH_ANNOTATOR_SOURCE ghcid_history: - ghcid: JP-13-KIT-L-TSU - valid_from: "2025-12-10T09:44:05Z" + valid_from: '2025-12-10T09:44:05Z' valid_to: null - reason: "Corrected region code from JP-TO (abbreviation) to JP-13 (Tokyo) per ISO 3166-2:JP" + reason: Corrected region code from JP-TO (abbreviation) to JP-13 (Tokyo) per ISO + 3166-2:JP - ghcid: JP-TO-KIT-L-TSU valid_from: null - valid_to: "2025-12-10T09:44:05Z" - reason: "Previous GHCID with incorrect region code" + valid_to: '2025-12-10T09:44:05Z' + reason: Previous GHCID with incorrect region code - ghcid: JP-TO-KIT-L-TSU ghcid_numeric: 12813855684084991243 valid_from: '2025-12-06T23:38:56.917010+00:00' @@ -101,8 +102,8 @@ ch_annotator: annotation_metadata: confidence_score: 0.98 verified: false - verification_date: - verified_by: + verification_date: null + verified_by: null entity_claims: - claim_type: full_name claim_value: Tokyo Seitoku University @@ -216,3 +217,22 @@ location: geonames_id: 8469285 geonames_name: Kita feature_code: PPLA2 +logo_enrichment: + enrichment_timestamp: '2025-12-25T15:57:12.450587+00:00' + source_url: https://tokyoseitoku-opac.limedio.ricoh.co.jp/drupal + extraction_method: crawl4ai + claims: + - claim_type: favicon_url + claim_value: https://tokyoseitoku-opac.limedio.ricoh.co.jp/opac/images/cyan/favicon.ico + source_url: https://tokyoseitoku-opac.limedio.ricoh.co.jp/drupal + css_selector: '[document] > html > head > link:nth-of-type(9)' + retrieved_on: '2025-12-25T15:57:12.450587+00:00' + extraction_method: crawl4ai_link_rel + favicon_type: image/x-icon + favicon_sizes: '' + summary: + total_claims: 1 + has_primary_logo: false + has_favicon: true + has_og_image: false + favicon_count: 1 diff --git a/data/custodian/JP-13-KIT-L-TULAL.yaml b/data/custodian/JP-13-KIT-L-TULAL.yaml index 3117485ecf..e6bcc3e37d 100644 --- a/data/custodian/JP-13-KIT-L-TULAL.yaml +++ b/data/custodian/JP-13-KIT-L-TULAL.yaml @@ -152,3 +152,37 @@ location: geonames_id: 8469285 geonames_name: Kita feature_code: PPLA2 +logo_enrichment: + enrichment_timestamp: '2025-12-25T15:57:21.667242+00:00' + source_url: https://www.toyo.ac.jp/library + extraction_method: crawl4ai + claims: + - claim_type: logo_url + claim_value: https://www.toyo.ac.jp/img/common/img_logo.svg + source_url: https://www.toyo.ac.jp/library + css_selector: '#gheader > div.gnav__frm > h1.gnav__logo > a.gnav__logo-link > + img.gnav__logo-img' + retrieved_on: '2025-12-25T15:57:21.667242+00:00' + extraction_method: crawl4ai_header_logo + detection_confidence: high + alt_text: 東洋大学 + - claim_type: favicon_url + claim_value: https://www.toyo.ac.jp/img/common/favicon.ico + source_url: https://www.toyo.ac.jp/library + css_selector: '[document] > html.js_domload.js_ajax_load > head > link:nth-of-type(6)' + retrieved_on: '2025-12-25T15:57:21.667242+00:00' + extraction_method: crawl4ai_link_rel + favicon_type: '' + favicon_sizes: '' + - claim_type: og_image_url + claim_value: https://www.toyo.ac.jp/ogp.jpg + source_url: https://www.toyo.ac.jp/library + css_selector: '[document] > html.js_domload.js_ajax_load > head > meta:nth-of-type(7)' + retrieved_on: '2025-12-25T15:57:21.667242+00:00' + extraction_method: crawl4ai_meta_og + summary: + total_claims: 3 + has_primary_logo: true + has_favicon: true + has_og_image: true + favicon_count: 1 diff --git a/data/custodian/JP-13-KIT-M-KCAM.yaml b/data/custodian/JP-13-KIT-M-KCAM.yaml index 38157cc0fa..6e70d86ea4 100644 --- a/data/custodian/JP-13-KIT-M-KCAM.yaml +++ b/data/custodian/JP-13-KIT-M-KCAM.yaml @@ -1196,3 +1196,30 @@ youtube_enrichment: comments: [] thumbnail_url: https://i.ytimg.com/vi/7rt0NzB4I5k/hqdefault.jpg status: SUCCESS +logo_enrichment: + enrichment_timestamp: '2025-12-25T15:57:28.771200+00:00' + source_url: https://www.city.kita.tokyo.jp/hakubutsukan + extraction_method: crawl4ai + claims: + - claim_type: logo_url + claim_value: https://www.city.kita.lg.jp/_template_/_site_/_default_/_res/design/images/header/tlogo.svg + source_url: https://www.city.kita.tokyo.jp/hakubutsukan + css_selector: '#tlogo > p > a > img' + retrieved_on: '2025-12-25T15:57:28.771200+00:00' + extraction_method: crawl4ai_header_logo + detection_confidence: high + alt_text: 北区公式ホームページトップページ + - claim_type: favicon_url + claim_value: https://www.city.kita.lg.jp/_template_/_site_/_default_/_res/favicon.ico + source_url: https://www.city.kita.tokyo.jp/hakubutsukan + css_selector: '[document] > html > head > link:nth-of-type(4)' + retrieved_on: '2025-12-25T15:57:28.771200+00:00' + extraction_method: crawl4ai_link_rel + favicon_type: image/vnd.microsoft.icon + favicon_sizes: '' + summary: + total_claims: 2 + has_primary_logo: true + has_favicon: true + has_og_image: false + favicon_count: 1 diff --git a/data/custodian/JP-13-KIT-M-PM.yaml b/data/custodian/JP-13-KIT-M-PM.yaml index 080af77742..49f7a57342 100644 --- a/data/custodian/JP-13-KIT-M-PM.yaml +++ b/data/custodian/JP-13-KIT-M-PM.yaml @@ -453,3 +453,28 @@ youtube_enrichment: comments: [] thumbnail_url: https://i.ytimg.com/vi/A8Ba3hzxZU8/hqdefault.jpg status: SUCCESS +logo_enrichment: + enrichment_timestamp: '2025-12-25T15:57:52.713801+00:00' + source_url: https://papermuseum.jp + extraction_method: crawl4ai + claims: + - claim_type: favicon_url + claim_value: https://papermuseum.jp/wp-content/uploads/2025/07/cropped-kamihaku-logo-180x180.jpg + source_url: https://papermuseum.jp + css_selector: '[document] > html.js.flexbox > body > link:nth-of-type(44)' + retrieved_on: '2025-12-25T15:57:52.713801+00:00' + extraction_method: crawl4ai_link_rel + favicon_type: '' + favicon_sizes: '' + - claim_type: og_image_url + claim_value: https://papermuseum.jp/wp-content/uploads/2015/05/cec6fff5aa480f31eb9533842075cd1e.jpg + source_url: https://papermuseum.jp + css_selector: '[document] > html.js.flexbox > body > meta:nth-of-type(13)' + retrieved_on: '2025-12-25T15:57:52.713801+00:00' + extraction_method: crawl4ai_meta_og + summary: + total_claims: 2 + has_primary_logo: false + has_favicon: true + has_og_image: true + favicon_count: 4 diff --git a/data/custodian/JP-13-KIT-M-TMMWA.yaml b/data/custodian/JP-13-KIT-M-TMMWA.yaml index b61cefc124..7da5813b85 100644 --- a/data/custodian/JP-13-KIT-M-TMMWA.yaml +++ b/data/custodian/JP-13-KIT-M-TMMWA.yaml @@ -280,3 +280,31 @@ youtube_enrichment: view_count: 0 videos: [] status: SUCCESS +logo_enrichment: + enrichment_timestamp: '2025-12-25T15:58:01.198245+00:00' + source_url: https://kitabunka.or.jp/tabata + extraction_method: crawl4ai + claims: + - claim_type: logo_url + claim_value: https://kitabunka.jp/wp/wp-content/themes/html5blank-stable/img/logo.png + source_url: https://kitabunka.or.jp/tabata + css_selector: '[document] > html.js.flexbox > body > header.header.clear > div.wrap.w1000 + > div.flex > div.logo > a > img' + retrieved_on: '2025-12-25T15:58:01.198245+00:00' + extraction_method: crawl4ai_header_logo + detection_confidence: high + alt_text: 公益財団法人 北区文化振興財団 + - claim_type: favicon_url + claim_value: https://kitabunka.jp/wp/wp-content/themes/html5blank-stable/img/kitabunka.ico + source_url: https://kitabunka.or.jp/tabata + css_selector: '[document] > html.js.flexbox > head > link' + retrieved_on: '2025-12-25T15:58:01.198245+00:00' + extraction_method: crawl4ai_link_rel + favicon_type: '' + favicon_sizes: '' + summary: + total_claims: 2 + has_primary_logo: true + has_favicon: true + has_og_image: false + favicon_count: 1 diff --git a/data/custodian/JP-13-KIY-L-GLJNA.yaml b/data/custodian/JP-13-KIY-L-GLJNA.yaml index 0215143719..a1b63a37d2 100644 --- a/data/custodian/JP-13-KIY-L-GLJNA.yaml +++ b/data/custodian/JP-13-KIY-L-GLJNA.yaml @@ -152,3 +152,28 @@ location: geonames_id: 11611938 geonames_name: Kiyose feature_code: PPLA2 +logo_enrichment: + enrichment_timestamp: '2025-12-25T15:58:08.978579+00:00' + source_url: http://www.nurse.or.jp/nursing/education/library + extraction_method: crawl4ai + claims: + - claim_type: favicon_url + claim_value: http://www.nurse.or.jp/assets/img/favicon.ico + source_url: http://www.nurse.or.jp/nursing/education/library + css_selector: '[document] > html > head > link:nth-of-type(3)' + retrieved_on: '2025-12-25T15:58:08.978579+00:00' + extraction_method: crawl4ai_link_rel + favicon_type: '' + favicon_sizes: '' + - claim_type: og_image_url + claim_value: https://www.nurse.or.jp/asset/img/ogpimg.png + source_url: http://www.nurse.or.jp/nursing/education/library + css_selector: '[document] > html > head > meta:nth-of-type(9)' + retrieved_on: '2025-12-25T15:58:08.978579+00:00' + extraction_method: crawl4ai_meta_og + summary: + total_claims: 2 + has_primary_logo: false + has_favicon: true + has_og_image: true + favicon_count: 1 diff --git a/data/custodian/JP-13-KIY-L-JCSWL.yaml b/data/custodian/JP-13-KIY-L-JCSWL.yaml index 2c7927eb8b..f4b9d30e0f 100644 --- a/data/custodian/JP-13-KIY-L-JCSWL.yaml +++ b/data/custodian/JP-13-KIY-L-JCSWL.yaml @@ -37,13 +37,14 @@ ghcid: method: CH_ANNOTATOR_SOURCE ghcid_history: - ghcid: JP-13-KIY-L-JCSWL - valid_from: "2025-12-10T09:44:05Z" + valid_from: '2025-12-10T09:44:05Z' valid_to: null - reason: "Corrected region code from JP-TO (abbreviation) to JP-13 (Tokyo) per ISO 3166-2:JP" + reason: Corrected region code from JP-TO (abbreviation) to JP-13 (Tokyo) per ISO + 3166-2:JP - ghcid: JP-TO-KIY-L-JCSWL valid_from: null - valid_to: "2025-12-10T09:44:05Z" - reason: "Previous GHCID with incorrect region code" + valid_to: '2025-12-10T09:44:05Z' + reason: Previous GHCID with incorrect region code - ghcid: JP-TO-KIY-L-JCSWL ghcid_numeric: 11055698952798146834 valid_from: '2025-12-06T23:38:55.188806+00:00' @@ -101,8 +102,8 @@ ch_annotator: annotation_metadata: confidence_score: 0.98 verified: false - verification_date: - verified_by: + verification_date: null + verified_by: null entity_claims: - claim_type: full_name claim_value: Japan College of Social Work Library @@ -196,7 +197,8 @@ wikidata_enrichment: description: organisatie uit Japan - id: Q56056912 label: Japan Consortium for Open Access Repository - description: promotes open access and open science in Japan with knowledge dissemination via digital repositories + description: promotes open access and open science in Japan with knowledge dissemination + via digital repositories wikidata_web: official_website: http://www.jcsw.ac.jp/facilities/library/ wikidata_official_website: http://www.jcsw.ac.jp/facilities/library/ @@ -218,3 +220,28 @@ location: geonames_id: 11611938 geonames_name: Kiyose feature_code: PPLA2 +logo_enrichment: + enrichment_timestamp: '2025-12-25T15:58:28.907416+00:00' + source_url: http://www.jcsw.ac.jp/facilities/library + extraction_method: crawl4ai + claims: + - claim_type: favicon_url + claim_value: http://www.jcsw.ac.jp/img/apple-touch-icon.png + source_url: http://www.jcsw.ac.jp/facilities/library + css_selector: '[document] > html > head > link:nth-of-type(2)' + retrieved_on: '2025-12-25T15:58:28.907416+00:00' + extraction_method: crawl4ai_link_rel + favicon_type: '' + favicon_sizes: '' + - claim_type: og_image_url + claim_value: https://www.jcsw.ac.jp/80th/img/ogp.jpg + source_url: http://www.jcsw.ac.jp/facilities/library + css_selector: '[document] > html > head > meta:nth-of-type(11)' + retrieved_on: '2025-12-25T15:58:28.907416+00:00' + extraction_method: crawl4ai_meta_og + summary: + total_claims: 2 + has_primary_logo: false + has_favicon: true + has_og_image: true + favicon_count: 2 diff --git a/data/custodian/JP-13-KIY-L-KCL.yaml b/data/custodian/JP-13-KIY-L-KCL.yaml index a0ad8a63ad..fb42317aa8 100644 --- a/data/custodian/JP-13-KIY-L-KCL.yaml +++ b/data/custodian/JP-13-KIY-L-KCL.yaml @@ -32,13 +32,14 @@ ghcid: method: CH_ANNOTATOR_SOURCE ghcid_history: - ghcid: JP-13-KIY-L-KCL - valid_from: "2025-12-10T09:44:05Z" + valid_from: '2025-12-10T09:44:05Z' valid_to: null - reason: "Corrected region code from JP-TO (abbreviation) to JP-13 (Tokyo) per ISO 3166-2:JP" + reason: Corrected region code from JP-TO (abbreviation) to JP-13 (Tokyo) per ISO + 3166-2:JP - ghcid: JP-TO-KIY-L-KCL valid_from: null - valid_to: "2025-12-10T09:44:05Z" - reason: "Previous GHCID with incorrect region code" + valid_to: '2025-12-10T09:44:05Z' + reason: Previous GHCID with incorrect region code - ghcid: JP-TO-KIY-L-KCL ghcid_numeric: 3117365142024431068 valid_from: '2025-12-06T23:38:43.880387+00:00' @@ -96,8 +97,8 @@ ch_annotator: annotation_metadata: confidence_score: 0.98 verified: false - verification_date: - verified_by: + verification_date: null + verified_by: null entity_claims: - claim_type: full_name claim_value: Kiyose Chuo Library @@ -151,3 +152,30 @@ location: geonames_id: 11611938 geonames_name: Kiyose feature_code: PPLA2 +logo_enrichment: + enrichment_timestamp: '2025-12-25T15:58:41.775443+00:00' + source_url: https://www.library.kiyose.tokyo.jp/lib_info/chuo.html + extraction_method: crawl4ai + claims: + - claim_type: logo_url + claim_value: https://www.library.kiyose.tokyo.jp/themes/lib_theme/images/logo.png + source_url: https://www.library.kiyose.tokyo.jp/lib_info/chuo.html + css_selector: '#header_logo > a.active > img' + retrieved_on: '2025-12-25T15:58:41.775443+00:00' + extraction_method: crawl4ai_header_logo + detection_confidence: high + alt_text: 清瀬市立図書館 + - claim_type: favicon_url + claim_value: https://www.library.kiyose.tokyo.jp/themes/lib_theme/favicon.ico + source_url: https://www.library.kiyose.tokyo.jp/lib_info/chuo.html + css_selector: '[document] > html > head.notranslate > link' + retrieved_on: '2025-12-25T15:58:41.775443+00:00' + extraction_method: crawl4ai_link_rel + favicon_type: '' + favicon_sizes: '' + summary: + total_claims: 2 + has_primary_logo: true + has_favicon: true + has_og_image: false + favicon_count: 1 diff --git a/data/custodian/JP-13-KIY-L-KEL.yaml b/data/custodian/JP-13-KIY-L-KEL.yaml index b166292a1a..98db7b7fa3 100644 --- a/data/custodian/JP-13-KIY-L-KEL.yaml +++ b/data/custodian/JP-13-KIY-L-KEL.yaml @@ -32,13 +32,14 @@ ghcid: method: CH_ANNOTATOR_SOURCE ghcid_history: - ghcid: JP-13-KIY-L-KEL - valid_from: "2025-12-10T09:44:05Z" + valid_from: '2025-12-10T09:44:05Z' valid_to: null - reason: "Corrected region code from JP-TO (abbreviation) to JP-13 (Tokyo) per ISO 3166-2:JP" + reason: Corrected region code from JP-TO (abbreviation) to JP-13 (Tokyo) per ISO + 3166-2:JP - ghcid: JP-TO-KIY-L-KEL valid_from: null - valid_to: "2025-12-10T09:44:05Z" - reason: "Previous GHCID with incorrect region code" + valid_to: '2025-12-10T09:44:05Z' + reason: Previous GHCID with incorrect region code - ghcid: JP-TO-KIY-L-KEL ghcid_numeric: 9717231304502019331 valid_from: '2025-12-06T23:38:43.891826+00:00' @@ -96,8 +97,8 @@ ch_annotator: annotation_metadata: confidence_score: 0.98 verified: false - verification_date: - verified_by: + verification_date: null + verified_by: null entity_claims: - claim_type: full_name claim_value: Kiyose Ekimae Library @@ -151,3 +152,30 @@ location: geonames_id: 11611938 geonames_name: Kiyose feature_code: PPLA2 +logo_enrichment: + enrichment_timestamp: '2025-12-25T15:58:50.883033+00:00' + source_url: https://www.library.kiyose.tokyo.jp/lib_info/ekimae.html + extraction_method: crawl4ai + claims: + - claim_type: logo_url + claim_value: https://www.library.kiyose.tokyo.jp/themes/lib_theme/images/logo.png + source_url: https://www.library.kiyose.tokyo.jp/lib_info/ekimae.html + css_selector: '#header_logo > a.active > img' + retrieved_on: '2025-12-25T15:58:50.883033+00:00' + extraction_method: crawl4ai_header_logo + detection_confidence: high + alt_text: 清瀬市立図書館 + - claim_type: favicon_url + claim_value: https://www.library.kiyose.tokyo.jp/themes/lib_theme/favicon.ico + source_url: https://www.library.kiyose.tokyo.jp/lib_info/ekimae.html + css_selector: '[document] > html > head.notranslate > link' + retrieved_on: '2025-12-25T15:58:50.883033+00:00' + extraction_method: crawl4ai_link_rel + favicon_type: '' + favicon_sizes: '' + summary: + total_claims: 2 + has_primary_logo: true + has_favicon: true + has_og_image: false + favicon_count: 1 diff --git a/data/custodian/JP-13-KIY-L-KMKL.yaml b/data/custodian/JP-13-KIY-L-KMKL.yaml index 3e8df06851..b94142a419 100644 --- a/data/custodian/JP-13-KIY-L-KMKL.yaml +++ b/data/custodian/JP-13-KIY-L-KMKL.yaml @@ -32,13 +32,14 @@ ghcid: method: CH_ANNOTATOR_SOURCE ghcid_history: - ghcid: JP-13-KIY-L-KMKL - valid_from: "2025-12-10T09:44:05Z" + valid_from: '2025-12-10T09:44:05Z' valid_to: null - reason: "Corrected region code from JP-TO (abbreviation) to JP-13 (Tokyo) per ISO 3166-2:JP" + reason: Corrected region code from JP-TO (abbreviation) to JP-13 (Tokyo) per ISO + 3166-2:JP - ghcid: JP-TO-KIY-L-KMKL valid_from: null - valid_to: "2025-12-10T09:44:05Z" - reason: "Previous GHCID with incorrect region code" + valid_to: '2025-12-10T09:44:05Z' + reason: Previous GHCID with incorrect region code - ghcid: JP-TO-KIY-L-KMKL ghcid_numeric: 7845588163158553809 valid_from: '2025-12-06T23:38:43.885010+00:00' @@ -96,8 +97,8 @@ ch_annotator: annotation_metadata: confidence_score: 0.98 verified: false - verification_date: - verified_by: + verification_date: null + verified_by: null entity_claims: - claim_type: full_name claim_value: Kiyose Motomachi Kodomo Library @@ -151,3 +152,30 @@ location: geonames_id: 11611938 geonames_name: Kiyose feature_code: PPLA2 +logo_enrichment: + enrichment_timestamp: '2025-12-25T15:59:00.204169+00:00' + source_url: https://www.library.kiyose.tokyo.jp/lib_info/motomachi.html + extraction_method: crawl4ai + claims: + - claim_type: logo_url + claim_value: https://www.library.kiyose.tokyo.jp/themes/lib_theme/images/logo.png + source_url: https://www.library.kiyose.tokyo.jp/lib_info/motomachi.html + css_selector: '#header_logo > a.active > img' + retrieved_on: '2025-12-25T15:59:00.204169+00:00' + extraction_method: crawl4ai_header_logo + detection_confidence: high + alt_text: 清瀬市立図書館 + - claim_type: favicon_url + claim_value: https://www.library.kiyose.tokyo.jp/themes/lib_theme/favicon.ico + source_url: https://www.library.kiyose.tokyo.jp/lib_info/motomachi.html + css_selector: '[document] > html > head.notranslate > link' + retrieved_on: '2025-12-25T15:59:00.204169+00:00' + extraction_method: crawl4ai_link_rel + favicon_type: '' + favicon_sizes: '' + summary: + total_claims: 2 + has_primary_logo: true + has_favicon: true + has_og_image: false + favicon_count: 1 diff --git a/data/custodian/JP-13-KIY-L-KNL.yaml b/data/custodian/JP-13-KIY-L-KNL.yaml index 1a66a26681..b71c2beec6 100644 --- a/data/custodian/JP-13-KIY-L-KNL.yaml +++ b/data/custodian/JP-13-KIY-L-KNL.yaml @@ -152,3 +152,30 @@ location: geonames_id: 11611938 geonames_name: Kiyose feature_code: PPLA2 +logo_enrichment: + enrichment_timestamp: '2025-12-25T15:59:10.571864+00:00' + source_url: https://www.library.kiyose.tokyo.jp/lib_info/noshio.html + extraction_method: crawl4ai + claims: + - claim_type: logo_url + claim_value: https://www.library.kiyose.tokyo.jp/themes/lib_theme/images/logo.png + source_url: https://www.library.kiyose.tokyo.jp/lib_info/noshio.html + css_selector: '#header_logo > a.active > img' + retrieved_on: '2025-12-25T15:59:10.571864+00:00' + extraction_method: crawl4ai_header_logo + detection_confidence: high + alt_text: 清瀬市立図書館 + - claim_type: favicon_url + claim_value: https://www.library.kiyose.tokyo.jp/themes/lib_theme/favicon.ico + source_url: https://www.library.kiyose.tokyo.jp/lib_info/noshio.html + css_selector: '[document] > html > head.notranslate > link' + retrieved_on: '2025-12-25T15:59:10.571864+00:00' + extraction_method: crawl4ai_link_rel + favicon_type: '' + favicon_sizes: '' + summary: + total_claims: 2 + has_primary_logo: true + has_favicon: true + has_og_image: false + favicon_count: 1 diff --git a/data/custodian/JP-13-KIY-L-KSL.yaml b/data/custodian/JP-13-KIY-L-KSL.yaml index fc0e248417..0d2c233c06 100644 --- a/data/custodian/JP-13-KIY-L-KSL.yaml +++ b/data/custodian/JP-13-KIY-L-KSL.yaml @@ -32,13 +32,14 @@ ghcid: method: CH_ANNOTATOR_SOURCE ghcid_history: - ghcid: JP-13-KIY-L-KSL - valid_from: "2025-12-10T09:44:05Z" + valid_from: '2025-12-10T09:44:05Z' valid_to: null - reason: "Corrected region code from JP-TO (abbreviation) to JP-13 (Tokyo) per ISO 3166-2:JP" + reason: Corrected region code from JP-TO (abbreviation) to JP-13 (Tokyo) per ISO + 3166-2:JP - ghcid: JP-TO-KIY-L-KSL valid_from: null - valid_to: "2025-12-10T09:44:05Z" - reason: "Previous GHCID with incorrect region code" + valid_to: '2025-12-10T09:44:05Z' + reason: Previous GHCID with incorrect region code - ghcid: JP-TO-KIY-L-KSL ghcid_numeric: 17829762762928010003 valid_from: '2025-12-06T23:38:43.882632+00:00' @@ -96,8 +97,8 @@ ch_annotator: annotation_metadata: confidence_score: 0.98 verified: false - verification_date: - verified_by: + verification_date: null + verified_by: null entity_claims: - claim_type: full_name claim_value: Kiyose Shitajuku Library @@ -151,3 +152,30 @@ location: geonames_id: 11611938 geonames_name: Kiyose feature_code: PPLA2 +logo_enrichment: + enrichment_timestamp: '2025-12-25T15:59:20.098337+00:00' + source_url: https://www.library.kiyose.tokyo.jp/lib_info/shitajuku.html + extraction_method: crawl4ai + claims: + - claim_type: logo_url + claim_value: https://www.library.kiyose.tokyo.jp/themes/lib_theme/images/logo.png + source_url: https://www.library.kiyose.tokyo.jp/lib_info/shitajuku.html + css_selector: '#header_logo > a.active > img' + retrieved_on: '2025-12-25T15:59:20.098337+00:00' + extraction_method: crawl4ai_header_logo + detection_confidence: high + alt_text: 清瀬市立図書館 + - claim_type: favicon_url + claim_value: https://www.library.kiyose.tokyo.jp/themes/lib_theme/favicon.ico + source_url: https://www.library.kiyose.tokyo.jp/lib_info/shitajuku.html + css_selector: '[document] > html > head.notranslate > link' + retrieved_on: '2025-12-25T15:59:20.098337+00:00' + extraction_method: crawl4ai_link_rel + favicon_type: '' + favicon_sizes: '' + summary: + total_claims: 2 + has_primary_logo: true + has_favicon: true + has_og_image: false + favicon_count: 1 diff --git a/data/custodian/JP-13-KIY-L-KTL.yaml b/data/custodian/JP-13-KIY-L-KTL.yaml index c6eebed723..2090712fde 100644 --- a/data/custodian/JP-13-KIY-L-KTL.yaml +++ b/data/custodian/JP-13-KIY-L-KTL.yaml @@ -32,13 +32,14 @@ ghcid: method: CH_ANNOTATOR_SOURCE ghcid_history: - ghcid: JP-13-KIY-L-KTL - valid_from: "2025-12-10T09:44:05Z" + valid_from: '2025-12-10T09:44:05Z' valid_to: null - reason: "Corrected region code from JP-TO (abbreviation) to JP-13 (Tokyo) per ISO 3166-2:JP" + reason: Corrected region code from JP-TO (abbreviation) to JP-13 (Tokyo) per ISO + 3166-2:JP - ghcid: JP-TO-KIY-L-KTL valid_from: null - valid_to: "2025-12-10T09:44:05Z" - reason: "Previous GHCID with incorrect region code" + valid_to: '2025-12-10T09:44:05Z' + reason: Previous GHCID with incorrect region code - ghcid: JP-TO-KIY-L-KTL ghcid_numeric: 11281465068705462857 valid_from: '2025-12-06T23:38:43.889591+00:00' @@ -96,8 +97,8 @@ ch_annotator: annotation_metadata: confidence_score: 0.98 verified: false - verification_date: - verified_by: + verification_date: null + verified_by: null entity_claims: - claim_type: full_name claim_value: Kiyose Takeoka Library @@ -151,3 +152,30 @@ location: geonames_id: 11611938 geonames_name: Kiyose feature_code: PPLA2 +logo_enrichment: + enrichment_timestamp: '2025-12-25T15:59:29.496975+00:00' + source_url: https://www.library.kiyose.tokyo.jp/lib_info/takeoka.html + extraction_method: crawl4ai + claims: + - claim_type: logo_url + claim_value: https://www.library.kiyose.tokyo.jp/themes/lib_theme/images/logo.png + source_url: https://www.library.kiyose.tokyo.jp/lib_info/takeoka.html + css_selector: '#header_logo > a.active > img' + retrieved_on: '2025-12-25T15:59:29.496975+00:00' + extraction_method: crawl4ai_header_logo + detection_confidence: high + alt_text: 清瀬市立図書館 + - claim_type: favicon_url + claim_value: https://www.library.kiyose.tokyo.jp/themes/lib_theme/favicon.ico + source_url: https://www.library.kiyose.tokyo.jp/lib_info/takeoka.html + css_selector: '[document] > html > head.notranslate > link' + retrieved_on: '2025-12-25T15:59:29.496975+00:00' + extraction_method: crawl4ai_link_rel + favicon_type: '' + favicon_sizes: '' + summary: + total_claims: 2 + has_primary_logo: true + has_favicon: true + has_og_image: false + favicon_count: 1 diff --git a/data/custodian/JP-13-KIY-L-LMPU.yaml b/data/custodian/JP-13-KIY-L-LMPU.yaml index b7d1e969ab..7121ee47fb 100644 --- a/data/custodian/JP-13-KIY-L-LMPU.yaml +++ b/data/custodian/JP-13-KIY-L-LMPU.yaml @@ -37,13 +37,14 @@ ghcid: method: CH_ANNOTATOR_SOURCE ghcid_history: - ghcid: JP-13-KIY-L-LMPU - valid_from: "2025-12-10T09:44:05Z" + valid_from: '2025-12-10T09:44:05Z' valid_to: null - reason: "Corrected region code from JP-TO (abbreviation) to JP-13 (Tokyo) per ISO 3166-2:JP" + reason: Corrected region code from JP-TO (abbreviation) to JP-13 (Tokyo) per ISO + 3166-2:JP - ghcid: JP-TO-KIY-L-LMPU valid_from: null - valid_to: "2025-12-10T09:44:05Z" - reason: "Previous GHCID with incorrect region code" + valid_to: '2025-12-10T09:44:05Z' + reason: Previous GHCID with incorrect region code - ghcid: JP-TO-KIY-L-LMPU ghcid_numeric: 5743938741689940983 valid_from: '2025-12-06T23:38:55.310024+00:00' @@ -101,8 +102,8 @@ ch_annotator: annotation_metadata: confidence_score: 0.98 verified: false - verification_date: - verified_by: + verification_date: null + verified_by: null entity_claims: - claim_type: full_name claim_value: Library, Meiji Pharmaceutical University @@ -204,3 +205,28 @@ location: geonames_id: 11611938 geonames_name: Kiyose feature_code: PPLA2 +logo_enrichment: + enrichment_timestamp: '2025-12-25T15:59:39.631000+00:00' + source_url: http://www.my-pharm.ac.jp/~toshokan/index.html + extraction_method: crawl4ai + claims: + - claim_type: favicon_url + claim_value: http://www.my-pharm.ac.jp/files/pv/1/site/favicon.ico + source_url: http://www.my-pharm.ac.jp/~toshokan/index.html + css_selector: '[document] > html > head > link:nth-of-type(2)' + retrieved_on: '2025-12-25T15:59:39.631000+00:00' + extraction_method: crawl4ai_link_rel + favicon_type: '' + favicon_sizes: 180x180 + - claim_type: og_image_url + claim_value: https://www.my-pharm.ac.jp/files/co/ogimage/ogp.png + source_url: http://www.my-pharm.ac.jp/~toshokan/index.html + css_selector: '[document] > html > head > meta:nth-of-type(13)' + retrieved_on: '2025-12-25T15:59:39.631000+00:00' + extraction_method: crawl4ai_meta_og + summary: + total_claims: 2 + has_primary_logo: false + has_favicon: true + has_og_image: true + favicon_count: 1 diff --git a/data/custodian/JP-13-KIY-L-ORCTRI.yaml b/data/custodian/JP-13-KIY-L-ORCTRI.yaml index 5eaf4bd87e..f4e1daefe7 100644 --- a/data/custodian/JP-13-KIY-L-ORCTRI.yaml +++ b/data/custodian/JP-13-KIY-L-ORCTRI.yaml @@ -32,13 +32,14 @@ ghcid: method: CH_ANNOTATOR_SOURCE ghcid_history: - ghcid: JP-13-KIY-L-ORCTRI - valid_from: "2025-12-10T09:44:05Z" + valid_from: '2025-12-10T09:44:05Z' valid_to: null - reason: "Corrected region code from JP-TO (abbreviation) to JP-13 (Tokyo) per ISO 3166-2:JP" + reason: Corrected region code from JP-TO (abbreviation) to JP-13 (Tokyo) per ISO + 3166-2:JP - ghcid: JP-TO-KIY-L-ORCTRI valid_from: null - valid_to: "2025-12-10T09:44:05Z" - reason: "Previous GHCID with incorrect region code" + valid_to: '2025-12-10T09:44:05Z' + reason: Previous GHCID with incorrect region code - ghcid: JP-TO-KIY-L-ORCTRI ghcid_numeric: 15784382743609909290 valid_from: '2025-12-06T23:38:58.704186+00:00' @@ -96,8 +97,8 @@ ch_annotator: annotation_metadata: confidence_score: 0.98 verified: false - verification_date: - verified_by: + verification_date: null + verified_by: null entity_claims: - claim_type: full_name claim_value: Obayashi Road Corporation Technical Research Institute @@ -151,3 +152,28 @@ location: geonames_id: 11611938 geonames_name: Kiyose feature_code: PPLA2 +logo_enrichment: + enrichment_timestamp: '2025-12-25T15:59:57.627602+00:00' + source_url: http://www.obayashi-road.co.jp/technology/research + extraction_method: crawl4ai + claims: + - claim_type: favicon_url + claim_value: https://www.obayashi-road.co.jp/wp-content/themes/obayashi-road/favicon.ico + source_url: http://www.obayashi-road.co.jp/technology/research + css_selector: '[document] > html > head > link' + retrieved_on: '2025-12-25T15:59:57.627602+00:00' + extraction_method: crawl4ai_link_rel + favicon_type: '' + favicon_sizes: '' + - claim_type: og_image_url + claim_value: https://www.obayashi-road.co.jp/wp-content/themes/obayashi-road/og.png + source_url: http://www.obayashi-road.co.jp/technology/research + css_selector: '[document] > html > head > meta:nth-of-type(11)' + retrieved_on: '2025-12-25T15:59:57.627602+00:00' + extraction_method: crawl4ai_meta_og + summary: + total_claims: 2 + has_primary_logo: false + has_favicon: true + has_og_image: true + favicon_count: 1 diff --git a/data/custodian/JP-13-KIY-M-KMM.yaml b/data/custodian/JP-13-KIY-M-KMM.yaml index 363afe30ad..5c8b9d86ad 100644 --- a/data/custodian/JP-13-KIY-M-KMM.yaml +++ b/data/custodian/JP-13-KIY-M-KMM.yaml @@ -32,13 +32,14 @@ ghcid: method: CH_ANNOTATOR_SOURCE ghcid_history: - ghcid: JP-13-KIY-M-KMM - valid_from: "2025-12-10T09:44:05Z" + valid_from: '2025-12-10T09:44:05Z' valid_to: null - reason: "Corrected region code from JP-TO (abbreviation) to JP-13 (Tokyo) per ISO 3166-2:JP" + reason: Corrected region code from JP-TO (abbreviation) to JP-13 (Tokyo) per ISO + 3166-2:JP - ghcid: JP-TO-KIY-M-KMM valid_from: null - valid_to: "2025-12-10T09:44:05Z" - reason: "Previous GHCID with incorrect region code" + valid_to: '2025-12-10T09:44:05Z' + reason: Previous GHCID with incorrect region code - ghcid: JP-TO-KIY-M-KMM ghcid_numeric: 10131382580904959060 valid_from: '2025-12-06T23:38:33.711915+00:00' @@ -96,8 +97,8 @@ ch_annotator: annotation_metadata: confidence_score: 0.98 verified: false - verification_date: - verified_by: + verification_date: null + verified_by: null entity_claims: - claim_type: full_name claim_value: KIYOSE MUNICIPAL MUSEUM @@ -151,3 +152,30 @@ location: geonames_id: 11611938 geonames_name: Kiyose feature_code: PPLA2 +logo_enrichment: + enrichment_timestamp: '2025-12-25T16:00:09.830363+00:00' + source_url: http://museum-kiyose.jp + extraction_method: crawl4ai + claims: + - claim_type: favicon_url + claim_value: https://museum-kiyose.jp/wp-content/uploads/2025/03/favicon-450x450.png + source_url: http://museum-kiyose.jp + css_selector: '[document] > html.wf-big-caslon-fb-n4-active.wf-hiragino-kaku-gothic-pron-n6-active + > head > link:nth-of-type(48)' + retrieved_on: '2025-12-25T16:00:09.830363+00:00' + extraction_method: crawl4ai_link_rel + favicon_type: '' + favicon_sizes: 192x192 + - claim_type: og_image_url + claim_value: https://museum-kiyose.jp/wp-content/uploads/2025/03/slide_top_main_5-900x587.jpg + source_url: http://museum-kiyose.jp + css_selector: '[document] > html.wf-big-caslon-fb-n4-active.wf-hiragino-kaku-gothic-pron-n6-active + > head > meta:nth-of-type(13)' + retrieved_on: '2025-12-25T16:00:09.830363+00:00' + extraction_method: crawl4ai_meta_og + summary: + total_claims: 2 + has_primary_logo: false + has_favicon: true + has_og_image: true + favicon_count: 2 diff --git a/data/custodian/JP-13-KOD-L-BGUKL.yaml b/data/custodian/JP-13-KOD-L-BGUKL.yaml index b41aa2132e..c699f0f0b2 100644 --- a/data/custodian/JP-13-KOD-L-BGUKL.yaml +++ b/data/custodian/JP-13-KOD-L-BGUKL.yaml @@ -205,3 +205,22 @@ location: geonames_id: 11611930 geonames_name: Kodaira feature_code: PPLA2 +logo_enrichment: + enrichment_timestamp: '2025-12-25T16:00:41.996793+00:00' + source_url: http://lib.bunka.ac.jp + extraction_method: crawl4ai + claims: + - claim_type: favicon_url + claim_value: https://lib.bunka.ac.jp/web_admin/wp-content/uploads/2022/06/cropped-favicon-180x180.png + source_url: http://lib.bunka.ac.jp + css_selector: '[document] > html > head > link:nth-of-type(8)' + retrieved_on: '2025-12-25T16:00:41.996793+00:00' + extraction_method: crawl4ai_link_rel + favicon_type: '' + favicon_sizes: '' + summary: + total_claims: 1 + has_primary_logo: false + has_favicon: true + has_og_image: false + favicon_count: 3 diff --git a/data/custodian/JP-13-KOD-L-KIMC.yaml b/data/custodian/JP-13-KOD-L-KIMC.yaml index ed4a7333cc..259c89bf72 100644 --- a/data/custodian/JP-13-KOD-L-KIMC.yaml +++ b/data/custodian/JP-13-KOD-L-KIMC.yaml @@ -37,13 +37,14 @@ ghcid: method: CH_ANNOTATOR_SOURCE ghcid_history: - ghcid: JP-13-KOD-L-KIMC - valid_from: "2025-12-10T09:44:05Z" + valid_from: '2025-12-10T09:44:05Z' valid_to: null - reason: "Corrected region code from JP-TO (abbreviation) to JP-13 (Tokyo) per ISO 3166-2:JP" + reason: Corrected region code from JP-TO (abbreviation) to JP-13 (Tokyo) per ISO + 3166-2:JP - ghcid: JP-TO-KOD-L-KIMC valid_from: null - valid_to: "2025-12-10T09:44:05Z" - reason: "Previous GHCID with incorrect region code" + valid_to: '2025-12-10T09:44:05Z' + reason: Previous GHCID with incorrect region code - ghcid: JP-TO-KOD-L-KIMC ghcid_numeric: 7707655400399442056 valid_from: '2025-12-06T23:38:55.423632+00:00' @@ -101,8 +102,8 @@ ch_annotator: annotation_metadata: confidence_score: 0.98 verified: false - verification_date: - verified_by: + verification_date: null + verified_by: null entity_claims: - claim_type: full_name claim_value: Kaetsu Information & Media Center @@ -196,7 +197,8 @@ wikidata_enrichment: description: organisatie uit Japan - id: Q56056912 label: Japan Consortium for Open Access Repository - description: promotes open access and open science in Japan with knowledge dissemination via digital repositories + description: promotes open access and open science in Japan with knowledge dissemination + via digital repositories wikidata_web: official_website: http://imc.kaetsu.ac.jp/ wikidata_official_website: http://imc.kaetsu.ac.jp/ @@ -218,3 +220,28 @@ location: geonames_id: 11611930 geonames_name: Kodaira feature_code: PPLA2 +logo_enrichment: + enrichment_timestamp: '2025-12-25T16:01:19.344149+00:00' + source_url: http://imc.kaetsu.ac.jp + extraction_method: crawl4ai + claims: + - claim_type: favicon_url + claim_value: https://lh3.googleusercontent.com/sitesv/AAzXCkdCUJRI3krBpYmzsiTFDswQd1-Oub-3V6TfFrqpYQvGVIpleWjRly-MCEaJA5mad2nOCikKaSeBbwL8guU1ES7nf9dAxZRo_cmWBOcg_WFpK_Mz1DQiyZDOsoBR-BsF4XDwutLCN0ARPaglU_oGq61VflQKOIB8zznfazyhoErtlAVQ0wP7OTaqYkk + source_url: http://imc.kaetsu.ac.jp + css_selector: '[document] > html > head > link' + retrieved_on: '2025-12-25T16:01:19.344149+00:00' + extraction_method: crawl4ai_link_rel + favicon_type: '' + favicon_sizes: '' + - claim_type: og_image_url + claim_value: https://lh3.googleusercontent.com/sitesv/AAzXCke1cPAG5_px-4Kp4mwYgjUbvz-E4I-spMUNKq_AxURje0X7k8Otkobz2hbiauZgt7roVj9lEEMPcZvUVqhjpZ3vMJub-Wzv48ToGQuLd64kALNp-FPprMWJvjnBYt4u4SCmF3pSkZc57NW8sI_Ahmf2POL6N68Y8sg=w16383 + source_url: http://imc.kaetsu.ac.jp + css_selector: '[document] > html > head > meta:nth-of-type(15)' + retrieved_on: '2025-12-25T16:01:19.344149+00:00' + extraction_method: crawl4ai_meta_og + summary: + total_claims: 2 + has_primary_logo: false + has_favicon: true + has_og_image: true + favicon_count: 1 diff --git a/data/custodian/JP-13-KOD-L-KL-kodairashiritsuhanakoganei_library.yaml b/data/custodian/JP-13-KOD-L-KL-kodairashiritsuhanakoganei_library.yaml index 0726ad4d98..36407f2d9e 100644 --- a/data/custodian/JP-13-KOD-L-KL-kodairashiritsuhanakoganei_library.yaml +++ b/data/custodian/JP-13-KOD-L-KL-kodairashiritsuhanakoganei_library.yaml @@ -152,3 +152,22 @@ location: geonames_id: 11611930 geonames_name: Kodaira feature_code: PPLA2 +logo_enrichment: + enrichment_timestamp: '2025-12-25T16:01:31.598502+00:00' + source_url: https://library.kodaira.ed.jp + extraction_method: crawl4ai + claims: + - claim_type: favicon_url + claim_value: https://library.kodaira.ed.jp/apple-touch-icon.png + source_url: https://library.kodaira.ed.jp + css_selector: '[document] > html > head > link:nth-of-type(12)' + retrieved_on: '2025-12-25T16:01:31.598502+00:00' + extraction_method: crawl4ai_link_rel + favicon_type: '' + favicon_sizes: 180x180 + summary: + total_claims: 1 + has_primary_logo: false + has_favicon: true + has_og_image: false + favicon_count: 3 diff --git a/data/custodian/JP-13-KOD-L-KL-kodairashiritsukamijuku_library.yaml b/data/custodian/JP-13-KOD-L-KL-kodairashiritsukamijuku_library.yaml index 5790bb9b8c..c382949cda 100644 --- a/data/custodian/JP-13-KOD-L-KL-kodairashiritsukamijuku_library.yaml +++ b/data/custodian/JP-13-KOD-L-KL-kodairashiritsukamijuku_library.yaml @@ -32,13 +32,14 @@ ghcid: method: CH_ANNOTATOR_SOURCE ghcid_history: - ghcid: JP-13-KOD-L-KL-kodairashiritsukamijuku_library - valid_from: "2025-12-10T09:44:05Z" + valid_from: '2025-12-10T09:44:05Z' valid_to: null - reason: "Corrected region code from JP-TO (abbreviation) to JP-13 (Tokyo) per ISO 3166-2:JP" + reason: Corrected region code from JP-TO (abbreviation) to JP-13 (Tokyo) per ISO + 3166-2:JP - ghcid: JP-TO-KOD-L-KL-kodairashiritsukamijuku_library valid_from: null - valid_to: "2025-12-10T09:44:05Z" - reason: "Previous GHCID with incorrect region code" + valid_to: '2025-12-10T09:44:05Z' + reason: Previous GHCID with incorrect region code - ghcid: JP-TO-KOD-L-KL-kodairashiritsukamijuku_library ghcid_numeric: 9436911239262342575 valid_from: '2025-12-06T23:38:43.805757+00:00' @@ -96,8 +97,8 @@ ch_annotator: annotation_metadata: confidence_score: 0.98 verified: false - verification_date: - verified_by: + verification_date: null + verified_by: null entity_claims: - claim_type: full_name claim_value: KODAIRASHIRITSUKAMIJUKU Library @@ -151,3 +152,22 @@ location: geonames_id: 11611930 geonames_name: Kodaira feature_code: PPLA2 +logo_enrichment: + enrichment_timestamp: '2025-12-25T16:01:46.716353+00:00' + source_url: https://library.kodaira.ed.jp + extraction_method: crawl4ai + claims: + - claim_type: favicon_url + claim_value: https://library.kodaira.ed.jp/apple-touch-icon.png + source_url: https://library.kodaira.ed.jp + css_selector: '[document] > html > head > link:nth-of-type(12)' + retrieved_on: '2025-12-25T16:01:46.716353+00:00' + extraction_method: crawl4ai_link_rel + favicon_type: '' + favicon_sizes: 180x180 + summary: + total_claims: 1 + has_primary_logo: false + has_favicon: true + has_og_image: false + favicon_count: 3 diff --git a/data/custodian/JP-13-KOD-L-KL-kodairashiritsukihei_library.yaml b/data/custodian/JP-13-KOD-L-KL-kodairashiritsukihei_library.yaml index c8f5c56f7a..b17db5812e 100644 --- a/data/custodian/JP-13-KOD-L-KL-kodairashiritsukihei_library.yaml +++ b/data/custodian/JP-13-KOD-L-KL-kodairashiritsukihei_library.yaml @@ -32,13 +32,14 @@ ghcid: method: CH_ANNOTATOR_SOURCE ghcid_history: - ghcid: JP-13-KOD-L-KL-kodairashiritsukihei_library - valid_from: "2025-12-10T09:44:05Z" + valid_from: '2025-12-10T09:44:05Z' valid_to: null - reason: "Corrected region code from JP-TO (abbreviation) to JP-13 (Tokyo) per ISO 3166-2:JP" + reason: Corrected region code from JP-TO (abbreviation) to JP-13 (Tokyo) per ISO + 3166-2:JP - ghcid: JP-TO-KOD-L-KL-kodairashiritsukihei_library valid_from: null - valid_to: "2025-12-10T09:44:05Z" - reason: "Previous GHCID with incorrect region code" + valid_to: '2025-12-10T09:44:05Z' + reason: Previous GHCID with incorrect region code - ghcid: JP-TO-KOD-L-KL-kodairashiritsukihei_library ghcid_numeric: 466045006652391380 valid_from: '2025-12-06T23:38:43.803517+00:00' @@ -96,8 +97,8 @@ ch_annotator: annotation_metadata: confidence_score: 0.98 verified: false - verification_date: - verified_by: + verification_date: null + verified_by: null entity_claims: - claim_type: full_name claim_value: KODAIRASHIRITSUKIHEI Library @@ -151,3 +152,22 @@ location: geonames_id: 11611930 geonames_name: Kodaira feature_code: PPLA2 +logo_enrichment: + enrichment_timestamp: '2025-12-25T16:02:01.100544+00:00' + source_url: https://library.kodaira.ed.jp + extraction_method: crawl4ai + claims: + - claim_type: favicon_url + claim_value: https://library.kodaira.ed.jp/apple-touch-icon.png + source_url: https://library.kodaira.ed.jp + css_selector: '[document] > html > head > link:nth-of-type(12)' + retrieved_on: '2025-12-25T16:02:01.100544+00:00' + extraction_method: crawl4ai_link_rel + favicon_type: '' + favicon_sizes: 180x180 + summary: + total_claims: 1 + has_primary_logo: false + has_favicon: true + has_og_image: false + favicon_count: 3 diff --git a/data/custodian/JP-13-KOD-L-KL-kodairashiritsunakamachi_library.yaml b/data/custodian/JP-13-KOD-L-KL-kodairashiritsunakamachi_library.yaml index e938056cde..f1e6c5ab7f 100644 --- a/data/custodian/JP-13-KOD-L-KL-kodairashiritsunakamachi_library.yaml +++ b/data/custodian/JP-13-KOD-L-KL-kodairashiritsunakamachi_library.yaml @@ -32,13 +32,14 @@ ghcid: method: CH_ANNOTATOR_SOURCE ghcid_history: - ghcid: JP-13-KOD-L-KL-kodairashiritsunakamachi_library - valid_from: "2025-12-10T09:44:05Z" + valid_from: '2025-12-10T09:44:05Z' valid_to: null - reason: "Corrected region code from JP-TO (abbreviation) to JP-13 (Tokyo) per ISO 3166-2:JP" + reason: Corrected region code from JP-TO (abbreviation) to JP-13 (Tokyo) per ISO + 3166-2:JP - ghcid: JP-TO-KOD-L-KL-kodairashiritsunakamachi_library valid_from: null - valid_to: "2025-12-10T09:44:05Z" - reason: "Previous GHCID with incorrect region code" + valid_to: '2025-12-10T09:44:05Z' + reason: Previous GHCID with incorrect region code - ghcid: JP-TO-KOD-L-KL-kodairashiritsunakamachi_library ghcid_numeric: 10301588045980117147 valid_from: '2025-12-06T23:38:43.810788+00:00' @@ -96,8 +97,8 @@ ch_annotator: annotation_metadata: confidence_score: 0.98 verified: false - verification_date: - verified_by: + verification_date: null + verified_by: null entity_claims: - claim_type: full_name claim_value: KODAIRASHIRITSUNAKAMACHI Library @@ -151,3 +152,22 @@ location: geonames_id: 11611930 geonames_name: Kodaira feature_code: PPLA2 +logo_enrichment: + enrichment_timestamp: '2025-12-25T16:02:12.632456+00:00' + source_url: https://library.kodaira.ed.jp + extraction_method: crawl4ai + claims: + - claim_type: favicon_url + claim_value: https://library.kodaira.ed.jp/apple-touch-icon.png + source_url: https://library.kodaira.ed.jp + css_selector: '[document] > html > head > link:nth-of-type(12)' + retrieved_on: '2025-12-25T16:02:12.632456+00:00' + extraction_method: crawl4ai_link_rel + favicon_type: '' + favicon_sizes: 180x180 + summary: + total_claims: 1 + has_primary_logo: false + has_favicon: true + has_og_image: false + favicon_count: 3 diff --git a/data/custodian/JP-13-KOD-L-KL-kodairashiritsuogawanishimachi_library.yaml b/data/custodian/JP-13-KOD-L-KL-kodairashiritsuogawanishimachi_library.yaml index b986a19015..582933f81e 100644 --- a/data/custodian/JP-13-KOD-L-KL-kodairashiritsuogawanishimachi_library.yaml +++ b/data/custodian/JP-13-KOD-L-KL-kodairashiritsuogawanishimachi_library.yaml @@ -32,13 +32,14 @@ ghcid: method: CH_ANNOTATOR_SOURCE ghcid_history: - ghcid: JP-13-KOD-L-KL-kodairashiritsuogawanishimachi_library - valid_from: "2025-12-10T09:44:06Z" + valid_from: '2025-12-10T09:44:06Z' valid_to: null - reason: "Corrected region code from JP-TO (abbreviation) to JP-13 (Tokyo) per ISO 3166-2:JP" + reason: Corrected region code from JP-TO (abbreviation) to JP-13 (Tokyo) per ISO + 3166-2:JP - ghcid: JP-TO-KOD-L-KL-kodairashiritsuogawanishimachi_library valid_from: null - valid_to: "2025-12-10T09:44:06Z" - reason: "Previous GHCID with incorrect region code" + valid_to: '2025-12-10T09:44:06Z' + reason: Previous GHCID with incorrect region code - ghcid: JP-TO-KOD-L-KL-kodairashiritsuogawanishimachi_library ghcid_numeric: 2181721510907518788 valid_from: '2025-12-06T23:38:43.801229+00:00' @@ -96,8 +97,8 @@ ch_annotator: annotation_metadata: confidence_score: 0.98 verified: false - verification_date: - verified_by: + verification_date: null + verified_by: null entity_claims: - claim_type: full_name claim_value: KODAIRASHIRITSUOGAWANISHIMACHI Library @@ -151,3 +152,22 @@ location: geonames_id: 11611930 geonames_name: Kodaira feature_code: PPLA2 +logo_enrichment: + enrichment_timestamp: '2025-12-25T16:02:23.585526+00:00' + source_url: https://library.kodaira.ed.jp + extraction_method: crawl4ai + claims: + - claim_type: favicon_url + claim_value: https://library.kodaira.ed.jp/apple-touch-icon.png + source_url: https://library.kodaira.ed.jp + css_selector: '[document] > html > head > link:nth-of-type(12)' + retrieved_on: '2025-12-25T16:02:23.585526+00:00' + extraction_method: crawl4ai_link_rel + favicon_type: '' + favicon_sizes: 180x180 + summary: + total_claims: 1 + has_primary_logo: false + has_favicon: true + has_og_image: false + favicon_count: 3 diff --git a/data/custodian/JP-13-KOD-L-KL-kodairashiritsuonuma_library.yaml b/data/custodian/JP-13-KOD-L-KL-kodairashiritsuonuma_library.yaml index 7bbb57fe5c..5ef2960373 100644 --- a/data/custodian/JP-13-KOD-L-KL-kodairashiritsuonuma_library.yaml +++ b/data/custodian/JP-13-KOD-L-KL-kodairashiritsuonuma_library.yaml @@ -32,13 +32,14 @@ ghcid: method: CH_ANNOTATOR_SOURCE ghcid_history: - ghcid: JP-13-KOD-L-KL-kodairashiritsuonuma_library - valid_from: "2025-12-10T09:44:06Z" + valid_from: '2025-12-10T09:44:06Z' valid_to: null - reason: "Corrected region code from JP-TO (abbreviation) to JP-13 (Tokyo) per ISO 3166-2:JP" + reason: Corrected region code from JP-TO (abbreviation) to JP-13 (Tokyo) per ISO + 3166-2:JP - ghcid: JP-TO-KOD-L-KL-kodairashiritsuonuma_library valid_from: null - valid_to: "2025-12-10T09:44:06Z" - reason: "Previous GHCID with incorrect region code" + valid_to: '2025-12-10T09:44:06Z' + reason: Previous GHCID with incorrect region code - ghcid: JP-TO-KOD-L-KL-kodairashiritsuonuma_library ghcid_numeric: 414935543335016028 valid_from: '2025-12-06T23:38:43.813096+00:00' @@ -96,8 +97,8 @@ ch_annotator: annotation_metadata: confidence_score: 0.98 verified: false - verification_date: - verified_by: + verification_date: null + verified_by: null entity_claims: - claim_type: full_name claim_value: KODAIRASHIRITSUONUMA Library @@ -151,3 +152,22 @@ location: geonames_id: 11611930 geonames_name: Kodaira feature_code: PPLA2 +logo_enrichment: + enrichment_timestamp: '2025-12-25T16:02:39.266958+00:00' + source_url: https://library.kodaira.ed.jp + extraction_method: crawl4ai + claims: + - claim_type: favicon_url + claim_value: https://library.kodaira.ed.jp/apple-touch-icon.png + source_url: https://library.kodaira.ed.jp + css_selector: '[document] > html > head > link:nth-of-type(12)' + retrieved_on: '2025-12-25T16:02:39.266958+00:00' + extraction_method: crawl4ai_link_rel + favicon_type: '' + favicon_sizes: 180x180 + summary: + total_claims: 1 + has_primary_logo: false + has_favicon: true + has_og_image: false + favicon_count: 3 diff --git a/data/custodian/JP-13-KOD-L-KL-kodairashiritsutsuda_library.yaml b/data/custodian/JP-13-KOD-L-KL-kodairashiritsutsuda_library.yaml index 08c1480736..07ab0898b9 100644 --- a/data/custodian/JP-13-KOD-L-KL-kodairashiritsutsuda_library.yaml +++ b/data/custodian/JP-13-KOD-L-KL-kodairashiritsutsuda_library.yaml @@ -32,13 +32,14 @@ ghcid: method: CH_ANNOTATOR_SOURCE ghcid_history: - ghcid: JP-13-KOD-L-KL-kodairashiritsutsuda_library - valid_from: "2025-12-10T09:44:06Z" + valid_from: '2025-12-10T09:44:06Z' valid_to: null - reason: "Corrected region code from JP-TO (abbreviation) to JP-13 (Tokyo) per ISO 3166-2:JP" + reason: Corrected region code from JP-TO (abbreviation) to JP-13 (Tokyo) per ISO + 3166-2:JP - ghcid: JP-TO-KOD-L-KL-kodairashiritsutsuda_library valid_from: null - valid_to: "2025-12-10T09:44:06Z" - reason: "Previous GHCID with incorrect region code" + valid_to: '2025-12-10T09:44:06Z' + reason: Previous GHCID with incorrect region code - ghcid: JP-TO-KOD-L-KL-kodairashiritsutsuda_library ghcid_numeric: 1967413942772359446 valid_from: '2025-12-06T23:38:43.808480+00:00' @@ -96,8 +97,8 @@ ch_annotator: annotation_metadata: confidence_score: 0.98 verified: false - verification_date: - verified_by: + verification_date: null + verified_by: null entity_claims: - claim_type: full_name claim_value: KODAIRASHIRITSUTSUDA Library @@ -151,3 +152,22 @@ location: geonames_id: 11611930 geonames_name: Kodaira feature_code: PPLA2 +logo_enrichment: + enrichment_timestamp: '2025-12-25T16:02:53.457108+00:00' + source_url: https://library.kodaira.ed.jp + extraction_method: crawl4ai + claims: + - claim_type: favicon_url + claim_value: https://library.kodaira.ed.jp/apple-touch-icon.png + source_url: https://library.kodaira.ed.jp + css_selector: '[document] > html > head > link:nth-of-type(12)' + retrieved_on: '2025-12-25T16:02:53.457108+00:00' + extraction_method: crawl4ai_link_rel + favicon_type: '' + favicon_sizes: 180x180 + summary: + total_claims: 1 + has_primary_logo: false + has_favicon: true + has_og_image: false + favicon_count: 3 diff --git a/data/custodian/JP-13-KOD-L-KL.yaml b/data/custodian/JP-13-KOD-L-KL.yaml index 0fbfff363b..3b515a0f79 100644 --- a/data/custodian/JP-13-KOD-L-KL.yaml +++ b/data/custodian/JP-13-KOD-L-KL.yaml @@ -32,13 +32,14 @@ ghcid: method: CH_ANNOTATOR_SOURCE ghcid_history: - ghcid: JP-13-KOD-L-KL - valid_from: "2025-12-10T09:44:06Z" + valid_from: '2025-12-10T09:44:06Z' valid_to: null - reason: "Corrected region code from JP-TO (abbreviation) to JP-13 (Tokyo) per ISO 3166-2:JP" + reason: Corrected region code from JP-TO (abbreviation) to JP-13 (Tokyo) per ISO + 3166-2:JP - ghcid: JP-TO-KOD-L-KL valid_from: null - valid_to: "2025-12-10T09:44:06Z" - reason: "Previous GHCID with incorrect region code" + valid_to: '2025-12-10T09:44:06Z' + reason: Previous GHCID with incorrect region code - ghcid: JP-TO-KOD-L-KL ghcid_numeric: 14613600953179088682 valid_from: '2025-12-06T23:38:43.788803+00:00' @@ -96,8 +97,8 @@ ch_annotator: annotation_metadata: confidence_score: 0.98 verified: false - verification_date: - verified_by: + verification_date: null + verified_by: null entity_claims: - claim_type: full_name claim_value: KODAIRASHICHUO Library @@ -151,3 +152,22 @@ location: geonames_id: 11611930 geonames_name: Kodaira feature_code: PPLA2 +logo_enrichment: + enrichment_timestamp: '2025-12-25T16:03:08.703390+00:00' + source_url: https://library.kodaira.ed.jp + extraction_method: crawl4ai + claims: + - claim_type: favicon_url + claim_value: https://library.kodaira.ed.jp/apple-touch-icon.png + source_url: https://library.kodaira.ed.jp + css_selector: '[document] > html > head > link:nth-of-type(12)' + retrieved_on: '2025-12-25T16:03:08.703390+00:00' + extraction_method: crawl4ai_link_rel + favicon_type: '' + favicon_sizes: 180x180 + summary: + total_claims: 1 + has_primary_logo: false + has_favicon: true + has_og_image: false + favicon_count: 3 diff --git a/data/custodian/JP-13-KOD-L-KLH.yaml b/data/custodian/JP-13-KOD-L-KLH.yaml index 926d09b7d6..1cf28394f4 100644 --- a/data/custodian/JP-13-KOD-L-KLH.yaml +++ b/data/custodian/JP-13-KOD-L-KLH.yaml @@ -32,13 +32,14 @@ ghcid: method: CH_ANNOTATOR_SOURCE ghcid_history: - ghcid: JP-13-KOD-L-KLH - valid_from: "2025-12-10T09:44:06Z" + valid_from: '2025-12-10T09:44:06Z' valid_to: null - reason: "Corrected region code from JP-TO (abbreviation) to JP-13 (Tokyo) per ISO 3166-2:JP" + reason: Corrected region code from JP-TO (abbreviation) to JP-13 (Tokyo) per ISO + 3166-2:JP - ghcid: JP-TO-KOD-L-KLH valid_from: null - valid_to: "2025-12-10T09:44:06Z" - reason: "Previous GHCID with incorrect region code" + valid_to: '2025-12-10T09:44:06Z' + reason: Previous GHCID with incorrect region code - ghcid: JP-TO-KOD-L-KLH ghcid_numeric: 17352392672325653993 valid_from: '2025-12-06T23:38:43.791151+00:00' @@ -96,8 +97,8 @@ ch_annotator: annotation_metadata: confidence_score: 0.98 verified: false - verification_date: - verified_by: + verification_date: null + verified_by: null entity_claims: - claim_type: full_name claim_value: KODAIRASHICHUO Library HANAKOGANEIKITABUNSHITSU @@ -151,3 +152,22 @@ location: geonames_id: 11611930 geonames_name: Kodaira feature_code: PPLA2 +logo_enrichment: + enrichment_timestamp: '2025-12-25T16:03:23.407517+00:00' + source_url: https://library.kodaira.ed.jp + extraction_method: crawl4ai + claims: + - claim_type: favicon_url + claim_value: https://library.kodaira.ed.jp/apple-touch-icon.png + source_url: https://library.kodaira.ed.jp + css_selector: '[document] > html > head > link:nth-of-type(12)' + retrieved_on: '2025-12-25T16:03:23.407517+00:00' + extraction_method: crawl4ai_link_rel + favicon_type: '' + favicon_sizes: 180x180 + summary: + total_claims: 1 + has_primary_logo: false + has_favicon: true + has_og_image: false + favicon_count: 3 diff --git a/data/custodian/JP-13-KOD-L-KLJ.yaml b/data/custodian/JP-13-KOD-L-KLJ.yaml index b1949c0d27..e4d1c61eb9 100644 --- a/data/custodian/JP-13-KOD-L-KLJ.yaml +++ b/data/custodian/JP-13-KOD-L-KLJ.yaml @@ -32,13 +32,14 @@ ghcid: method: CH_ANNOTATOR_SOURCE ghcid_history: - ghcid: JP-13-KOD-L-KLJ - valid_from: "2025-12-10T09:44:06Z" + valid_from: '2025-12-10T09:44:06Z' valid_to: null - reason: "Corrected region code from JP-TO (abbreviation) to JP-13 (Tokyo) per ISO 3166-2:JP" + reason: Corrected region code from JP-TO (abbreviation) to JP-13 (Tokyo) per ISO + 3166-2:JP - ghcid: JP-TO-KOD-L-KLJ valid_from: null - valid_to: "2025-12-10T09:44:06Z" - reason: "Previous GHCID with incorrect region code" + valid_to: '2025-12-10T09:44:06Z' + reason: Previous GHCID with incorrect region code - ghcid: JP-TO-KOD-L-KLJ ghcid_numeric: 126172470882147054 valid_from: '2025-12-06T23:38:43.796689+00:00' @@ -96,8 +97,8 @@ ch_annotator: annotation_metadata: confidence_score: 0.98 verified: false - verification_date: - verified_by: + verification_date: null + verified_by: null entity_claims: - claim_type: full_name claim_value: KODAIRASHICHUO Library JOSUIMINAMIBUNSHITSU @@ -151,3 +152,22 @@ location: geonames_id: 11611930 geonames_name: Kodaira feature_code: PPLA2 +logo_enrichment: + enrichment_timestamp: '2025-12-25T16:03:35.752428+00:00' + source_url: https://library.kodaira.ed.jp + extraction_method: crawl4ai + claims: + - claim_type: favicon_url + claim_value: https://library.kodaira.ed.jp/apple-touch-icon.png + source_url: https://library.kodaira.ed.jp + css_selector: '[document] > html > head > link:nth-of-type(12)' + retrieved_on: '2025-12-25T16:03:35.752428+00:00' + extraction_method: crawl4ai_link_rel + favicon_type: '' + favicon_sizes: 180x180 + summary: + total_claims: 1 + has_primary_logo: false + has_favicon: true + has_og_image: false + favicon_count: 3 diff --git a/data/custodian/JP-13-KOD-L-KLO.yaml b/data/custodian/JP-13-KOD-L-KLO.yaml index 791409d3da..d29909ccfe 100644 --- a/data/custodian/JP-13-KOD-L-KLO.yaml +++ b/data/custodian/JP-13-KOD-L-KLO.yaml @@ -32,13 +32,14 @@ ghcid: method: CH_ANNOTATOR_SOURCE ghcid_history: - ghcid: JP-13-KOD-L-KLO - valid_from: "2025-12-10T09:44:06Z" + valid_from: '2025-12-10T09:44:06Z' valid_to: null - reason: "Corrected region code from JP-TO (abbreviation) to JP-13 (Tokyo) per ISO 3166-2:JP" + reason: Corrected region code from JP-TO (abbreviation) to JP-13 (Tokyo) per ISO + 3166-2:JP - ghcid: JP-TO-KOD-L-KLO valid_from: null - valid_to: "2025-12-10T09:44:06Z" - reason: "Previous GHCID with incorrect region code" + valid_to: '2025-12-10T09:44:06Z' + reason: Previous GHCID with incorrect region code - ghcid: JP-TO-KOD-L-KLO ghcid_numeric: 6585196833365884199 valid_from: '2025-12-06T23:38:43.794462+00:00' @@ -96,8 +97,8 @@ ch_annotator: annotation_metadata: confidence_score: 0.98 verified: false - verification_date: - verified_by: + verification_date: null + verified_by: null entity_claims: - claim_type: full_name claim_value: KODAIRASHICHUO Library OGAWABUNSHITSU @@ -151,3 +152,22 @@ location: geonames_id: 11611930 geonames_name: Kodaira feature_code: PPLA2 +logo_enrichment: + enrichment_timestamp: '2025-12-25T16:03:47.126513+00:00' + source_url: https://library.kodaira.ed.jp + extraction_method: crawl4ai + claims: + - claim_type: favicon_url + claim_value: https://library.kodaira.ed.jp/apple-touch-icon.png + source_url: https://library.kodaira.ed.jp + css_selector: '[document] > html > head > link:nth-of-type(12)' + retrieved_on: '2025-12-25T16:03:47.126513+00:00' + extraction_method: crawl4ai_link_rel + favicon_type: '' + favicon_sizes: 180x180 + summary: + total_claims: 1 + has_primary_logo: false + has_favicon: true + has_og_image: false + favicon_count: 3 diff --git a/data/custodian/JP-13-KOD-L-PUL.yaml b/data/custodian/JP-13-KOD-L-PUL.yaml index 0f5c1046c9..4c5d5fbae3 100644 --- a/data/custodian/JP-13-KOD-L-PUL.yaml +++ b/data/custodian/JP-13-KOD-L-PUL.yaml @@ -211,3 +211,30 @@ location: geonames_id: 11611930 geonames_name: Kodaira feature_code: PPLA2 +logo_enrichment: + enrichment_timestamp: '2025-12-25T16:03:54.322037+00:00' + source_url: https://www.uitec.jeed.go.jp/library/index.html + extraction_method: crawl4ai + claims: + - claim_type: logo_url + claim_value: https://www.uitec.jeed.go.jp/ka7cok0000000080/site_logo.jpg + source_url: https://www.uitec.jeed.go.jp/library/index.html + css_selector: '#h_logo > a > img' + retrieved_on: '2025-12-25T16:03:54.322037+00:00' + extraction_method: crawl4ai_header_logo + detection_confidence: high + alt_text: PTU 職業能力開発総合大学校 + - claim_type: favicon_url + claim_value: https://www.uitec.jeed.go.jp/favicon.ico + source_url: https://www.uitec.jeed.go.jp/library/index.html + css_selector: '[document] > html > head > link' + retrieved_on: '2025-12-25T16:03:54.322037+00:00' + extraction_method: crawl4ai_link_rel + favicon_type: '' + favicon_sizes: '' + summary: + total_claims: 2 + has_primary_logo: true + has_favicon: true + has_og_image: false + favicon_count: 1 diff --git a/data/custodian/JP-13-KOD-L-SGUCL.yaml b/data/custodian/JP-13-KOD-L-SGUCL.yaml index f9a9621e58..7330794ac3 100644 --- a/data/custodian/JP-13-KOD-L-SGUCL.yaml +++ b/data/custodian/JP-13-KOD-L-SGUCL.yaml @@ -220,3 +220,22 @@ location: geonames_id: 11611930 geonames_name: Kodaira feature_code: PPLA2 +logo_enrichment: + enrichment_timestamp: '2025-12-25T16:04:03.997111+00:00' + source_url: http://libwww.shiraume.ac.jp + extraction_method: crawl4ai + claims: + - claim_type: favicon_url + claim_value: http://libwww.shiraume.ac.jp/common/images/favicon.png + source_url: http://libwww.shiraume.ac.jp + css_selector: '[document] > html > head > link' + retrieved_on: '2025-12-25T16:04:03.997111+00:00' + extraction_method: crawl4ai_link_rel + favicon_type: image/png + favicon_sizes: '' + summary: + total_claims: 1 + has_primary_logo: false + has_favicon: true + has_og_image: false + favicon_count: 2 diff --git a/data/custodian/JP-13-KOD-M-FMS.yaml b/data/custodian/JP-13-KOD-M-FMS.yaml index d3896e2ce5..06ab3d9292 100644 --- a/data/custodian/JP-13-KOD-M-FMS.yaml +++ b/data/custodian/JP-13-KOD-M-FMS.yaml @@ -152,3 +152,22 @@ location: geonames_id: 11611930 geonames_name: Kodaira feature_code: PPLA2 +logo_enrichment: + enrichment_timestamp: '2025-12-25T16:04:19.518948+00:00' + source_url: https://www.city.kodaira.tokyo.jp/kids/017/017707.html + extraction_method: crawl4ai + claims: + - claim_type: favicon_url + claim_value: https://www.city.kodaira.tokyo.jp/favicon.ico + source_url: https://www.city.kodaira.tokyo.jp/kids/017/017707.html + css_selector: '[document] > html > head > link' + retrieved_on: '2025-12-25T16:04:19.518948+00:00' + extraction_method: crawl4ai_link_rel + favicon_type: '' + favicon_sizes: '' + summary: + total_claims: 1 + has_primary_logo: false + has_favicon: true + has_og_image: false + favicon_count: 1 diff --git a/data/custodian/JP-13-KOD-M-KHDAM.yaml b/data/custodian/JP-13-KOD-M-KHDAM.yaml index 58205672cd..e05f501690 100644 --- a/data/custodian/JP-13-KOD-M-KHDAM.yaml +++ b/data/custodian/JP-13-KOD-M-KHDAM.yaml @@ -43,13 +43,14 @@ ghcid: method: CH_ANNOTATOR_SOURCE ghcid_history: - ghcid: JP-13-KOD-M-KHDAM - valid_from: "2025-12-10T09:44:06Z" + valid_from: '2025-12-10T09:44:06Z' valid_to: null - reason: "Corrected region code from JP-TO (abbreviation) to JP-13 (Tokyo) per ISO 3166-2:JP" + reason: Corrected region code from JP-TO (abbreviation) to JP-13 (Tokyo) per ISO + 3166-2:JP - ghcid: JP-TO-KOD-M-KHDAM valid_from: null - valid_to: "2025-12-10T09:44:06Z" - reason: "Previous GHCID with incorrect region code" + valid_to: '2025-12-10T09:44:06Z' + reason: Previous GHCID with incorrect region code - ghcid: JP-TO-KOD-M-KHDAM ghcid_numeric: 16185805474471373481 valid_from: '2025-12-06T23:38:33.674065+00:00' @@ -108,8 +109,8 @@ ch_annotator: annotation_metadata: confidence_score: 0.98 verified: false - verification_date: - verified_by: + verification_date: null + verified_by: null entity_claims: - claim_type: full_name claim_value: KODAIRA HIRAKUSHI DENCHU ART MUSEUM @@ -280,3 +281,22 @@ location: postal_code: 187-0045 street_address: GAKUEN NISHIMACHI, Kodaira Shi, Tokyo To, 187-0045 normalization_timestamp: '2025-12-09T12:21:43.435196+00:00' +logo_enrichment: + enrichment_timestamp: '2025-12-25T16:04:36.845928+00:00' + source_url: https://www.city.kodaira.tokyo.jp/dencyu + extraction_method: crawl4ai + claims: + - claim_type: favicon_url + claim_value: https://www.city.kodaira.tokyo.jp/favicon.ico + source_url: https://www.city.kodaira.tokyo.jp/dencyu + css_selector: '[document] > html > head > link' + retrieved_on: '2025-12-25T16:04:36.845928+00:00' + extraction_method: crawl4ai_link_rel + favicon_type: '' + favicon_sizes: '' + summary: + total_claims: 1 + has_primary_logo: false + has_favicon: true + has_og_image: false + favicon_count: 1 diff --git a/data/custodian/JP-13-KOG-L-KLN.yaml b/data/custodian/JP-13-KOG-L-KLN.yaml index 293992638c..563d93f457 100644 --- a/data/custodian/JP-13-KOG-L-KLN.yaml +++ b/data/custodian/JP-13-KOG-L-KLN.yaml @@ -32,13 +32,14 @@ ghcid: method: CH_ANNOTATOR_SOURCE ghcid_history: - ghcid: JP-13-KOG-L-KLN - valid_from: "2025-12-10T09:44:06Z" + valid_from: '2025-12-10T09:44:06Z' valid_to: null - reason: "Corrected region code from JP-TO (abbreviation) to JP-13 (Tokyo) per ISO 3166-2:JP" + reason: Corrected region code from JP-TO (abbreviation) to JP-13 (Tokyo) per ISO + 3166-2:JP - ghcid: JP-TO-KOG-L-KLN valid_from: null - valid_to: "2025-12-10T09:44:06Z" - reason: "Previous GHCID with incorrect region code" + valid_to: '2025-12-10T09:44:06Z' + reason: Previous GHCID with incorrect region code - ghcid: JP-TO-KOG-L-KLN ghcid_numeric: 13188409437596425627 valid_from: '2025-12-06T23:38:52.603994+00:00' @@ -96,8 +97,8 @@ ch_annotator: annotation_metadata: confidence_score: 0.98 verified: false - verification_date: - verified_by: + verification_date: null + verified_by: null entity_claims: - claim_type: full_name claim_value: KOGANEISHIRITSU Library NUKUIKITABUNSHITSU @@ -151,3 +152,22 @@ location: geonames_id: 11612579 geonames_name: Koganei feature_code: PPLA2 +logo_enrichment: + enrichment_timestamp: '2025-12-25T16:40:53.498398+00:00' + source_url: http://www.ntk-koganei.org/library/index.php + extraction_method: crawl4ai + claims: + - claim_type: logo_url + claim_value: http://www.ntk-koganei.org/images/top_logo.png + source_url: http://www.ntk-koganei.org/library/index.php + css_selector: '#wrap_header > a > img.logo' + retrieved_on: '2025-12-25T16:40:53.498398+00:00' + extraction_method: crawl4ai_header_logo + detection_confidence: high + alt_text: '' + summary: + total_claims: 1 + has_primary_logo: true + has_favicon: false + has_og_image: false + favicon_count: 0 diff --git a/data/custodian/JP-13-KOG-L-TGUL.yaml b/data/custodian/JP-13-KOG-L-TGUL.yaml index 9f8f3313d7..853a27a73d 100644 --- a/data/custodian/JP-13-KOG-L-TGUL.yaml +++ b/data/custodian/JP-13-KOG-L-TGUL.yaml @@ -226,3 +226,28 @@ location: postal_code: 184-8501 street_address: 4-1-1 NIKUIKITAMACHI, Koganei Shi, Tokyo To, 184-8501 normalization_timestamp: '2025-12-09T12:21:43.868583+00:00' +logo_enrichment: + enrichment_timestamp: '2025-12-25T16:41:06.900395+00:00' + source_url: http://library.u-gakugei.ac.jp + extraction_method: crawl4ai + claims: + - claim_type: favicon_url + claim_value: http://library.u-gakugei.ac.jp/themes/custom/ugakugei/favicon.ico + source_url: http://library.u-gakugei.ac.jp + css_selector: '[document] > html > head > link:nth-of-type(3)' + retrieved_on: '2025-12-25T16:41:06.900395+00:00' + extraction_method: crawl4ai_link_rel + favicon_type: image/vnd.microsoft.icon + favicon_sizes: '' + - claim_type: og_image_url + claim_value: https://lib.u-gakugei.ac.jp/sites/default/files/2021-03/library_0.jpg + source_url: http://library.u-gakugei.ac.jp + css_selector: '[document] > html > head > meta:nth-of-type(5)' + retrieved_on: '2025-12-25T16:41:06.900395+00:00' + extraction_method: crawl4ai_meta_og + summary: + total_claims: 2 + has_primary_logo: false + has_favicon: true + has_og_image: true + favicon_count: 1 diff --git a/data/custodian/JP-13-KOG-M-NIICT.yaml b/data/custodian/JP-13-KOG-M-NIICT.yaml index 8117e2c109..8c45660021 100644 --- a/data/custodian/JP-13-KOG-M-NIICT.yaml +++ b/data/custodian/JP-13-KOG-M-NIICT.yaml @@ -152,3 +152,20 @@ location: geonames_id: 11612579 geonames_name: Koganei feature_code: PPLA2 +logo_enrichment: + enrichment_timestamp: '2025-12-25T16:41:35.362205+00:00' + source_url: https://www.nict.go.jp/index.html + extraction_method: crawl4ai + claims: + - claim_type: og_image_url + claim_value: https://www.nict.go.jp/common/prefs/ttlnv90000000fbt-img/nict-logo-new2.png + source_url: https://www.nict.go.jp/index.html + css_selector: '[document] > html > head > meta:nth-of-type(5)' + retrieved_on: '2025-12-25T16:41:35.362205+00:00' + extraction_method: crawl4ai_meta_og + summary: + total_claims: 1 + has_primary_logo: false + has_favicon: false + has_og_image: true + favicon_count: 0 diff --git a/data/custodian/JP-13-KOG-M-NSMTUAT.yaml b/data/custodian/JP-13-KOG-M-NSMTUAT.yaml index 700e89a685..f86be1086a 100644 --- a/data/custodian/JP-13-KOG-M-NSMTUAT.yaml +++ b/data/custodian/JP-13-KOG-M-NSMTUAT.yaml @@ -248,3 +248,22 @@ location: postal_code: 184-8588 street_address: NAKACHO, Koganei Shi, Tokyo To, 184-8588 normalization_timestamp: '2025-12-09T12:21:43.997636+00:00' +logo_enrichment: + enrichment_timestamp: '2025-12-25T16:41:47.329322+00:00' + source_url: https://www.tuat-museum.org + extraction_method: crawl4ai + claims: + - claim_type: favicon_url + claim_value: https://www.tuat-museum.org/wp-content/uploads/2018/02/博物館ロゴ.png + source_url: https://www.tuat-museum.org + css_selector: '[document] > html > head > link:nth-of-type(44)' + retrieved_on: '2025-12-25T16:41:47.329322+00:00' + extraction_method: crawl4ai_link_rel + favicon_type: '' + favicon_sizes: 192x192 + summary: + total_claims: 1 + has_primary_logo: false + has_favicon: true + has_og_image: false + favicon_count: 2 diff --git a/data/custodian/JP-13-KOK-L-KCHL-kokubunji_city_honda_library.yaml b/data/custodian/JP-13-KOK-L-KCHL-kokubunji_city_honda_library.yaml index e4750796a0..471e6ccee7 100644 --- a/data/custodian/JP-13-KOK-L-KCHL-kokubunji_city_honda_library.yaml +++ b/data/custodian/JP-13-KOK-L-KCHL-kokubunji_city_honda_library.yaml @@ -32,13 +32,14 @@ ghcid: method: CH_ANNOTATOR_SOURCE ghcid_history: - ghcid: JP-13-KOK-L-KCHL-kokubunji_city_honda_library - valid_from: "2025-12-10T09:44:06Z" + valid_from: '2025-12-10T09:44:06Z' valid_to: null - reason: "Corrected region code from JP-TO (abbreviation) to JP-13 (Tokyo) per ISO 3166-2:JP" + reason: Corrected region code from JP-TO (abbreviation) to JP-13 (Tokyo) per ISO + 3166-2:JP - ghcid: JP-TO-KOK-L-KCHL-kokubunji_city_honda_library valid_from: null - valid_to: "2025-12-10T09:44:06Z" - reason: "Previous GHCID with incorrect region code" + valid_to: '2025-12-10T09:44:06Z' + reason: Previous GHCID with incorrect region code - ghcid: JP-TO-KOK-L-KCHL-kokubunji_city_honda_library ghcid_numeric: 10547591598549746354 valid_from: '2025-12-06T23:38:43.847942+00:00' @@ -96,8 +97,8 @@ ch_annotator: annotation_metadata: confidence_score: 0.98 verified: false - verification_date: - verified_by: + verification_date: null + verified_by: null entity_claims: - claim_type: full_name claim_value: Kokubunji City Honda Library @@ -151,3 +152,22 @@ location: geonames_id: 1858964 geonames_name: Kokubunji feature_code: PPLA2 +logo_enrichment: + enrichment_timestamp: '2025-12-25T16:41:58.083612+00:00' + source_url: https://library.kokubunji.ed.jp/k122_lib01_honda.html + extraction_method: crawl4ai + claims: + - claim_type: logo_url + claim_value: https://library.kokubunji.ed.jp/img/common/logo.jpg + source_url: https://library.kokubunji.ed.jp/k122_lib01_honda.html + css_selector: '#wrap > div.page_header > header > h1 > a > img' + retrieved_on: '2025-12-25T16:41:58.083612+00:00' + extraction_method: crawl4ai_header_logo + detection_confidence: high + alt_text: 国分寺市図書館 + summary: + total_claims: 1 + has_primary_logo: true + has_favicon: false + has_og_image: false + favicon_count: 0 diff --git a/data/custodian/JP-13-KOK-L-KCHL.yaml b/data/custodian/JP-13-KOK-L-KCHL.yaml index 274224987e..147f3d30e1 100644 --- a/data/custodian/JP-13-KOK-L-KCHL.yaml +++ b/data/custodian/JP-13-KOK-L-KCHL.yaml @@ -152,3 +152,22 @@ location: geonames_id: 1858964 geonames_name: Kokubunji feature_code: PPLA2 +logo_enrichment: + enrichment_timestamp: '2025-12-25T16:42:05.306712+00:00' + source_url: https://library.kokubunji.ed.jp/k122_lib03_hikari.html + extraction_method: crawl4ai + claims: + - claim_type: logo_url + claim_value: https://library.kokubunji.ed.jp/img/common/logo.jpg + source_url: https://library.kokubunji.ed.jp/k122_lib03_hikari.html + css_selector: '#wrap > div.page_header > header > h1 > a > img' + retrieved_on: '2025-12-25T16:42:05.306712+00:00' + extraction_method: crawl4ai_header_logo + detection_confidence: high + alt_text: 国分寺市図書館 + summary: + total_claims: 1 + has_primary_logo: true + has_favicon: false + has_og_image: false + favicon_count: 0 diff --git a/data/custodian/JP-13-KOK-L-KCHLSB.yaml b/data/custodian/JP-13-KOK-L-KCHLSB.yaml index 7ccd84808e..4be9a39164 100644 --- a/data/custodian/JP-13-KOK-L-KCHLSB.yaml +++ b/data/custodian/JP-13-KOK-L-KCHLSB.yaml @@ -32,13 +32,14 @@ ghcid: method: CH_ANNOTATOR_SOURCE ghcid_history: - ghcid: JP-13-KOK-L-KCHLSB - valid_from: "2025-12-10T09:44:06Z" + valid_from: '2025-12-10T09:44:06Z' valid_to: null - reason: "Corrected region code from JP-TO (abbreviation) to JP-13 (Tokyo) per ISO 3166-2:JP" + reason: Corrected region code from JP-TO (abbreviation) to JP-13 (Tokyo) per ISO + 3166-2:JP - ghcid: JP-TO-KOK-L-KCHLSB valid_from: null - valid_to: "2025-12-10T09:44:06Z" - reason: "Previous GHCID with incorrect region code" + valid_to: '2025-12-10T09:44:06Z' + reason: Previous GHCID with incorrect region code - ghcid: JP-TO-KOK-L-KCHLSB ghcid_numeric: 9278579973066084118 valid_from: '2025-12-06T23:38:43.854827+00:00' @@ -96,8 +97,8 @@ ch_annotator: annotation_metadata: confidence_score: 0.98 verified: false - verification_date: - verified_by: + verification_date: null + verified_by: null entity_claims: - claim_type: full_name claim_value: Kokubunji City Honda Library Shiyakusho Branch @@ -151,3 +152,22 @@ location: geonames_id: 1858964 geonames_name: Kokubunji feature_code: PPLA2 +logo_enrichment: + enrichment_timestamp: '2025-12-25T16:42:12.002038+00:00' + source_url: https://library.kokubunji.ed.jp/k122_lib06_eki.html + extraction_method: crawl4ai + claims: + - claim_type: logo_url + claim_value: https://library.kokubunji.ed.jp/img/common/logo.jpg + source_url: https://library.kokubunji.ed.jp/k122_lib06_eki.html + css_selector: '#wrap > div.page_header > header > h1 > a > img' + retrieved_on: '2025-12-25T16:42:12.002038+00:00' + extraction_method: crawl4ai_header_logo + detection_confidence: high + alt_text: 国分寺市図書館 + summary: + total_claims: 1 + has_primary_logo: true + has_favicon: false + has_og_image: false + favicon_count: 0 diff --git a/data/custodian/JP-13-KOK-L-KCKL.yaml b/data/custodian/JP-13-KOK-L-KCKL.yaml index 31bdfcea44..9990b05899 100644 --- a/data/custodian/JP-13-KOK-L-KCKL.yaml +++ b/data/custodian/JP-13-KOK-L-KCKL.yaml @@ -32,13 +32,14 @@ ghcid: method: CH_ANNOTATOR_SOURCE ghcid_history: - ghcid: JP-13-KOK-L-KCKL - valid_from: "2025-12-10T09:44:07Z" + valid_from: '2025-12-10T09:44:07Z' valid_to: null - reason: "Corrected region code from JP-TO (abbreviation) to JP-13 (Tokyo) per ISO 3166-2:JP" + reason: Corrected region code from JP-TO (abbreviation) to JP-13 (Tokyo) per ISO + 3166-2:JP - ghcid: JP-TO-KOK-L-KCKL valid_from: null - valid_to: "2025-12-10T09:44:07Z" - reason: "Previous GHCID with incorrect region code" + valid_to: '2025-12-10T09:44:07Z' + reason: Previous GHCID with incorrect region code - ghcid: JP-TO-KOK-L-KCKL ghcid_numeric: 1494142876010525296 valid_from: '2025-12-06T23:38:43.843216+00:00' @@ -96,8 +97,8 @@ ch_annotator: annotation_metadata: confidence_score: 0.98 verified: false - verification_date: - verified_by: + verification_date: null + verified_by: null entity_claims: - claim_type: full_name claim_value: Kokubunji City Koigakubo Library @@ -151,3 +152,22 @@ location: geonames_id: 1858964 geonames_name: Kokubunji feature_code: PPLA2 +logo_enrichment: + enrichment_timestamp: '2025-12-25T16:42:18.675931+00:00' + source_url: https://library.kokubunji.ed.jp/k122_lib02_koi.html + extraction_method: crawl4ai + claims: + - claim_type: logo_url + claim_value: https://library.kokubunji.ed.jp/img/common/logo.jpg + source_url: https://library.kokubunji.ed.jp/k122_lib02_koi.html + css_selector: '#wrap > div.page_header > header > h1 > a > img' + retrieved_on: '2025-12-25T16:42:18.675931+00:00' + extraction_method: crawl4ai_header_logo + detection_confidence: high + alt_text: 国分寺市図書館 + summary: + total_claims: 1 + has_primary_logo: true + has_favicon: false + has_og_image: false + favicon_count: 0 diff --git a/data/custodian/JP-13-KOK-L-KCML.yaml b/data/custodian/JP-13-KOK-L-KCML.yaml index 7bf1a20c70..a07f2db00a 100644 --- a/data/custodian/JP-13-KOK-L-KCML.yaml +++ b/data/custodian/JP-13-KOK-L-KCML.yaml @@ -32,13 +32,14 @@ ghcid: method: CH_ANNOTATOR_SOURCE ghcid_history: - ghcid: JP-13-KOK-L-KCML - valid_from: "2025-12-10T09:44:07Z" + valid_from: '2025-12-10T09:44:07Z' valid_to: null - reason: "Corrected region code from JP-TO (abbreviation) to JP-13 (Tokyo) per ISO 3166-2:JP" + reason: Corrected region code from JP-TO (abbreviation) to JP-13 (Tokyo) per ISO + 3166-2:JP - ghcid: JP-TO-KOK-L-KCML valid_from: null - valid_to: "2025-12-10T09:44:07Z" - reason: "Previous GHCID with incorrect region code" + valid_to: '2025-12-10T09:44:07Z' + reason: Previous GHCID with incorrect region code - ghcid: JP-TO-KOK-L-KCML ghcid_numeric: 8397318435142022694 valid_from: '2025-12-06T23:38:43.850217+00:00' @@ -96,8 +97,8 @@ ch_annotator: annotation_metadata: confidence_score: 0.98 verified: false - verification_date: - verified_by: + verification_date: null + verified_by: null entity_claims: - claim_type: full_name claim_value: Kokubunji City Motomachi Library @@ -151,3 +152,22 @@ location: geonames_id: 1858964 geonames_name: Kokubunji feature_code: PPLA2 +logo_enrichment: + enrichment_timestamp: '2025-12-25T16:42:25.298122+00:00' + source_url: https://library.kokubunji.ed.jp/k122_lib04_moto.html + extraction_method: crawl4ai + claims: + - claim_type: logo_url + claim_value: https://library.kokubunji.ed.jp/img/common/logo.jpg + source_url: https://library.kokubunji.ed.jp/k122_lib04_moto.html + css_selector: '#wrap > div.page_header > header > h1 > a > img' + retrieved_on: '2025-12-25T16:42:25.298122+00:00' + extraction_method: crawl4ai_header_logo + detection_confidence: high + alt_text: 国分寺市図書館 + summary: + total_claims: 1 + has_primary_logo: true + has_favicon: false + has_og_image: false + favicon_count: 0 diff --git a/data/custodian/JP-13-KOK-L-KCNL.yaml b/data/custodian/JP-13-KOK-L-KCNL.yaml index 8fdff4c423..192f8e2d93 100644 --- a/data/custodian/JP-13-KOK-L-KCNL.yaml +++ b/data/custodian/JP-13-KOK-L-KCNL.yaml @@ -152,3 +152,22 @@ location: geonames_id: 1858964 geonames_name: Kokubunji feature_code: PPLA2 +logo_enrichment: + enrichment_timestamp: '2025-12-25T16:42:31.884230+00:00' + source_url: https://library.kokubunji.ed.jp/k122_lib05_nami.html + extraction_method: crawl4ai + claims: + - claim_type: logo_url + claim_value: https://library.kokubunji.ed.jp/img/common/logo.jpg + source_url: https://library.kokubunji.ed.jp/k122_lib05_nami.html + css_selector: '#wrap > div.page_header > header > h1 > a > img' + retrieved_on: '2025-12-25T16:42:31.884230+00:00' + extraction_method: crawl4ai_header_logo + detection_confidence: high + alt_text: 国分寺市図書館 + summary: + total_claims: 1 + has_primary_logo: true + has_favicon: false + has_og_image: false + favicon_count: 0 diff --git a/data/custodian/JP-13-KOK-L-TKUL.yaml b/data/custodian/JP-13-KOK-L-TKUL.yaml index 82e61f9b9c..bf6f89ccd4 100644 --- a/data/custodian/JP-13-KOK-L-TKUL.yaml +++ b/data/custodian/JP-13-KOK-L-TKUL.yaml @@ -214,3 +214,22 @@ location: geonames_id: 1858964 geonames_name: Kokubunji feature_code: PPLA2 +logo_enrichment: + enrichment_timestamp: '2025-12-25T16:42:41.360222+00:00' + source_url: http://www.tku.ac.jp/library + extraction_method: crawl4ai + claims: + - claim_type: favicon_url + claim_value: https://www.tku.ac.jp/upload/media/images/apple-touch-icon.png + source_url: http://www.tku.ac.jp/library + css_selector: '[document] > html > head > link:nth-of-type(3)' + retrieved_on: '2025-12-25T16:42:41.360222+00:00' + extraction_method: crawl4ai_link_rel + favicon_type: '' + favicon_sizes: 180x180 + summary: + total_claims: 1 + has_primary_logo: false + has_favicon: true + has_og_image: false + favicon_count: 2 diff --git a/data/custodian/JP-13-KOK-L-TMTL.yaml b/data/custodian/JP-13-KOK-L-TMTL.yaml index 8a5011f8cd..d8d4d67ae8 100644 --- a/data/custodian/JP-13-KOK-L-TMTL.yaml +++ b/data/custodian/JP-13-KOK-L-TMTL.yaml @@ -273,3 +273,36 @@ location: postal_code: 185-8520 street_address: 2-2-26 IZUMICHO, Kokubunjishi, Tokyo To, 185-8520 normalization_timestamp: '2025-12-09T12:21:44.402367+00:00' +logo_enrichment: + enrichment_timestamp: '2025-12-25T16:42:49.879089+00:00' + source_url: https://www.library.metro.tokyo.lg.jp + extraction_method: crawl4ai + claims: + - claim_type: logo_url + claim_value: https://www.library.metro.tokyo.lg.jp/common/img/logo.png + source_url: https://www.library.metro.tokyo.lg.jp + css_selector: '#header > div.header__body > div.header__left > h1.logo > a > img' + retrieved_on: '2025-12-25T16:42:49.879089+00:00' + extraction_method: crawl4ai_header_logo + detection_confidence: high + alt_text: 東京都立図書館 + - claim_type: favicon_url + claim_value: https://www.library.metro.tokyo.lg.jp/common/img/favicon/favicon.ico + source_url: https://www.library.metro.tokyo.lg.jp + css_selector: '[document] > html.js.flexbox > head > link' + retrieved_on: '2025-12-25T16:42:49.879089+00:00' + extraction_method: crawl4ai_link_rel + favicon_type: image/vnd.microsoft.icon + favicon_sizes: '' + - claim_type: og_image_url + claim_value: https://www.library.metro.tokyo.lg.jp/common/img/ogp.png + source_url: https://www.library.metro.tokyo.lg.jp + css_selector: '[document] > html.js.flexbox > head > meta:nth-of-type(9)' + retrieved_on: '2025-12-25T16:42:49.879089+00:00' + extraction_method: crawl4ai_meta_og + summary: + total_claims: 3 + has_primary_logo: true + has_favicon: true + has_og_image: true + favicon_count: 1 diff --git a/data/custodian/JP-13-KOK-M-KCMCA.yaml b/data/custodian/JP-13-KOK-M-KCMCA.yaml index aa16b66db7..06cef67d18 100644 --- a/data/custodian/JP-13-KOK-M-KCMCA.yaml +++ b/data/custodian/JP-13-KOK-M-KCMCA.yaml @@ -32,13 +32,14 @@ ghcid: method: CH_ANNOTATOR_SOURCE ghcid_history: - ghcid: JP-13-KOK-M-KCMCA - valid_from: "2025-12-10T09:44:07Z" + valid_from: '2025-12-10T09:44:07Z' valid_to: null - reason: "Corrected region code from JP-TO (abbreviation) to JP-13 (Tokyo) per ISO 3166-2:JP" + reason: Corrected region code from JP-TO (abbreviation) to JP-13 (Tokyo) per ISO + 3166-2:JP - ghcid: JP-TO-KOK-M-KCMCA valid_from: null - valid_to: "2025-12-10T09:44:07Z" - reason: "Previous GHCID with incorrect region code" + valid_to: '2025-12-10T09:44:07Z' + reason: Previous GHCID with incorrect region code - ghcid: JP-TO-KOK-M-KCMCA ghcid_numeric: 10169754226880234912 valid_from: '2025-12-06T23:38:33.694283+00:00' @@ -96,8 +97,8 @@ ch_annotator: annotation_metadata: confidence_score: 0.98 verified: false - verification_date: - verified_by: + verification_date: null + verified_by: null entity_claims: - claim_type: full_name claim_value: KOKUBUNJI CITY MUSEUM OF CULTURAL ARTIFACTS @@ -151,3 +152,30 @@ location: geonames_id: 1858964 geonames_name: Kokubunji feature_code: PPLA2 +logo_enrichment: + enrichment_timestamp: '2025-12-25T16:42:58.508404+00:00' + source_url: https://www.city.kokubunji.tokyo.jp/shisetsu/kouen/1005196/1004249.html + extraction_method: crawl4ai + claims: + - claim_type: logo_url + claim_value: https://www.city.kokubunji.tokyo.jp/shisetsu/kouen/1005196/_template_/_site_/_default_/_res/design/images/header/tlogo_top.png + source_url: https://www.city.kokubunji.tokyo.jp/shisetsu/kouen/1005196/1004249.html + css_selector: '#tlogo > h1 > a > img' + retrieved_on: '2025-12-25T16:42:58.508404+00:00' + extraction_method: crawl4ai_header_logo + detection_confidence: high + alt_text: '' + - claim_type: favicon_url + claim_value: https://www.city.kokubunji.tokyo.jp/shisetsu/kouen/1005196/_template_/_site_/_default_/_res/images/apple-touch-icon-precomposed.png + source_url: https://www.city.kokubunji.tokyo.jp/shisetsu/kouen/1005196/1004249.html + css_selector: '[document] > html > head > link:nth-of-type(6)' + retrieved_on: '2025-12-25T16:42:58.508404+00:00' + extraction_method: crawl4ai_link_rel + favicon_type: '' + favicon_sizes: '' + summary: + total_claims: 2 + has_primary_logo: true + has_favicon: true + has_og_image: false + favicon_count: 2 diff --git a/data/custodian/JP-13-KOK-M-MKTRM.yaml b/data/custodian/JP-13-KOK-M-MKTRM.yaml index c1885efacd..3f5ee1de85 100644 --- a/data/custodian/JP-13-KOK-M-MKTRM.yaml +++ b/data/custodian/JP-13-KOK-M-MKTRM.yaml @@ -39,13 +39,14 @@ ghcid: method: CH_ANNOTATOR_SOURCE ghcid_history: - ghcid: JP-13-KOK-M-MKTRM - valid_from: "2025-12-10T09:44:07Z" + valid_from: '2025-12-10T09:44:07Z' valid_to: null - reason: "Corrected region code from JP-TO (abbreviation) to JP-13 (Tokyo) per ISO 3166-2:JP" + reason: Corrected region code from JP-TO (abbreviation) to JP-13 (Tokyo) per ISO + 3166-2:JP - ghcid: JP-TO-KOK-M-MKTRM valid_from: null - valid_to: "2025-12-10T09:44:07Z" - reason: "Previous GHCID with incorrect region code" + valid_to: '2025-12-10T09:44:07Z' + reason: Previous GHCID with incorrect region code - ghcid: JP-TO-KOK-M-MKTRM ghcid_numeric: 4259716374294007326 valid_from: '2025-12-06T23:38:33.699122+00:00' @@ -103,8 +104,8 @@ ch_annotator: annotation_metadata: confidence_score: 0.98 verified: false - verification_date: - verified_by: + verification_date: null + verified_by: null entity_claims: - claim_type: full_name claim_value: MUSASHI KOKUBUNJI TEMPLE REMAINS MUSEUM @@ -234,3 +235,30 @@ location: postal_code: 185-0023 street_address: NISHIMOTOMACHI, Kokubunji Shi, Tokyo To, 185-0023 normalization_timestamp: '2025-12-09T12:21:44.494683+00:00' +logo_enrichment: + enrichment_timestamp: '2025-12-25T16:43:05.921785+00:00' + source_url: https://www.city.kokubunji.tokyo.jp/shisetsu/kouen/1005196/1004239.html + extraction_method: crawl4ai + claims: + - claim_type: logo_url + claim_value: https://www.city.kokubunji.tokyo.jp/shisetsu/kouen/1005196/_template_/_site_/_default_/_res/design/images/header/tlogo_top.png + source_url: https://www.city.kokubunji.tokyo.jp/shisetsu/kouen/1005196/1004239.html + css_selector: '#tlogo > h1 > a > img' + retrieved_on: '2025-12-25T16:43:05.921785+00:00' + extraction_method: crawl4ai_header_logo + detection_confidence: high + alt_text: '' + - claim_type: favicon_url + claim_value: https://www.city.kokubunji.tokyo.jp/shisetsu/kouen/1005196/_template_/_site_/_default_/_res/images/apple-touch-icon-precomposed.png + source_url: https://www.city.kokubunji.tokyo.jp/shisetsu/kouen/1005196/1004239.html + css_selector: '[document] > html > head > link:nth-of-type(6)' + retrieved_on: '2025-12-25T16:43:05.921785+00:00' + extraction_method: crawl4ai_link_rel + favicon_type: '' + favicon_sizes: '' + summary: + total_claims: 2 + has_primary_logo: true + has_favicon: true + has_og_image: false + favicon_count: 2 diff --git a/data/custodian/JP-13-KOM-L-K-komaeshiiwadochiikisentatoshoshitsu.yaml b/data/custodian/JP-13-KOM-L-K-komaeshiiwadochiikisentatoshoshitsu.yaml index f23a0bd047..cea5688bec 100644 --- a/data/custodian/JP-13-KOM-L-K-komaeshiiwadochiikisentatoshoshitsu.yaml +++ b/data/custodian/JP-13-KOM-L-K-komaeshiiwadochiikisentatoshoshitsu.yaml @@ -32,13 +32,14 @@ ghcid: method: CH_ANNOTATOR_SOURCE ghcid_history: - ghcid: JP-13-KOM-L-K-komaeshiiwadochiikisentatoshoshitsu - valid_from: "2025-12-10T09:44:07Z" + valid_from: '2025-12-10T09:44:07Z' valid_to: null - reason: "Corrected region code from JP-TO (abbreviation) to JP-13 (Tokyo) per ISO 3166-2:JP" + reason: Corrected region code from JP-TO (abbreviation) to JP-13 (Tokyo) per ISO + 3166-2:JP - ghcid: JP-TO-KOM-L-K-komaeshiiwadochiikisentatoshoshitsu valid_from: null - valid_to: "2025-12-10T09:44:07Z" - reason: "Previous GHCID with incorrect region code" + valid_to: '2025-12-10T09:44:07Z' + reason: Previous GHCID with incorrect region code - ghcid: JP-TO-KOM-L-K-komaeshiiwadochiikisentatoshoshitsu ghcid_numeric: 17569305807227041179 valid_from: '2025-12-06T23:38:49.235556+00:00' @@ -96,8 +97,8 @@ ch_annotator: annotation_metadata: confidence_score: 0.98 verified: false - verification_date: - verified_by: + verification_date: null + verified_by: null entity_claims: - claim_type: full_name claim_value: KOMAESHIIWADOCHIIKISENTATOSHOSHITSU @@ -153,3 +154,22 @@ location: geonames_id: 11612580 geonames_name: Komae feature_code: PPLA2 +logo_enrichment: + enrichment_timestamp: '2025-12-25T16:43:13.301974+00:00' + source_url: https://www.library.komae.tokyo.jp/facility + extraction_method: crawl4ai + claims: + - claim_type: favicon_url + claim_value: https://www.library.komae.tokyo.jp/site/wp-content/uploads/2021/01/cropped-komae_city_logo_img-180x180.png + source_url: https://www.library.komae.tokyo.jp/facility + css_selector: '[document] > html > head > link:nth-of-type(28)' + retrieved_on: '2025-12-25T16:43:13.301974+00:00' + extraction_method: crawl4ai_link_rel + favicon_type: '' + favicon_sizes: '' + summary: + total_claims: 1 + has_primary_logo: false + has_favicon: true + has_og_image: false + favicon_count: 3 diff --git a/data/custodian/JP-13-KOM-L-K-komaeshikamiizumichiikisentatoshoshitsu.yaml b/data/custodian/JP-13-KOM-L-K-komaeshikamiizumichiikisentatoshoshitsu.yaml index d41367d97b..573dc19042 100644 --- a/data/custodian/JP-13-KOM-L-K-komaeshikamiizumichiikisentatoshoshitsu.yaml +++ b/data/custodian/JP-13-KOM-L-K-komaeshikamiizumichiikisentatoshoshitsu.yaml @@ -32,13 +32,14 @@ ghcid: method: CH_ANNOTATOR_SOURCE ghcid_history: - ghcid: JP-13-KOM-L-K-komaeshikamiizumichiikisentatoshoshitsu - valid_from: "2025-12-10T09:44:07Z" + valid_from: '2025-12-10T09:44:07Z' valid_to: null - reason: "Corrected region code from JP-TO (abbreviation) to JP-13 (Tokyo) per ISO 3166-2:JP" + reason: Corrected region code from JP-TO (abbreviation) to JP-13 (Tokyo) per ISO + 3166-2:JP - ghcid: JP-TO-KOM-L-K-komaeshikamiizumichiikisentatoshoshitsu valid_from: null - valid_to: "2025-12-10T09:44:07Z" - reason: "Previous GHCID with incorrect region code" + valid_to: '2025-12-10T09:44:07Z' + reason: Previous GHCID with incorrect region code - ghcid: JP-TO-KOM-L-K-komaeshikamiizumichiikisentatoshoshitsu ghcid_numeric: 1330790090514783224 valid_from: '2025-12-06T23:38:49.233202+00:00' @@ -96,8 +97,8 @@ ch_annotator: annotation_metadata: confidence_score: 0.98 verified: false - verification_date: - verified_by: + verification_date: null + verified_by: null entity_claims: - claim_type: full_name claim_value: KOMAESHIKAMIIZUMICHIIKISENTATOSHOSHITSU @@ -151,3 +152,22 @@ location: geonames_id: 11612580 geonames_name: Komae feature_code: PPLA2 +logo_enrichment: + enrichment_timestamp: '2025-12-25T16:43:21.702537+00:00' + source_url: https://www.library.komae.tokyo.jp/facility + extraction_method: crawl4ai + claims: + - claim_type: favicon_url + claim_value: https://www.library.komae.tokyo.jp/site/wp-content/uploads/2021/01/cropped-komae_city_logo_img-180x180.png + source_url: https://www.library.komae.tokyo.jp/facility + css_selector: '[document] > html > head > link:nth-of-type(28)' + retrieved_on: '2025-12-25T16:43:21.702537+00:00' + extraction_method: crawl4ai_link_rel + favicon_type: '' + favicon_sizes: '' + summary: + total_claims: 1 + has_primary_logo: false + has_favicon: true + has_og_image: false + favicon_count: 3 diff --git a/data/custodian/JP-13-KOM-L-K-komaeshinambuchiikisentatoshoshitsu.yaml b/data/custodian/JP-13-KOM-L-K-komaeshinambuchiikisentatoshoshitsu.yaml index a9632ffd32..1e766eabaa 100644 --- a/data/custodian/JP-13-KOM-L-K-komaeshinambuchiikisentatoshoshitsu.yaml +++ b/data/custodian/JP-13-KOM-L-K-komaeshinambuchiikisentatoshoshitsu.yaml @@ -32,13 +32,14 @@ ghcid: method: CH_ANNOTATOR_SOURCE ghcid_history: - ghcid: JP-13-KOM-L-K-komaeshinambuchiikisentatoshoshitsu - valid_from: "2025-12-10T09:44:07Z" + valid_from: '2025-12-10T09:44:07Z' valid_to: null - reason: "Corrected region code from JP-TO (abbreviation) to JP-13 (Tokyo) per ISO 3166-2:JP" + reason: Corrected region code from JP-TO (abbreviation) to JP-13 (Tokyo) per ISO + 3166-2:JP - ghcid: JP-TO-KOM-L-K-komaeshinambuchiikisentatoshoshitsu valid_from: null - valid_to: "2025-12-10T09:44:07Z" - reason: "Previous GHCID with incorrect region code" + valid_to: '2025-12-10T09:44:07Z' + reason: Previous GHCID with incorrect region code - ghcid: JP-TO-KOM-L-K-komaeshinambuchiikisentatoshoshitsu ghcid_numeric: 9861191860028281868 valid_from: '2025-12-06T23:38:49.238011+00:00' @@ -96,8 +97,8 @@ ch_annotator: annotation_metadata: confidence_score: 0.98 verified: false - verification_date: - verified_by: + verification_date: null + verified_by: null entity_claims: - claim_type: full_name claim_value: KOMAESHINAMBUCHIIKISENTATOSHOSHITSU @@ -151,3 +152,22 @@ location: geonames_id: 11612580 geonames_name: Komae feature_code: PPLA2 +logo_enrichment: + enrichment_timestamp: '2025-12-25T16:43:30.617634+00:00' + source_url: https://www.library.komae.tokyo.jp/facility + extraction_method: crawl4ai + claims: + - claim_type: favicon_url + claim_value: https://www.library.komae.tokyo.jp/site/wp-content/uploads/2021/01/cropped-komae_city_logo_img-180x180.png + source_url: https://www.library.komae.tokyo.jp/facility + css_selector: '[document] > html > head > link:nth-of-type(28)' + retrieved_on: '2025-12-25T16:43:30.617634+00:00' + extraction_method: crawl4ai_link_rel + favicon_type: '' + favicon_sizes: '' + summary: + total_claims: 1 + has_primary_logo: false + has_favicon: true + has_og_image: false + favicon_count: 3 diff --git a/data/custodian/JP-13-KOM-L-K-komaeshinogawachiikisentatoshoshitsu.yaml b/data/custodian/JP-13-KOM-L-K-komaeshinogawachiikisentatoshoshitsu.yaml index 5573b0c4b1..175d430122 100644 --- a/data/custodian/JP-13-KOM-L-K-komaeshinogawachiikisentatoshoshitsu.yaml +++ b/data/custodian/JP-13-KOM-L-K-komaeshinogawachiikisentatoshoshitsu.yaml @@ -32,13 +32,14 @@ ghcid: method: CH_ANNOTATOR_SOURCE ghcid_history: - ghcid: JP-13-KOM-L-K-komaeshinogawachiikisentatoshoshitsu - valid_from: "2025-12-10T09:44:07Z" + valid_from: '2025-12-10T09:44:07Z' valid_to: null - reason: "Corrected region code from JP-TO (abbreviation) to JP-13 (Tokyo) per ISO 3166-2:JP" + reason: Corrected region code from JP-TO (abbreviation) to JP-13 (Tokyo) per ISO + 3166-2:JP - ghcid: JP-TO-KOM-L-K-komaeshinogawachiikisentatoshoshitsu valid_from: null - valid_to: "2025-12-10T09:44:07Z" - reason: "Previous GHCID with incorrect region code" + valid_to: '2025-12-10T09:44:07Z' + reason: Previous GHCID with incorrect region code - ghcid: JP-TO-KOM-L-K-komaeshinogawachiikisentatoshoshitsu ghcid_numeric: 7216704275238815015 valid_from: '2025-12-06T23:38:49.230925+00:00' @@ -96,8 +97,8 @@ ch_annotator: annotation_metadata: confidence_score: 0.98 verified: false - verification_date: - verified_by: + verification_date: null + verified_by: null entity_claims: - claim_type: full_name claim_value: KOMAESHINOGAWACHIIKISENTATOSHOSHITSU @@ -151,3 +152,22 @@ location: geonames_id: 11612580 geonames_name: Komae feature_code: PPLA2 +logo_enrichment: + enrichment_timestamp: '2025-12-25T16:43:38.402923+00:00' + source_url: https://www.library.komae.tokyo.jp/facility + extraction_method: crawl4ai + claims: + - claim_type: favicon_url + claim_value: https://www.library.komae.tokyo.jp/site/wp-content/uploads/2021/01/cropped-komae_city_logo_img-180x180.png + source_url: https://www.library.komae.tokyo.jp/facility + css_selector: '[document] > html > head > link:nth-of-type(28)' + retrieved_on: '2025-12-25T16:43:38.402923+00:00' + extraction_method: crawl4ai_link_rel + favicon_type: '' + favicon_sizes: '' + summary: + total_claims: 1 + has_primary_logo: false + has_favicon: true + has_og_image: false + favicon_count: 3 diff --git a/data/custodian/JP-13-KOM-L-K.yaml b/data/custodian/JP-13-KOM-L-K.yaml index 81d388a9f2..12a51b271f 100644 --- a/data/custodian/JP-13-KOM-L-K.yaml +++ b/data/custodian/JP-13-KOM-L-K.yaml @@ -32,13 +32,14 @@ ghcid: method: CH_ANNOTATOR_SOURCE ghcid_history: - ghcid: JP-13-KOM-L-K - valid_from: "2025-12-10T09:44:07Z" + valid_from: '2025-12-10T09:44:07Z' valid_to: null - reason: "Corrected region code from JP-TO (abbreviation) to JP-13 (Tokyo) per ISO 3166-2:JP" + reason: Corrected region code from JP-TO (abbreviation) to JP-13 (Tokyo) per ISO + 3166-2:JP - ghcid: JP-TO-KOM-L-K valid_from: null - valid_to: "2025-12-10T09:44:07Z" - reason: "Previous GHCID with incorrect region code" + valid_to: '2025-12-10T09:44:07Z' + reason: Previous GHCID with incorrect region code - ghcid: JP-TO-KOM-L-K ghcid_numeric: 18041565516247263266 valid_from: '2025-12-06T23:38:49.228737+00:00' @@ -96,8 +97,8 @@ ch_annotator: annotation_metadata: confidence_score: 0.98 verified: false - verification_date: - verified_by: + verification_date: null + verified_by: null entity_claims: - claim_type: full_name claim_value: KOMAESHINISHIGAWARAKOMINKANTOSHOSHITSU @@ -151,3 +152,22 @@ location: geonames_id: 11612580 geonames_name: Komae feature_code: PPLA2 +logo_enrichment: + enrichment_timestamp: '2025-12-25T16:43:46.142163+00:00' + source_url: https://www.library.komae.tokyo.jp/facility + extraction_method: crawl4ai + claims: + - claim_type: favicon_url + claim_value: https://www.library.komae.tokyo.jp/site/wp-content/uploads/2021/01/cropped-komae_city_logo_img-180x180.png + source_url: https://www.library.komae.tokyo.jp/facility + css_selector: '[document] > html > head > link:nth-of-type(28)' + retrieved_on: '2025-12-25T16:43:46.142163+00:00' + extraction_method: crawl4ai_link_rel + favicon_type: '' + favicon_sizes: '' + summary: + total_claims: 1 + has_primary_logo: false + has_favicon: true + has_og_image: false + favicon_count: 3 diff --git a/data/custodian/JP-13-KOM-L-KL.yaml b/data/custodian/JP-13-KOM-L-KL.yaml index 4791301e0b..8d4c7974f1 100644 --- a/data/custodian/JP-13-KOM-L-KL.yaml +++ b/data/custodian/JP-13-KOM-L-KL.yaml @@ -32,13 +32,14 @@ ghcid: method: CH_ANNOTATOR_SOURCE ghcid_history: - ghcid: JP-13-KOM-L-KL - valid_from: "2025-12-10T09:44:07Z" + valid_from: '2025-12-10T09:44:07Z' valid_to: null - reason: "Corrected region code from JP-TO (abbreviation) to JP-13 (Tokyo) per ISO 3166-2:JP" + reason: Corrected region code from JP-TO (abbreviation) to JP-13 (Tokyo) per ISO + 3166-2:JP - ghcid: JP-TO-KOM-L-KL valid_from: null - valid_to: "2025-12-10T09:44:07Z" - reason: "Previous GHCID with incorrect region code" + valid_to: '2025-12-10T09:44:07Z' + reason: Previous GHCID with incorrect region code - ghcid: JP-TO-KOM-L-KL ghcid_numeric: 12116299919488097045 valid_from: '2025-12-06T23:38:43.870916+00:00' @@ -96,8 +97,8 @@ ch_annotator: annotation_metadata: confidence_score: 0.98 verified: false - verification_date: - verified_by: + verification_date: null + verified_by: null entity_claims: - claim_type: full_name claim_value: KOMAESHIRITSUCHUO Library @@ -153,3 +154,22 @@ location: geonames_id: 11612580 geonames_name: Komae feature_code: PPLA2 +logo_enrichment: + enrichment_timestamp: '2025-12-25T16:43:56.576695+00:00' + source_url: https://www.library.komae.tokyo.jp + extraction_method: crawl4ai + claims: + - claim_type: favicon_url + claim_value: https://www.library.komae.tokyo.jp/site/wp-content/uploads/2021/01/cropped-komae_city_logo_img-180x180.png + source_url: https://www.library.komae.tokyo.jp + css_selector: '[document] > html > head > link:nth-of-type(28)' + retrieved_on: '2025-12-25T16:43:56.576695+00:00' + extraction_method: crawl4ai_link_rel + favicon_type: '' + favicon_sizes: '' + summary: + total_claims: 1 + has_primary_logo: false + has_favicon: true + has_og_image: false + favicon_count: 3 diff --git a/data/custodian/JP-13-KOM-L-SL.yaml b/data/custodian/JP-13-KOM-L-SL.yaml index 4dadd18f2c..c68dffe223 100644 --- a/data/custodian/JP-13-KOM-L-SL.yaml +++ b/data/custodian/JP-13-KOM-L-SL.yaml @@ -15,7 +15,8 @@ original_entry: city: Komatsushima Shi region: Tokushima Ken postal_code: 773-0001 - street_address: 29-11 KOMATSUSHIMACHO SHINKO, Komatsushima Shi, Tokushima Ken, 773-0001 + street_address: 29-11 KOMATSUSHIMACHO SHINKO, Komatsushima Shi, Tokushima Ken, + 773-0001 processing_timestamp: '2025-12-06T23:38:47.341444+00:00' ghcid: ghcid_current: JP-13-KOM-L-SL @@ -32,13 +33,14 @@ ghcid: method: CH_ANNOTATOR_SOURCE ghcid_history: - ghcid: JP-13-KOM-L-SL - valid_from: "2025-12-10T09:44:07Z" + valid_from: '2025-12-10T09:44:07Z' valid_to: null - reason: "Corrected region code from JP-TO (abbreviation) to JP-13 (Tokyo) per ISO 3166-2:JP" + reason: Corrected region code from JP-TO (abbreviation) to JP-13 (Tokyo) per ISO + 3166-2:JP - ghcid: JP-TO-KOM-L-SL valid_from: null - valid_to: "2025-12-10T09:44:07Z" - reason: "Previous GHCID with incorrect region code" + valid_to: '2025-12-10T09:44:07Z' + reason: Previous GHCID with incorrect region code - ghcid: JP-TO-KOM-L-SL ghcid_numeric: 3912661702163306384 valid_from: '2025-12-06T23:38:47.341444+00:00' @@ -96,8 +98,8 @@ ch_annotator: annotation_metadata: confidence_score: 0.98 verified: false - verification_date: - verified_by: + verification_date: null + verified_by: null entity_claims: - claim_type: full_name claim_value: SHOGAIGAKUSHUSENTAKOMATSUSHIMASHIRITSU Library @@ -151,3 +153,22 @@ location: geonames_id: 11839307 geonames_name: Komatsushima feature_code: PPLX +logo_enrichment: + enrichment_timestamp: '2025-12-25T16:44:06.490536+00:00' + source_url: https://www.city.komatsushima.lg.jp/shisei/soshiki/toshokan + extraction_method: crawl4ai + claims: + - claim_type: favicon_url + claim_value: https://www.city.komatsushima.lg.jp/img/favicon.ico + source_url: https://www.city.komatsushima.lg.jp/shisei/soshiki/toshokan + css_selector: '[document] > html > head > link:nth-of-type(3)' + retrieved_on: '2025-12-25T16:44:06.490536+00:00' + extraction_method: crawl4ai_link_rel + favicon_type: image/x-icon + favicon_sizes: '' + summary: + total_claims: 1 + has_primary_logo: false + has_favicon: true + has_og_image: false + favicon_count: 1 diff --git a/data/custodian/JP-13-KOT-L-ALMCAT.yaml b/data/custodian/JP-13-KOT-L-ALMCAT.yaml index e7d3e241cc..2eb731de2a 100644 --- a/data/custodian/JP-13-KOT-L-ALMCAT.yaml +++ b/data/custodian/JP-13-KOT-L-ALMCAT.yaml @@ -32,13 +32,14 @@ ghcid: method: CH_ANNOTATOR_SOURCE ghcid_history: - ghcid: JP-13-KOT-L-ALMCAT - valid_from: "2025-12-10T09:44:07Z" + valid_from: '2025-12-10T09:44:07Z' valid_to: null - reason: "Corrected region code from JP-TO (abbreviation) to JP-13 (Tokyo) per ISO 3166-2:JP" + reason: Corrected region code from JP-TO (abbreviation) to JP-13 (Tokyo) per ISO + 3166-2:JP - ghcid: JP-TO-KOT-L-ALMCAT valid_from: null - valid_to: "2025-12-10T09:44:07Z" - reason: "Previous GHCID with incorrect region code" + valid_to: '2025-12-10T09:44:07Z' + reason: Previous GHCID with incorrect region code - ghcid: JP-TO-KOT-L-ALMCAT ghcid_numeric: 314346919356344796 valid_from: '2025-12-06T23:38:58.094414+00:00' @@ -96,8 +97,8 @@ ch_annotator: annotation_metadata: confidence_score: 0.98 verified: false - verification_date: - verified_by: + verification_date: null + verified_by: null entity_claims: - claim_type: full_name claim_value: Art Library, Museum of Comtemporary Art, Tokyo @@ -151,3 +152,28 @@ location: geonames_id: 11209896 geonames_name: Kotō feature_code: PPL +logo_enrichment: + enrichment_timestamp: '2025-12-25T16:44:23.820611+00:00' + source_url: http://www.mot-art-museum.jp/library/collection.html + extraction_method: crawl4ai + claims: + - claim_type: favicon_url + claim_value: http://www.mot-art-museum.jp/_assets/images/head/safari-pinned-tab.svg + source_url: http://www.mot-art-museum.jp/library/collection.html + css_selector: '[document] > html.font-loaded > head > link:nth-of-type(5)' + retrieved_on: '2025-12-25T16:44:23.820611+00:00' + extraction_method: crawl4ai_link_rel + favicon_type: '' + favicon_sizes: '' + - claim_type: og_image_url + claim_value: https://www.mot-art-museum.jp/_assets/images/head/og-image@2x.png + source_url: http://www.mot-art-museum.jp/library/collection.html + css_selector: '[document] > html.font-loaded > head > meta:nth-of-type(11)' + retrieved_on: '2025-12-25T16:44:23.820611+00:00' + extraction_method: crawl4ai_meta_og + summary: + total_claims: 2 + has_primary_logo: false + has_favicon: true + has_og_image: true + favicon_count: 4 diff --git a/data/custodian/JP-13-KOT-L-ML.yaml b/data/custodian/JP-13-KOT-L-ML.yaml index daf0fb378c..3a8a2d3a44 100644 --- a/data/custodian/JP-13-KOT-L-ML.yaml +++ b/data/custodian/JP-13-KOT-L-ML.yaml @@ -37,13 +37,14 @@ ghcid: method: CH_ANNOTATOR_SOURCE ghcid_history: - ghcid: JP-13-KOT-L-ML - valid_from: "2025-12-10T09:44:07Z" + valid_from: '2025-12-10T09:44:07Z' valid_to: null - reason: "Corrected region code from JP-TO (abbreviation) to JP-13 (Tokyo) per ISO 3166-2:JP" + reason: Corrected region code from JP-TO (abbreviation) to JP-13 (Tokyo) per ISO + 3166-2:JP - ghcid: JP-TO-KOT-L-ML valid_from: null - valid_to: "2025-12-10T09:44:07Z" - reason: "Previous GHCID with incorrect region code" + valid_to: '2025-12-10T09:44:07Z' + reason: Previous GHCID with incorrect region code - ghcid: JP-TO-KOT-L-ML ghcid_numeric: 2321164767122624133 valid_from: '2025-12-06T23:38:59.466666+00:00' @@ -101,8 +102,8 @@ ch_annotator: annotation_metadata: confidence_score: 0.98 verified: false - verification_date: - verified_by: + verification_date: null + verified_by: null entity_claims: - claim_type: full_name claim_value: MUSASHINODAIGAKUARIAKE Library @@ -204,3 +205,28 @@ location: geonames_id: 11209896 geonames_name: Kotō feature_code: PPL +logo_enrichment: + enrichment_timestamp: '2025-12-25T16:45:52.548488+00:00' + source_url: http://www.musashino-u.ac.jp/library/index.html + extraction_method: crawl4ai + claims: + - claim_type: favicon_url + claim_value: http://www.musashino-u.ac.jp/assets/img/common/apple-touch-icon_180x180.png + source_url: http://www.musashino-u.ac.jp/library/index.html + css_selector: '[document] > html > head > link:nth-of-type(5)' + retrieved_on: '2025-12-25T16:45:52.548488+00:00' + extraction_method: crawl4ai_link_rel + favicon_type: image/png + favicon_sizes: 180x180 + - claim_type: og_image_url + claim_value: https://www.musashino-u.ac.jp/ogp.jpg + source_url: http://www.musashino-u.ac.jp/library/index.html + css_selector: '[document] > html > head > meta:nth-of-type(15)' + retrieved_on: '2025-12-25T16:45:52.548488+00:00' + extraction_method: crawl4ai_meta_og + summary: + total_claims: 2 + has_primary_logo: false + has_favicon: true + has_og_image: true + favicon_count: 3 diff --git a/data/custodian/JP-13-KOT-L-SITTL.yaml b/data/custodian/JP-13-KOT-L-SITTL.yaml index 82b2c42a64..4c8de5f4f2 100644 --- a/data/custodian/JP-13-KOT-L-SITTL.yaml +++ b/data/custodian/JP-13-KOT-L-SITTL.yaml @@ -37,13 +37,14 @@ ghcid: method: CH_ANNOTATOR_SOURCE ghcid_history: - ghcid: JP-13-KOT-L-SITTL - valid_from: "2025-12-10T09:44:07Z" + valid_from: '2025-12-10T09:44:07Z' valid_to: null - reason: "Corrected region code from JP-TO (abbreviation) to JP-13 (Tokyo) per ISO 3166-2:JP" + reason: Corrected region code from JP-TO (abbreviation) to JP-13 (Tokyo) per ISO + 3166-2:JP - ghcid: JP-TO-KOT-L-SITTL valid_from: null - valid_to: "2025-12-10T09:44:07Z" - reason: "Previous GHCID with incorrect region code" + valid_to: '2025-12-10T09:44:07Z' + reason: Previous GHCID with incorrect region code - ghcid: JP-TO-KOT-L-SITTL ghcid_numeric: 8969949617735276285 valid_from: '2025-12-06T23:38:54.929443+00:00' @@ -101,8 +102,8 @@ ch_annotator: annotation_metadata: confidence_score: 0.98 verified: false - verification_date: - verified_by: + verification_date: null + verified_by: null entity_claims: - claim_type: full_name claim_value: Shibaura Institute of Technology Toyosu Library @@ -190,7 +191,8 @@ wikidata_enrichment: description: organisatie uit Japan - id: Q56056912 label: Japan Consortium for Open Access Repository - description: promotes open access and open science in Japan with knowledge dissemination via digital repositories + description: promotes open access and open science in Japan with knowledge dissemination + via digital repositories wikidata_web: official_website: http://lib.shibaura-it.ac.jp wikidata_official_website: http://lib.shibaura-it.ac.jp @@ -212,3 +214,22 @@ location: geonames_id: 11209896 geonames_name: Kotō feature_code: PPL +logo_enrichment: + enrichment_timestamp: '2025-12-25T16:45:59.163354+00:00' + source_url: http://lib.shibaura-it.ac.jp + extraction_method: crawl4ai + claims: + - claim_type: favicon_url + claim_value: http://lib.shibaura-it.ac.jp/files/images/favicon.ico + source_url: http://lib.shibaura-it.ac.jp + css_selector: '[document] > html > head > link' + retrieved_on: '2025-12-25T16:45:59.163354+00:00' + extraction_method: crawl4ai_link_rel + favicon_type: '' + favicon_sizes: '' + summary: + total_claims: 1 + has_primary_logo: false + has_favicon: true + has_og_image: false + favicon_count: 1 diff --git a/data/custodian/JP-13-KOT-L-TEPSCTMRIE.yaml b/data/custodian/JP-13-KOT-L-TEPSCTMRIE.yaml index 8f6c6cbeff..15d916ae55 100644 --- a/data/custodian/JP-13-KOT-L-TEPSCTMRIE.yaml +++ b/data/custodian/JP-13-KOT-L-TEPSCTMRIE.yaml @@ -155,3 +155,23 @@ location: geonames_id: 11209896 geonames_name: Kotō feature_code: PPL +logo_enrichment: + enrichment_timestamp: '2025-12-25T16:46:22.560259+00:00' + source_url: http://www.tokyokankyo.jp/kankyoken/profile/utility#library + extraction_method: crawl4ai + claims: + - claim_type: logo_url + claim_value: https://www.tokyokankyo.jp/kankyoken/wp-content/themes/kankyoken/images/top-logo.png + source_url: http://www.tokyokankyo.jp/kankyoken/profile/utility#library + css_selector: '[document] > html > body.home.wp-singular > div.container > header + > div.header-container > h1 > a > img' + retrieved_on: '2025-12-25T16:46:22.560259+00:00' + extraction_method: crawl4ai_header_logo + detection_confidence: high + alt_text: 東京都環境科学研究所 + summary: + total_claims: 1 + has_primary_logo: true + has_favicon: false + has_og_image: false + favicon_count: 0 diff --git a/data/custodian/JP-13-KOT-L-TL.yaml b/data/custodian/JP-13-KOT-L-TL.yaml index c8b898852f..8347c5ec3a 100644 --- a/data/custodian/JP-13-KOT-L-TL.yaml +++ b/data/custodian/JP-13-KOT-L-TL.yaml @@ -37,13 +37,14 @@ ghcid: method: CH_ANNOTATOR_SOURCE ghcid_history: - ghcid: JP-13-KOT-L-TL - valid_from: "2025-12-10T09:44:07Z" + valid_from: '2025-12-10T09:44:07Z' valid_to: null - reason: "Corrected region code from JP-TO (abbreviation) to JP-13 (Tokyo) per ISO 3166-2:JP" + reason: Corrected region code from JP-TO (abbreviation) to JP-13 (Tokyo) per ISO + 3166-2:JP - ghcid: JP-TO-KOT-L-TL valid_from: null - valid_to: "2025-12-10T09:44:07Z" - reason: "Previous GHCID with incorrect region code" + valid_to: '2025-12-10T09:44:07Z' + reason: Previous GHCID with incorrect region code - ghcid: JP-TO-KOT-L-TL ghcid_numeric: 16577633535012922150 valid_from: '2025-12-06T23:38:55.467766+00:00' @@ -101,8 +102,8 @@ ch_annotator: annotation_metadata: confidence_score: 0.98 verified: false - verification_date: - verified_by: + verification_date: null + verified_by: null entity_claims: - claim_type: full_name claim_value: TOKYOARIAKEIRYODAIGAKUFUZOKU Library @@ -204,3 +205,28 @@ location: geonames_id: 11209896 geonames_name: Kotō feature_code: PPL +logo_enrichment: + enrichment_timestamp: '2025-12-25T16:46:29.832554+00:00' + source_url: http://www.tau.ac.jp/facilities/library/index.html + extraction_method: crawl4ai + claims: + - claim_type: favicon_url + claim_value: http://www.tau.ac.jp/wp-content/uploads/favicon.ico + source_url: http://www.tau.ac.jp/facilities/library/index.html + css_selector: '[document] > html > head > link:nth-of-type(6)' + retrieved_on: '2025-12-25T16:46:29.832554+00:00' + extraction_method: crawl4ai_link_rel + favicon_type: '' + favicon_sizes: '' + - claim_type: og_image_url + claim_value: https://www.tau.ac.jp/wp-content/uploads/2023/04/thum_OG.jpg + source_url: http://www.tau.ac.jp/facilities/library/index.html + css_selector: '[document] > html > head > meta:nth-of-type(6)' + retrieved_on: '2025-12-25T16:46:29.832554+00:00' + extraction_method: crawl4ai_meta_og + summary: + total_claims: 2 + has_primary_logo: false + has_favicon: true + has_og_image: true + favicon_count: 1 diff --git a/data/custodian/JP-13-KOT-L-TUMSTLEB.yaml b/data/custodian/JP-13-KOT-L-TUMSTLEB.yaml index a0f04ac71d..56f708e617 100644 --- a/data/custodian/JP-13-KOT-L-TUMSTLEB.yaml +++ b/data/custodian/JP-13-KOT-L-TUMSTLEB.yaml @@ -37,20 +37,22 @@ ghcid: method: CH_ANNOTATOR_SOURCE ghcid_history: - ghcid: JP-13-KOT-L-TUMSTLEB - valid_from: "2025-12-10T09:44:07Z" + valid_from: '2025-12-10T09:44:07Z' valid_to: null - reason: "Corrected region code from JP-TO (abbreviation) to JP-13 (Tokyo) per ISO 3166-2:JP" + reason: Corrected region code from JP-TO (abbreviation) to JP-13 (Tokyo) per ISO + 3166-2:JP - ghcid: JP-TO-KOT-L-TUMSTLEB valid_from: null - valid_to: "2025-12-10T09:44:07Z" - reason: "Previous GHCID with incorrect region code" + valid_to: '2025-12-10T09:44:07Z' + reason: Previous GHCID with incorrect region code - ghcid: JP-TO-KOT-L-TUMSTLEB ghcid_numeric: 12908528722178648828 valid_from: '2025-12-06T23:38:53.413683+00:00' reason: Initial GHCID from CH-Annotator (japan_complete_ch_annotator.yaml) custodian_name: claim_type: custodian_name - claim_value: Tokyo University of Marine Science and Technology Library Etchujima branch + claim_value: Tokyo University of Marine Science and Technology Library Etchujima + branch source_type: ch_annotator identifiers: - identifier_scheme: GHCID @@ -101,11 +103,12 @@ ch_annotator: annotation_metadata: confidence_score: 0.98 verified: false - verification_date: - verified_by: + verification_date: null + verified_by: null entity_claims: - claim_type: full_name - claim_value: Tokyo University of Marine Science and Technology Library Etchujima branch + claim_value: Tokyo University of Marine Science and Technology Library Etchujima + branch property_uri: skos:prefLabel provenance: namespace: glam @@ -164,7 +167,8 @@ wikidata_enrichment: wikidata_labels: en: Tokyo University of Marine Science and Technology Library Etchujima branch ja: 東京海洋大学附属図書館越中島分館 - wikidata_label_en: Tokyo University of Marine Science and Technology Library Etchujima branch + wikidata_label_en: Tokyo University of Marine Science and Technology Library Etchujima + branch wikidata_label_ja: 東京海洋大学附属図書館越中島分館 wikidata_classification: instance_of: &id004 @@ -204,3 +208,22 @@ location: geonames_id: 11209896 geonames_name: Kotō feature_code: PPL +logo_enrichment: + enrichment_timestamp: '2025-12-25T16:46:42.280914+00:00' + source_url: http://lib.s.kaiyodai.ac.jp + extraction_method: crawl4ai + claims: + - claim_type: favicon_url + claim_value: http://lib.s.kaiyodai.ac.jp/theme/Kaiyo/net_commons/favicon.ico?1635399676 + source_url: http://lib.s.kaiyodai.ac.jp + css_selector: '[document] > html.ng-scope > head > link' + retrieved_on: '2025-12-25T16:46:42.280914+00:00' + extraction_method: crawl4ai_link_rel + favicon_type: image/x-icon + favicon_sizes: '' + summary: + total_claims: 1 + has_primary_logo: false + has_favicon: true + has_og_image: false + favicon_count: 1 diff --git a/data/custodian/JP-13-KOT-M-CTARWD.yaml b/data/custodian/JP-13-KOT-M-CTARWD.yaml index 66d726ca38..c9cdb4cb75 100644 --- a/data/custodian/JP-13-KOT-M-CTARWD.yaml +++ b/data/custodian/JP-13-KOT-M-CTARWD.yaml @@ -32,13 +32,14 @@ ghcid: method: CH_ANNOTATOR_SOURCE ghcid_history: - ghcid: JP-13-KOT-M-CTARWD - valid_from: "2025-12-10T09:44:07Z" + valid_from: '2025-12-10T09:44:07Z' valid_to: null - reason: "Corrected region code from JP-TO (abbreviation) to JP-13 (Tokyo) per ISO 3166-2:JP" + reason: Corrected region code from JP-TO (abbreviation) to JP-13 (Tokyo) per ISO + 3166-2:JP - ghcid: JP-TO-KOT-M-CTARWD valid_from: null - valid_to: "2025-12-10T09:44:07Z" - reason: "Previous GHCID with incorrect region code" + valid_to: '2025-12-10T09:44:07Z' + reason: Previous GHCID with incorrect region code - ghcid: JP-TO-KOT-M-CTARWD ghcid_numeric: 14352239066257124496 valid_from: '2025-12-06T23:38:33.268225+00:00' @@ -96,8 +97,8 @@ ch_annotator: annotation_metadata: confidence_score: 0.98 verified: false - verification_date: - verified_by: + verification_date: null + verified_by: null entity_claims: - claim_type: full_name claim_value: The Center of the Tokyo Air Raids and War Damage @@ -151,3 +152,22 @@ location: geonames_id: 11209896 geonames_name: Kotō feature_code: PPL +logo_enrichment: + enrichment_timestamp: '2025-12-25T16:46:51.886982+00:00' + source_url: https://tokyo-sensai.net + extraction_method: crawl4ai + claims: + - claim_type: favicon_url + claim_value: https://tokyo-sensai.net/wp/wp-content/uploads/2022/08/cropped-favi-180x180.png + source_url: https://tokyo-sensai.net + css_selector: '[document] > html.js > head > link:nth-of-type(20)' + retrieved_on: '2025-12-25T16:46:51.886982+00:00' + extraction_method: crawl4ai_link_rel + favicon_type: '' + favicon_sizes: '' + summary: + total_claims: 1 + has_primary_logo: false + has_favicon: true + has_og_image: false + favicon_count: 3 diff --git a/data/custodian/JP-13-KOT-M-DFEH.yaml b/data/custodian/JP-13-KOT-M-DFEH.yaml index 913ab6a5c1..ad2712049e 100644 --- a/data/custodian/JP-13-KOT-M-DFEH.yaml +++ b/data/custodian/JP-13-KOT-M-DFEH.yaml @@ -807,3 +807,22 @@ youtube_enrichment: comments: [] thumbnail_url: https://i.ytimg.com/vi/hc6Ao_cKgvQ/hqdefault.jpg status: SUCCESS +logo_enrichment: + enrichment_timestamp: '2025-12-25T16:47:00.306984+00:00' + source_url: http://d5f.org + extraction_method: crawl4ai + claims: + - claim_type: favicon_url + claim_value: http://d5f.org/wp/wp-content/themes/fukuryumaru_theme/favicon.ico + source_url: http://d5f.org + css_selector: '[document] > html > head > link' + retrieved_on: '2025-12-25T16:47:00.306984+00:00' + extraction_method: crawl4ai_link_rel + favicon_type: '' + favicon_sizes: '' + summary: + total_claims: 1 + has_primary_logo: false + has_favicon: true + has_og_image: false + favicon_count: 1 diff --git a/data/custodian/JP-13-KOT-M-GSM.yaml b/data/custodian/JP-13-KOT-M-GSM.yaml index 7f5119e8cb..e3c6b04833 100644 --- a/data/custodian/JP-13-KOT-M-GSM.yaml +++ b/data/custodian/JP-13-KOT-M-GSM.yaml @@ -39,13 +39,14 @@ ghcid: method: CH_ANNOTATOR_SOURCE ghcid_history: - ghcid: JP-13-KOT-M-GSM - valid_from: "2025-12-10T09:44:07Z" + valid_from: '2025-12-10T09:44:07Z' valid_to: null - reason: "Corrected region code from JP-TO (abbreviation) to JP-13 (Tokyo) per ISO 3166-2:JP" + reason: Corrected region code from JP-TO (abbreviation) to JP-13 (Tokyo) per ISO + 3166-2:JP - ghcid: JP-TO-KOT-M-GSM valid_from: null - valid_to: "2025-12-10T09:44:07Z" - reason: "Previous GHCID with incorrect region code" + valid_to: '2025-12-10T09:44:07Z' + reason: Previous GHCID with incorrect region code - ghcid: JP-TO-KOT-M-GSM ghcid_numeric: 1298210316646614805 valid_from: '2025-12-06T23:38:33.259603+00:00' @@ -103,8 +104,8 @@ ch_annotator: annotation_metadata: confidence_score: 0.98 verified: false - verification_date: - verified_by: + verification_date: null + verified_by: null entity_claims: - claim_type: full_name claim_value: GAS SCIENCE MUSEUM @@ -250,3 +251,37 @@ location: postal_code: 135-0061 street_address: TOYOSU, Koto Ku, Tokyo To, 135-0061 normalization_timestamp: '2025-12-09T12:21:45.795110+00:00' +logo_enrichment: + enrichment_timestamp: '2025-12-25T16:47:08.895736+00:00' + source_url: https://www.gas-kagakukan.com + extraction_method: crawl4ai + claims: + - claim_type: logo_url + claim_value: https://www.gas-kagakukan.com/common20/img/logo_group.svg + source_url: https://www.gas-kagakukan.com + css_selector: '#header > section.l-header-group > div.l-header-group__inner > + p.l-header-group__logo > a > img' + retrieved_on: '2025-12-25T16:47:08.895736+00:00' + extraction_method: crawl4ai_header_logo + detection_confidence: high + alt_text: TOKYO GAS GROUP + - claim_type: favicon_url + claim_value: https://www.gas-kagakukan.com/apple-touch-icon.png + source_url: https://www.gas-kagakukan.com + css_selector: '[document] > html > head > link' + retrieved_on: '2025-12-25T16:47:08.895736+00:00' + extraction_method: crawl4ai_link_rel + favicon_type: '' + favicon_sizes: '' + - claim_type: og_image_url + claim_value: https://www.gas-kagakukan.com/og.png + source_url: https://www.gas-kagakukan.com + css_selector: '[document] > html > head > meta:nth-of-type(6)' + retrieved_on: '2025-12-25T16:47:08.895736+00:00' + extraction_method: crawl4ai_meta_og + summary: + total_claims: 3 + has_primary_logo: true + has_favicon: true + has_og_image: true + favicon_count: 2 diff --git a/data/custodian/JP-13-KOT-M-KCBM.yaml b/data/custodian/JP-13-KOT-M-KCBM.yaml index 788bd496f3..ddba9cb1e4 100644 --- a/data/custodian/JP-13-KOT-M-KCBM.yaml +++ b/data/custodian/JP-13-KOT-M-KCBM.yaml @@ -32,13 +32,14 @@ ghcid: method: CH_ANNOTATOR_SOURCE ghcid_history: - ghcid: JP-13-KOT-M-KCBM - valid_from: "2025-12-10T09:44:07Z" + valid_from: '2025-12-10T09:44:07Z' valid_to: null - reason: "Corrected region code from JP-TO (abbreviation) to JP-13 (Tokyo) per ISO 3166-2:JP" + reason: Corrected region code from JP-TO (abbreviation) to JP-13 (Tokyo) per ISO + 3166-2:JP - ghcid: JP-TO-KOT-M-KCBM valid_from: null - valid_to: "2025-12-10T09:44:07Z" - reason: "Previous GHCID with incorrect region code" + valid_to: '2025-12-10T09:44:07Z' + reason: Previous GHCID with incorrect region code - ghcid: JP-TO-KOT-M-KCBM ghcid_numeric: 12626072292159352317 valid_from: '2025-12-06T23:38:33.252343+00:00' @@ -96,8 +97,8 @@ ch_annotator: annotation_metadata: confidence_score: 0.98 verified: false - verification_date: - verified_by: + verification_date: null + verified_by: null entity_claims: - claim_type: full_name claim_value: KOTO CITY BASHO MUSEUM @@ -151,3 +152,22 @@ location: geonames_id: 11209896 geonames_name: Kotō feature_code: PPL +logo_enrichment: + enrichment_timestamp: '2025-12-25T16:47:20.116193+00:00' + source_url: https://www.kcf.or.jp/basho + extraction_method: crawl4ai + claims: + - claim_type: logo_url + claim_value: https://www.kcf.or.jp/images/common/logo_s.png + source_url: https://www.kcf.or.jp/basho + css_selector: '#header > div.inner > a > img.hd_logo' + retrieved_on: '2025-12-25T16:47:20.116193+00:00' + extraction_method: crawl4ai_header_logo + detection_confidence: high + alt_text: 公益財団法人 江東区文化コミュニティ財団 + summary: + total_claims: 1 + has_primary_logo: true + has_favicon: false + has_og_image: false + favicon_count: 0 diff --git a/data/custodian/JP-13-KOT-M-KCFEM.yaml b/data/custodian/JP-13-KOT-M-KCFEM.yaml index 9caa946224..aeffc11dbc 100644 --- a/data/custodian/JP-13-KOT-M-KCFEM.yaml +++ b/data/custodian/JP-13-KOT-M-KCFEM.yaml @@ -32,13 +32,14 @@ ghcid: method: CH_ANNOTATOR_SOURCE ghcid_history: - ghcid: JP-13-KOT-M-KCFEM - valid_from: "2025-12-10T09:44:07Z" + valid_from: '2025-12-10T09:44:07Z' valid_to: null - reason: "Corrected region code from JP-TO (abbreviation) to JP-13 (Tokyo) per ISO 3166-2:JP" + reason: Corrected region code from JP-TO (abbreviation) to JP-13 (Tokyo) per ISO + 3166-2:JP - ghcid: JP-TO-KOT-M-KCFEM valid_from: null - valid_to: "2025-12-10T09:44:07Z" - reason: "Previous GHCID with incorrect region code" + valid_to: '2025-12-10T09:44:07Z' + reason: Previous GHCID with incorrect region code - ghcid: JP-TO-KOT-M-KCFEM ghcid_numeric: 5881571536165628428 valid_from: '2025-12-06T23:38:33.254810+00:00' @@ -96,8 +97,8 @@ ch_annotator: annotation_metadata: confidence_score: 0.98 verified: false - verification_date: - verified_by: + verification_date: null + verified_by: null entity_claims: - claim_type: full_name claim_value: KOTO CITY FUKAGAWA EDO MUSEUM @@ -151,3 +152,22 @@ location: geonames_id: 11209896 geonames_name: Kotō feature_code: PPL +logo_enrichment: + enrichment_timestamp: '2025-12-25T16:47:28.941981+00:00' + source_url: https://www.kcf.or.jp/fukagawa + extraction_method: crawl4ai + claims: + - claim_type: logo_url + claim_value: https://www.kcf.or.jp/images/common/logo_s.png + source_url: https://www.kcf.or.jp/fukagawa + css_selector: '#header > div.inner > a > img.hd_logo' + retrieved_on: '2025-12-25T16:47:28.941981+00:00' + extraction_method: crawl4ai_header_logo + detection_confidence: high + alt_text: 公益財団法人 江東区文化コミュニティ財団 + summary: + total_claims: 1 + has_primary_logo: true + has_favicon: false + has_og_image: false + favicon_count: 0 diff --git a/data/custodian/JP-13-KOT-M-MCAT.yaml b/data/custodian/JP-13-KOT-M-MCAT.yaml index 0f66e9e1f6..77dc999be8 100644 --- a/data/custodian/JP-13-KOT-M-MCAT.yaml +++ b/data/custodian/JP-13-KOT-M-MCAT.yaml @@ -32,13 +32,14 @@ ghcid: method: CH_ANNOTATOR_SOURCE ghcid_history: - ghcid: JP-13-KOT-M-MCAT - valid_from: "2025-12-10T09:44:07Z" + valid_from: '2025-12-10T09:44:07Z' valid_to: null - reason: "Corrected region code from JP-TO (abbreviation) to JP-13 (Tokyo) per ISO 3166-2:JP" + reason: Corrected region code from JP-TO (abbreviation) to JP-13 (Tokyo) per ISO + 3166-2:JP - ghcid: JP-TO-KOT-M-MCAT valid_from: null - valid_to: "2025-12-10T09:44:07Z" - reason: "Previous GHCID with incorrect region code" + valid_to: '2025-12-10T09:44:07Z' + reason: Previous GHCID with incorrect region code - ghcid: JP-TO-KOT-M-MCAT ghcid_numeric: 9429219328438882338 valid_from: '2025-12-06T23:38:33.257256+00:00' @@ -96,8 +97,8 @@ ch_annotator: annotation_metadata: confidence_score: 0.98 verified: false - verification_date: - verified_by: + verification_date: null + verified_by: null entity_claims: - claim_type: full_name claim_value: MUSEUM OF CONTEMPORARY ART, TOKYO @@ -151,3 +152,28 @@ location: geonames_id: 11209896 geonames_name: Kotō feature_code: PPL +logo_enrichment: + enrichment_timestamp: '2025-12-25T16:47:37.071528+00:00' + source_url: https://www.mot-art-museum.jp + extraction_method: crawl4ai + claims: + - claim_type: favicon_url + claim_value: https://www.mot-art-museum.jp/_assets/images/head/safari-pinned-tab.svg + source_url: https://www.mot-art-museum.jp + css_selector: '[document] > html > head > link:nth-of-type(5)' + retrieved_on: '2025-12-25T16:47:37.071528+00:00' + extraction_method: crawl4ai_link_rel + favicon_type: '' + favicon_sizes: '' + - claim_type: og_image_url + claim_value: https://www.mot-art-museum.jp/_assets/images/head/og-image@2x.png + source_url: https://www.mot-art-museum.jp + css_selector: '[document] > html > head > meta:nth-of-type(11)' + retrieved_on: '2025-12-25T16:47:37.071528+00:00' + extraction_method: crawl4ai_meta_og + summary: + total_claims: 2 + has_primary_logo: false + has_favicon: true + has_og_image: true + favicon_count: 4 diff --git a/data/custodian/JP-13-KOT-M-MNMESI.yaml b/data/custodian/JP-13-KOT-M-MNMESI.yaml index 18c377a2a9..d21d9f0927 100644 --- a/data/custodian/JP-13-KOT-M-MNMESI.yaml +++ b/data/custodian/JP-13-KOT-M-MNMESI.yaml @@ -32,13 +32,14 @@ ghcid: method: CH_ANNOTATOR_SOURCE ghcid_history: - ghcid: JP-13-KOT-M-MNMESI - valid_from: "2025-12-10T09:44:07Z" + valid_from: '2025-12-10T09:44:07Z' valid_to: null - reason: "Corrected region code from JP-TO (abbreviation) to JP-13 (Tokyo) per ISO 3166-2:JP" + reason: Corrected region code from JP-TO (abbreviation) to JP-13 (Tokyo) per ISO + 3166-2:JP - ghcid: JP-TO-KOT-M-MNMESI valid_from: null - valid_to: "2025-12-10T09:44:07Z" - reason: "Previous GHCID with incorrect region code" + valid_to: '2025-12-10T09:44:07Z' + reason: Previous GHCID with incorrect region code - ghcid: JP-TO-KOT-M-MNMESI ghcid_numeric: 17675681126292546767 valid_from: '2025-12-06T23:38:33.263050+00:00' @@ -96,8 +97,8 @@ ch_annotator: annotation_metadata: confidence_score: 0.98 verified: false - verification_date: - verified_by: + verification_date: null + verified_by: null entity_claims: - claim_type: full_name claim_value: Miraikan-THE NATIONAL MUSEUM OF EMERGING SCIENCE AND INNOVATION @@ -151,3 +152,28 @@ location: geonames_id: 11209896 geonames_name: Kotō feature_code: PPL +logo_enrichment: + enrichment_timestamp: '2025-12-25T16:47:46.126313+00:00' + source_url: https://www.miraikan.jst.go.jp + extraction_method: crawl4ai + claims: + - claim_type: favicon_url + claim_value: https://www.miraikan.jst.go.jp/_assets/img/global/apple-touch-icon.png + source_url: https://www.miraikan.jst.go.jp + css_selector: '[document] > html > head > link:nth-of-type(2)' + retrieved_on: '2025-12-25T16:47:46.126313+00:00' + extraction_method: crawl4ai_link_rel + favicon_type: '' + favicon_sizes: 180x180 + - claim_type: og_image_url + claim_value: https://www.miraikan.jst.go.jp/images/20220927top_ogp.jpg + source_url: https://www.miraikan.jst.go.jp + css_selector: '[document] > html > head > meta:nth-of-type(18)' + retrieved_on: '2025-12-25T16:47:46.126313+00:00' + extraction_method: crawl4ai_meta_og + summary: + total_claims: 2 + has_primary_logo: false + has_favicon: true + has_og_image: true + favicon_count: 2 diff --git a/data/custodian/JP-13-KOT-M-NFM.yaml b/data/custodian/JP-13-KOT-M-NFM.yaml index ce29d8b8c8..6f1454d40a 100644 --- a/data/custodian/JP-13-KOT-M-NFM.yaml +++ b/data/custodian/JP-13-KOT-M-NFM.yaml @@ -464,3 +464,22 @@ youtube_enrichment: comments: [] thumbnail_url: https://i.ytimg.com/vi/W6LltUte9Tc/hqdefault.jpg status: SUCCESS +logo_enrichment: + enrichment_timestamp: '2025-12-25T16:47:55.348513+00:00' + source_url: https://www.kcf.or.jp/nakagawa + extraction_method: crawl4ai + claims: + - claim_type: logo_url + claim_value: https://www.kcf.or.jp/images/common/logo_s.png + source_url: https://www.kcf.or.jp/nakagawa + css_selector: '#header > div.inner > a > img.hd_logo' + retrieved_on: '2025-12-25T16:47:55.348513+00:00' + extraction_method: crawl4ai_header_logo + detection_confidence: high + alt_text: 公益財団法人 江東区文化コミュニティ財団 + summary: + total_claims: 1 + has_primary_logo: true + has_favicon: false + has_og_image: false + favicon_count: 0 diff --git a/data/custodian/JP-13-KOT-M-YSTGD.yaml b/data/custodian/JP-13-KOT-M-YSTGD.yaml index 2417696fa6..8717654fec 100644 --- a/data/custodian/JP-13-KOT-M-YSTGD.yaml +++ b/data/custodian/JP-13-KOT-M-YSTGD.yaml @@ -152,3 +152,28 @@ location: geonames_id: 11209896 geonames_name: Kotō feature_code: PPL +logo_enrichment: + enrichment_timestamp: '2025-12-25T16:48:04.460776+00:00' + source_url: https://www.yumenoshima.jp + extraction_method: crawl4ai + claims: + - claim_type: favicon_url + claim_value: https://www.yumenoshima.jp/cms/wp-content/themes/yumenoshima/assets/img/common/apple-touch-icon-precomposed.png + source_url: https://www.yumenoshima.jp + css_selector: '[document] > html > head > link:nth-of-type(2)' + retrieved_on: '2025-12-25T16:48:04.460776+00:00' + extraction_method: crawl4ai_link_rel + favicon_type: '' + favicon_sizes: '' + - claim_type: og_image_url + claim_value: https://www.yumenoshima.jp/cms/wp-content/uploads/2022/04/ogp_sougou.png + source_url: https://www.yumenoshima.jp + css_selector: '[document] > html > head > meta:nth-of-type(12)' + retrieved_on: '2025-12-25T16:48:04.460776+00:00' + extraction_method: crawl4ai_meta_og + summary: + total_claims: 2 + has_primary_logo: false + has_favicon: true + has_og_image: true + favicon_count: 2 diff --git a/data/custodian/JP-13-KOZ-L-KPL.yaml b/data/custodian/JP-13-KOZ-L-KPL.yaml index b4f772740a..f3f59fb433 100644 --- a/data/custodian/JP-13-KOZ-L-KPL.yaml +++ b/data/custodian/JP-13-KOZ-L-KPL.yaml @@ -32,13 +32,14 @@ ghcid: method: CH_ANNOTATOR_SOURCE ghcid_history: - ghcid: JP-13-KOZ-L-KPL - valid_from: "2025-12-10T09:44:07Z" + valid_from: '2025-12-10T09:44:07Z' valid_to: null - reason: "Corrected region code from JP-TO (abbreviation) to JP-13 (Tokyo) per ISO 3166-2:JP" + reason: Corrected region code from JP-TO (abbreviation) to JP-13 (Tokyo) per ISO + 3166-2:JP - ghcid: JP-TO-KOZ-L-KPL valid_from: null - valid_to: "2025-12-10T09:44:07Z" - reason: "Previous GHCID with incorrect region code" + valid_to: '2025-12-10T09:44:07Z' + reason: Previous GHCID with incorrect region code - ghcid: JP-TO-KOZ-L-KPL ghcid_numeric: 3813323661890044744 valid_from: '2025-12-06T23:38:48.690936+00:00' @@ -96,8 +97,8 @@ ch_annotator: annotation_metadata: confidence_score: 0.98 verified: false - verification_date: - verified_by: + verification_date: null + verified_by: null entity_claims: - claim_type: full_name claim_value: KOUZUSHIMA PUBLIC LIBRARY @@ -151,3 +152,22 @@ location: geonames_id: 1858557 geonames_name: Kōzushima feature_code: PPL +logo_enrichment: + enrichment_timestamp: '2025-12-25T16:48:21.966953+00:00' + source_url: http://vill.kouzushima.tokyo.jp/library + extraction_method: crawl4ai + claims: + - claim_type: favicon_url + claim_value: https://www.vill.kouzushima.tokyo.jp/images/2023/02/cropped-favicon-180x180.png + source_url: http://vill.kouzushima.tokyo.jp/library + css_selector: '[document] > html.pc > head > link:nth-of-type(25)' + retrieved_on: '2025-12-25T16:48:21.966953+00:00' + extraction_method: crawl4ai_link_rel + favicon_type: '' + favicon_sizes: '' + summary: + total_claims: 1 + has_primary_logo: false + has_favicon: true + has_og_image: false + favicon_count: 3 diff --git a/data/custodian/JP-13-KUB-L-FL.yaml b/data/custodian/JP-13-KUB-L-FL.yaml index 6576c24e3c..fde47909b0 100644 --- a/data/custodian/JP-13-KUB-L-FL.yaml +++ b/data/custodian/JP-13-KUB-L-FL.yaml @@ -156,3 +156,22 @@ location: geonames_id: 1907170 feature_code: PPL normalization_timestamp: '2025-12-09T06:57:24.303317+00:00' +logo_enrichment: + enrichment_timestamp: '2025-12-25T16:48:32.252085+00:00' + source_url: https://libopac.tamabi.ac.jp/drupal + extraction_method: crawl4ai + claims: + - claim_type: favicon_url + claim_value: https://libopac.tamabi.ac.jp/opac/images/cyan/favicon.ico + source_url: https://libopac.tamabi.ac.jp/drupal + css_selector: '[document] > html > head > link:nth-of-type(9)' + retrieved_on: '2025-12-25T16:48:32.252085+00:00' + extraction_method: crawl4ai_link_rel + favicon_type: image/x-icon + favicon_sizes: '' + summary: + total_claims: 1 + has_primary_logo: false + has_favicon: true + has_og_image: false + favicon_count: 1 diff --git a/data/custodian/JP-13-KUN-L-HUCHSSL.yaml b/data/custodian/JP-13-KUN-L-HUCHSSL.yaml index ff087709d7..6b5ac0ec52 100644 --- a/data/custodian/JP-13-KUN-L-HUCHSSL.yaml +++ b/data/custodian/JP-13-KUN-L-HUCHSSL.yaml @@ -37,13 +37,14 @@ ghcid: method: CH_ANNOTATOR_SOURCE ghcid_history: - ghcid: JP-13-KUN-L-HUCHSSL - valid_from: "2025-12-10T09:44:07Z" + valid_from: '2025-12-10T09:44:07Z' valid_to: null - reason: "Corrected region code from JP-TO (abbreviation) to JP-13 (Tokyo) per ISO 3166-2:JP" + reason: Corrected region code from JP-TO (abbreviation) to JP-13 (Tokyo) per ISO + 3166-2:JP - ghcid: JP-TO-KUN-L-HUCHSSL valid_from: null - valid_to: "2025-12-10T09:44:07Z" - reason: "Previous GHCID with incorrect region code" + valid_to: '2025-12-10T09:44:07Z' + reason: Previous GHCID with incorrect region code - ghcid: JP-TO-KUN-L-HUCHSSL ghcid_numeric: 11777671282017497220 valid_from: '2025-12-06T23:38:53.385174+00:00' @@ -101,8 +102,8 @@ ch_annotator: annotation_metadata: confidence_score: 0.98 verified: false - verification_date: - verified_by: + verification_date: null + verified_by: null entity_claims: - claim_type: full_name claim_value: Hitotsubashi University, Center for Historical Social Science Literature @@ -164,7 +165,8 @@ wikidata_enrichment: wikidata_labels: en: Hitotsubashi University, Center for Historical Social Science Literature ja: 一橋大学社会科学古典資料センター - wikidata_label_en: Hitotsubashi University, Center for Historical Social Science Literature + wikidata_label_en: Hitotsubashi University, Center for Historical Social Science + Literature wikidata_label_ja: 一橋大学社会科学古典資料センター wikidata_classification: instance_of: &id004 @@ -204,3 +206,36 @@ location: geonames_id: 11611617 geonames_name: Kunitachi feature_code: PPLA2 +logo_enrichment: + enrichment_timestamp: '2025-12-25T16:48:46.891993+00:00' + source_url: http://chssl.lib.hit-u.ac.jp + extraction_method: crawl4ai + claims: + - claim_type: logo_url + claim_value: http://chssl.lib.hit-u.ac.jp/images/2020/02/logo_chssl_ja.png + source_url: http://chssl.lib.hit-u.ac.jp + css_selector: '#head-logo > a > img' + retrieved_on: '2025-12-25T16:48:46.891993+00:00' + extraction_method: crawl4ai_header_logo + detection_confidence: high + alt_text: 一橋大学社会科学古典資料センター + - claim_type: favicon_url + claim_value: http://chssl.lib.hit-u.ac.jp/images/apple-touch-icon-precomposed.png + source_url: http://chssl.lib.hit-u.ac.jp + css_selector: '[document] > html > head > link:nth-of-type(30)' + retrieved_on: '2025-12-25T16:48:46.891993+00:00' + extraction_method: crawl4ai_link_rel + favicon_type: '' + favicon_sizes: '' + - claim_type: og_image_url + claim_value: http://chssl.lib.hit-u.ac.jp/images/2020/02/topmain30.png + source_url: http://chssl.lib.hit-u.ac.jp + css_selector: '[document] > html > head > meta:nth-of-type(13)' + retrieved_on: '2025-12-25T16:48:46.891993+00:00' + extraction_method: crawl4ai_meta_og + summary: + total_claims: 3 + has_primary_logo: true + has_favicon: true + has_og_image: true + favicon_count: 2 diff --git a/data/custodian/JP-13-KUN-L-HUL.yaml b/data/custodian/JP-13-KUN-L-HUL.yaml index c632d7c511..80cd3ee711 100644 --- a/data/custodian/JP-13-KUN-L-HUL.yaml +++ b/data/custodian/JP-13-KUN-L-HUL.yaml @@ -32,13 +32,14 @@ ghcid: method: CH_ANNOTATOR_SOURCE ghcid_history: - ghcid: JP-13-KUN-L-HUL - valid_from: "2025-12-10T09:44:07Z" + valid_from: '2025-12-10T09:44:07Z' valid_to: null - reason: "Corrected region code from JP-TO (abbreviation) to JP-13 (Tokyo) per ISO 3166-2:JP" + reason: Corrected region code from JP-TO (abbreviation) to JP-13 (Tokyo) per ISO + 3166-2:JP - ghcid: JP-TO-KUN-L-HUL valid_from: null - valid_to: "2025-12-10T09:44:07Z" - reason: "Previous GHCID with incorrect region code" + valid_to: '2025-12-10T09:44:07Z' + reason: Previous GHCID with incorrect region code - ghcid: JP-TO-KUN-L-HUL ghcid_numeric: 5555965498957103888 valid_from: '2025-12-06T23:38:53.376059+00:00' @@ -96,8 +97,8 @@ ch_annotator: annotation_metadata: confidence_score: 0.98 verified: false - verification_date: - verified_by: + verification_date: null + verified_by: null entity_claims: - claim_type: full_name claim_value: Hitotsubashi University Library @@ -151,3 +152,20 @@ location: geonames_id: 11611617 geonames_name: Kunitachi feature_code: PPLA2 +logo_enrichment: + enrichment_timestamp: '2025-12-25T16:49:03.778034+00:00' + source_url: http://www.lib.hit-u.ac.jp + extraction_method: crawl4ai + claims: + - claim_type: og_image_url + claim_value: http://www.lib.hit-u.ac.jp/images/2020/02/og.png + source_url: http://www.lib.hit-u.ac.jp + css_selector: '[document] > html > head > meta:nth-of-type(13)' + retrieved_on: '2025-12-25T16:49:03.778034+00:00' + extraction_method: crawl4ai_meta_og + summary: + total_claims: 1 + has_primary_logo: false + has_favicon: false + has_og_image: true + favicon_count: 0 diff --git a/data/custodian/JP-13-KUN-L-TWSCPEL.yaml b/data/custodian/JP-13-KUN-L-TWSCPEL.yaml index 803ad592eb..801fa86ddf 100644 --- a/data/custodian/JP-13-KUN-L-TWSCPEL.yaml +++ b/data/custodian/JP-13-KUN-L-TWSCPEL.yaml @@ -37,13 +37,14 @@ ghcid: method: CH_ANNOTATOR_SOURCE ghcid_history: - ghcid: JP-13-KUN-L-TWSCPEL - valid_from: "2025-12-10T09:44:07Z" + valid_from: '2025-12-10T09:44:07Z' valid_to: null - reason: "Corrected region code from JP-TO (abbreviation) to JP-13 (Tokyo) per ISO 3166-2:JP" + reason: Corrected region code from JP-TO (abbreviation) to JP-13 (Tokyo) per ISO + 3166-2:JP - ghcid: JP-TO-KUN-L-TWSCPEL valid_from: null - valid_to: "2025-12-10T09:44:07Z" - reason: "Previous GHCID with incorrect region code" + valid_to: '2025-12-10T09:44:07Z' + reason: Previous GHCID with incorrect region code - ghcid: JP-TO-KUN-L-TWSCPEL ghcid_numeric: 606426987139968884 valid_from: '2025-12-06T23:38:55.112077+00:00' @@ -101,8 +102,8 @@ ch_annotator: annotation_metadata: confidence_score: 0.98 verified: false - verification_date: - verified_by: + verification_date: null + verified_by: null entity_claims: - claim_type: full_name claim_value: Tokyo Women's Collge of Physical Education Library @@ -204,3 +205,28 @@ location: geonames_id: 11611617 geonames_name: Kunitachi feature_code: PPLA2 +logo_enrichment: + enrichment_timestamp: '2025-12-25T16:52:08.511269+00:00' + source_url: http://www.twcpe.ac.jp/library/index.html + extraction_method: crawl4ai + claims: + - claim_type: favicon_url + claim_value: http://www.twcpe.ac.jp/common/images/favicon.ico + source_url: http://www.twcpe.ac.jp/library/index.html + css_selector: '[document] > html > head > link' + retrieved_on: '2025-12-25T16:52:08.511269+00:00' + extraction_method: crawl4ai_link_rel + favicon_type: image/x-icon + favicon_sizes: '' + - claim_type: og_image_url + claim_value: https://www.twcpe.ac.jp/common/images/og.jpg + source_url: http://www.twcpe.ac.jp/library/index.html + css_selector: '[document] > html > head > meta:nth-of-type(12)' + retrieved_on: '2025-12-25T16:52:08.511269+00:00' + extraction_method: crawl4ai_meta_og + summary: + total_claims: 2 + has_primary_logo: false + has_favicon: true + has_og_image: true + favicon_count: 1 diff --git a/data/custodian/JP-13-KUN-L-YCIL.yaml b/data/custodian/JP-13-KUN-L-YCIL.yaml index ad1c22cf6a..48e9e6df7c 100644 --- a/data/custodian/JP-13-KUN-L-YCIL.yaml +++ b/data/custodian/JP-13-KUN-L-YCIL.yaml @@ -152,3 +152,28 @@ location: geonames_id: 11611617 geonames_name: Kunitachi feature_code: PPLA2 +logo_enrichment: + enrichment_timestamp: '2025-12-25T16:52:17.071371+00:00' + source_url: http://www.yakult.co.jp + extraction_method: crawl4ai + claims: + - claim_type: favicon_url + claim_value: http://www.yakult.co.jp/common/images/favicon_a.ico + source_url: http://www.yakult.co.jp + css_selector: '[document] > html > head > link' + retrieved_on: '2025-12-25T16:52:17.071371+00:00' + extraction_method: crawl4ai_link_rel + favicon_type: '' + favicon_sizes: '' + - claim_type: og_image_url + claim_value: https://www.yakult.co.jp/common/images/ogimage.jpg + source_url: http://www.yakult.co.jp + css_selector: '[document] > html > head > meta:nth-of-type(11)' + retrieved_on: '2025-12-25T16:52:17.071371+00:00' + extraction_method: crawl4ai_meta_og + summary: + total_claims: 2 + has_primary_logo: false + has_favicon: true + has_og_image: true + favicon_count: 1 diff --git a/data/custodian/JP-13-KUN-M-KKBK.yaml b/data/custodian/JP-13-KUN-M-KKBK.yaml index bb437e8737..0bb3b7a844 100644 --- a/data/custodian/JP-13-KUN-M-KKBK.yaml +++ b/data/custodian/JP-13-KUN-M-KKBK.yaml @@ -43,13 +43,14 @@ ghcid: method: CH_ANNOTATOR_SOURCE ghcid_history: - ghcid: JP-13-KUN-M-KKBK - valid_from: "2025-12-10T09:44:07Z" + valid_from: '2025-12-10T09:44:07Z' valid_to: null - reason: "Corrected region code from JP-TO (abbreviation) to JP-13 (Tokyo) per ISO 3166-2:JP" + reason: Corrected region code from JP-TO (abbreviation) to JP-13 (Tokyo) per ISO + 3166-2:JP - ghcid: JP-TO-KUN-M-KKBK valid_from: null - valid_to: "2025-12-10T09:44:07Z" - reason: "Previous GHCID with incorrect region code" + valid_to: '2025-12-10T09:44:07Z' + reason: Previous GHCID with incorrect region code - ghcid: JP-TO-KUN-M-KKBK ghcid_numeric: 9044944443397074721 valid_from: '2025-12-06T23:38:33.701689+00:00' @@ -108,8 +109,8 @@ ch_annotator: annotation_metadata: confidence_score: 0.98 verified: false - verification_date: - verified_by: + verification_date: null + verified_by: null entity_claims: - claim_type: full_name claim_value: KUNITACHI KYODO BUNKA-KAN @@ -230,3 +231,22 @@ location: postal_code: 186-0211 street_address: YAHO, Kunitachi Shi, Tokyo To, 186-0211 normalization_timestamp: '2025-12-09T12:21:46.804118+00:00' +logo_enrichment: + enrichment_timestamp: '2025-12-25T16:52:28.651405+00:00' + source_url: https://kuzaidan.or.jp/province + extraction_method: crawl4ai + claims: + - claim_type: favicon_url + claim_value: https://kuzaidan.or.jp/province/wp-content/uploads/sites/4/2017/04/cropped-a3b94f0439e949e33b727a3227e15a57-180x180.jpg + source_url: https://kuzaidan.or.jp/province + css_selector: '[document] > html > head > link:nth-of-type(20)' + retrieved_on: '2025-12-25T16:52:28.651405+00:00' + extraction_method: crawl4ai_link_rel + favicon_type: '' + favicon_sizes: '' + summary: + total_claims: 1 + has_primary_logo: false + has_favicon: true + has_og_image: false + favicon_count: 3 diff --git a/data/custodian/JP-13-KUN-M-THAM.yaml b/data/custodian/JP-13-KUN-M-THAM.yaml index 9a12ad811c..e35607e260 100644 --- a/data/custodian/JP-13-KUN-M-THAM.yaml +++ b/data/custodian/JP-13-KUN-M-THAM.yaml @@ -32,13 +32,14 @@ ghcid: method: CH_ANNOTATOR_SOURCE ghcid_history: - ghcid: JP-13-KUN-M-THAM - valid_from: "2025-12-10T09:44:07Z" + valid_from: '2025-12-10T09:44:07Z' valid_to: null - reason: "Corrected region code from JP-TO (abbreviation) to JP-13 (Tokyo) per ISO 3166-2:JP" + reason: Corrected region code from JP-TO (abbreviation) to JP-13 (Tokyo) per ISO + 3166-2:JP - ghcid: JP-TO-KUN-M-THAM valid_from: null - valid_to: "2025-12-10T09:44:07Z" - reason: "Previous GHCID with incorrect region code" + valid_to: '2025-12-10T09:44:07Z' + reason: Previous GHCID with incorrect region code - ghcid: JP-TO-KUN-M-THAM ghcid_numeric: 356960618392281871 valid_from: '2025-12-06T23:38:33.704353+00:00' @@ -96,8 +97,8 @@ ch_annotator: annotation_metadata: confidence_score: 0.98 verified: false - verification_date: - verified_by: + verification_date: null + verified_by: null entity_claims: - claim_type: full_name claim_value: Tamashin History & Art Museum @@ -151,3 +152,22 @@ location: geonames_id: 11611617 geonames_name: Kunitachi feature_code: PPLA2 +logo_enrichment: + enrichment_timestamp: '2025-12-25T16:52:35.566704+00:00' + source_url: https://www.tamashin.or.jp + extraction_method: crawl4ai + claims: + - claim_type: favicon_url + claim_value: https://static.parastorage.com/client/pfavico.ico + source_url: https://www.tamashin.or.jp + css_selector: '[document] > html > head > link' + retrieved_on: '2025-12-25T16:52:35.566704+00:00' + extraction_method: crawl4ai_link_rel + favicon_type: image/x-icon + favicon_sizes: 192x192 + summary: + total_claims: 1 + has_primary_logo: false + has_favicon: true + has_og_image: false + favicon_count: 1 diff --git a/data/custodian/JP-13-KUR-L-K-kurayoshishinadatekominkantoshoshitsu.yaml b/data/custodian/JP-13-KUR-L-K-kurayoshishinadatekominkantoshoshitsu.yaml index 0130bd1f6f..e7b6822347 100644 --- a/data/custodian/JP-13-KUR-L-K-kurayoshishinadatekominkantoshoshitsu.yaml +++ b/data/custodian/JP-13-KUR-L-K-kurayoshishinadatekominkantoshoshitsu.yaml @@ -152,3 +152,20 @@ location: geonames_id: 1858301 geonames_name: Kurayoshi feature_code: PPLA2 +logo_enrichment: + enrichment_timestamp: '2025-12-25T16:53:05.386427+00:00' + source_url: http://konadate.blog13.fc2.com + extraction_method: crawl4ai + claims: + - claim_type: og_image_url + claim_value: https://blog-imgs-27.fc2.com/k/o/n/konadate/kou.jpg + source_url: http://konadate.blog13.fc2.com + css_selector: '[document] > html > head > meta:nth-of-type(10)' + retrieved_on: '2025-12-25T16:53:05.386427+00:00' + extraction_method: crawl4ai_meta_og + summary: + total_claims: 1 + has_primary_logo: false + has_favicon: false + has_og_image: true + favicon_count: 0 diff --git a/data/custodian/JP-13-KUR-L-K-kurobeshiritsuaimotokominkantoshoshitsu.yaml b/data/custodian/JP-13-KUR-L-K-kurobeshiritsuaimotokominkantoshoshitsu.yaml index 23616f5eff..7539939e3e 100644 --- a/data/custodian/JP-13-KUR-L-K-kurobeshiritsuaimotokominkantoshoshitsu.yaml +++ b/data/custodian/JP-13-KUR-L-K-kurobeshiritsuaimotokominkantoshoshitsu.yaml @@ -32,13 +32,14 @@ ghcid: method: CH_ANNOTATOR_SOURCE ghcid_history: - ghcid: JP-13-KUR-L-K-kurobeshiritsuaimotokominkantoshoshitsu - valid_from: "2025-12-10T09:44:07Z" + valid_from: '2025-12-10T09:44:07Z' valid_to: null - reason: "Corrected region code from JP-TO (abbreviation) to JP-13 (Tokyo) per ISO 3166-2:JP" + reason: Corrected region code from JP-TO (abbreviation) to JP-13 (Tokyo) per ISO + 3166-2:JP - ghcid: JP-TO-KUR-L-K-kurobeshiritsuaimotokominkantoshoshitsu valid_from: null - valid_to: "2025-12-10T09:44:07Z" - reason: "Previous GHCID with incorrect region code" + valid_to: '2025-12-10T09:44:07Z' + reason: Previous GHCID with incorrect region code - ghcid: JP-TO-KUR-L-K-kurobeshiritsuaimotokominkantoshoshitsu ghcid_numeric: 5592504565740289473 valid_from: '2025-12-06T23:38:49.554019+00:00' @@ -96,8 +97,8 @@ ch_annotator: annotation_metadata: confidence_score: 0.98 verified: false - verification_date: - verified_by: + verification_date: null + verified_by: null entity_claims: - claim_type: full_name claim_value: KUROBESHIRITSUAIMOTOKOMINKANTOSHOSHITSU @@ -151,3 +152,22 @@ location: geonames_id: 6822126 geonames_name: Kurobe-shi feature_code: PPLA2 +logo_enrichment: + enrichment_timestamp: '2025-12-25T16:53:45.455099+00:00' + source_url: http://www2.tkc.pref.toyama.jp/kouminkan/info/svOrgDtl.aspx?orgcd=1932&stdycd=C0000762 + extraction_method: crawl4ai + claims: + - claim_type: logo_url + claim_value: https://www.tkc.pref.toyama.jp/design/img/idx/h_logo_sp.png + source_url: http://www2.tkc.pref.toyama.jp/kouminkan/info/svOrgDtl.aspx?orgcd=1932&stdycd=C0000762 + css_selector: '#sp_header > h1.hsp_logo > a > img' + retrieved_on: '2025-12-25T16:53:45.455099+00:00' + extraction_method: crawl4ai_header_logo + detection_confidence: high + alt_text: とやま学遊ネット + summary: + total_claims: 1 + has_primary_logo: true + has_favicon: false + has_og_image: false + favicon_count: 0 diff --git a/data/custodian/JP-13-KUR-L-KCL.yaml b/data/custodian/JP-13-KUR-L-KCL.yaml index 36fc8333c7..e3338c6c05 100644 --- a/data/custodian/JP-13-KUR-L-KCL.yaml +++ b/data/custodian/JP-13-KUR-L-KCL.yaml @@ -152,3 +152,30 @@ location: geonames_id: 1858301 geonames_name: Kurayoshi feature_code: PPLA2 +logo_enrichment: + enrichment_timestamp: '2025-12-25T16:54:25.408447+00:00' + source_url: http://www.lib.city.kurayoshi.lg.jp + extraction_method: crawl4ai + claims: + - claim_type: logo_url + claim_value: http://www.lib.city.kurayoshi.lg.jp/Images/logo.png + source_url: http://www.lib.city.kurayoshi.lg.jp + css_selector: '#Header > div.contents_b > a.logo > img' + retrieved_on: '2025-12-25T16:54:25.408447+00:00' + extraction_method: crawl4ai_header_logo + detection_confidence: high + alt_text: 倉吉市 + - claim_type: favicon_url + claim_value: http://www.lib.city.kurayoshi.lg.jp/Images/lib/apple-touch-icon-180x180.png + source_url: http://www.lib.city.kurayoshi.lg.jp + css_selector: '[document] > html > head > link.png' + retrieved_on: '2025-12-25T16:54:25.408447+00:00' + extraction_method: crawl4ai_link_rel + favicon_type: image/png + favicon_sizes: '' + summary: + total_claims: 2 + has_primary_logo: true + has_favicon: true + has_og_image: false + favicon_count: 4 diff --git a/data/custodian/JP-13-KUR-L-KL.yaml b/data/custodian/JP-13-KUR-L-KL.yaml index 0dea196ee7..526c457f17 100644 --- a/data/custodian/JP-13-KUR-L-KL.yaml +++ b/data/custodian/JP-13-KUR-L-KL.yaml @@ -32,13 +32,14 @@ ghcid: method: CH_ANNOTATOR_SOURCE ghcid_history: - ghcid: JP-13-KUR-L-KL - valid_from: "2025-12-10T09:44:07Z" + valid_from: '2025-12-10T09:44:07Z' valid_to: null - reason: "Corrected region code from JP-TO (abbreviation) to JP-13 (Tokyo) per ISO 3166-2:JP" + reason: Corrected region code from JP-TO (abbreviation) to JP-13 (Tokyo) per ISO + 3166-2:JP - ghcid: JP-TO-KUR-L-KL valid_from: null - valid_to: "2025-12-10T09:44:07Z" - reason: "Previous GHCID with incorrect region code" + valid_to: '2025-12-10T09:44:07Z' + reason: Previous GHCID with incorrect region code - ghcid: JP-TO-KUR-L-KL ghcid_numeric: 10208366457471433597 valid_from: '2025-12-06T23:38:46.742819+00:00' @@ -96,8 +97,8 @@ ch_annotator: annotation_metadata: confidence_score: 0.98 verified: false - verification_date: - verified_by: + verification_date: null + verified_by: null entity_claims: - claim_type: full_name claim_value: KURAYOSHISHIRITSUSEKIGANE Library @@ -151,3 +152,30 @@ location: geonames_id: 1858301 geonames_name: Kurayoshi feature_code: PPLA2 +logo_enrichment: + enrichment_timestamp: '2025-12-25T16:54:33.190407+00:00' + source_url: http://www.lib.city.kurayoshi.lg.jp + extraction_method: crawl4ai + claims: + - claim_type: logo_url + claim_value: http://www.lib.city.kurayoshi.lg.jp/Images/logo.png + source_url: http://www.lib.city.kurayoshi.lg.jp + css_selector: '#Header > div.contents_b > a.logo > img' + retrieved_on: '2025-12-25T16:54:33.190407+00:00' + extraction_method: crawl4ai_header_logo + detection_confidence: high + alt_text: 倉吉市 + - claim_type: favicon_url + claim_value: http://www.lib.city.kurayoshi.lg.jp/Images/lib/apple-touch-icon-180x180.png + source_url: http://www.lib.city.kurayoshi.lg.jp + css_selector: '[document] > html > head > link.png' + retrieved_on: '2025-12-25T16:54:33.190407+00:00' + extraction_method: crawl4ai_link_rel + favicon_type: image/png + favicon_sizes: '' + summary: + total_claims: 2 + has_primary_logo: true + has_favicon: true + has_og_image: false + favicon_count: 4 diff --git a/data/custodian/JP-13-KUR-L-TTL.yaml b/data/custodian/JP-13-KUR-L-TTL.yaml index 5b37d5ccdd..34bef0bf78 100644 --- a/data/custodian/JP-13-KUR-L-TTL.yaml +++ b/data/custodian/JP-13-KUR-L-TTL.yaml @@ -37,13 +37,14 @@ ghcid: method: CH_ANNOTATOR_SOURCE ghcid_history: - ghcid: JP-13-KUR-L-TTL - valid_from: "2025-12-10T09:44:07Z" + valid_from: '2025-12-10T09:44:07Z' valid_to: null - reason: "Corrected region code from JP-TO (abbreviation) to JP-13 (Tokyo) per ISO 3166-2:JP" + reason: Corrected region code from JP-TO (abbreviation) to JP-13 (Tokyo) per ISO + 3166-2:JP - ghcid: JP-TO-KUR-L-TTL valid_from: null - valid_to: "2025-12-10T09:44:07Z" - reason: "Previous GHCID with incorrect region code" + valid_to: '2025-12-10T09:44:07Z' + reason: Previous GHCID with incorrect region code - ghcid: JP-TO-KUR-L-TTL ghcid_numeric: 8978184988403278919 valid_from: '2025-12-06T23:38:57.258214+00:00' @@ -101,8 +102,8 @@ ch_annotator: annotation_metadata: confidence_score: 0.98 verified: false - verification_date: - verified_by: + verification_date: null + verified_by: null entity_claims: - claim_type: full_name claim_value: TOTTORIKANGODAIGAKU・TOTTORITANKIDAIGAKUFUZOKU Library @@ -196,7 +197,8 @@ wikidata_enrichment: description: organisatie uit Japan - id: Q56056912 label: Japan Consortium for Open Access Repository - description: promotes open access and open science in Japan with knowledge dissemination via digital repositories + description: promotes open access and open science in Japan with knowledge dissemination + via digital repositories wikidata_web: official_website: http://www.cygnus.ac.jp/campuslife/library.html wikidata_official_website: http://www.cygnus.ac.jp/campuslife/library.html @@ -218,3 +220,22 @@ location: geonames_id: 1858301 geonames_name: Kurayoshi feature_code: PPLA2 +logo_enrichment: + enrichment_timestamp: '2025-12-25T16:54:50.487158+00:00' + source_url: http://www.cygnus.ac.jp/campuslife/library.html + extraction_method: crawl4ai + claims: + - claim_type: logo_url + claim_value: http://www.cygnus.ac.jp/campuslife/img/logo.png + source_url: http://www.cygnus.ac.jp/campuslife/library.html + css_selector: '#mobile-head > h2.logo > a > img' + retrieved_on: '2025-12-25T16:54:50.487158+00:00' + extraction_method: crawl4ai_header_logo + detection_confidence: high + alt_text: 鳥取短期大学 + summary: + total_claims: 1 + has_primary_logo: true + has_favicon: false + has_og_image: false + favicon_count: 0 diff --git a/data/custodian/JP-13-KUR-M-KCAM.yaml b/data/custodian/JP-13-KUR-M-KCAM.yaml index ef5060d886..f4bb596d5b 100644 --- a/data/custodian/JP-13-KUR-M-KCAM.yaml +++ b/data/custodian/JP-13-KUR-M-KCAM.yaml @@ -41,13 +41,14 @@ ghcid: method: CH_ANNOTATOR_SOURCE ghcid_history: - ghcid: JP-13-KUR-M-KCAM - valid_from: "2025-12-10T09:44:07Z" + valid_from: '2025-12-10T09:44:07Z' valid_to: null - reason: "Corrected region code from JP-TO (abbreviation) to JP-13 (Tokyo) per ISO 3166-2:JP" + reason: Corrected region code from JP-TO (abbreviation) to JP-13 (Tokyo) per ISO + 3166-2:JP - ghcid: JP-TO-KUR-M-KCAM valid_from: null - valid_to: "2025-12-10T09:44:07Z" - reason: "Previous GHCID with incorrect region code" + valid_to: '2025-12-10T09:44:07Z' + reason: Previous GHCID with incorrect region code - ghcid: JP-TO-KUR-M-KCAM ghcid_numeric: 5891380175074781886 valid_from: '2025-12-06T23:38:34.709637+00:00' @@ -106,8 +107,8 @@ ch_annotator: annotation_metadata: confidence_score: 0.98 verified: false - verification_date: - verified_by: + verification_date: null + verified_by: null entity_claims: - claim_type: full_name claim_value: Kurobe City Art Museum @@ -191,7 +192,8 @@ wikidata_enrichment: instance_of: &id005 - id: Q207694 label: art museum - description: building or space for the exhibition of art (for institution, use Q3196771) + description: building or space for the exhibition of art (for institution, use + Q3196771) wikidata_instance_of: *id005 wikidata_location: country: &id006 @@ -225,3 +227,30 @@ location: geonames_id: 6822126 geonames_name: Kurobe-shi feature_code: PPLA2 +logo_enrichment: + enrichment_timestamp: '2025-12-25T16:54:58.401296+00:00' + source_url: https://www.city.kurobe.toyama.jp/category/page.aspx?servno=79 + extraction_method: crawl4ai + claims: + - claim_type: logo_url + claim_value: https://www.city.kurobe.toyama.jp/designs/common/image/logo_header.png + source_url: https://www.city.kurobe.toyama.jp/category/page.aspx?servno=79 + css_selector: '[document] > html > body > header.rs_skip > div > p > a > img' + retrieved_on: '2025-12-25T16:54:58.401296+00:00' + extraction_method: crawl4ai_header_logo + detection_confidence: high + alt_text: 黒部市 + - claim_type: favicon_url + claim_value: https://www.city.kurobe.toyama.jp/favicon.ico + source_url: https://www.city.kurobe.toyama.jp/category/page.aspx?servno=79 + css_selector: '[document] > html > head > link' + retrieved_on: '2025-12-25T16:54:58.401296+00:00' + extraction_method: crawl4ai_link_rel + favicon_type: '' + favicon_sizes: '' + summary: + total_claims: 2 + has_primary_logo: true + has_favicon: true + has_og_image: false + favicon_count: 1 diff --git a/data/custodian/JP-13-KUR-M-KMEP.yaml b/data/custodian/JP-13-KUR-M-KMEP.yaml index a607e64c57..daad36d91b 100644 --- a/data/custodian/JP-13-KUR-M-KMEP.yaml +++ b/data/custodian/JP-13-KUR-M-KMEP.yaml @@ -37,13 +37,14 @@ ghcid: method: CH_ANNOTATOR_SOURCE ghcid_history: - ghcid: JP-13-KUR-M-KMEP - valid_from: "2025-12-10T09:44:07Z" + valid_from: '2025-12-10T09:44:07Z' valid_to: null - reason: "Corrected region code from JP-TO (abbreviation) to JP-13 (Tokyo) per ISO 3166-2:JP" + reason: Corrected region code from JP-TO (abbreviation) to JP-13 (Tokyo) per ISO + 3166-2:JP - ghcid: JP-TO-KUR-M-KMEP valid_from: null - valid_to: "2025-12-10T09:44:07Z" - reason: "Previous GHCID with incorrect region code" + valid_to: '2025-12-10T09:44:07Z' + reason: Previous GHCID with incorrect region code - ghcid: JP-TO-KUR-M-KMEP ghcid_numeric: 5786834610834661614 valid_from: '2025-12-06T23:38:34.716985+00:00' @@ -101,8 +102,8 @@ ch_annotator: annotation_metadata: confidence_score: 0.98 verified: false - verification_date: - verified_by: + verification_date: null + verified_by: null entity_claims: - claim_type: full_name claim_value: KUROBE MUSEUM OF ELECTRIC POWER @@ -175,8 +176,8 @@ wikidata_enrichment: instance_of: &id004 - id: Q33506 label: museum - description: institution that holds artifacts and other objects of scientific, artistic, cultural, historical, or other - importance + description: institution that holds artifacts and other objects of scientific, + artistic, cultural, historical, or other importance wikidata_instance_of: *id004 wikidata_location: located_in_admin_entity: &id006 @@ -213,3 +214,28 @@ location: geonames_id: 6822126 geonames_name: Kurobe-shi feature_code: PPLA2 +logo_enrichment: + enrichment_timestamp: '2025-12-25T16:55:11.019600+00:00' + source_url: https://www.kepco.co.jp/sp/corporate/profile/community/pr/kurobe/index.html + extraction_method: crawl4ai + claims: + - claim_type: favicon_url + claim_value: https://www.kepco.co.jp/share/images/apple-touch-icon.png + source_url: https://www.kepco.co.jp/sp/corporate/profile/community/pr/kurobe/index.html + css_selector: '[document] > html > head > link:nth-of-type(3)' + retrieved_on: '2025-12-25T16:55:11.019600+00:00' + extraction_method: crawl4ai_link_rel + favicon_type: '' + favicon_sizes: '' + - claim_type: og_image_url + claim_value: https://www.kepco.co.jp/sp/asset/image/common/ogp.png + source_url: https://www.kepco.co.jp/sp/corporate/profile/community/pr/kurobe/index.html + css_selector: '[document] > html > head > meta:nth-of-type(6)' + retrieved_on: '2025-12-25T16:55:11.019600+00:00' + extraction_method: crawl4ai_meta_og + summary: + total_claims: 2 + has_primary_logo: false + has_favicon: true + has_og_image: true + favicon_count: 2 diff --git a/data/custodian/JP-13-KUR-M-KYSM.yaml b/data/custodian/JP-13-KUR-M-KYSM.yaml index 527d7a46f7..1e11d3d063 100644 --- a/data/custodian/JP-13-KUR-M-KYSM.yaml +++ b/data/custodian/JP-13-KUR-M-KYSM.yaml @@ -43,13 +43,14 @@ ghcid: method: CH_ANNOTATOR_SOURCE ghcid_history: - ghcid: JP-13-KUR-M-KYSM - valid_from: "2025-12-10T09:44:07Z" + valid_from: '2025-12-10T09:44:07Z' valid_to: null - reason: "Corrected region code from JP-TO (abbreviation) to JP-13 (Tokyo) per ISO 3166-2:JP" + reason: Corrected region code from JP-TO (abbreviation) to JP-13 (Tokyo) per ISO + 3166-2:JP - ghcid: JP-TO-KUR-M-KYSM valid_from: null - valid_to: "2025-12-10T09:44:07Z" - reason: "Previous GHCID with incorrect region code" + valid_to: '2025-12-10T09:44:07Z' + reason: Previous GHCID with incorrect region code - ghcid: JP-TO-KUR-M-KYSM ghcid_numeric: 7483705505883212063 valid_from: '2025-12-06T23:38:34.706936+00:00' @@ -108,8 +109,8 @@ ch_annotator: annotation_metadata: confidence_score: 0.98 verified: false - verification_date: - verified_by: + verification_date: null + verified_by: null entity_claims: - claim_type: full_name claim_value: KUROBE YOSHIDA SCIENCE MUSEUM @@ -242,3 +243,22 @@ location: postal_code: 938-0005 street_address: YOSHIDA, Kurobe Shi, Toyama Ken, 938-0005 normalization_timestamp: '2025-12-09T12:21:49.474173+00:00' +logo_enrichment: + enrichment_timestamp: '2025-12-25T16:56:03.242111+00:00' + source_url: http://kysm.or.jp + extraction_method: crawl4ai + claims: + - claim_type: favicon_url + claim_value: https://kysm.or.jp/renewal/wp-content/uploads/2022/04/cropped-kysm_logo-180x180.png + source_url: http://kysm.or.jp + css_selector: '[document] > html > head > link:nth-of-type(22)' + retrieved_on: '2025-12-25T16:56:03.242111+00:00' + extraction_method: crawl4ai_link_rel + favicon_type: '' + favicon_sizes: '' + summary: + total_claims: 1 + has_primary_logo: false + has_favicon: true + has_og_image: false + favicon_count: 3 diff --git a/data/custodian/JP-13-KUR-M-SMA.yaml b/data/custodian/JP-13-KUR-M-SMA.yaml index 070e0d8e66..dfca6620f9 100644 --- a/data/custodian/JP-13-KUR-M-SMA.yaml +++ b/data/custodian/JP-13-KUR-M-SMA.yaml @@ -32,13 +32,14 @@ ghcid: method: CH_ANNOTATOR_SOURCE ghcid_history: - ghcid: JP-13-KUR-M-SMA - valid_from: "2025-12-10T09:44:07Z" + valid_from: '2025-12-10T09:44:07Z' valid_to: null - reason: "Corrected region code from JP-TO (abbreviation) to JP-13 (Tokyo) per ISO 3166-2:JP" + reason: Corrected region code from JP-TO (abbreviation) to JP-13 (Tokyo) per ISO + 3166-2:JP - ghcid: JP-TO-KUR-M-SMA valid_from: null - valid_to: "2025-12-10T09:44:07Z" - reason: "Previous GHCID with incorrect region code" + valid_to: '2025-12-10T09:44:07Z' + reason: Previous GHCID with incorrect region code - ghcid: JP-TO-KUR-M-SMA ghcid_numeric: 14036797914060583087 valid_from: '2025-12-06T23:38:34.714610+00:00' @@ -96,8 +97,8 @@ ch_annotator: annotation_metadata: confidence_score: 0.98 verified: false - verification_date: - verified_by: + verification_date: null + verified_by: null entity_claims: - claim_type: full_name claim_value: SELENE MUSEUM OF ART @@ -151,3 +152,23 @@ location: geonames_id: 6822126 geonames_name: Kurobe-shi feature_code: PPLA2 +logo_enrichment: + enrichment_timestamp: '2025-12-25T16:56:10.481679+00:00' + source_url: https://www.unazuki-selene.com + extraction_method: crawl4ai + claims: + - claim_type: logo_url + claim_value: https://www.unazuki-selene.com/common/img/gl/logo.png + source_url: https://www.unazuki-selene.com + css_selector: '#top-head > div.header1 > div.row.sm_full > h1.col.span_2 > a > + img' + retrieved_on: '2025-12-25T16:56:10.481679+00:00' + extraction_method: crawl4ai_header_logo + detection_confidence: high + alt_text: 黒部市芸術創造センター セレネ + summary: + total_claims: 1 + has_primary_logo: true + has_favicon: false + has_og_image: false + favicon_count: 0 diff --git a/data/custodian/JP-13-KUR-M-TNPM.yaml b/data/custodian/JP-13-KUR-M-TNPM.yaml index f1ac84feb9..24a567c67f 100644 --- a/data/custodian/JP-13-KUR-M-TNPM.yaml +++ b/data/custodian/JP-13-KUR-M-TNPM.yaml @@ -32,13 +32,14 @@ ghcid: method: CH_ANNOTATOR_SOURCE ghcid_history: - ghcid: JP-13-KUR-M-TNPM - valid_from: "2025-12-10T09:44:07Z" + valid_from: '2025-12-10T09:44:07Z' valid_to: null - reason: "Corrected region code from JP-TO (abbreviation) to JP-13 (Tokyo) per ISO 3166-2:JP" + reason: Corrected region code from JP-TO (abbreviation) to JP-13 (Tokyo) per ISO + 3166-2:JP - ghcid: JP-TO-KUR-M-TNPM valid_from: null - valid_to: "2025-12-10T09:44:07Z" - reason: "Previous GHCID with incorrect region code" + valid_to: '2025-12-10T09:44:07Z' + reason: Previous GHCID with incorrect region code - ghcid: JP-TO-KUR-M-TNPM ghcid_numeric: 8910617504386908611 valid_from: '2025-12-06T23:38:38.427758+00:00' @@ -96,8 +97,8 @@ ch_annotator: annotation_metadata: confidence_score: 0.98 verified: false - verification_date: - verified_by: + verification_date: null + verified_by: null entity_claims: - claim_type: full_name claim_value: Tottori Nijisseiki Pear Museum @@ -151,3 +152,28 @@ location: geonames_id: 1858301 geonames_name: Kurayoshi feature_code: PPLA2 +logo_enrichment: + enrichment_timestamp: '2025-12-25T16:56:27.077681+00:00' + source_url: http://1174.sanin.jp + extraction_method: crawl4ai + claims: + - claim_type: favicon_url + claim_value: http://1174.sanin.jp/user/common/img/i_icon.png?2024 + source_url: http://1174.sanin.jp + css_selector: '[document] > html > head > link' + retrieved_on: '2025-12-25T16:56:27.077681+00:00' + extraction_method: crawl4ai_link_rel + favicon_type: '' + favicon_sizes: '' + - claim_type: og_image_url + claim_value: http://1174.sanin.jp/user/common/img/ogp.png + source_url: http://1174.sanin.jp + css_selector: '[document] > html > head > meta:nth-of-type(10)' + retrieved_on: '2025-12-25T16:56:27.077681+00:00' + extraction_method: crawl4ai_meta_og + summary: + total_claims: 2 + has_primary_logo: false + has_favicon: true + has_og_image: true + favicon_count: 2 diff --git a/data/custodian/JP-13-MAC-L-FCCEL.yaml b/data/custodian/JP-13-MAC-L-FCCEL.yaml index a7d9a410e3..56a384b735 100644 --- a/data/custodian/JP-13-MAC-L-FCCEL.yaml +++ b/data/custodian/JP-13-MAC-L-FCCEL.yaml @@ -37,13 +37,14 @@ ghcid: method: CH_ANNOTATOR_SOURCE ghcid_history: - ghcid: JP-13-MAC-L-FCCEL - valid_from: "2025-12-10T09:44:07Z" + valid_from: '2025-12-10T09:44:07Z' valid_to: null - reason: "Corrected region code from JP-TO (abbreviation) to JP-13 (Tokyo) per ISO 3166-2:JP" + reason: Corrected region code from JP-TO (abbreviation) to JP-13 (Tokyo) per ISO + 3166-2:JP - ghcid: JP-TO-MAC-L-FCCEL valid_from: null - valid_to: "2025-12-10T09:44:07Z" - reason: "Previous GHCID with incorrect region code" + valid_to: '2025-12-10T09:44:07Z' + reason: Previous GHCID with incorrect region code - ghcid: JP-TO-MAC-L-FCCEL ghcid_numeric: 12730283548252790485 valid_from: '2025-12-06T23:38:57.048815+00:00' @@ -101,8 +102,8 @@ ch_annotator: annotation_metadata: confidence_score: 0.98 verified: false - verification_date: - verified_by: + verification_date: null + verified_by: null entity_claims: - claim_type: full_name claim_value: Felicia College of Childhood Education Library @@ -204,3 +205,22 @@ location: geonames_id: 1857871 geonames_name: Machida feature_code: PPLA2 +logo_enrichment: + enrichment_timestamp: '2025-12-25T16:56:37.974077+00:00' + source_url: https://felicia-lib.meisen.ac.jp + extraction_method: crawl4ai + claims: + - claim_type: favicon_url + claim_value: https://felicia-lib.meisen.ac.jp/favicon.ico + source_url: https://felicia-lib.meisen.ac.jp + css_selector: '[document] > html > head > link' + retrieved_on: '2025-12-25T16:56:37.974077+00:00' + extraction_method: crawl4ai_link_rel + favicon_type: '' + favicon_sizes: '' + summary: + total_claims: 1 + has_primary_logo: false + has_favicon: true + has_og_image: false + favicon_count: 1 diff --git a/data/custodian/JP-13-MAC-L-JFOUL.yaml b/data/custodian/JP-13-MAC-L-JFOUL.yaml index a94161f6d9..a34b93f1a4 100644 --- a/data/custodian/JP-13-MAC-L-JFOUL.yaml +++ b/data/custodian/JP-13-MAC-L-JFOUL.yaml @@ -37,13 +37,14 @@ ghcid: method: CH_ANNOTATOR_SOURCE ghcid_history: - ghcid: JP-13-MAC-L-JFOUL - valid_from: "2025-12-10T09:44:07Z" + valid_from: '2025-12-10T09:44:07Z' valid_to: null - reason: "Corrected region code from JP-TO (abbreviation) to JP-13 (Tokyo) per ISO 3166-2:JP" + reason: Corrected region code from JP-TO (abbreviation) to JP-13 (Tokyo) per ISO + 3166-2:JP - ghcid: JP-TO-MAC-L-JFOUL valid_from: null - valid_to: "2025-12-10T09:44:07Z" - reason: "Previous GHCID with incorrect region code" + valid_to: '2025-12-10T09:44:07Z' + reason: Previous GHCID with incorrect region code - ghcid: JP-TO-MAC-L-JFOUL ghcid_numeric: 10666475541397885874 valid_from: '2025-12-06T23:38:54.833473+00:00' @@ -101,8 +102,8 @@ ch_annotator: annotation_metadata: confidence_score: 0.98 verified: false - verification_date: - verified_by: + verification_date: null + verified_by: null entity_claims: - claim_type: full_name claim_value: J. F. Oberlin University Library @@ -209,3 +210,20 @@ location: geonames_id: 1857871 geonames_name: Machida feature_code: PPLA2 +logo_enrichment: + enrichment_timestamp: '2025-12-25T16:57:47.302206+00:00' + source_url: http://www.obirin.ac.jp/library + extraction_method: crawl4ai + claims: + - claim_type: og_image_url + claim_value: http://www.obirin.ac.jp/common/img/base/ogp_image.png + source_url: http://www.obirin.ac.jp/library + css_selector: '#pagetop > meta:nth-of-type(8)' + retrieved_on: '2025-12-25T16:57:47.302206+00:00' + extraction_method: crawl4ai_meta_og + summary: + total_claims: 1 + has_primary_logo: false + has_favicon: false + has_og_image: true + favicon_count: 0 diff --git a/data/custodian/JP-13-MAC-L-KLJ.yaml b/data/custodian/JP-13-MAC-L-KLJ.yaml index 6706b8170c..b572bf4c54 100644 --- a/data/custodian/JP-13-MAC-L-KLJ.yaml +++ b/data/custodian/JP-13-MAC-L-KLJ.yaml @@ -37,13 +37,14 @@ ghcid: method: CH_ANNOTATOR_SOURCE ghcid_history: - ghcid: JP-13-MAC-L-KLJ - valid_from: "2025-12-10T09:44:07Z" + valid_from: '2025-12-10T09:44:07Z' valid_to: null - reason: "Corrected region code from JP-TO (abbreviation) to JP-13 (Tokyo) per ISO 3166-2:JP" + reason: Corrected region code from JP-TO (abbreviation) to JP-13 (Tokyo) per ISO + 3166-2:JP - ghcid: JP-TO-MAC-L-KLJ valid_from: null - valid_to: "2025-12-10T09:44:07Z" - reason: "Previous GHCID with incorrect region code" + valid_to: '2025-12-10T09:44:07Z' + reason: Previous GHCID with incorrect region code - ghcid: JP-TO-MAC-L-KLJ ghcid_numeric: 9766509380386633357 valid_from: '2025-12-06T23:38:54.894094+00:00' @@ -101,8 +102,8 @@ ch_annotator: annotation_metadata: confidence_score: 0.98 verified: false - verification_date: - verified_by: + verification_date: null + verified_by: null entity_claims: - claim_type: full_name claim_value: KOKUSHIKANDAIGAKUTSURUKAWA Library ・JOHOMEDEIASENTA @@ -204,3 +205,28 @@ location: geonames_id: 1857871 geonames_name: Machida feature_code: PPLA2 +logo_enrichment: + enrichment_timestamp: '2025-12-25T16:57:55.605789+00:00' + source_url: https://www.kokushikan.ac.jp/education/library + extraction_method: crawl4ai + claims: + - claim_type: favicon_url + claim_value: https://www.kokushikan.ac.jp/favicon.ico + source_url: https://www.kokushikan.ac.jp/education/library + css_selector: '[document] > html.is-scroll.is-loaded > head > link:nth-of-type(2)' + retrieved_on: '2025-12-25T16:57:55.605789+00:00' + extraction_method: crawl4ai_link_rel + favicon_type: '' + favicon_sizes: '' + - claim_type: og_image_url + claim_value: https://www.kokushikan.ac.jp/assets/img/common/ogp_image.jpg + source_url: https://www.kokushikan.ac.jp/education/library + css_selector: '[document] > html.is-scroll.is-loaded > head > meta:nth-of-type(8)' + retrieved_on: '2025-12-25T16:57:55.605789+00:00' + extraction_method: crawl4ai_meta_og + summary: + total_claims: 2 + has_primary_logo: false + has_favicon: true + has_og_image: true + favicon_count: 1 diff --git a/data/custodian/JP-13-MAC-L-SL.yaml b/data/custodian/JP-13-MAC-L-SL.yaml index 8de099b52f..429d27df3b 100644 --- a/data/custodian/JP-13-MAC-L-SL.yaml +++ b/data/custodian/JP-13-MAC-L-SL.yaml @@ -32,13 +32,14 @@ ghcid: method: CH_ANNOTATOR_SOURCE ghcid_history: - ghcid: JP-13-MAC-L-SL - valid_from: "2025-12-10T09:44:07Z" + valid_from: '2025-12-10T09:44:07Z' valid_to: null - reason: "Corrected region code from JP-TO (abbreviation) to JP-13 (Tokyo) per ISO 3166-2:JP" + reason: Corrected region code from JP-TO (abbreviation) to JP-13 (Tokyo) per ISO + 3166-2:JP - ghcid: JP-TO-MAC-L-SL valid_from: null - valid_to: "2025-12-10T09:44:07Z" - reason: "Previous GHCID with incorrect region code" + valid_to: '2025-12-10T09:44:07Z' + reason: Previous GHCID with incorrect region code - ghcid: JP-TO-MAC-L-SL ghcid_numeric: 12468673775835405641 valid_from: '2025-12-06T23:38:57.514823+00:00' @@ -96,8 +97,8 @@ ch_annotator: annotation_metadata: confidence_score: 0.98 verified: false - verification_date: - verified_by: + verification_date: null + verified_by: null entity_claims: - claim_type: full_name claim_value: SAREJIOKOGYOKOTOSEMMONGAKKO Library @@ -151,3 +152,22 @@ location: geonames_id: 1857871 geonames_name: Machida feature_code: PPLA2 +logo_enrichment: + enrichment_timestamp: '2025-12-25T17:18:28.165685+00:00' + source_url: https://opac.salesio-sp.ac.jp + extraction_method: crawl4ai + claims: + - claim_type: favicon_url + claim_value: https://opac.salesio-sp.ac.jp/favicon.ico + source_url: https://opac.salesio-sp.ac.jp + css_selector: '[document] > html > head > link' + retrieved_on: '2025-12-25T17:18:28.165685+00:00' + extraction_method: crawl4ai_link_rel + favicon_type: '' + favicon_sizes: '' + summary: + total_claims: 1 + has_primary_logo: false + has_favicon: true + has_og_image: false + favicon_count: 1 diff --git a/data/custodian/JP-13-MAC-L-TKGULOML.yaml b/data/custodian/JP-13-MAC-L-TKGULOML.yaml index c5121eae1e..df11749307 100644 --- a/data/custodian/JP-13-MAC-L-TKGULOML.yaml +++ b/data/custodian/JP-13-MAC-L-TKGULOML.yaml @@ -37,13 +37,14 @@ ghcid: method: CH_ANNOTATOR_SOURCE ghcid_history: - ghcid: JP-13-MAC-L-TKGULOML - valid_from: "2025-12-10T09:44:07Z" + valid_from: '2025-12-10T09:44:07Z' valid_to: null - reason: "Corrected region code from JP-TO (abbreviation) to JP-13 (Tokyo) per ISO 3166-2:JP" + reason: Corrected region code from JP-TO (abbreviation) to JP-13 (Tokyo) per ISO + 3166-2:JP - ghcid: JP-TO-MAC-L-TKGULOML valid_from: null - valid_to: "2025-12-10T09:44:07Z" - reason: "Previous GHCID with incorrect region code" + valid_to: '2025-12-10T09:44:07Z' + reason: Previous GHCID with incorrect region code - ghcid: JP-TO-MAC-L-TKGULOML ghcid_numeric: 3710699386022016657 valid_from: '2025-12-06T23:38:55.082909+00:00' @@ -101,8 +102,8 @@ ch_annotator: annotation_metadata: confidence_score: 0.98 verified: false - verification_date: - verified_by: + verification_date: null + verified_by: null entity_claims: - claim_type: full_name claim_value: Tokyo Kasei Gakuin University Library, Oe Memorial Library @@ -209,3 +210,23 @@ location: geonames_id: 1857871 geonames_name: Machida feature_code: PPLA2 +logo_enrichment: + enrichment_timestamp: '2025-12-25T17:18:51.988068+00:00' + source_url: http://www.kasei-gakuin.ac.jp/library/lib-top.htm + extraction_method: crawl4ai + claims: + - claim_type: favicon_url + claim_value: https://www.kasei-gakuin.ac.jp/tkgu_cms/wp-content/uploads/2022/04/cropped-favicon-512x512-1-180x180.png + source_url: http://www.kasei-gakuin.ac.jp/library/lib-top.htm + css_selector: '[document] > html.fontawesome-i2svg-active.fontawesome-i2svg-complete + > head > link:nth-of-type(30)' + retrieved_on: '2025-12-25T17:18:51.988068+00:00' + extraction_method: crawl4ai_link_rel + favicon_type: '' + favicon_sizes: '' + summary: + total_claims: 1 + has_primary_logo: false + has_favicon: true + has_og_image: false + favicon_count: 3 diff --git a/data/custodian/JP-13-MAC-L-WUUMLIC.yaml b/data/custodian/JP-13-MAC-L-WUUMLIC.yaml index 327925a975..2f9d3674c2 100644 --- a/data/custodian/JP-13-MAC-L-WUUMLIC.yaml +++ b/data/custodian/JP-13-MAC-L-WUUMLIC.yaml @@ -37,13 +37,14 @@ ghcid: method: CH_ANNOTATOR_SOURCE ghcid_history: - ghcid: JP-13-MAC-L-WUUMLIC - valid_from: "2025-12-10T09:44:07Z" + valid_from: '2025-12-10T09:44:07Z' valid_to: null - reason: "Corrected region code from JP-TO (abbreviation) to JP-13 (Tokyo) per ISO 3166-2:JP" + reason: Corrected region code from JP-TO (abbreviation) to JP-13 (Tokyo) per ISO + 3166-2:JP - ghcid: JP-TO-MAC-L-WUUMLIC valid_from: null - valid_to: "2025-12-10T09:44:07Z" - reason: "Previous GHCID with incorrect region code" + valid_to: '2025-12-10T09:44:07Z' + reason: Previous GHCID with incorrect region code - ghcid: JP-TO-MAC-L-WUUMLIC ghcid_numeric: 4450854994508355883 valid_from: '2025-12-06T23:38:55.325862+00:00' @@ -101,8 +102,8 @@ ch_annotator: annotation_metadata: confidence_score: 0.98 verified: false - verification_date: - verified_by: + verification_date: null + verified_by: null entity_claims: - claim_type: full_name claim_value: Wako University Umene Memorial Library & IT Center @@ -196,7 +197,8 @@ wikidata_enrichment: description: organisatie uit Japan - id: Q56056912 label: Japan Consortium for Open Access Repository - description: promotes open access and open science in Japan with knowledge dissemination via digital repositories + description: promotes open access and open science in Japan with knowledge dissemination + via digital repositories wikidata_web: official_website: http://www.wako.ac.jp/library/ wikidata_official_website: http://www.wako.ac.jp/library/ @@ -218,3 +220,22 @@ location: geonames_id: 1857871 geonames_name: Machida feature_code: PPLA2 +logo_enrichment: + enrichment_timestamp: '2025-12-25T17:19:08.848541+00:00' + source_url: http://www.wako.ac.jp/library + extraction_method: crawl4ai + claims: + - claim_type: favicon_url + claim_value: http://www.wako.ac.jp/assets/favicon.ico + source_url: http://www.wako.ac.jp/library + css_selector: '[document] > html > head > link:nth-of-type(4)' + retrieved_on: '2025-12-25T17:19:08.848541+00:00' + extraction_method: crawl4ai_link_rel + favicon_type: '' + favicon_sizes: '' + summary: + total_claims: 1 + has_primary_logo: false + has_favicon: true + has_og_image: false + favicon_count: 1 diff --git a/data/custodian/JP-13-MAC-M-JMIMC.yaml b/data/custodian/JP-13-MAC-M-JMIMC.yaml index c3a0c16350..c62518eb8e 100644 --- a/data/custodian/JP-13-MAC-M-JMIMC.yaml +++ b/data/custodian/JP-13-MAC-M-JMIMC.yaml @@ -39,13 +39,14 @@ ghcid: method: CH_ANNOTATOR_SOURCE ghcid_history: - ghcid: JP-13-MAC-M-JMIMC - valid_from: "2025-12-10T09:44:07Z" + valid_from: '2025-12-10T09:44:07Z' valid_to: null - reason: "Corrected region code from JP-TO (abbreviation) to JP-13 (Tokyo) per ISO 3166-2:JP" + reason: Corrected region code from JP-TO (abbreviation) to JP-13 (Tokyo) per ISO + 3166-2:JP - ghcid: JP-TO-MAC-M-JMIMC valid_from: null - valid_to: "2025-12-10T09:44:07Z" - reason: "Previous GHCID with incorrect region code" + valid_to: '2025-12-10T09:44:07Z' + reason: Previous GHCID with incorrect region code - ghcid: JP-TO-MAC-M-JMIMC ghcid_numeric: 9094240802715911478 valid_from: '2025-12-06T23:38:33.649823+00:00' @@ -103,8 +104,8 @@ ch_annotator: annotation_metadata: confidence_score: 0.98 verified: false - verification_date: - verified_by: + verification_date: null + verified_by: null entity_claims: - claim_type: full_name claim_value: JIYU MINKEN INSTITUTE OF MACHIDA CITY @@ -193,8 +194,8 @@ wikidata_enrichment: instance_of: &id004 - id: Q33506 label: museum - description: institution that holds artifacts and other objects of scientific, artistic, cultural, historical, or other - importance + description: institution that holds artifacts and other objects of scientific, + artistic, cultural, historical, or other importance main_subject: - id: Q711511 label: Freedom and People's Rights Movement @@ -240,3 +241,37 @@ location: postal_code: 195-0063 street_address: NOZUTAMACHI, Machida Shi, Tokyo To, 195-0063 normalization_timestamp: '2025-12-09T12:21:51.793991+00:00' +logo_enrichment: + enrichment_timestamp: '2025-12-25T17:19:16.915209+00:00' + source_url: https://www.city.machida.tokyo.jp/bunka/bunka_geijutsu/cul/cul03/index.html + extraction_method: crawl4ai + claims: + - claim_type: logo_url + claim_value: https://www.city.machida.tokyo.jp/images/2024_header_logo.png + source_url: https://www.city.machida.tokyo.jp/bunka/bunka_geijutsu/cul/cul03/index.html + css_selector: '#basebg > header.header > div.header__inner > div.header__top > + div.header__logo > a > img.header__logo-img' + retrieved_on: '2025-12-25T17:19:16.915209+00:00' + extraction_method: crawl4ai_header_logo + detection_confidence: high + alt_text: 町田市 + - claim_type: favicon_url + claim_value: https://www.city.machida.tokyo.jp/images/apple-touch-icon.png + source_url: https://www.city.machida.tokyo.jp/bunka/bunka_geijutsu/cul/cul03/index.html + css_selector: '[document] > html > head > link:nth-of-type(2)' + retrieved_on: '2025-12-25T17:19:16.915209+00:00' + extraction_method: crawl4ai_link_rel + favicon_type: '' + favicon_sizes: '' + - claim_type: og_image_url + claim_value: https://www.city.machida.tokyo.jp/images/ogp.png + source_url: https://www.city.machida.tokyo.jp/bunka/bunka_geijutsu/cul/cul03/index.html + css_selector: '[document] > html > head > meta:nth-of-type(9)' + retrieved_on: '2025-12-25T17:19:16.915209+00:00' + extraction_method: crawl4ai_meta_og + summary: + total_claims: 3 + has_primary_logo: true + has_favicon: true + has_og_image: true + favicon_count: 2 diff --git a/data/custodian/JP-13-MAC-M-SPUY.yaml b/data/custodian/JP-13-MAC-M-SPUY.yaml index c0af5335f5..3e5f9bfc88 100644 --- a/data/custodian/JP-13-MAC-M-SPUY.yaml +++ b/data/custodian/JP-13-MAC-M-SPUY.yaml @@ -32,13 +32,14 @@ ghcid: method: CH_ANNOTATOR_SOURCE ghcid_history: - ghcid: JP-13-MAC-M-SPUY - valid_from: "2025-12-10T09:44:07Z" + valid_from: '2025-12-10T09:44:07Z' valid_to: null - reason: "Corrected region code from JP-TO (abbreviation) to JP-13 (Tokyo) per ISO 3166-2:JP" + reason: Corrected region code from JP-TO (abbreviation) to JP-13 (Tokyo) per ISO + 3166-2:JP - ghcid: JP-TO-MAC-M-SPUY valid_from: null - valid_to: "2025-12-10T09:44:07Z" - reason: "Previous GHCID with incorrect region code" + valid_to: '2025-12-10T09:44:07Z' + reason: Previous GHCID with incorrect region code - ghcid: JP-TO-MAC-M-SPUY ghcid_numeric: 16114001547831684527 valid_from: '2025-12-06T23:38:33.642201+00:00' @@ -96,8 +97,8 @@ ch_annotator: annotation_metadata: confidence_score: 0.98 verified: false - verification_date: - verified_by: + verification_date: null + verified_by: null entity_claims: - claim_type: full_name claim_value: SHOWA PHARMACEUTICAL UNIVERSITY YAKUYOUSHOKUBUTSUEN @@ -151,3 +152,28 @@ location: geonames_id: 1857871 geonames_name: Machida feature_code: PPLA2 +logo_enrichment: + enrichment_timestamp: '2025-12-25T17:19:25.217135+00:00' + source_url: https://www.shoyaku.ac.jp/garden + extraction_method: crawl4ai + claims: + - claim_type: favicon_url + claim_value: https://www.shoyaku.ac.jp/common/img/icon.png + source_url: https://www.shoyaku.ac.jp/garden + css_selector: '[document] > html > head > link:nth-of-type(2)' + retrieved_on: '2025-12-25T17:19:25.217135+00:00' + extraction_method: crawl4ai_link_rel + favicon_type: '' + favicon_sizes: '' + - claim_type: og_image_url + claim_value: http://www.shoyaku.ac.jp/common/img/thumb_fb.jpg + source_url: https://www.shoyaku.ac.jp/garden + css_selector: '[document] > html > head > meta:nth-of-type(9)' + retrieved_on: '2025-12-25T17:19:25.217135+00:00' + extraction_method: crawl4ai_meta_og + summary: + total_claims: 2 + has_primary_logo: false + has_favicon: true + has_og_image: true + favicon_count: 2 diff --git a/data/custodian/JP-13-MAC-M-TKGMDL.yaml b/data/custodian/JP-13-MAC-M-TKGMDL.yaml index d8994f838b..4aa1ca09b3 100644 --- a/data/custodian/JP-13-MAC-M-TKGMDL.yaml +++ b/data/custodian/JP-13-MAC-M-TKGMDL.yaml @@ -32,13 +32,14 @@ ghcid: method: CH_ANNOTATOR_SOURCE ghcid_history: - ghcid: JP-13-MAC-M-TKGMDL - valid_from: "2025-12-10T09:44:07Z" + valid_from: '2025-12-10T09:44:07Z' valid_to: null - reason: "Corrected region code from JP-TO (abbreviation) to JP-13 (Tokyo) per ISO 3166-2:JP" + reason: Corrected region code from JP-TO (abbreviation) to JP-13 (Tokyo) per ISO + 3166-2:JP - ghcid: JP-TO-MAC-M-TKGMDL valid_from: null - valid_to: "2025-12-10T09:44:07Z" - reason: "Previous GHCID with incorrect region code" + valid_to: '2025-12-10T09:44:07Z' + reason: Previous GHCID with incorrect region code - ghcid: JP-TO-MAC-M-TKGMDL ghcid_numeric: 8861119011211463937 valid_from: '2025-12-06T23:38:33.639962+00:00' @@ -96,8 +97,8 @@ ch_annotator: annotation_metadata: confidence_score: 0.98 verified: false - verification_date: - verified_by: + verification_date: null + verified_by: null entity_claims: - claim_type: full_name claim_value: TOKYO KASEI GAKUIN MUSEUM OF DAILY LIFE @@ -151,3 +152,30 @@ location: geonames_id: 1857871 geonames_name: Machida feature_code: PPLA2 +logo_enrichment: + enrichment_timestamp: '2025-12-25T17:19:37.329145+00:00' + source_url: https://www.kasei-gakuin.ac.jp/action/museum.html + extraction_method: crawl4ai + claims: + - claim_type: favicon_url + claim_value: https://www.kasei-gakuin.ac.jp/tkgu_cms/wp-content/uploads/2022/04/cropped-favicon-512x512-1-180x180.png + source_url: https://www.kasei-gakuin.ac.jp/action/museum.html + css_selector: '[document] > html.fontawesome-i2svg-active.fontawesome-i2svg-complete + > head > link:nth-of-type(38)' + retrieved_on: '2025-12-25T17:19:37.329145+00:00' + extraction_method: crawl4ai_link_rel + favicon_type: '' + favicon_sizes: '' + - claim_type: og_image_url + claim_value: https://www.kasei-gakuin.ac.jp/tkgu_cms/wp-content/uploads/2022/04/og-image.png + source_url: https://www.kasei-gakuin.ac.jp/action/museum.html + css_selector: '[document] > html.fontawesome-i2svg-active.fontawesome-i2svg-complete + > head > meta:nth-of-type(8)' + retrieved_on: '2025-12-25T17:19:37.329145+00:00' + extraction_method: crawl4ai_meta_og + summary: + total_claims: 2 + has_primary_logo: false + has_favicon: true + has_og_image: true + favicon_count: 3 diff --git a/data/custodian/JP-13-MEG-L-CPASLGSASU.yaml b/data/custodian/JP-13-MEG-L-CPASLGSASU.yaml index cae8dba2d9..ecaa32626f 100644 --- a/data/custodian/JP-13-MEG-L-CPASLGSASU.yaml +++ b/data/custodian/JP-13-MEG-L-CPASLGSASU.yaml @@ -1,5 +1,6 @@ original_entry: - name: Center for Pacific and American Studies Library, Graduate School of Arts & Sciences of the University of Tokyo + name: Center for Pacific and American Studies Library, Graduate School of Arts & + Sciences of the University of Tokyo institution_type: LIBRARY source: CH-Annotator (japan_complete_ch_annotator.yaml) identifiers: @@ -37,20 +38,22 @@ ghcid: method: CH_ANNOTATOR_SOURCE ghcid_history: - ghcid: JP-13-MEG-L-CPASLGSASU - valid_from: "2025-12-10T09:44:07Z" + valid_from: '2025-12-10T09:44:07Z' valid_to: null - reason: "Corrected region code from JP-TO (abbreviation) to JP-13 (Tokyo) per ISO 3166-2:JP" + reason: Corrected region code from JP-TO (abbreviation) to JP-13 (Tokyo) per ISO + 3166-2:JP - ghcid: JP-TO-MEG-L-CPASLGSASU valid_from: null - valid_to: "2025-12-10T09:44:07Z" - reason: "Previous GHCID with incorrect region code" + valid_to: '2025-12-10T09:44:07Z' + reason: Previous GHCID with incorrect region code - ghcid: JP-TO-MEG-L-CPASLGSASU ghcid_numeric: 1681714570738939368 valid_from: '2025-12-06T23:38:53.331310+00:00' reason: Initial GHCID from CH-Annotator (japan_complete_ch_annotator.yaml) custodian_name: claim_type: custodian_name - claim_value: Center for Pacific and American Studies Library, Graduate School of Arts & Sciences of the University of Tokyo + claim_value: Center for Pacific and American Studies Library, Graduate School of + Arts & Sciences of the University of Tokyo source_type: ch_annotator identifiers: - identifier_scheme: GHCID @@ -101,12 +104,12 @@ ch_annotator: annotation_metadata: confidence_score: 0.98 verified: false - verification_date: - verified_by: + verification_date: null + verified_by: null entity_claims: - claim_type: full_name - claim_value: Center for Pacific and American Studies Library, Graduate School of Arts & Sciences of the University of - Tokyo + claim_value: Center for Pacific and American Studies Library, Graduate School + of Arts & Sciences of the University of Tokyo property_uri: skos:prefLabel provenance: namespace: glam @@ -164,10 +167,11 @@ wikidata_enrichment: - P856 - P968 wikidata_labels: - en: Center for Pacific and American Studies Library, Graduate School of Arts & Sciences of the University of Tokyo + en: Center for Pacific and American Studies Library, Graduate School of Arts & + Sciences of the University of Tokyo ja: 東京大学大学院総合文化研究科附属アメリカ太平洋地域研究センター図書室 - wikidata_label_en: Center for Pacific and American Studies Library, Graduate School of Arts & Sciences of the University - of Tokyo + wikidata_label_en: Center for Pacific and American Studies Library, Graduate School + of Arts & Sciences of the University of Tokyo wikidata_label_ja: 東京大学大学院総合文化研究科附属アメリカ太平洋地域研究センター図書室 wikidata_classification: instance_of: &id004 @@ -209,3 +213,22 @@ location: geonames_id: 11790374 geonames_name: Meguro feature_code: PPLX +logo_enrichment: + enrichment_timestamp: '2025-12-25T17:19:51.107541+00:00' + source_url: http://www.cpas.c.u-tokyo.ac.jp/lib/index.html + extraction_method: crawl4ai + claims: + - claim_type: favicon_url + claim_value: http://www.cpas.c.u-tokyo.ac.jp/lib/favicon.ico + source_url: http://www.cpas.c.u-tokyo.ac.jp/lib/index.html + css_selector: '[document] > html > head > link' + retrieved_on: '2025-12-25T17:19:51.107541+00:00' + extraction_method: crawl4ai_link_rel + favicon_type: '' + favicon_sizes: '' + summary: + total_claims: 1 + has_primary_logo: false + has_favicon: true + has_og_image: false + favicon_count: 1 diff --git a/data/custodian/JP-13-MEG-L-KLUT.yaml b/data/custodian/JP-13-MEG-L-KLUT.yaml index fc958147ec..2ad0f53448 100644 --- a/data/custodian/JP-13-MEG-L-KLUT.yaml +++ b/data/custodian/JP-13-MEG-L-KLUT.yaml @@ -152,3 +152,22 @@ location: geonames_id: 11790374 geonames_name: Meguro feature_code: PPLX +logo_enrichment: + enrichment_timestamp: '2025-12-25T17:38:02.090845+00:00' + source_url: https://www.lib.u-tokyo.ac.jp/ja/library/komaba + extraction_method: crawl4ai + claims: + - claim_type: favicon_url + claim_value: https://www.lib.u-tokyo.ac.jp/themes/custom/tokyolib/dest/images/favicon/safari-pinned-tab.svg + source_url: https://www.lib.u-tokyo.ac.jp/ja/library/komaba + css_selector: '[document] > html.js > head > link:nth-of-type(7)' + retrieved_on: '2025-12-25T17:38:02.090845+00:00' + extraction_method: crawl4ai_link_rel + favicon_type: '' + favicon_sizes: '' + summary: + total_claims: 1 + has_primary_logo: false + has_favicon: true + has_og_image: false + favicon_count: 6 diff --git a/data/custodian/JP-13-MEG-L-LTMMP.yaml b/data/custodian/JP-13-MEG-L-LTMMP.yaml index 77ec8e9a73..1d5b13d1b9 100644 --- a/data/custodian/JP-13-MEG-L-LTMMP.yaml +++ b/data/custodian/JP-13-MEG-L-LTMMP.yaml @@ -32,13 +32,14 @@ ghcid: method: CH_ANNOTATOR_SOURCE ghcid_history: - ghcid: JP-13-MEG-L-LTMMP - valid_from: "2025-12-10T09:44:07Z" + valid_from: '2025-12-10T09:44:07Z' valid_to: null - reason: "Corrected region code from JP-TO (abbreviation) to JP-13 (Tokyo) per ISO 3166-2:JP" + reason: Corrected region code from JP-TO (abbreviation) to JP-13 (Tokyo) per ISO + 3166-2:JP - ghcid: JP-TO-MEG-L-LTMMP valid_from: null - valid_to: "2025-12-10T09:44:07Z" - reason: "Previous GHCID with incorrect region code" + valid_to: '2025-12-10T09:44:07Z' + reason: Previous GHCID with incorrect region code - ghcid: JP-TO-MEG-L-LTMMP ghcid_numeric: 6263505544467005465 valid_from: '2025-12-06T23:38:58.875196+00:00' @@ -96,8 +97,8 @@ ch_annotator: annotation_metadata: confidence_score: 0.98 verified: false - verification_date: - verified_by: + verification_date: null + verified_by: null entity_claims: - claim_type: full_name claim_value: Library, Tokyo Metropolitan Museum of Photography @@ -151,3 +152,22 @@ location: geonames_id: 11790374 geonames_name: Meguro feature_code: PPLX +logo_enrichment: + enrichment_timestamp: '2025-12-25T17:38:14.383489+00:00' + source_url: https://library.topmuseum.jp/drupal + extraction_method: crawl4ai + claims: + - claim_type: favicon_url + claim_value: https://library.topmuseum.jp/opac/images/cyan/favicon.ico + source_url: https://library.topmuseum.jp/drupal + css_selector: '[document] > html > head > link:nth-of-type(9)' + retrieved_on: '2025-12-25T17:38:14.383489+00:00' + extraction_method: crawl4ai_link_rel + favicon_type: image/x-icon + favicon_sizes: '' + summary: + total_claims: 1 + has_primary_logo: false + has_favicon: true + has_og_image: false + favicon_count: 1 diff --git a/data/custodian/JP-13-MEG-L-RCASTLUT.yaml b/data/custodian/JP-13-MEG-L-RCASTLUT.yaml index 17e4bb5ae4..43a74a7874 100644 --- a/data/custodian/JP-13-MEG-L-RCASTLUT.yaml +++ b/data/custodian/JP-13-MEG-L-RCASTLUT.yaml @@ -1,5 +1,6 @@ original_entry: - name: Research Center for Advanced Science and Technology Library, the University of Tokyo + name: Research Center for Advanced Science and Technology Library, the University + of Tokyo institution_type: LIBRARY source: CH-Annotator (japan_complete_ch_annotator.yaml) identifiers: @@ -37,20 +38,22 @@ ghcid: method: CH_ANNOTATOR_SOURCE ghcid_history: - ghcid: JP-13-MEG-L-RCASTLUT - valid_from: "2025-12-10T09:44:07Z" + valid_from: '2025-12-10T09:44:07Z' valid_to: null - reason: "Corrected region code from JP-TO (abbreviation) to JP-13 (Tokyo) per ISO 3166-2:JP" + reason: Corrected region code from JP-TO (abbreviation) to JP-13 (Tokyo) per ISO + 3166-2:JP - ghcid: JP-TO-MEG-L-RCASTLUT valid_from: null - valid_to: "2025-12-10T09:44:07Z" - reason: "Previous GHCID with incorrect region code" + valid_to: '2025-12-10T09:44:07Z' + reason: Previous GHCID with incorrect region code - ghcid: JP-TO-MEG-L-RCASTLUT ghcid_numeric: 7271547228207827622 valid_from: '2025-12-06T23:38:53.328512+00:00' reason: Initial GHCID from CH-Annotator (japan_complete_ch_annotator.yaml) custodian_name: claim_type: custodian_name - claim_value: Research Center for Advanced Science and Technology Library, the University of Tokyo + claim_value: Research Center for Advanced Science and Technology Library, the University + of Tokyo source_type: ch_annotator identifiers: - identifier_scheme: GHCID @@ -101,11 +104,12 @@ ch_annotator: annotation_metadata: confidence_score: 0.98 verified: false - verification_date: - verified_by: + verification_date: null + verified_by: null entity_claims: - claim_type: full_name - claim_value: Research Center for Advanced Science and Technology Library, the University of Tokyo + claim_value: Research Center for Advanced Science and Technology Library, the + University of Tokyo property_uri: skos:prefLabel provenance: namespace: glam @@ -162,9 +166,11 @@ wikidata_enrichment: - P791 - P856 wikidata_labels: - en: Research Center for Advanced Science and Technology Library, the University of Tokyo + en: Research Center for Advanced Science and Technology Library, the University + of Tokyo ja: 東京大学先端科学技術研究センター図書室 - wikidata_label_en: Research Center for Advanced Science and Technology Library, the University of Tokyo + wikidata_label_en: Research Center for Advanced Science and Technology Library, + the University of Tokyo wikidata_label_ja: 東京大学先端科学技術研究センター図書室 wikidata_classification: instance_of: &id004 @@ -204,3 +210,28 @@ location: geonames_id: 11790374 geonames_name: Meguro feature_code: PPLX +logo_enrichment: + enrichment_timestamp: '2025-12-25T17:40:11.494377+00:00' + source_url: http://www.office.rcast.u-tokyo.ac.jp/tosho/index-j.html + extraction_method: crawl4ai + claims: + - claim_type: favicon_url + claim_value: http://www.office.rcast.u-tokyo.ac.jp/content/000017986.png + source_url: http://www.office.rcast.u-tokyo.ac.jp/tosho/index-j.html + css_selector: '[document] > html > head > link:nth-of-type(2)' + retrieved_on: '2025-12-25T17:40:11.494377+00:00' + extraction_method: crawl4ai_link_rel + favicon_type: '' + favicon_sizes: 180x180 + - claim_type: og_image_url + claim_value: https://www.rcast.u-tokyo.ac.jp/content/000011204.png + source_url: http://www.office.rcast.u-tokyo.ac.jp/tosho/index-j.html + css_selector: '[document] > html > head > meta:nth-of-type(8)' + retrieved_on: '2025-12-25T17:40:11.494377+00:00' + extraction_method: crawl4ai_meta_og + summary: + total_claims: 2 + has_primary_logo: false + has_favicon: true + has_og_image: true + favicon_count: 2 diff --git a/data/custodian/JP-13-MEG-L-THUHL.yaml b/data/custodian/JP-13-MEG-L-THUHL.yaml index fbee6dd998..dc0f289800 100644 --- a/data/custodian/JP-13-MEG-L-THUHL.yaml +++ b/data/custodian/JP-13-MEG-L-THUHL.yaml @@ -37,13 +37,14 @@ ghcid: method: CH_ANNOTATOR_SOURCE ghcid_history: - ghcid: JP-13-MEG-L-THUHL - valid_from: "2025-12-10T09:44:07Z" + valid_from: '2025-12-10T09:44:07Z' valid_to: null - reason: "Corrected region code from JP-TO (abbreviation) to JP-13 (Tokyo) per ISO 3166-2:JP" + reason: Corrected region code from JP-TO (abbreviation) to JP-13 (Tokyo) per ISO + 3166-2:JP - ghcid: JP-TO-MEG-L-THUHL valid_from: null - valid_to: "2025-12-10T09:44:07Z" - reason: "Previous GHCID with incorrect region code" + valid_to: '2025-12-10T09:44:07Z' + reason: Previous GHCID with incorrect region code - ghcid: JP-TO-MEG-L-THUHL ghcid_numeric: 4875654939205705548 valid_from: '2025-12-06T23:38:55.444906+00:00' @@ -101,8 +102,8 @@ ch_annotator: annotation_metadata: confidence_score: 0.98 verified: false - verification_date: - verified_by: + verification_date: null + verified_by: null entity_claims: - claim_type: full_name claim_value: Tokyo Healthcare University Higashigaoka Library @@ -204,3 +205,20 @@ location: geonames_id: 11790374 geonames_name: Meguro feature_code: PPLX +logo_enrichment: + enrichment_timestamp: '2025-12-25T17:40:22.147626+00:00' + source_url: http://www.thcu.ac.jp/facilities/library + extraction_method: crawl4ai + claims: + - claim_type: og_image_url + claim_value: http://thcu.ac.jp/img/asset/ogp.png + source_url: http://www.thcu.ac.jp/facilities/library + css_selector: '[document] > html.other > head > meta:nth-of-type(9)' + retrieved_on: '2025-12-25T17:40:22.147626+00:00' + extraction_method: crawl4ai_meta_og + summary: + total_claims: 1 + has_primary_logo: false + has_favicon: false + has_og_image: true + favicon_count: 0 diff --git a/data/custodian/JP-13-MEG-M-FGLC.yaml b/data/custodian/JP-13-MEG-M-FGLC.yaml index 819ac07c13..d89a30780f 100644 --- a/data/custodian/JP-13-MEG-M-FGLC.yaml +++ b/data/custodian/JP-13-MEG-M-FGLC.yaml @@ -32,13 +32,14 @@ ghcid: method: CH_ANNOTATOR_SOURCE ghcid_history: - ghcid: JP-13-MEG-M-FGLC - valid_from: "2025-12-10T09:44:07Z" + valid_from: '2025-12-10T09:44:07Z' valid_to: null - reason: "Corrected region code from JP-TO (abbreviation) to JP-13 (Tokyo) per ISO 3166-2:JP" + reason: Corrected region code from JP-TO (abbreviation) to JP-13 (Tokyo) per ISO + 3166-2:JP - ghcid: JP-TO-MEG-M-FGLC valid_from: null - valid_to: "2025-12-10T09:44:07Z" - reason: "Previous GHCID with incorrect region code" + valid_to: '2025-12-10T09:44:07Z' + reason: Previous GHCID with incorrect region code - ghcid: JP-TO-MEG-M-FGLC ghcid_numeric: 8956157568430366861 valid_from: '2025-12-06T23:38:33.316381+00:00' @@ -96,8 +97,8 @@ ch_annotator: annotation_metadata: confidence_score: 0.98 verified: false - verification_date: - verified_by: + verification_date: null + verified_by: null entity_claims: - claim_type: full_name claim_value: FLOWER AND GREENERY LEARNING CENTER @@ -151,3 +152,36 @@ location: geonames_id: 11790374 geonames_name: Meguro feature_code: PPLX +logo_enrichment: + enrichment_timestamp: '2025-12-25T17:40:43.072139+00:00' + source_url: https://www.city.meguro.tokyo.jp/smph/kurashi/sports_koen_yoka/koen/omoshiro/midorigakushu.html + extraction_method: crawl4ai + claims: + - claim_type: logo_url + claim_value: https://www.city.meguro.tokyo.jp/shared/images/header/hlogo.png + source_url: https://www.city.meguro.tokyo.jp/smph/kurashi/sports_koen_yoka/koen/omoshiro/midorigakushu.html + css_selector: '#tmp_hlogo > p > a > img' + retrieved_on: '2025-12-25T17:40:43.072139+00:00' + extraction_method: crawl4ai_header_logo + detection_confidence: high + alt_text: 目黒区 + - claim_type: favicon_url + claim_value: https://www.city.meguro.tokyo.jp/shared/images/favicon/apple-touch-icon-precomposed.png + source_url: https://www.city.meguro.tokyo.jp/smph/kurashi/sports_koen_yoka/koen/omoshiro/midorigakushu.html + css_selector: '[document] > html > head > link:nth-of-type(7)' + retrieved_on: '2025-12-25T17:40:43.072139+00:00' + extraction_method: crawl4ai_link_rel + favicon_type: '' + favicon_sizes: '' + - claim_type: og_image_url + claim_value: https://www.city.meguro.tokyo.jp/shared/images/sns/logo.jpg + source_url: https://www.city.meguro.tokyo.jp/smph/kurashi/sports_koen_yoka/koen/omoshiro/midorigakushu.html + css_selector: '[document] > html > head > meta:nth-of-type(7)' + retrieved_on: '2025-12-25T17:40:43.072139+00:00' + extraction_method: crawl4ai_meta_og + summary: + total_claims: 3 + has_primary_logo: true + has_favicon: true + has_og_image: true + favicon_count: 2 diff --git a/data/custodian/JP-13-MEG-M-JFCM.yaml b/data/custodian/JP-13-MEG-M-JFCM.yaml index e64d1f8099..fa085dd5fa 100644 --- a/data/custodian/JP-13-MEG-M-JFCM.yaml +++ b/data/custodian/JP-13-MEG-M-JFCM.yaml @@ -32,13 +32,14 @@ ghcid: method: CH_ANNOTATOR_SOURCE ghcid_history: - ghcid: JP-13-MEG-M-JFCM - valid_from: "2025-12-10T09:44:07Z" + valid_from: '2025-12-10T09:44:07Z' valid_to: null - reason: "Corrected region code from JP-TO (abbreviation) to JP-13 (Tokyo) per ISO 3166-2:JP" + reason: Corrected region code from JP-TO (abbreviation) to JP-13 (Tokyo) per ISO + 3166-2:JP - ghcid: JP-TO-MEG-M-JFCM valid_from: null - valid_to: "2025-12-10T09:44:07Z" - reason: "Previous GHCID with incorrect region code" + valid_to: '2025-12-10T09:44:07Z' + reason: Previous GHCID with incorrect region code - ghcid: JP-TO-MEG-M-JFCM ghcid_numeric: 4979267397851249965 valid_from: '2025-12-06T23:38:33.307694+00:00' @@ -96,8 +97,8 @@ ch_annotator: annotation_metadata: confidence_score: 0.98 verified: false - verification_date: - verified_by: + verification_date: null + verified_by: null entity_claims: - claim_type: full_name claim_value: THE JAPAN FOLK CRAFTS MUSEUM @@ -151,3 +152,28 @@ location: geonames_id: 11790374 geonames_name: Meguro feature_code: PPLX +logo_enrichment: + enrichment_timestamp: '2025-12-25T17:40:52.819480+00:00' + source_url: https://www.mingeikan.or.jp + extraction_method: crawl4ai + claims: + - claim_type: favicon_url + claim_value: https://mingeikan.or.jp/wp-content/themes/mingeikan/icon/apple-touch-icon-152x152.png + source_url: https://www.mingeikan.or.jp + css_selector: '[document] > html.mac.chrome > head > link:nth-of-type(9)' + retrieved_on: '2025-12-25T17:40:52.819480+00:00' + extraction_method: crawl4ai_link_rel + favicon_type: '' + favicon_sizes: 152x152 + - claim_type: og_image_url + claim_value: https://mingeikan.or.jp/wp-content/themes/mingeikan/images/ogp.jpg + source_url: https://www.mingeikan.or.jp + css_selector: '[document] > html.mac.chrome > head > meta:nth-of-type(16)' + retrieved_on: '2025-12-25T17:40:52.819480+00:00' + extraction_method: crawl4ai_meta_og + summary: + total_claims: 2 + has_primary_logo: false + has_favicon: true + has_og_image: true + favicon_count: 9 diff --git a/data/custodian/JP-13-MEG-M-KMCASUT.yaml b/data/custodian/JP-13-MEG-M-KMCASUT.yaml index 30df5c1581..ba3365de13 100644 --- a/data/custodian/JP-13-MEG-M-KMCASUT.yaml +++ b/data/custodian/JP-13-MEG-M-KMCASUT.yaml @@ -32,13 +32,14 @@ ghcid: method: CH_ANNOTATOR_SOURCE ghcid_history: - ghcid: JP-13-MEG-M-KMCASUT - valid_from: "2025-12-10T09:44:07Z" + valid_from: '2025-12-10T09:44:07Z' valid_to: null - reason: "Corrected region code from JP-TO (abbreviation) to JP-13 (Tokyo) per ISO 3166-2:JP" + reason: Corrected region code from JP-TO (abbreviation) to JP-13 (Tokyo) per ISO + 3166-2:JP - ghcid: JP-TO-MEG-M-KMCASUT valid_from: null - valid_to: "2025-12-10T09:44:07Z" - reason: "Previous GHCID with incorrect region code" + valid_to: '2025-12-10T09:44:07Z' + reason: Previous GHCID with incorrect region code - ghcid: JP-TO-MEG-M-KMCASUT ghcid_numeric: 630812962834228263 valid_from: '2025-12-06T23:38:33.330465+00:00' @@ -96,8 +97,8 @@ ch_annotator: annotation_metadata: confidence_score: 0.98 verified: false - verification_date: - verified_by: + verification_date: null + verified_by: null entity_claims: - claim_type: full_name claim_value: KOMABA MUSEUM COLLEGE OF ARTS AND SCIENCES, UNIVERSITY OF TOKYO @@ -151,3 +152,22 @@ location: geonames_id: 11790374 geonames_name: Meguro feature_code: PPLX +logo_enrichment: + enrichment_timestamp: '2025-12-25T17:41:00.726336+00:00' + source_url: http://museum.c.u-tokyo.ac.jp + extraction_method: crawl4ai + claims: + - claim_type: favicon_url + claim_value: http://museum.c.u-tokyo.ac.jp/favicon.ico + source_url: http://museum.c.u-tokyo.ac.jp + css_selector: '[document] > html > body > link' + retrieved_on: '2025-12-25T17:41:00.726336+00:00' + extraction_method: crawl4ai_link_rel + favicon_type: '' + favicon_sizes: '' + summary: + total_claims: 1 + has_primary_logo: false + has_favicon: true + has_og_image: false + favicon_count: 1 diff --git a/data/custodian/JP-13-MEG-M-MCSACTOURC.yaml b/data/custodian/JP-13-MEG-M-MCSACTOURC.yaml index 8e313ca5fa..b0dbd0bbcf 100644 --- a/data/custodian/JP-13-MEG-M-MCSACTOURC.yaml +++ b/data/custodian/JP-13-MEG-M-MCSACTOURC.yaml @@ -1,6 +1,6 @@ original_entry: - name: MUSEUM OF CONTEMPORARY SCULPTURE, AFFILATED TO CHOSENIN TEMPLE AND OPERATED UNDER THE RELIGIOUS CORPORATION ACT OF - 1951 + name: MUSEUM OF CONTEMPORARY SCULPTURE, AFFILATED TO CHOSENIN TEMPLE AND OPERATED + UNDER THE RELIGIOUS CORPORATION ACT OF 1951 institution_type: MUSEUM source: CH-Annotator (japan_complete_ch_annotator.yaml) identifiers: @@ -33,21 +33,22 @@ ghcid: method: CH_ANNOTATOR_SOURCE ghcid_history: - ghcid: JP-13-MEG-M-MCSACTOURC - valid_from: "2025-12-10T09:44:07Z" + valid_from: '2025-12-10T09:44:07Z' valid_to: null - reason: "Corrected region code from JP-TO (abbreviation) to JP-13 (Tokyo) per ISO 3166-2:JP" + reason: Corrected region code from JP-TO (abbreviation) to JP-13 (Tokyo) per ISO + 3166-2:JP - ghcid: JP-TO-MEG-M-MCSACTOURC valid_from: null - valid_to: "2025-12-10T09:44:07Z" - reason: "Previous GHCID with incorrect region code" + valid_to: '2025-12-10T09:44:07Z' + reason: Previous GHCID with incorrect region code - ghcid: JP-TO-MEG-M-MCSACTOURC ghcid_numeric: 12798304751196016517 valid_from: '2025-12-06T23:38:33.313852+00:00' reason: Initial GHCID from CH-Annotator (japan_complete_ch_annotator.yaml) custodian_name: claim_type: custodian_name - claim_value: MUSEUM OF CONTEMPORARY SCULPTURE, AFFILATED TO CHOSENIN TEMPLE AND OPERATED UNDER THE RELIGIOUS CORPORATION - ACT OF 1951 + claim_value: MUSEUM OF CONTEMPORARY SCULPTURE, AFFILATED TO CHOSENIN TEMPLE AND + OPERATED UNDER THE RELIGIOUS CORPORATION ACT OF 1951 source_type: ch_annotator identifiers: - identifier_scheme: GHCID @@ -98,12 +99,12 @@ ch_annotator: annotation_metadata: confidence_score: 0.98 verified: false - verification_date: - verified_by: + verification_date: null + verified_by: null entity_claims: - claim_type: full_name - claim_value: MUSEUM OF CONTEMPORARY SCULPTURE, AFFILATED TO CHOSENIN TEMPLE AND OPERATED UNDER THE RELIGIOUS CORPORATION - ACT OF 1951 + claim_value: MUSEUM OF CONTEMPORARY SCULPTURE, AFFILATED TO CHOSENIN TEMPLE AND + OPERATED UNDER THE RELIGIOUS CORPORATION ACT OF 1951 property_uri: skos:prefLabel provenance: namespace: glam @@ -154,3 +155,22 @@ location: geonames_id: 11790374 geonames_name: Meguro feature_code: PPLX +logo_enrichment: + enrichment_timestamp: '2025-12-25T17:41:07.368780+00:00' + source_url: http://museum-of-sculpture.org + extraction_method: crawl4ai + claims: + - claim_type: logo_url + claim_value: http://museum-of-sculpture.org/wp-content/themes/gendaichoukoku/img/header_logo.png + source_url: http://museum-of-sculpture.org + css_selector: '#header > div.header_left > h1 > a > img.pc' + retrieved_on: '2025-12-25T17:41:07.368780+00:00' + extraction_method: crawl4ai_header_logo + detection_confidence: high + alt_text: 宗教法人長泉院付属現代彫刻美術館 + summary: + total_claims: 1 + has_primary_logo: true + has_favicon: false + has_og_image: false + favicon_count: 0 diff --git a/data/custodian/JP-13-MEG-M-MHM.yaml b/data/custodian/JP-13-MEG-M-MHM.yaml index 222a86e5a6..77bf26e46e 100644 --- a/data/custodian/JP-13-MEG-M-MHM.yaml +++ b/data/custodian/JP-13-MEG-M-MHM.yaml @@ -43,13 +43,14 @@ ghcid: method: CH_ANNOTATOR_SOURCE ghcid_history: - ghcid: JP-13-MEG-M-MHM - valid_from: "2025-12-10T09:44:07Z" + valid_from: '2025-12-10T09:44:07Z' valid_to: null - reason: "Corrected region code from JP-TO (abbreviation) to JP-13 (Tokyo) per ISO 3166-2:JP" + reason: Corrected region code from JP-TO (abbreviation) to JP-13 (Tokyo) per ISO + 3166-2:JP - ghcid: JP-TO-MEG-M-MHM valid_from: null - valid_to: "2025-12-10T09:44:07Z" - reason: "Previous GHCID with incorrect region code" + valid_to: '2025-12-10T09:44:07Z' + reason: Previous GHCID with incorrect region code - ghcid: JP-TO-MEG-M-MHM ghcid_numeric: 4332708100571013991 valid_from: '2025-12-06T23:38:33.319628+00:00' @@ -108,8 +109,8 @@ ch_annotator: annotation_metadata: confidence_score: 0.98 verified: false - verification_date: - verified_by: + verification_date: null + verified_by: null entity_claims: - claim_type: full_name claim_value: MEGURO HISTORY MUSEUM @@ -244,3 +245,36 @@ location: postal_code: 153-0061 street_address: NAKAMEGURO, Meguro Ku, Tokyo To, 153-0061 normalization_timestamp: '2025-12-09T12:21:53.000659+00:00' +logo_enrichment: + enrichment_timestamp: '2025-12-25T17:41:20.540504+00:00' + source_url: https://www.city.meguro.tokyo.jp/shisetsu/shisetsu/bijutsu/rekishi_shiryokan + extraction_method: crawl4ai + claims: + - claim_type: logo_url + claim_value: https://www.city.meguro.tokyo.jp/shared/images/header/hlogo.png + source_url: https://www.city.meguro.tokyo.jp/shisetsu/shisetsu/bijutsu/rekishi_shiryokan + css_selector: '#tmp_hlogo > p > a > img' + retrieved_on: '2025-12-25T17:41:20.540504+00:00' + extraction_method: crawl4ai_header_logo + detection_confidence: high + alt_text: 目黒区 + - claim_type: favicon_url + claim_value: https://www.city.meguro.tokyo.jp/shared/images/favicon/apple-touch-icon-precomposed.png + source_url: https://www.city.meguro.tokyo.jp/shisetsu/shisetsu/bijutsu/rekishi_shiryokan + css_selector: '[document] > html > head > link:nth-of-type(7)' + retrieved_on: '2025-12-25T17:41:20.540504+00:00' + extraction_method: crawl4ai_link_rel + favicon_type: '' + favicon_sizes: '' + - claim_type: og_image_url + claim_value: https://www.city.meguro.tokyo.jp/shared/images/sns/logo.jpg + source_url: https://www.city.meguro.tokyo.jp/shisetsu/shisetsu/bijutsu/rekishi_shiryokan + css_selector: '[document] > html > head > meta:nth-of-type(7)' + retrieved_on: '2025-12-25T17:41:20.540504+00:00' + extraction_method: crawl4ai_meta_og + summary: + total_claims: 3 + has_primary_logo: true + has_favicon: true + has_og_image: true + favicon_count: 2 diff --git a/data/custodian/JP-13-MEG-M-SSM.yaml b/data/custodian/JP-13-MEG-M-SSM.yaml index 28ab3b857b..53a88294b2 100644 --- a/data/custodian/JP-13-MEG-M-SSM.yaml +++ b/data/custodian/JP-13-MEG-M-SSM.yaml @@ -152,3 +152,37 @@ location: geonames_id: 11790374 geonames_name: Meguro feature_code: PPLX +logo_enrichment: + enrichment_timestamp: '2025-12-25T17:42:24.793378+00:00' + source_url: https://www.satosakura.jp + extraction_method: crawl4ai + claims: + - claim_type: logo_url + claim_value: https://www.satosakura.jp/wp-content/uploads/2023/02/cropped-logo_SSM_RGB-1.png + source_url: https://www.satosakura.jp + css_selector: '#masthead > div.custom-header > div.site-branding:nth-of-type(2) + > div.wrap > a.custom-logo-link > img.custom-logo' + retrieved_on: '2025-12-25T17:42:24.793378+00:00' + extraction_method: crawl4ai_header_logo + detection_confidence: high + alt_text: Sato Sakura Museum + - claim_type: favicon_url + claim_value: https://www.satosakura.jp/wp-content/uploads/2023/02/logo_SSM_trim_RGB-100x100.jpg + source_url: https://www.satosakura.jp + css_selector: '[document] > html.js.svg > head > link:nth-of-type(37)' + retrieved_on: '2025-12-25T17:42:24.793378+00:00' + extraction_method: crawl4ai_link_rel + favicon_type: '' + favicon_sizes: 32x32 + - claim_type: og_image_url + claim_value: https://www.satosakura.jp/wp-content/uploads/2025/10/21e53e1df529d30a6b96d3d44d75852f-1024x619.jpg + source_url: https://www.satosakura.jp + css_selector: '[document] > html.js.svg > head > meta:nth-of-type(12)' + retrieved_on: '2025-12-25T17:42:24.793378+00:00' + extraction_method: crawl4ai_meta_og + summary: + total_claims: 3 + has_primary_logo: true + has_favicon: true + has_og_image: true + favicon_count: 2 diff --git a/data/custodian/JP-13-MEG-M-TPAM.yaml b/data/custodian/JP-13-MEG-M-TPAM.yaml index 4c6c53ae03..5ee760a002 100644 --- a/data/custodian/JP-13-MEG-M-TPAM.yaml +++ b/data/custodian/JP-13-MEG-M-TPAM.yaml @@ -32,13 +32,14 @@ ghcid: method: CH_ANNOTATOR_SOURCE ghcid_history: - ghcid: JP-13-MEG-M-TPAM - valid_from: "2025-12-10T09:44:07Z" + valid_from: '2025-12-10T09:44:07Z' valid_to: null - reason: "Corrected region code from JP-TO (abbreviation) to JP-13 (Tokyo) per ISO 3166-2:JP" + reason: Corrected region code from JP-TO (abbreviation) to JP-13 (Tokyo) per ISO + 3166-2:JP - ghcid: JP-TO-MEG-M-TPAM valid_from: null - valid_to: "2025-12-10T09:44:07Z" - reason: "Previous GHCID with incorrect region code" + valid_to: '2025-12-10T09:44:07Z' + reason: Previous GHCID with incorrect region code - ghcid: JP-TO-MEG-M-TPAM ghcid_numeric: 4333244448707702141 valid_from: '2025-12-06T23:38:33.322640+00:00' @@ -96,8 +97,8 @@ ch_annotator: annotation_metadata: confidence_score: 0.98 verified: false - verification_date: - verified_by: + verification_date: null + verified_by: null entity_claims: - claim_type: full_name claim_value: TOKYO PHOTOGRAPHIC ART MUSEUM @@ -151,3 +152,37 @@ location: geonames_id: 11790374 geonames_name: Meguro feature_code: PPLX +logo_enrichment: + enrichment_timestamp: '2025-12-25T17:42:34.613297+00:00' + source_url: http://topmuseum.jp + extraction_method: crawl4ai + claims: + - claim_type: logo_url + claim_value: http://topmuseum.jp/common/image/logo_main.png + source_url: http://topmuseum.jp + css_selector: '#top > header.header.container--fluid > div.header__upper > div.header__logo + > h1 > a > img.main-logo' + retrieved_on: '2025-12-25T17:42:34.613297+00:00' + extraction_method: crawl4ai_header_logo + detection_confidence: high + alt_text: TOP MUSEUM 東京都写真美術館 + - claim_type: favicon_url + claim_value: http://topmuseum.jp/common/image/favicon.ico + source_url: http://topmuseum.jp + css_selector: '[document] > html > head > link' + retrieved_on: '2025-12-25T17:42:34.613297+00:00' + extraction_method: crawl4ai_link_rel + favicon_type: image/x-icon + favicon_sizes: '' + - claim_type: og_image_url + claim_value: http://www + source_url: http://topmuseum.jp + css_selector: '[document] > html > head > meta:nth-of-type(9)' + retrieved_on: '2025-12-25T17:42:34.613297+00:00' + extraction_method: crawl4ai_meta_og + summary: + total_claims: 3 + has_primary_logo: true + has_favicon: true + has_og_image: true + favicon_count: 1 diff --git a/data/custodian/JP-13-MIN-L-AIJL.yaml b/data/custodian/JP-13-MIN-L-AIJL.yaml index 78540a5f0c..313e66fc72 100644 --- a/data/custodian/JP-13-MIN-L-AIJL.yaml +++ b/data/custodian/JP-13-MIN-L-AIJL.yaml @@ -32,13 +32,14 @@ ghcid: method: CH_ANNOTATOR_SOURCE ghcid_history: - ghcid: JP-13-MIN-L-AIJL - valid_from: "2025-12-10T09:44:07Z" + valid_from: '2025-12-10T09:44:07Z' valid_to: null - reason: "Corrected region code from JP-TO (abbreviation) to JP-13 (Tokyo) per ISO 3166-2:JP" + reason: Corrected region code from JP-TO (abbreviation) to JP-13 (Tokyo) per ISO + 3166-2:JP - ghcid: JP-TO-MIN-L-AIJL valid_from: null - valid_to: "2025-12-10T09:44:07Z" - reason: "Previous GHCID with incorrect region code" + valid_to: '2025-12-10T09:44:07Z' + reason: Previous GHCID with incorrect region code - ghcid: JP-TO-MIN-L-AIJL ghcid_numeric: 6148220201897631588 valid_from: '2025-12-06T23:38:57.914501+00:00' @@ -96,8 +97,8 @@ ch_annotator: annotation_metadata: confidence_score: 0.98 verified: false - verification_date: - verified_by: + verification_date: null + verified_by: null entity_claims: - claim_type: full_name claim_value: Architectural Institute of Japan, Library @@ -151,3 +152,31 @@ location: geonames_id: 1852383 geonames_name: Minato feature_code: PPL +logo_enrichment: + enrichment_timestamp: '2025-12-25T17:43:12.717294+00:00' + source_url: http://www.aij.or.jp/tosyokan.html + extraction_method: crawl4ai + claims: + - claim_type: logo_url + claim_value: http://www.aij.or.jp/images/common/logo_w.png + source_url: http://www.aij.or.jp/tosyokan.html + css_selector: '#header > div.container.clearfix:nth-of-type(2) > div.header-main + > a.logo > img' + retrieved_on: '2025-12-25T17:43:12.717294+00:00' + extraction_method: crawl4ai_header_logo + detection_confidence: high + alt_text: AIJ 一般社団法人 日本建築学会 + - claim_type: favicon_url + claim_value: http://www.aij.or.jp/static/default/favicon/favicon.ico + source_url: http://www.aij.or.jp/tosyokan.html + css_selector: '[document] > html.js.flexbox > head > link:nth-of-type(2)' + retrieved_on: '2025-12-25T17:43:12.717294+00:00' + extraction_method: crawl4ai_link_rel + favicon_type: '' + favicon_sizes: '' + summary: + total_claims: 2 + has_primary_logo: true + has_favicon: true + has_og_image: false + favicon_count: 1 diff --git a/data/custodian/JP-13-MIN-L-ALJAA.yaml b/data/custodian/JP-13-MIN-L-ALJAA.yaml index 5b55a01669..74ce787a28 100644 --- a/data/custodian/JP-13-MIN-L-ALJAA.yaml +++ b/data/custodian/JP-13-MIN-L-ALJAA.yaml @@ -41,13 +41,14 @@ ghcid: method: CH_ANNOTATOR_SOURCE ghcid_history: - ghcid: JP-13-MIN-L-ALJAA - valid_from: "2025-12-10T09:44:07Z" + valid_from: '2025-12-10T09:44:07Z' valid_to: null - reason: "Corrected region code from JP-TO (abbreviation) to JP-13 (Tokyo) per ISO 3166-2:JP" + reason: Corrected region code from JP-TO (abbreviation) to JP-13 (Tokyo) per ISO + 3166-2:JP - ghcid: JP-TO-MIN-L-ALJAA valid_from: null - valid_to: "2025-12-10T09:44:07Z" - reason: "Previous GHCID with incorrect region code" + valid_to: '2025-12-10T09:44:07Z' + reason: Previous GHCID with incorrect region code - ghcid: JP-TO-MIN-L-ALJAA ghcid_numeric: 7665149279643784112 valid_from: '2025-12-06T23:38:58.922690+00:00' @@ -106,8 +107,8 @@ ch_annotator: annotation_metadata: confidence_score: 0.98 verified: false - verification_date: - verified_by: + verification_date: null + verified_by: null entity_claims: - claim_type: full_name claim_value: Aviation Library, Japan Aeronautic Association @@ -206,8 +207,10 @@ wikidata_enrichment: sq: organizatë de: japanische Non-Profit-Organisation id: universitas di Jepang - fr: organisation japonaise, spécialisée dans la recherche sur la biologie et la vie des cétacés - wikidata_description_en: non-profit organisation in Japan which claims to be a research organization + fr: organisation japonaise, spécialisée dans la recherche sur la biologie et la + vie des cétacés + wikidata_description_en: non-profit organisation in Japan which claims to be a research + organization wikidata_aliases: fr: - Institute of Cetacean Research @@ -288,3 +291,28 @@ location: geonames_id: 1852383 geonames_name: Minato feature_code: PPL +logo_enrichment: + enrichment_timestamp: '2025-12-25T17:43:23.724704+00:00' + source_url: http://www.aero.or.jp/koku_tosyokan/koku_toshokan.html + extraction_method: crawl4ai + claims: + - claim_type: favicon_url + claim_value: https://www.aero.or.jp/wp/wp-content/themes/aero_fhw/favicon/safari-pinned-tab.svg + source_url: http://www.aero.or.jp/koku_tosyokan/koku_toshokan.html + css_selector: '[document] > html > head > link:nth-of-type(5)' + retrieved_on: '2025-12-25T17:43:23.724704+00:00' + extraction_method: crawl4ai_link_rel + favicon_type: '' + favicon_sizes: '' + - claim_type: og_image_url + claim_value: https://www.aero.or.jp/wp/wp-content/themes/aero_fhw/common/images/ogp.jpg + source_url: http://www.aero.or.jp/koku_tosyokan/koku_toshokan.html + css_selector: '[document] > html > head > meta:nth-of-type(10)' + retrieved_on: '2025-12-25T17:43:23.724704+00:00' + extraction_method: crawl4ai_meta_og + summary: + total_claims: 2 + has_primary_logo: false + has_favicon: true + has_og_image: true + favicon_count: 7 diff --git a/data/custodian/JP-13-MIN-L-ALNACT.yaml b/data/custodian/JP-13-MIN-L-ALNACT.yaml index 6ad98ce7a8..d7cfcd67f6 100644 --- a/data/custodian/JP-13-MIN-L-ALNACT.yaml +++ b/data/custodian/JP-13-MIN-L-ALNACT.yaml @@ -152,3 +152,22 @@ location: geonames_id: 1852383 geonames_name: Minato feature_code: PPL +logo_enrichment: + enrichment_timestamp: '2025-12-25T17:43:31.054740+00:00' + source_url: https://www.nact.jp/art-library + extraction_method: crawl4ai + claims: + - claim_type: logo_url + claim_value: https://www.nact.jp/common/img/common/logo.svg + source_url: https://www.nact.jp/art-library + css_selector: '#header > div.outline > div.logo > a > picture > source > img' + retrieved_on: '2025-12-25T17:43:31.054740+00:00' + extraction_method: crawl4ai_header_logo + detection_confidence: high + alt_text: 国立新美術館 THE NATIONAL ART CENTER, TOKYO + summary: + total_claims: 1 + has_primary_logo: true + has_favicon: false + has_og_image: false + favicon_count: 0 diff --git a/data/custodian/JP-13-MIN-L-AMTL.yaml b/data/custodian/JP-13-MIN-L-AMTL.yaml index 7dc575cfd1..7be95f4e83 100644 --- a/data/custodian/JP-13-MIN-L-AMTL.yaml +++ b/data/custodian/JP-13-MIN-L-AMTL.yaml @@ -32,13 +32,14 @@ ghcid: method: CH_ANNOTATOR_SOURCE ghcid_history: - ghcid: JP-13-MIN-L-AMTL - valid_from: "2025-12-10T09:44:07Z" + valid_from: '2025-12-10T09:44:07Z' valid_to: null - reason: "Corrected region code from JP-TO (abbreviation) to JP-13 (Tokyo) per ISO 3166-2:JP" + reason: Corrected region code from JP-TO (abbreviation) to JP-13 (Tokyo) per ISO + 3166-2:JP - ghcid: JP-TO-MIN-L-AMTL valid_from: null - valid_to: "2025-12-10T09:44:07Z" - reason: "Previous GHCID with incorrect region code" + valid_to: '2025-12-10T09:44:07Z' + reason: Previous GHCID with incorrect region code - ghcid: JP-TO-MIN-L-AMTL ghcid_numeric: 215346678841852975 valid_from: '2025-12-06T23:38:58.006481+00:00' @@ -96,8 +97,8 @@ ch_annotator: annotation_metadata: confidence_score: 0.98 verified: false - verification_date: - verified_by: + verification_date: null + verified_by: null entity_claims: - claim_type: full_name claim_value: The Ad Museum Tokyo Library @@ -151,3 +152,22 @@ location: geonames_id: 1852383 geonames_name: Minato feature_code: PPL +logo_enrichment: + enrichment_timestamp: '2025-12-25T17:43:39.150693+00:00' + source_url: https://www.admt.jp/library + extraction_method: crawl4ai + claims: + - claim_type: favicon_url + claim_value: https://www.admt.jp/favicon.ico + source_url: https://www.admt.jp/library + css_selector: '[document] > html > head > link' + retrieved_on: '2025-12-25T17:43:39.150693+00:00' + extraction_method: crawl4ai_link_rel + favicon_type: '' + favicon_sizes: '' + summary: + total_claims: 1 + has_primary_logo: false + has_favicon: true + has_og_image: false + favicon_count: 1 diff --git a/data/custodian/JP-13-MIN-L-ARL.yaml b/data/custodian/JP-13-MIN-L-ARL.yaml index 61f41b9c2f..30db2fec66 100644 --- a/data/custodian/JP-13-MIN-L-ARL.yaml +++ b/data/custodian/JP-13-MIN-L-ARL.yaml @@ -32,13 +32,14 @@ ghcid: method: CH_ANNOTATOR_SOURCE ghcid_history: - ghcid: JP-13-MIN-L-ARL - valid_from: "2025-12-10T09:44:07Z" + valid_from: '2025-12-10T09:44:07Z' valid_to: null - reason: "Corrected region code from JP-TO (abbreviation) to JP-13 (Tokyo) per ISO 3166-2:JP" + reason: Corrected region code from JP-TO (abbreviation) to JP-13 (Tokyo) per ISO + 3166-2:JP - ghcid: JP-TO-MIN-L-ARL valid_from: null - valid_to: "2025-12-10T09:44:07Z" - reason: "Previous GHCID with incorrect region code" + valid_to: '2025-12-10T09:44:07Z' + reason: Previous GHCID with incorrect region code - ghcid: JP-TO-MIN-L-ARL ghcid_numeric: 6999754153686910274 valid_from: '2025-12-06T23:38:58.096807+00:00' @@ -96,8 +97,8 @@ ch_annotator: annotation_metadata: confidence_score: 0.98 verified: false - verification_date: - verified_by: + verification_date: null + verified_by: null entity_claims: - claim_type: full_name claim_value: Academyhills Roppongi Library @@ -151,3 +152,28 @@ location: geonames_id: 1852383 geonames_name: Minato feature_code: PPL +logo_enrichment: + enrichment_timestamp: '2025-12-25T17:43:50.109236+00:00' + source_url: http://www.academyhills.com/library + extraction_method: crawl4ai + claims: + - claim_type: favicon_url + claim_value: http://www.academyhills.com/favicon.ico + source_url: http://www.academyhills.com/library + css_selector: '[document] > html > head > link:nth-of-type(4)' + retrieved_on: '2025-12-25T17:43:50.109236+00:00' + extraction_method: crawl4ai_link_rel + favicon_type: '' + favicon_sizes: '' + - claim_type: og_image_url + claim_value: https://www.academyhills.com/prefs/tqe2it00000000oc-img/tqe2it00000o4rdr.jpg + source_url: http://www.academyhills.com/library + css_selector: '[document] > html > head > meta:nth-of-type(10)' + retrieved_on: '2025-12-25T17:43:50.109236+00:00' + extraction_method: crawl4ai_meta_og + summary: + total_claims: 2 + has_primary_logo: false + has_favicon: true + has_og_image: true + favicon_count: 1 diff --git a/data/custodian/JP-13-MIN-L-FMCMJSKU.yaml b/data/custodian/JP-13-MIN-L-FMCMJSKU.yaml index ef3662d86a..0c26f3f2df 100644 --- a/data/custodian/JP-13-MIN-L-FMCMJSKU.yaml +++ b/data/custodian/JP-13-MIN-L-FMCMJSKU.yaml @@ -32,13 +32,14 @@ ghcid: method: CH_ANNOTATOR_SOURCE ghcid_history: - ghcid: JP-13-MIN-L-FMCMJSKU - valid_from: "2025-12-10T09:44:07Z" + valid_from: '2025-12-10T09:44:07Z' valid_to: null - reason: "Corrected region code from JP-TO (abbreviation) to JP-13 (Tokyo) per ISO 3166-2:JP" + reason: Corrected region code from JP-TO (abbreviation) to JP-13 (Tokyo) per ISO + 3166-2:JP - ghcid: JP-TO-MIN-L-FMCMJSKU valid_from: null - valid_to: "2025-12-10T09:44:07Z" - reason: "Previous GHCID with incorrect region code" + valid_to: '2025-12-10T09:44:07Z' + reason: Previous GHCID with incorrect region code - ghcid: JP-TO-MIN-L-FMCMJSKU ghcid_numeric: 6465543795312990924 valid_from: '2025-12-06T23:38:58.743571+00:00' @@ -96,8 +97,8 @@ ch_annotator: annotation_metadata: confidence_score: 0.98 verified: false - verification_date: - verified_by: + verification_date: null + verified_by: null entity_claims: - claim_type: full_name claim_value: Fukuzawa Memorial Center for Modern Japanese Studies, Keio University @@ -151,3 +152,28 @@ location: geonames_id: 1852383 geonames_name: Minato feature_code: PPL +logo_enrichment: + enrichment_timestamp: '2025-12-25T17:44:19.257449+00:00' + source_url: http://www.fmc.keio.ac.jp + extraction_method: crawl4ai + claims: + - claim_type: favicon_url + claim_value: http://www.fmc.keio.ac.jp/favicon.ico + source_url: http://www.fmc.keio.ac.jp + css_selector: '[document] > html.device-type-pc.device-os-mac > head > link' + retrieved_on: '2025-12-25T17:44:19.257449+00:00' + extraction_method: crawl4ai_link_rel + favicon_type: image/x-icon + favicon_sizes: '' + - claim_type: og_image_url + claim_value: https://www.fmc.keio.ac.jp/assets/ogp/ogp.png + source_url: http://www.fmc.keio.ac.jp + css_selector: '[document] > html.device-type-pc.device-os-mac > head > meta:nth-of-type(9)' + retrieved_on: '2025-12-25T17:44:19.257449+00:00' + extraction_method: crawl4ai_meta_og + summary: + total_claims: 2 + has_primary_logo: false + has_favicon: true + has_og_image: true + favicon_count: 1 diff --git a/data/custodian/JP-13-MIN-L-HRLCHRA.yaml b/data/custodian/JP-13-MIN-L-HRLCHRA.yaml index b4032bb607..70bca1095b 100644 --- a/data/custodian/JP-13-MIN-L-HRLCHRA.yaml +++ b/data/custodian/JP-13-MIN-L-HRLCHRA.yaml @@ -152,3 +152,20 @@ location: geonames_id: 1852383 geonames_name: Minato feature_code: PPL +logo_enrichment: + enrichment_timestamp: '2025-12-25T17:44:48.620567+00:00' + source_url: http://www.jinken-library.jp + extraction_method: crawl4ai + claims: + - claim_type: og_image_url + claim_value: https://www.jinken-library.jp/img/og.jpg + source_url: http://www.jinken-library.jp + css_selector: '[document] > html.lang-en > head > meta:nth-of-type(5)' + retrieved_on: '2025-12-25T17:44:48.620567+00:00' + extraction_method: crawl4ai_meta_og + summary: + total_claims: 1 + has_primary_logo: false + has_favicon: false + has_og_image: true + favicon_count: 0 diff --git a/data/custodian/JP-13-MIN-L-IDDITPS.yaml b/data/custodian/JP-13-MIN-L-IDDITPS.yaml index e8fec55fb5..a55ea16304 100644 --- a/data/custodian/JP-13-MIN-L-IDDITPS.yaml +++ b/data/custodian/JP-13-MIN-L-IDDITPS.yaml @@ -32,20 +32,22 @@ ghcid: method: CH_ANNOTATOR_SOURCE ghcid_history: - ghcid: JP-13-MIN-L-IDDITPS - valid_from: "2025-12-10T09:44:07Z" + valid_from: '2025-12-10T09:44:07Z' valid_to: null - reason: "Corrected region code from JP-TO (abbreviation) to JP-13 (Tokyo) per ISO 3166-2:JP" + reason: Corrected region code from JP-TO (abbreviation) to JP-13 (Tokyo) per ISO + 3166-2:JP - ghcid: JP-TO-MIN-L-IDDITPS valid_from: null - valid_to: "2025-12-10T09:44:07Z" - reason: "Previous GHCID with incorrect region code" + valid_to: '2025-12-10T09:44:07Z' + reason: Previous GHCID with incorrect region code - ghcid: JP-TO-MIN-L-IDDITPS ghcid_numeric: 1135214967483520450 valid_from: '2025-12-06T23:38:57.635679+00:00' reason: Initial GHCID from CH-Annotator (japan_complete_ch_annotator.yaml) custodian_name: claim_type: custodian_name - claim_value: Information and Documentation Division, Institution for Transport Policy Studies + claim_value: Information and Documentation Division, Institution for Transport Policy + Studies source_type: ch_annotator identifiers: - identifier_scheme: GHCID @@ -96,11 +98,12 @@ ch_annotator: annotation_metadata: confidence_score: 0.98 verified: false - verification_date: - verified_by: + verification_date: null + verified_by: null entity_claims: - claim_type: full_name - claim_value: Information and Documentation Division, Institution for Transport Policy Studies + claim_value: Information and Documentation Division, Institution for Transport + Policy Studies property_uri: skos:prefLabel provenance: namespace: glam @@ -151,3 +154,28 @@ location: geonames_id: 1852383 geonames_name: Minato feature_code: PPL +logo_enrichment: + enrichment_timestamp: '2025-12-25T17:44:58.296439+00:00' + source_url: https://www.jttri.or.jp/about/outline/inforlib + extraction_method: crawl4ai + claims: + - claim_type: favicon_url + claim_value: https://www.jttri.or.jp/images/favicons/safari-pinned-tab.svg + source_url: https://www.jttri.or.jp/about/outline/inforlib + css_selector: '[document] > html.js.webkit > head > link:nth-of-type(5)' + retrieved_on: '2025-12-25T17:44:58.296439+00:00' + extraction_method: crawl4ai_link_rel + favicon_type: '' + favicon_sizes: '' + - claim_type: og_image_url + claim_value: https://www.jttri.or.jp/images/favicons/ogp.png + source_url: https://www.jttri.or.jp/about/outline/inforlib + css_selector: '[document] > html.js.webkit > head > meta:nth-of-type(12)' + retrieved_on: '2025-12-25T17:44:58.296439+00:00' + extraction_method: crawl4ai_meta_og + summary: + total_claims: 2 + has_primary_logo: false + has_favicon: true + has_og_image: true + favicon_count: 5 diff --git a/data/custodian/JP-13-MIN-L-IHJL.yaml b/data/custodian/JP-13-MIN-L-IHJL.yaml index 0af2544a7d..49b9a0ea15 100644 --- a/data/custodian/JP-13-MIN-L-IHJL.yaml +++ b/data/custodian/JP-13-MIN-L-IHJL.yaml @@ -41,13 +41,14 @@ ghcid: method: CH_ANNOTATOR_SOURCE ghcid_history: - ghcid: JP-13-MIN-L-IHJL - valid_from: "2025-12-10T09:44:07Z" + valid_from: '2025-12-10T09:44:07Z' valid_to: null - reason: "Corrected region code from JP-TO (abbreviation) to JP-13 (Tokyo) per ISO 3166-2:JP" + reason: Corrected region code from JP-TO (abbreviation) to JP-13 (Tokyo) per ISO + 3166-2:JP - ghcid: JP-TO-MIN-L-IHJL valid_from: null - valid_to: "2025-12-10T09:44:07Z" - reason: "Previous GHCID with incorrect region code" + valid_to: '2025-12-10T09:44:07Z' + reason: Previous GHCID with incorrect region code - ghcid: JP-TO-MIN-L-IHJL ghcid_numeric: 8467145271040703086 valid_from: '2025-12-06T23:38:57.745870+00:00' @@ -78,7 +79,8 @@ provenance: extraction_method: 'Created from CH-Annotator file: japan_complete_ch_annotator.yaml' confidence_score: 0.98 notes: - - Removed incorrect wikidata_enrichment on 2025-12-08T08:18:48.744413+00:00. Re-enrichment required with proper matching. + - Removed incorrect wikidata_enrichment on 2025-12-08T08:18:48.744413+00:00. Re-enrichment + required with proper matching. - Canonical location normalized on 2025-12-09T12:21:54Z ch_annotator: convention_id: ch_annotator-v1_7_0 @@ -107,8 +109,8 @@ ch_annotator: annotation_metadata: confidence_score: 0.98 verified: false - verification_date: - verified_by: + verification_date: null + verified_by: null entity_claims: - claim_type: full_name claim_value: The International House of Japan Library @@ -183,8 +185,9 @@ wikidata_enrichment: instance_of: &id005 - id: Q7075 label: library - description: institution charged with the care of a collection of literary, musical, artistic, or reference materials, - such as books, manuscripts, recordings, or films + description: institution charged with the care of a collection of literary, + musical, artistic, or reference materials, such as books, manuscripts, recordings, + or films wikidata_instance_of: *id005 wikidata_location: country: &id006 @@ -210,3 +213,28 @@ location: geonames_id: 1852383 geonames_name: Minato feature_code: PPL +logo_enrichment: + enrichment_timestamp: '2025-12-25T17:45:22.114616+00:00' + source_url: http://www.i-house.or.jp/programs/library + extraction_method: crawl4ai + claims: + - claim_type: favicon_url + claim_value: http://www.i-house.or.jp/programs/wp-content/themes/programs/apple-touch-icon.png + source_url: http://www.i-house.or.jp/programs/library + css_selector: '[document] > html > head > link:nth-of-type(3)' + retrieved_on: '2025-12-25T17:45:22.114616+00:00' + extraction_method: crawl4ai_link_rel + favicon_type: '' + favicon_sizes: '' + - claim_type: og_image_url + claim_value: https://www.i-house.or.jp/programs/wp-content/uploads/2022/01/70thLogoPickCard.jpg + source_url: http://www.i-house.or.jp/programs/library + css_selector: '[document] > html > head > meta:nth-of-type(17)' + retrieved_on: '2025-12-25T17:45:22.114616+00:00' + extraction_method: crawl4ai_meta_og + summary: + total_claims: 2 + has_primary_logo: false + has_favicon: true + has_og_image: true + favicon_count: 5 diff --git a/data/custodian/JP-13-MIN-L-IL.yaml b/data/custodian/JP-13-MIN-L-IL.yaml index 73b9c7b284..5d0e36fd68 100644 --- a/data/custodian/JP-13-MIN-L-IL.yaml +++ b/data/custodian/JP-13-MIN-L-IL.yaml @@ -32,13 +32,14 @@ ghcid: method: CH_ANNOTATOR_SOURCE ghcid_history: - ghcid: JP-13-MIN-L-IL - valid_from: "2025-12-10T09:44:07Z" + valid_from: '2025-12-10T09:44:07Z' valid_to: null - reason: "Corrected region code from JP-TO (abbreviation) to JP-13 (Tokyo) per ISO 3166-2:JP" + reason: Corrected region code from JP-TO (abbreviation) to JP-13 (Tokyo) per ISO + 3166-2:JP - ghcid: JP-TO-MIN-L-IL valid_from: null - valid_to: "2025-12-10T09:44:07Z" - reason: "Previous GHCID with incorrect region code" + valid_to: '2025-12-10T09:44:07Z' + reason: Previous GHCID with incorrect region code - ghcid: JP-TO-MIN-L-IL ghcid_numeric: 3267189815043421977 valid_from: '2025-12-06T23:38:57.764127+00:00' @@ -96,8 +97,8 @@ ch_annotator: annotation_metadata: confidence_score: 0.98 verified: false - verification_date: - verified_by: + verification_date: null + verified_by: null entity_claims: - claim_type: full_name claim_value: IPPANSHADANHOJINNIHONJIDOSHAKOGYOKAIJIDOSHA Library @@ -151,3 +152,36 @@ location: geonames_id: 1852383 geonames_name: Minato feature_code: PPL +logo_enrichment: + enrichment_timestamp: '2025-12-25T17:45:29.236324+00:00' + source_url: http://www.jama.or.jp/lib/car_library/index.html + extraction_method: crawl4ai + claims: + - claim_type: logo_url + claim_value: http://www.jama.or.jp/2022common/images//logo.png + source_url: http://www.jama.or.jp/lib/car_library/index.html + css_selector: '#l2_header_ctn > header > h1 > a > img' + retrieved_on: '2025-12-25T17:45:29.236324+00:00' + extraction_method: crawl4ai_header_logo + detection_confidence: high + alt_text: 一般社団法人 日本自動車工業会 JAMA + - claim_type: favicon_url + claim_value: http://www.jama.or.jp/2022common/images/favicon/safari-pinned-tab.svg + source_url: http://www.jama.or.jp/lib/car_library/index.html + css_selector: '[document] > html > head > link:nth-of-type(5)' + retrieved_on: '2025-12-25T17:45:29.236324+00:00' + extraction_method: crawl4ai_link_rel + favicon_type: '' + favicon_sizes: '' + - claim_type: og_image_url + claim_value: https://www.jama.or.jp/images/og.png + source_url: http://www.jama.or.jp/lib/car_library/index.html + css_selector: '[document] > html > head > meta:nth-of-type(16)' + retrieved_on: '2025-12-25T17:45:29.236324+00:00' + extraction_method: crawl4ai_meta_og + summary: + total_claims: 3 + has_primary_logo: true + has_favicon: true + has_og_image: true + favicon_count: 5 diff --git a/data/custodian/JP-13-MIN-L-JAICAF.yaml b/data/custodian/JP-13-MIN-L-JAICAF.yaml index 8f26af79ce..46858e2cdd 100644 --- a/data/custodian/JP-13-MIN-L-JAICAF.yaml +++ b/data/custodian/JP-13-MIN-L-JAICAF.yaml @@ -32,20 +32,22 @@ ghcid: method: CH_ANNOTATOR_SOURCE ghcid_history: - ghcid: JP-13-MIN-L-JAICAF - valid_from: "2025-12-10T09:44:07Z" + valid_from: '2025-12-10T09:44:07Z' valid_to: null - reason: "Corrected region code from JP-TO (abbreviation) to JP-13 (Tokyo) per ISO 3166-2:JP" + reason: Corrected region code from JP-TO (abbreviation) to JP-13 (Tokyo) per ISO + 3166-2:JP - ghcid: JP-TO-MIN-L-JAICAF valid_from: null - valid_to: "2025-12-10T09:44:07Z" - reason: "Previous GHCID with incorrect region code" + valid_to: '2025-12-10T09:44:07Z' + reason: Previous GHCID with incorrect region code - ghcid: JP-TO-MIN-L-JAICAF ghcid_numeric: 2680714768289338986 valid_from: '2025-12-06T23:38:58.420483+00:00' reason: Initial GHCID from CH-Annotator (japan_complete_ch_annotator.yaml) custodian_name: claim_type: custodian_name - claim_value: Japan Association for International Collaboration of Agriculture and Forestry + claim_value: Japan Association for International Collaboration of Agriculture and + Forestry source_type: ch_annotator identifiers: - identifier_scheme: GHCID @@ -96,11 +98,12 @@ ch_annotator: annotation_metadata: confidence_score: 0.98 verified: false - verification_date: - verified_by: + verification_date: null + verified_by: null entity_claims: - claim_type: full_name - claim_value: Japan Association for International Collaboration of Agriculture and Forestry + claim_value: Japan Association for International Collaboration of Agriculture + and Forestry property_uri: skos:prefLabel provenance: namespace: glam @@ -151,3 +154,22 @@ location: geonames_id: 1852383 geonames_name: Minato feature_code: PPL +logo_enrichment: + enrichment_timestamp: '2025-12-25T17:45:49.890466+00:00' + source_url: http://www.jaicaf.or.jp + extraction_method: crawl4ai + claims: + - claim_type: favicon_url + claim_value: http://www.jaicaf.or.jp/favicons/safari-pinned-tab.svg + source_url: http://www.jaicaf.or.jp + css_selector: '[document] > html.no-touch.nonIE > head > link:nth-of-type(6)' + retrieved_on: '2025-12-25T17:45:49.890466+00:00' + extraction_method: crawl4ai_link_rel + favicon_type: '' + favicon_sizes: '' + summary: + total_claims: 1 + has_primary_logo: false + has_favicon: true + has_og_image: false + favicon_count: 5 diff --git a/data/custodian/JP-13-MIN-L-JCFRI.yaml b/data/custodian/JP-13-MIN-L-JCFRI.yaml index 1fbf8013e4..43cd4e45c1 100644 --- a/data/custodian/JP-13-MIN-L-JCFRI.yaml +++ b/data/custodian/JP-13-MIN-L-JCFRI.yaml @@ -32,13 +32,14 @@ ghcid: method: CH_ANNOTATOR_SOURCE ghcid_history: - ghcid: JP-13-MIN-L-JCFRI - valid_from: "2025-12-10T09:44:07Z" + valid_from: '2025-12-10T09:44:07Z' valid_to: null - reason: "Corrected region code from JP-TO (abbreviation) to JP-13 (Tokyo) per ISO 3166-2:JP" + reason: Corrected region code from JP-TO (abbreviation) to JP-13 (Tokyo) per ISO + 3166-2:JP - ghcid: JP-TO-MIN-L-JCFRI valid_from: null - valid_to: "2025-12-10T09:44:07Z" - reason: "Previous GHCID with incorrect region code" + valid_to: '2025-12-10T09:44:07Z' + reason: Previous GHCID with incorrect region code - ghcid: JP-TO-MIN-L-JCFRI ghcid_numeric: 18570039260989341 valid_from: '2025-12-06T23:38:57.921295+00:00' @@ -96,8 +97,8 @@ ch_annotator: annotation_metadata: confidence_score: 0.98 verified: false - verification_date: - verified_by: + verification_date: null + verified_by: null entity_claims: - claim_type: full_name claim_value: Japan Child and Family Research Institute @@ -151,3 +152,30 @@ location: geonames_id: 1852383 geonames_name: Minato feature_code: PPL +logo_enrichment: + enrichment_timestamp: '2025-12-25T17:46:09.915464+00:00' + source_url: http://www.boshiaiikukai.jp/research.html + extraction_method: crawl4ai + claims: + - claim_type: favicon_url + claim_value: https://boshiaiikukai.jp/wp/wp-content/themes/system-template/favicon/safari-pinned-tab.svg + source_url: http://www.boshiaiikukai.jp/research.html + css_selector: '[document] > html.wf-a-otf-jun-pro-n3-active.wf-fot-tsukuardgothic-std-n4-active + > head > link:nth-of-type(9)' + retrieved_on: '2025-12-25T17:46:09.915464+00:00' + extraction_method: crawl4ai_link_rel + favicon_type: '' + favicon_sizes: '' + - claim_type: og_image_url + claim_value: https://boshiaiikukai.jp/wp/wp-content/uploads/2022/12/ogp.jpg + source_url: http://www.boshiaiikukai.jp/research.html + css_selector: '[document] > html.wf-a-otf-jun-pro-n3-active.wf-fot-tsukuardgothic-std-n4-active + > head > meta:nth-of-type(10)' + retrieved_on: '2025-12-25T17:46:09.915464+00:00' + extraction_method: crawl4ai_meta_og + summary: + total_claims: 2 + has_primary_logo: false + has_favicon: true + has_og_image: true + favicon_count: 4 diff --git a/data/custodian/JP-13-MIN-L-JFTCI.yaml b/data/custodian/JP-13-MIN-L-JFTCI.yaml index ef209cc747..3b176664ef 100644 --- a/data/custodian/JP-13-MIN-L-JFTCI.yaml +++ b/data/custodian/JP-13-MIN-L-JFTCI.yaml @@ -32,13 +32,14 @@ ghcid: method: CH_ANNOTATOR_SOURCE ghcid_history: - ghcid: JP-13-MIN-L-JFTCI - valid_from: "2025-12-10T09:44:07Z" + valid_from: '2025-12-10T09:44:07Z' valid_to: null - reason: "Corrected region code from JP-TO (abbreviation) to JP-13 (Tokyo) per ISO 3166-2:JP" + reason: Corrected region code from JP-TO (abbreviation) to JP-13 (Tokyo) per ISO + 3166-2:JP - ghcid: JP-TO-MIN-L-JFTCI valid_from: null - valid_to: "2025-12-10T09:44:07Z" - reason: "Previous GHCID with incorrect region code" + valid_to: '2025-12-10T09:44:07Z' + reason: Previous GHCID with incorrect region code - ghcid: JP-TO-MIN-L-JFTCI ghcid_numeric: 12348784047314172532 valid_from: '2025-12-06T23:38:58.948479+00:00' @@ -96,8 +97,8 @@ ch_annotator: annotation_metadata: confidence_score: 0.98 verified: false - verification_date: - verified_by: + verification_date: null + verified_by: null entity_claims: - claim_type: full_name claim_value: Japan Foreign Trade Council, Inc. @@ -151,3 +152,28 @@ location: geonames_id: 1852383 geonames_name: Minato feature_code: PPL +logo_enrichment: + enrichment_timestamp: '2025-12-25T17:46:24.238729+00:00' + source_url: http://www.jftc.or.jp + extraction_method: crawl4ai + claims: + - claim_type: favicon_url + claim_value: http://www.jftc.or.jp/app-files/img/symbol/apple-touch-icon.png + source_url: http://www.jftc.or.jp + css_selector: '[document] > html > head > link:nth-of-type(3)' + retrieved_on: '2025-12-25T17:46:24.238729+00:00' + extraction_method: crawl4ai_link_rel + favicon_type: '' + favicon_sizes: '' + - claim_type: og_image_url + claim_value: https://www.jftc.or.jp/app-files/img/symbol/ogp.png + source_url: http://www.jftc.or.jp + css_selector: '[document] > html > head > meta:nth-of-type(10)' + retrieved_on: '2025-12-25T17:46:24.238729+00:00' + extraction_method: crawl4ai_meta_og + summary: + total_claims: 2 + has_primary_logo: false + has_favicon: true + has_og_image: true + favicon_count: 2 diff --git a/data/custodian/JP-13-MIN-L-JMSI.yaml b/data/custodian/JP-13-MIN-L-JMSI.yaml index ff40c1a006..d0e22c4a3a 100644 --- a/data/custodian/JP-13-MIN-L-JMSI.yaml +++ b/data/custodian/JP-13-MIN-L-JMSI.yaml @@ -32,13 +32,14 @@ ghcid: method: CH_ANNOTATOR_SOURCE ghcid_history: - ghcid: JP-13-MIN-L-JMSI - valid_from: "2025-12-10T09:44:07Z" + valid_from: '2025-12-10T09:44:07Z' valid_to: null - reason: "Corrected region code from JP-TO (abbreviation) to JP-13 (Tokyo) per ISO 3166-2:JP" + reason: Corrected region code from JP-TO (abbreviation) to JP-13 (Tokyo) per ISO + 3166-2:JP - ghcid: JP-TO-MIN-L-JMSI valid_from: null - valid_to: "2025-12-10T09:44:07Z" - reason: "Previous GHCID with incorrect region code" + valid_to: '2025-12-10T09:44:07Z' + reason: Previous GHCID with incorrect region code - ghcid: JP-TO-MIN-L-JMSI ghcid_numeric: 9368441392517881848 valid_from: '2025-12-06T23:38:57.909777+00:00' @@ -96,8 +97,8 @@ ch_annotator: annotation_metadata: confidence_score: 0.98 verified: false - verification_date: - verified_by: + verification_date: null + verified_by: null entity_claims: - claim_type: full_name claim_value: JAPAN MANAGEMENT SYSTEMS, Inc @@ -151,3 +152,28 @@ location: geonames_id: 1852383 geonames_name: Minato feature_code: PPL +logo_enrichment: + enrichment_timestamp: '2025-12-25T17:46:35.968971+00:00' + source_url: http://www.jmsinc.co.jp + extraction_method: crawl4ai + claims: + - claim_type: favicon_url + claim_value: https://www.jmsinc.co.jp/wordpress/wp-content/themes/jms2021/common/images/favicon.ico + source_url: http://www.jmsinc.co.jp + css_selector: '[document] > html.fac-js-enabled.fac-dom-loaded > head > link:nth-of-type(2)' + retrieved_on: '2025-12-25T17:46:35.968971+00:00' + extraction_method: crawl4ai_link_rel + favicon_type: image/x-icon + favicon_sizes: '' + - claim_type: og_image_url + claim_value: https://157.205.174.85/wordpress/wp-content/uploads/2021/07/logo.png + source_url: http://www.jmsinc.co.jp + css_selector: '[document] > html.fac-js-enabled.fac-dom-loaded > head > meta:nth-of-type(11)' + retrieved_on: '2025-12-25T17:46:35.968971+00:00' + extraction_method: crawl4ai_meta_og + summary: + total_claims: 2 + has_primary_logo: false + has_favicon: true + has_og_image: true + favicon_count: 1 diff --git a/data/custodian/JP-13-MIN-L-JREIL.yaml b/data/custodian/JP-13-MIN-L-JREIL.yaml index a9ad81c82f..58e1a5279d 100644 --- a/data/custodian/JP-13-MIN-L-JREIL.yaml +++ b/data/custodian/JP-13-MIN-L-JREIL.yaml @@ -32,13 +32,14 @@ ghcid: method: CH_ANNOTATOR_SOURCE ghcid_history: - ghcid: JP-13-MIN-L-JREIL - valid_from: "2025-12-10T09:44:07Z" + valid_from: '2025-12-10T09:44:07Z' valid_to: null - reason: "Corrected region code from JP-TO (abbreviation) to JP-13 (Tokyo) per ISO 3166-2:JP" + reason: Corrected region code from JP-TO (abbreviation) to JP-13 (Tokyo) per ISO + 3166-2:JP - ghcid: JP-TO-MIN-L-JREIL valid_from: null - valid_to: "2025-12-10T09:44:07Z" - reason: "Previous GHCID with incorrect region code" + valid_to: '2025-12-10T09:44:07Z' + reason: Previous GHCID with incorrect region code - ghcid: JP-TO-MIN-L-JREIL ghcid_numeric: 4416474988037649643 valid_from: '2025-12-06T23:38:57.942885+00:00' @@ -96,8 +97,8 @@ ch_annotator: annotation_metadata: confidence_score: 0.98 verified: false - verification_date: - verified_by: + verification_date: null + verified_by: null entity_claims: - claim_type: full_name claim_value: Japan Real Estate Institute Library @@ -151,3 +152,37 @@ location: geonames_id: 1852383 geonames_name: Minato feature_code: PPL +logo_enrichment: + enrichment_timestamp: '2025-12-25T17:47:03.287691+00:00' + source_url: http://www.reinet.or.jp/?page_id=346 + extraction_method: crawl4ai + claims: + - claim_type: logo_url + claim_value: http://www.reinet.or.jp/assets/images/logo.svg + source_url: http://www.reinet.or.jp/?page_id=346 + css_selector: '#home > header > nav.navbar > div.header__container > div.navbar-brand + > a > img' + retrieved_on: '2025-12-25T17:47:03.287691+00:00' + extraction_method: crawl4ai_header_logo + detection_confidence: high + alt_text: 日本不動産研究所 + - claim_type: favicon_url + claim_value: http://www.reinet.or.jp/assets/images/common/favicon.ico + source_url: http://www.reinet.or.jp/?page_id=346 + css_selector: '[document] > html > head > link:nth-of-type(3)' + retrieved_on: '2025-12-25T17:47:03.287691+00:00' + extraction_method: crawl4ai_link_rel + favicon_type: '' + favicon_sizes: '' + - claim_type: og_image_url + claim_value: http://www.reinet.or.jp/assets/images/top/kv.jpg + source_url: http://www.reinet.or.jp/?page_id=346 + css_selector: '[document] > html > head > meta:nth-of-type(11)' + retrieved_on: '2025-12-25T17:47:03.287691+00:00' + extraction_method: crawl4ai_meta_og + summary: + total_claims: 3 + has_primary_logo: true + has_favicon: true + has_og_image: true + favicon_count: 1 diff --git a/data/custodian/JP-13-MIN-L-K-kabushikigaishafujitsusokenkeizaikenkyujo.yaml b/data/custodian/JP-13-MIN-L-K-kabushikigaishafujitsusokenkeizaikenkyujo.yaml index d950b9fd17..6ffdddd432 100644 --- a/data/custodian/JP-13-MIN-L-K-kabushikigaishafujitsusokenkeizaikenkyujo.yaml +++ b/data/custodian/JP-13-MIN-L-K-kabushikigaishafujitsusokenkeizaikenkyujo.yaml @@ -32,13 +32,14 @@ ghcid: method: CH_ANNOTATOR_SOURCE ghcid_history: - ghcid: JP-13-MIN-L-K-kabushikigaishafujitsusokenkeizaikenkyujo - valid_from: "2025-12-10T09:44:07Z" + valid_from: '2025-12-10T09:44:07Z' valid_to: null - reason: "Corrected region code from JP-TO (abbreviation) to JP-13 (Tokyo) per ISO 3166-2:JP" + reason: Corrected region code from JP-TO (abbreviation) to JP-13 (Tokyo) per ISO + 3166-2:JP - ghcid: JP-TO-MIN-L-K-kabushikigaishafujitsusokenkeizaikenkyujo valid_from: null - valid_to: "2025-12-10T09:44:07Z" - reason: "Previous GHCID with incorrect region code" + valid_to: '2025-12-10T09:44:07Z' + reason: Previous GHCID with incorrect region code - ghcid: JP-TO-MIN-L-K-kabushikigaishafujitsusokenkeizaikenkyujo ghcid_numeric: 11996977972566592436 valid_from: '2025-12-06T23:38:58.959994+00:00' @@ -96,8 +97,8 @@ ch_annotator: annotation_metadata: confidence_score: 0.98 verified: false - verification_date: - verified_by: + verification_date: null + verified_by: null entity_claims: - claim_type: full_name claim_value: KABUSHIKIGAISHAFUJITSUSOKENKEIZAIKENKYUJO @@ -151,3 +152,28 @@ location: geonames_id: 1852383 geonames_name: Minato feature_code: PPL +logo_enrichment: + enrichment_timestamp: '2025-12-25T17:47:21.478122+00:00' + source_url: http://www.fujitsu.com/jp/group/fri/economic + extraction_method: crawl4ai + claims: + - claim_type: favicon_url + claim_value: http://www.fujitsu.com/-/media/Project/Fujitsu/Fujitsu-HQ/assets/img/favicon.ico?rev=ae9b6f01cab14782a4a36cde73c05d6d + source_url: http://www.fujitsu.com/jp/group/fri/economic + css_selector: '[document] > html.js.no-applicationcache > head > link:nth-of-type(5)' + retrieved_on: '2025-12-25T17:47:21.478122+00:00' + extraction_method: crawl4ai_link_rel + favicon_type: '' + favicon_sizes: '' + - claim_type: og_image_url + claim_value: https://global.fujitsu/-/media/Project/Fujitsu/shared/assets/img/ogp-image-v40.png?rev=150db6e93482478bbafa7d4a3f56c49a + source_url: http://www.fujitsu.com/jp/group/fri/economic + css_selector: '[document] > html.js.no-applicationcache > head > meta:nth-of-type(9)' + retrieved_on: '2025-12-25T17:47:21.478122+00:00' + extraction_method: crawl4ai_meta_og + summary: + total_claims: 2 + has_primary_logo: false + has_favicon: true + has_og_image: true + favicon_count: 1 diff --git a/data/custodian/JP-13-MIN-L-K.yaml b/data/custodian/JP-13-MIN-L-K.yaml index 92ff61e848..3cc3f80568 100644 --- a/data/custodian/JP-13-MIN-L-K.yaml +++ b/data/custodian/JP-13-MIN-L-K.yaml @@ -152,3 +152,38 @@ location: geonames_id: 1852383 geonames_name: Minato feature_code: PPL +logo_enrichment: + enrichment_timestamp: '2025-12-25T17:47:31.412962+00:00' + source_url: http://www.syokubunka.or.jp/library + extraction_method: crawl4ai + claims: + - claim_type: logo_url + claim_value: http://www.syokubunka.or.jp/assets/img/common/logo_w.svg + source_url: http://www.syokubunka.or.jp/library + css_selector: '#library > footer.footer.js-footer > div.inner.is-pc > nav.gnav.is-footer + > ul.gnav__list > li.gnav__item.is-footer-logoarea:nth-of-type(9) > p.gnav__logo + > a > img' + retrieved_on: '2025-12-25T17:47:31.412962+00:00' + extraction_method: crawl4ai_header_logo + detection_confidence: high + alt_text: 公益財団法人 味の素食の文化センター + - claim_type: favicon_url + claim_value: http://www.syokubunka.or.jp/assets/img/favicon/apple-touch-icon.png + source_url: http://www.syokubunka.or.jp/library + css_selector: '[document] > html > head > link:nth-of-type(2)' + retrieved_on: '2025-12-25T17:47:31.412962+00:00' + extraction_method: crawl4ai_link_rel + favicon_type: '' + favicon_sizes: 180x180 + - claim_type: og_image_url + claim_value: http://www.syokubunka.or.jp/assets/img/favicon/og_logo.png + source_url: http://www.syokubunka.or.jp/library + css_selector: '[document] > html > head > meta:nth-of-type(10)' + retrieved_on: '2025-12-25T17:47:31.412962+00:00' + extraction_method: crawl4ai_meta_og + summary: + total_claims: 3 + has_primary_logo: true + has_favicon: true + has_og_image: true + favicon_count: 2 diff --git a/data/custodian/JP-13-MIN-L-KJG.yaml b/data/custodian/JP-13-MIN-L-KJG.yaml index 28fa910b9a..650eb68556 100644 --- a/data/custodian/JP-13-MIN-L-KJG.yaml +++ b/data/custodian/JP-13-MIN-L-KJG.yaml @@ -32,13 +32,14 @@ ghcid: method: CH_ANNOTATOR_SOURCE ghcid_history: - ghcid: JP-13-MIN-L-KJG - valid_from: "2025-12-10T09:44:07Z" + valid_from: '2025-12-10T09:44:07Z' valid_to: null - reason: "Corrected region code from JP-TO (abbreviation) to JP-13 (Tokyo) per ISO 3166-2:JP" + reason: Corrected region code from JP-TO (abbreviation) to JP-13 (Tokyo) per ISO + 3166-2:JP - ghcid: JP-TO-MIN-L-KJG valid_from: null - valid_to: "2025-12-10T09:44:07Z" - reason: "Previous GHCID with incorrect region code" + valid_to: '2025-12-10T09:44:07Z' + reason: Previous GHCID with incorrect region code - ghcid: JP-TO-MIN-L-KJG ghcid_numeric: 14978577991943657211 valid_from: '2025-12-06T23:38:58.785332+00:00' @@ -96,8 +97,8 @@ ch_annotator: annotation_metadata: confidence_score: 0.98 verified: false - verification_date: - verified_by: + verification_date: null + verified_by: null entity_claims: - claim_type: full_name claim_value: KOEKIZAIDANHOJINSASAKAWASUPOTSUZAIDANTOSHO・JOHOCHOSASHITSU/GAKUYUKAN @@ -151,3 +152,28 @@ location: geonames_id: 1852383 geonames_name: Minato feature_code: PPL +logo_enrichment: + enrichment_timestamp: '2025-12-25T17:47:50.581881+00:00' + source_url: http://www.ssf.or.jp/library/tabid/635/Default.aspx + extraction_method: crawl4ai + claims: + - claim_type: favicon_url + claim_value: http://www.ssf.or.jp/apple-touch-icon.png + source_url: http://www.ssf.or.jp/library/tabid/635/Default.aspx + css_selector: '[document] > html.loading.pc > head > link:nth-of-type(2)' + retrieved_on: '2025-12-25T17:47:50.581881+00:00' + extraction_method: crawl4ai_link_rel + favicon_type: '' + favicon_sizes: 180x180 + - claim_type: og_image_url + claim_value: https://www.ssf.or.jp/ogimage.png + source_url: http://www.ssf.or.jp/library/tabid/635/Default.aspx + css_selector: '[document] > html.loading.pc > head > meta:nth-of-type(11)' + retrieved_on: '2025-12-25T17:47:50.581881+00:00' + extraction_method: crawl4ai_meta_og + summary: + total_claims: 2 + has_primary_logo: false + has_favicon: true + has_og_image: true + favicon_count: 2 diff --git a/data/custodian/JP-13-MIN-L-KUMCHO.yaml b/data/custodian/JP-13-MIN-L-KUMCHO.yaml index 2d60265bb5..bc8de9d1b5 100644 --- a/data/custodian/JP-13-MIN-L-KUMCHO.yaml +++ b/data/custodian/JP-13-MIN-L-KUMCHO.yaml @@ -205,3 +205,30 @@ location: geonames_id: 1852383 geonames_name: Minato feature_code: PPL +logo_enrichment: + enrichment_timestamp: '2025-12-25T17:48:02.594471+00:00' + source_url: http://www.lib.keio.ac.jp + extraction_method: crawl4ai + claims: + - claim_type: logo_url + claim_value: http://www.lib.keio.ac.jp/assets/images/logo.png + source_url: http://www.lib.keio.ac.jp + css_selector: '#header > h1 > a > img' + retrieved_on: '2025-12-25T17:48:02.594471+00:00' + extraction_method: crawl4ai_header_logo + detection_confidence: high + alt_text: 慶応義塾大学 メディアセンター + - claim_type: favicon_url + claim_value: http://www.lib.keio.ac.jp/assets/images/favicon.ico + source_url: http://www.lib.keio.ac.jp + css_selector: '[document] > html > head > link:nth-of-type(7)' + retrieved_on: '2025-12-25T17:48:02.594471+00:00' + extraction_method: crawl4ai_link_rel + favicon_type: image/x-icon + favicon_sizes: '' + summary: + total_claims: 2 + has_primary_logo: true + has_favicon: true + has_og_image: false + favicon_count: 1 diff --git a/data/custodian/JP-13-MIN-L-LGSTEU.yaml b/data/custodian/JP-13-MIN-L-LGSTEU.yaml index 183221bed3..341be633bd 100644 --- a/data/custodian/JP-13-MIN-L-LGSTEU.yaml +++ b/data/custodian/JP-13-MIN-L-LGSTEU.yaml @@ -37,13 +37,14 @@ ghcid: method: CH_ANNOTATOR_SOURCE ghcid_history: - ghcid: JP-13-MIN-L-LGSTEU - valid_from: "2025-12-10T09:44:07Z" + valid_from: '2025-12-10T09:44:07Z' valid_to: null - reason: "Corrected region code from JP-TO (abbreviation) to JP-13 (Tokyo) per ISO 3166-2:JP" + reason: Corrected region code from JP-TO (abbreviation) to JP-13 (Tokyo) per ISO + 3166-2:JP - ghcid: JP-TO-MIN-L-LGSTEU valid_from: null - valid_to: "2025-12-10T09:44:07Z" - reason: "Previous GHCID with incorrect region code" + valid_to: '2025-12-10T09:44:07Z' + reason: Previous GHCID with incorrect region code - ghcid: JP-TO-MIN-L-LGSTEU ghcid_numeric: 409731614087924814 valid_from: '2025-12-06T23:38:55.596825+00:00' @@ -101,8 +102,8 @@ ch_annotator: annotation_metadata: confidence_score: 0.98 verified: false - verification_date: - verified_by: + verification_date: null + verified_by: null entity_claims: - claim_type: full_name claim_value: Library of Graduate School, Toyo Eiwa University @@ -204,3 +205,37 @@ location: geonames_id: 1852383 geonames_name: Minato feature_code: PPL +logo_enrichment: + enrichment_timestamp: '2025-12-25T17:49:15.807028+00:00' + source_url: http://www.toyoeiwa.ac.jp/daigaku/shisetsu/library + extraction_method: crawl4ai + claims: + - claim_type: logo_url + claim_value: http://www.toyoeiwa.ac.jp/daigaku/assets/img/shared/logo.png + source_url: http://www.toyoeiwa.ac.jp/daigaku/shisetsu/library + css_selector: '#header_inc > header.header > div.header_nav_bg > div.header_col01 + > a.logo > img' + retrieved_on: '2025-12-25T17:49:15.807028+00:00' + extraction_method: crawl4ai_header_logo + detection_confidence: high + alt_text: 東洋英和女学院大学 + - claim_type: favicon_url + claim_value: https://www.toyoeiwa.ac.jp/daigaku/assets/img/shared/appletouch.png + source_url: http://www.toyoeiwa.ac.jp/daigaku/shisetsu/library + css_selector: '[document] > html > head > link:nth-of-type(3)' + retrieved_on: '2025-12-25T17:49:15.807028+00:00' + extraction_method: crawl4ai_link_rel + favicon_type: '' + favicon_sizes: '' + - claim_type: og_image_url + claim_value: https://www.toyoeiwa.ac.jp/daigaku/assets/img/shared/ogp.jpg + source_url: http://www.toyoeiwa.ac.jp/daigaku/shisetsu/library + css_selector: '[document] > html > head > meta:nth-of-type(14)' + retrieved_on: '2025-12-25T17:49:15.807028+00:00' + extraction_method: crawl4ai_meta_og + summary: + total_claims: 3 + has_primary_logo: true + has_favicon: true + has_og_image: true + favicon_count: 3 diff --git a/data/custodian/JP-13-MIN-L-LTCJTBF.yaml b/data/custodian/JP-13-MIN-L-LTCJTBF.yaml index 12cf771350..081e8c3f4b 100644 --- a/data/custodian/JP-13-MIN-L-LTCJTBF.yaml +++ b/data/custodian/JP-13-MIN-L-LTCJTBF.yaml @@ -32,13 +32,14 @@ ghcid: method: CH_ANNOTATOR_SOURCE ghcid_history: - ghcid: JP-13-MIN-L-LTCJTBF - valid_from: "2025-12-10T09:44:07Z" + valid_from: '2025-12-10T09:44:07Z' valid_to: null - reason: "Corrected region code from JP-TO (abbreviation) to JP-13 (Tokyo) per ISO 3166-2:JP" + reason: Corrected region code from JP-TO (abbreviation) to JP-13 (Tokyo) per ISO + 3166-2:JP - ghcid: JP-TO-MIN-L-LTCJTBF valid_from: null - valid_to: "2025-12-10T09:44:07Z" - reason: "Previous GHCID with incorrect region code" + valid_to: '2025-12-10T09:44:07Z' + reason: Previous GHCID with incorrect region code - ghcid: JP-TO-MIN-L-LTCJTBF ghcid_numeric: 10511543912303115293 valid_from: '2025-12-06T23:38:58.040816+00:00' @@ -96,8 +97,8 @@ ch_annotator: annotation_metadata: confidence_score: 0.98 verified: false - verification_date: - verified_by: + verification_date: null + verified_by: null entity_claims: - claim_type: full_name claim_value: Library of Tourism & Culture, Japan Travel Bureau Foundation @@ -151,3 +152,28 @@ location: geonames_id: 1852383 geonames_name: Minato feature_code: PPL +logo_enrichment: + enrichment_timestamp: '2025-12-25T17:49:28.135031+00:00' + source_url: http://www.jtb.or.jp/library + extraction_method: crawl4ai + claims: + - claim_type: favicon_url + claim_value: https://www.jtb.or.jp/library/wp-content/themes/jtbf-library/favicon.ico + source_url: http://www.jtb.or.jp/library + css_selector: '[document] > html > head > link' + retrieved_on: '2025-12-25T17:49:28.135031+00:00' + extraction_method: crawl4ai_link_rel + favicon_type: '' + favicon_sizes: '' + - claim_type: og_image_url + claim_value: https://www.jtb.or.jp/library/wp-content/themes/jtbf-library/img/og-logo.png + source_url: http://www.jtb.or.jp/library + css_selector: '[document] > html > head > meta:nth-of-type(5)' + retrieved_on: '2025-12-25T17:49:28.135031+00:00' + extraction_method: crawl4ai_meta_og + summary: + total_claims: 2 + has_primary_logo: false + has_favicon: true + has_og_image: true + favicon_count: 1 diff --git a/data/custodian/JP-13-MIN-L-MCPS.yaml b/data/custodian/JP-13-MIN-L-MCPS.yaml index 2785e62cff..8c3fe3f3e8 100644 --- a/data/custodian/JP-13-MIN-L-MCPS.yaml +++ b/data/custodian/JP-13-MIN-L-MCPS.yaml @@ -37,13 +37,14 @@ ghcid: method: CH_ANNOTATOR_SOURCE ghcid_history: - ghcid: JP-13-MIN-L-MCPS - valid_from: "2025-12-10T09:44:07Z" + valid_from: '2025-12-10T09:44:07Z' valid_to: null - reason: "Corrected region code from JP-TO (abbreviation) to JP-13 (Tokyo) per ISO 3166-2:JP" + reason: Corrected region code from JP-TO (abbreviation) to JP-13 (Tokyo) per ISO + 3166-2:JP - ghcid: JP-TO-MIN-L-MCPS valid_from: null - valid_to: "2025-12-10T09:44:07Z" - reason: "Previous GHCID with incorrect region code" + valid_to: '2025-12-10T09:44:07Z' + reason: Previous GHCID with incorrect region code - ghcid: JP-TO-MIN-L-MCPS ghcid_numeric: 10236622895335185370 valid_from: '2025-12-06T23:38:54.875826+00:00' @@ -101,8 +102,8 @@ ch_annotator: annotation_metadata: confidence_score: 0.98 verified: false - verification_date: - verified_by: + verification_date: null + verified_by: null entity_claims: - claim_type: full_name claim_value: Media Center for Pharmaceutical Sciences @@ -164,7 +165,8 @@ wikidata_enrichment: wikidata_labels: en: Keio University Information and Media Center for Pharmaceutical Sciences ja: 慶應義塾大学薬学メディアセンター - wikidata_label_en: Keio University Information and Media Center for Pharmaceutical Sciences + wikidata_label_en: Keio University Information and Media Center for Pharmaceutical + Sciences wikidata_label_ja: 慶應義塾大学薬学メディアセンター wikidata_classification: instance_of: &id004 @@ -204,3 +206,30 @@ location: geonames_id: 1852383 geonames_name: Minato feature_code: PPL +logo_enrichment: + enrichment_timestamp: '2025-12-25T17:50:01.314984+00:00' + source_url: https://www.lib.keio.ac.jp/pha/index.html + extraction_method: crawl4ai + claims: + - claim_type: logo_url + claim_value: https://www.lib.keio.ac.jp/assets/images/logo.png + source_url: https://www.lib.keio.ac.jp/pha/index.html + css_selector: '#header > h1 > a > img' + retrieved_on: '2025-12-25T17:50:01.314984+00:00' + extraction_method: crawl4ai_header_logo + detection_confidence: high + alt_text: 慶応義塾大学 メディアセンター + - claim_type: favicon_url + claim_value: https://www.lib.keio.ac.jp/assets/images/favicon.ico + source_url: https://www.lib.keio.ac.jp/pha/index.html + css_selector: '[document] > html > head > link:nth-of-type(5)' + retrieved_on: '2025-12-25T17:50:01.314984+00:00' + extraction_method: crawl4ai_link_rel + favicon_type: image/x-icon + favicon_sizes: '' + summary: + total_claims: 2 + has_primary_logo: true + has_favicon: true + has_og_image: false + favicon_count: 1 diff --git a/data/custodian/JP-13-MIN-L-MGUSCL.yaml b/data/custodian/JP-13-MIN-L-MGUSCL.yaml index c5807a4f6b..3428ff9e97 100644 --- a/data/custodian/JP-13-MIN-L-MGUSCL.yaml +++ b/data/custodian/JP-13-MIN-L-MGUSCL.yaml @@ -37,13 +37,14 @@ ghcid: method: CH_ANNOTATOR_SOURCE ghcid_history: - ghcid: JP-13-MIN-L-MGUSCL - valid_from: "2025-12-10T09:44:07Z" + valid_from: '2025-12-10T09:44:07Z' valid_to: null - reason: "Corrected region code from JP-TO (abbreviation) to JP-13 (Tokyo) per ISO 3166-2:JP" + reason: Corrected region code from JP-TO (abbreviation) to JP-13 (Tokyo) per ISO + 3166-2:JP - ghcid: JP-TO-MIN-L-MGUSCL valid_from: null - valid_to: "2025-12-10T09:44:07Z" - reason: "Previous GHCID with incorrect region code" + valid_to: '2025-12-10T09:44:07Z' + reason: Previous GHCID with incorrect region code - ghcid: JP-TO-MIN-L-MGUSCL ghcid_numeric: 3109651456540934719 valid_from: '2025-12-06T23:38:55.304702+00:00' @@ -101,8 +102,8 @@ ch_annotator: annotation_metadata: confidence_score: 0.98 verified: false - verification_date: - verified_by: + verification_date: null + verified_by: null entity_claims: - claim_type: full_name claim_value: Meiji Gakuin University Shirokane Campus Library @@ -204,3 +205,28 @@ location: geonames_id: 1852383 geonames_name: Minato feature_code: PPL +logo_enrichment: + enrichment_timestamp: '2025-12-25T17:50:23.322858+00:00' + source_url: http://www.meijigakuin.ac.jp/library + extraction_method: crawl4ai + claims: + - claim_type: favicon_url + claim_value: http://www.meijigakuin.ac.jp/common/favicon.ico + source_url: http://www.meijigakuin.ac.jp/library + css_selector: '[document] > html.no-js > head > link' + retrieved_on: '2025-12-25T17:50:23.322858+00:00' + extraction_method: crawl4ai_link_rel + favicon_type: '' + favicon_sizes: '' + - claim_type: og_image_url + claim_value: https://www.meijigakuin.ac.jp/downloads/screen/downloads/MG_Desktop_picture.jpg + source_url: http://www.meijigakuin.ac.jp/library + css_selector: '[document] > html.no-js > head > meta:nth-of-type(17)' + retrieved_on: '2025-12-25T17:50:23.322858+00:00' + extraction_method: crawl4ai_meta_og + summary: + total_claims: 2 + has_primary_logo: false + has_favicon: true + has_og_image: true + favicon_count: 1 diff --git a/data/custodian/JP-13-MIN-L-MIL.yaml b/data/custodian/JP-13-MIN-L-MIL.yaml index e291de5fcd..fc7e2f4fa7 100644 --- a/data/custodian/JP-13-MIN-L-MIL.yaml +++ b/data/custodian/JP-13-MIN-L-MIL.yaml @@ -32,13 +32,14 @@ ghcid: method: CH_ANNOTATOR_SOURCE ghcid_history: - ghcid: JP-13-MIN-L-MIL - valid_from: "2025-12-10T09:44:07Z" + valid_from: '2025-12-10T09:44:07Z' valid_to: null - reason: "Corrected region code from JP-TO (abbreviation) to JP-13 (Tokyo) per ISO 3166-2:JP" + reason: Corrected region code from JP-TO (abbreviation) to JP-13 (Tokyo) per ISO + 3166-2:JP - ghcid: JP-TO-MIN-L-MIL valid_from: null - valid_to: "2025-12-10T09:44:07Z" - reason: "Previous GHCID with incorrect region code" + valid_to: '2025-12-10T09:44:07Z' + reason: Previous GHCID with incorrect region code - ghcid: JP-TO-MIN-L-MIL ghcid_numeric: 3805559297582869883 valid_from: '2025-12-06T23:38:58.726136+00:00' @@ -96,8 +97,8 @@ ch_annotator: annotation_metadata: confidence_score: 0.98 verified: false - verification_date: - verified_by: + verification_date: null + verified_by: null entity_claims: - claim_type: full_name claim_value: Mecenat Information Library @@ -151,3 +152,30 @@ location: geonames_id: 1852383 geonames_name: Minato feature_code: PPL +logo_enrichment: + enrichment_timestamp: '2025-12-25T17:50:35.792123+00:00' + source_url: http://www.mecenat.or.jp/ja/introduction/post/library + extraction_method: crawl4ai + claims: + - claim_type: logo_url + claim_value: https://www.mecenat.or.jp/ja/wp-content/themes/mecenat/images/common/logo.svg + source_url: http://www.mecenat.or.jp/ja/introduction/post/library + css_selector: '#logo > a > img' + retrieved_on: '2025-12-25T17:50:35.792123+00:00' + extraction_method: crawl4ai_header_logo + detection_confidence: high + alt_text: 公益社団法人 企業メセナ協議会 + - claim_type: favicon_url + claim_value: http://www.mecenat.or.jp/test/wp-content/uploads/fbrfg/apple-touch-icon.png + source_url: http://www.mecenat.or.jp/ja/introduction/post/library + css_selector: '[document] > html > head > link:nth-of-type(16)' + retrieved_on: '2025-12-25T17:50:35.792123+00:00' + extraction_method: crawl4ai_link_rel + favicon_type: '' + favicon_sizes: 76x76 + summary: + total_claims: 2 + has_primary_logo: true + has_favicon: true + has_og_image: false + favicon_count: 4 diff --git a/data/custodian/JP-13-MIN-L-NCACL.yaml b/data/custodian/JP-13-MIN-L-NCACL.yaml index be7c57efff..f45dff0015 100644 --- a/data/custodian/JP-13-MIN-L-NCACL.yaml +++ b/data/custodian/JP-13-MIN-L-NCACL.yaml @@ -32,13 +32,14 @@ ghcid: method: CH_ANNOTATOR_SOURCE ghcid_history: - ghcid: JP-13-MIN-L-NCACL - valid_from: "2025-12-10T09:44:07Z" + valid_from: '2025-12-10T09:44:07Z' valid_to: null - reason: "Corrected region code from JP-TO (abbreviation) to JP-13 (Tokyo) per ISO 3166-2:JP" + reason: Corrected region code from JP-TO (abbreviation) to JP-13 (Tokyo) per ISO + 3166-2:JP - ghcid: JP-TO-MIN-L-NCACL valid_from: null - valid_to: "2025-12-10T09:44:07Z" - reason: "Previous GHCID with incorrect region code" + valid_to: '2025-12-10T09:44:07Z' + reason: Previous GHCID with incorrect region code - ghcid: JP-TO-MIN-L-NCACL ghcid_numeric: 13375768500732348979 valid_from: '2025-12-06T23:38:57.751601+00:00' @@ -96,8 +97,8 @@ ch_annotator: annotation_metadata: confidence_score: 0.98 verified: false - verification_date: - verified_by: + verification_date: null + verified_by: null entity_claims: - claim_type: full_name claim_value: National Consumer Affairs Center Library @@ -151,3 +152,22 @@ location: geonames_id: 1852383 geonames_name: Minato feature_code: PPL +logo_enrichment: + enrichment_timestamp: '2025-12-25T17:50:53.837259+00:00' + source_url: http://www.kokusen.go.jp/index.html + extraction_method: crawl4ai + claims: + - claim_type: logo_url + claim_value: http://www.kokusen.go.jp/images/logo.jpg + source_url: http://www.kokusen.go.jp/index.html + css_selector: '#head_logo_sp > img' + retrieved_on: '2025-12-25T17:50:53.837259+00:00' + extraction_method: crawl4ai_header_logo + detection_confidence: high + alt_text: 独立行政法人国民生活センター + summary: + total_claims: 1 + has_primary_logo: true + has_favicon: false + has_og_image: false + favicon_count: 0 diff --git a/data/custodian/JP-13-MIN-L-NRASR.yaml b/data/custodian/JP-13-MIN-L-NRASR.yaml index 23592cf4cb..cd3dcc52ca 100644 --- a/data/custodian/JP-13-MIN-L-NRASR.yaml +++ b/data/custodian/JP-13-MIN-L-NRASR.yaml @@ -32,13 +32,14 @@ ghcid: method: CH_ANNOTATOR_SOURCE ghcid_history: - ghcid: JP-13-MIN-L-NRASR - valid_from: "2025-12-10T09:44:07Z" + valid_from: '2025-12-10T09:44:07Z' valid_to: null - reason: "Corrected region code from JP-TO (abbreviation) to JP-13 (Tokyo) per ISO 3166-2:JP" + reason: Corrected region code from JP-TO (abbreviation) to JP-13 (Tokyo) per ISO + 3166-2:JP - ghcid: JP-TO-MIN-L-NRASR valid_from: null - valid_to: "2025-12-10T09:44:07Z" - reason: "Previous GHCID with incorrect region code" + valid_to: '2025-12-10T09:44:07Z' + reason: Previous GHCID with incorrect region code - ghcid: JP-TO-MIN-L-NRASR ghcid_numeric: 15266943249472025697 valid_from: '2025-12-06T23:38:59.863634+00:00' @@ -96,8 +97,8 @@ ch_annotator: annotation_metadata: confidence_score: 0.98 verified: false - verification_date: - verified_by: + verification_date: null + verified_by: null entity_claims: - claim_type: full_name claim_value: Nuclear Regulation Authority, Study Room @@ -151,3 +152,22 @@ location: geonames_id: 1852383 geonames_name: Minato feature_code: PPL +logo_enrichment: + enrichment_timestamp: '2025-12-25T17:51:13.648477+00:00' + source_url: https://www.nsr.go.jp + extraction_method: crawl4ai + claims: + - claim_type: favicon_url + claim_value: https://www.nsr.go.jp/data/900000009.png + source_url: https://www.nsr.go.jp + css_selector: '[document] > html > head > link' + retrieved_on: '2025-12-25T17:51:13.648477+00:00' + extraction_method: crawl4ai_link_rel + favicon_type: '' + favicon_sizes: '' + summary: + total_claims: 1 + has_primary_logo: false + has_favicon: true + has_og_image: false + favicon_count: 2 diff --git a/data/custodian/JP-13-MIN-L-O.yaml b/data/custodian/JP-13-MIN-L-O.yaml index b140ce029f..19921cbf4a 100644 --- a/data/custodian/JP-13-MIN-L-O.yaml +++ b/data/custodian/JP-13-MIN-L-O.yaml @@ -37,13 +37,14 @@ ghcid: method: CH_ANNOTATOR_SOURCE ghcid_history: - ghcid: JP-13-MIN-L-O - valid_from: "2025-12-10T09:44:07Z" + valid_from: '2025-12-10T09:44:07Z' valid_to: null - reason: "Corrected region code from JP-TO (abbreviation) to JP-13 (Tokyo) per ISO 3166-2:JP" + reason: Corrected region code from JP-TO (abbreviation) to JP-13 (Tokyo) per ISO + 3166-2:JP - ghcid: JP-TO-MIN-L-O valid_from: null - valid_to: "2025-12-10T09:44:07Z" - reason: "Previous GHCID with incorrect region code" + valid_to: '2025-12-10T09:44:07Z' + reason: Previous GHCID with incorrect region code - ghcid: JP-TO-MIN-L-O ghcid_numeric: 10266948521185033762 valid_from: '2025-12-06T23:38:56.146424+00:00' @@ -101,8 +102,8 @@ ch_annotator: annotation_metadata: confidence_score: 0.98 verified: false - verification_date: - verified_by: + verification_date: null + verified_by: null entity_claims: - claim_type: full_name claim_value: OSAKAKEIZAIHOKADAIGAKUAJIATAIHEIYOKENKYUSENTA @@ -204,3 +205,28 @@ location: geonames_id: 1852383 geonames_name: Minato feature_code: PPL +logo_enrichment: + enrichment_timestamp: '2025-12-25T17:51:28.805130+00:00' + source_url: http://www.keiho-u.ac.jp/research/asia-pacific + extraction_method: crawl4ai + claims: + - claim_type: favicon_url + claim_value: http://www.keiho-u.ac.jp/otsaen000000003j-img/otsaen000000006t.png + source_url: http://www.keiho-u.ac.jp/research/asia-pacific + css_selector: '[document] > html > head > link:nth-of-type(3)' + retrieved_on: '2025-12-25T17:51:28.805130+00:00' + extraction_method: crawl4ai_link_rel + favicon_type: '' + favicon_sizes: '' + - claim_type: og_image_url + claim_value: https://www.keiho-u.ac.jp/otsaen000000003j-img/otsaen000000006y.png + source_url: http://www.keiho-u.ac.jp/research/asia-pacific + css_selector: '[document] > html > head > meta:nth-of-type(11)' + retrieved_on: '2025-12-25T17:51:28.805130+00:00' + extraction_method: crawl4ai_meta_og + summary: + total_claims: 2 + has_primary_logo: false + has_favicon: true + has_og_image: true + favicon_count: 2 diff --git a/data/custodian/JP-13-MIN-L-RICE.yaml b/data/custodian/JP-13-MIN-L-RICE.yaml index 31a208e1f9..aafcc08dd5 100644 --- a/data/custodian/JP-13-MIN-L-RICE.yaml +++ b/data/custodian/JP-13-MIN-L-RICE.yaml @@ -32,13 +32,14 @@ ghcid: method: CH_ANNOTATOR_SOURCE ghcid_history: - ghcid: JP-13-MIN-L-RICE - valid_from: "2025-12-10T09:44:07Z" + valid_from: '2025-12-10T09:44:07Z' valid_to: null - reason: "Corrected region code from JP-TO (abbreviation) to JP-13 (Tokyo) per ISO 3166-2:JP" + reason: Corrected region code from JP-TO (abbreviation) to JP-13 (Tokyo) per ISO + 3166-2:JP - ghcid: JP-TO-MIN-L-RICE valid_from: null - valid_to: "2025-12-10T09:44:07Z" - reason: "Previous GHCID with incorrect region code" + valid_to: '2025-12-10T09:44:07Z' + reason: Previous GHCID with incorrect region code - ghcid: JP-TO-MIN-L-RICE ghcid_numeric: 10954120538049895824 valid_from: '2025-12-06T23:38:58.750484+00:00' @@ -96,8 +97,8 @@ ch_annotator: annotation_metadata: confidence_score: 0.98 verified: false - verification_date: - verified_by: + verification_date: null + verified_by: null entity_claims: - claim_type: full_name claim_value: Research Institute of Construction and Economy @@ -151,3 +152,22 @@ location: geonames_id: 1852383 geonames_name: Minato feature_code: PPL +logo_enrichment: + enrichment_timestamp: '2025-12-25T17:51:42.655762+00:00' + source_url: http://www.rice.or.jp/index.html + extraction_method: crawl4ai + claims: + - claim_type: favicon_url + claim_value: https://www.rice.or.jp/wp-content/uploads/2021/06/メインロゴ.png + source_url: http://www.rice.or.jp/index.html + css_selector: '[document] > html > head > link:nth-of-type(16)' + retrieved_on: '2025-12-25T17:51:42.655762+00:00' + extraction_method: crawl4ai_link_rel + favicon_type: '' + favicon_sizes: 32x32 + summary: + total_claims: 1 + has_primary_logo: false + has_favicon: true + has_og_image: false + favicon_count: 1 diff --git a/data/custodian/JP-13-MIN-L-SL-shibaurakogyodaigakugakujutsujohosentashibaura_lib.yaml b/data/custodian/JP-13-MIN-L-SL-shibaurakogyodaigakugakujutsujohosentashibaura_lib.yaml index 03d19fd38a..a100937a26 100644 --- a/data/custodian/JP-13-MIN-L-SL-shibaurakogyodaigakugakujutsujohosentashibaura_lib.yaml +++ b/data/custodian/JP-13-MIN-L-SL-shibaurakogyodaigakugakujutsujohosentashibaura_lib.yaml @@ -37,13 +37,14 @@ ghcid: method: CH_ANNOTATOR_SOURCE ghcid_history: - ghcid: JP-13-MIN-L-SL-shibaurakogyodaigakugakujutsujohosentashibaura_lib - valid_from: "2025-12-10T09:44:07Z" + valid_from: '2025-12-10T09:44:07Z' valid_to: null - reason: "Corrected region code from JP-TO (abbreviation) to JP-13 (Tokyo) per ISO 3166-2:JP" + reason: Corrected region code from JP-TO (abbreviation) to JP-13 (Tokyo) per ISO + 3166-2:JP - ghcid: JP-TO-MIN-L-SL-shibaurakogyodaigakugakujutsujohosentashibaura_lib valid_from: null - valid_to: "2025-12-10T09:44:07Z" - reason: "Previous GHCID with incorrect region code" + valid_to: '2025-12-10T09:44:07Z' + reason: Previous GHCID with incorrect region code - ghcid: JP-TO-MIN-L-SL-shibaurakogyodaigakugakujutsujohosentashibaura_lib ghcid_numeric: 16700111484363270676 valid_from: '2025-12-06T23:38:54.935087+00:00' @@ -101,8 +102,8 @@ ch_annotator: annotation_metadata: confidence_score: 0.98 verified: false - verification_date: - verified_by: + verification_date: null + verified_by: null entity_claims: - claim_type: full_name claim_value: SHIBAURAKOGYODAIGAKUGAKUJUTSUJOHOSENTASHIBAURA Library @@ -204,3 +205,22 @@ location: geonames_id: 1852383 geonames_name: Minato feature_code: PPL +logo_enrichment: + enrichment_timestamp: '2025-12-25T17:52:06.014624+00:00' + source_url: http://lib.shibaura-it.ac.jp + extraction_method: crawl4ai + claims: + - claim_type: favicon_url + claim_value: http://lib.shibaura-it.ac.jp/files/images/favicon.ico + source_url: http://lib.shibaura-it.ac.jp + css_selector: '[document] > html > head > link' + retrieved_on: '2025-12-25T17:52:06.014624+00:00' + extraction_method: crawl4ai_link_rel + favicon_type: '' + favicon_sizes: '' + summary: + total_claims: 1 + has_primary_logo: false + has_favicon: true + has_og_image: false + favicon_count: 1 diff --git a/data/custodian/JP-13-MIN-L-TL.yaml b/data/custodian/JP-13-MIN-L-TL.yaml index 570212c89b..91d6e12f91 100644 --- a/data/custodian/JP-13-MIN-L-TL.yaml +++ b/data/custodian/JP-13-MIN-L-TL.yaml @@ -32,13 +32,14 @@ ghcid: method: CH_ANNOTATOR_SOURCE ghcid_history: - ghcid: JP-13-MIN-L-TL - valid_from: "2025-12-10T09:44:07Z" + valid_from: '2025-12-10T09:44:07Z' valid_to: null - reason: "Corrected region code from JP-TO (abbreviation) to JP-13 (Tokyo) per ISO 3166-2:JP" + reason: Corrected region code from JP-TO (abbreviation) to JP-13 (Tokyo) per ISO + 3166-2:JP - ghcid: JP-TO-MIN-L-TL valid_from: null - valid_to: "2025-12-10T09:44:07Z" - reason: "Previous GHCID with incorrect region code" + valid_to: '2025-12-10T09:44:07Z' + reason: Previous GHCID with incorrect region code - ghcid: JP-TO-MIN-L-TL ghcid_numeric: 9847004342569204196 valid_from: '2025-12-06T23:38:58.326189+00:00' @@ -96,8 +97,8 @@ ch_annotator: annotation_metadata: confidence_score: 0.98 verified: false - verification_date: - verified_by: + verification_date: null + verified_by: null entity_claims: - claim_type: full_name claim_value: TOKYODOITSUBUNKASENTA Library @@ -151,3 +152,22 @@ location: geonames_id: 1852383 geonames_name: Minato feature_code: PPL +logo_enrichment: + enrichment_timestamp: '2025-12-25T17:52:44.331878+00:00' + source_url: http://www.goethe.de/ins/jp/ja/tok/bib.html + extraction_method: crawl4ai + claims: + - claim_type: favicon_url + claim_value: http://www.goethe.de/resources/relaunch/favicon/safari-pinned-tab.svg + source_url: http://www.goethe.de/ins/jp/ja/tok/bib.html + css_selector: '[document] > html.gi-header-v3 > head > link:nth-of-type(6)' + retrieved_on: '2025-12-25T17:52:44.331878+00:00' + extraction_method: crawl4ai_link_rel + favicon_type: '' + favicon_sizes: '' + summary: + total_claims: 1 + has_primary_logo: false + has_favicon: true + has_og_image: false + favicon_count: 5 diff --git a/data/custodian/JP-13-MIN-L-TMCL.yaml b/data/custodian/JP-13-MIN-L-TMCL.yaml index cba7184b59..193979ac9c 100644 --- a/data/custodian/JP-13-MIN-L-TMCL.yaml +++ b/data/custodian/JP-13-MIN-L-TMCL.yaml @@ -43,13 +43,14 @@ ghcid: method: CH_ANNOTATOR_SOURCE ghcid_history: - ghcid: JP-13-MIN-L-TMCL - valid_from: "2025-12-10T09:44:07Z" + valid_from: '2025-12-10T09:44:07Z' valid_to: null - reason: "Corrected region code from JP-TO (abbreviation) to JP-13 (Tokyo) per ISO 3166-2:JP" + reason: Corrected region code from JP-TO (abbreviation) to JP-13 (Tokyo) per ISO + 3166-2:JP - ghcid: JP-TO-MIN-L-TMCL valid_from: null - valid_to: "2025-12-10T09:44:07Z" - reason: "Previous GHCID with incorrect region code" + valid_to: '2025-12-10T09:44:07Z' + reason: Previous GHCID with incorrect region code - ghcid: JP-TO-MIN-L-TMCL ghcid_numeric: 13030027904128279481 valid_from: '2025-12-06T23:38:43.106433+00:00' @@ -108,8 +109,8 @@ ch_annotator: annotation_metadata: confidence_score: 0.98 verified: false - verification_date: - verified_by: + verification_date: null + verified_by: null entity_claims: - claim_type: full_name claim_value: Tokyo Metropolitan Central Library @@ -227,8 +228,8 @@ wikidata_enrichment: instance_of: &id005 - id: Q12317349 label: main library - description: most important public library in a municipality and/or library system that has several libraries or library - campuses + description: most important public library in a municipality and/or library + system that has several libraries or library campuses - id: Q11582691 label: prefectural library of Japan description: 都道府県が設置する図書館 @@ -286,3 +287,36 @@ location: postal_code: 106-8575 street_address: 5-7-13 MINAMIAZABU, Minato Ku, Tokyo To, 106-8575 normalization_timestamp: '2025-12-09T12:21:56.622265+00:00' +logo_enrichment: + enrichment_timestamp: '2025-12-25T17:52:52.857689+00:00' + source_url: https://www.library.metro.tokyo.lg.jp + extraction_method: crawl4ai + claims: + - claim_type: logo_url + claim_value: https://www.library.metro.tokyo.lg.jp/common/img/logo.png + source_url: https://www.library.metro.tokyo.lg.jp + css_selector: '#header > div.header__body > div.header__left > h1.logo > a > img' + retrieved_on: '2025-12-25T17:52:52.857689+00:00' + extraction_method: crawl4ai_header_logo + detection_confidence: high + alt_text: 東京都立図書館 + - claim_type: favicon_url + claim_value: https://www.library.metro.tokyo.lg.jp/common/img/favicon/favicon.ico + source_url: https://www.library.metro.tokyo.lg.jp + css_selector: '[document] > html.js.flexbox > head > link' + retrieved_on: '2025-12-25T17:52:52.857689+00:00' + extraction_method: crawl4ai_link_rel + favicon_type: image/vnd.microsoft.icon + favicon_sizes: '' + - claim_type: og_image_url + claim_value: https://www.library.metro.tokyo.lg.jp/common/img/ogp.png + source_url: https://www.library.metro.tokyo.lg.jp + css_selector: '[document] > html.js.flexbox > head > meta:nth-of-type(9)' + retrieved_on: '2025-12-25T17:52:52.857689+00:00' + extraction_method: crawl4ai_meta_og + summary: + total_claims: 3 + has_primary_logo: true + has_favicon: true + has_og_image: true + favicon_count: 1 diff --git a/data/custodian/JP-13-MIN-L-TUMSTL.yaml b/data/custodian/JP-13-MIN-L-TUMSTL.yaml index 2229763020..83a498ec7f 100644 --- a/data/custodian/JP-13-MIN-L-TUMSTL.yaml +++ b/data/custodian/JP-13-MIN-L-TUMSTL.yaml @@ -37,13 +37,14 @@ ghcid: method: CH_ANNOTATOR_SOURCE ghcid_history: - ghcid: JP-13-MIN-L-TUMSTL - valid_from: "2025-12-10T09:44:07Z" + valid_from: '2025-12-10T09:44:07Z' valid_to: null - reason: "Corrected region code from JP-TO (abbreviation) to JP-13 (Tokyo) per ISO 3166-2:JP" + reason: Corrected region code from JP-TO (abbreviation) to JP-13 (Tokyo) per ISO + 3166-2:JP - ghcid: JP-TO-MIN-L-TUMSTL valid_from: null - valid_to: "2025-12-10T09:44:07Z" - reason: "Previous GHCID with incorrect region code" + valid_to: '2025-12-10T09:44:07Z' + reason: Previous GHCID with incorrect region code - ghcid: JP-TO-MIN-L-TUMSTL ghcid_numeric: 13755224667520732844 valid_from: '2025-12-06T23:38:53.402764+00:00' @@ -101,8 +102,8 @@ ch_annotator: annotation_metadata: confidence_score: 0.98 verified: false - verification_date: - verified_by: + verification_date: null + verified_by: null entity_claims: - claim_type: full_name claim_value: Tokyo University of Marine Science and Technology Library @@ -187,7 +188,8 @@ wikidata_enrichment: member_of: - id: Q56056912 label: Japan Consortium for Open Access Repository - description: promotes open access and open science in Japan with knowledge dissemination via digital repositories + description: promotes open access and open science in Japan with knowledge dissemination + via digital repositories wikidata_web: official_website: http://lib.s.kaiyodai.ac.jp wikidata_official_website: http://lib.s.kaiyodai.ac.jp @@ -209,3 +211,22 @@ location: geonames_id: 1852383 geonames_name: Minato feature_code: PPL +logo_enrichment: + enrichment_timestamp: '2025-12-25T17:53:13.437471+00:00' + source_url: http://lib.s.kaiyodai.ac.jp + extraction_method: crawl4ai + claims: + - claim_type: favicon_url + claim_value: http://lib.s.kaiyodai.ac.jp/theme/Kaiyo/net_commons/favicon.ico?1635399676 + source_url: http://lib.s.kaiyodai.ac.jp + css_selector: '[document] > html.ng-scope > head > link' + retrieved_on: '2025-12-25T17:53:13.437471+00:00' + extraction_method: crawl4ai_link_rel + favicon_type: image/x-icon + favicon_sizes: '' + summary: + total_claims: 1 + has_primary_logo: false + has_favicon: true + has_og_image: false + favicon_count: 1 diff --git a/data/custodian/JP-13-MIN-L-TVL.yaml b/data/custodian/JP-13-MIN-L-TVL.yaml index c3e10bba37..b1a8fc5528 100644 --- a/data/custodian/JP-13-MIN-L-TVL.yaml +++ b/data/custodian/JP-13-MIN-L-TVL.yaml @@ -32,13 +32,14 @@ ghcid: method: CH_ANNOTATOR_SOURCE ghcid_history: - ghcid: JP-13-MIN-L-TVL - valid_from: "2025-12-10T09:44:07Z" + valid_from: '2025-12-10T09:44:07Z' valid_to: null - reason: "Corrected region code from JP-TO (abbreviation) to JP-13 (Tokyo) per ISO 3166-2:JP" + reason: Corrected region code from JP-TO (abbreviation) to JP-13 (Tokyo) per ISO + 3166-2:JP - ghcid: JP-TO-MIN-L-TVL valid_from: null - valid_to: "2025-12-10T09:44:07Z" - reason: "Previous GHCID with incorrect region code" + valid_to: '2025-12-10T09:44:07Z' + reason: Previous GHCID with incorrect region code - ghcid: JP-TO-MIN-L-TVL ghcid_numeric: 12045430208154500728 valid_from: '2025-12-06T23:38:58.848319+00:00' @@ -96,8 +97,8 @@ ch_annotator: annotation_metadata: confidence_score: 0.98 verified: false - verification_date: - verified_by: + verification_date: null + verified_by: null entity_claims: - claim_type: full_name claim_value: TEPIA Video Library @@ -151,3 +152,30 @@ location: geonames_id: 1852383 geonames_name: Minato feature_code: PPL +logo_enrichment: + enrichment_timestamp: '2025-12-25T17:53:24.233573+00:00' + source_url: http://www.tepia.jp + extraction_method: crawl4ai + claims: + - claim_type: logo_url + claim_value: http://www.tepia.jp/img/index/header_logo01.png + source_url: http://www.tepia.jp + css_selector: '#home > div.sp > header > h1 > a > img' + retrieved_on: '2025-12-25T17:53:24.233573+00:00' + extraction_method: crawl4ai_header_logo + detection_confidence: high + alt_text: TEPIA 一般財団法人 高度技術社会推進協会 + - claim_type: favicon_url + claim_value: http://www.tepia.jp/apple-touch-icon.png + source_url: http://www.tepia.jp + css_selector: '[document] > html > head > link:nth-of-type(3)' + retrieved_on: '2025-12-25T17:53:24.233573+00:00' + extraction_method: crawl4ai_link_rel + favicon_type: '' + favicon_sizes: '' + summary: + total_claims: 2 + has_primary_logo: true + has_favicon: true + has_og_image: false + favicon_count: 2 diff --git a/data/custodian/JP-13-MIN-M-HMMFA.yaml b/data/custodian/JP-13-MIN-M-HMMFA.yaml index 0ee6fcb477..231f3126f4 100644 --- a/data/custodian/JP-13-MIN-M-HMMFA.yaml +++ b/data/custodian/JP-13-MIN-M-HMMFA.yaml @@ -32,13 +32,14 @@ ghcid: method: CH_ANNOTATOR_SOURCE ghcid_history: - ghcid: JP-13-MIN-M-HMMFA - valid_from: "2025-12-10T09:44:07Z" + valid_from: '2025-12-10T09:44:07Z' valid_to: null - reason: "Corrected region code from JP-TO (abbreviation) to JP-13 (Tokyo) per ISO 3166-2:JP" + reason: Corrected region code from JP-TO (abbreviation) to JP-13 (Tokyo) per ISO + 3166-2:JP - ghcid: JP-TO-MIN-M-HMMFA valid_from: null - valid_to: "2025-12-10T09:44:07Z" - reason: "Previous GHCID with incorrect region code" + valid_to: '2025-12-10T09:44:07Z' + reason: Previous GHCID with incorrect region code - ghcid: JP-TO-MIN-M-HMMFA ghcid_numeric: 10445495229787364656 valid_from: '2025-12-06T23:38:33.043046+00:00' @@ -96,8 +97,8 @@ ch_annotator: annotation_metadata: confidence_score: 0.98 verified: false - verification_date: - verified_by: + verification_date: null + verified_by: null entity_claims: - claim_type: full_name claim_value: HATAKEYAMA MEMORIAL MUSEUM OF FINE ART @@ -151,3 +152,22 @@ location: geonames_id: 1852383 geonames_name: Minato feature_code: PPL +logo_enrichment: + enrichment_timestamp: '2025-12-25T17:57:50.593553+00:00' + source_url: https://www.ebara.co.jp/foundation/hatakeyama/index.html + extraction_method: crawl4ai + claims: + - claim_type: favicon_url + claim_value: https://www.ebara.com/etc.clientlibs/ebara/clientlibs/clientlib-site/resources/apple-touch-icon-180x180.png + source_url: https://www.ebara.co.jp/foundation/hatakeyama/index.html + css_selector: '[document] > html > head > link:nth-of-type(4)' + retrieved_on: '2025-12-25T17:57:50.593553+00:00' + extraction_method: crawl4ai_link_rel + favicon_type: '' + favicon_sizes: 180x180 + summary: + total_claims: 1 + has_primary_logo: false + has_favicon: true + has_og_image: false + favicon_count: 5 diff --git a/data/custodian/JP-13-MIN-M-INSNMNS.yaml b/data/custodian/JP-13-MIN-M-INSNMNS.yaml index 0e1adecfc1..052a88a7cb 100644 --- a/data/custodian/JP-13-MIN-M-INSNMNS.yaml +++ b/data/custodian/JP-13-MIN-M-INSNMNS.yaml @@ -152,3 +152,28 @@ location: geonames_id: 1852383 geonames_name: Minato feature_code: PPL +logo_enrichment: + enrichment_timestamp: '2025-12-25T17:58:15.517937+00:00' + source_url: https://ins.kahaku.go.jp + extraction_method: crawl4ai + claims: + - claim_type: favicon_url + claim_value: https://ins.kahaku.go.jp/apple-touch-icon.png + source_url: https://ins.kahaku.go.jp + css_selector: '[document] > html > head > link:nth-of-type(2)' + retrieved_on: '2025-12-25T17:58:15.517937+00:00' + extraction_method: crawl4ai_link_rel + favicon_type: '' + favicon_sizes: '' + - claim_type: og_image_url + claim_value: https://ins.kahaku.go.jp/ogp.png + source_url: https://ins.kahaku.go.jp + css_selector: '[document] > html > head > meta:nth-of-type(10)' + retrieved_on: '2025-12-25T17:58:15.517937+00:00' + extraction_method: crawl4ai_meta_og + summary: + total_claims: 2 + has_primary_logo: false + has_favicon: true + has_og_image: true + favicon_count: 3 diff --git a/data/custodian/JP-13-MIN-M-MAPS.yaml b/data/custodian/JP-13-MIN-M-MAPS.yaml index 0f5b31aa5b..d05f56c560 100644 --- a/data/custodian/JP-13-MIN-M-MAPS.yaml +++ b/data/custodian/JP-13-MIN-M-MAPS.yaml @@ -152,3 +152,28 @@ location: geonames_id: 1852383 geonames_name: Minato feature_code: PPL +logo_enrichment: + enrichment_timestamp: '2025-12-25T18:13:32.797070+00:00' + source_url: http://www.aqua-park.jp + extraction_method: crawl4ai + claims: + - claim_type: favicon_url + claim_value: http://www.aqua-park.jp/images/common/favi.ico + source_url: http://www.aqua-park.jp + css_selector: '[document] > html > head > link:nth-of-type(7)' + retrieved_on: '2025-12-25T18:13:32.797070+00:00' + extraction_method: crawl4ai_link_rel + favicon_type: '' + favicon_sizes: '' + - claim_type: og_image_url + claim_value: https://www.aqua-park.jp/special/staraquarium2025/images/common/ogp.jpg + source_url: http://www.aqua-park.jp + css_selector: '[document] > html > head > meta:nth-of-type(12)' + retrieved_on: '2025-12-25T18:13:32.797070+00:00' + extraction_method: crawl4ai_meta_og + summary: + total_claims: 2 + has_primary_logo: false + has_favicon: true + has_og_image: true + favicon_count: 1 diff --git a/data/custodian/JP-13-MIN-M-MMA.yaml b/data/custodian/JP-13-MIN-M-MMA.yaml index 4c1ba26b6d..7da035b651 100644 --- a/data/custodian/JP-13-MIN-M-MMA.yaml +++ b/data/custodian/JP-13-MIN-M-MMA.yaml @@ -43,13 +43,14 @@ ghcid: method: CH_ANNOTATOR_SOURCE ghcid_history: - ghcid: JP-13-MIN-M-MMA - valid_from: "2025-12-10T09:44:08Z" + valid_from: '2025-12-10T09:44:08Z' valid_to: null - reason: "Corrected region code from JP-TO (abbreviation) to JP-13 (Tokyo) per ISO 3166-2:JP" + reason: Corrected region code from JP-TO (abbreviation) to JP-13 (Tokyo) per ISO + 3166-2:JP - ghcid: JP-TO-MIN-M-MMA valid_from: null - valid_to: "2025-12-10T09:44:08Z" - reason: "Previous GHCID with incorrect region code" + valid_to: '2025-12-10T09:44:08Z' + reason: Previous GHCID with incorrect region code - ghcid: JP-TO-MIN-M-MMA ghcid_numeric: 10720411627554313918 valid_from: '2025-12-06T23:38:33.045791+00:00' @@ -108,8 +109,8 @@ ch_annotator: annotation_metadata: confidence_score: 0.98 verified: false - verification_date: - verified_by: + verification_date: null + verified_by: null entity_claims: - claim_type: full_name claim_value: MATSUOKA MUSEUM OF ART @@ -226,7 +227,8 @@ wikidata_enrichment: instance_of: &id005 - id: Q207694 label: art museum - description: building or space for the exhibition of art (for institution, use Q3196771) + description: building or space for the exhibition of art (for institution, use + Q3196771) wikidata_instance_of: *id005 wikidata_location: country: &id006 @@ -274,3 +276,29 @@ location: postal_code: 108-0071 street_address: SHIROKANEDAI, Minato Ku, Tokyo To, 108-0071 normalization_timestamp: '2025-12-09T12:21:57.401558+00:00' +logo_enrichment: + enrichment_timestamp: '2025-12-25T18:14:27.111152+00:00' + source_url: https://www.matsuoka-museum.jp + extraction_method: crawl4ai + claims: + - claim_type: favicon_url + claim_value: https://www.matsuoka-museum.jp/phonesIcon.png + source_url: https://www.matsuoka-museum.jp + css_selector: '[document] > html > head > link:nth-of-type(11)' + retrieved_on: '2025-12-25T18:14:27.111152+00:00' + extraction_method: crawl4ai_link_rel + favicon_type: '' + favicon_sizes: '' + - claim_type: og_image_url + claim_value: https://www.matsuoka-museum.jp//assets/images/facebookIcon.png + source_url: https://www.matsuoka-museum.jp + css_selector: '[document] > html > head > meta:nth-of-type(12)' + retrieved_on: '2025-12-25T18:14:27.111152+00:00' + extraction_method: crawl4ai_meta_og + summary: + total_claims: 2 + has_primary_logo: false + has_favicon: true + has_og_image: true + favicon_count: 2 diff --git a/data/custodian/JP-13-MIN-M-MSM.yaml b/data/custodian/JP-13-MIN-M-MSM.yaml index 91c2571912..0c54367d7d 100644 --- a/data/custodian/JP-13-MIN-M-MSM.yaml +++ b/data/custodian/JP-13-MIN-M-MSM.yaml @@ -32,13 +32,14 @@ ghcid: method: CH_ANNOTATOR_SOURCE ghcid_history: - ghcid: JP-13-MIN-M-MSM - valid_from: "2025-12-10T09:44:08Z" + valid_from: '2025-12-10T09:44:08Z' valid_to: null - reason: "Corrected region code from JP-TO (abbreviation) to JP-13 (Tokyo) per ISO 3166-2:JP" + reason: Corrected region code from JP-TO (abbreviation) to JP-13 (Tokyo) per ISO + 3166-2:JP - ghcid: JP-TO-MIN-M-MSM valid_from: null - valid_to: "2025-12-10T09:44:08Z" - reason: "Previous GHCID with incorrect region code" + valid_to: '2025-12-10T09:44:08Z' + reason: Previous GHCID with incorrect region code - ghcid: JP-TO-MIN-M-MSM ghcid_numeric: 10319208063142259619 valid_from: '2025-12-06T23:38:33.005787+00:00' @@ -96,8 +97,8 @@ ch_annotator: annotation_metadata: confidence_score: 0.98 verified: false - verification_date: - verified_by: + verification_date: null + verified_by: null entity_claims: - claim_type: full_name claim_value: MINATO SCIENCE MUSEUM @@ -151,3 +152,22 @@ location: geonames_id: 1852383 geonames_name: Minato feature_code: PPL +logo_enrichment: + enrichment_timestamp: '2025-12-25T18:14:45.119770+00:00' + source_url: https://minato-kagaku.tokyo + extraction_method: crawl4ai + claims: + - claim_type: favicon_url + claim_value: https://minato-kagaku.tokyo/common/images/favicon_ios.png + source_url: https://minato-kagaku.tokyo + css_selector: '[document] > html > head > link:nth-of-type(13)' + retrieved_on: '2025-12-25T18:14:45.119770+00:00' + extraction_method: crawl4ai_link_rel + favicon_type: '' + favicon_sizes: 180x180 + summary: + total_claims: 1 + has_primary_logo: false + has_favicon: true + has_og_image: false + favicon_count: 4 diff --git a/data/custodian/JP-13-MIN-M-MT.yaml b/data/custodian/JP-13-MIN-M-MT.yaml index 859adbbb55..15dd7e0d48 100644 --- a/data/custodian/JP-13-MIN-M-MT.yaml +++ b/data/custodian/JP-13-MIN-M-MT.yaml @@ -32,13 +32,14 @@ ghcid: method: CH_ANNOTATOR_SOURCE ghcid_history: - ghcid: JP-13-MIN-M-MT - valid_from: "2025-12-10T09:44:08Z" + valid_from: '2025-12-10T09:44:08Z' valid_to: null - reason: "Corrected region code from JP-TO (abbreviation) to JP-13 (Tokyo) per ISO 3166-2:JP" + reason: Corrected region code from JP-TO (abbreviation) to JP-13 (Tokyo) per ISO + 3166-2:JP - ghcid: JP-TO-MIN-M-MT valid_from: null - valid_to: "2025-12-10T09:44:08Z" - reason: "Previous GHCID with incorrect region code" + valid_to: '2025-12-10T09:44:08Z' + reason: Previous GHCID with incorrect region code - ghcid: JP-TO-MIN-M-MT ghcid_numeric: 8919518239303823778 valid_from: '2025-12-06T23:38:33.002298+00:00' @@ -96,8 +97,8 @@ ch_annotator: annotation_metadata: confidence_score: 0.98 verified: false - verification_date: - verified_by: + verification_date: null + verified_by: null entity_claims: - claim_type: full_name claim_value: Musée Tomo @@ -151,3 +152,28 @@ location: geonames_id: 1852383 geonames_name: Minato feature_code: PPL +logo_enrichment: + enrichment_timestamp: '2025-12-25T18:14:51.190030+00:00' + source_url: https://www.musee-tomo.or.jp + extraction_method: crawl4ai + claims: + - claim_type: favicon_url + claim_value: https://www.musee-tomo.or.jp/favicon.ico + source_url: https://www.musee-tomo.or.jp + css_selector: '[document] > html > head > link:nth-of-type(3)' + retrieved_on: '2025-12-25T18:14:51.190030+00:00' + extraction_method: crawl4ai_link_rel + favicon_type: '' + favicon_sizes: '' + - claim_type: og_image_url + claim_value: https://www.musee-tomo.or.jp/assets/img/top/ttl_bg.jpg + source_url: https://www.musee-tomo.or.jp + css_selector: '[document] > html > head > meta:nth-of-type(12)' + retrieved_on: '2025-12-25T18:14:51.190030+00:00' + extraction_method: crawl4ai_meta_og + summary: + total_claims: 2 + has_primary_logo: false + has_favicon: true + has_og_image: true + favicon_count: 1 diff --git a/data/custodian/JP-13-MIN-M-NACT.yaml b/data/custodian/JP-13-MIN-M-NACT.yaml index fdd444ed66..43e8e815c2 100644 --- a/data/custodian/JP-13-MIN-M-NACT.yaml +++ b/data/custodian/JP-13-MIN-M-NACT.yaml @@ -1536,3 +1536,28 @@ youtube_enrichment: comments: [] thumbnail_url: https://i.ytimg.com/vi/BFe4t9bfwOw/hqdefault.jpg status: SUCCESS +logo_enrichment: + enrichment_timestamp: '2025-12-25T18:14:59.380599+00:00' + source_url: https://www.nact.jp + extraction_method: crawl4ai + claims: + - claim_type: logo_url + claim_value: https://www.nact.jp/common/img/common/logo.svg + source_url: https://www.nact.jp + css_selector: '#header > div.outline > h1.logo > a > picture > source > img' + retrieved_on: '2025-12-25T18:14:59.380599+00:00' + extraction_method: crawl4ai_header_logo + detection_confidence: high + alt_text: 国立新美術館 THE NATIONAL ART CENTER, TOKYO + - claim_type: og_image_url + claim_value: https://www.nact.jp/common/img/common/og_image.gif + source_url: https://www.nact.jp + css_selector: '[document] > html > head > meta:nth-of-type(9)' + retrieved_on: '2025-12-25T18:14:59.380599+00:00' + extraction_method: crawl4ai_meta_og + summary: + total_claims: 2 + has_primary_logo: true + has_favicon: false + has_og_image: true + favicon_count: 0 diff --git a/data/custodian/JP-13-MIN-M-NM.yaml b/data/custodian/JP-13-MIN-M-NM.yaml index 1d34db7cc4..7b6c62150c 100644 --- a/data/custodian/JP-13-MIN-M-NM.yaml +++ b/data/custodian/JP-13-MIN-M-NM.yaml @@ -470,3 +470,20 @@ youtube_enrichment: comments: [] thumbnail_url: https://i.ytimg.com/vi/3OyKDE7ZfnU/hqdefault.jpg status: SUCCESS +logo_enrichment: + enrichment_timestamp: '2025-12-25T18:15:07.746066+00:00' + source_url: https://www.nezu-muse.or.jp + extraction_method: crawl4ai + claims: + - claim_type: og_image_url + claim_value: http://www.nezu-muse.or.jp/ogp/ogp_img.jpg + source_url: https://www.nezu-muse.or.jp + css_selector: '[document] > html > head > meta:nth-of-type(14)' + retrieved_on: '2025-12-25T18:15:07.746066+00:00' + extraction_method: crawl4ai_meta_og + summary: + total_claims: 1 + has_primary_logo: false + has_favicon: false + has_og_image: true + favicon_count: 0 diff --git a/data/custodian/JP-13-MIN-M-NMB.yaml b/data/custodian/JP-13-MIN-M-NMB.yaml index d1e3bb41e8..b4e0019a97 100644 --- a/data/custodian/JP-13-MIN-M-NMB.yaml +++ b/data/custodian/JP-13-MIN-M-NMB.yaml @@ -43,13 +43,14 @@ ghcid: method: CH_ANNOTATOR_SOURCE ghcid_history: - ghcid: JP-13-MIN-M-NMB - valid_from: "2025-12-10T09:44:08Z" + valid_from: '2025-12-10T09:44:08Z' valid_to: null - reason: "Corrected region code from JP-TO (abbreviation) to JP-13 (Tokyo) per ISO 3166-2:JP" + reason: Corrected region code from JP-TO (abbreviation) to JP-13 (Tokyo) per ISO + 3166-2:JP - ghcid: JP-TO-MIN-M-NMB valid_from: null - valid_to: "2025-12-10T09:44:08Z" - reason: "Previous GHCID with incorrect region code" + valid_to: '2025-12-10T09:44:08Z' + reason: Previous GHCID with incorrect region code - ghcid: JP-TO-MIN-M-NMB ghcid_numeric: 12879774604308496096 valid_from: '2025-12-06T23:38:33.007995+00:00' @@ -108,8 +109,8 @@ ch_annotator: annotation_metadata: confidence_score: 0.98 verified: false - verification_date: - verified_by: + verification_date: null + verified_by: null entity_claims: - claim_type: full_name claim_value: NHK MUSEUM OF BROADCASTING @@ -255,3 +256,20 @@ location: postal_code: 105-0002 street_address: ATAGO, Minato Ku, Tokyo To, 105-0002 normalization_timestamp: '2025-12-09T12:21:57.700416+00:00' +logo_enrichment: + enrichment_timestamp: '2025-12-25T18:15:14.192091+00:00' + source_url: https://www.nhk.or.jp/museum + extraction_method: crawl4ai + claims: + - claim_type: og_image_url + claim_value: https://www.nhk.or.jp/museum/assets/img/common/ogp/ogimg.png + source_url: https://www.nhk.or.jp/museum + css_selector: '[document] > html > head > meta:nth-of-type(12)' + retrieved_on: '2025-12-25T18:15:14.192091+00:00' + extraction_method: crawl4ai_meta_og + summary: + total_claims: 1 + has_primary_logo: false + has_favicon: false + has_og_image: true + favicon_count: 0 diff --git a/data/custodian/JP-13-MIN-M-OMA.yaml b/data/custodian/JP-13-MIN-M-OMA.yaml index 044404dac3..ff1cd5c753 100644 --- a/data/custodian/JP-13-MIN-M-OMA.yaml +++ b/data/custodian/JP-13-MIN-M-OMA.yaml @@ -32,13 +32,14 @@ ghcid: method: CH_ANNOTATOR_SOURCE ghcid_history: - ghcid: JP-13-MIN-M-OMA - valid_from: "2025-12-10T09:44:08Z" + valid_from: '2025-12-10T09:44:08Z' valid_to: null - reason: "Corrected region code from JP-TO (abbreviation) to JP-13 (Tokyo) per ISO 3166-2:JP" + reason: Corrected region code from JP-TO (abbreviation) to JP-13 (Tokyo) per ISO + 3166-2:JP - ghcid: JP-TO-MIN-M-OMA valid_from: null - valid_to: "2025-12-10T09:44:08Z" - reason: "Previous GHCID with incorrect region code" + valid_to: '2025-12-10T09:44:08Z' + reason: Previous GHCID with incorrect region code - ghcid: JP-TO-MIN-M-OMA ghcid_numeric: 16416165540328380530 valid_from: '2025-12-06T23:38:33.000068+00:00' @@ -96,8 +97,8 @@ ch_annotator: annotation_metadata: confidence_score: 0.98 verified: false - verification_date: - verified_by: + verification_date: null + verified_by: null entity_claims: - claim_type: full_name claim_value: OKURA MUSEUM OF ART @@ -151,3 +152,22 @@ location: geonames_id: 1852383 geonames_name: Minato feature_code: PPL +logo_enrichment: + enrichment_timestamp: '2025-12-25T18:15:40.811309+00:00' + source_url: https://www.shukokan.org + extraction_method: crawl4ai + claims: + - claim_type: logo_url + claim_value: https://www.shukokan.org/Portals/0/images/common/img_logo.png + source_url: https://www.shukokan.org + css_selector: '#dnn_dnnLOGO_imgLogo' + retrieved_on: '2025-12-25T18:15:40.811309+00:00' + extraction_method: crawl4ai_header_logo + detection_confidence: high + alt_text: 大倉集古館 + summary: + total_claims: 1 + has_primary_logo: true + has_favicon: false + has_og_image: false + favicon_count: 0 diff --git a/data/custodian/JP-13-MIN-M-PSMARG.yaml b/data/custodian/JP-13-MIN-M-PSMARG.yaml index 70193d262b..b8d7d4821f 100644 --- a/data/custodian/JP-13-MIN-M-PSMARG.yaml +++ b/data/custodian/JP-13-MIN-M-PSMARG.yaml @@ -282,3 +282,38 @@ youtube_enrichment: view_count: 0 videos: [] status: SUCCESS +logo_enrichment: + enrichment_timestamp: '2025-12-25T18:15:47.978427+00:00' + source_url: https://panasonic.co.jp/ew/museum + extraction_method: crawl4ai + claims: + - claim_type: logo_url + claim_value: https://panasonic.co.jp/ew/etc-ew/designs/panasonic/holdings/images/holdings-plogo.svg + source_url: https://panasonic.co.jp/ew/museum + css_selector: '#page > header.holdings-header.nofix > div.holdings-header__fixarea__wrapper + > div.holdings-header__fixarea > div.holdings-header__main > div.holdings-header__main__in + > div.holdings-header__brand > div.brandlogo > a > img' + retrieved_on: '2025-12-25T18:15:47.978427+00:00' + extraction_method: crawl4ai_header_logo + detection_confidence: high + alt_text: Panasonic + - claim_type: favicon_url + claim_value: https://panasonic.co.jp/ew/etc-ew/designs/panasonic/common-clientlibs/images/favicon.ico + source_url: https://panasonic.co.jp/ew/museum + css_selector: '[document] > html.js.flexbox > head > link' + retrieved_on: '2025-12-25T18:15:47.978427+00:00' + extraction_method: crawl4ai_link_rel + favicon_type: image/x-icon + favicon_sizes: '' + - claim_type: og_image_url + claim_value: https://panasonic.co.jp/ew/museum/contents/toppage/images/img-ogp.png + source_url: https://panasonic.co.jp/ew/museum + css_selector: '[document] > html.js.flexbox > head > meta:nth-of-type(6)' + retrieved_on: '2025-12-25T18:15:47.978427+00:00' + extraction_method: crawl4ai_meta_og + summary: + total_claims: 3 + has_primary_logo: true + has_favicon: true + has_og_image: true + favicon_count: 1 diff --git a/data/custodian/JP-13-MIN-M-SMA.yaml b/data/custodian/JP-13-MIN-M-SMA.yaml index a2087d8218..82c84fe6f6 100644 --- a/data/custodian/JP-13-MIN-M-SMA.yaml +++ b/data/custodian/JP-13-MIN-M-SMA.yaml @@ -43,13 +43,14 @@ ghcid: method: CH_ANNOTATOR_SOURCE ghcid_history: - ghcid: JP-13-MIN-M-SMA - valid_from: "2025-12-10T09:44:08Z" + valid_from: '2025-12-10T09:44:08Z' valid_to: null - reason: "Corrected region code from JP-TO (abbreviation) to JP-13 (Tokyo) per ISO 3166-2:JP" + reason: Corrected region code from JP-TO (abbreviation) to JP-13 (Tokyo) per ISO + 3166-2:JP - ghcid: JP-TO-MIN-M-SMA valid_from: null - valid_to: "2025-12-10T09:44:08Z" - reason: "Previous GHCID with incorrect region code" + valid_to: '2025-12-10T09:44:08Z' + reason: Previous GHCID with incorrect region code - ghcid: JP-TO-MIN-M-SMA ghcid_numeric: 14659349751388969573 valid_from: '2025-12-06T23:38:33.035883+00:00' @@ -108,8 +109,8 @@ ch_annotator: annotation_metadata: confidence_score: 0.98 verified: false - verification_date: - verified_by: + verification_date: null + verified_by: null entity_claims: - claim_type: full_name claim_value: SUNTORY MUSEUM OF ART @@ -243,7 +244,8 @@ wikidata_enrichment: instance_of: &id005 - id: Q207694 label: art museum - description: building or space for the exhibition of art (for institution, use Q3196771) + description: building or space for the exhibition of art (for institution, use + Q3196771) wikidata_instance_of: *id005 wikidata_location: coordinates: &id008 @@ -312,3 +314,28 @@ location: postal_code: 107-8643 street_address: AKASAKA, Minato Ku, Tokyo To, 107-8643 normalization_timestamp: '2025-12-09T12:21:57.867033+00:00' +logo_enrichment: + enrichment_timestamp: '2025-12-25T18:15:58.129833+00:00' + source_url: https://www.suntory.co.jp/sma + extraction_method: crawl4ai + claims: + - claim_type: favicon_url + claim_value: https://www.suntory.co.jp/sma/apple-touch-icon.png + source_url: https://www.suntory.co.jp/sma + css_selector: '[document] > html.backdropfilter.webpalpha > head > link:nth-of-type(2)' + retrieved_on: '2025-12-25T18:15:58.129833+00:00' + extraction_method: crawl4ai_link_rel + favicon_type: '' + favicon_sizes: '' + - claim_type: og_image_url + claim_value: https://www.suntory.co.jp/sma/ogp/sma1.png + source_url: https://www.suntory.co.jp/sma + css_selector: '[document] > html.backdropfilter.webpalpha > head > meta:nth-of-type(10)' + retrieved_on: '2025-12-25T18:15:58.129833+00:00' + extraction_method: crawl4ai_meta_og + summary: + total_claims: 2 + has_primary_logo: false + has_favicon: true + has_og_image: true + favicon_count: 2 diff --git a/data/custodian/JP-13-MIN-M-SOHMT.yaml b/data/custodian/JP-13-MIN-M-SOHMT.yaml index 20cf3715ab..2e00a934f8 100644 --- a/data/custodian/JP-13-MIN-M-SOHMT.yaml +++ b/data/custodian/JP-13-MIN-M-SOHMT.yaml @@ -152,3 +152,28 @@ location: geonames_id: 1852383 geonames_name: Minato feature_code: PPL +logo_enrichment: + enrichment_timestamp: '2025-12-25T18:16:07.671809+00:00' + source_url: https://sen-oku.or.jp/tokyo + extraction_method: crawl4ai + claims: + - claim_type: favicon_url + claim_value: https://sen-oku.or.jp/wp-content/themes/senoku/favicon.svg?v=2 + source_url: https://sen-oku.or.jp/tokyo + css_selector: '[document] > html.mod-js.mod-flexbox > head > link' + retrieved_on: '2025-12-25T18:16:07.671809+00:00' + extraction_method: crawl4ai_link_rel + favicon_type: image/svg+xml + favicon_sizes: '' + - claim_type: og_image_url + claim_value: https://www.sen-oku.or.jp/ogp_t.png + source_url: https://sen-oku.or.jp/tokyo + css_selector: '[document] > html.mod-js.mod-flexbox > head > meta:nth-of-type(9)' + retrieved_on: '2025-12-25T18:16:07.671809+00:00' + extraction_method: crawl4ai_meta_og + summary: + total_claims: 2 + has_primary_logo: false + has_favicon: true + has_og_image: true + favicon_count: 2 diff --git a/data/custodian/JP-13-MIN-M-TA.yaml b/data/custodian/JP-13-MIN-M-TA.yaml index e007c1dec9..240497c1b7 100644 --- a/data/custodian/JP-13-MIN-M-TA.yaml +++ b/data/custodian/JP-13-MIN-M-TA.yaml @@ -32,13 +32,14 @@ ghcid: method: CH_ANNOTATOR_SOURCE ghcid_history: - ghcid: JP-13-MIN-M-TA - valid_from: "2025-12-10T09:44:08Z" + valid_from: '2025-12-10T09:44:08Z' valid_to: null - reason: "Corrected region code from JP-TO (abbreviation) to JP-13 (Tokyo) per ISO 3166-2:JP" + reason: Corrected region code from JP-TO (abbreviation) to JP-13 (Tokyo) per ISO + 3166-2:JP - ghcid: JP-TO-MIN-M-TA valid_from: null - valid_to: "2025-12-10T09:44:08Z" - reason: "Previous GHCID with incorrect region code" + valid_to: '2025-12-10T09:44:08Z' + reason: Previous GHCID with incorrect region code - ghcid: JP-TO-MIN-M-TA ghcid_numeric: 8219440418177892130 valid_from: '2025-12-06T23:38:33.010631+00:00' @@ -96,8 +97,8 @@ ch_annotator: annotation_metadata: confidence_score: 0.98 verified: false - verification_date: - verified_by: + verification_date: null + verified_by: null entity_claims: - claim_type: full_name claim_value: TORAYA ARCHIVES @@ -151,3 +152,28 @@ location: geonames_id: 1852383 geonames_name: Minato feature_code: PPL +logo_enrichment: + enrichment_timestamp: '2025-12-25T18:16:13.638993+00:00' + source_url: https://www.toraya-group.co.jp/toraya/bunko + extraction_method: crawl4ai + claims: + - claim_type: favicon_url + claim_value: https://cdn.shopify.com/oxygen-v2/26835/11847/24249/2789172/assets/favicon.5ea53f11.ico + source_url: https://www.toraya-group.co.jp/toraya/bunko + css_selector: '[document] > html > head > link' + retrieved_on: '2025-12-25T18:16:13.638993+00:00' + extraction_method: crawl4ai_link_rel + favicon_type: image/svg+xml + favicon_sizes: '' + - claim_type: og_image_url + claim_value: https://www.toraya-group.co.jp/assets/images/ogimage.jpg + source_url: https://www.toraya-group.co.jp/toraya/bunko + css_selector: '[document] > html > head > meta:nth-of-type(12)' + retrieved_on: '2025-12-25T18:16:13.638993+00:00' + extraction_method: crawl4ai_meta_og + summary: + total_claims: 2 + has_primary_logo: false + has_favicon: true + has_og_image: true + favicon_count: 2 diff --git a/data/custodian/JP-13-MIN-M-TATG.yaml b/data/custodian/JP-13-MIN-M-TATG.yaml index f7e6c50f24..30b1d1c393 100644 --- a/data/custodian/JP-13-MIN-M-TATG.yaml +++ b/data/custodian/JP-13-MIN-M-TATG.yaml @@ -691,3 +691,30 @@ youtube_enrichment: comments: [] thumbnail_url: https://i.ytimg.com/vi/wuB0zw6Zx6s/hqdefault.jpg status: SUCCESS +logo_enrichment: + enrichment_timestamp: '2025-12-25T18:16:22.098510+00:00' + source_url: https://www.tepia.jp + extraction_method: crawl4ai + claims: + - claim_type: logo_url + claim_value: https://www.tepia.jp/img/index/header_logo01.png + source_url: https://www.tepia.jp + css_selector: '#home > div.sp > header > h1 > a > img' + retrieved_on: '2025-12-25T18:16:22.098510+00:00' + extraction_method: crawl4ai_header_logo + detection_confidence: high + alt_text: TEPIA 一般財団法人 高度技術社会推進協会 + - claim_type: favicon_url + claim_value: https://www.tepia.jp/apple-touch-icon.png + source_url: https://www.tepia.jp + css_selector: '[document] > html > head > link:nth-of-type(3)' + retrieved_on: '2025-12-25T18:16:22.098510+00:00' + extraction_method: crawl4ai_link_rel + favicon_type: '' + favicon_sizes: '' + summary: + total_claims: 2 + has_primary_logo: true + has_favicon: true + has_og_image: false + favicon_count: 2 diff --git a/data/custodian/JP-13-MIN-M-TMTAM.yaml b/data/custodian/JP-13-MIN-M-TMTAM.yaml index 457986286f..20b9694fdc 100644 --- a/data/custodian/JP-13-MIN-M-TMTAM.yaml +++ b/data/custodian/JP-13-MIN-M-TMTAM.yaml @@ -32,13 +32,14 @@ ghcid: method: CH_ANNOTATOR_SOURCE ghcid_history: - ghcid: JP-13-MIN-M-TMTAM - valid_from: "2025-12-10T09:44:08Z" + valid_from: '2025-12-10T09:44:08Z' valid_to: null - reason: "Corrected region code from JP-TO (abbreviation) to JP-13 (Tokyo) per ISO 3166-2:JP" + reason: Corrected region code from JP-TO (abbreviation) to JP-13 (Tokyo) per ISO + 3166-2:JP - ghcid: JP-TO-MIN-M-TMTAM valid_from: null - valid_to: "2025-12-10T09:44:08Z" - reason: "Previous GHCID with incorrect region code" + valid_to: '2025-12-10T09:44:08Z' + reason: Previous GHCID with incorrect region code - ghcid: JP-TO-MIN-M-TMTAM ghcid_numeric: 7216766343170136043 valid_from: '2025-12-06T23:38:33.040799+00:00' @@ -96,8 +97,8 @@ ch_annotator: annotation_metadata: confidence_score: 0.98 verified: false - verification_date: - verified_by: + verification_date: null + verified_by: null entity_claims: - claim_type: full_name claim_value: TOKYO METROPOLITAN TEIEN ART MUSEUM @@ -151,3 +152,28 @@ location: geonames_id: 1852383 geonames_name: Minato feature_code: PPL +logo_enrichment: + enrichment_timestamp: '2025-12-25T18:16:40.982316+00:00' + source_url: https://www.teien-art-museum.ne.jp + extraction_method: crawl4ai + claims: + - claim_type: favicon_url + claim_value: https://www.teien-art-museum.ne.jp/apple-touch-icon.png + source_url: https://www.teien-art-museum.ne.jp + css_selector: '[document] > html > head > link' + retrieved_on: '2025-12-25T18:16:40.982316+00:00' + extraction_method: crawl4ai_link_rel + favicon_type: '' + favicon_sizes: 180x180 + - claim_type: og_image_url + claim_value: https://www.teien-art-museum.ne.jp/wp-content/uploads/2023/09/OGP.png + source_url: https://www.teien-art-museum.ne.jp + css_selector: '[document] > html > head > meta:nth-of-type(11)' + retrieved_on: '2025-12-25T18:16:40.982316+00:00' + extraction_method: crawl4ai_meta_og + summary: + total_claims: 2 + has_primary_logo: false + has_favicon: true + has_og_image: true + favicon_count: 4 diff --git a/data/custodian/JP-13-MIN-M-UH.yaml b/data/custodian/JP-13-MIN-M-UH.yaml index 7950fdeac0..c966ae75d0 100644 --- a/data/custodian/JP-13-MIN-M-UH.yaml +++ b/data/custodian/JP-13-MIN-M-UH.yaml @@ -152,3 +152,29 @@ location: geonames_id: 1852383 geonames_name: Minato feature_code: PPL +logo_enrichment: + enrichment_timestamp: '2025-12-25T18:16:49.643842+00:00' + source_url: https://www.unicef.or.jp + extraction_method: crawl4ai + claims: + - claim_type: logo_url + claim_value: https://www.unicef.or.jp/images/toppage/logo.gif + source_url: https://www.unicef.or.jp + css_selector: '#mode_area > header > div.hd_global-nav > div.global-nav_wrapper + > div.global-nav_01 > div.nav_01_logo-block > h1.hd_logo > a > img.top_logo' + retrieved_on: '2025-12-25T18:16:49.643842+00:00' + extraction_method: crawl4ai_header_logo + detection_confidence: high + alt_text: 日本ユニセフ協会 + - claim_type: og_image_url + claim_value: https://www.unicef.or.jp/images/ogp_img_top.jpg + source_url: https://www.unicef.or.jp + css_selector: '#ID > http-equiv > meta:nth-of-type(7)' + retrieved_on: '2025-12-25T18:16:49.643842+00:00' + extraction_method: crawl4ai_meta_og + summary: + total_claims: 2 + has_primary_logo: true + has_favicon: false + has_og_image: true + favicon_count: 0 diff --git a/data/custodian/JP-13-MIN-M-YMM.yaml b/data/custodian/JP-13-MIN-M-YMM.yaml index 957ff72c8a..1a40abef14 100644 --- a/data/custodian/JP-13-MIN-M-YMM.yaml +++ b/data/custodian/JP-13-MIN-M-YMM.yaml @@ -43,13 +43,14 @@ ghcid: method: CH_ANNOTATOR_SOURCE ghcid_history: - ghcid: JP-13-MIN-M-YMM - valid_from: "2025-12-10T09:44:08Z" + valid_from: '2025-12-10T09:44:08Z' valid_to: null - reason: "Corrected region code from JP-TO (abbreviation) to JP-13 (Tokyo) per ISO 3166-2:JP" + reason: Corrected region code from JP-TO (abbreviation) to JP-13 (Tokyo) per ISO + 3166-2:JP - ghcid: JP-TO-MIN-M-YMM valid_from: null - valid_to: "2025-12-10T09:44:08Z" - reason: "Previous GHCID with incorrect region code" + valid_to: '2025-12-10T09:44:08Z' + reason: Previous GHCID with incorrect region code - ghcid: JP-TO-MIN-M-YMM ghcid_numeric: 17808761113043959496 valid_from: '2025-12-06T23:38:33.033155+00:00' @@ -108,8 +109,8 @@ ch_annotator: annotation_metadata: confidence_score: 0.98 verified: false - verification_date: - verified_by: + verification_date: null + verified_by: null entity_claims: - claim_type: full_name claim_value: YOKU MOKU MUSEUM @@ -231,3 +232,22 @@ location: postal_code: 107-0062 street_address: MINAMIAOYAMA, Minato Ku, Tokyo To, 107-0062 normalization_timestamp: '2025-12-09T12:21:58.140267+00:00' +logo_enrichment: + enrichment_timestamp: '2025-12-25T18:17:01.550880+00:00' + source_url: https://yokumokumuseum.com + extraction_method: crawl4ai + claims: + - claim_type: favicon_url + claim_value: https://yokumokumuseum.com/wp-content/themes/ymmtmp/images/favicon.ico + source_url: https://yokumokumuseum.com + css_selector: '[document] > html > head > link' + retrieved_on: '2025-12-25T18:17:01.550880+00:00' + extraction_method: crawl4ai_link_rel + favicon_type: '' + favicon_sizes: '' + summary: + total_claims: 1 + has_primary_logo: false + has_favicon: true + has_og_image: false + favicon_count: 1 diff --git a/data/custodian/JP-13-MIT-L-ICUL.yaml b/data/custodian/JP-13-MIT-L-ICUL.yaml index 365306a368..ce869af537 100644 --- a/data/custodian/JP-13-MIT-L-ICUL.yaml +++ b/data/custodian/JP-13-MIT-L-ICUL.yaml @@ -37,13 +37,14 @@ ghcid: method: CH_ANNOTATOR_SOURCE ghcid_history: - ghcid: JP-13-MIT-L-ICUL - valid_from: "2025-12-10T09:44:08Z" + valid_from: '2025-12-10T09:44:08Z' valid_to: null - reason: "Corrected region code from JP-TO (abbreviation) to JP-13 (Tokyo) per ISO 3166-2:JP" + reason: Corrected region code from JP-TO (abbreviation) to JP-13 (Tokyo) per ISO + 3166-2:JP - ghcid: JP-TO-MIT-L-ICUL valid_from: null - valid_to: "2025-12-10T09:44:08Z" - reason: "Previous GHCID with incorrect region code" + valid_to: '2025-12-10T09:44:08Z' + reason: Previous GHCID with incorrect region code - ghcid: JP-TO-MIT-L-ICUL ghcid_numeric: 11058665013116237960 valid_from: '2025-12-06T23:38:54.888488+00:00' @@ -101,8 +102,8 @@ ch_annotator: annotation_metadata: confidence_score: 0.98 verified: false - verification_date: - verified_by: + verification_date: null + verified_by: null entity_claims: - claim_type: full_name claim_value: International Christian University Library @@ -190,7 +191,8 @@ wikidata_enrichment: description: organisatie uit Japan - id: Q56056912 label: Japan Consortium for Open Access Repository - description: promotes open access and open science in Japan with knowledge dissemination via digital repositories + description: promotes open access and open science in Japan with knowledge dissemination + via digital repositories wikidata_web: official_website: http://www-lib.icu.ac.jp wikidata_official_website: http://www-lib.icu.ac.jp @@ -212,3 +214,28 @@ location: geonames_id: 11790343 geonames_name: Mitaka feature_code: PPLA2 +logo_enrichment: + enrichment_timestamp: '2025-12-25T18:17:17.437758+00:00' + source_url: http://www-lib.icu.ac.jp + extraction_method: crawl4ai + claims: + - claim_type: favicon_url + claim_value: https://lh3.googleusercontent.com/sitesv/AAzXCkfi5QDZwImY6Lq9Wkr3Q0vKxFbpddfbYJlb8oEL-pmi1vrCxLWZecavQWwvYYUbcREb7UrsStPHIwW-3CHVtsV6bENlwxrhZiwR27ZQihPflj7NmEVGXQy90_54ym0_Y5qycF1S4JcrfOtS8BSNtqnsBvArFCC-jDMxEmDAr9lMxARJmpGz0xHsNs6E7CR3VVpCW3KZbq2XHCFpfpppag + source_url: http://www-lib.icu.ac.jp + css_selector: '[document] > html > head > link' + retrieved_on: '2025-12-25T18:17:17.437758+00:00' + extraction_method: crawl4ai_link_rel + favicon_type: '' + favicon_sizes: '' + - claim_type: og_image_url + claim_value: https://lh3.googleusercontent.com/sitesv/AAzXCkfFCM4glIEd1QpFXMdpXNhr4MgE3p9Pts0xqamTGpD6o3aFqvdAqMgiiV7tnCxlyyRv2Ui6DY3PVylY66n5wSCvT0rtXvBJGiMLo9ahOEWHqKOfJwm2xvWGI99sdJ3pO3hYB3p4grMABewYHBNmmSlvVzIgtQVHO5CM-IOPCVtAvi_OrJxlrKiM=w16383 + source_url: http://www-lib.icu.ac.jp + css_selector: '[document] > html > head > meta:nth-of-type(15)' + retrieved_on: '2025-12-25T18:17:17.437758+00:00' + extraction_method: crawl4ai_meta_og + summary: + total_claims: 2 + has_primary_logo: false + has_favicon: true + has_og_image: true + favicon_count: 1 diff --git a/data/custodian/JP-13-MIT-L-JLCL.yaml b/data/custodian/JP-13-MIT-L-JLCL.yaml index f91736aae6..9677ce737a 100644 --- a/data/custodian/JP-13-MIT-L-JLCL.yaml +++ b/data/custodian/JP-13-MIT-L-JLCL.yaml @@ -37,13 +37,14 @@ ghcid: method: CH_ANNOTATOR_SOURCE ghcid_history: - ghcid: JP-13-MIT-L-JLCL - valid_from: "2025-12-10T09:44:08Z" + valid_from: '2025-12-10T09:44:08Z' valid_to: null - reason: "Corrected region code from JP-TO (abbreviation) to JP-13 (Tokyo) per ISO 3166-2:JP" + reason: Corrected region code from JP-TO (abbreviation) to JP-13 (Tokyo) per ISO + 3166-2:JP - ghcid: JP-TO-MIT-L-JLCL valid_from: null - valid_to: "2025-12-10T09:44:08Z" - reason: "Previous GHCID with incorrect region code" + valid_to: '2025-12-10T09:44:08Z' + reason: Previous GHCID with incorrect region code - ghcid: JP-TO-MIT-L-JLCL ghcid_numeric: 3835080323703194561 valid_from: '2025-12-06T23:38:55.206800+00:00' @@ -101,8 +102,8 @@ ch_annotator: annotation_metadata: confidence_score: 0.98 verified: false - verification_date: - verified_by: + verification_date: null + verified_by: null entity_claims: - claim_type: full_name claim_value: Japan Lutheran College Library @@ -187,7 +188,8 @@ wikidata_enrichment: member_of: - id: Q56056912 label: Japan Consortium for Open Access Repository - description: promotes open access and open science in Japan with knowledge dissemination via digital repositories + description: promotes open access and open science in Japan with knowledge dissemination + via digital repositories wikidata_web: official_website: http://www.luther.ac.jp/guide/affiliate/library/index.html wikidata_official_website: http://www.luther.ac.jp/guide/affiliate/library/index.html @@ -209,3 +211,28 @@ location: geonames_id: 11790343 geonames_name: Mitaka feature_code: PPLA2 +logo_enrichment: + enrichment_timestamp: '2025-12-25T18:17:29.442452+00:00' + source_url: http://www.luther.ac.jp/guide/affiliate/library/index.html + extraction_method: crawl4ai + claims: + - claim_type: favicon_url + claim_value: http://www.luther.ac.jp/apple-touch-icon.png + source_url: http://www.luther.ac.jp/guide/affiliate/library/index.html + css_selector: '[document] > html > head > link:nth-of-type(2)' + retrieved_on: '2025-12-25T18:17:29.442452+00:00' + extraction_method: crawl4ai_link_rel + favicon_type: '' + favicon_sizes: '' + - claim_type: og_image_url + claim_value: https://www.luther.ac.jp/ogp.png + source_url: http://www.luther.ac.jp/guide/affiliate/library/index.html + css_selector: '[document] > html > head > meta:nth-of-type(12)' + retrieved_on: '2025-12-25T18:17:29.442452+00:00' + extraction_method: crawl4ai_meta_og + summary: + total_claims: 2 + has_primary_logo: false + has_favicon: true + has_og_image: true + favicon_count: 3 diff --git a/data/custodian/JP-13-MIT-L-KUML.yaml b/data/custodian/JP-13-MIT-L-KUML.yaml index 52d21f6b79..173f4a2b5d 100644 --- a/data/custodian/JP-13-MIT-L-KUML.yaml +++ b/data/custodian/JP-13-MIT-L-KUML.yaml @@ -37,13 +37,14 @@ ghcid: method: CH_ANNOTATOR_SOURCE ghcid_history: - ghcid: JP-13-MIT-L-KUML - valid_from: "2025-12-10T09:44:08Z" + valid_from: '2025-12-10T09:44:08Z' valid_to: null - reason: "Corrected region code from JP-TO (abbreviation) to JP-13 (Tokyo) per ISO 3166-2:JP" + reason: Corrected region code from JP-TO (abbreviation) to JP-13 (Tokyo) per ISO + 3166-2:JP - ghcid: JP-TO-MIT-L-KUML valid_from: null - valid_to: "2025-12-10T09:44:08Z" - reason: "Previous GHCID with incorrect region code" + valid_to: '2025-12-10T09:44:08Z' + reason: Previous GHCID with incorrect region code - ghcid: JP-TO-MIT-L-KUML ghcid_numeric: 4311543093340900499 valid_from: '2025-12-06T23:38:54.854963+00:00' @@ -101,8 +102,8 @@ ch_annotator: annotation_metadata: confidence_score: 0.98 verified: false - verification_date: - verified_by: + verification_date: null + verified_by: null entity_claims: - claim_type: full_name claim_value: Kyorin University Medical Library @@ -215,3 +216,37 @@ location: geonames_id: 11790343 geonames_name: Mitaka feature_code: PPLA2 +logo_enrichment: + enrichment_timestamp: '2025-12-25T18:17:38.699021+00:00' + source_url: http://www.kyorin-u.ac.jp/univ/center/library/medlib/index.html + extraction_method: crawl4ai + claims: + - claim_type: logo_url + claim_value: http://www.kyorin-u.ac.jp/assets/images/BlkHeader_logo_kyorin.svg + source_url: http://www.kyorin-u.ac.jp/univ/center/library/medlib/index.html + css_selector: '[document] > html.webkit.chrome > body > div.BlkWrapper > header.BlkHeader + > div.BlkHeader__inner > p.BlkHeader__logo > a > img' + retrieved_on: '2025-12-25T18:17:38.699021+00:00' + extraction_method: crawl4ai_header_logo + detection_confidence: high + alt_text: 杏林大学 + - claim_type: favicon_url + claim_value: http://www.kyorin-u.ac.jp/assets/images/icon/apple-touch-icon-180x180.png + source_url: http://www.kyorin-u.ac.jp/univ/center/library/medlib/index.html + css_selector: '[document] > html.webkit.chrome > head > link:nth-of-type(5)' + retrieved_on: '2025-12-25T18:17:38.699021+00:00' + extraction_method: crawl4ai_link_rel + favicon_type: '' + favicon_sizes: 180x180 + - claim_type: og_image_url + claim_value: http://www.kyorin-u.ac.jp/assets/images/ogp.png + source_url: http://www.kyorin-u.ac.jp/univ/center/library/medlib/index.html + css_selector: '[document] > html.webkit.chrome > head > meta:nth-of-type(10)' + retrieved_on: '2025-12-25T18:17:38.699021+00:00' + extraction_method: crawl4ai_meta_og + summary: + total_claims: 3 + has_primary_logo: true + has_favicon: true + has_og_image: true + favicon_count: 5 diff --git a/data/custodian/JP-13-MIT-L-ML-mitakashiritsumitakaekimae_library.yaml b/data/custodian/JP-13-MIT-L-ML-mitakashiritsumitakaekimae_library.yaml index dce25070a6..1e26f25e1f 100644 --- a/data/custodian/JP-13-MIT-L-ML-mitakashiritsumitakaekimae_library.yaml +++ b/data/custodian/JP-13-MIT-L-ML-mitakashiritsumitakaekimae_library.yaml @@ -152,3 +152,20 @@ location: geonames_id: 11790343 geonames_name: Mitaka feature_code: PPLA2 +logo_enrichment: + enrichment_timestamp: '2025-12-25T18:17:49.022688+00:00' + source_url: https://www.library.mitaka.tokyo.jp/contents?18&pid=193 + extraction_method: crawl4ai + claims: + - claim_type: og_image_url + claim_value: https://www.library.mitaka.tokyo.jp/images/ogimage.png + source_url: https://www.library.mitaka.tokyo.jp/contents?18&pid=193 + css_selector: '[document] > html > head > meta:nth-of-type(11)' + retrieved_on: '2025-12-25T18:17:49.022688+00:00' + extraction_method: crawl4ai_meta_og + summary: + total_claims: 1 + has_primary_logo: false + has_favicon: false + has_og_image: true + favicon_count: 0 diff --git a/data/custodian/JP-13-MIT-L-ML-mitakashiritsutobu_library.yaml b/data/custodian/JP-13-MIT-L-ML-mitakashiritsutobu_library.yaml index ffb1f2c035..1faee531f2 100644 --- a/data/custodian/JP-13-MIT-L-ML-mitakashiritsutobu_library.yaml +++ b/data/custodian/JP-13-MIT-L-ML-mitakashiritsutobu_library.yaml @@ -32,13 +32,14 @@ ghcid: method: CH_ANNOTATOR_SOURCE ghcid_history: - ghcid: JP-13-MIT-L-ML-mitakashiritsutobu_library - valid_from: "2025-12-10T09:44:08Z" + valid_from: '2025-12-10T09:44:08Z' valid_to: null - reason: "Corrected region code from JP-TO (abbreviation) to JP-13 (Tokyo) per ISO 3166-2:JP" + reason: Corrected region code from JP-TO (abbreviation) to JP-13 (Tokyo) per ISO + 3166-2:JP - ghcid: JP-TO-MIT-L-ML-mitakashiritsutobu_library valid_from: null - valid_to: "2025-12-10T09:44:08Z" - reason: "Previous GHCID with incorrect region code" + valid_to: '2025-12-10T09:44:08Z' + reason: Previous GHCID with incorrect region code - ghcid: JP-TO-MIT-L-ML-mitakashiritsutobu_library ghcid_numeric: 2796756550464225278 valid_from: '2025-12-06T23:38:43.654360+00:00' @@ -96,8 +97,8 @@ ch_annotator: annotation_metadata: confidence_score: 0.98 verified: false - verification_date: - verified_by: + verification_date: null + verified_by: null entity_claims: - claim_type: full_name claim_value: MITAKASHIRITSUTOBU Library @@ -151,3 +152,20 @@ location: geonames_id: 11790343 geonames_name: Mitaka feature_code: PPLA2 +logo_enrichment: + enrichment_timestamp: '2025-12-25T18:18:34.903123+00:00' + source_url: https://www.library.mitaka.tokyo.jp/contents?13&pid=191 + extraction_method: crawl4ai + claims: + - claim_type: og_image_url + claim_value: https://www.library.mitaka.tokyo.jp/images/ogimage.png + source_url: https://www.library.mitaka.tokyo.jp/contents?13&pid=191 + css_selector: '[document] > html > head > meta:nth-of-type(11)' + retrieved_on: '2025-12-25T18:18:34.903123+00:00' + extraction_method: crawl4ai_meta_og + summary: + total_claims: 1 + has_primary_logo: false + has_favicon: false + has_og_image: true + favicon_count: 0 diff --git a/data/custodian/JP-13-MIT-L-ML.yaml b/data/custodian/JP-13-MIT-L-ML.yaml index b9b3a5e12f..59ec634ecc 100644 --- a/data/custodian/JP-13-MIT-L-ML.yaml +++ b/data/custodian/JP-13-MIT-L-ML.yaml @@ -32,13 +32,14 @@ ghcid: method: CH_ANNOTATOR_SOURCE ghcid_history: - ghcid: JP-13-MIT-L-ML - valid_from: "2025-12-10T09:44:08Z" + valid_from: '2025-12-10T09:44:08Z' valid_to: null - reason: "Corrected region code from JP-TO (abbreviation) to JP-13 (Tokyo) per ISO 3166-2:JP" + reason: Corrected region code from JP-TO (abbreviation) to JP-13 (Tokyo) per ISO + 3166-2:JP - ghcid: JP-TO-MIT-L-ML valid_from: null - valid_to: "2025-12-10T09:44:08Z" - reason: "Previous GHCID with incorrect region code" + valid_to: '2025-12-10T09:44:08Z' + reason: Previous GHCID with incorrect region code - ghcid: JP-TO-MIT-L-ML ghcid_numeric: 1267999272504534013 valid_from: '2025-12-06T23:38:43.652000+00:00' @@ -96,8 +97,8 @@ ch_annotator: annotation_metadata: confidence_score: 0.98 verified: false - verification_date: - verified_by: + verification_date: null + verified_by: null entity_claims: - claim_type: full_name claim_value: MITAKASHIRITSUMITAKA Library @@ -151,3 +152,20 @@ location: geonames_id: 11790343 geonames_name: Mitaka feature_code: PPLA2 +logo_enrichment: + enrichment_timestamp: '2025-12-25T18:18:47.711707+00:00' + source_url: https://www.library.mitaka.tokyo.jp/contents?12&pid=190 + extraction_method: crawl4ai + claims: + - claim_type: og_image_url + claim_value: https://www.library.mitaka.tokyo.jp/images/ogimage.png + source_url: https://www.library.mitaka.tokyo.jp/contents?12&pid=190 + css_selector: '[document] > html > head > meta:nth-of-type(11)' + retrieved_on: '2025-12-25T18:18:47.711707+00:00' + extraction_method: crawl4ai_meta_og + summary: + total_claims: 1 + has_primary_logo: false + has_favicon: false + has_og_image: true + favicon_count: 0 diff --git a/data/custodian/JP-13-MIT-L-MLM.yaml b/data/custodian/JP-13-MIT-L-MLM.yaml index 0c6aa390f0..5cd3807de5 100644 --- a/data/custodian/JP-13-MIT-L-MLM.yaml +++ b/data/custodian/JP-13-MIT-L-MLM.yaml @@ -32,13 +32,14 @@ ghcid: method: CH_ANNOTATOR_SOURCE ghcid_history: - ghcid: JP-13-MIT-L-MLM - valid_from: "2025-12-10T09:44:08Z" + valid_from: '2025-12-10T09:44:08Z' valid_to: null - reason: "Corrected region code from JP-TO (abbreviation) to JP-13 (Tokyo) per ISO 3166-2:JP" + reason: Corrected region code from JP-TO (abbreviation) to JP-13 (Tokyo) per ISO + 3166-2:JP - ghcid: JP-TO-MIT-L-MLM valid_from: null - valid_to: "2025-12-10T09:44:08Z" - reason: "Previous GHCID with incorrect region code" + valid_to: '2025-12-10T09:44:08Z' + reason: Previous GHCID with incorrect region code - ghcid: JP-TO-MIT-L-MLM ghcid_numeric: 16707625640540277782 valid_from: '2025-12-06T23:38:51.088597+00:00' @@ -96,8 +97,8 @@ ch_annotator: annotation_metadata: confidence_score: 0.98 verified: false - verification_date: - verified_by: + verification_date: null + verified_by: null entity_claims: - claim_type: full_name claim_value: MITAKASHIRITSUNAMBU Library MINNAMI @@ -151,3 +152,20 @@ location: geonames_id: 11790343 geonames_name: Mitaka feature_code: PPLA2 +logo_enrichment: + enrichment_timestamp: '2025-12-25T18:18:58.450536+00:00' + source_url: https://www.library.mitaka.tokyo.jp/library/south + extraction_method: crawl4ai + claims: + - claim_type: og_image_url + claim_value: https://www.library.mitaka.tokyo.jp/images/ogimage.png + source_url: https://www.library.mitaka.tokyo.jp/library/south + css_selector: '[document] > html > head > meta:nth-of-type(11)' + retrieved_on: '2025-12-25T18:18:58.450536+00:00' + extraction_method: crawl4ai_meta_og + summary: + total_claims: 1 + has_primary_logo: false + has_favicon: false + has_og_image: true + favicon_count: 0 diff --git a/data/custodian/JP-13-MIT-L-NAOJL.yaml b/data/custodian/JP-13-MIT-L-NAOJL.yaml index 114e7e683f..0744670509 100644 --- a/data/custodian/JP-13-MIT-L-NAOJL.yaml +++ b/data/custodian/JP-13-MIT-L-NAOJL.yaml @@ -32,13 +32,14 @@ ghcid: method: CH_ANNOTATOR_SOURCE ghcid_history: - ghcid: JP-13-MIT-L-NAOJL - valid_from: "2025-12-10T09:44:08Z" + valid_from: '2025-12-10T09:44:08Z' valid_to: null - reason: "Corrected region code from JP-TO (abbreviation) to JP-13 (Tokyo) per ISO 3166-2:JP" + reason: Corrected region code from JP-TO (abbreviation) to JP-13 (Tokyo) per ISO + 3166-2:JP - ghcid: JP-TO-MIT-L-NAOJL valid_from: null - valid_to: "2025-12-10T09:44:08Z" - reason: "Previous GHCID with incorrect region code" + valid_to: '2025-12-10T09:44:08Z' + reason: Previous GHCID with incorrect region code - ghcid: JP-TO-MIT-L-NAOJL ghcid_numeric: 18037306652176769122 valid_from: '2025-12-06T23:38:57.541594+00:00' @@ -96,8 +97,8 @@ ch_annotator: annotation_metadata: confidence_score: 0.98 verified: false - verification_date: - verified_by: + verification_date: null + verified_by: null entity_claims: - claim_type: full_name claim_value: National Astronomical Observatory of Japan Library @@ -151,3 +152,23 @@ location: geonames_id: 11790343 geonames_name: Mitaka feature_code: PPLA2 +logo_enrichment: + enrichment_timestamp: '2025-12-25T18:19:05.625483+00:00' + source_url: http://library.nao.ac.jp + extraction_method: crawl4ai + claims: + - claim_type: logo_url + claim_value: http://library.nao.ac.jp/images/header-logo.svg + source_url: http://library.nao.ac.jp + css_selector: '#top > div.header-container > div.sitetitle > h1.header-logo > + a > img' + retrieved_on: '2025-12-25T18:19:05.625483+00:00' + extraction_method: crawl4ai_header_logo + detection_confidence: high + alt_text: Welcome to NAOJ Library! 国立天文台図書室! + summary: + total_claims: 1 + has_primary_logo: true + has_favicon: false + has_og_image: false + favicon_count: 0 diff --git a/data/custodian/JP-13-MIT-L-TUTSL.yaml b/data/custodian/JP-13-MIT-L-TUTSL.yaml index 5ef0c91545..71c59d92fa 100644 --- a/data/custodian/JP-13-MIT-L-TUTSL.yaml +++ b/data/custodian/JP-13-MIT-L-TUTSL.yaml @@ -37,13 +37,14 @@ ghcid: method: CH_ANNOTATOR_SOURCE ghcid_history: - ghcid: JP-13-MIT-L-TUTSL - valid_from: "2025-12-10T09:44:08Z" + valid_from: '2025-12-10T09:44:08Z' valid_to: null - reason: "Corrected region code from JP-TO (abbreviation) to JP-13 (Tokyo) per ISO 3166-2:JP" + reason: Corrected region code from JP-TO (abbreviation) to JP-13 (Tokyo) per ISO + 3166-2:JP - ghcid: JP-TO-MIT-L-TUTSL valid_from: null - valid_to: "2025-12-10T09:44:08Z" - reason: "Previous GHCID with incorrect region code" + valid_to: '2025-12-10T09:44:08Z' + reason: Previous GHCID with incorrect region code - ghcid: JP-TO-MIT-L-TUTSL ghcid_numeric: 11094330771851470768 valid_from: '2025-12-06T23:38:55.114945+00:00' @@ -101,8 +102,8 @@ ch_annotator: annotation_metadata: confidence_score: 0.98 verified: false - verification_date: - verified_by: + verification_date: null + verified_by: null entity_claims: - claim_type: full_name claim_value: Tokyo Union Theological Seminary Library @@ -215,3 +216,22 @@ location: geonames_id: 11790343 geonames_name: Mitaka feature_code: PPLA2 +logo_enrichment: + enrichment_timestamp: '2025-12-25T18:19:13.509407+00:00' + source_url: http://www.tuts.ac.jp/toshokan + extraction_method: crawl4ai + claims: + - claim_type: favicon_url + claim_value: http://www.tuts.ac.jp/favicon.ico + source_url: http://www.tuts.ac.jp/toshokan + css_selector: '[document] > html > head > link' + retrieved_on: '2025-12-25T18:19:13.509407+00:00' + extraction_method: crawl4ai_link_rel + favicon_type: '' + favicon_sizes: '' + summary: + total_claims: 1 + has_primary_logo: false + has_favicon: true + has_og_image: false + favicon_count: 1 diff --git a/data/custodian/JP-13-MIT-M-GMM.yaml b/data/custodian/JP-13-MIT-M-GMM.yaml index 683cdbabc0..57b560cf70 100644 --- a/data/custodian/JP-13-MIT-M-GMM.yaml +++ b/data/custodian/JP-13-MIT-M-GMM.yaml @@ -32,13 +32,14 @@ ghcid: method: CH_ANNOTATOR_SOURCE ghcid_history: - ghcid: JP-13-MIT-M-GMM - valid_from: "2025-12-10T09:44:08Z" + valid_from: '2025-12-10T09:44:08Z' valid_to: null - reason: "Corrected region code from JP-TO (abbreviation) to JP-13 (Tokyo) per ISO 3166-2:JP" + reason: Corrected region code from JP-TO (abbreviation) to JP-13 (Tokyo) per ISO + 3166-2:JP - ghcid: JP-TO-MIT-M-GMM valid_from: null - valid_to: "2025-12-10T09:44:08Z" - reason: "Previous GHCID with incorrect region code" + valid_to: '2025-12-10T09:44:08Z' + reason: Previous GHCID with incorrect region code - ghcid: JP-TO-MIT-M-GMM ghcid_numeric: 15371511933325802883 valid_from: '2025-12-06T23:38:33.590273+00:00' @@ -96,8 +97,8 @@ ch_annotator: annotation_metadata: confidence_score: 0.98 verified: false - verification_date: - verified_by: + verification_date: null + verified_by: null entity_claims: - claim_type: full_name claim_value: GHIBLI MUSEUM, MITAKA @@ -151,3 +152,28 @@ location: geonames_id: 11790343 geonames_name: Mitaka feature_code: PPLA2 +logo_enrichment: + enrichment_timestamp: '2025-12-25T18:19:18.074672+00:00' + source_url: https://www.ghibli-museum.jp + extraction_method: crawl4ai + claims: + - claim_type: favicon_url + claim_value: https://www.ghibli-museum.jp/apple-touch-icon.png + source_url: https://www.ghibli-museum.jp + css_selector: '[document] > html > head > link' + retrieved_on: '2025-12-25T18:19:18.074672+00:00' + extraction_method: crawl4ai_link_rel + favicon_type: '' + favicon_sizes: '' + - claim_type: og_image_url + claim_value: https://www.ghibli-museum.jp/img/ghibli-museum.png + source_url: https://www.ghibli-museum.jp + css_selector: '[document] > html > head > meta:nth-of-type(11)' + retrieved_on: '2025-12-25T18:19:18.074672+00:00' + extraction_method: crawl4ai_meta_og + summary: + total_claims: 2 + has_primary_logo: false + has_favicon: true + has_og_image: true + favicon_count: 3 diff --git a/data/custodian/JP-13-MIT-M-ICUHYMM.yaml b/data/custodian/JP-13-MIT-M-ICUHYMM.yaml index 2ceafb9457..0614c9f47e 100644 --- a/data/custodian/JP-13-MIT-M-ICUHYMM.yaml +++ b/data/custodian/JP-13-MIT-M-ICUHYMM.yaml @@ -368,3 +368,22 @@ youtube_enrichment: comments: [] thumbnail_url: https://i.ytimg.com/vi/ZBnnV6w2ljk/hqdefault.jpg status: SUCCESS +logo_enrichment: + enrichment_timestamp: '2025-12-25T18:19:24.463808+00:00' + source_url: https://subsites.icu.ac.jp/yuasa_museum + extraction_method: crawl4ai + claims: + - claim_type: logo_url + claim_value: https://subsites.icu.ac.jp/image/yuasa_title2.gif + source_url: https://subsites.icu.ac.jp/yuasa_museum + css_selector: '#header_f > div.index_imgs2:nth-of-type(2) > a > img.index_logo' + retrieved_on: '2025-12-25T18:19:24.463808+00:00' + extraction_method: crawl4ai_header_logo + detection_confidence: high + alt_text: '' + summary: + total_claims: 1 + has_primary_logo: true + has_favicon: false + has_og_image: false + favicon_count: 0 diff --git a/data/custodian/JP-13-MIY-L-HL.yaml b/data/custodian/JP-13-MIY-L-HL.yaml index e758c81ee6..231e59a9bd 100644 --- a/data/custodian/JP-13-MIY-L-HL.yaml +++ b/data/custodian/JP-13-MIY-L-HL.yaml @@ -155,3 +155,22 @@ geocoding: resolved_place: Nishisho resolved_city: 'Miyoshi Gun ' timestamp: '2025-12-09T23:13:34.344579+00:00' +logo_enrichment: + enrichment_timestamp: '2025-12-25T18:19:40.691362+00:00' + source_url: http://higashimiyoshi-town-library.com + extraction_method: crawl4ai + claims: + - claim_type: favicon_url + claim_value: http://higashimiyoshi-town-library.com/wp/wp-content/themes/twentytwelve/img/favicon.png + source_url: http://higashimiyoshi-town-library.com + css_selector: '[document] > html > head > link' + retrieved_on: '2025-12-25T18:19:40.691362+00:00' + extraction_method: crawl4ai_link_rel + favicon_type: '' + favicon_sizes: '' + summary: + total_claims: 1 + has_primary_logo: false + has_favicon: true + has_og_image: false + favicon_count: 1 diff --git a/data/custodian/JP-13-MIY-L-M.yaml b/data/custodian/JP-13-MIY-L-M.yaml index 75e9d15e6e..e0487382ca 100644 --- a/data/custodian/JP-13-MIY-L-M.yaml +++ b/data/custodian/JP-13-MIY-L-M.yaml @@ -34,13 +34,14 @@ ghcid: method: CH_ANNOTATOR_SOURCE ghcid_history: - ghcid: JP-13-MIY-L-M - valid_from: "2025-12-10T09:44:08Z" + valid_from: '2025-12-10T09:44:08Z' valid_to: null - reason: "Corrected region code from JP-TO (abbreviation) to JP-13 (Tokyo) per ISO 3166-2:JP" + reason: Corrected region code from JP-TO (abbreviation) to JP-13 (Tokyo) per ISO + 3166-2:JP - ghcid: JP-TO-MIY-L-M valid_from: null - valid_to: "2025-12-10T09:44:08Z" - reason: "Previous GHCID with incorrect region code" + valid_to: '2025-12-10T09:44:08Z' + reason: Previous GHCID with incorrect region code - ghcid: JP-TO-MIY-L-M ghcid_numeric: 4322077769137226660 valid_from: '2025-12-06T23:38:43.986542+00:00' @@ -153,3 +154,22 @@ geocoding: resolved_place: Miyake-mura resolved_city: Miyake-mura timestamp: '2025-12-09T23:18:43.325474+00:00' +logo_enrichment: + enrichment_timestamp: '2025-12-25T18:19:48.604369+00:00' + source_url: https://www.vill.miyake.tokyo.jp/kakuka/kyouikuiinkai/shisetsu/toshokan.html + extraction_method: crawl4ai + claims: + - claim_type: favicon_url + claim_value: https://www.vill.miyake.tokyo.jp/images/base/favicon.ico + source_url: https://www.vill.miyake.tokyo.jp/kakuka/kyouikuiinkai/shisetsu/toshokan.html + css_selector: '[document] > html > head > link:nth-of-type(7)' + retrieved_on: '2025-12-25T18:19:48.604369+00:00' + extraction_method: crawl4ai_link_rel + favicon_type: '' + favicon_sizes: '' + summary: + total_claims: 1 + has_primary_logo: false + has_favicon: true + has_og_image: false + favicon_count: 1 diff --git a/data/custodian/JP-13-MIY-M-HCFHMH.yaml b/data/custodian/JP-13-MIY-M-HCFHMH.yaml index 760fc65c52..451eff36d2 100644 --- a/data/custodian/JP-13-MIY-M-HCFHMH.yaml +++ b/data/custodian/JP-13-MIY-M-HCFHMH.yaml @@ -39,13 +39,14 @@ ghcid: method: CH_ANNOTATOR_SOURCE ghcid_history: - ghcid: JP-13-MIY-M-HCFHMH - valid_from: "2025-12-10T09:44:08Z" + valid_from: '2025-12-10T09:44:08Z' valid_to: null - reason: "Corrected region code from JP-TO (abbreviation) to JP-13 (Tokyo) per ISO 3166-2:JP" + reason: Corrected region code from JP-TO (abbreviation) to JP-13 (Tokyo) per ISO + 3166-2:JP - ghcid: JP-TO-MIY-M-HCFHMH valid_from: null - valid_to: "2025-12-10T09:44:08Z" - reason: "Previous GHCID with incorrect region code" + valid_to: '2025-12-10T09:44:08Z' + reason: Previous GHCID with incorrect region code - ghcid: JP-TO-MIY-M-HCFHMH ghcid_numeric: 11739827447343428757 valid_from: '2025-12-06T23:38:39.343447+00:00' @@ -103,8 +104,8 @@ ch_annotator: annotation_metadata: confidence_score: 0.98 verified: false - verification_date: - verified_by: + verification_date: null + verified_by: null entity_claims: - claim_type: full_name claim_value: HIGASHIMIYOSHI-CHO FOLK HISTORICAL MATERIAL HALL @@ -178,8 +179,8 @@ wikidata_enrichment: instance_of: &id004 - id: Q33506 label: museum - description: institution that holds artifacts and other objects of scientific, artistic, cultural, historical, or other - importance + description: institution that holds artifacts and other objects of scientific, + artistic, cultural, historical, or other importance wikidata_instance_of: *id004 wikidata_location: country: &id005 @@ -222,3 +223,22 @@ location: postal_code: 779-4703 street_address: NAKASHO, Miyoshi Gun Higashimiyoshi Cho, Tokushima Ken, 779-4703 normalization_timestamp: '2025-12-09T12:21:59.138762+00:00' +logo_enrichment: + enrichment_timestamp: '2025-12-25T18:20:18.346862+00:00' + source_url: https://www.town.higashimiyoshi.lg.jp/institution/list/institution79 + extraction_method: crawl4ai + claims: + - claim_type: favicon_url + claim_value: https://www.town.higashimiyoshi.lg.jp/img/favicon.ico + source_url: https://www.town.higashimiyoshi.lg.jp/institution/list/institution79 + css_selector: '[document] > html > head > link:nth-of-type(5)' + retrieved_on: '2025-12-25T18:20:18.346862+00:00' + extraction_method: crawl4ai_link_rel + favicon_type: image/x-icon + favicon_sizes: '' + summary: + total_claims: 1 + has_primary_logo: false + has_favicon: true + has_og_image: false + favicon_count: 1 diff --git a/data/custodian/JP-13-MIY-M-HYMF.yaml b/data/custodian/JP-13-MIY-M-HYMF.yaml index a9cac4e60e..ed67d07f5f 100644 --- a/data/custodian/JP-13-MIY-M-HYMF.yaml +++ b/data/custodian/JP-13-MIY-M-HYMF.yaml @@ -15,7 +15,8 @@ original_entry: city: Miyoshi Shi region: Tokushima Ken postal_code: 778-0105 - street_address: NISHIIYAYAMAMURA HIGASHINISHIOKA, Miyoshi Shi, Tokushima Ken, 778-0105 + street_address: NISHIIYAYAMAMURA HIGASHINISHIOKA, Miyoshi Shi, Tokushima Ken, + 778-0105 processing_timestamp: '2025-12-06T23:38:39.305596+00:00' ghcid: ghcid_current: JP-13-MIY-M-HYMF @@ -32,13 +33,14 @@ ghcid: method: CH_ANNOTATOR_SOURCE ghcid_history: - ghcid: JP-13-MIY-M-HYMF - valid_from: "2025-12-10T09:44:08Z" + valid_from: '2025-12-10T09:44:08Z' valid_to: null - reason: "Corrected region code from JP-TO (abbreviation) to JP-13 (Tokyo) per ISO 3166-2:JP" + reason: Corrected region code from JP-TO (abbreviation) to JP-13 (Tokyo) per ISO + 3166-2:JP - ghcid: JP-TO-MIY-M-HYMF valid_from: null - valid_to: "2025-12-10T09:44:08Z" - reason: "Previous GHCID with incorrect region code" + valid_to: '2025-12-10T09:44:08Z' + reason: Previous GHCID with incorrect region code - ghcid: JP-TO-MIY-M-HYMF ghcid_numeric: 3351367268967300184 valid_from: '2025-12-06T23:38:39.305596+00:00' @@ -96,8 +98,8 @@ ch_annotator: annotation_metadata: confidence_score: 0.98 verified: false - verification_date: - verified_by: + verification_date: null + verified_by: null entity_claims: - claim_type: full_name claim_value: Heike Yashiki Museum of Folklore @@ -151,3 +153,20 @@ location: geonames_id: 11612340 geonames_name: Miyoshi feature_code: PPLA2 +logo_enrichment: + enrichment_timestamp: '2025-12-25T18:20:25.030528+00:00' + source_url: https://r.goope.jp/heike-1408 + extraction_method: crawl4ai + claims: + - claim_type: og_image_url + claim_value: https://cdn.goope.jp/181111/240808143339wuj6.jpg + source_url: https://r.goope.jp/heike-1408 + css_selector: '[document] > html > head > meta:nth-of-type(6)' + retrieved_on: '2025-12-25T18:20:25.030528+00:00' + extraction_method: crawl4ai_meta_og + summary: + total_claims: 1 + has_primary_logo: false + has_favicon: false + has_og_image: true + favicon_count: 0 diff --git a/data/custodian/JP-13-MOK-L-M.yaml b/data/custodian/JP-13-MOK-L-M.yaml index 127a322876..35e3cf0801 100644 --- a/data/custodian/JP-13-MOK-L-M.yaml +++ b/data/custodian/JP-13-MOK-L-M.yaml @@ -32,13 +32,14 @@ ghcid: method: CH_ANNOTATOR_SOURCE ghcid_history: - ghcid: JP-13-MOK-L-M - valid_from: "2025-12-10T09:44:08Z" + valid_from: '2025-12-10T09:44:08Z' valid_to: null - reason: "Corrected region code from JP-TO (abbreviation) to JP-13 (Tokyo) per ISO 3166-2:JP" + reason: Corrected region code from JP-TO (abbreviation) to JP-13 (Tokyo) per ISO + 3166-2:JP - ghcid: JP-TO-MOK-L-M valid_from: null - valid_to: "2025-12-10T09:44:08Z" - reason: "Previous GHCID with incorrect region code" + valid_to: '2025-12-10T09:44:08Z' + reason: Previous GHCID with incorrect region code - ghcid: JP-TO-MOK-L-M ghcid_numeric: 500133292035345657 valid_from: '2025-12-06T23:38:51.471153+00:00' @@ -96,8 +97,8 @@ ch_annotator: annotation_metadata: confidence_score: 0.98 verified: false - verification_date: - verified_by: + verification_date: null + verified_by: null entity_claims: - claim_type: full_name claim_value: MOKASHIRITSUMOKASHIKOMINKAMMOKANISHIBUNKANTOSHOSHITSU @@ -151,3 +152,36 @@ location: geonames_id: 9290061 geonames_name: Kimokawa feature_code: PPL +logo_enrichment: + enrichment_timestamp: '2025-12-25T18:20:40.155736+00:00' + source_url: https://www.moka-lib.jp + extraction_method: crawl4ai + claims: + - claim_type: logo_url + claim_value: https://mokamonaca.jp/example/wp-content/uploads/2024/07/cropped-logo.png + source_url: https://www.moka-lib.jp + css_selector: '#top-anchor > div.elementor-widget-container > a > img.attachment-full.size-full' + retrieved_on: '2025-12-25T18:20:40.155736+00:00' + extraction_method: crawl4ai_header_logo + detection_confidence: high + alt_text: '' + - claim_type: favicon_url + claim_value: https://mokamonaca.jp/example/wp-content/uploads/2025/01/cropped-favicon_monaca-180x180.png + source_url: https://www.moka-lib.jp + css_selector: '[document] > html > head > link:nth-of-type(59)' + retrieved_on: '2025-12-25T18:20:40.155736+00:00' + extraction_method: crawl4ai_link_rel + favicon_type: '' + favicon_sizes: '' + - claim_type: og_image_url + claim_value: https://mokamonaca.jp/example/wp-content/uploads/2024/11/FV_02.png + source_url: https://www.moka-lib.jp + css_selector: '[document] > html > head > meta:nth-of-type(12)' + retrieved_on: '2025-12-25T18:20:40.155736+00:00' + extraction_method: crawl4ai_meta_og + summary: + total_claims: 3 + has_primary_logo: true + has_favicon: true + has_og_image: true + favicon_count: 3 diff --git a/data/custodian/JP-13-MOK-L-MCL.yaml b/data/custodian/JP-13-MOK-L-MCL.yaml index 03fb346e47..8041134980 100644 --- a/data/custodian/JP-13-MOK-L-MCL.yaml +++ b/data/custodian/JP-13-MOK-L-MCL.yaml @@ -32,13 +32,14 @@ ghcid: method: CH_ANNOTATOR_SOURCE ghcid_history: - ghcid: JP-13-MOK-L-MCL - valid_from: "2025-12-10T09:44:08Z" + valid_from: '2025-12-10T09:44:08Z' valid_to: null - reason: "Corrected region code from JP-TO (abbreviation) to JP-13 (Tokyo) per ISO 3166-2:JP" + reason: Corrected region code from JP-TO (abbreviation) to JP-13 (Tokyo) per ISO + 3166-2:JP - ghcid: JP-TO-MOK-L-MCL valid_from: null - valid_to: "2025-12-10T09:44:08Z" - reason: "Previous GHCID with incorrect region code" + valid_to: '2025-12-10T09:44:08Z' + reason: Previous GHCID with incorrect region code - ghcid: JP-TO-MOK-L-MCL ghcid_numeric: 12304372972058695766 valid_from: '2025-12-06T23:38:42.210264+00:00' @@ -96,8 +97,8 @@ ch_annotator: annotation_metadata: confidence_score: 0.98 verified: false - verification_date: - verified_by: + verification_date: null + verified_by: null entity_claims: - claim_type: full_name claim_value: Moka City Library @@ -151,3 +152,36 @@ location: geonames_id: 9290061 geonames_name: Kimokawa feature_code: PPL +logo_enrichment: + enrichment_timestamp: '2025-12-25T18:20:51.683761+00:00' + source_url: https://www.moka-lib.jp + extraction_method: crawl4ai + claims: + - claim_type: logo_url + claim_value: https://mokamonaca.jp/example/wp-content/uploads/2024/07/cropped-logo.png + source_url: https://www.moka-lib.jp + css_selector: '#top-anchor > div.elementor-widget-container > a > img.attachment-full.size-full' + retrieved_on: '2025-12-25T18:20:51.683761+00:00' + extraction_method: crawl4ai_header_logo + detection_confidence: high + alt_text: '' + - claim_type: favicon_url + claim_value: https://mokamonaca.jp/example/wp-content/uploads/2025/01/cropped-favicon_monaca-180x180.png + source_url: https://www.moka-lib.jp + css_selector: '[document] > html > head > link:nth-of-type(59)' + retrieved_on: '2025-12-25T18:20:51.683761+00:00' + extraction_method: crawl4ai_link_rel + favicon_type: '' + favicon_sizes: '' + - claim_type: og_image_url + claim_value: https://mokamonaca.jp/example/wp-content/uploads/2024/11/FV_02.png + source_url: https://www.moka-lib.jp + css_selector: '[document] > html > head > meta:nth-of-type(12)' + retrieved_on: '2025-12-25T18:20:51.683761+00:00' + extraction_method: crawl4ai_meta_og + summary: + total_claims: 3 + has_primary_logo: true + has_favicon: true + has_og_image: true + favicon_count: 3 diff --git a/data/custodian/JP-13-MOK-L-ML.yaml b/data/custodian/JP-13-MOK-L-ML.yaml index 09f3a91c9c..f4b3027130 100644 --- a/data/custodian/JP-13-MOK-L-ML.yaml +++ b/data/custodian/JP-13-MOK-L-ML.yaml @@ -32,13 +32,14 @@ ghcid: method: CH_ANNOTATOR_SOURCE ghcid_history: - ghcid: JP-13-MOK-L-ML - valid_from: "2025-12-10T09:44:08Z" + valid_from: '2025-12-10T09:44:08Z' valid_to: null - reason: "Corrected region code from JP-TO (abbreviation) to JP-13 (Tokyo) per ISO 3166-2:JP" + reason: Corrected region code from JP-TO (abbreviation) to JP-13 (Tokyo) per ISO + 3166-2:JP - ghcid: JP-TO-MOK-L-ML valid_from: null - valid_to: "2025-12-10T09:44:08Z" - reason: "Previous GHCID with incorrect region code" + valid_to: '2025-12-10T09:44:08Z' + reason: Previous GHCID with incorrect region code - ghcid: JP-TO-MOK-L-ML ghcid_numeric: 3890576959471481948 valid_from: '2025-12-06T23:38:51.473405+00:00' @@ -96,8 +97,8 @@ ch_annotator: annotation_metadata: confidence_score: 0.98 verified: false - verification_date: - verified_by: + verification_date: null + verified_by: null entity_claims: - claim_type: full_name claim_value: MOKASHININOMIYA Library @@ -151,3 +152,36 @@ location: geonames_id: 9290061 geonames_name: Kimokawa feature_code: PPL +logo_enrichment: + enrichment_timestamp: '2025-12-25T18:21:01.434504+00:00' + source_url: https://www.moka-lib.jp + extraction_method: crawl4ai + claims: + - claim_type: logo_url + claim_value: https://mokamonaca.jp/example/wp-content/uploads/2024/07/cropped-logo.png + source_url: https://www.moka-lib.jp + css_selector: '#top-anchor > div.elementor-widget-container > a > img.attachment-full.size-full' + retrieved_on: '2025-12-25T18:21:01.434504+00:00' + extraction_method: crawl4ai_header_logo + detection_confidence: high + alt_text: '' + - claim_type: favicon_url + claim_value: https://mokamonaca.jp/example/wp-content/uploads/2025/01/cropped-favicon_monaca-180x180.png + source_url: https://www.moka-lib.jp + css_selector: '[document] > html > head > link:nth-of-type(59)' + retrieved_on: '2025-12-25T18:21:01.434504+00:00' + extraction_method: crawl4ai_link_rel + favicon_type: '' + favicon_sizes: '' + - claim_type: og_image_url + claim_value: https://mokamonaca.jp/example/wp-content/uploads/2024/11/FV_02.png + source_url: https://www.moka-lib.jp + css_selector: '[document] > html > head > meta:nth-of-type(12)' + retrieved_on: '2025-12-25T18:21:01.434504+00:00' + extraction_method: crawl4ai_meta_og + summary: + total_claims: 3 + has_primary_logo: true + has_favicon: true + has_og_image: true + favicon_count: 3 diff --git a/data/custodian/JP-13-MOK-M-KMTCECAEH.yaml b/data/custodian/JP-13-MOK-M-KMTCECAEH.yaml index b1f2a8eacb..ed0d0f5e7c 100644 --- a/data/custodian/JP-13-MOK-M-KMTCECAEH.yaml +++ b/data/custodian/JP-13-MOK-M-KMTCECAEH.yaml @@ -32,13 +32,14 @@ ghcid: method: CH_ANNOTATOR_SOURCE ghcid_history: - ghcid: JP-13-MOK-M-KMTCECAEH - valid_from: "2025-12-10T09:44:08Z" + valid_from: '2025-12-10T09:44:08Z' valid_to: null - reason: "Corrected region code from JP-TO (abbreviation) to JP-13 (Tokyo) per ISO 3166-2:JP" + reason: Corrected region code from JP-TO (abbreviation) to JP-13 (Tokyo) per ISO + 3166-2:JP - ghcid: JP-TO-MOK-M-KMTCECAEH valid_from: null - valid_to: "2025-12-10T09:44:08Z" - reason: "Previous GHCID with incorrect region code" + valid_to: '2025-12-10T09:44:08Z' + reason: Previous GHCID with incorrect region code - ghcid: JP-TO-MOK-M-KMTCECAEH ghcid_numeric: 10435167460095439622 valid_from: '2025-12-06T23:38:31.873645+00:00' @@ -96,11 +97,12 @@ ch_annotator: annotation_metadata: confidence_score: 0.98 verified: false - verification_date: - verified_by: + verification_date: null + verified_by: null entity_claims: - claim_type: full_name - claim_value: KUBO MEMORIAL TOURISM AND CULTURE EXCHANGE CENTER ART EXHIBITION HALL + claim_value: KUBO MEMORIAL TOURISM AND CULTURE EXCHANGE CENTER ART EXHIBITION + HALL property_uri: skos:prefLabel provenance: namespace: glam @@ -151,3 +153,28 @@ location: geonames_id: 9290061 geonames_name: Kimokawa feature_code: PPL +logo_enrichment: + enrichment_timestamp: '2025-12-25T18:21:11.977630+00:00' + source_url: https://www.kubokinen.net + extraction_method: crawl4ai + claims: + - claim_type: favicon_url + claim_value: https://www.kubokinen.net/favicon.ico + source_url: https://www.kubokinen.net + css_selector: '[document] > html.js.no-touch > head > link' + retrieved_on: '2025-12-25T18:21:11.977630+00:00' + extraction_method: crawl4ai_link_rel + favicon_type: '' + favicon_sizes: '' + - claim_type: og_image_url + claim_value: https://www.kubokinen.net/images/image1.jpg + source_url: https://www.kubokinen.net + css_selector: '[document] > html.js.no-touch > head > meta:nth-of-type(12)' + retrieved_on: '2025-12-25T18:21:11.977630+00:00' + extraction_method: crawl4ai_meta_og + summary: + total_claims: 2 + has_primary_logo: false + has_favicon: true + has_og_image: true + favicon_count: 1 diff --git a/data/custodian/JP-13-MUS-A-MHM-musashino_histrical_museum.yaml b/data/custodian/JP-13-MUS-A-MHM-musashino_histrical_museum.yaml index 300a035e30..522b45005a 100644 --- a/data/custodian/JP-13-MUS-A-MHM-musashino_histrical_museum.yaml +++ b/data/custodian/JP-13-MUS-A-MHM-musashino_histrical_museum.yaml @@ -32,13 +32,14 @@ ghcid: method: CH_ANNOTATOR_SOURCE ghcid_history: - ghcid: JP-13-MUS-A-MHM-musashino_histrical_museum - valid_from: "2025-12-10T09:44:08Z" + valid_from: '2025-12-10T09:44:08Z' valid_to: null - reason: "Corrected region code from JP-TO (abbreviation) to JP-13 (Tokyo) per ISO 3166-2:JP" + reason: Corrected region code from JP-TO (abbreviation) to JP-13 (Tokyo) per ISO + 3166-2:JP - ghcid: JP-TO-MUS-A-MHM-musashino_histrical_museum valid_from: null - valid_to: "2025-12-10T09:44:08Z" - reason: "Previous GHCID with incorrect region code" + valid_to: '2025-12-10T09:44:08Z' + reason: Previous GHCID with incorrect region code - ghcid: JP-TO-MUS-A-MHM-musashino_histrical_museum ghcid_numeric: 10314715769012924019 valid_from: '2025-12-06T23:38:29.572009+00:00' @@ -96,8 +97,8 @@ ch_annotator: annotation_metadata: confidence_score: 0.98 verified: false - verification_date: - verified_by: + verification_date: null + verified_by: null entity_claims: - claim_type: full_name claim_value: Musashino Histrical Museum @@ -151,3 +152,36 @@ location: geonames_id: 1856367 geonames_name: Musashino feature_code: PPLA2 +logo_enrichment: + enrichment_timestamp: '2025-12-25T18:21:55.661470+00:00' + source_url: http://www.city.musashino.lg.jp/kurashi_guide/shogaigakushu_koza/rekishikan/index.html + extraction_method: crawl4ai + claims: + - claim_type: logo_url + claim_value: http://www.city.musashino.lg.jp/kurashi_guide/_template_/_site_/_default_/_res/design/images/header/tlogo.png + source_url: http://www.city.musashino.lg.jp/kurashi_guide/shogaigakushu_koza/rekishikan/index.html + css_selector: '#tlogo > p > a > img' + retrieved_on: '2025-12-25T18:21:55.661470+00:00' + extraction_method: crawl4ai_header_logo + detection_confidence: high + alt_text: 武蔵野市 + - claim_type: favicon_url + claim_value: http://www.city.musashino.lg.jp/kurashi_guide/_template_/_site_/_default_/_res/images/apple-touch-icon-precomposed.png + source_url: http://www.city.musashino.lg.jp/kurashi_guide/shogaigakushu_koza/rekishikan/index.html + css_selector: '[document] > html > head > link:nth-of-type(8)' + retrieved_on: '2025-12-25T18:21:55.661470+00:00' + extraction_method: crawl4ai_link_rel + favicon_type: '' + favicon_sizes: '' + - claim_type: og_image_url + claim_value: https://www.city.musashino.lg.jp/_template_/_site_/_default_/_res/images/sns/ogimage.png + source_url: http://www.city.musashino.lg.jp/kurashi_guide/shogaigakushu_koza/rekishikan/index.html + css_selector: '[document] > html > head > meta:nth-of-type(11)' + retrieved_on: '2025-12-25T18:21:55.661470+00:00' + extraction_method: crawl4ai_meta_og + summary: + total_claims: 3 + has_primary_logo: true + has_favicon: true + has_og_image: true + favicon_count: 2 diff --git a/data/custodian/JP-13-MUS-A-MHM.yaml b/data/custodian/JP-13-MUS-A-MHM.yaml index 513c34f0cb..1d7610869c 100644 --- a/data/custodian/JP-13-MUS-A-MHM.yaml +++ b/data/custodian/JP-13-MUS-A-MHM.yaml @@ -152,3 +152,36 @@ location: geonames_id: 1856367 geonames_name: Musashino feature_code: PPLA2 +logo_enrichment: + enrichment_timestamp: '2025-12-25T18:22:02.260288+00:00' + source_url: http://www.city.musashino.lg.jp/kurashi_guide/shogaigakushu_koza/rekishikan/index.html + extraction_method: crawl4ai + claims: + - claim_type: logo_url + claim_value: http://www.city.musashino.lg.jp/kurashi_guide/_template_/_site_/_default_/_res/design/images/header/tlogo.png + source_url: http://www.city.musashino.lg.jp/kurashi_guide/shogaigakushu_koza/rekishikan/index.html + css_selector: '#tlogo > p > a > img' + retrieved_on: '2025-12-25T18:22:02.260288+00:00' + extraction_method: crawl4ai_header_logo + detection_confidence: high + alt_text: 武蔵野市 + - claim_type: favicon_url + claim_value: http://www.city.musashino.lg.jp/kurashi_guide/_template_/_site_/_default_/_res/images/apple-touch-icon-precomposed.png + source_url: http://www.city.musashino.lg.jp/kurashi_guide/shogaigakushu_koza/rekishikan/index.html + css_selector: '[document] > html > head > link:nth-of-type(8)' + retrieved_on: '2025-12-25T18:22:02.260288+00:00' + extraction_method: crawl4ai_link_rel + favicon_type: '' + favicon_sizes: '' + - claim_type: og_image_url + claim_value: https://www.city.musashino.lg.jp/_template_/_site_/_default_/_res/images/sns/ogimage.png + source_url: http://www.city.musashino.lg.jp/kurashi_guide/shogaigakushu_koza/rekishikan/index.html + css_selector: '[document] > html > head > meta:nth-of-type(11)' + retrieved_on: '2025-12-25T18:22:02.260288+00:00' + extraction_method: crawl4ai_meta_og + summary: + total_claims: 3 + has_primary_logo: true + has_favicon: true + has_og_image: true + favicon_count: 2 diff --git a/data/custodian/JP-13-MUS-L-AUL.yaml b/data/custodian/JP-13-MUS-L-AUL.yaml index 6b57122f48..aaade88c6d 100644 --- a/data/custodian/JP-13-MUS-L-AUL.yaml +++ b/data/custodian/JP-13-MUS-L-AUL.yaml @@ -37,13 +37,14 @@ ghcid: method: CH_ANNOTATOR_SOURCE ghcid_history: - ghcid: JP-13-MUS-L-AUL - valid_from: "2025-12-10T09:44:08Z" + valid_from: '2025-12-10T09:44:08Z' valid_to: null - reason: "Corrected region code from JP-TO (abbreviation) to JP-13 (Tokyo) per ISO 3166-2:JP" + reason: Corrected region code from JP-TO (abbreviation) to JP-13 (Tokyo) per ISO + 3166-2:JP - ghcid: JP-TO-MUS-L-AUL valid_from: null - valid_to: "2025-12-10T09:44:08Z" - reason: "Previous GHCID with incorrect region code" + valid_to: '2025-12-10T09:44:08Z' + reason: Previous GHCID with incorrect region code - ghcid: JP-TO-MUS-L-AUL ghcid_numeric: 15628027425931961964 valid_from: '2025-12-06T23:38:54.824151+00:00' @@ -101,8 +102,8 @@ ch_annotator: annotation_metadata: confidence_score: 0.98 verified: false - verification_date: - verified_by: + verification_date: null + verified_by: null entity_claims: - claim_type: full_name claim_value: Asia University Library @@ -193,7 +194,8 @@ wikidata_enrichment: description: organisatie uit Japan - id: Q56056912 label: Japan Consortium for Open Access Repository - description: promotes open access and open science in Japan with knowledge dissemination via digital repositories + description: promotes open access and open science in Japan with knowledge dissemination + via digital repositories wikidata_web: official_website: http://www.asia-u.ac.jp/library/ wikidata_official_website: http://www.asia-u.ac.jp/library/ @@ -215,3 +217,28 @@ location: geonames_id: 1856367 geonames_name: Musashino feature_code: PPLA2 +logo_enrichment: + enrichment_timestamp: '2025-12-25T18:22:12.077071+00:00' + source_url: https://www.asia-u.ac.jp/library + extraction_method: crawl4ai + claims: + - claim_type: favicon_url + claim_value: https://www.asia-u.ac.jp/apple-touch-icon.png + source_url: https://www.asia-u.ac.jp/library + css_selector: '[document] > html > head > link:nth-of-type(5)' + retrieved_on: '2025-12-25T18:22:12.077071+00:00' + extraction_method: crawl4ai_link_rel + favicon_type: '' + favicon_sizes: '' + - claim_type: og_image_url + claim_value: https://www.asia-u.ac.jp/ogp.png + source_url: https://www.asia-u.ac.jp/library + css_selector: '[document] > html > head > meta:nth-of-type(7)' + retrieved_on: '2025-12-25T18:22:12.077071+00:00' + extraction_method: crawl4ai_meta_og + summary: + total_claims: 2 + has_primary_logo: false + has_favicon: true + has_og_image: true + favicon_count: 3 diff --git a/data/custodian/JP-13-MUS-L-CAPSSU.yaml b/data/custodian/JP-13-MUS-L-CAPSSU.yaml index 502e8cf9a4..f189e8da86 100644 --- a/data/custodian/JP-13-MUS-L-CAPSSU.yaml +++ b/data/custodian/JP-13-MUS-L-CAPSSU.yaml @@ -37,13 +37,14 @@ ghcid: method: CH_ANNOTATOR_SOURCE ghcid_history: - ghcid: JP-13-MUS-L-CAPSSU - valid_from: "2025-12-10T09:44:08Z" + valid_from: '2025-12-10T09:44:08Z' valid_to: null - reason: "Corrected region code from JP-TO (abbreviation) to JP-13 (Tokyo) per ISO 3166-2:JP" + reason: Corrected region code from JP-TO (abbreviation) to JP-13 (Tokyo) per ISO + 3166-2:JP - ghcid: JP-TO-MUS-L-CAPSSU valid_from: null - valid_to: "2025-12-10T09:44:08Z" - reason: "Previous GHCID with incorrect region code" + valid_to: '2025-12-10T09:44:08Z' + reason: Previous GHCID with incorrect region code - ghcid: JP-TO-MUS-L-CAPSSU ghcid_numeric: 17064315705967605663 valid_from: '2025-12-06T23:38:58.811104+00:00' @@ -101,8 +102,8 @@ ch_annotator: annotation_metadata: confidence_score: 0.98 verified: false - verification_date: - verified_by: + verification_date: null + verified_by: null entity_claims: - claim_type: full_name claim_value: Center for Asian and Pacific Studies, Seikei University @@ -204,3 +205,22 @@ location: geonames_id: 1856367 geonames_name: Musashino feature_code: PPLA2 +logo_enrichment: + enrichment_timestamp: '2025-12-25T18:22:20.601307+00:00' + source_url: http://www.seikei.ac.jp/university/caps/index.html + extraction_method: crawl4ai + claims: + - claim_type: favicon_url + claim_value: http://www.seikei.ac.jp/university/favicon.ico + source_url: http://www.seikei.ac.jp/university/caps/index.html + css_selector: '[document] > html.ua-chrome.ua-chrome-135 > head > link:nth-of-type(7)' + retrieved_on: '2025-12-25T18:22:20.601307+00:00' + extraction_method: crawl4ai_link_rel + favicon_type: image/x-icon + favicon_sizes: '' + summary: + total_claims: 1 + has_primary_logo: false + has_favicon: true + has_og_image: false + favicon_count: 1 diff --git a/data/custodian/JP-13-MUS-L-ML-musashimurayamashiritsumitsugichiku_library.yaml b/data/custodian/JP-13-MUS-L-ML-musashimurayamashiritsumitsugichiku_library.yaml index d64bf6bcb3..689f0efc3a 100644 --- a/data/custodian/JP-13-MUS-L-ML-musashimurayamashiritsumitsugichiku_library.yaml +++ b/data/custodian/JP-13-MUS-L-ML-musashimurayamashiritsumitsugichiku_library.yaml @@ -32,13 +32,14 @@ ghcid: method: CH_ANNOTATOR_SOURCE ghcid_history: - ghcid: JP-13-MUS-L-ML-musashimurayamashiritsumitsugichiku_library - valid_from: "2025-12-10T09:44:08Z" + valid_from: '2025-12-10T09:44:08Z' valid_to: null - reason: "Corrected region code from JP-TO (abbreviation) to JP-13 (Tokyo) per ISO 3166-2:JP" + reason: Corrected region code from JP-TO (abbreviation) to JP-13 (Tokyo) per ISO + 3166-2:JP - ghcid: JP-TO-MUS-L-ML-musashimurayamashiritsumitsugichiku_library valid_from: null - valid_to: "2025-12-10T09:44:08Z" - reason: "Previous GHCID with incorrect region code" + valid_to: '2025-12-10T09:44:08Z' + reason: Previous GHCID with incorrect region code - ghcid: JP-TO-MUS-L-ML-musashimurayamashiritsumitsugichiku_library ghcid_numeric: 7833834124575383779 valid_from: '2025-12-06T23:38:43.910291+00:00' @@ -96,8 +97,8 @@ ch_annotator: annotation_metadata: confidence_score: 0.98 verified: false - verification_date: - verified_by: + verification_date: null + verified_by: null entity_claims: - claim_type: full_name claim_value: MUSASHIMURAYAMASHIRITSUMITSUGICHIKU Library @@ -151,3 +152,22 @@ location: geonames_id: 6822130 geonames_name: Musashimurayama feature_code: PPLA2 +logo_enrichment: + enrichment_timestamp: '2025-12-25T18:22:33.194656+00:00' + source_url: https://www.library.musashimurayama.tokyo.jp + extraction_method: crawl4ai + claims: + - claim_type: favicon_url + claim_value: https://www.library.musashimurayama.tokyo.jp/img/favicon.ico + source_url: https://www.library.musashimurayama.tokyo.jp + css_selector: '[document] > html > head > link:nth-of-type(4)' + retrieved_on: '2025-12-25T18:22:33.194656+00:00' + extraction_method: crawl4ai_link_rel + favicon_type: '' + favicon_sizes: '' + summary: + total_claims: 1 + has_primary_logo: false + has_favicon: true + has_og_image: false + favicon_count: 2 diff --git a/data/custodian/JP-13-MUS-L-ML-musashimurayamashiritsunakakubo_library.yaml b/data/custodian/JP-13-MUS-L-ML-musashimurayamashiritsunakakubo_library.yaml index b1c666a1c6..1dca9e138e 100644 --- a/data/custodian/JP-13-MUS-L-ML-musashimurayamashiritsunakakubo_library.yaml +++ b/data/custodian/JP-13-MUS-L-ML-musashimurayamashiritsunakakubo_library.yaml @@ -152,3 +152,22 @@ location: geonames_id: 6822130 geonames_name: Musashimurayama feature_code: PPLA2 +logo_enrichment: + enrichment_timestamp: '2025-12-25T18:22:42.908373+00:00' + source_url: https://www.library.musashimurayama.tokyo.jp + extraction_method: crawl4ai + claims: + - claim_type: favicon_url + claim_value: https://www.library.musashimurayama.tokyo.jp/img/favicon.ico + source_url: https://www.library.musashimurayama.tokyo.jp + css_selector: '[document] > html > head > link:nth-of-type(4)' + retrieved_on: '2025-12-25T18:22:42.908373+00:00' + extraction_method: crawl4ai_link_rel + favicon_type: '' + favicon_sizes: '' + summary: + total_claims: 1 + has_primary_logo: false + has_favicon: true + has_og_image: false + favicon_count: 2 diff --git a/data/custodian/JP-13-MUS-L-ML-musashimurayamashiritsunakatochiku_library.yaml b/data/custodian/JP-13-MUS-L-ML-musashimurayamashiritsunakatochiku_library.yaml index 88ab163bbf..0e9b1da1cd 100644 --- a/data/custodian/JP-13-MUS-L-ML-musashimurayamashiritsunakatochiku_library.yaml +++ b/data/custodian/JP-13-MUS-L-ML-musashimurayamashiritsunakatochiku_library.yaml @@ -152,3 +152,22 @@ location: geonames_id: 6822130 geonames_name: Musashimurayama feature_code: PPLA2 +logo_enrichment: + enrichment_timestamp: '2025-12-25T18:22:50.645194+00:00' + source_url: https://www.library.musashimurayama.tokyo.jp + extraction_method: crawl4ai + claims: + - claim_type: favicon_url + claim_value: https://www.library.musashimurayama.tokyo.jp/img/favicon.ico + source_url: https://www.library.musashimurayama.tokyo.jp + css_selector: '[document] > html > head > link:nth-of-type(4)' + retrieved_on: '2025-12-25T18:22:50.645194+00:00' + extraction_method: crawl4ai_link_rel + favicon_type: '' + favicon_sizes: '' + summary: + total_claims: 1 + has_primary_logo: false + has_favicon: true + has_og_image: false + favicon_count: 2 diff --git a/data/custodian/JP-13-MUS-L-ML-musashimurayamashiritsuominamichiku_library.yaml b/data/custodian/JP-13-MUS-L-ML-musashimurayamashiritsuominamichiku_library.yaml index 3da9422fd9..df22ce020b 100644 --- a/data/custodian/JP-13-MUS-L-ML-musashimurayamashiritsuominamichiku_library.yaml +++ b/data/custodian/JP-13-MUS-L-ML-musashimurayamashiritsuominamichiku_library.yaml @@ -152,3 +152,22 @@ location: geonames_id: 6822130 geonames_name: Musashimurayama feature_code: PPLA2 +logo_enrichment: + enrichment_timestamp: '2025-12-25T18:22:58.185838+00:00' + source_url: https://www.library.musashimurayama.tokyo.jp + extraction_method: crawl4ai + claims: + - claim_type: favicon_url + claim_value: https://www.library.musashimurayama.tokyo.jp/img/favicon.ico + source_url: https://www.library.musashimurayama.tokyo.jp + css_selector: '[document] > html > head > link:nth-of-type(4)' + retrieved_on: '2025-12-25T18:22:58.185838+00:00' + extraction_method: crawl4ai_link_rel + favicon_type: '' + favicon_sizes: '' + summary: + total_claims: 1 + has_primary_logo: false + has_favicon: true + has_og_image: false + favicon_count: 2 diff --git a/data/custodian/JP-13-MUS-L-ML-musashimurayamashiritsuraizuka_library.yaml b/data/custodian/JP-13-MUS-L-ML-musashimurayamashiritsuraizuka_library.yaml index 3e9ee430df..d23ee77aff 100644 --- a/data/custodian/JP-13-MUS-L-ML-musashimurayamashiritsuraizuka_library.yaml +++ b/data/custodian/JP-13-MUS-L-ML-musashimurayamashiritsuraizuka_library.yaml @@ -32,13 +32,14 @@ ghcid: method: CH_ANNOTATOR_SOURCE ghcid_history: - ghcid: JP-13-MUS-L-ML-musashimurayamashiritsuraizuka_library - valid_from: "2025-12-10T09:44:08Z" + valid_from: '2025-12-10T09:44:08Z' valid_to: null - reason: "Corrected region code from JP-TO (abbreviation) to JP-13 (Tokyo) per ISO 3166-2:JP" + reason: Corrected region code from JP-TO (abbreviation) to JP-13 (Tokyo) per ISO + 3166-2:JP - ghcid: JP-TO-MUS-L-ML-musashimurayamashiritsuraizuka_library valid_from: null - valid_to: "2025-12-10T09:44:08Z" - reason: "Previous GHCID with incorrect region code" + valid_to: '2025-12-10T09:44:08Z' + reason: Previous GHCID with incorrect region code - ghcid: JP-TO-MUS-L-ML-musashimurayamashiritsuraizuka_library ghcid_numeric: 14333679254499910448 valid_from: '2025-12-06T23:38:43.903363+00:00' @@ -96,8 +97,8 @@ ch_annotator: annotation_metadata: confidence_score: 0.98 verified: false - verification_date: - verified_by: + verification_date: null + verified_by: null entity_claims: - claim_type: full_name claim_value: MUSASHIMURAYAMASHIRITSURAIZUKA Library @@ -151,3 +152,22 @@ location: geonames_id: 6822130 geonames_name: Musashimurayama feature_code: PPLA2 +logo_enrichment: + enrichment_timestamp: '2025-12-25T18:23:04.374419+00:00' + source_url: https://www.library.musashimurayama.tokyo.jp + extraction_method: crawl4ai + claims: + - claim_type: favicon_url + claim_value: https://www.library.musashimurayama.tokyo.jp/img/favicon.ico + source_url: https://www.library.musashimurayama.tokyo.jp + css_selector: '[document] > html > head > link:nth-of-type(4)' + retrieved_on: '2025-12-25T18:23:04.374419+00:00' + extraction_method: crawl4ai_link_rel + favicon_type: '' + favicon_sizes: '' + summary: + total_claims: 1 + has_primary_logo: false + has_favicon: true + has_og_image: false + favicon_count: 2 diff --git a/data/custodian/JP-13-MUS-L-ML-musashimurayamashiritsuzamboriinadairachiku_librar.yaml b/data/custodian/JP-13-MUS-L-ML-musashimurayamashiritsuzamboriinadairachiku_librar.yaml index 198c303a23..a2ab6bdcbc 100644 --- a/data/custodian/JP-13-MUS-L-ML-musashimurayamashiritsuzamboriinadairachiku_librar.yaml +++ b/data/custodian/JP-13-MUS-L-ML-musashimurayamashiritsuzamboriinadairachiku_librar.yaml @@ -32,13 +32,14 @@ ghcid: method: CH_ANNOTATOR_SOURCE ghcid_history: - ghcid: JP-13-MUS-L-ML-musashimurayamashiritsuzamboriinadairachiku_librar - valid_from: "2025-12-10T09:44:08Z" + valid_from: '2025-12-10T09:44:08Z' valid_to: null - reason: "Corrected region code from JP-TO (abbreviation) to JP-13 (Tokyo) per ISO 3166-2:JP" + reason: Corrected region code from JP-TO (abbreviation) to JP-13 (Tokyo) per ISO + 3166-2:JP - ghcid: JP-TO-MUS-L-ML-musashimurayamashiritsuzamboriinadairachiku_librar valid_from: null - valid_to: "2025-12-10T09:44:08Z" - reason: "Previous GHCID with incorrect region code" + valid_to: '2025-12-10T09:44:08Z' + reason: Previous GHCID with incorrect region code - ghcid: JP-TO-MUS-L-ML-musashimurayamashiritsuzamboriinadairachiku_librar ghcid_numeric: 12588404130414037218 valid_from: '2025-12-06T23:38:43.914895+00:00' @@ -96,8 +97,8 @@ ch_annotator: annotation_metadata: confidence_score: 0.98 verified: false - verification_date: - verified_by: + verification_date: null + verified_by: null entity_claims: - claim_type: full_name claim_value: MUSASHIMURAYAMASHIRITSUZAMBORIINADAIRACHIKU Library @@ -151,3 +152,22 @@ location: geonames_id: 6822130 geonames_name: Musashimurayama feature_code: PPLA2 +logo_enrichment: + enrichment_timestamp: '2025-12-25T18:23:11.164401+00:00' + source_url: https://www.library.musashimurayama.tokyo.jp + extraction_method: crawl4ai + claims: + - claim_type: favicon_url + claim_value: https://www.library.musashimurayama.tokyo.jp/img/favicon.ico + source_url: https://www.library.musashimurayama.tokyo.jp + css_selector: '[document] > html > head > link:nth-of-type(4)' + retrieved_on: '2025-12-25T18:23:11.164401+00:00' + extraction_method: crawl4ai_link_rel + favicon_type: '' + favicon_sizes: '' + summary: + total_claims: 1 + has_primary_logo: false + has_favicon: true + has_og_image: false + favicon_count: 2