- Added logo_enrichment to 771 Czech custodian files - 87% logo hit rate using crawl4ai favicon extraction - Total checkpoint: 9,257 files across all countries - CZ remaining: 6,642 files
223 lines
7.6 KiB
YAML
223 lines
7.6 KiB
YAML
original_entry:
|
|
name: Libri Prohibiti
|
|
source: UNESCO Memory of the World (via Wikidata)
|
|
wikidata_id: Q630847
|
|
mow_inscriptions:
|
|
- wikidata_id: Q28028233
|
|
name: 'Libri Prohibiti: Collection of periodicals of Czech and Slovak Samizdat
|
|
in the years 1948-1989'
|
|
country: Czech Republic
|
|
processing_timestamp: '2025-12-06T20:58:52.885193+00:00'
|
|
wikidata_enrichment:
|
|
wikidata_entity_id: Q630847
|
|
api_metadata:
|
|
api_endpoint: https://www.wikidata.org/w/rest.php/wikibase/v1
|
|
fetch_timestamp: '2025-12-08T23:41:32.140045+00:00'
|
|
user_agent: GLAMDataExtractor/1.1 (glam-data@example.com) Python/httpx
|
|
enrichment_version: 2.0_full
|
|
properties_found:
|
|
- P373
|
|
- P18
|
|
- P31
|
|
- P17
|
|
- P856
|
|
- P571
|
|
- P2427
|
|
- P159
|
|
- P6782
|
|
- P276
|
|
- P968
|
|
- P2013
|
|
wikidata_labels:
|
|
cs: Libri prohibiti
|
|
en: Libri Prohibiti
|
|
es: Libri Prohibiti
|
|
pl: Libri Prohibiti
|
|
ja: リブリ・プロハイビティ
|
|
la: Libri Prohibiti
|
|
ru: Libri prohibiti
|
|
de: Libri prohibiti
|
|
fr: Libri prohibiti
|
|
sk: Libri prohibiti
|
|
sl: Libri prohibiti
|
|
sr: Libri Prohibiti
|
|
wikidata_label_en: Libri Prohibiti
|
|
wikidata_label_ja: リブリ・プロハイビティ
|
|
wikidata_label_de: Libri prohibiti
|
|
wikidata_label_fr: Libri prohibiti
|
|
wikidata_label_es: Libri Prohibiti
|
|
wikidata_descriptions:
|
|
nl: bibliotheek in Tsjechië
|
|
he: ספרייה בצ'כיה
|
|
ko: 도서관
|
|
de: Bibliothek in Prag
|
|
ru: библиотека
|
|
ar: مكتبة
|
|
fr: bibliothèque
|
|
ja: 図書館
|
|
tg: китобхона
|
|
zh: 图书馆
|
|
en: Czech library
|
|
bg: библиотека
|
|
ky: китепкана
|
|
br: levraoueg Republik Tchek
|
|
cs: knihovna československé exilové a samizdatové literatury
|
|
sl: knjižnica izgnanske in samoizdane literature v Pragi (Češka)
|
|
sr: Češka biblioteka
|
|
wikidata_description_en: Czech library
|
|
wikidata_aliases:
|
|
en:
|
|
- Society of Libri Prohibiti
|
|
cs:
|
|
- Společnost Libri prohibiti
|
|
wikidata_sitelinks:
|
|
commonswiki: Category:Libri prohibiti
|
|
enwiki: Libri Prohibiti
|
|
plwiki: Libri Prohibiti
|
|
cswiki: Libri prohibiti
|
|
lawiki: Libri Prohibiti
|
|
ruwiki: Libri prohibiti
|
|
wikidata_temporal:
|
|
inception: '1990-10-22'
|
|
wikidata_inception: '1990-10-22'
|
|
wikidata_classification:
|
|
instance_of: &id001
|
|
- id: Q7075
|
|
label: library
|
|
description: institution charged with the care of a collection of literary,
|
|
musical, artistic, or reference materials, such as books, manuscripts, recordings,
|
|
or films
|
|
wikidata_instance_of: *id001
|
|
wikidata_location:
|
|
country: &id003
|
|
id: Q213
|
|
label: Czech Republic
|
|
description: country in Central Europe
|
|
headquarters_location: &id002
|
|
id: Q1085
|
|
label: Prague
|
|
description: capital city of the Czech Republic
|
|
location: *id002
|
|
wikidata_country: *id003
|
|
wikidata_web:
|
|
official_website: &id004
|
|
- http://libpro.cts.cuni.cz/EN/index_en.html
|
|
- https://www.libpro.cz/
|
|
wikidata_official_website: *id004
|
|
wikidata_social_media:
|
|
facebook_id: '100064434712083'
|
|
wikidata_media:
|
|
commons_category: Libri prohibiti
|
|
image: Libri prohibiti 02.JPG
|
|
wikidata_image: Libri prohibiti 02.JPG
|
|
wikidata_contact:
|
|
email: mailto:knihovna@libpro.cz
|
|
ghcid:
|
|
ghcid_current: CZ-10-PRA-L-LP
|
|
ghcid_original: CZ-XX-XXX-L-LP
|
|
ghcid_uuid: 11f4512b-d39e-5358-aa4a-69d50c9812fe
|
|
ghcid_uuid_sha256: 2fe14b64-2f15-88da-b65e-487c793281a4
|
|
ghcid_numeric: 3450121683201280218
|
|
record_id: 6edc4c11-b2e0-4b48-b786-362cfff99c57
|
|
generation_timestamp: '2025-12-06T20:58:52.885193+00:00'
|
|
ghcid_history:
|
|
- ghcid: CZ-XX-XXX-L-LP
|
|
ghcid_numeric: 3450121683201280218
|
|
valid_from: '2025-12-06T20:58:52.885193+00:00'
|
|
reason: Initial GHCID from UNESCO MoW Wikidata data (Dec 2025)
|
|
- ghcid: CZ-10-XXX-L-LP
|
|
valid_from: '2025-12-06T23:34:20.117144+00:00'
|
|
reason: 'Region resolved via Wikidata P131: XX->10 (CZ-10)'
|
|
- ghcid: CZ-10-PRA-L-LP
|
|
valid_from: '2025-12-07T00:31:30.622091+00:00'
|
|
reason: 'City resolved via Wikidata Q630847 coordinates: XXX->PRA (Prague)'
|
|
location_resolution:
|
|
method: WIKIDATA_COORDS_REVERSE_GEOCODE
|
|
country_code: CZ
|
|
country_label: Czech Republic
|
|
region_code: '10'
|
|
city_code: PRA
|
|
city_label: Prague
|
|
region_name: CZ-10
|
|
iso_code_source: CZ-10
|
|
resolution_timestamp: '2025-12-07T00:31:30.622068+00:00'
|
|
geonames_id: 3067696
|
|
custodian_name:
|
|
claim_type: custodian_name
|
|
claim_value: Libri Prohibiti
|
|
source_type: wikidata
|
|
emic_name: Libri prohibiti
|
|
name_language: cs
|
|
standardized_name: Libri prohibiti
|
|
alternative_names:
|
|
- name: Libri Prohibiti
|
|
language: en
|
|
source: wikidata
|
|
unesco_mow_enrichment:
|
|
is_mow_custodian: true
|
|
inscription_count: 1
|
|
inscriptions:
|
|
- wikidata_id: Q28028233
|
|
name: 'Libri Prohibiti: Collection of periodicals of Czech and Slovak Samizdat
|
|
in the years 1948-1989'
|
|
inscription_country: Czech Republic
|
|
enrichment_timestamp: '2025-12-06T20:58:52.885193+00:00'
|
|
data_source: Wikidata SPARQL (UNESCO has no MoW API)
|
|
provenance:
|
|
notes:
|
|
- 'Region resolved 2025-12-06T23:34:20Z: XX->10 via Wikidata P131 (CZ-10)'
|
|
- 'City resolved 2025-12-07T00:31:30Z: XXX->PRA via Wikidata Q630847 coords (50.0875,14.4214)
|
|
-> Prague (GeoNames:3067696)'
|
|
- Canonical location added via normalize_custodian_files.py on 2025-12-08T23:48:06Z
|
|
- Canonical location added via normalize_custodian_files.py on 2025-12-09T06:49:30Z
|
|
- 'YouTube/Google Maps enrichment 2025-12-09T09:28:43Z: YouTube: not found'
|
|
location:
|
|
region: CZ-10
|
|
region_code: '10'
|
|
country: CZ
|
|
geonames_id: 3067696
|
|
normalization_timestamp: '2025-12-09T15:34:41.816238+00:00'
|
|
latitude: 50.08804
|
|
longitude: 14.42076
|
|
coordinate_provenance:
|
|
source_type: GEONAMES_LOCAL
|
|
source_path: data/reference/geonames.db
|
|
entity_id: 3067696
|
|
original_timestamp: '2025-12-09T15:34:41.816190+00:00'
|
|
geonames_name: Prague
|
|
feature_code: PPLC
|
|
youtube_status: NOT_FOUND
|
|
youtube_search_query: Libri Prohibiti official
|
|
youtube_search_timestamp: '2025-12-09T09:28:43.266340+00:00'
|
|
logo_enrichment:
|
|
enrichment_timestamp: '2025-12-23T21:14:54.320147+00:00'
|
|
source_url: http://libpro.cts.cuni.cz/EN/index_en.html
|
|
extraction_method: crawl4ai
|
|
claims:
|
|
- claim_type: logo_url
|
|
claim_value: https://cdn.libpro.cz/content/uploads/2019/06/logo.png
|
|
source_url: http://libpro.cts.cuni.cz/EN/index_en.html
|
|
css_selector: '#masthead > div.elementor.elementor-2793 > section.elementor-section.elementor-top-section
|
|
> div.elementor-container.elementor-column-gap-no > div.elementor-column.elementor-col-100
|
|
> div.elementor-widget-wrap.elementor-element-populated > section.elementor-section.elementor-inner-section:nth-of-type(2)
|
|
> div.elementor-container.elementor-column-gap-no > div.elementor-column.elementor-col-50
|
|
> div.elementor-widget-wrap.elementor-element-populated > div.elementor-element.elementor-element-bb2711e
|
|
> div.elementor-widget-container > a > noscript > img.attachment-large.size-large'
|
|
retrieved_on: '2025-12-23T21:14:54.320147+00:00'
|
|
extraction_method: crawl4ai_header_logo
|
|
detection_confidence: high
|
|
alt_text: ''
|
|
- claim_type: favicon_url
|
|
claim_value: https://cdn.libpro.cz/content/uploads/2019/06/favicon.ico
|
|
source_url: http://libpro.cts.cuni.cz/EN/index_en.html
|
|
css_selector: '[document] > html > head > link:nth-of-type(18)'
|
|
retrieved_on: '2025-12-23T21:14:54.320147+00:00'
|
|
extraction_method: crawl4ai_link_rel
|
|
favicon_type: ''
|
|
favicon_sizes: 32x32
|
|
summary:
|
|
total_claims: 2
|
|
has_primary_logo: true
|
|
has_favicon: true
|
|
has_og_image: false
|
|
favicon_count: 1
|