glam/data/custodian.backup.20251230/CZ-10-PRA-A-NA.yaml
2025-12-30 23:07:03 +01:00

451 lines
19 KiB
YAML
Raw Permalink Blame History

This file contains invisible Unicode characters

This file contains invisible Unicode characters that are indistinguishable to humans but may be processed differently by a computer. If you think that this is intentional, you can safely ignore this warning. Use the Escape button to reveal them.

This file contains Unicode characters that might be confused with other characters. If you think that this is intentional, you can safely ignore this warning. Use the Escape button to reveal them.

original_entry:
name: Národní archiv
institution_type: ARCHIVE
source: CH-Annotator (czech_unified_ch_annotator.yaml)
identifiers:
- &id001
identifier_scheme: ARON_UUID
identifier_value: 7ac8c281-6c44-44b2-9e00-3a16d557f830
identifier_url: https://portal.nacr.cz/aron/apu/7ac8c281-6c44-44b2-9e00-3a16d557f830
- &id002
identifier_scheme: INSTITUTION_CODE
identifier_value: '100000010'
- &id003
identifier_scheme: Wikidata
identifier_value: Q6970414
identifier_url: https://www.wikidata.org/wiki/Q6970414
- &id004
identifier_scheme: VIAF
identifier_value: '173002833'
identifier_url: https://viaf.org/viaf/173002833
locations: []
processing_timestamp: '2025-12-06T23:37:44.336818+00:00'
ghcid:
ghcid_current: CZ-10-PRA-A-NA
ghcid_original: XX-XX-XXX-A-NA
ghcid_uuid: f76b040b-1c4e-5272-bbce-8e8b30dd07ec
ghcid_uuid_sha256: b4db8d8b-b904-8e95-b3bc-a699011f29ca
ghcid_numeric: 13032165577970732693
record_id: ae69bd49-a485-4bff-9189-4ad083fad27c
generation_timestamp: '2025-12-06T23:37:44.336818+00:00'
location_resolution:
country_code: CZ
region_code: 10
city_code: PRA
method: WIKIDATA_LOCATION_RESEARCH
resolution_timestamp: '2025-12-06T23:54:39.506378+00:00'
resolution_notes: National Archives in Prague, confirmed via Wikidata P131
ghcid_history:
- ghcid: XX-XX-XXX-A-NA
ghcid_numeric: 13032165577970732693
valid_from: '2025-12-06T23:37:44.336818+00:00'
reason: Initial GHCID from CH-Annotator (czech_unified_ch_annotator.yaml)
- ghcid: CZ-XX-XXX-A-NA
valid_from: '2025-12-06T23:54:39.506383+00:00'
reason: 'Country resolved via Wikidata P17: XX→CZ'
- ghcid: CZ-10-PRA-A-NA
valid_from: '2025-12-07T12:36:58.331408+00:00'
reason: 'Location resolved via Wikidata research: Prague, region 10'
custodian_name:
claim_type: custodian_name
claim_value: Národní archiv
source_type: ch_annotator
identifiers:
- identifier_scheme: GHCID
identifier_value: XX-XX-XXX-A-NA
- identifier_scheme: GHCID_UUID
identifier_value: f76b040b-1c4e-5272-bbce-8e8b30dd07ec
- identifier_scheme: GHCID_UUID_SHA256
identifier_value: b4db8d8b-b904-8e95-b3bc-a699011f29ca
- identifier_scheme: GHCID_NUMERIC
identifier_value: '13032165577970732693'
- identifier_scheme: RECORD_ID
identifier_value: ae69bd49-a485-4bff-9189-4ad083fad27c
- *id001
- *id002
- *id003
- *id004
provenance:
data_source: API_SCRAPING
data_tier: TIER_1_AUTHORITATIVE
extraction_date: '2025-11-19T11:35:45.744536+00:00'
extraction_method: 'Created from CH-Annotator file: czech_unified_ch_annotator.yaml'
confidence_score: 0.85
notes:
- 'Country resolved 2025-12-06T23:54:39Z: XX→CZ via Wikidata P17'
- 'YouTube/Google Maps enrichment 2025-12-08T19:47:31Z: Maps: National Archives of the Czech Republic (conf: 1.00); YouTube: not found'
- Canonical location added via normalize_custodian_files.py on 2025-12-08T23:48:04Z
- Canonical location added via normalize_custodian_files.py on 2025-12-09T06:49:28Z
schema_version: 2.0.0
enrichment_provenance:
wikidata_enrichment:
content_hash: sha256-UC08pEIX/vl43uf1KbjHBK5eIiDQxqspgQ1scbE3LFY=
verified_at: '2025-12-28T19:58:21.538924+00:00'
wasDerivedFrom: https://www.wikidata.org/wiki/Q6970414
google_maps_enrichment:
content_hash: sha256-yqqNTooF0NoG/Wv8muZIG9QfMBYXF/WqgY5Ml+js3sc=
verified_at: '2025-12-28T19:58:21.539026+00:00'
provenance_schema_version: '2.0'
standards_compliance:
- W3C PROV-O
- W3C SRI (content hashes)
generated_at: '2025-12-28T19:58:21.539038+00:00'
ch_annotator:
convention_id: ch_annotator-v1_7_0
convention_version: 1.7.0
entity_classification:
hypernym: GRP
hypernym_label: GROUP
subtype: GRP.HER.ARC
subtype_label: ARCHIVE
ontology_class: schema:ArchiveOrganization
alternative_classes:
- org:FormalOrganization
- rov:RegisteredOrganization
- glam:HeritageCustodian
extraction_provenance:
namespace: glam
path: /files/czech_unified.yaml
timestamp: '2025-11-19T11:35:45.744536+00:00'
agent: claude-conversation
context_convention: ch_annotator-v1_7_0
annotation_provenance:
annotation_agent: opencode-claude-sonnet-4
annotation_date: '2025-12-06T21:12:32.389491+00:00'
annotation_method: retroactive CH-Annotator application via batch script
source_file: czech_unified.yaml
annotation_metadata:
confidence_score: 0.85
verified: false
verification_date:
verified_by:
entity_claims:
- claim_type: full_name
claim_value: Národní archiv
property_uri: skos:prefLabel
provenance:
namespace: glam
path: /files/czech_unified.yaml
timestamp: '2025-11-19T11:35:45.744536+00:00'
agent: claude-conversation
context_convention: ch_annotator-v1_7_0
confidence: 0.85
- claim_type: institution_type
claim_value: ARCHIVE
property_uri: rdf:type
provenance:
namespace: glam
path: /files/czech_unified.yaml
timestamp: '2025-11-19T11:35:45.744536+00:00'
agent: claude-conversation
context_convention: ch_annotator-v1_7_0
confidence: 0.95
- claim_type: wikidata_id
claim_value: Q6970414
property_uri: owl:sameAs
provenance:
namespace: wikidata
path: /entity/Q6970414
timestamp: '2025-11-19T11:35:45.744536+00:00'
agent: claude-conversation
context_convention: ch_annotator-v1_7_0
confidence: 0.98
integration_note:
created_from: czech_unified_ch_annotator.yaml
creation_date: '2025-12-06T23:37:44.336818+00:00'
creation_method: create_custodian_from_ch_annotator.py
wikidata_enrichment:
wikidata_entity_id: Q6970414
api_metadata:
api_endpoint: https://www.wikidata.org/w/rest.php/wikibase/v1
fetch_timestamp: '2025-12-08T23:41:25.621828+00:00'
user_agent: GLAMDataExtractor/1.1 (glam-data@example.com) Python/httpx
enrichment_version: 2.0_full
properties_found:
- P373
- P18
- P31
- P214
- P227
- P244
- P213
- P17
- P856
- P2427
- P1436
- P159
- P6782
- P571
- P968
- P1329
- P131
- P276
- P268
- P269
- P463
- P2002
- P2013
- P2003
wikidata_labels:
cs: Národní archiv
en: National Archives
uk: Народний архів Чехії
zh: 國家檔案館
it: Archivi Nazionali
fr: Archives Nationales
hu: Cseh Nemzeti Levéltár
tt: Чехия милли архивлары
mul: Národní archiv
de: Národní archiv
wikidata_label_en: National Archives
wikidata_label_de: Národní archiv
wikidata_label_fr: Archives Nationales
wikidata_descriptions:
en: national archives of the Czech Republic
cs: národní archiv České republiky
ko: 도서관
ar: مكتبة في براغ، التشيك
it: archivi nazionali della Repubblica Ceca
fr: archives nationales de la République Tchèque
hu: Csehország (korábban Csehszlovákia) nemzeti levéltára Prágában
de: Tschechisches Nationalarchiv
wikidata_description_en: national archives of the Czech Republic
wikidata_aliases:
cs:
- NAČR
- SÚA
- Národní archiv České republiky
- NA
en:
- National Archives of the Czech Republic
- nacr.cz
it:
- Archivi nazionali della Repubblica Ceca
fr:
- Archives nationales de la République Tchèque
de:
- NA
- NAČR
wikidata_sitelinks:
cswiki: Národní archiv
enwiki: National Archives (Czech Republic)
ukwiki: Національний архів Чехії
wikidata_temporal:
inception: '1954-00-00'
wikidata_inception: '1954-00-00'
wikidata_classification:
instance_of: &id005
- id: Q2122214
label: national archives
description: archives of a country
- id: Q7075
label: library
description: institution charged with the care of a collection of literary, musical, artistic, or reference materials, such as books, manuscripts, recordings, or films
- id: Q27031009
label: public archive
description: repository for official documents
- id: Q108935461
label: Czech research institution
description: type of Czech research organization
- id: Q2085381
label: publishing company
description: company that prints and distributes pressed goods or electronic media
wikidata_instance_of: *id005
wikidata_location:
country: &id007
id: Q213
label: Czech Republic
description: country in Central Europe
headquarters_location: &id006
id: Q1085
label: Prague
description: capital city of the Czech Republic
located_in_admin_entity: *id006
location: *id006
wikidata_country: *id007
wikidata_located_in: *id006
wikidata_organization:
member_of:
- id: Q106192307
label: Czech Republic Libraries Association
description: organization in Czechia
- id: Q5205559
label: DLM Forum
description: European membership community of public archives
wikidata_web:
official_website: &id008
- http://www.nacr.cz/eindex.htm
- http://www.nacr.cz/
wikidata_official_website: *id008
wikidata_social_media:
twitter_username: NarodniArchivCZ
facebook_id: '61560464377399'
instagram_username: narodniarchiv
wikidata_media:
commons_category: Národní archiv
image: National Archive, Prague Chodov.jpg
wikidata_image: National Archive, Prague Chodov.jpg
wikidata_contact:
email: mailto:na@nacr.cz
phone_number: +420-974-847-290
_provenance:
content_hash:
algorithm: sha256
value: sha256-UC08pEIX/vl43uf1KbjHBK5eIiDQxqspgQ1scbE3LFY=
scope: enrichment_section
computed_at: '2025-12-28T19:58:21.538924+00:00'
prov:
wasGeneratedBy:
'@type': prov:Activity
name: wikidata_api_fetch
used: https://www.wikidata.org/w/rest.php/wikibase/v1
wasDerivedFrom: https://www.wikidata.org/wiki/Q6970414
verification:
status: verified
last_verified: '2025-12-28T19:58:21.538935+00:00'
google_maps_enrichment:
place_id: ChIJpeVeWjWSC0cRLiagLWqyF5U
name: National Archives of the Czech Republic
fetch_timestamp: '2025-12-08T19:47:29.028861+00:00'
api_status: OK
coordinates:
latitude: 50.0389097
longitude: 14.492836599999997
formatted_address: Archivní 2257/4, 149 00 Praha 4-Chodov, Czechia
short_address: Archivní 2257/4, Praha 4-Chodov
phone_local: 974 847 247
phone_international: +420 974 847 247
website: http://www.nacr.cz/
google_place_types:
- point_of_interest
- establishment
business_status: OPERATIONAL
rating: 4.6
total_ratings: 155
reviews:
- author_name: Bernhard Struck
author_uri: https://www.google.com/maps/contrib/111303903784806922325/reviews
rating: 5
relative_time_description: 5 years ago
text: Super welcoming and very helpful archivists (for visitors like myself who are new and struggle with Czech). Thanks so much, keep up the great work.
publish_time: '2020-09-22T12:20:41.750155Z'
- author_name: Mały Oisior
author_uri: https://www.google.com/maps/contrib/100968724745138285308/reviews
rating: 5
relative_time_description: 5 years ago
text: Great
publish_time: '2020-04-29T23:36:09.585776Z'
- author_name: Kate Challis
author_uri: https://www.google.com/maps/contrib/111098916841330643337/reviews
rating: 5
relative_time_description: 8 years ago
text: Excellent archive
publish_time: '2017-12-05T09:47:33.419Z'
- author_name: Josef Brožek
author_uri: https://www.google.com/maps/contrib/105362763666969692195/reviews
rating: 1
relative_time_description: 3 weeks ago
text: The working hours of the employees of this office are ridiculous... Starting at 9, being gone by 1 pm... Paying for something like this out of taxes is a joy...
publish_time: '2025-11-14T12:59:55.176030204Z'
- author_name: David Veselík
author_uri: https://www.google.com/maps/contrib/116735262197680877900/reviews
rating: 3
relative_time_description: 5 months ago
text: Professional approach when searching for documents on the topic of the study. However, they themselves spoiled the positive evaluation several times. Unfortunately, it happened to me several times that I received inaccurate information from the research room staff when searching for information about the fund in the inventories. When I asked whether there was a fund for police stations and it was accessible in the research room, I was told that it was not. When I wrote directly to the relevant department, they sent it to me for viewing by email without any problems. It also happened to me once that a younger research room employee in glasses, who hands over archival materials for the study, was sleeping in his chair and I was very embarrassed to wake him up so that I wouldn't waste time waiting for him to hand me more archival materials. It happened at the beginning of January. Other researchers noticed it too. That definitely doesn't add to trust. I wouldn't expect something like that in an institution like the National Archives. It was clear that the younger archivist didn't even find it inappropriate and he didn't even need an apology for it.
publish_time: '2025-06-27T19:06:48.934404281Z'
opening_hours:
open_now: false
weekday_text:
- 'Monday: 9:00AM5:30PM'
- 'Tuesday: 9:00AM4:00PM'
- 'Wednesday: 9:00AM5:30PM'
- 'Thursday: 9:00AM4:00PM'
- 'Friday: Closed'
- 'Saturday: Closed'
- 'Sunday: Closed'
photo_count: 10
photos_metadata:
- name: places/ChIJpeVeWjWSC0cRLiagLWqyF5U/photos/AZLasHoPaUTQ0Cq-l8DRXNopH4rQN_dbMPpuZHBgi75iWfcrUc7uJkdzVFw_sI0G5_ytqL5lOmliMdW76Q6VFZF3fbIqbE-ebq_3PxlYbwnlJAkZVPMVPSF1YVd7kE5yN2L37YWT_eEypIK29dsIZ0d4EpojbCYFARTve5-ahIRxSk7OtrXuBpWiDq5T08pN9CennBKiY5U0neaTIiXch83k3KvJhURxu4ltW6nDw2sWFJPrBEjv6mYBrKg0mlmoAMV-5z-VCj5NomupGFX_bVeGMzoAabbjSXyjPbTMpA6HrVSlBhRlFbKLnOBAs1Wxnx109QDcfI6rL2_eDFZ8kA2ipP4SS6i5fLeQtXSXdWEWYUMvBUUCFQTCBLd95E6hMvM3PJlthH15uiXk9-W5zx7OzOILmscFRX6jh9EKsRTjqoRnkg
height: 3456
width: 4608
- name: places/ChIJpeVeWjWSC0cRLiagLWqyF5U/photos/AZLasHoTdPgUDgrEWJawKXBSgFBWe_x-wDHC9HT6r5hdzi6R7tN-M6AOVhJ5bRlOZPLbfjO6PYNxfRcKIlnDBRNSt80CAc-fX541otXW35xF7MFXD3eiNcWVVW8DvI-lQ2Ewz19jYYxJgXNnRezXQeTvCYRl71Ft87gc9rgYr2FAzaXYRbGvxyvHo9hfqYME2_ES8nuF-EUNdKGAhr0TLHSKoe0wPU_GWduuxUfj_kSMH7ADxJPqUyFnJue0p80gKo0_UDpjiXvknX3yGbudMWtxQFEcisD-dOp5We74B8TqmsMDb1UrDlZvlL4d3LABvrTn4XnLHNt0r52SKRTAnYGQu96qNpmqf_YvRr5XuS1V_w7IdpV5197ARbOl0hYxlU-ohgVZyN5Puqg1wqfXBTKLZkhMSF1pXn_zb-VGJFdxPUX9vvV4
height: 3120
width: 4160
- name: places/ChIJpeVeWjWSC0cRLiagLWqyF5U/photos/AZLasHrq4pWkwjdAzfEjdkgrAnqCOt-63zK1p5hljh3tXPozHdXyN0QF2z86HunordTpQMX4FCIRkewIVVgDBuWCMEPvRupLG9EuSEerRbGbMYeUiv-VhDk6R2b6Kx5qUJDE9_baHpzEV30qx4ipi4_QCTyuSOi0vDN45e0erBcO59tWkKpE8JlUDrB68YuUK-__IMYWae--rb434xCuWousoe5fimgqBf55W2-zCEiWQFzBlagqtfOm-KeMjAEPvM2BI7N8GVM0_JomgobT1BH8KXEhOhb_nvnXvX6epOZR1uMXJhmlK5WJevXAREZYGDC3PJYCE6Wy-B3Z6HjYXNE9Rmx7AbHZCdGSP4J5CLUQ2SFkuiWPK_x2rldpNYzXkX8sRyR_ersJfwbBDjm1VAvknOMiLR6YQCH2GWHnhWaNEstStJe3jQ5kjVq3oF7KTsz0
height: 4032
width: 3024
- name: places/ChIJpeVeWjWSC0cRLiagLWqyF5U/photos/AZLasHqY4JLHwfVe-ti3wqxKcPh0faKIYY0HfgYA0T28E5UBjeyzS_J9JdaQojkUW-8H2RAK1HMQyXghkKg7_ZThJ3Arr7E436eZc_fRpfTulJaP_qKTweRV2x8l-6B0gGymdP-1SsTKdjQtUBdp4FAjhIMg4HNnBVHslHhvGB56GTJhNPYStV9H14L3XZBYiIARvuIOfGox4GVm6SF3h9w0C8DfNxF1broYMfVKySFqoPb14o6yyS9EVDg8qec7Tq73a8U5-BdxmqbrP8PNbTyd4i5AAK4sm4Ill3QLqTNzDMibMaKQK91boTs_lvqY4b3_sgBAsgE_7XDQVbmsGCdQCtZTkeBV0t0vJlk42VlEEj6rVfgAdmM4VjXU_LWFvL5rxE70GJlcEPWNBLhqWi1nPZnMrdESoN_yxvg9ZSSP-qm_Wg
height: 3000
width: 4000
- name: places/ChIJpeVeWjWSC0cRLiagLWqyF5U/photos/AZLasHpKSe7jxGBdIwTX5hHAbVIqQnsR7PlU6PD0ohDu41MxRLyFJDtAqwQF2kQV_lBuX3xJN59SSF7RfMq9QK0y6cdIxINKRkTTAtctreCuakNG8CNkrhXUYu2lJWUkG99wgOqOcLRRxWouokHJ2WA6W61OrPVqM85CZ0ynHQWTeRMIkZu6TDye5NIoDd-qkUiENxuv6L2DC12WHWIdUCcrgaCCiEeFKFvhtnbDaYAB9Xc_enAWpkL5uSpUa5wP-fumcTZnDgDvso5wEvN1fIbqZE_RyTlhr8LvYKDrY7HbtCFTn1jmEYZwEPeLLHzSyCNKh3lyH9vB6T5lGfx46zw7-7xZ5-5-3WCbI0PbEm6hwCOxuQ8tlLPqGR54Uk6M_53MxnUGjeSai2ZGPsBJ_7oozGhNpfpT8z74ibftPgX98Qo0Rv8jRjKYado-JTMhGw
height: 4032
width: 3024
google_maps_url: https://maps.google.com/?cid=10743251605217355310&g_mp=Cidnb29nbGUubWFwcy5wbGFjZXMudjEuUGxhY2VzLlNlYXJjaFRleHQQAhgEIAA
llm_verification:
is_match: true
confidence: 1.0
entity_type: GRP.HER
reasoning: 'Perfect match. 1. Name is a direct translation: ''Národní archiv'' (Czech) and ''National Archives of the Czech Republic'' (English). 2. Location matches: The address is in Prague, Czechia, which is consistent with the source''s country code ''CZ''. 3. Type matches: The name ''National Archives'' and website confirm it is an archive, a type of heritage institution. 4. Entity type is correct.'
agent: glm-4.6
verified: true
ch_annotator_version: ch_annotator-v1_7_0
_provenance:
content_hash:
algorithm: sha256
value: sha256-yqqNTooF0NoG/Wv8muZIG9QfMBYXF/WqgY5Ml+js3sc=
scope: enrichment_section
computed_at: '2025-12-28T19:58:21.539026+00:00'
prov:
wasDerivedFrom: https://maps.googleapis.com/maps/api/place/details/json?place_id=ChIJpeVeWjWSC0cRLiagLWqyF5U
generatedAtTime: '2025-12-08T19:47:29.028861+00:00'
wasGeneratedBy:
'@type': prov:Activity
name: google_maps_api_fetch
used: https://maps.googleapis.com/maps/api/place
verification:
status: verified
last_verified: '2025-12-28T19:58:21.539030+00:00'
google_maps_status: SUCCESS
youtube_status: NOT_FOUND
youtube_search_query: Národní archiv official
youtube_search_timestamp: '2025-12-08T19:47:31.533149+00:00'
location:
latitude: 50.0389097
longitude: 14.492836599999997
coordinate_provenance:
source_type: GOOGLE_MAPS
source_path: google_maps_enrichment.coordinates
original_timestamp: '2025-12-08T19:47:29.028861+00:00'
entity_id: ChIJpeVeWjWSC0cRLiagLWqyF5U
region_code: 10
country: CZ
street_address: Archivní 2257/4, Praha 4-Chodov
formatted_address: Archivní 2257/4, 149 00 Praha 4-Chodov, Czechia
normalization_timestamp: '2025-12-09T06:49:28.591723+00:00'
logo_enrichment:
enrichment_timestamp: '2025-12-23T20:57:48.334183+00:00'
source_url: http://www.nacr.cz/eindex.htm
extraction_method: crawl4ai
claims:
- claim_type: logo_url
claim_value: https://www.nacr.cz/wp-content/themes/narodni_archiv/img/logo_na_cs.png
source_url: http://www.nacr.cz/eindex.htm
css_selector: '#wrapper-navbar > header.header > div.header__main:nth-of-type(2) > nav.navbar.navbar-expand-lg > div.navbar-mobile-top > div.navbar-brand > a > img'
retrieved_on: '2025-12-23T20:57:48.334183+00:00'
extraction_method: crawl4ai_header_logo
detection_confidence: high
alt_text: Národní archiv
- claim_type: favicon_url
claim_value: https://www.nacr.cz/wp-content/themes/narodni_archiv/img/favicon/apple-icon-180x180.png
source_url: http://www.nacr.cz/eindex.htm
css_selector: '[document] > html > head > link:nth-of-type(9)'
retrieved_on: '2025-12-23T20:57:48.334183+00:00'
extraction_method: crawl4ai_link_rel
favicon_type: ''
favicon_sizes: 180x180
summary:
total_claims: 2
has_primary_logo: true
has_favicon: true
has_og_image: false
favicon_count: 13