glam/data/custodian.backup.20251230/BR-DI-BRA-A-APD.yaml
2025-12-30 23:07:03 +01:00

406 lines
17 KiB
YAML
Raw Blame History

This file contains invisible Unicode characters

This file contains invisible Unicode characters that are indistinguishable to humans but may be processed differently by a computer. If you think that this is intentional, you can safely ignore this warning. Use the Escape button to reveal them.

This file contains Unicode characters that might be confused with other characters. If you think that this is intentional, you can safely ignore this warning. Use the Escape button to reveal them.

# Source entry for this custodian, taken from the CH-Annotator file named in
# `source`. The anchors &id001-&id004 defined on four of the identifiers are
# referenced again by alias in the later `identifiers` list.
original_entry:
name: Arquivo Público DF
institution_type: ARCHIVE
source: CH-Annotator (latin_american_institutions_AUTHORITATIVE_ch_annotator.yaml)
identifiers:
- &id001
identifier_scheme: OpenStreetMap
identifier_value: way/546440775
identifier_url: https://www.openstreetmap.org/way/546440775
- identifier_scheme: GHCID
identifier_value: BR-DF-BRA-A-APD
- identifier_scheme: GHCID_NUMERIC
identifier_value: '17173642500678551557'
- &id002
identifier_scheme: OLD_ID
identifier_value: https://w3id.org/heritage/custodian/br/arquivo-publico-df
- identifier_scheme: GHCID_UUID
identifier_value: 22fee297-929d-5df3-9e09-08a174ac19ea
identifier_url: urn:uuid:22fee297-929d-5df3-9e09-08a174ac19ea
- identifier_scheme: GHCID_UUID_SHA256
identifier_value: ee5508dd-507f-8805-92f7-836d99bdc8e0
identifier_url: urn:uuid:ee5508dd-507f-8805-92f7-836d99bdc8e0
- identifier_scheme: RECORD_ID
identifier_value: 019a58fd-3226-77cc-b03f-0e71083ecd60
identifier_url: urn:uuid:019a58fd-3226-77cc-b03f-0e71083ecd60
- &id003
identifier_scheme: OLD_ID
# Quoted so it loads as a string: the number is larger than the signed 64-bit
# maximum (9223372036854775807), and the GHCID_NUMERIC entry above already
# stores the same digits as a quoted string.
identifier_value: '17173642500678551557'
- &id004
identifier_scheme: Wikidata
identifier_value: Q56693579
identifier_url: https://www.wikidata.org/wiki/Q56693579
locations:
- country: BR
region: DISTRITO FEDERAL
city: Brasília
latitude: -15.7713876
longitude: -47.9107101
# Carries the same timestamp as ghcid.generation_timestamp and
# integration_note.creation_date.
processing_timestamp: '2025-12-06T23:35:51.834862+00:00'
# Current GHCID with its UUID and numeric forms, how the location codes were
# resolved, and the history of GHCID values (a single entry so far).
ghcid:
ghcid_current: BR-DI-BRA-A-APD
ghcid_original: BR-DI-BRA-A-APD
ghcid_uuid: 5c70b7b3-d318-508b-abe0-9b38202d925d
ghcid_uuid_sha256: 2f123162-8cb5-8ad7-0952-56476ac71200
ghcid_numeric: 3391827768700676823
record_id: 825d81f6-ce15-4324-84e8-ce70f7e71f21
generation_timestamp: '2025-12-06T23:35:51.834862+00:00'
location_resolution:
country_code: BR
# NOTE(review): region_code is DI here, while original_entry.identifiers
# carries the GHCID BR-DF-BRA-A-APD — confirm which region code is intended.
region_code: DI
city_code: BRA
method: CH_ANNOTATOR_SOURCE
ghcid_history:
- ghcid: BR-DI-BRA-A-APD
ghcid_numeric: 3391827768700676823
valid_from: '2025-12-06T23:35:51.834862+00:00'
reason: Initial GHCID from CH-Annotator (latin_american_institutions_AUTHORITATIVE_ch_annotator.yaml)
# Name claim for this custodian; the value equals original_entry.name.
custodian_name:
claim_type: custodian_name
claim_value: Arquivo Público DF
source_type: ch_annotator
# Identifier list for the record. The first five entries repeat the values held
# in the `ghcid` section (GHCID_NUMERIC is stored here as a quoted string); the
# last four are aliases to the anchored entries of original_entry.identifiers
# (OpenStreetMap, the two OLD_ID entries, and Wikidata).
identifiers:
- identifier_scheme: GHCID
identifier_value: BR-DI-BRA-A-APD
- identifier_scheme: GHCID_UUID
identifier_value: 5c70b7b3-d318-508b-abe0-9b38202d925d
- identifier_scheme: GHCID_UUID_SHA256
identifier_value: 2f123162-8cb5-8ad7-0952-56476ac71200
- identifier_scheme: GHCID_NUMERIC
identifier_value: '3391827768700676823'
- identifier_scheme: RECORD_ID
identifier_value: 825d81f6-ce15-4324-84e8-ce70f7e71f21
- *id001
- *id002
- *id003
- *id004
# Record-level provenance: data source and tier, extraction details, confidence,
# free-text processing notes, and a per-enrichment hash summary.
provenance:
data_source: CONVERSATION_NLP
data_tier: TIER_4_INFERRED
extraction_date: '2025-11-06T08:31:18.910256+00:00'
extraction_method: 'Created from CH-Annotator file: latin_american_institutions_AUTHORITATIVE_ch_annotator.yaml'
confidence_score: 0.75
# The "Canonical location added" note appears twice, with different timestamps.
notes:
- 'YouTube/Google Maps enrichment 2025-12-08T20:11:57Z: Maps: Public Archive of the Federal District (conf: 0.95); YouTube: not found'
- Canonical location added via normalize_custodian_files.py on 2025-12-08T23:46:55Z
- Canonical location added via normalize_custodian_files.py on 2025-12-09T06:48:20Z
schema_version: 2.0.0
# The content_hash and verified_at values below repeat the ones stored in the
# `_provenance` entries of the wikidata_enrichment and google_maps_enrichment
# sections.
enrichment_provenance:
wikidata_enrichment:
content_hash: sha256-LqtZ64AGy96otUp/L8n6SyzWGCt/2p11prZlrnW2+bo=
verified_at: '2025-12-28T19:57:35.251571+00:00'
wasDerivedFrom: https://www.wikidata.org/wiki/Q56693579
google_maps_enrichment:
content_hash: sha256-sWEPrdTSsntBCE/cAAJaE79PZnQIVu+fFCYgMXvmkKE=
verified_at: '2025-12-28T19:57:35.251670+00:00'
provenance_schema_version: '2.0'
standards_compliance:
- W3C PROV-O
- W3C SRI (content hashes)
generated_at: '2025-12-28T19:57:35.251683+00:00'
# CH-Annotator metadata: the convention id and version applied, the entity
# classification assigned to this custodian, and provenance for the extraction
# and the later annotation pass.
ch_annotator:
convention_id: ch_annotator-v1_7_0
convention_version: 1.7.0
entity_classification:
hypernym: GRP
hypernym_label: GROUP
subtype: GRP.HER.ARC
subtype_label: ARCHIVE
ontology_class: schema:ArchiveOrganization
alternative_classes:
- org:FormalOrganization
- rov:RegisteredOrganization
- glam:HeritageCustodian
# The path and timestamp here are repeated in the provenance of most entity
# claims further down.
extraction_provenance:
namespace: glam
path: /conversations/2025-09-22T14-40-15-0102c00a-4c0a-4488-bdca-5dd9fb94c9c5
timestamp: '2025-11-06T08:31:18.910256+00:00'
agent: claude-conversation
context_convention: ch_annotator-v1_7_0
annotation_provenance:
annotation_agent: opencode-claude-sonnet-4
annotation_date: '2025-12-06T21:13:56.173868+00:00'
annotation_method: retroactive CH-Annotator application via batch script
source_file: latin_american_institutions_AUTHORITATIVE.yaml
# Annotation confidence and verification state. The record is marked as not
# verified, so the verification date and verifier are written as explicit
# nulls instead of bare empty values (same parsed value, unambiguous intent).
annotation_metadata:
confidence_score: 0.75
verified: false
verification_date: null
verified_by: null
# Individual claims about the entity. Each claim has a type, a value, the
# property URI it maps to, its own provenance, and a confidence.
entity_claims:
- claim_type: full_name
claim_value: Arquivo Público DF
property_uri: skos:prefLabel
provenance:
namespace: glam
path: /conversations/2025-09-22T14-40-15-0102c00a-4c0a-4488-bdca-5dd9fb94c9c5
timestamp: '2025-11-06T08:31:18.910256+00:00'
agent: claude-conversation
context_convention: ch_annotator-v1_7_0
confidence: 0.75
- claim_type: institution_type
claim_value: ARCHIVE
property_uri: rdf:type
provenance:
namespace: glam
path: /conversations/2025-09-22T14-40-15-0102c00a-4c0a-4488-bdca-5dd9fb94c9c5
timestamp: '2025-11-06T08:31:18.910256+00:00'
agent: claude-conversation
context_convention: ch_annotator-v1_7_0
confidence: 0.95
- claim_type: located_in_city
claim_value: Brasília
property_uri: schema:addressLocality
provenance:
namespace: glam
path: /conversations/2025-09-22T14-40-15-0102c00a-4c0a-4488-bdca-5dd9fb94c9c5
timestamp: '2025-11-06T08:31:18.910256+00:00'
agent: claude-conversation
context_convention: ch_annotator-v1_7_0
confidence: 0.9
# This is the only claim whose provenance namespace is wikidata rather than glam.
- claim_type: wikidata_id
claim_value: Q56693579
property_uri: owl:sameAs
provenance:
namespace: wikidata
path: /entity/Q56693579
timestamp: '2025-11-06T08:31:18.910256+00:00'
agent: claude-conversation
context_convention: ch_annotator-v1_7_0
confidence: 0.98
# NOTE(review): this claim carries BR-DF-BRA-A-APD with confidence 1.0, whereas
# ghcid.ghcid_current is BR-DI-BRA-A-APD — confirm which value is intended.
- claim_type: ghcid
claim_value: BR-DF-BRA-A-APD
property_uri: glam:ghcid
provenance:
namespace: glam
path: /conversations/2025-09-22T14-40-15-0102c00a-4c0a-4488-bdca-5dd9fb94c9c5
timestamp: '2025-11-06T08:31:18.910256+00:00'
agent: claude-conversation
context_convention: ch_annotator-v1_7_0
confidence: 1.0
# Records which file and script this custodian record was created from.
integration_note:
created_from: latin_american_institutions_AUTHORITATIVE_ch_annotator.yaml
creation_date: '2025-12-06T23:35:51.834862+00:00'
creation_method: create_custodian_from_ch_annotator.py
# Data fetched from the Wikidata REST API for entity Q56693579.
# NOTE(review): the labels, descriptions, administrative entity, coordinates,
# postal code, website and contact details in this section all describe an
# archive in Campo Belo, Minas Gerais, while this record is named
# "Arquivo Público DF" and is located in Brasília. The Wikidata match looks
# wrong even though verification.status says verified — confirm before relying
# on this section.
wikidata_enrichment:
wikidata_entity_id: Q56693579
api_metadata:
api_endpoint: https://www.wikidata.org/w/rest.php/wikibase/v1
fetch_timestamp: '2025-12-08T23:20:44.971796+00:00'
user_agent: GLAMDataExtractor/1.1 (glam-data@example.com) Python/httpx
enrichment_version: 2.0_full
properties_found:
- P17
- P31
- P131
- P968
- P625
- P856
- P1329
- P281
- P973
wikidata_labels:
pt: Fundação Museu e Arquivo Público do Município de Campo Belo
pt-br: Fundação Museu e Arquivo Público do Município de Campo Belo
wikidata_descriptions:
pt: arquivo em Campo Belo, Minas Gerais
pt-br: arquivo em Campo Belo, Minas Gerais
en: archive in Campo Belo, Minas Gerais
de: Archiv in Brasilien
wikidata_description_en: archive in Campo Belo, Minas Gerais
# Anchors &id005-&id008 let the wikidata_instance_of, wikidata_country,
# wikidata_located_in and wikidata_coordinates keys alias the same values.
wikidata_classification:
instance_of: &id005
- id: Q166118
label: archive
description: agency or institution responsible for the preservation and communication of records selected for permanent preservation
wikidata_instance_of: *id005
wikidata_location:
country: &id006
id: Q155
label: Brazil
description: country in South America
located_in_admin_entity: &id007
id: Q595804
label: Campo Belo
description: town and municipality in the state of Minas Gerais, in Brazil
# These coordinates differ from the ones in original_entry.locations
# (-15.7713876, -47.9107101).
coordinates: &id008
latitude: -20.8933848
longitude: -45.2731018
precision: 1.0e-06
postal_code: 37270-000
wikidata_country: *id006
wikidata_located_in: *id007
wikidata_coordinates: *id008
wikidata_web:
official_website: https://www.campobelo.mg.gov.br/portal/servicos/60/INSTITUCIONAL/Funda%C3%A7%C3%A3o-Museu-e-Arquivo-P%C3%BAblico
described_at_url: https://dibrarq.arquivonacional.gov.br/index.php/fundacao-museu-e-arquivo-publico-do-municipio-de-campo-belo
wikidata_official_website: https://www.campobelo.mg.gov.br/portal/servicos/60/INSTITUCIONAL/Funda%C3%A7%C3%A3o-Museu-e-Arquivo-P%C3%BAblico
wikidata_contact:
email: mailto:admin@museucampobelo.org
phone_number: +55-35-3832-5753
# Content hash and PROV metadata for this enrichment section.
_provenance:
content_hash:
algorithm: sha256
value: sha256-LqtZ64AGy96otUp/L8n6SyzWGCt/2p11prZlrnW2+bo=
scope: enrichment_section
computed_at: '2025-12-28T19:57:35.251571+00:00'
prov:
wasGeneratedBy:
'@type': prov:Activity
name: wikidata_api_fetch
used: https://www.wikidata.org/w/rest.php/wikibase/v1
wasDerivedFrom: https://www.wikidata.org/wiki/Q56693579
verification:
status: verified
last_verified: '2025-12-28T19:57:35.251579+00:00'
# Place details recorded from Google Maps: identity, coordinates, address,
# phone, website, place types, rating, and a sample of five reviews.
google_maps_enrichment:
place_id: ChIJHyjj6jcwWpMRz4DaDzguqwc
name: Public Archive of the Federal District
fetch_timestamp: '2025-12-08T20:11:54.770290+00:00'
api_status: OK
coordinates:
latitude: -15.7718782
longitude: -47.910947
# Both address fields contain an opening parenthesis that is never closed.
formatted_address: SGO Qd. 05 Lote 23 Bloco B (Antigo TSE - Asa Norte, Brasília - DF, 70610-650, Brazil
short_address: SGO Qd. 05 Lote 23 Bloco B (Antigo TSE - Asa Norte, Brasília
phone_local: (61) 3313-5981
phone_international: +55 61 3313-5981
website: https://www.arpdf.df.gov.br/
google_place_types:
- cultural_center
- point_of_interest
- establishment
primary_type: cultural_center
business_status: OPERATIONAL
rating: 4.4
total_ratings: 329
# Reviewer-authored text; presumably stored verbatim from the API, so spelling
# inside `text` is left as is.
reviews:
- author_name: Robson Alves
author_uri: https://www.google.com/maps/contrib/117029445471804808852/reviews
rating: 5
relative_time_description: 6 months ago
text: Top
publish_time: '2025-06-07T16:53:12.458400Z'
- author_name: Clayton Alves
author_uri: https://www.google.com/maps/contrib/100324000903105902902/reviews
rating: 5
relative_time_description: 6 years ago
text: Very good
publish_time: '2019-11-03T15:04:00.733924Z'
- author_name: Wesley Punk
author_uri: https://www.google.com/maps/contrib/112392639271864780491/reviews
rating: 5
relative_time_description: a year ago
text: Legal
publish_time: '2024-08-09T20:29:14.995785Z'
- author_name: Francisco Mota
author_uri: https://www.google.com/maps/contrib/111823137529859984321/reviews
rating: 5
relative_time_description: 6 years ago
text: Top
publish_time: '2019-10-03T04:14:52.777556Z'
- author_name: Marcelo Judice
author_uri: https://www.google.com/maps/contrib/114891886476276807491/reviews
rating: 5
relative_time_description: a year ago
text: 'Muito satisfeito de ter conhecido instituição tão importante para a memória do Distrito Federal.
Atua como protetora de materiais impressos e audiovisuais com o registro histoʻrico dobque aconteceu na Capital do Brasil, desde antes de sua fundação.'
publish_time: '2024-11-28T00:06:44.177534Z'
# Weekly opening hours for the place.
# The weekday time ranges had lost their separators and read "9:00AM5:00PM";
# they are restored here with ordinary spaces and an en dash.
# NOTE(review): if the enrichment section's content hash covers this text, it
# will need recomputing after this change — confirm.
opening_hours:
open_now: false
weekday_text:
- 'Monday: 9:00 AM – 5:00 PM'
- 'Tuesday: 9:00 AM – 5:00 PM'
- 'Wednesday: 9:00 AM – 5:00 PM'
- 'Thursday: 9:00 AM – 5:00 PM'
- 'Friday: 9:00 AM – 5:00 PM'
- 'Saturday: Closed'
- 'Sunday: Closed'
# photo_count is 10, but only five photo entries (resource name, height, width)
# are listed in photos_metadata.
photo_count: 10
photos_metadata:
- name: places/ChIJHyjj6jcwWpMRz4DaDzguqwc/photos/AZLasHoZLF52sqNntJaxUFR6_M8qwGS2jXvN6SL5apcfuzWSy9sBkCqRzWtT8u7miwgUkKP4ZzBAq8qcyKN2ymRX-qu6RXIFr_rmNiE3qb0AfMq2M3vk1hnFShx2GefUh94DcZmildTwTSWyQv1xIoTLlZe19XLnkE0npLuw8JdRtgvr-W94l6UnrVA9pfb3XTo3MAz1eF9wurd8-RBdOnQ8zzCgHJzUA576SBFthbNYX5kS5uWK46-Gc4T7FjpRnCuqmdgw8tc35TTDsAWn-F__bWUMFcKO-cglS7MZN0Ok6EIv3o7eHjxlIQIVUynUed0IvuVXE96yTh41gEOJo_8S_dm2kSL2HzMaw-LHVuUB-K9WZNFstG2JdHNzTa44mx8jTVFU0QnXIXRv8OoTbX3hmaM36qFOQ4bfvrYXbvkGwoCxrLQ
height: 720
width: 1280
- name: places/ChIJHyjj6jcwWpMRz4DaDzguqwc/photos/AZLasHqtKEAnSlsiQWelificmIze5yPUjmUMVzTClexB1yWhcqn7hrn7mD9MucE44qG8mGxu0iPCL4Ht73fF1SPLPWoC9av0uni7x_v5P57YqRWKMsMMpDmZkX625zaXXCxBlE_ZSngi3N8Ca3ITGFHlDHD03K4atQY5ZL9_Kwn4klsI22utxY72za8gu1W8I30QQKJFdwna-wJvXtudFisEzJhojd2xunitdgLQIDjCsaOVjgFG77rbeR-g_uBvu6jbkeQkYt0tRlvezREpzTSgqUWZDf5gVObxaYJk2KAfviLZKUpU6wn0yMMvQfcM0zN3LwSaJR3lurukKaaltkPqzdv1Cqy4UlALsZpe2yVVdyzYDAzVClNdY_gp1TP9VFPTqURNLWkRHO9tdz8wg6e7w93KxcwLobqkse9N3jPh2HI
height: 3072
width: 4096
- name: places/ChIJHyjj6jcwWpMRz4DaDzguqwc/photos/AZLasHpSGQ0yk4AXtKMeitsiHBWIjw34-jEF-GpD4YnJ6qjokvyz4edAzSLvePoVYHStPF4diy7xNFs2XSms6Ja5D7wWe6xeUgAz84PPwAb3cjscPG-PrNj3foV4CyKTaNE13PcagaE4G9B5rzoseD2ZYJZab0paXzdi1b7XgN-QrMEJFmcFKNEgKR9CAFkO574fhkSxRfq2a0bKK_ZB0PbpG1Zx1Xs2tecU2kk47CYnfOvXe9EGoOpuHjO4z3ow-Abb7HnE3Kb0kbRER6dzRd9j4KdIuoNSdVWlbv-vOSxJs8zFNymfJOtQC-yopEPjCW6mJiYX6OmQg3yX_oPdOFVtD3FDAsqQt4GCJv6LnvjXHPRnTM1iuZk3km_cKnc3z1avgxWkvMXRiV8me8v-L1tQmMBB9jBTlti_1i6czETXZSJkiMhx
height: 720
width: 1280
- name: places/ChIJHyjj6jcwWpMRz4DaDzguqwc/photos/AZLasHrzlA0SYQtKC2rSgGd2cqGqKZCbzi0qY0y_DV3az21gzh8eHWEkpSOccQ1qq0ad9BqfDlV3OWhHZNAzyUpg6sZpUlOjiSQLRaKc_EpT-k0SJbOOTpXxaF4CxQKMMeba30qfgIZOsN-GvxC132Gj0GaJh0ZC2ZliDnbgQq4HVXqJzBbH29rzjbZWvPUEkOsh898i8uDklL-QncwB4rJctlVwuJpuGC0jgjffk-OO4sY1Pz484v8v_W3MtdE8Z9W9MY7tlbEhADF0weB0KL8xnV3YVfZgsLQGVrsoRASB-qsGOFyB-efPb3WT-v-bp-FInCwMSfYyFBZbnjGSvP5pYndmkwpP79JXjWCzVOYYvcx3KBZElxUw6mJSnPNSomD8ZuFtpWi9YFFjzCqFksANnKcAvTJKYSoSB60VOP59jYL75A
height: 1456
width: 2592
- name: places/ChIJHyjj6jcwWpMRz4DaDzguqwc/photos/AZLasHro8zY1Kj4PXHRNr8gxsqHmSCm8vNUUR1_nChWwdtCDCuaoJdV8jIX0ZAfTL__2rnTq-eIf_ZSAGpCFGVqMev1lqITPrQsBE7oqG4RfpErHzi1I2RM40speDj-Oj6yndIy9hd3xcQ-twPg45AmUh6MdxQkHKKGYsJkikxTcJMivPd49RK7f-s5xyPTGRdoZJ-cSZW97MojXKrkeFrU11nXrIeB2x8QHSuD-A2u5WabgjAXV-EMr0MXgFrYKNIctYkQlyAAyakyfxBwf8FZF7EH5lm75Lj0MCCJbQiZ8ZJDwacdjotB6qxQiWb2Hdj5LxAus6I4StLDibiUUmu_jGaAk2gPsdTwZQcz4yq49Z-b3B4_nmxZ9abS087d8NwPyQ3NbDQ_8yGI5zcakPRs_1ZVhKRWeUWCHYiHC8HH6KzgOzv05
height: 720
width: 1280
google_maps_url: https://maps.google.com/?cid=552586197602042063&g_mp=Cidnb29nbGUubWFwcy5wbGFjZXMudjEuUGxhY2VzLlNlYXJjaFRleHQQAhgEIAA
# Result of the LLM check that the Google Maps place is this custodian; the
# agent field names the model that produced it.
llm_verification:
is_match: true
confidence: 0.95
entity_type: GRP.HER
reasoning: Name is a direct translation from Portuguese to English. Location in Brasília, DF, Brazil is a match. The official website confirms the identity. While Google's primary type is 'cultural_center', the institution's name 'Public Archive' confirms it is an archive, which is a type of heritage institution.
agent: glm-4.6
verified: true
ch_annotator_version: ch_annotator-v1_7_0
# Content hash and PROV metadata for this enrichment section; generatedAtTime
# equals the section's fetch_timestamp.
_provenance:
content_hash:
algorithm: sha256
value: sha256-sWEPrdTSsntBCE/cAAJaE79PZnQIVu+fFCYgMXvmkKE=
scope: enrichment_section
computed_at: '2025-12-28T19:57:35.251670+00:00'
prov:
wasDerivedFrom: https://maps.googleapis.com/maps/api/place/details/json?place_id=ChIJHyjj6jcwWpMRz4DaDzguqwc
generatedAtTime: '2025-12-08T20:11:54.770290+00:00'
wasGeneratedBy:
'@type': prov:Activity
name: google_maps_api_fetch
used: https://maps.googleapis.com/maps/api/place
verification:
status: verified
last_verified: '2025-12-28T19:57:35.251674+00:00'
# Outcome flags for the two external lookups: Google Maps succeeded, and the
# YouTube search (query and timestamp recorded below) found nothing.
google_maps_status: SUCCESS
youtube_status: NOT_FOUND
youtube_search_query: Arquivo Público DF official
youtube_search_timestamp: '2025-12-08T20:11:57.553273+00:00'
# Normalized location for the record. The coordinates and both address strings
# equal the values in google_maps_enrichment, and coordinate_provenance names
# that section as their source.
location:
latitude: -15.7718782
longitude: -47.910947
coordinate_provenance:
source_type: GOOGLE_MAPS
source_path: google_maps_enrichment.coordinates
original_timestamp: '2025-12-08T20:11:54.770290+00:00'
entity_id: ChIJHyjj6jcwWpMRz4DaDzguqwc
city: Brasília
region: DISTRITO FEDERAL
# NOTE(review): DI matches ghcid.location_resolution.region_code, but
# original_entry carries the GHCID BR-DF-BRA-A-APD — confirm the intended code.
region_code: DI
country: BR
street_address: SGO Qd. 05 Lote 23 Bloco B (Antigo TSE - Asa Norte, Brasília
formatted_address: SGO Qd. 05 Lote 23 Bloco B (Antigo TSE - Asa Norte, Brasília - DF, 70610-650, Brazil
normalization_timestamp: '2025-12-09T06:48:20.985901+00:00'
# Logo and Open Graph image claims extracted with crawl4ai, plus a summary of
# what was found.
# NOTE(review): source_url is the campobelo.mg.gov.br page that the Wikidata
# section lists as official website, whereas google_maps_enrichment.website is
# https://www.arpdf.df.gov.br/ — confirm these image claims belong to this
# institution.
logo_enrichment:
enrichment_timestamp: '2025-12-22T14:33:40.718847+00:00'
source_url: https://www.campobelo.mg.gov.br/portal/servicos/60/INSTITUCIONAL/Funda%C3%A7%C3%A3o-Museu-e-Arquivo-P%C3%BAblico
extraction_method: crawl4ai
claims:
- claim_type: logo_url
claim_value: https://www.campobelo.mg.gov.br/img/logo_branca.png
source_url: https://www.campobelo.mg.gov.br/portal/servicos/60/INSTITUCIONAL/Funda%C3%A7%C3%A3o-Museu-e-Arquivo-P%C3%BAblico
css_selector: '#logo_branca > img'
retrieved_on: '2025-12-22T14:33:40.718847+00:00'
extraction_method: crawl4ai_header_logo
detection_confidence: high
alt_text: Logo
- claim_type: og_image_url
claim_value: https://www.campobelo.mg.gov.br/fotos/b9440a1b721aa771420cf69e73b64106.jpg
source_url: https://www.campobelo.mg.gov.br/portal/servicos/60/INSTITUCIONAL/Funda%C3%A7%C3%A3o-Museu-e-Arquivo-P%C3%BAblico
css_selector: '[document] > html > head > meta:nth-of-type(12)'
retrieved_on: '2025-12-22T14:33:40.718847+00:00'
extraction_method: crawl4ai_meta_og
# The counts below agree with the two claims listed above (one logo, one
# og:image, no favicon).
summary:
total_claims: 2
has_primary_logo: true
has_favicon: false
has_og_image: true
favicon_count: 0