glam/data/custodian/BR-PE-VAR-X-F.yaml
2025-12-30 23:01:01 +01:00

254 lines
10 KiB
YAML

original_entry:
name: FUNDAJ
institution_type: MIXED
source: CH-Annotator (latin_american_institutions_AUTHORITATIVE_ch_annotator.yaml)
identifiers:
- &id001
identifier_scheme: Website
identifier_value: http://digitalizacao.fundaj.gov.br/
identifier_url: http://digitalizacao.fundaj.gov.br/
- &id002
identifier_scheme: OpenStreetMap
identifier_value: node/5745593875
identifier_url: https://www.openstreetmap.org/node/5745593875
- identifier_scheme: GHCID
identifier_value: BR-PE-REC-M-F
- identifier_scheme: GHCID_NUMERIC
identifier_value: '4969544443987841306'
- &id003
identifier_scheme: OLD_ID
identifier_value: https://w3id.org/heritage/custodian/br/fundaj
- identifier_scheme: GHCID_UUID
identifier_value: 76b46cca-2df5-5f74-bbb9-b9b69d1eb51c
identifier_url: urn:uuid:76b46cca-2df5-5f74-bbb9-b9b69d1eb51c
- identifier_scheme: GHCID_UUID_SHA256
identifier_value: 44f75e57-8f69-811a-84d1-1122295e7de8
identifier_url: urn:uuid:44f75e57-8f69-811a-84d1-1122295e7de8
- identifier_scheme: RECORD_ID
identifier_value: 019a58fd-3226-75ea-a38e-7cfb5ff65112
identifier_url: urn:uuid:019a58fd-3226-75ea-a38e-7cfb5ff65112
- &id004
identifier_scheme: OLD_ID
identifier_value: 4969544443987841306
locations:
- country: BR
region: PERNAMBUCO
city: Recife
latitude: -8.0200442
longitude: -34.9364669
street_address: Rua Dois irmãos 92
postal_code: 55071-440
processing_timestamp: '2025-12-06T23:35:51.924216+00:00'
ghcid:
ghcid_current: BR-PE-VAR-X-F
ghcid_original: BR-PE-REC-X-F
ghcid_uuid: 338c7ad2-a2d3-52b3-baa6-c350e48b9327
ghcid_uuid_sha256: 69838a90-d27b-83db-647e-8fa92cc3ae87
ghcid_numeric: 7603072950542791643
record_id: bdda657b-c234-49d1-a774-d0b219e7582f
generation_timestamp: '2025-12-06T23:35:51.924216+00:00'
location_resolution:
method: REVERSE_GEOCODE
country_code: BR
region_code: PE
region_name: Pernambuco
city_code: VAR
city_name: Várzea
geonames_id: 3385478
feature_code: PPL
resolution_date: '2025-12-06T23:54:44.715310+00:00'
ghcid_history:
- ghcid: BR-30-VAR-X-F
ghcid_numeric: 7603072950542791643
valid_from: '2025-12-06T23:54:44.715310+00:00'
reason: Updated via GeoNames reverse geocoding (matched Várzea, geonames:3385478)
- ghcid: BR-PE-REC-X-F
ghcid_numeric: 11188838590843757112
valid_from: '2025-12-06T23:35:51.924216+00:00'
reason: Initial GHCID from CH-Annotator (latin_american_institutions_AUTHORITATIVE_ch_annotator.yaml)
valid_to: '2025-12-06T23:54:44.715310+00:00'
superseded_by: BR-30-VAR-X-F
- ghcid: BR-30-VAR-X-F
valid_from: '2025-12-06T23:35:51.924216+00:00'
valid_to: '2025-12-10T10:20:50Z'
reason: Region code corrected from GeoNames admin1 (30) to ISO 3166-2 (PE)
custodian_name:
claim_type: custodian_name
claim_value: FUNDAJ
source_type: ch_annotator
identifiers:
- identifier_scheme: GHCID
identifier_value: BR-PE-VAR-X-F
- identifier_scheme: GHCID_UUID
identifier_value: 338c7ad2-a2d3-52b3-baa6-c350e48b9327
- identifier_scheme: GHCID_UUID_SHA256
identifier_value: 69838a90-d27b-83db-647e-8fa92cc3ae87
- identifier_scheme: GHCID_NUMERIC
identifier_value: '7603072950542791643'
- identifier_scheme: RECORD_ID
identifier_value: bdda657b-c234-49d1-a774-d0b219e7582f
- *id001
- *id002
- *id003
- *id004
provenance:
data_source: CONVERSATION_NLP
data_tier: TIER_4_INFERRED
extraction_date: '2025-11-06T08:32:03.951400+00:00'
extraction_method: 'Created from CH-Annotator file: latin_american_institutions_AUTHORITATIVE_ch_annotator.yaml'
confidence_score: 0.85
notes:
- 'YouTube/Google Maps enrichment 2025-12-08T20:10:23Z: Maps: rejected by LLM; YouTube: not found'
- Canonical location added via normalize_custodian_files.py on 2025-12-08T23:10:52Z
- Canonical location added via normalize_custodian_files.py on 2025-12-08T23:46:54Z
- Canonical location added via normalize_custodian_files.py on 2025-12-09T06:48:19Z
schema_version: 2.0.0
enrichment_provenance:
wikidata_enrichment:
content_hash: sha256-vNJ/OKWaztgg86Us/iemxY8secjZm/VGYx5gQ0aEUAU=
verified_at: '2025-12-28T19:57:36.431367+00:00'
wasDerivedFrom: https://www.wikidata.org/wiki/Q10286348
provenance_schema_version: '2.0'
standards_compliance:
- W3C PROV-O
- W3C SRI (content hashes)
generated_at: '2025-12-28T19:57:36.431380+00:00'
ch_annotator:
convention_id: ch_annotator-v1_7_0
convention_version: 1.7.0
entity_classification:
hypernym: GRP
hypernym_label: GROUP
subtype: GRP.HER.MIX
subtype_label: MIXED
ontology_class: glam:HeritageCustodian
alternative_classes:
- org:FormalOrganization
- rov:RegisteredOrganization
- glam:HeritageCustodian
extraction_provenance:
namespace: glam
path: /conversations/2025-09-22T14-40-15-0102c00a-4c0a-4488-bdca-5dd9fb94c9c5
agent: batch-script-create-custodian-from-ch-annotator
context_convention: ch_annotator-v1_7_0
source_archived_at: '2025-11-06T08:32:03.951400+00:00'
statement_created_at: '2025-12-30T21:23:24.226782+00:00'
migration_note: Migrated from agent:claude-conversation on 2025-12-30 (ch_annotator.extraction_provenance)
annotation_provenance:
annotation_agent: opencode-claude-sonnet-4
annotation_date: '2025-12-06T21:13:56.173868+00:00'
annotation_method: retroactive CH-Annotator application via batch script
source_file: latin_american_institutions_AUTHORITATIVE.yaml
annotation_metadata:
confidence_score: 0.85
verified: false
verification_date: null
verified_by: null
entity_claims:
- claim_type: full_name
claim_value: FUNDAJ
property_uri: skos:prefLabel
provenance:
namespace: glam
path: /conversations/2025-09-22T14-40-15-0102c00a-4c0a-4488-bdca-5dd9fb94c9c5
agent: batch-script-create-custodian-from-ch-annotator
context_convention: ch_annotator-v1_7_0
source_archived_at: '2025-11-06T08:32:03.951400+00:00'
statement_created_at: '2025-12-30T21:23:24.226790+00:00'
migration_note: Migrated from agent:claude-conversation on 2025-12-30 (entity_claims[0].provenance)
confidence: 0.85
- claim_type: institution_type
claim_value: MIXED
property_uri: rdf:type
provenance:
namespace: glam
path: /conversations/2025-09-22T14-40-15-0102c00a-4c0a-4488-bdca-5dd9fb94c9c5
agent: batch-script-create-custodian-from-ch-annotator
context_convention: ch_annotator-v1_7_0
source_archived_at: '2025-11-06T08:32:03.951400+00:00'
statement_created_at: '2025-12-30T21:23:24.226792+00:00'
migration_note: Migrated from agent:claude-conversation on 2025-12-30 (entity_claims[1].provenance)
confidence: 0.95
- claim_type: located_in_city
claim_value: Recife
property_uri: schema:addressLocality
provenance:
namespace: glam
path: /conversations/2025-09-22T14-40-15-0102c00a-4c0a-4488-bdca-5dd9fb94c9c5
agent: batch-script-create-custodian-from-ch-annotator
context_convention: ch_annotator-v1_7_0
source_archived_at: '2025-11-06T08:32:03.951400+00:00'
statement_created_at: '2025-12-30T21:23:24.226793+00:00'
migration_note: Migrated from agent:claude-conversation on 2025-12-30 (entity_claims[2].provenance)
confidence: 0.9
- claim_type: ghcid
claim_value: BR-PE-REC-M-F
property_uri: glam:ghcid
provenance:
namespace: glam
path: /conversations/2025-09-22T14-40-15-0102c00a-4c0a-4488-bdca-5dd9fb94c9c5
agent: batch-script-create-custodian-from-ch-annotator
context_convention: ch_annotator-v1_7_0
source_archived_at: '2025-11-06T08:32:03.951400+00:00'
statement_created_at: '2025-12-30T21:23:24.226795+00:00'
migration_note: Migrated from agent:claude-conversation on 2025-12-30 (entity_claims[3].provenance)
confidence: 1.0
integration_note:
created_from: latin_american_institutions_AUTHORITATIVE_ch_annotator.yaml
creation_date: '2025-12-06T23:35:51.924216+00:00'
creation_method: create_custodian_from_ch_annotator.py
google_maps_status: NO_MATCH
google_maps_rejected:
candidate_name: Fundação Joaquim Nabuco Movie Theater
rejection_reason: 'NAME MATCH: Partial match. The candidate is a ''Movie Theater'' part of the ''Fundação Joaquim Nabuco''
institution. However, it is a sub-entity, not the parent institution itself, which is the target for annotation. LOCATION
MATCH: Match. Both are in the Recife metropolitan area, Brazil. TYPE MATCH: Mismatch. The Google Place type ''movie_theater''
is not an expected heritage institution type (museum, library, gallery, archive). ENTITY TYPE: REJECT. The specific entity
is a cinema, not a heritage custodian institution.'
timestamp: '2025-12-08T20:10:22.902908+00:00'
youtube_status: NOT_FOUND
youtube_search_query: FUNDAJ official
youtube_search_timestamp: '2025-12-08T20:10:23.237851+00:00'
location:
latitude: -8.0200442
longitude: -34.9364669
coordinate_provenance:
source_type: ORIGINAL_ENTRY
source_path: original_entry.locations[0]
city: Várzea
region: Pernambuco
region_code: PE
country: BR
postal_code: 55071-440
street_address: Rua Dois irmãos 92
geonames_id: 3385478
feature_code: PPL
normalization_timestamp: '2025-12-09T06:48:19.870119+00:00'
wikidata_enrichment:
wikidata_id: Q10286348
wikidata_url: https://www.wikidata.org/wiki/Q10286348
label: Joaquim Nabuco Foundation
description: historical-cultural preservation foundation in Recife, Brazil
enrichment_timestamp: '2025-01-13T00:00:00Z'
enrichment_method: manual_wikidata_lookup
identifiers:
VIAF: '140738855'
LCNAF: n82048151
official_website: http://www.fundaj.gov.br
_provenance:
content_hash:
algorithm: sha256
value: sha256-vNJ/OKWaztgg86Us/iemxY8secjZm/VGYx5gQ0aEUAU=
scope: enrichment_section
computed_at: '2025-12-28T19:57:36.431367+00:00'
prov:
wasGeneratedBy:
'@type': prov:Activity
name: wikidata_api_fetch
used: https://www.wikidata.org/w/rest.php/wikibase/v1
wasDerivedFrom: https://www.wikidata.org/wiki/Q10286348
generatedAtTime: '2025-01-13T00:00:00Z'
verification:
status: verified
last_verified: '2025-12-28T19:57:36.431372+00:00'
wikidata_entity_id: Q10286348