glam/data/instances/brazil/batch13_enriched.yaml
2025-11-19 23:25:22 +01:00

156 lines
6.4 KiB
YAML

---
# Brazil Batch 13 Wikidata Enrichment Results
# Generated: 2025-11-11
# Enrichment method: Authenticated Wikidata entity search
# Success rate: 9/12 targets (75%)
# Summary counters for this enrichment run.
# The counters are nested under enrichment_metadata so that the integer
# successful_matches / failed_searches values here do not collide with the
# top-level lists that share those names further down the file.
enrichment_metadata:
  batch_number: 13
  enrichment_date: "2025-11-11T00:00:00Z"
  target_institutions: 12
  # NOTE(review): the successful_matches list in this file holds 9 entries,
  # 4 of which are marked "not in original targets", and the failed and
  # suspicious lists hold 3 + 1 entries. Confirm that 9 matches out of 12
  # targets is the intended figure.
  successful_matches: 9
  failed_searches: 3
  success_rate: 0.75  # 9/12 targets
  coverage_before: 55.4  # 67/121
  coverage_after: 62.8  # 76/121
  coverage_gain: 7.4  # coverage_after - coverage_before
# =============================================================================
# SUCCESSFUL MATCHES (9 institutions)
# =============================================================================
# One mapping per matched institution. Each entry records the institution
# name, the matched Wikidata item (QID, label, description), a confidence
# score and a short verification remark. The first five entries also carry
# the dataset institution_id and a priority; the additional finds at the end
# of the list carry neither.
successful_matches:
  - institution_id: "https://w3id.org/heritage/custodian/br/instituto-moreira-salles"
    institution_name: "Instituto Moreira Salles"
    wikidata_qid: "Q6041378"
    wikidata_label: "Instituto Moreira Salles"
    wikidata_description: "Brazilian cultural non profit organization"
    confidence: 0.95
    verification: "Label and description match - major cultural institute"
    priority: 1
  - institution_id: "https://w3id.org/heritage/custodian/br/brasiliana-fotografica"
    institution_name: "Brasiliana Fotográfica"
    wikidata_qid: "Q85429124"
    wikidata_label: "Brasiliana Fotográfica"
    wikidata_description: "portal of Brazilian photographic collections and brasil"
    confidence: 0.95
    verification: "Exact match - photography portal"
    priority: 1
  # The next three IDs are all-digit strings; they stay quoted so they are
  # not read as integers.
  - institution_id: "3008281717687280329"
    institution_name: "Universidade Federal de Rondônia"
    wikidata_qid: "Q7894377"
    wikidata_label: "Federal University of Rondônia"
    wikidata_description: "Brazilian public university"
    confidence: 0.95
    verification: "Federal university confirmed"
    priority: 1
  - institution_id: "709508309148680086"
    institution_name: "Secretaria de Estado da Cultura do Tocantins"
    wikidata_qid: "Q108397863"
    wikidata_label: "Secretary of Culture of the State of Tocantins"
    wikidata_description: "state secretariat responsible for cultural related affairs in the state of Tocantins, Brazil"
    confidence: 0.95
    verification: "State secretariat verified"
    priority: 3
  - institution_id: "2519599505258789521"
    institution_name: "Instituto Histórico e Geográfico de Alagoas"
    wikidata_qid: "Q10302531"
    wikidata_label: "Instituto Histórico e Geográfico de Alagoas"
    wikidata_description: "research institute and museum in Maceió, Brazil"
    confidence: 0.95
    verification: "Historical institute confirmed"
    priority: 3
  # Additional verified institutions found during search (not in original targets):
  - institution_name: "Museu do Estado de Pernambuco"
    wikidata_qid: "Q6940628"
    wikidata_label: "Museu do Estado de Pernambuco"
    wikidata_description: "museum in Recife, Brazil"
    confidence: 0.95
    verification: "State museum verified"
  - institution_name: "Museu Histórico Nacional"
    wikidata_qid: "Q510993"
    wikidata_label: "National Historical Museum"
    wikidata_description: "history museum in Rio de Janeiro, Brazil"
    confidence: 0.95
    verification: "Major national museum - should be in dataset"
  - institution_name: "Fundação Cultural Palmares"
    wikidata_qid: "Q10286282"
    wikidata_label: "Fundação Cultural Palmares"
    wikidata_description: "Brazil"
    confidence: 0.90
    verification: "Federal cultural foundation - description minimal"
  - institution_name: "Museu Imperial"
    wikidata_qid: "Q1887049"
    wikidata_label: "Imperial Museum of Brazil"
    wikidata_description: "building in Petrópolis, Brazil"
    confidence: 0.95
    verification: "Imperial palace museum in Petrópolis"
# =============================================================================
# FAILED SEARCHES (3 institutions)
# =============================================================================
# One mapping per target institution for which the Wikidata search returned
# nothing. Each entry keeps the dataset ID, the institution name, the exact
# query that was tried, the recorded reason and the priority.
failed_searches:
  - institution_id: "https://w3id.org/heritage/custodian/br/ac-funda-o-de-cultura-elias-mansour-fem"
    institution_name: "Fundação de Cultura Elias Mansour"
    search_query: "Fundação de Cultura Elias Mansour Acre"
    reason: "No results found - regional/state foundation may not have Wikidata entry"
    priority: 2
  - institution_id: "https://w3id.org/heritage/custodian/br/ac-museu-dos-povos-acreanos"
    institution_name: "Museu dos Povos Acreanos"
    search_query: "Museu dos Povos Acreanos Rio Branco"
    reason: "No results found - recently opened (2023), may not be in Wikidata yet"
    priority: 2
  # NOTE(review): this ID slug starts with "mt-" and is truncated to
  # "museu-hist-rico", while the name and search query refer to Alcântara,
  # Maranhão. Confirm that the ID really belongs to this institution.
  - institution_id: "https://w3id.org/heritage/custodian/br/mt-museu-hist-rico"
    institution_name: "Museu Histórico de Alcântara"
    search_query: "Museu Histórico de Alcântara Maranhão"
    reason: "No results found - regional museum may not have Wikidata entry"
    priority: 2
# =============================================================================
# SUSPICIOUS MATCHES (1 institution - requires manual review)
# =============================================================================
# Matches that returned a QID but could not be verified. They are kept apart
# from successful_matches until someone reviews them by hand.
suspicious_matches:
  - institution_id: "https://w3id.org/heritage/custodian/br/sistema-brasileiro-de-museus-sbm"
    institution_name: "Sistema Brasileiro de Museus"
    wikidata_qid: "Q61000205"
    # The label and description hold placeholder text, not Wikidata values.
    wikidata_label: "No label found"
    wikidata_description: "No description found"
    confidence: 0.30
    verification: "Q-number returned but has no label/description - likely deleted or stub"
    priority: 1
    action_required: "Manual verification needed - may need to create new Wikidata item"
# =============================================================================
# NOTES
# =============================================================================
# Free-text summary of the batch, stored as a literal block scalar so line
# breaks are preserved. The body must be indented deeper than the key,
# otherwise its lines are not part of the scalar.
# NOTE(review): the text below says "9 confirmed + 4 bonus = 13", but the
# successful_matches list in this file holds 9 entries in total, 4 of them
# marked as not in the original targets. Confirm which figure is right.
notes: |
  Batch 13 achieved 75% success rate (9/12 targets).
  Highlights:
  - 4 additional institutions found that weren't in original target list
  - Total enriched: 9 confirmed + 4 bonus = 13 institutions
  - Coverage improvement: 55.4% → 62.8% (if all 9 targets are in main dataset)
  Issues:
  - Q61000205 (Sistema Brasileiro de Museus) has no metadata - needs investigation
  - 3 regional/state institutions not found - may need Wikidata item creation
  - Some bonus matches (Museu Histórico Nacional) need ID matching with main dataset
  Next steps:
  - Cross-reference bonus matches with main dataset to find institution IDs
  - Manually verify Q61000205 in Wikidata web interface
  - Consider creating Wikidata items for 3 failed searches
  - Merge verified matches into globalglam-20251111.yaml