glam/data/custodian/h1_sample/.yaml
2025-12-30 03:43:31 +01:00

23 lines
913 B
YAML
Raw Blame History

This file contains ambiguous Unicode characters

This file contains Unicode characters that might be confused with other characters. If you think that this is intentional, you can safely ignore this warning. Use the Escape button to reveal them.

---
# Custodian record produced by H1-only name extraction from a saved LinkedIn
# "People" page.
#
# NOTE(review): the nesting below was reconstructed. In the flattened form the
# three parent keys (custodian_name, linkedin_enrichment, provenance) had no
# value and `extraction_date` / `extraction_method` each appeared twice at the
# same level, which is a duplicate-key error. Confirm the grouping against the
# generating script or the record schema.

# NOTE(review): the identifier ends with a trailing hyphen; presumably the
# name-derived suffix came out empty. Verify before this ID is referenced.
ghcid_current: NL-XX-XXX-PENDING-

custodian_name:
  # The name is written with Unicode "Mathematical Monospace" letters, not
  # ASCII; plain-text search for "Artist Open Calls" will not match it.
  # NOTE(review): consider whether an NFKC-normalised form should be stored.
  emic_name: 𝙰𝚛𝚝𝚒𝚜𝚝 𝙾𝚙𝚎𝚗 𝙲𝚊𝚕𝚕𝚜
  english_name: null
  name_verified: true
  name_source: linkedin_html_h1

# NOTE(review): nothing else in this record supports the MUSEUM
# classification (zero profile cards, H1-only extraction) - confirm.
institution_type: MUSEUM

linkedin_enrichment:
  # File name of the saved HTML page; must stay byte-identical to the file on
  # disk, including the styled Unicode letters.
  source_file: (16) 𝙰𝚛𝚝𝚒𝚜𝚝 𝙾𝚙𝚎𝚗 𝙲𝚊𝚕𝚕𝚜_ People _ LinkedIn.html
  extraction_date: '2025-12-29T02:23:17Z'
  # Parses as the string "103K", not an integer.
  follower_count: 103K
  associated_members: 0
  profile_cards_detected: 0
  source_type: linkedin_company_people_page_html
  extraction_method: h1_name_extraction_only

provenance:
  data_source: LINKEDIN_HTML_PEOPLE_PAGE
  data_tier: TIER_4_INFERRED
  extraction_date: '2025-12-29T02:23:17Z'
  extraction_method: Fast H1 name extraction
  # NOTE(review): 0.9 is high for TIER_4_INFERRED data - confirm.
  confidence_score: 0.9
  # Quoted multi-line scalar: the line break folds to a single space.
  notes: 'H1 institution name extracted from HTML. Profile cards detected: 0. Detailed
    staff extraction not performed due to performance constraints.'