# glam/data/custodian/US-XX-SFO-D-PDL.yaml
# kempersc eb122e2532 data(custodian): remove 380 PENDING files after collision merge
# PENDING files were merged into existing custodian records in commit eaf80ec.
# These temporary collision placeholder files are no longer needed.
# 2026-01-09 21:06:22 +01:00
#
# 45 lines
# 1.6 KiB
# YAML

# Custodian record for "Public Domain Library" (GHCID US-XX-SFO-D-PDL).
# NOTE(review): the nesting below was rebuilt from a copy whose indentation
# had been stripped; grouping is inferred from the key names. Confirm against
# the custodian schema before relying on it.
ghcid_current: US-XX-SFO-D-PDL
custodian_name:
  emic_name: Public Domain Library
  english_name: null
  name_verified: true
  name_source: linkedin_html_h1
# NOTE(review): assumed to be a top-level key rather than a member of
# custodian_name - TODO confirm.
institution_type: MUSEUM
staff:
  provenance:
    source_type: linkedin_company_people_page_html
    registered_timestamp: '2025-12-30T10:17:19Z'
    registration_method: html_parsing_with_full_staff_data
    total_staff_extracted: 1
  staff_list:
    # NOTE(review): staff_id and person_name say "Simon Kemper", but the
    # profile path, URL and slug all refer to "ruiguerracv" - verify which
    # identity is correct.
    - staff_id: public-domain-library_staff_0001_simon_kemper
      person_name: Simon Kemper
      person_profile_path: data/custodian/person/entity/ruiguerracv_*.json
      role_title: Research Services
      heritage_relevant: true
      heritage_type: R
      linkedin_profile_url: https://www.linkedin.com/in/ruiguerracv
      linkedin_slug: ruiguerracv
linkedin_enrichment:
  source_file: (29) Public Domain Library_ People _ LinkedIn.html
  extraction_date: '2025-12-30T10:17:19Z'
  # Kept as a quoted string, exactly as recorded.
  follower_count: '886'
  associated_members: 1
  profile_cards_detected: 6
  source_type: linkedin_company_people_page_html
  extraction_method: html_parsing_with_full_staff_data
provenance:
  data_source: LINKEDIN_HTML_PEOPLE_PAGE
  data_tier: TIER_4_INFERRED
  extraction_date: '2025-12-30T10:17:19.121662+00:00'
  # Folded block scalar: the lines join with single spaces, no trailing newline.
  extraction_method: >-
    Comprehensive batch processing with H1 name extraction and full
    staff data
  confidence_score: 0.9
  # NOTE(review): the text still says location research is needed, although
  # location and ghcid_resolution are populated below - possibly stale.
  notes: >-
    Staff extracted from LinkedIn company People page. H1 name used: Public
    Domain Library. Total staff: 1. Location research needed for GHCID.
location:
  city: San Francisco
  country: US
ghcid_resolution:
  method: known_organization_database
  resolved_at: '2026-01-09T19:47:18.522827+00:00'