glam/data/person/ID_XX-XX-XXX_196X_XX-XX-XXX_XXXX_ANCA-EGAS.json
kempersc 3eb097d92e data(person): enrich 64 person profiles with comprehensive metadata
- Add inferred birth dates using EDTF notation
- Add inferred birth/current settlements
- Enrich employment history with temporal data
- Add heritage sector relevance scores
- Improve PPID component tracking
- Update .gitignore with large file patterns (warc, nt, trix, geonames.db)
2026-01-11 00:38:09 +01:00

250 lines
No EOL
8.4 KiB
JSON

{
"ppid": "ID_XX-XX-XXX_196X_XX-XX-XXX_XXXX_ANCA-EGAS",
"ppid_type": "ID",
"ppid_components": {
"type": "ID",
"first_location": "XX-XX-XXX",
"first_date": "196X",
"last_location": "XX-XX-XXX",
"last_date": "XXXX",
"name_tokens": [
"ANCA",
"EGAS"
],
"first_date_source": "inferred_birth_decade.primary_value",
"first_date_alternatives": [
"197X"
]
},
"name": {
"full_name": "Anca Egas",
"display_name": "Anca Egas",
"name_romanized": null,
"name_tokens": [
"ANCA",
"EGAS"
],
"source": "linkedin_profile"
},
"birth_date": {
"edtf": "XXXX",
"precision": "unknown",
"note": "See inferred_birth_decade for heuristic estimate"
},
"is_living": true,
"heritage_relevance": {
"is_heritage_relevant": true,
"heritage_types": [
"M"
],
"rationale": "Identified as heritage staff at Nederlands Openluchtmuseum"
},
"affiliations": [],
"profile_data": {
"name": "Anca Egas",
"linkedin_url": "https://www.linkedin.com/in/anca-egas-4b81355",
"headline": "curator at The Open Air Museum",
"location": "",
"connections": "155 connections • 155 followers",
"about": "Total Experience: 35 years and 5 months",
"experience": [
{
"title": "Curator",
"company": "The Open Air Museum (Current)"
},
{
"title": "Conservator Projectleider",
"company": "Dutch Open Air Museum Arnhem (Current)",
"date_range": "Jan 1992 - Present • 33 years and 2 months"
},
{
"title": "Curator And Project Leader",
"company": "Nederlands Openlucht Museum",
"date_range": "Jan 1992 - Present • 33 years and 9 months"
},
{
"title": "Curator Leader Of Projects",
"company": "Nederlands Openluchtmuseum",
"date_range": "Jan 1992 - Present • 33 years and 9 months"
},
{
"title": "Conservator Project Leider",
"company": "Nederlands Openluchtmuseum",
"date_range": "Jan 1991 - Present • 34 years and 9 months"
}
],
"education": [],
"skills": [
"projects"
],
"languages": [],
"profile_image_url": "https://static.licdn.com/aero-v1/sc/h/9c8pery4andzj6ohjkjp54ma2"
},
"web_claims": [
{
"claim_type": "position",
"claim_value": {
"title": "curator",
"organization": "The Open Air Museum",
"year": null
},
"provenance": {
"statement_created_at": "2026-01-10T23:07:14.646896+00:00",
"source_archived_at": "2026-01-10T23:07:10.952954+00:00",
"retrieval_agent": "enrich_person_comprehensive.py v1.1.1",
"retrieval_method": "linkup_web_search",
"api_endpoint": "https://api.linkup.so/v1/search",
"search_query": "\"Anca Egas\" curator at The Open Air Museum education career university",
"search_depth": "standard",
"source_url": "https://www.linkedin.com/company/association-of-academic-museums-and-galleries",
"source_title": "Association of Academic Museums and Galleries | LinkedIn",
"source_snippet": "bout Anca Egas as a curator at The Open Air Museum or details about her education or university career",
"extraction_method": "regex_pattern_matching",
"pattern_type": "position",
"verified": false,
"verification_status": "machine_extracted",
"requires_human_review": true,
"http_status": 200,
"answer_position": "answer[38:140]",
"all_sources": [
{
"url": "https://www.linkedin.com/company/association-of-academic-museums-and-galleries",
"name": "Association of Academic Museums and Galleries | LinkedIn"
},
{
"url": "https://www.artcurators.org/networking/opening_search.asp",
"name": "Career Center - Search for Openings - AAMC & AAMC Foundation"
},
{
"url": "https://www.aamg-us.org/category/general-announcement/jobs/",
"name": "Job Postings Archives - Association of Academic Museums and Galleries"
},
{
"url": "https://www.artcurators.org/networking/",
"name": "Career Center - AAMC & AAMC Foundation"
},
{
"url": "https://www.purdue.edu/science/careers/what_can_i_do_with_a_major/Career%20Pages/museum_curator.html",
"name": "Museum Curator - College of Science - Purdue University"
}
],
"source_count": 20,
"answer_content_hash": "0d1b56e640cf4cc9"
}
}
],
"source_observations": [
{
"source_file": "/Users/kempersc/apps/glam/data/custodian/person/entity/anca-egas-4b81355_20251214T110559Z.json",
"observed_on": "2025-12-14T11:05:59.036496+00:00",
"extraction_agent": "claude-sonnet-4-20250514"
}
],
"enrichment_metadata": {
"birth_date_search": {
"attempted": false,
"notes": "Not yet searched - requires manual enrichment"
}
},
"provenance": {
"created_at": "2026-01-09T17:29:48.668865+00:00",
"created_by": "generate_ppids.py",
"source_files": [
"/Users/kempersc/apps/glam/data/custodian/person/entity/anca-egas-4b81355_20251214T110559Z.json"
],
"modified_at": "2026-01-09T19:51:05.598427+00:00",
"modified_by": "enrich_ppids.py"
},
"linkedin_slug": "anca-egas-4b81355",
"ppid_history": [
{
"previous_ppid": "ID_XX-XX-XXX_XXXX_XX-XX-XXX_XXXX_ANCA-EGAS",
"new_ppid": "ID_XX-XX-XXX_196X_XX-XX-XXX_XXXX_ANCA-EGAS",
"changed_at": "2026-01-09T17:43:04.859441+00:00",
"reason": "observation_based_inference",
"inferred_fields": [
"inferred_birth_decade"
]
}
],
"inferred_birth_decade": {
"values": [
"196X",
"197X"
],
"edtf": "[196X,197X]",
"edtf_meaning": "one of: 1960s or 1970s",
"precision": "decade_set",
"primary_value": "196X",
"primary_rationale": "1968 is in 196X, but range extends into 197X",
"confidence": "very_low",
"inference_provenance": {
"method": "earliest_experience_heuristic",
"inference_chain": [
{
"step": 1,
"observation": "First job record found (no education data)",
"source_field": "profile_data.experience",
"source_value": {
"company": "Nederlands Openluchtmuseum",
"title": "Conservator Project Leider",
"date_range": "Jan 1991 - Present • 34 years and 9 months"
}
},
{
"step": 2,
"extraction": "Start year extracted from date_range",
"extracted_value": 1991
},
{
"step": 3,
"assumption": "First job age is approximately 23 (±5 years)",
"rationale": "Assumes first job after typical university completion",
"confidence_impact": "Higher uncertainty; first job age varies ±5 years"
},
{
"step": 4,
"calculation": "1991 - 23 = 1968",
"result": "Estimated birth year: 1968",
"range": "1963-1973 (accounting for ±5 year variance)"
},
{
"step": 5,
"generalization": "Birth year range spans decade boundary",
"input_range": [
1963,
1973
],
"output": [
"196X",
"197X"
],
"edtf": "[196X,197X]",
"rationale": "Cannot determine which decade with certainty; using EDTF 'one of' set notation"
}
],
"assumptions": [
"Entry age for education/first job: 23 years (±5)",
"Career records are complete in LinkedIn profile"
],
"boundary_note": "Birth year range 1963-1973 (point estimate 1968) spans decades 196X/197X",
"inferred_at": "2026-01-09T19:51:05.598410+00:00",
"inferred_by": "enrich_ppids.py"
}
},
"enrichment_history": [
{
"enrichment_timestamp": "2026-01-10T23:07:06.345737+00:00",
"enrichment_agent": "enrich_person_comprehensive.py v1.1.1",
"person_name": "Anca Egas",
"context_used": "curator at The Open Air Museum",
"searches_performed": [
"\"Anca Egas\" born biography",
"\"Anca Egas\" curator at The Open Air Museum education career university",
"\"Anca Egas\" publications awards honors books",
"\"Anca Egas\" contact email twitter linkedin orcid profile photo"
],
"data_fabrication_check": "PASSED"
}
]
}