glam/schemas/20251121/linkml/modules/enums/ProfileExtractionMethodEnum.yaml
2026-01-08 15:56:28 +01:00

46 lines
1.7 KiB
YAML

# LinkML schema module that declares a single enumeration,
# ProfileExtractionMethodEnum (see the `enums` section of this file).
id: https://nde.nl/ontology/hc/enum/ProfileExtractionMethodEnum
name: profile_extraction_method_enum
title: Profile Extraction Method Enum
version: 1.0.0

# CURIE prefix expansions. `schema` and `prov` are the prefixes used by the
# `meaning` mappings of the permissible values; `hc` is also the default
# prefix declared below.
prefixes:
  linkml: https://w3id.org/linkml/
  hc: https://nde.nl/ontology/hc/
  schema: http://schema.org/
  prov: http://www.w3.org/ns/prov#

imports:
  - linkml:types

default_prefix: hc
enums:
  # Closed vocabulary of extraction methods/tools. Every permissible value
  # has a human-readable `description` and a `meaning` CURIE; the `schema:`
  # and `prov:` prefixes are declared in this file's `prefixes` section.
  ProfileExtractionMethodEnum:
    description: |
      Enumeration of extraction methods/tools used for person profile data extraction.
      Used for LinkedIn profiles, web scraping of staff pages, and similar person data sources.
    permissible_values:
      # --- Exa-based extraction ---
      # NOTE(review): the name repeats "exa"; presumably it parallels
      # `exa_crawling_glm47` (crawler + processing step) - confirm before
      # relying on that reading. The key is kept as-is because existing data
      # may reference it.
      exa_crawling_exa:
        description: Exa AI crawling API - primary LinkedIn extraction
        meaning: schema:SoftwareApplication
      exa_contents:
        description: Exa contents endpoint - cached content retrieval
        meaning: schema:SoftwareApplication
      exa_crawling_glm47:
        description: Exa crawling with GLM 4.7 processing
        meaning: schema:SoftwareApplication

      # --- Local / manual processing ---
      linkedin_html_parser:
        description: Local HTML parsing of saved LinkedIn pages
        meaning: schema:SoftwareApplication
      # The only value mapped to prov:Person instead of
      # schema:SoftwareApplication.
      # NOTE(review): this `meaning` names the kind of agent doing the work
      # rather than the method itself - confirm that is the intended mapping.
      manual:
        description: Manual data entry by human operator
        meaning: prov:Person

      # --- Web scraping / browser automation / archives ---
      firecrawl:
        description: Firecrawl web scraping service
        meaning: schema:SoftwareApplication
      playwright:
        description: Playwright browser automation
        meaning: schema:SoftwareApplication
      web_archive:
        description: Internet Archive Wayback Machine
        meaning: schema:SoftwareApplication
      institutional_website:
        description: Direct scraping from institutional website
        meaning: schema:SoftwareApplication