glam/schemas/20251121/linkml/modules/classes/ConnectionSourceMetadata.yaml
kempersc 86a627fcb7 Update schemas and mappings in LinkML files
- Updated the generated timestamp in manifest.json.
- Modified imports in AccessPolicy.yaml, Activity.yaml, ApplicantRequirement.yaml, ConfidenceMeasure.yaml, ConnectionNetwork.yaml, ConnectionSourceMetadata.yaml, CurrentArchiveRecordSetType.yaml, CustodianArchiveRecordSetType.yaml, CustodianLegalNameClaim.yaml, CustodianNameConsensus.yaml, DarkArchiveRecordSetType.yaml, DepositArchiveRecordSetType.yaml, DigitalArchiveRecordSetType.yaml, DigitalPlatform.yaml, DimArchivesRecordSetType.yaml, DiocesanArchiveRecordSetType.yaml, Expenses.yaml, FindingAid.yaml, Label.yaml, PaymentMethod.yaml, PersonalCollectionType.yaml, Policy.yaml, Provenance.yaml, ProvenanceBlock.yaml, StorageConditionPolicy.yaml, TaxScheme.yaml, TransferPolicy.yaml, UnspecifiedType.yaml, WebPortal.yaml to reflect new slot names and remove deprecated ones.
- Enhanced ontology alignment in analyze.yaml, categorized_as.yaml, collect.yaml, has_activity.yaml, has_annotation.yaml, has_name.yaml, has_note.yaml, has_subject.yaml, has_title.yaml, and identified_by.yaml with additional mappings and clarifications.
2026-02-09 09:20:55 +01:00

121 lines
3.8 KiB
YAML

# Schema identity for the ConnectionSourceMetadata class module.
id: 'https://nde.nl/ontology/hc/class/ConnectionSourceMetadata'
name: connection_source_metadata_class
title: Connection Source Metadata Class
version: '1.0.0'

# CURIE prefix -> namespace IRI expansions usable in this module.
# IRIs are quoted so trailing '#' and '/' characters are never re-interpreted.
prefixes:
  linkml: 'https://w3id.org/linkml/'
  hc: 'https://nde.nl/ontology/hc/'
  schema: 'http://schema.org/'
  prov: 'http://www.w3.org/ns/prov#'
  # dct and dcterms both expand to the same Dublin Core Terms namespace.
  dct: 'http://purl.org/dc/terms/'
  dcterms: 'http://purl.org/dc/terms/'
  crm: 'http://www.cidoc-crm.org/cidoc-crm/'
  skos: 'http://www.w3.org/2004/02/skos/core#'
  rdfs: 'http://www.w3.org/2000/01/rdf-schema#'
  org: 'http://www.w3.org/ns/org#'
  xsd: 'http://www.w3.org/2001/XMLSchema#'
imports:
- linkml:types
- ../enums/ScrapeMethodEnum
- ../slots/20260202_matang/new/connections_extracted
- ../slots/20260202_matang/has_label
- ../slots/20260202_matang/has_profile
- ../slots/20260202_matang/has_score
- ../slots/20260202_matang/has_note
- ../slots/20260202_matang/new/scrape_method
- ../slots/20260202_matang/new/scraped_timestamp
- ../slots/20260202_matang/new/source_url
default_prefix: hc

classes:
  # Provenance record for one connection-extraction run, modelled as a
  # PROV-O Activity (class_uri and exact_mappings both point at prov:Activity).
  ConnectionSourceMetadata:
    class_uri: prov:Activity
    # Literal block scalar: keeps the Markdown bullet lists on separate lines
    # instead of folding them into a single run-on sentence.
    description: |
      Provenance metadata about how the connections were extracted.

      Records the extraction context including:
      - Source URL (LinkedIn search or profile page)
      - When the extraction occurred
      - Which method was used (manual browse, automated scrape)
      - Target profile being analyzed
      - Count of connections extracted

      **Scrape Methods**:
      - manual_linkedin_browse: Manual copy-paste while logged in
      - linkedin_html_parser: Parsed from saved HTML file
      - exa_search: Extracted via Exa API
    exact_mappings:
    - prov:Activity

    # Every slot listed here must be brought in by this file's imports.
    # The imports provide has_note (no bare `note` slot is imported), so the
    # note slot is referenced under its imported name.
    slots:
    - connections_extracted
    - has_note
    - scrape_method
    - scraped_timestamp
    - source_url
    - has_label
    - has_profile
    - has_score

    slot_usage:
      # Page the connections were taken from.
      source_url:
        range: uri
        required: true
        examples:
        - value: https://www.linkedin.com/search/results/people/?network=%5B%22F%22%2C%22S%22%2C%22O%22%5D

      # Moment of extraction; quoted so it stays a string rather than being
      # auto-typed by the YAML loader.
      scraped_timestamp:
        range: datetime
        required: true
        examples:
        - value: '2025-12-09T22:00:00Z'

      # How the data was obtained. The example is one of the methods named in
      # the class description.
      # NOTE(review): confirm the exact permissible-value spelling against
      # ScrapeMethodEnum.
      scrape_method:
        range: ScrapeMethodEnum
        required: true
        examples:
        - value: manual_linkedin_browse

      has_label:
        # range: string
        inlined: false  # Fixed invalid inline for primitive type
        required: true
        examples:
        - value: "Label:\n label_value: \"Giovanna Fossati\"\n label_type: \"person_name\"\n"

      # Profile whose connections were analyzed.
      # NOTE(review): SocialMediaProfile is not imported directly by this
      # module; presumably it is reachable through the has_profile slot
      # import - confirm.
      has_profile:
        range: SocialMediaProfile
        inlined: true
        required: true
        examples:
        - value:
            social_media_profile_id: https://nde.nl/ontology/hc/social-media/giovanna-fossati-linkedin
            platform_type: LINKEDIN
            profile_url: https://www.linkedin.com/in/giovanna-fossati-12345/
            refers_to_custodian: https://nde.nl/ontology/hc/nl-nh-ams-m-efm
        - value:
            social_media_profile_id: https://nde.nl/ontology/hc/social-media/alexandr-belov-linkedin
            platform_type: LINKEDIN
            profile_url: https://www.linkedin.com/in/alexandr-belov-bb547b46/

      # Number of connections captured; cannot be negative.
      connections_extracted:
        range: integer
        required: true
        minimum_value: 0
        examples:
        - value: 776

      # Optional free-text remark about the extraction run.
      has_note:
        # range: string
        examples:
        - value: Raw scrape in giovannafossati_connections_20251209T220000Z_note-max100p-1st2nd3th.md

    comments:
    - Aligns with PROV-O Activity pattern
    - scraped_timestamp maps to prov:endedAtTime
    - has_profile links to SocialMediaProfile representing the LinkedIn profile analyzed

    annotations:
      specificity_score: 0.1
      specificity_rationale: Generic utility class/slot created during migration
      # Kept as a quoted string exactly as authored (a stringified list).
      custodian_types: "['*']"