# glam/schemas/20251121/linkml/modules/classes/Provenance.yaml
# 2026-01-16 12:50:50 +01:00
#
# 113 lines
# 3.5 KiB
# YAML

# Provenance - A single provenance statement tracking the origin and lineage of data
# Distinct from ProvenanceBlock which bundles multiple provenance sources
# Created per slot_fixes.yaml migration for: binding_provenance, xpath, type_hypothesis
# Creation date: 2026-01-14
# Schema identity: canonical URI, machine-readable name, and display title.
id: https://nde.nl/ontology/hc/classes/Provenance
name: Provenance
title: Provenance

# Prefix map for the CURIEs used in this module (e.g. `prov:`, `dct:`, `schema:`).
prefixes:
  linkml: https://w3id.org/linkml/
  hc: https://nde.nl/ontology/hc/
  prov: http://www.w3.org/ns/prov#
  dct: http://purl.org/dc/terms/
  schema: http://schema.org/
  xsd: http://www.w3.org/2001/XMLSchema#

# LinkML built-in types, plus one module per slot listed under the
# Provenance class's `slots`.
imports:
  - linkml:types
  - ../slots/has_or_had_agent
  - ../slots/temporal_extent
  - ../slots/confidence_score

# Range assumed for any slot or attribute that does not declare its own.
default_range: string
classes:
  # A single provenance statement, modelled as a prov:Activity.
  Provenance:
    # Literal block scalar (|-): the Markdown headings and bullet lists below
    # must keep their line breaks. A folded scalar (>-) would join every
    # adjacent line with a space and collapse each list into one line.
    description: |-
      A single provenance statement describing the origin, lineage, or derivation
      of a piece of data.

      **DISTINCTION FROM ProvenanceBlock**:

      - `Provenance` represents a SINGLE provenance statement (one source, one activity)
      - `ProvenanceBlock` bundles MULTIPLE provenance sources together

      Use `Provenance` when:

      - Tracking provenance of individual data elements
      - Recording specific extraction or transformation activities
      - Linking data to its source agent/entity

      **ONTOLOGY MAPPING**:

      - class_uri: prov:Activity (the extraction/derivation activity)
      - Links to prov:Agent via has_or_had_agent
      - Links to prov:Entity via source_entity (prov:used) and generated_entity (prov:generated)
    class_uri: prov:Activity
    close_mappings:
      - dct:ProvenanceStatement
      - schema:Action
    related_mappings:
      - prov:Entity
      - prov:Derivation

    # Shared slots; each one comes from a module in the schema-level `imports`.
    slots:
      - has_or_had_agent
      - temporal_extent
      - confidence_score

    # Attributes declared inline, i.e. local to this class.
    attributes:
      source_entity:
        range: uriorcurie
        description: >-
          URI of the source entity from which data was derived (prov:used).
        slot_uri: prov:used
      generated_entity:
        range: uriorcurie
        description: >-
          URI of the entity generated by this provenance activity (prov:generated).
        slot_uri: prov:generated
      extraction_method:
        range: string
        description: >-
          Method or process used to extract/derive the data.
          Examples: "xpath_extraction", "api_query", "manual_entry"
      note:
        range: string
        description: >-
          Human-readable note about this provenance statement.
        slot_uri: prov:value

    # Project annotations. Values stay quoted: `custodian_types` holds a
    # JSON-style list as a string, and a bare `*` would be read as a YAML alias.
    annotations:
      custodian_types: '["*"]'
      custodian_types_rationale: >-
        Provenance tracking is universal across all custodian types.
      custodian_types_primary: "*"
      specificity_score: 0.15
      specificity_rationale: >-
        Very low specificity - provenance metadata applies universally.

    # Each `value` is a literal block holding an example instance as YAML text.
    examples:
      - value: |
          Provenance:
            extraction_method: "xpath_extraction"
            source_entity: "https://example.org/webpage/12345"
            confidence_score: 0.95
            note: "Extracted from archived HTML using XPath"
        description: >-
          Provenance for an XPath-extracted value from an archived webpage.
      - value: |
          Provenance:
            has_or_had_agent:
              agent_type: "software"
              name: "glam-extractor-v2.1"
            extraction_method: "api_scraping"
            confidence_score: 0.85
        description: >-
          Provenance for API-scraped data with agent identification.