# - Apply Rule 39: RiC-O style hasOrHad*/isOrWas* for temporal slots
# - Apply Rule 43: Singular noun convention (keywords → keyword)
# - Update slot references to match renamed slot files
# - Maintain schema integrity across all class definitions
#
# 105 lines, 2.9 KiB, YAML
# Schema module that declares the FindingAidProvenance class.
id: https://nde.nl/ontology/hc/class/FindingAidProvenance
name: finding_aid_provenance_class
title: FindingAidProvenance Class

# CURIE prefixes referenced by the URIs and mappings in this module.
prefixes:
  linkml: https://w3id.org/linkml/
  hc: https://nde.nl/ontology/hc/
  prov: http://www.w3.org/ns/prov#
  schema: http://schema.org/
default_prefix: hc
# Fallback range for any slot that does not declare its own.
default_range: string

imports:
  - linkml:types
  - ../metadata
  # Class modules; their names match the ranges used in slot_usage
  # (SpecificityAnnotation, TemplateSpecificityScores).
  - ./SpecificityAnnotation
  - ./TemplateSpecificityScores
  # Slot modules, one per slot listed on the class.
  - ../slots/extraction_method
  - ../slots/extraction_note
  - ../slots/retrieval_agent
  - ../slots/source_url
  - ../slots/note
  - ../slots/claims_count
  - ../slots/crawler_version
  - ../slots/date_retrieved
  - ../slots/html_snapshot_path
  - ../slots/specificity_annotation
  - ../slots/template_specificity
  - ../slots/validation_status

classes:
  # Provenance record for web-harvested finding aid metadata, typed as a
  # prov:Activity.
  FindingAidProvenance:
    class_uri: prov:Activity
    description: |
      Provenance metadata for web-harvested finding aid information.

      Tracks when and how the metadata was retrieved, enabling data freshness
      assessment and re-crawling decisions.
    slots:
      - claims_count
      - crawler_version
      - date_retrieved
      - extraction_method
      - extraction_note
      - html_snapshot_path
      - note
      - retrieval_agent
      - source_url
      - specificity_annotation
      - template_specificity
      - validation_status
    # Class-local refinements of the slots listed above.
    slot_usage:
      # The only two slots marked required on this class.
      date_retrieved:
        description: ISO 8601 date when data was retrieved
        range: date
        required: true
      retrieval_agent:
        description: Tool/method used for retrieval
        required: true
      source_url:
        description: Original source URL
        range: uri
      extraction_note:
        description: Notes about extraction process or quality
      # The values named in this description are not enforced by an enum
      # here; the range falls back to default_range (string).
      extraction_method:
        description: Method used (manual, automated, hybrid)
      crawler_version:
        description: Version of crawling tool used
      html_snapshot_path:
        description: Relative path to archived HTML snapshot
      claims_count:
        description: Number of web claims extracted
        range: integer
      # Same as extraction_method: statuses are listed in prose only.
      validation_status:
        description: Status of validation (validated, pending, failed)
      note:
        description: Additional provenance notes or remarks
      # Class-valued slots are embedded in the parent object rather than
      # referenced.
      specificity_annotation:
        range: SpecificityAnnotation
        inlined: true
      template_specificity:
        range: TemplateSpecificityScores
        inlined: true
    # Repeats the class_uri above as an explicit mapping.
    exact_mappings:
      - prov:Activity

# Slot definitions local to this module.
# NOTE(review): each slot below shares its name with a module imported from
# ../slots/ (claims_count, crawler_version, date_retrieved,
# html_snapshot_path, validation_status). If those modules define the same
# slots, the definitions here may conflict with or shadow them -- confirm
# which copy is meant to be authoritative.
slots:
  date_retrieved:
    slot_uri: prov:endedAtTime
    description: Date when data was retrieved
    range: date
  # NOTE(review): PROV-O declares prov:wasAssociatedWith with range
  # prov:Agent, while this slot holds a string -- confirm the mapping.
  crawler_version:
    slot_uri: prov:wasAssociatedWith
    description: Version of crawler used
    range: string
  # NOTE(review): PROV-O declares prov:used with range prov:Entity, while
  # this slot holds a string path -- confirm the mapping.
  html_snapshot_path:
    slot_uri: prov:used
    description: Path to HTML snapshot
    range: string
  claims_count:
    slot_uri: schema:numberOfItems
    description: Number of claims extracted
    range: integer
  validation_status:
    slot_uri: schema:status
    description: Validation status
    range: string