# glam/schemas/20251121/linkml/modules/classes/DataTierLevel.yaml

# Schema identity: `id` is the schema URI, `name` the machine-readable
# schema name, `title` the human-readable one.
id: 'https://nde.nl/ontology/hc/class/DataTierLevel'
name: data_tier_level_class
title: DataTierLevel Class
# Folded scalar: each paragraph becomes one line; the blank line between
# the paragraphs is kept as a single newline.
description: >-
  Data quality tier classification indicating the trustworthiness
  and verification status of heritage data.

  The tier system reflects the provenance and verification level
  of information, from authoritative official registries to
  algorithmically inferred data.

# Namespace prefixes used in this module: `linkml` by the imports, `hc` by
# the class URI, `prov` and `dqv` by the class mappings.
prefixes:
  linkml: 'https://w3id.org/linkml/'
  hc: 'https://nde.nl/ontology/hc/'
  prov: 'http://www.w3.org/ns/prov#'
  dqv: 'http://www.w3.org/ns/dqv#'

imports:
  - linkml:types
  - ../slots/has_or_had_label
  - ../slots/has_or_had_description
  - ../slots/has_or_had_code

# Prefix applied to schema elements that do not declare a prefix of their
# own (LinkML `default_prefix`); `hc` is bound in `prefixes` above.
default_prefix: hc

classes:
  # One DataTierLevel instance describes a single data quality tier:
  # a label, a short code, and an optional free-text description.
  DataTierLevel:
    class_uri: hc:DataTierLevel
    # Literal block scalar (`|-`) on purpose: the Markdown table and the
    # bullet list below need their line breaks. A folded scalar (`>-`)
    # would join the rows/bullets into a single line and break rendering.
    description: |-
      Data quality tier level classification.

      **Standard Tier Levels** (from most to least authoritative):

      | Tier | Short Code | Description | Examples |
      |------|------------|-------------|----------|
      | Tier 1 | TIER_1_AUTHORITATIVE | Official registry data | NDE CSV, ISIL registry, government databases |
      | Tier 2 | TIER_2_VERIFIED | Verified external sources | Wikidata (verified), Google Maps, official websites |
      | Tier 3 | TIER_3_CROWD_SOURCED | Community-contributed data | Reviews, user edits, Wikipedia |
      | Tier 4 | TIER_4_INFERRED | Algorithmically extracted | Website scrape, LLM extraction, API inference |

      **Usage Guidelines**:
      - Always prefer data from a more authoritative (lower-numbered) tier when available
      - TIER_4 data requires verification before promotion
      - Data can be promoted to a more authoritative (lower-numbered) tier after verification
      - Track tier changes in provenance history

      **PROV-O Alignment**: Maps to prov:qualifiedDerivation for data quality tracking.
    # NOTE(review): dqv:QualityMeasurement is declared as an *exact* match
    # and prov:qualifiedDerivation as a close match. Confirm both targets
    # are the intended strength and kind of mapping for a tier
    # classification class before relying on them downstream.
    exact_mappings:
      - dqv:QualityMeasurement
    close_mappings:
      - prov:qualifiedDerivation
    # Slots are defined in the imported ../slots/ modules; the class-specific
    # constraints are applied in `slot_usage` below.
    slots:
      - has_or_had_label
      - has_or_had_code
      - has_or_had_description
    slot_usage:
      has_or_had_label:
        description: Human-readable name for the data tier.
        range: string
        required: true
        examples:
          - value: "Authoritative"
            description: Tier 1 - official registry data
          - value: "Inferred"
            description: Tier 4 - algorithmically extracted
      has_or_had_code:
        description: >-
          Short code identifier for the data tier.
          Standard codes: TIER_1_AUTHORITATIVE, TIER_2_VERIFIED,
          TIER_3_CROWD_SOURCED, TIER_4_INFERRED.
        range: string
        required: true
        # Accepts TIER_<1-4>_<uppercase letters/underscores>. The pattern
        # does not check that the name suffix belongs to the tier number.
        pattern: "^TIER_[1-4]_[A-Z_]+$"
        examples:
          - value: "TIER_1_AUTHORITATIVE"
            description: Official registry data
          - value: "TIER_4_INFERRED"
            description: Algorithmically extracted data
      has_or_had_description:
        description: Detailed description of what this tier means and its data sources.
        range: string
        required: false
        examples:
          - value: "Extracted from NDE CSV registry - authoritative Dutch heritage data"
            description: Tier 1 example
          - value: "Extracted via LLM from website - requires verification"
            description: Tier 4 example
    annotations:
      specificity_score: 0.35
      specificity_rationale: >-
        Data tier levels are broadly useful across all data provenance contexts.
      # Stored as a quoted string that holds a JSON-style list, not as a
      # native YAML sequence.
      custodian_types: '["*"]'
      custodian_types_rationale: >-
        Data quality tiers apply universally to all custodian types.
    # Worked instances for tiers 1, 2 and 4.
    examples:
      - value:
          has_or_had_label: "Authoritative"
          has_or_had_code: "TIER_1_AUTHORITATIVE"
          has_or_had_description: "Official data from NDE registry CSV"
        description: Tier 1 authoritative data
      - value:
          has_or_had_label: "Verified"
          has_or_had_code: "TIER_2_VERIFIED"
          has_or_had_description: "Verified against institutional website"
        description: Tier 2 verified data
      - value:
          has_or_had_label: "Inferred"
          has_or_had_code: "TIER_4_INFERRED"
          has_or_had_description: "Extracted via Exa search - pending verification"
        description: Tier 4 inferred data