# glam/schemas/20251121/linkml/modules/classes/ProvenanceSources.yaml
# 2026-01-19 00:09:28 +01:00
#
# 179 lines
# 6.2 KiB
# YAML

# ProvenanceSources - Sources organized by type
# Extracted from custodian_source.yaml per Rule 38 (modular schema files)
# Extraction date: 2026-01-08
# Schema identity: `id` is the canonical URI of this module; `name` and
# `title` are its machine-readable and human-readable labels.
id: https://nde.nl/ontology/hc/classes/ProvenanceSources
name: ProvenanceSources
title: ProvenanceSources

# CURIE prefixes available to class_uri, slot_uri and mapping entries.
prefixes:
  linkml: https://w3id.org/linkml/
  hc: https://nde.nl/ontology/hc/
  schema: http://schema.org/
  prov: http://www.w3.org/ns/prov#
  xsd: http://www.w3.org/2001/XMLSchema#

# linkml:types brings in the built-in scalar types. The two relative imports
# presumably define the SourceRecord and YoutubeSourceRecord classes that the
# attributes in this module use as ranges.
imports:
  - linkml:types
  - ./SourceRecord
  - ./YoutubeSourceRecord

# Slots that do not declare a range fall back to string.
default_range: string
classes:
  # Container class that groups provenance source records by the data
  # provider they came from: one multivalued attribute per provider, plus
  # four string lists that classify sources by data tier.
  ProvenanceSources:
    # Literal block scalar (|-) so the rationale bullets keep their line
    # breaks; a folded scalar (>-) would run them together into one paragraph.
    description: |-
      Sources organized by type, aggregating multiple source records from different
      data providers (Google Maps, Wikidata, web archives, etc.) with data tier
      classification (TIER_1 through TIER_4).

      Ontology mapping rationale:
      - class_uri is prov:Collection because this aggregates multiple provenance
        sources into a typed collection structure
      - close_mappings includes prov:Bundle as it groups related provenance records
      - related_mappings includes schema:ItemList for list-based organization
    class_uri: prov:Collection
    close_mappings:
      - prov:Bundle
    related_mappings:
      - schema:ItemList

    # Attribute conventions used below:
    #   - `description` is always the first key of an attribute.
    #   - Class-valued attributes are multivalued and inlined as a list, so
    #     instance data nests the records directly under the attribute name.
    attributes:
      original_entry:
        description: Source records from the original data entry or CSV import
        range: SourceRecord
        multivalued: true
        inlined_as_list: true
      google_maps:
        description: Source records from Google Maps Places API enrichment
        range: SourceRecord
        multivalued: true
        inlined_as_list: true
      genealogiewerkbalk:
        description: Source records from Genealogiewerkbalk heritage platform
        range: SourceRecord
        multivalued: true
        inlined_as_list: true
      wikidata:
        description: Source records from Wikidata SPARQL queries
        range: SourceRecord
        multivalued: true
        inlined_as_list: true
      web_archive:
        description: Source records from Internet Archive or other web archives
        range: SourceRecord
        multivalued: true
        inlined_as_list: true
      exa:
        description: Exa AI search source records
        range: SourceRecord
        multivalued: true
        inlined_as_list: true
      website_scrape:
        description: Website scrape source records
        range: SourceRecord
        multivalued: true
        inlined_as_list: true
      # The only provider attribute whose range is YoutubeSourceRecord rather
      # than the generic SourceRecord.
      youtube:
        description: YouTube Data API source records
        range: YoutubeSourceRecord
        multivalued: true
        inlined_as_list: true
      kien:
        description: KIEN intangible heritage registry source records
        range: SourceRecord
        multivalued: true
        inlined_as_list: true
      nan_isil_registry:
        description: Nationaal Archief ISIL registry source records
        range: SourceRecord
        multivalued: true
        inlined_as_list: true
      whois_research:
        description: WHOIS domain research source records
        range: SourceRecord
        multivalued: true
        inlined_as_list: true
      manual_research:
        description: Manual research source records
        range: SourceRecord
        multivalued: true
        inlined_as_list: true
      # RENAMED 2026-01-16: website → website_source to resolve OWL ambiguous type warning
      # (website is used elsewhere with range: uri, here it's range: SourceRecord)
      website_source:
        description: Website source records (institution website data)
        slot_uri: hc:hasWebsiteSource
        range: SourceRecord
        multivalued: true
        inlined_as_list: true
        close_mappings:
          - prov:hadPrimarySource
      web_scrape:
        description: Web scrape source records (scraped website data)
        range: SourceRecord
        multivalued: true
        inlined_as_list: true

      # Data-tier lists. These hold plain strings, so `inlined_as_list` is
      # omitted: inlining only applies to attributes whose range is a class.
      TIER_1_AUTHORITATIVE:
        description: List of TIER_1 authoritative sources
        range: string
        multivalued: true
      TIER_2_VERIFIED:
        description: List of TIER_2 verified sources
        range: string
        multivalued: true
      TIER_3_CROWD_SOURCED:
        description: List of TIER_3 crowd-sourced sources
        range: string
        multivalued: true
      TIER_4_INFERRED:
        description: List of TIER_4 inferred sources
        range: string
        multivalued: true

      museum_register:
        description: Museum register source records
        range: SourceRecord
        multivalued: true
        inlined_as_list: true
      # Single-valued and untyped, unlike the other provider attributes.
      # NOTE(review): `Any` is not declared in this file; presumably a class
      # with `class_uri: linkml:Any` is supplied by one of the imports.
      # Confirm, otherwise the range will not resolve.
      linkup_timespan:
        description: Linkup timespan source records (can be string or structured object)
        range: Any
      linkedin:
        description: LinkedIn source records for institution data
        range: SourceRecord
        multivalued: true
        inlined_as_list: true
      firecrawl:
        description: Firecrawl API source records for web scraping
        range: SourceRecord
        multivalued: true
        inlined_as_list: true
      web_search:
        description: Web search source records (Exa, Google, etc.)
        range: SourceRecord
        multivalued: true
        inlined_as_list: true
      web_research:
        description: Web research source records (travel directories, MapQuest, TripHobo, etc.)
        range: SourceRecord
        multivalued: true
        inlined_as_list: true
      linkup_financial:
        description: Linkup financial research source records
        range: SourceRecord
        multivalued: true
        inlined_as_list: true
      linkup_publications:
        description: Linkup publications research source records
        range: SourceRecord
        multivalued: true
        inlined_as_list: true
      linkup_youtube:
        description: Linkup YouTube research source records
        range: SourceRecord
        multivalued: true
        inlined_as_list: true