Class: Dataset
A single component of related observations and/or information that can be read, manipulated, transformed, and otherwise interpreted.
URI: dcat:Distribution
classDiagram
%% Class diagram for Dataset.
%% `<|--` marks inheritance (parent on the left): Information is the parent of Dataset, Dataset is the parent of DataSubset.
%% `-->` marks a plain association from Dataset to the range of the labelled slot; it does not imply inheritance.
class Dataset
Information <|-- Dataset
Dataset <|-- DataSubset
Dataset : acquisition_methods
Dataset --> InstanceAcquisition : acquisition_methods
Dataset : addressing_gaps
Dataset --> AddressingGap : addressing_gaps
Dataset : anomalies
Dataset --> DataAnomaly : anomalies
Dataset : bytes
Dataset : cleaning_strategies
Dataset --> CleaningStrategy : cleaning_strategies
Dataset : collection_mechanisms
Dataset --> CollectionMechanism : collection_mechanisms
Dataset : collection_timeframes
Dataset --> CollectionTimeframe : collection_timeframes
Dataset : compression
Dataset --> CompressionEnum : compression
Dataset : confidential_elements
Dataset --> Confidentiality : confidential_elements
Dataset : conforms_to
Dataset : conforms_to_class
Dataset : conforms_to_schema
Dataset : content_warnings
Dataset --> ContentWarning : content_warnings
Dataset : created_by
Dataset --> CreatorOrMaintainerEnum : created_by
Dataset : created_on
Dataset : creators
Dataset --> Creator : creators
Dataset : data_collectors
Dataset --> DataCollector : data_collectors
Dataset : data_protection_impacts
Dataset --> DataProtectionImpact : data_protection_impacts
Dataset : description
Dataset : dialect
Dataset : discouraged_uses
Dataset --> DiscouragedUse : discouraged_uses
Dataset : distribution_dates
Dataset --> DistributionDate : distribution_dates
Dataset : distribution_formats
Dataset --> DistributionFormat : distribution_formats
Dataset : doi
Dataset : download_url
Dataset : encoding
Dataset --> EncodingEnum : encoding
Dataset : errata
Dataset --> Erratum : errata
Dataset : ethical_reviews
Dataset --> EthicalReview : ethical_reviews
Dataset : existing_uses
Dataset --> ExistingUse : existing_uses
Dataset : extension_mechanism
Dataset --> ExtensionMechanism : extension_mechanism
Dataset : external_resources
Dataset --> ExternalResource : external_resources
Dataset : format
Dataset --> FormatEnum : format
Dataset : funders
Dataset --> FundingMechanism : funders
Dataset : future_use_impacts
Dataset --> FutureUseImpact : future_use_impacts
Dataset : hash
Dataset : id
Dataset : instances
Dataset --> Instance : instances
Dataset : ip_restrictions
Dataset --> IPRestrictions : ip_restrictions
Dataset : is_deidentified
Dataset --> Deidentification : is_deidentified
Dataset : is_tabular
Dataset : issued
Dataset : keywords
Dataset : labeling_strategies
Dataset --> LabelingStrategy : labeling_strategies
Dataset : language
Dataset : last_updated_on
Dataset : license
Dataset : license_and_use_terms
Dataset --> LicenseAndUseTerms : license_and_use_terms
Dataset : maintainers
Dataset --> Maintainer : maintainers
Dataset : md5
Dataset : media_type
Dataset : modified_by
Dataset --> CreatorOrMaintainerEnum : modified_by
Dataset : other_tasks
Dataset --> OtherTask : other_tasks
Dataset : page
Dataset : path
Dataset : preprocessing_strategies
Dataset --> PreprocessingStrategy : preprocessing_strategies
Dataset : publisher
Dataset : purposes
Dataset --> Purpose : purposes
Dataset : raw_sources
Dataset --> RawData : raw_sources
Dataset : regulatory_restrictions
Dataset --> ExportControlRegulatoryRestrictions : regulatory_restrictions
Dataset : retention_limit
Dataset --> RetentionLimits : retention_limit
Dataset : sampling_strategies
Dataset --> SamplingStrategy : sampling_strategies
Dataset : sensitive_elements
Dataset --> SensitiveElement : sensitive_elements
Dataset : sha256
Dataset : status
Dataset : subpopulations
Dataset --> Subpopulation : subpopulations
Dataset : subsets
Dataset --> DataSubset : subsets
Dataset : tasks
Dataset --> Task : tasks
Dataset : title
Dataset : updates
Dataset --> UpdatePlan : updates
Dataset : use_repository
Dataset --> UseRepository : use_repository
Dataset : version
Dataset : version_access
Dataset --> VersionAccess : version_access
Dataset : was_derived_from
Inheritance
- Information
- Dataset
Slots
Usages
used by | used in | type | used |
---|---|---|---|
DatasetCollection | resources | range | Dataset |
Aliases
- data resource
- data file
- data package
See Also
- https://specs.frictionlessdata.io/data-resource
Identifier and Mapping Information
Schema Source
- from schema: https://w3id.org/bridge2ai/data-sheets-schema
Mappings
Mapping Type | Mapped Value |
---|---|
self | dcat:Distribution |
native | data_sheets_schema:Dataset |
exact | schema:DataDownload |
LinkML Source
Direct
name: Dataset
description: A single component of related observations and/or information that can
be read, manipulated, transformed, and otherwise interpreted.
from_schema: https://w3id.org/bridge2ai/data-sheets-schema
see_also:
- https://specs.frictionlessdata.io/data-resource
aliases:
- data resource
- data file
- data package
exact_mappings:
- schema:DataDownload
is_a: Information
slots:
- bytes
- dialect
- encoding
- format
- hash
- md5
- media_type
- path
- sha256
attributes:
purposes:
name: purposes
from_schema: https://w3id.org/bridge2ai/data-sheets-schema
rank: 1000
multivalued: true
range: Purpose
tasks:
name: tasks
from_schema: https://w3id.org/bridge2ai/data-sheets-schema
rank: 1000
multivalued: true
range: Task
addressing_gaps:
name: addressing_gaps
from_schema: https://w3id.org/bridge2ai/data-sheets-schema
rank: 1000
multivalued: true
range: AddressingGap
creators:
name: creators
from_schema: https://w3id.org/bridge2ai/data-sheets-schema
rank: 1000
multivalued: true
range: Creator
funders:
name: funders
from_schema: https://w3id.org/bridge2ai/data-sheets-schema
rank: 1000
multivalued: true
range: FundingMechanism
subsets:
name: subsets
from_schema: https://w3id.org/bridge2ai/data-sheets-schema
exact_mappings:
- schema:distribution
rank: 1000
slot_uri: dcat:distribution
multivalued: true
range: DataSubset
instances:
name: instances
from_schema: https://w3id.org/bridge2ai/data-sheets-schema
rank: 1000
multivalued: true
range: Instance
anomalies:
name: anomalies
from_schema: https://w3id.org/bridge2ai/data-sheets-schema
rank: 1000
multivalued: true
range: DataAnomaly
external_resources:
name: external_resources
from_schema: https://w3id.org/bridge2ai/data-sheets-schema
rank: 1000
multivalued: true
range: ExternalResource
confidential_elements:
name: confidential_elements
from_schema: https://w3id.org/bridge2ai/data-sheets-schema
rank: 1000
multivalued: true
range: Confidentiality
content_warnings:
name: content_warnings
from_schema: https://w3id.org/bridge2ai/data-sheets-schema
rank: 1000
multivalued: true
range: ContentWarning
subpopulations:
name: subpopulations
from_schema: https://w3id.org/bridge2ai/data-sheets-schema
rank: 1000
multivalued: true
range: Subpopulation
sensitive_elements:
name: sensitive_elements
from_schema: https://w3id.org/bridge2ai/data-sheets-schema
rank: 1000
multivalued: true
range: SensitiveElement
acquisition_methods:
name: acquisition_methods
from_schema: https://w3id.org/bridge2ai/data-sheets-schema
rank: 1000
multivalued: true
range: InstanceAcquisition
collection_mechanisms:
name: collection_mechanisms
from_schema: https://w3id.org/bridge2ai/data-sheets-schema
rank: 1000
multivalued: true
range: CollectionMechanism
sampling_strategies:
name: sampling_strategies
from_schema: https://w3id.org/bridge2ai/data-sheets-schema
rank: 1000
multivalued: true
range: SamplingStrategy
data_collectors:
name: data_collectors
from_schema: https://w3id.org/bridge2ai/data-sheets-schema
rank: 1000
multivalued: true
range: DataCollector
collection_timeframes:
name: collection_timeframes
from_schema: https://w3id.org/bridge2ai/data-sheets-schema
rank: 1000
multivalued: true
range: CollectionTimeframe
ethical_reviews:
name: ethical_reviews
from_schema: https://w3id.org/bridge2ai/data-sheets-schema
rank: 1000
multivalued: true
range: EthicalReview
data_protection_impacts:
name: data_protection_impacts
from_schema: https://w3id.org/bridge2ai/data-sheets-schema
rank: 1000
multivalued: true
range: DataProtectionImpact
preprocessing_strategies:
name: preprocessing_strategies
from_schema: https://w3id.org/bridge2ai/data-sheets-schema
rank: 1000
multivalued: true
range: PreprocessingStrategy
cleaning_strategies:
name: cleaning_strategies
from_schema: https://w3id.org/bridge2ai/data-sheets-schema
rank: 1000
multivalued: true
range: CleaningStrategy
labeling_strategies:
name: labeling_strategies
from_schema: https://w3id.org/bridge2ai/data-sheets-schema
rank: 1000
multivalued: true
range: LabelingStrategy
raw_sources:
name: raw_sources
from_schema: https://w3id.org/bridge2ai/data-sheets-schema
rank: 1000
multivalued: true
range: RawData
existing_uses:
name: existing_uses
from_schema: https://w3id.org/bridge2ai/data-sheets-schema
rank: 1000
multivalued: true
range: ExistingUse
use_repository:
name: use_repository
from_schema: https://w3id.org/bridge2ai/data-sheets-schema
rank: 1000
multivalued: true
range: UseRepository
other_tasks:
name: other_tasks
from_schema: https://w3id.org/bridge2ai/data-sheets-schema
rank: 1000
multivalued: true
range: OtherTask
future_use_impacts:
name: future_use_impacts
from_schema: https://w3id.org/bridge2ai/data-sheets-schema
rank: 1000
multivalued: true
range: FutureUseImpact
discouraged_uses:
name: discouraged_uses
from_schema: https://w3id.org/bridge2ai/data-sheets-schema
rank: 1000
multivalued: true
range: DiscouragedUse
distribution_formats:
name: distribution_formats
from_schema: https://w3id.org/bridge2ai/data-sheets-schema
rank: 1000
multivalued: true
range: DistributionFormat
distribution_dates:
name: distribution_dates
from_schema: https://w3id.org/bridge2ai/data-sheets-schema
rank: 1000
multivalued: true
range: DistributionDate
license_and_use_terms:
name: license_and_use_terms
from_schema: https://w3id.org/bridge2ai/data-sheets-schema
rank: 1000
range: LicenseAndUseTerms
ip_restrictions:
name: ip_restrictions
from_schema: https://w3id.org/bridge2ai/data-sheets-schema
rank: 1000
range: IPRestrictions
regulatory_restrictions:
name: regulatory_restrictions
from_schema: https://w3id.org/bridge2ai/data-sheets-schema
rank: 1000
range: ExportControlRegulatoryRestrictions
maintainers:
name: maintainers
from_schema: https://w3id.org/bridge2ai/data-sheets-schema
rank: 1000
multivalued: true
range: Maintainer
errata:
name: errata
from_schema: https://w3id.org/bridge2ai/data-sheets-schema
rank: 1000
multivalued: true
range: Erratum
updates:
name: updates
from_schema: https://w3id.org/bridge2ai/data-sheets-schema
rank: 1000
range: UpdatePlan
retention_limit:
name: retention_limit
from_schema: https://w3id.org/bridge2ai/data-sheets-schema
rank: 1000
range: RetentionLimits
version_access:
name: version_access
from_schema: https://w3id.org/bridge2ai/data-sheets-schema
rank: 1000
range: VersionAccess
extension_mechanism:
name: extension_mechanism
from_schema: https://w3id.org/bridge2ai/data-sheets-schema
rank: 1000
range: ExtensionMechanism
is_deidentified:
name: is_deidentified
from_schema: https://w3id.org/bridge2ai/data-sheets-schema
rank: 1000
range: Deidentification
is_tabular:
name: is_tabular
from_schema: https://w3id.org/bridge2ai/data-sheets-schema
rank: 1000
range: boolean
class_uri: dcat:Distribution
Induced
name: Dataset
description: A single component of related observations and/or information that can
be read, manipulated, transformed, and otherwise interpreted.
from_schema: https://w3id.org/bridge2ai/data-sheets-schema
see_also:
- https://specs.frictionlessdata.io/data-resource
aliases:
- data resource
- data file
- data package
exact_mappings:
- schema:DataDownload
is_a: Information
attributes:
purposes:
name: purposes
from_schema: https://w3id.org/bridge2ai/data-sheets-schema
rank: 1000
multivalued: true
alias: purposes
owner: Dataset
domain_of:
- Dataset
range: Purpose
tasks:
name: tasks
from_schema: https://w3id.org/bridge2ai/data-sheets-schema
rank: 1000
multivalued: true
alias: tasks
owner: Dataset
domain_of:
- Dataset
range: Task
addressing_gaps:
name: addressing_gaps
from_schema: https://w3id.org/bridge2ai/data-sheets-schema
rank: 1000
multivalued: true
alias: addressing_gaps
owner: Dataset
domain_of:
- Dataset
range: AddressingGap
creators:
name: creators
from_schema: https://w3id.org/bridge2ai/data-sheets-schema
rank: 1000
multivalued: true
alias: creators
owner: Dataset
domain_of:
- Dataset
range: Creator
funders:
name: funders
from_schema: https://w3id.org/bridge2ai/data-sheets-schema
rank: 1000
multivalued: true
alias: funders
owner: Dataset
domain_of:
- Dataset
range: FundingMechanism
subsets:
name: subsets
from_schema: https://w3id.org/bridge2ai/data-sheets-schema
exact_mappings:
- schema:distribution
rank: 1000
slot_uri: dcat:distribution
multivalued: true
alias: subsets
owner: Dataset
domain_of:
- Dataset
range: DataSubset
instances:
name: instances
from_schema: https://w3id.org/bridge2ai/data-sheets-schema
rank: 1000
multivalued: true
alias: instances
owner: Dataset
domain_of:
- Dataset
range: Instance
anomalies:
name: anomalies
from_schema: https://w3id.org/bridge2ai/data-sheets-schema
rank: 1000
multivalued: true
alias: anomalies
owner: Dataset
domain_of:
- Dataset
range: DataAnomaly
external_resources:
name: external_resources
from_schema: https://w3id.org/bridge2ai/data-sheets-schema
rank: 1000
multivalued: true
alias: external_resources
owner: Dataset
domain_of:
- Dataset
- ExternalResource
range: ExternalResource
confidential_elements:
name: confidential_elements
from_schema: https://w3id.org/bridge2ai/data-sheets-schema
rank: 1000
multivalued: true
alias: confidential_elements
owner: Dataset
domain_of:
- Dataset
range: Confidentiality
content_warnings:
name: content_warnings
from_schema: https://w3id.org/bridge2ai/data-sheets-schema
rank: 1000
multivalued: true
alias: content_warnings
owner: Dataset
domain_of:
- Dataset
range: ContentWarning
subpopulations:
name: subpopulations
from_schema: https://w3id.org/bridge2ai/data-sheets-schema
rank: 1000
multivalued: true
alias: subpopulations
owner: Dataset
domain_of:
- Dataset
range: Subpopulation
sensitive_elements:
name: sensitive_elements
from_schema: https://w3id.org/bridge2ai/data-sheets-schema
rank: 1000
multivalued: true
alias: sensitive_elements
owner: Dataset
domain_of:
- Dataset
range: SensitiveElement
acquisition_methods:
name: acquisition_methods
from_schema: https://w3id.org/bridge2ai/data-sheets-schema
rank: 1000
multivalued: true
alias: acquisition_methods
owner: Dataset
domain_of:
- Dataset
range: InstanceAcquisition
collection_mechanisms:
name: collection_mechanisms
from_schema: https://w3id.org/bridge2ai/data-sheets-schema
rank: 1000
multivalued: true
alias: collection_mechanisms
owner: Dataset
domain_of:
- Dataset
range: CollectionMechanism
sampling_strategies:
name: sampling_strategies
from_schema: https://w3id.org/bridge2ai/data-sheets-schema
rank: 1000
multivalued: true
alias: sampling_strategies
owner: Dataset
domain_of:
- Dataset
- Instance
range: SamplingStrategy
data_collectors:
name: data_collectors
from_schema: https://w3id.org/bridge2ai/data-sheets-schema
rank: 1000
multivalued: true
alias: data_collectors
owner: Dataset
domain_of:
- Dataset
range: DataCollector
collection_timeframes:
name: collection_timeframes
from_schema: https://w3id.org/bridge2ai/data-sheets-schema
rank: 1000
multivalued: true
alias: collection_timeframes
owner: Dataset
domain_of:
- Dataset
range: CollectionTimeframe
ethical_reviews:
name: ethical_reviews
from_schema: https://w3id.org/bridge2ai/data-sheets-schema
rank: 1000
multivalued: true
alias: ethical_reviews
owner: Dataset
domain_of:
- Dataset
range: EthicalReview
data_protection_impacts:
name: data_protection_impacts
from_schema: https://w3id.org/bridge2ai/data-sheets-schema
rank: 1000
multivalued: true
alias: data_protection_impacts
owner: Dataset
domain_of:
- Dataset
range: DataProtectionImpact
preprocessing_strategies:
name: preprocessing_strategies
from_schema: https://w3id.org/bridge2ai/data-sheets-schema
rank: 1000
multivalued: true
alias: preprocessing_strategies
owner: Dataset
domain_of:
- Dataset
range: PreprocessingStrategy
cleaning_strategies:
name: cleaning_strategies
from_schema: https://w3id.org/bridge2ai/data-sheets-schema
rank: 1000
multivalued: true
alias: cleaning_strategies
owner: Dataset
domain_of:
- Dataset
range: CleaningStrategy
labeling_strategies:
name: labeling_strategies
from_schema: https://w3id.org/bridge2ai/data-sheets-schema
rank: 1000
multivalued: true
alias: labeling_strategies
owner: Dataset
domain_of:
- Dataset
range: LabelingStrategy
raw_sources:
name: raw_sources
from_schema: https://w3id.org/bridge2ai/data-sheets-schema
rank: 1000
multivalued: true
alias: raw_sources
owner: Dataset
domain_of:
- Dataset
range: RawData
existing_uses:
name: existing_uses
from_schema: https://w3id.org/bridge2ai/data-sheets-schema
rank: 1000
multivalued: true
alias: existing_uses
owner: Dataset
domain_of:
- Dataset
range: ExistingUse
use_repository:
name: use_repository
from_schema: https://w3id.org/bridge2ai/data-sheets-schema
rank: 1000
multivalued: true
alias: use_repository
owner: Dataset
domain_of:
- Dataset
range: UseRepository
other_tasks:
name: other_tasks
from_schema: https://w3id.org/bridge2ai/data-sheets-schema
rank: 1000
multivalued: true
alias: other_tasks
owner: Dataset
domain_of:
- Dataset
range: OtherTask
future_use_impacts:
name: future_use_impacts
from_schema: https://w3id.org/bridge2ai/data-sheets-schema
rank: 1000
multivalued: true
alias: future_use_impacts
owner: Dataset
domain_of:
- Dataset
range: FutureUseImpact
discouraged_uses:
name: discouraged_uses
from_schema: https://w3id.org/bridge2ai/data-sheets-schema
rank: 1000
multivalued: true
alias: discouraged_uses
owner: Dataset
domain_of:
- Dataset
range: DiscouragedUse
distribution_formats:
name: distribution_formats
from_schema: https://w3id.org/bridge2ai/data-sheets-schema
rank: 1000
multivalued: true
alias: distribution_formats
owner: Dataset
domain_of:
- Dataset
range: DistributionFormat
distribution_dates:
name: distribution_dates
from_schema: https://w3id.org/bridge2ai/data-sheets-schema
rank: 1000
multivalued: true
alias: distribution_dates
owner: Dataset
domain_of:
- Dataset
range: DistributionDate
license_and_use_terms:
name: license_and_use_terms
from_schema: https://w3id.org/bridge2ai/data-sheets-schema
rank: 1000
alias: license_and_use_terms
owner: Dataset
domain_of:
- Dataset
range: LicenseAndUseTerms
ip_restrictions:
name: ip_restrictions
from_schema: https://w3id.org/bridge2ai/data-sheets-schema
rank: 1000
alias: ip_restrictions
owner: Dataset
domain_of:
- Dataset
range: IPRestrictions
regulatory_restrictions:
name: regulatory_restrictions
from_schema: https://w3id.org/bridge2ai/data-sheets-schema
rank: 1000
alias: regulatory_restrictions
owner: Dataset
domain_of:
- Dataset
range: ExportControlRegulatoryRestrictions
maintainers:
name: maintainers
from_schema: https://w3id.org/bridge2ai/data-sheets-schema
rank: 1000
multivalued: true
alias: maintainers
owner: Dataset
domain_of:
- Dataset
range: Maintainer
errata:
name: errata
from_schema: https://w3id.org/bridge2ai/data-sheets-schema
rank: 1000
multivalued: true
alias: errata
owner: Dataset
domain_of:
- Dataset
range: Erratum
updates:
name: updates
from_schema: https://w3id.org/bridge2ai/data-sheets-schema
rank: 1000
alias: updates
owner: Dataset
domain_of:
- Dataset
range: UpdatePlan
retention_limit:
name: retention_limit
from_schema: https://w3id.org/bridge2ai/data-sheets-schema
rank: 1000
alias: retention_limit
owner: Dataset
domain_of:
- Dataset
range: RetentionLimits
version_access:
name: version_access
from_schema: https://w3id.org/bridge2ai/data-sheets-schema
rank: 1000
alias: version_access
owner: Dataset
domain_of:
- Dataset
range: VersionAccess
extension_mechanism:
name: extension_mechanism
from_schema: https://w3id.org/bridge2ai/data-sheets-schema
rank: 1000
alias: extension_mechanism
owner: Dataset
domain_of:
- Dataset
range: ExtensionMechanism
is_deidentified:
name: is_deidentified
from_schema: https://w3id.org/bridge2ai/data-sheets-schema
rank: 1000
alias: is_deidentified
owner: Dataset
domain_of:
- Dataset
range: Deidentification
is_tabular:
name: is_tabular
from_schema: https://w3id.org/bridge2ai/data-sheets-schema
rank: 1000
alias: is_tabular
owner: Dataset
domain_of:
- Dataset
range: boolean
bytes:
name: bytes
description: Size of the data in bytes.
from_schema: https://w3id.org/bridge2ai/data-sheets-schema
rank: 1000
slot_uri: dcat:byteSize
alias: bytes
owner: Dataset
domain_of:
- Dataset
range: integer
dialect:
name: dialect
from_schema: https://w3id.org/bridge2ai/data-sheets-schema
rank: 1000
slot_uri: csvw:dialect
alias: dialect
owner: Dataset
domain_of:
- Dataset
range: string
encoding:
name: encoding
description: The encoding of the data. This is not the same as the media type.
Rather, this is the encoding of the data in a more specific sense, e.g., UTF-8,
ASCII, etc.
from_schema: https://w3id.org/bridge2ai/data-sheets-schema
rank: 1000
alias: encoding
owner: Dataset
domain_of:
- Dataset
range: EncodingEnum
format:
name: format
description: The format of the data. This is not the same as the media type. Rather,
this is the format of the data in a more specific sense, e.g., CSV, JSON, etc.
from_schema: https://w3id.org/bridge2ai/data-sheets-schema
rank: 1000
slot_uri: dcterms:format
alias: format
owner: Dataset
domain_of:
- Dataset
range: FormatEnum
hash:
name: hash
description: The hash representation of the data, e.g., sha256, md5, etc. Subtypes
have their own slots.
from_schema: https://w3id.org/bridge2ai/data-sheets-schema
rank: 1000
alias: hash
owner: Dataset
domain_of:
- Dataset
range: string
md5:
name: md5
description: The md5 hash representation of the data.
from_schema: https://w3id.org/bridge2ai/data-sheets-schema
rank: 1000
is_a: hash
alias: md5
owner: Dataset
domain_of:
- Dataset
range: string
media_type:
name: media_type
description: The media type of the data. This is not the same as the format. Rather,
this is the media type of the data in a more general sense, e.g., text/csv,
application/json, etc., though as it is defined here the media type can be any
string.
examples:
- value: text/csv
- value: application/json
from_schema: https://w3id.org/bridge2ai/data-sheets-schema
exact_mappings:
- frictionless:mediatype
- schema:encodingFormat
rank: 1000
slot_uri: dcat:mediaType
alias: media_type
owner: Dataset
domain_of:
- Dataset
range: string
path:
name: path
from_schema: https://w3id.org/bridge2ai/data-sheets-schema
close_mappings:
- frictionless:path
rank: 1000
alias: path
owner: Dataset
domain_of:
- Dataset
range: string
sha256:
name: sha256
description: The sha256 hash representation of the data.
from_schema: https://w3id.org/bridge2ai/data-sheets-schema
rank: 1000
is_a: hash
alias: sha256
owner: Dataset
domain_of:
- Dataset
range: string
compression:
name: compression
description: The compression format of the data. This is not the same as the media
type. Rather, this is the compression format of the data in a more specific
sense, e.g., zip, gzip, etc.
from_schema: https://w3id.org/bridge2ai/data-sheets-schema
rank: 1000
alias: compression
owner: Dataset
domain_of:
- Information
range: CompressionEnum
conforms_to:
name: conforms_to
description: The standard to which the data conforms. This is not the same as
the media type. Rather, this is the standard to which the data conforms in a
more specific sense, e.g., frictionless, schema.org, etc. This should be a standard
from the Bridge2AI standards registry.
from_schema: https://w3id.org/bridge2ai/data-sheets-schema
rank: 1000
values_from:
- B2AI_STANDARD
slot_uri: dcterms:conformsTo
alias: conforms_to
owner: Dataset
domain_of:
- Information
range: uriorcurie
conforms_to_class:
name: conforms_to_class
description: The class in the schema that the data object instantiates.
from_schema: https://w3id.org/bridge2ai/data-sheets-schema
rank: 1000
is_a: conforms_to
alias: conforms_to_class
owner: Dataset
domain_of:
- Information
range: uriorcurie
conforms_to_schema:
name: conforms_to_schema
description: The schema to which the data conforms. This is not the same as the
media type. Rather, this is the schema to which the data conforms in a more
specific sense, and even more specific than the general set of standards it
conforms to.
from_schema: https://w3id.org/bridge2ai/data-sheets-schema
exact_mappings:
- frictionless:schema
rank: 1000
is_a: conforms_to
alias: conforms_to_schema
owner: Dataset
domain_of:
- Information
range: uriorcurie
created_by:
name: created_by
description: Agent that created the element
from_schema: https://w3id.org/bridge2ai/data-sheets-schema
rank: 1000
slot_uri: pav:createdBy
multivalued: true
alias: created_by
owner: Dataset
domain_of:
- Information
range: CreatorOrMaintainerEnum
created_on:
name: created_on
description: Date and Time at which the element was created
from_schema: https://w3id.org/bridge2ai/data-sheets-schema
rank: 1000
slot_uri: pav:createdOn
alias: created_on
owner: Dataset
domain_of:
- Information
range: datetime
description:
name: description
description: A human-readable description for a thing.
from_schema: https://w3id.org/bridge2ai/data-sheets-schema
rank: 1000
slot_uri: schema:description
alias: description
owner: Dataset
domain_of:
- Information
- Relationships
- Splits
- DataAnomaly
- Confidentiality
- Deidentification
- SensitiveElement
- InstanceAcquisition
- CollectionMechanism
- DataCollector
- CollectionTimeframe
- EthicalReview
- DirectCollection
- CollectionNotification
- CollectionConsent
- ConsentRevocation
- DataProtectionImpact
- PreprocessingStrategy
- CleaningStrategy
- LabelingStrategy
- RawData
- ExistingUse
- UseRepository
- OtherTask
- FutureUseImpact
- DiscouragedUse
- ThirdPartySharing
- DistributionFormat
- DistributionDate
- LicenseAndUseTerms
- IPRestrictions
- ExportControlRegulatoryRestrictions
- Maintainer
- Erratum
- UpdatePlan
- RetentionLimits
- VersionAccess
- ExtensionMechanism
- NamedThing
range: string
doi:
name: doi
description: The Digital Object Identifier of the data, with the doi prefix.
examples:
- value: doi:10.48550/arXiv.2310.03666
from_schema: https://w3id.org/bridge2ai/data-sheets-schema
rank: 1000
alias: doi
owner: Dataset
domain_of:
- Information
range: uriorcurie
download_url:
name: download_url
description: URL from which the data can be downloaded. This is not the same as
the landing page, which is a page that describes the dataset. Rather, this URL
points directly to the data itself.
from_schema: https://w3id.org/bridge2ai/data-sheets-schema
exact_mappings:
- schema:url
close_mappings:
- frictionless:path
rank: 1000
slot_uri: dcat:downloadURL
alias: download_url
owner: Dataset
domain_of:
- Information
range: uri
id:
name: id
description: A unique identifier for a thing.
from_schema: https://w3id.org/bridge2ai/data-sheets-schema
rank: 1000
slot_uri: schema:identifier
identifier: true
alias: id
owner: Dataset
domain_of:
- Information
- FormatDialect
- NamedThing
range: uriorcurie
required: true
issued:
name: issued
from_schema: https://w3id.org/bridge2ai/data-sheets-schema
rank: 1000
slot_uri: dcterms:issued
alias: issued
owner: Dataset
domain_of:
- Information
range: datetime
keywords:
name: keywords
description: Keywords associated with the data. These may be provided by the data
creator or assigned later in a manual or automated manner.
from_schema: https://w3id.org/bridge2ai/data-sheets-schema
exact_mappings:
- schema:keywords
rank: 1000
singular_name: keyword
slot_uri: dcat:keyword
multivalued: true
alias: keywords
owner: Dataset
domain_of:
- Information
range: string
language:
name: language
description: language in which the information is expressed
from_schema: https://w3id.org/bridge2ai/data-sheets-schema
rank: 1000
alias: language
owner: Dataset
domain_of:
- Information
range: string
last_updated_on:
name: last_updated_on
description: Date and Time at which the element was last updated
from_schema: https://w3id.org/bridge2ai/data-sheets-schema
rank: 1000
slot_uri: pav:lastUpdatedOn
alias: last_updated_on
owner: Dataset
domain_of:
- Information
range: datetime
license:
name: license
description: license for the data
from_schema: https://w3id.org/bridge2ai/data-sheets-schema
exact_mappings:
- frictionless:licenses
rank: 1000
slot_uri: dcterms:license
alias: license
owner: Dataset
domain_of:
- Information
- Software
range: string
modified_by:
name: modified_by
description: agent that modified the element
from_schema: https://w3id.org/bridge2ai/data-sheets-schema
rank: 1000
slot_uri: oslc:modifiedBy
alias: modified_by
owner: Dataset
domain_of:
- Information
range: CreatorOrMaintainerEnum
page:
name: page
from_schema: https://w3id.org/bridge2ai/data-sheets-schema
rank: 1000
slot_uri: dcat:landingPage
alias: page
owner: Dataset
domain_of:
- Information
range: string
publisher:
name: publisher
from_schema: https://w3id.org/bridge2ai/data-sheets-schema
rank: 1000
slot_uri: dcterms:publisher
alias: publisher
owner: Dataset
domain_of:
- Information
range: uriorcurie
status:
name: status
description: Status of the element in terms of its maturity or life cycle
examples:
- value: bibo:draft
from_schema: https://w3id.org/bridge2ai/data-sheets-schema
rank: 1000
slot_uri: bibo:status
alias: status
owner: Dataset
domain_of:
- Information
range: uriorcurie
title:
name: title
description: the official title of the element
from_schema: https://w3id.org/bridge2ai/data-sheets-schema
rank: 1000
slot_uri: dcterms:title
alias: title
owner: Dataset
domain_of:
- Information
range: string
version:
name: version
description: particular version of schema
from_schema: https://w3id.org/bridge2ai/data-sheets-schema
exact_mappings:
- schema:version
- dcterms:hasVersion
rank: 1000
slot_uri: pav:version
alias: version
owner: Dataset
domain_of:
- Information
- Software
range: string
was_derived_from:
name: was_derived_from
description: A derivation is a transformation of an entity into another, an update
of an entity resulting in a new one, or the construction of a new entity based
on a pre-existing entity.
from_schema: https://w3id.org/bridge2ai/data-sheets-schema
rank: 1000
slot_uri: prov:wasDerivedFrom
alias: was_derived_from
owner: Dataset
domain_of:
- Information
range: string
class_uri: dcat:Distribution