diff --git a/project/jsonld/data_sheets_schema.jsonld b/project/jsonld/data_sheets_schema.jsonld index 0c051caf..a449322d 100644 --- a/project/jsonld/data_sheets_schema.jsonld +++ b/project/jsonld/data_sheets_schema.jsonld @@ -2067,15 +2067,15 @@ }, { "name": "dataset__file_collections", - "description": "Collections of files within this dataset. Each collection represents a logical grouping of files with shared characteristics (e.g., all training data, all image files, all raw data files). Maps to nested RO-Crate Dataset entities via schema:hasPart.", + "description": "Collections of files within this dataset. Each collection represents a logical grouping of files with shared characteristics (e.g., all training data, all image files, all raw data files). Maps to nested RO-Crate Dataset entities via schema:hasPart in RO-Crate converters.", "from_schema": "https://w3id.org/bridge2ai/data-sheets-schema", "mappings": [ - "http://schema.org/hasPart" + "https://w3id.org/bridge2ai/data-sheets-schema/fileCollections" ], "exact_mappings": [ "http://www.w3.org/ns/dcat#distribution" ], - "slot_uri": "http://schema.org/hasPart", + "slot_uri": "https://w3id.org/bridge2ai/data-sheets-schema/fileCollections", "alias": "file_collections", "owner": "Dataset", "domain_of": [ @@ -6865,11 +6865,11 @@ "attributes": [ { "name": "file_collections", - "description": "Collections of files within this dataset. Each collection represents a logical grouping of files with shared characteristics (e.g., all training data, all image files, all raw data files). Maps to nested RO-Crate Dataset entities via schema:hasPart.", + "description": "Collections of files within this dataset. Each collection represents a logical grouping of files with shared characteristics (e.g., all training data, all image files, all raw data files). Maps to nested RO-Crate Dataset entities via schema:hasPart in RO-Crate converters.", "exact_mappings": [ "dcat:distribution" ], - "slot_uri": "schema:hasPart", + "slot_uri": "d4d:fileCollections", "range": "FileCollection", "multivalued": true, "inlined_as_list": true, @@ -10713,9 +10713,9 @@ ], "metamodel_version": "1.7.0", "source_file": "data_sheets_schema.yaml", - "source_file_date": "2026-03-26T22:44:02", - "source_file_size": 18530, - "generation_date": "2026-04-06T21:13:16", + "source_file_date": "2026-04-07T13:01:39", + "source_file_size": 18558, + "generation_date": "2026-04-07T13:03:27", "@type": "SchemaDefinition", "@context": [ "project/jsonld/data_sheets_schema.context.jsonld", diff --git a/project/jsonschema/data_sheets_schema.schema.json b/project/jsonschema/data_sheets_schema.schema.json index b348955a..c97dc721 100644 --- a/project/jsonschema/data_sheets_schema.schema.json +++ b/project/jsonschema/data_sheets_schema.schema.json @@ -1207,7 +1207,7 @@ ] }, "file_collections": { - "description": "Collections of files within this dataset. Each collection represents a logical grouping of files with shared characteristics (e.g., all training data, all image files, all raw data files). Maps to nested RO-Crate Dataset entities via schema:hasPart.", + "description": "Collections of files within this dataset. Each collection represents a logical grouping of files with shared characteristics (e.g., all training data, all image files, all raw data files). Maps to nested RO-Crate Dataset entities via schema:hasPart in RO-Crate converters.", "items": { "$ref": "#/$defs/FileCollection" }, @@ -2005,7 +2005,7 @@ ] }, "file_collections": { - "description": "Collections of files within this dataset. Each collection represents a logical grouping of files with shared characteristics (e.g., all training data, all image files, all raw data files). Maps to nested RO-Crate Dataset entities via schema:hasPart.", + "description": "Collections of files within this dataset. Each collection represents a logical grouping of files with shared characteristics (e.g., all training data, all image files, all raw data files). Maps to nested RO-Crate Dataset entities via schema:hasPart in RO-Crate converters.", "items": { "$ref": "#/$defs/FileCollection" }, diff --git a/project/owl/data_sheets_schema.owl.ttl b/project/owl/data_sheets_schema.owl.ttl index 29506e46..eee1fd30 100644 --- a/project/owl/data_sheets_schema.owl.ttl +++ b/project/owl/data_sheets_schema.owl.ttl @@ -15,10 +15,10 @@ data_sheets_schema:DatasetCollection a owl:Class, linkml:ClassDefinition ; rdfs:label "DatasetCollection" ; rdfs:subClassOf [ a owl:Restriction ; - owl:minCardinality 0 ; + owl:allValuesFrom data_sheets_schema:Dataset ; owl:onProperty data_sheets_schema:resources ], [ a owl:Restriction ; - owl:allValuesFrom data_sheets_schema:Dataset ; + owl:minCardinality 0 ; owl:onProperty data_sheets_schema:resources ], data_sheets_schema:Information ; skos:altLabel "data resource collection", @@ -34,49 +34,49 @@ data_sheets_schema:FormatDialect a owl:Class, rdfs:label "FormatDialect" ; rdfs:subClassOf [ a owl:Restriction ; owl:allValuesFrom linkml:String ; - owl:onProperty data_sheets_schema:delimiter ], + owl:onProperty data_sheets_schema:header ], [ a owl:Restriction ; owl:maxCardinality 1 ; + owl:onProperty data_sheets_schema:delimiter ], + [ a owl:Restriction ; + owl:minCardinality 0 ; owl:onProperty data_sheets_schema:quote_char ], [ a owl:Restriction ; owl:allValuesFrom linkml:String ; + owl:onProperty data_sheets_schema:delimiter ], + [ a owl:Restriction ; + owl:allValuesFrom linkml:String ; + owl:onProperty data_sheets_schema:comment_prefix ], + [ a owl:Restriction ; + owl:maxCardinality 1 ; + owl:onProperty data_sheets_schema:quote_char ], + [ a owl:Restriction ; + owl:maxCardinality 1 ; owl:onProperty data_sheets_schema:header ], [ a owl:Restriction ; - owl:minCardinality 0 ; + owl:allValuesFrom linkml:String ; owl:onProperty data_sheets_schema:double_quote ], [ a owl:Restriction ; owl:maxCardinality 1 ; - owl:onProperty data_sheets_schema:delimiter ], + owl:onProperty data_sheets_schema:double_quote ], [ a owl:Restriction ; owl:minCardinality 0 ; - owl:onProperty data_sheets_schema:delimiter ], - [ a owl:Restriction ; - owl:allValuesFrom linkml:String ; owl:onProperty data_sheets_schema:double_quote ], [ a owl:Restriction ; owl:minCardinality 0 ; - owl:onProperty data_sheets_schema:quote_char ], + owl:onProperty data_sheets_schema:delimiter ], [ a owl:Restriction ; - owl:allValuesFrom linkml:String ; + owl:minCardinality 0 ; owl:onProperty data_sheets_schema:comment_prefix ], - [ a owl:Restriction ; - owl:maxCardinality 1 ; - owl:onProperty data_sheets_schema:double_quote ], [ a owl:Restriction ; owl:allValuesFrom linkml:String ; owl:onProperty data_sheets_schema:quote_char ], - [ a owl:Restriction ; - owl:maxCardinality 1 ; - owl:onProperty data_sheets_schema:comment_prefix ], [ a owl:Restriction ; owl:minCardinality 0 ; owl:onProperty data_sheets_schema:header ], - [ a owl:Restriction ; - owl:minCardinality 0 ; - owl:onProperty data_sheets_schema:comment_prefix ], [ a owl:Restriction ; owl:maxCardinality 1 ; - owl:onProperty data_sheets_schema:header ] ; + owl:onProperty data_sheets_schema:comment_prefix ] ; skos:definition "Additional format information for a file" ; skos:inScheme data_sheets_schema:base . @@ -84,20 +84,20 @@ data_sheets_schema:FormatDialect a owl:Class, linkml:ClassDefinition ; rdfs:label "DirectCollection" ; rdfs:subClassOf [ a owl:Restriction ; - owl:minCardinality 0 ; + owl:maxCardinality 1 ; owl:onProperty ], - [ a owl:Restriction ; - owl:minCardinality 0 ; - owl:onProperty ], [ a owl:Restriction ; owl:allValuesFrom linkml:String ; owl:onProperty ], [ a owl:Restriction ; - owl:maxCardinality 1 ; + owl:allValuesFrom linkml:Boolean ; owl:onProperty ], [ a owl:Restriction ; - owl:allValuesFrom linkml:Boolean ; + owl:minCardinality 0 ; owl:onProperty ], + [ a owl:Restriction ; + owl:minCardinality 0 ; + owl:onProperty ], data_sheets_schema:DatasetProperty ; skos:definition """Indicates whether the data was collected directly from the individuals in question or obtained via third parties/other sources. """ ; @@ -107,10 +107,10 @@ data_sheets_schema:FormatDialect a owl:Class, linkml:ClassDefinition ; rdfs:label "Relationships" ; rdfs:subClassOf [ a owl:Restriction ; - owl:minCardinality 0 ; + owl:allValuesFrom linkml:String ; owl:onProperty ], [ a owl:Restriction ; - owl:allValuesFrom linkml:String ; + owl:minCardinality 0 ; owl:onProperty ], data_sheets_schema:DatasetProperty ; skos:definition """Are relationships between individual instances made explicit (e.g., users' movie ratings, social network links)? @@ -121,10 +121,10 @@ data_sheets_schema:FormatDialect a owl:Class, linkml:ClassDefinition ; rdfs:label "Splits" ; rdfs:subClassOf [ a owl:Restriction ; - owl:minCardinality 0 ; + owl:allValuesFrom linkml:String ; owl:onProperty ], [ a owl:Restriction ; - owl:allValuesFrom linkml:String ; + owl:minCardinality 0 ; owl:onProperty ], data_sheets_schema:DatasetProperty ; skos:definition """Are there recommended data splits (e.g., training, validation, testing)? If so, how are they defined and why? @@ -152,10 +152,10 @@ data_sheets_schema:FormatDialect a owl:Class, linkml:ClassDefinition ; rdfs:label "CollectionConsent" ; rdfs:subClassOf [ a owl:Restriction ; - owl:allValuesFrom linkml:String ; + owl:minCardinality 0 ; owl:onProperty ], [ a owl:Restriction ; - owl:minCardinality 0 ; + owl:allValuesFrom linkml:String ; owl:onProperty ], data_sheets_schema:DatasetProperty ; skos:definition """Did the individuals in question consent to the collection and use of their data? If so, how was consent requested and provided, and what language did individuals consent to? @@ -166,10 +166,10 @@ data_sheets_schema:FormatDialect a owl:Class, linkml:ClassDefinition ; rdfs:label "CollectionNotification" ; rdfs:subClassOf [ a owl:Restriction ; - owl:allValuesFrom linkml:String ; + owl:minCardinality 0 ; owl:onProperty ], [ a owl:Restriction ; - owl:minCardinality 0 ; + owl:allValuesFrom linkml:String ; owl:onProperty ], data_sheets_schema:DatasetProperty ; skos:definition """Were the individuals in question notified about the data collection? If so, please describe (or show with screenshots, etc.) how notice was provided, and reproduce the language of the notification itself if possible. @@ -215,17 +215,17 @@ data_sheets_schema:DataSubset a owl:Class, owl:minCardinality 0 ; owl:onProperty data_sheets_schema:is_subpopulation ], [ a owl:Restriction ; - owl:minCardinality 0 ; - owl:onProperty data_sheets_schema:is_data_split ], - [ a owl:Restriction ; - owl:allValuesFrom linkml:Boolean ; + owl:maxCardinality 1 ; owl:onProperty data_sheets_schema:is_subpopulation ], [ a owl:Restriction ; owl:maxCardinality 1 ; owl:onProperty data_sheets_schema:is_data_split ], [ a owl:Restriction ; - owl:maxCardinality 1 ; + owl:allValuesFrom linkml:Boolean ; owl:onProperty data_sheets_schema:is_subpopulation ], + [ a owl:Restriction ; + owl:minCardinality 0 ; + owl:onProperty data_sheets_schema:is_data_split ], data_sheets_schema:Dataset ; skos:definition "A subset of a dataset, likely containing multiple files of multiple potential purposes and properties." ; skos:inScheme . @@ -234,104 +234,104 @@ data_sheets_schema:File a owl:Class, linkml:ClassDefinition ; rdfs:label "File" ; rdfs:subClassOf [ a owl:Restriction ; - owl:minCardinality 0 ; - owl:onProperty data_sheets_schema:sha256 ], + owl:maxCardinality 1 ; + owl:onProperty data_sheets_schema:md5 ], [ a owl:Restriction ; - owl:allValuesFrom linkml:String ; - owl:onProperty data_sheets_schema:dialect ], + owl:allValuesFrom data_sheets_schema:EncodingEnum ; + owl:onProperty data_sheets_schema:encoding ], [ a owl:Restriction ; owl:minCardinality 0 ; owl:onProperty data_sheets_schema:dialect ], - [ a owl:Restriction ; - owl:allValuesFrom data_sheets_schema:FileTypeEnum ; - owl:onProperty data_sheets_schema:file_type ], - [ a owl:Restriction ; - owl:minCardinality 0 ; - owl:onProperty data_sheets_schema:format ], - [ a owl:Restriction ; - owl:allValuesFrom linkml:String ; - owl:onProperty data_sheets_schema:hash ], - [ a owl:Restriction ; - owl:allValuesFrom linkml:String ; - owl:onProperty data_sheets_schema:sha256 ], [ a owl:Restriction ; owl:maxCardinality 1 ; - owl:onProperty data_sheets_schema:sha256 ], + owl:onProperty data_sheets_schema:compression ], [ a owl:Restriction ; - owl:maxCardinality 1 ; - owl:onProperty data_sheets_schema:md5 ], + owl:allValuesFrom linkml:Integer ; + owl:onProperty data_sheets_schema:bytes ], [ a owl:Restriction ; owl:maxCardinality 1 ; - owl:onProperty data_sheets_schema:file_type ], + owl:onProperty data_sheets_schema:encoding ], [ a owl:Restriction ; - owl:allValuesFrom linkml:Integer ; + owl:maxCardinality 1 ; owl:onProperty data_sheets_schema:bytes ], [ a owl:Restriction ; owl:maxCardinality 1 ; - owl:onProperty data_sheets_schema:path ], + owl:onProperty data_sheets_schema:dialect ], [ a owl:Restriction ; owl:minCardinality 0 ; - owl:onProperty data_sheets_schema:hash ], + owl:onProperty data_sheets_schema:encoding ], [ a owl:Restriction ; - owl:maxCardinality 1 ; + owl:allValuesFrom data_sheets_schema:MediaTypeEnum ; owl:onProperty data_sheets_schema:media_type ], - [ a owl:Restriction ; - owl:minCardinality 0 ; - owl:onProperty data_sheets_schema:file_type ], [ a owl:Restriction ; owl:maxCardinality 1 ; owl:onProperty data_sheets_schema:hash ], [ a owl:Restriction ; - owl:maxCardinality 1 ; - owl:onProperty data_sheets_schema:compression ], + owl:minCardinality 0 ; + owl:onProperty data_sheets_schema:md5 ], [ a owl:Restriction ; owl:maxCardinality 1 ; - owl:onProperty data_sheets_schema:encoding ], + owl:onProperty data_sheets_schema:file_type ], [ a owl:Restriction ; - owl:maxCardinality 1 ; - owl:onProperty data_sheets_schema:format ], + owl:allValuesFrom linkml:String ; + owl:onProperty data_sheets_schema:hash ], [ a owl:Restriction ; owl:maxCardinality 1 ; - owl:onProperty data_sheets_schema:bytes ], + owl:onProperty data_sheets_schema:media_type ], [ a owl:Restriction ; owl:minCardinality 0 ; - owl:onProperty data_sheets_schema:path ], + owl:onProperty data_sheets_schema:format ], [ a owl:Restriction ; owl:minCardinality 0 ; - owl:onProperty data_sheets_schema:md5 ], + owl:onProperty data_sheets_schema:media_type ], [ a owl:Restriction ; owl:minCardinality 0 ; owl:onProperty data_sheets_schema:compression ], + [ a owl:Restriction ; + owl:allValuesFrom linkml:String ; + owl:onProperty data_sheets_schema:path ], + [ a owl:Restriction ; + owl:allValuesFrom data_sheets_schema:FileTypeEnum ; + owl:onProperty data_sheets_schema:file_type ], + [ a owl:Restriction ; + owl:maxCardinality 1 ; + owl:onProperty data_sheets_schema:format ], + [ a owl:Restriction ; + owl:allValuesFrom linkml:String ; + owl:onProperty data_sheets_schema:dialect ], [ a owl:Restriction ; owl:minCardinality 0 ; - owl:onProperty data_sheets_schema:bytes ], + owl:onProperty data_sheets_schema:file_type ], [ a owl:Restriction ; owl:allValuesFrom data_sheets_schema:CompressionEnum ; owl:onProperty data_sheets_schema:compression ], [ a owl:Restriction ; owl:minCardinality 0 ; - owl:onProperty data_sheets_schema:media_type ], - [ a owl:Restriction ; - owl:allValuesFrom data_sheets_schema:EncodingEnum ; - owl:onProperty data_sheets_schema:encoding ], + owl:onProperty data_sheets_schema:path ], [ a owl:Restriction ; owl:maxCardinality 1 ; - owl:onProperty data_sheets_schema:dialect ], + owl:onProperty data_sheets_schema:sha256 ], [ a owl:Restriction ; - owl:allValuesFrom linkml:String ; - owl:onProperty data_sheets_schema:md5 ], + owl:allValuesFrom data_sheets_schema:FormatEnum ; + owl:onProperty data_sheets_schema:format ], [ a owl:Restriction ; - owl:allValuesFrom linkml:String ; + owl:maxCardinality 1 ; owl:onProperty data_sheets_schema:path ], [ a owl:Restriction ; owl:minCardinality 0 ; - owl:onProperty data_sheets_schema:encoding ], + owl:onProperty data_sheets_schema:bytes ], [ a owl:Restriction ; - owl:allValuesFrom data_sheets_schema:MediaTypeEnum ; - owl:onProperty data_sheets_schema:media_type ], + owl:minCardinality 0 ; + owl:onProperty data_sheets_schema:sha256 ], [ a owl:Restriction ; - owl:allValuesFrom data_sheets_schema:FormatEnum ; - owl:onProperty data_sheets_schema:format ], + owl:minCardinality 0 ; + owl:onProperty data_sheets_schema:hash ], + [ a owl:Restriction ; + owl:allValuesFrom linkml:String ; + owl:onProperty data_sheets_schema:md5 ], + [ a owl:Restriction ; + owl:allValuesFrom linkml:String ; + owl:onProperty data_sheets_schema:sha256 ], data_sheets_schema:Information ; skos:altLabel "data file", "file", @@ -345,29 +345,29 @@ data_sheets_schema:Software a owl:Class, linkml:ClassDefinition ; rdfs:label "Software" ; rdfs:subClassOf [ a owl:Restriction ; - owl:maxCardinality 1 ; - owl:onProperty data_sheets_schema:version ], - [ a owl:Restriction ; - owl:minCardinality 0 ; - owl:onProperty data_sheets_schema:license ], - [ a owl:Restriction ; owl:allValuesFrom linkml:String ; owl:onProperty data_sheets_schema:license ], [ a owl:Restriction ; - owl:maxCardinality 1 ; + owl:allValuesFrom linkml:String ; owl:onProperty data_sheets_schema:url ], [ a owl:Restriction ; owl:minCardinality 0 ; - owl:onProperty data_sheets_schema:version ], + owl:onProperty data_sheets_schema:license ], [ a owl:Restriction ; owl:allValuesFrom linkml:String ; owl:onProperty data_sheets_schema:version ], [ a owl:Restriction ; - owl:allValuesFrom linkml:String ; + owl:maxCardinality 1 ; owl:onProperty data_sheets_schema:url ], [ a owl:Restriction ; owl:minCardinality 0 ; owl:onProperty data_sheets_schema:url ], + [ a owl:Restriction ; + owl:maxCardinality 1 ; + owl:onProperty data_sheets_schema:version ], + [ a owl:Restriction ; + owl:minCardinality 0 ; + owl:onProperty data_sheets_schema:version ], [ a owl:Restriction ; owl:maxCardinality 1 ; owl:onProperty data_sheets_schema:license ], @@ -396,19 +396,16 @@ data_sheets_schema:Software a owl:Class, rdfs:label "CollectionTimeframe" ; rdfs:subClassOf [ a owl:Restriction ; owl:minCardinality 0 ; - owl:onProperty ], + owl:onProperty ], [ a owl:Restriction ; - owl:minCardinality 0 ; + owl:allValuesFrom linkml:String ; owl:onProperty ], - [ a owl:Restriction ; - owl:minCardinality 0 ; - owl:onProperty ], [ a owl:Restriction ; owl:maxCardinality 1 ; owl:onProperty ], [ a owl:Restriction ; - owl:allValuesFrom linkml:String ; - owl:onProperty ], + owl:maxCardinality 1 ; + owl:onProperty ], [ a owl:Restriction ; owl:allValuesFrom linkml:Date ; owl:onProperty ], @@ -416,8 +413,11 @@ data_sheets_schema:Software a owl:Class, owl:allValuesFrom linkml:Date ; owl:onProperty ], [ a owl:Restriction ; - owl:maxCardinality 1 ; + owl:minCardinality 0 ; owl:onProperty ], + [ a owl:Restriction ; + owl:minCardinality 0 ; + owl:onProperty ], data_sheets_schema:DatasetProperty ; skos:definition """Over what timeframe was the data collected, and does this timeframe match the creation timeframe of the underlying data? """ ; @@ -428,6 +428,12 @@ data_sheets_schema:Software a owl:Class, linkml:ClassDefinition ; rdfs:label "DataCollector" ; rdfs:subClassOf [ a owl:Restriction ; + owl:allValuesFrom linkml:String ; + owl:onProperty ], + [ a owl:Restriction ; + owl:minCardinality 0 ; + owl:onProperty ], + [ a owl:Restriction ; owl:maxCardinality 1 ; owl:onProperty ], [ a owl:Restriction ; @@ -436,12 +442,6 @@ data_sheets_schema:Software a owl:Class, [ a owl:Restriction ; owl:minCardinality 0 ; owl:onProperty ], - [ a owl:Restriction ; - owl:allValuesFrom linkml:String ; - owl:onProperty ], - [ a owl:Restriction ; - owl:minCardinality 0 ; - owl:onProperty ], data_sheets_schema:DatasetProperty ; skos:definition """Who was involved in the data collection (e.g., students, crowdworkers, contractors), and how they were compensated. """ ; @@ -452,46 +452,46 @@ data_sheets_schema:Software a owl:Class, rdfs:label "InstanceAcquisition" ; rdfs:subClassOf [ a owl:Restriction ; owl:maxCardinality 1 ; - owl:onProperty ], + owl:onProperty ], [ a owl:Restriction ; owl:allValuesFrom linkml:Boolean ; owl:onProperty ], [ a owl:Restriction ; - owl:minCardinality 0 ; - owl:onProperty ], + owl:allValuesFrom linkml:String ; + owl:onProperty ], [ a owl:Restriction ; - owl:maxCardinality 1 ; + owl:minCardinality 0 ; owl:onProperty ], [ a owl:Restriction ; owl:minCardinality 0 ; - owl:onProperty ], + owl:onProperty ], [ a owl:Restriction ; owl:maxCardinality 1 ; + owl:onProperty ], + [ a owl:Restriction ; + owl:minCardinality 0 ; owl:onProperty ], [ a owl:Restriction ; owl:allValuesFrom linkml:Boolean ; owl:onProperty ], - [ a owl:Restriction ; - owl:allValuesFrom linkml:String ; - owl:onProperty ], [ a owl:Restriction ; owl:minCardinality 0 ; - owl:onProperty ], + owl:onProperty ], [ a owl:Restriction ; owl:allValuesFrom linkml:Boolean ; + owl:onProperty ], + [ a owl:Restriction ; + owl:maxCardinality 1 ; owl:onProperty ], [ a owl:Restriction ; - owl:minCardinality 0 ; - owl:onProperty ], + owl:maxCardinality 1 ; + owl:onProperty ], [ a owl:Restriction ; owl:minCardinality 0 ; - owl:onProperty ], + owl:onProperty ], [ a owl:Restriction ; owl:allValuesFrom linkml:Boolean ; - owl:onProperty ], - [ a owl:Restriction ; - owl:maxCardinality 1 ; - owl:onProperty ], + owl:onProperty ], data_sheets_schema:DatasetProperty ; skos:definition """Describes how data associated with each instance was acquired (e.g., directly observed, reported by subjects, inferred). """ ; @@ -505,22 +505,22 @@ data_sheets_schema:Software a owl:Class, owl:onProperty ], [ a owl:Restriction ; owl:allValuesFrom linkml:String ; + owl:onProperty ], + [ a owl:Restriction ; + owl:minCardinality 0 ; owl:onProperty ], [ a owl:Restriction ; - owl:allValuesFrom linkml:String ; + owl:minCardinality 0 ; owl:onProperty ], [ a owl:Restriction ; - owl:minCardinality 0 ; + owl:allValuesFrom linkml:String ; owl:onProperty ], [ a owl:Restriction ; - owl:minCardinality 0 ; + owl:allValuesFrom linkml:String ; owl:onProperty ], [ a owl:Restriction ; owl:minCardinality 0 ; owl:onProperty ], - [ a owl:Restriction ; - owl:allValuesFrom linkml:String ; - owl:onProperty ], data_sheets_schema:DatasetProperty ; skos:definition """Documentation of missing data in the dataset, including patterns, causes, and strategies for handling missing values. """ ; @@ -532,34 +532,34 @@ data_sheets_schema:Software a owl:Class, rdfs:label "RawDataSource" ; rdfs:subClassOf [ a owl:Restriction ; owl:minCardinality 0 ; - owl:onProperty ], + owl:onProperty ], [ a owl:Restriction ; - owl:allValuesFrom linkml:String ; - owl:onProperty ], + owl:minCardinality 1 ; + owl:onProperty ], [ a owl:Restriction ; owl:allValuesFrom linkml:String ; - owl:onProperty ], + owl:onProperty ], [ a owl:Restriction ; owl:allValuesFrom linkml:String ; - owl:onProperty ], + owl:onProperty ], + [ a owl:Restriction ; + owl:maxCardinality 1 ; + owl:onProperty ], [ a owl:Restriction ; owl:minCardinality 0 ; + owl:onProperty ], + [ a owl:Restriction ; + owl:allValuesFrom linkml:String ; owl:onProperty ], [ a owl:Restriction ; owl:maxCardinality 1 ; - owl:onProperty ], - [ a owl:Restriction ; - owl:minCardinality 1 ; owl:onProperty ], [ a owl:Restriction ; owl:allValuesFrom linkml:String ; - owl:onProperty ], + owl:onProperty ], [ a owl:Restriction ; owl:minCardinality 0 ; owl:onProperty ], - [ a owl:Restriction ; - owl:maxCardinality 1 ; - owl:onProperty ], data_sheets_schema:DatasetProperty ; skos:definition """Description of raw data sources before preprocessing, cleaning, or labeling. Documents where the original data comes from and how it can be accessed. """ ; @@ -570,19 +570,19 @@ data_sheets_schema:Software a owl:Class, linkml:ClassDefinition ; rdfs:label "Confidentiality" ; rdfs:subClassOf [ a owl:Restriction ; - owl:allValuesFrom linkml:Boolean ; - owl:onProperty ], - [ a owl:Restriction ; owl:minCardinality 0 ; - owl:onProperty ], + owl:onProperty ], [ a owl:Restriction ; - owl:minCardinality 0 ; + owl:maxCardinality 1 ; owl:onProperty ], [ a owl:Restriction ; owl:allValuesFrom linkml:String ; owl:onProperty ], [ a owl:Restriction ; - owl:maxCardinality 1 ; + owl:minCardinality 0 ; + owl:onProperty ], + [ a owl:Restriction ; + owl:allValuesFrom linkml:Boolean ; owl:onProperty ], data_sheets_schema:DatasetProperty ; skos:definition """Does the dataset contain data that might be confidential (e.g., protected by legal privilege, patient data, non-public communications)? @@ -593,20 +593,20 @@ data_sheets_schema:Software a owl:Class, linkml:ClassDefinition ; rdfs:label "ContentWarning" ; rdfs:subClassOf [ a owl:Restriction ; - owl:maxCardinality 1 ; - owl:onProperty ], + owl:minCardinality 0 ; + owl:onProperty ], + [ a owl:Restriction ; + owl:allValuesFrom linkml:String ; + owl:onProperty ], [ a owl:Restriction ; owl:minCardinality 0 ; owl:onProperty ], [ a owl:Restriction ; - owl:allValuesFrom linkml:Boolean ; + owl:maxCardinality 1 ; owl:onProperty ], [ a owl:Restriction ; - owl:minCardinality 0 ; - owl:onProperty ], - [ a owl:Restriction ; - owl:allValuesFrom linkml:String ; - owl:onProperty ], + owl:allValuesFrom linkml:Boolean ; + owl:onProperty ], data_sheets_schema:DatasetProperty ; skos:definition """Does the dataset contain any data that might be offensive, insulting, threatening, or otherwise anxiety-provoking if viewed directly? """ ; @@ -634,34 +634,34 @@ data_sheets_schema:Software a owl:Class, owl:onProperty ], [ a owl:Restriction ; owl:minCardinality 0 ; - owl:onProperty ], - [ a owl:Restriction ; - owl:allValuesFrom linkml:String ; owl:onProperty ], [ a owl:Restriction ; - owl:allValuesFrom linkml:String ; + owl:minCardinality 0 ; owl:onProperty ], - [ a owl:Restriction ; - owl:allValuesFrom data_sheets_schema:BiasTypeEnum ; - owl:onProperty ], [ a owl:Restriction ; owl:maxCardinality 1 ; - owl:onProperty ], + owl:onProperty ], [ a owl:Restriction ; owl:minCardinality 0 ; - owl:onProperty ], + owl:onProperty ], [ a owl:Restriction ; owl:maxCardinality 1 ; - owl:onProperty ], + owl:onProperty ], [ a owl:Restriction ; owl:maxCardinality 1 ; - owl:onProperty ], + owl:onProperty ], [ a owl:Restriction ; - owl:minCardinality 0 ; + owl:allValuesFrom linkml:String ; owl:onProperty ], [ a owl:Restriction ; - owl:minCardinality 0 ; + owl:allValuesFrom linkml:String ; owl:onProperty ], + [ a owl:Restriction ; + owl:allValuesFrom data_sheets_schema:BiasTypeEnum ; + owl:onProperty ], + [ a owl:Restriction ; + owl:minCardinality 0 ; + owl:onProperty ], data_sheets_schema:DatasetProperty ; skos:definition """Documents known biases present in the dataset. Biases are systematic errors or prejudices that may affect the representativeness or fairness of the data. Distinct from anomalies (data quality issues) and limitations (scope constraints). """ ; @@ -672,41 +672,41 @@ data_sheets_schema:Software a owl:Class, linkml:ClassDefinition ; rdfs:label "DatasetLimitation" ; rdfs:subClassOf [ a owl:Restriction ; - owl:allValuesFrom linkml:String ; - owl:onProperty ], - [ a owl:Restriction ; owl:maxCardinality 1 ; - owl:onProperty ], + owl:onProperty ], + [ a owl:Restriction ; + owl:allValuesFrom linkml:String ; + owl:onProperty ], [ a owl:Restriction ; owl:minCardinality 0 ; owl:onProperty ], [ a owl:Restriction ; - owl:maxCardinality 1 ; + owl:minCardinality 0 ; owl:onProperty ], [ a owl:Restriction ; owl:minCardinality 0 ; owl:onProperty ], [ a owl:Restriction ; owl:allValuesFrom linkml:String ; - owl:onProperty ], + owl:onProperty ], [ a owl:Restriction ; - owl:maxCardinality 1 ; - owl:onProperty ], + owl:allValuesFrom data_sheets_schema:LimitationTypeEnum ; + owl:onProperty ], [ a owl:Restriction ; owl:minCardinality 0 ; - owl:onProperty ], + owl:onProperty ], [ a owl:Restriction ; owl:maxCardinality 1 ; - owl:onProperty ], + owl:onProperty ], [ a owl:Restriction ; - owl:minCardinality 0 ; + owl:allValuesFrom linkml:String ; owl:onProperty ], [ a owl:Restriction ; - owl:allValuesFrom linkml:String ; - owl:onProperty ], + owl:maxCardinality 1 ; + owl:onProperty ], [ a owl:Restriction ; - owl:allValuesFrom data_sheets_schema:LimitationTypeEnum ; - owl:onProperty ], + owl:maxCardinality 1 ; + owl:onProperty ], data_sheets_schema:DatasetProperty ; skos:definition """Documents known limitations of the dataset that may affect its use or interpretation. Distinct from biases (systematic errors) and anomalies (data quality issues). """ ; @@ -718,16 +718,7 @@ data_sheets_schema:Software a owl:Class, rdfs:label "DatasetRelationship" ; rdfs:subClassOf [ a owl:Restriction ; owl:maxCardinality 1 ; - owl:onProperty ], - [ a owl:Restriction ; - owl:minCardinality 1 ; - owl:onProperty ], - [ a owl:Restriction ; - owl:minCardinality 1 ; - owl:onProperty ], - [ a owl:Restriction ; - owl:allValuesFrom data_sheets_schema:DatasetRelationshipTypeEnum ; - owl:onProperty ], + owl:onProperty ], [ a owl:Restriction ; owl:minCardinality 0 ; owl:onProperty ], @@ -739,10 +730,19 @@ data_sheets_schema:Software a owl:Class, owl:onProperty ], [ a owl:Restriction ; owl:maxCardinality 1 ; - owl:onProperty ], + owl:onProperty ], [ a owl:Restriction ; owl:maxCardinality 1 ; owl:onProperty ], + [ a owl:Restriction ; + owl:allValuesFrom data_sheets_schema:DatasetRelationshipTypeEnum ; + owl:onProperty ], + [ a owl:Restriction ; + owl:minCardinality 1 ; + owl:onProperty ], + [ a owl:Restriction ; + owl:minCardinality 1 ; + owl:onProperty ], data_sheets_schema:DatasetProperty ; skos:definition """Typed relationship to another dataset, enabling precise specification of how datasets relate to each other (e.g., supplements, derives from, is version of). Supports RO-Crate-style dataset interlinking. """ ; @@ -752,23 +752,11 @@ data_sheets_schema:Software a owl:Class, linkml:ClassDefinition ; rdfs:label "Deidentification" ; rdfs:subClassOf [ a owl:Restriction ; - owl:allValuesFrom linkml:String ; - owl:onProperty ], - [ a owl:Restriction ; - owl:maxCardinality 1 ; - owl:onProperty ], - [ a owl:Restriction ; - owl:allValuesFrom linkml:String ; + owl:minCardinality 0 ; owl:onProperty ], - [ a owl:Restriction ; - owl:maxCardinality 1 ; - owl:onProperty ], [ a owl:Restriction ; owl:minCardinality 0 ; owl:onProperty ], - [ a owl:Restriction ; - owl:allValuesFrom linkml:String ; - owl:onProperty ], [ a owl:Restriction ; owl:minCardinality 0 ; owl:onProperty ], @@ -776,11 +764,23 @@ data_sheets_schema:Software a owl:Class, owl:minCardinality 0 ; owl:onProperty ], [ a owl:Restriction ; - owl:minCardinality 0 ; - owl:onProperty ], + owl:maxCardinality 1 ; + owl:onProperty ], [ a owl:Restriction ; owl:allValuesFrom linkml:Boolean ; owl:onProperty ], + [ a owl:Restriction ; + owl:allValuesFrom linkml:String ; + owl:onProperty ], + [ a owl:Restriction ; + owl:allValuesFrom linkml:String ; + owl:onProperty ], + [ a owl:Restriction ; + owl:maxCardinality 1 ; + owl:onProperty ], + [ a owl:Restriction ; + owl:allValuesFrom linkml:String ; + owl:onProperty ], data_sheets_schema:DatasetProperty ; skos:definition """Is it possible to identify individuals in the dataset, either directly or indirectly (in combination with other data)? """ ; @@ -793,26 +793,38 @@ data_sheets_schema:Software a owl:Class, owl:maxCardinality 1 ; owl:onProperty ], [ a owl:Restriction ; - owl:allValuesFrom linkml:Uriorcurie ; - owl:onProperty ], + owl:allValuesFrom ; + owl:onProperty ], [ a owl:Restriction ; - owl:minCardinality 0 ; + owl:maxCardinality 1 ; owl:onProperty ], [ a owl:Restriction ; owl:maxCardinality 1 ; - owl:onProperty ], + owl:onProperty ], + [ a owl:Restriction ; + owl:minCardinality 0 ; + owl:onProperty ], + [ a owl:Restriction ; + owl:allValuesFrom linkml:Uriorcurie ; + owl:onProperty ], [ a owl:Restriction ; owl:allValuesFrom linkml:String ; owl:onProperty ], + [ a owl:Restriction ; + owl:allValuesFrom linkml:Uriorcurie ; + owl:onProperty ], + [ a owl:Restriction ; + owl:minCardinality 0 ; + owl:onProperty ], [ a owl:Restriction ; owl:maxCardinality 1 ; - owl:onProperty ], + owl:onProperty ], [ a owl:Restriction ; owl:allValuesFrom linkml:String ; owl:onProperty ], [ a owl:Restriction ; owl:minCardinality 0 ; - owl:onProperty ], + owl:onProperty ], [ a owl:Restriction ; owl:minCardinality 0 ; owl:onProperty ], @@ -825,36 +837,24 @@ data_sheets_schema:Software a owl:Class, [ a owl:Restriction ; owl:allValuesFrom linkml:Integer ; owl:onProperty ], - [ a owl:Restriction ; - owl:allValuesFrom ; - owl:onProperty ], - [ a owl:Restriction ; - owl:minCardinality 0 ; - owl:onProperty ], [ a owl:Restriction ; owl:minCardinality 0 ; owl:onProperty ], - [ a owl:Restriction ; - owl:minCardinality 0 ; - owl:onProperty ], [ a owl:Restriction ; owl:allValuesFrom ; owl:onProperty ], - [ a owl:Restriction ; - owl:maxCardinality 1 ; - owl:onProperty ], [ a owl:Restriction ; owl:minCardinality 0 ; - owl:onProperty ], - [ a owl:Restriction ; - owl:allValuesFrom linkml:Uriorcurie ; - owl:onProperty ], + owl:onProperty ], [ a owl:Restriction ; owl:minCardinality 0 ; - owl:onProperty ], + owl:onProperty ], [ a owl:Restriction ; owl:maxCardinality 1 ; owl:onProperty ], + [ a owl:Restriction ; + owl:minCardinality 0 ; + owl:onProperty ], data_sheets_schema:DatasetProperty ; skos:definition """What do the instances that comprise the dataset represent (e.g., documents, photos, people, countries)? """ ; @@ -864,14 +864,14 @@ data_sheets_schema:Software a owl:Class, linkml:ClassDefinition ; rdfs:label "MissingInfo" ; rdfs:subClassOf [ a owl:Restriction ; + owl:allValuesFrom linkml:String ; + owl:onProperty ], + [ a owl:Restriction ; owl:minCardinality 0 ; owl:onProperty ], [ a owl:Restriction ; owl:allValuesFrom linkml:String ; owl:onProperty ], - [ a owl:Restriction ; - owl:allValuesFrom linkml:String ; - owl:onProperty ], [ a owl:Restriction ; owl:minCardinality 0 ; owl:onProperty ], @@ -886,6 +886,9 @@ data_sheets_schema:Software a owl:Class, rdfs:subClassOf [ a owl:Restriction ; owl:allValuesFrom linkml:String ; owl:onProperty ], + [ a owl:Restriction ; + owl:minCardinality 0 ; + owl:onProperty ], [ a owl:Restriction ; owl:minCardinality 0 ; owl:onProperty ], @@ -895,9 +898,6 @@ data_sheets_schema:Software a owl:Class, [ a owl:Restriction ; owl:maxCardinality 1 ; owl:onProperty ], - [ a owl:Restriction ; - owl:minCardinality 0 ; - owl:onProperty ], data_sheets_schema:DatasetProperty ; skos:definition """Does the dataset contain data that might be considered sensitive (e.g., race, sexual orientation, religion, biometrics)? """ ; @@ -908,6 +908,15 @@ data_sheets_schema:Software a owl:Class, linkml:ClassDefinition ; rdfs:label "Subpopulation" ; rdfs:subClassOf [ a owl:Restriction ; + owl:allValuesFrom linkml:String ; + owl:onProperty ], + [ a owl:Restriction ; + owl:allValuesFrom linkml:String ; + owl:onProperty ], + [ a owl:Restriction ; + owl:minCardinality 0 ; + owl:onProperty ], + [ a owl:Restriction ; owl:minCardinality 0 ; owl:onProperty ], [ a owl:Restriction ; @@ -916,18 +925,9 @@ data_sheets_schema:Software a owl:Class, [ a owl:Restriction ; owl:allValuesFrom linkml:Boolean ; owl:onProperty ], - [ a owl:Restriction ; - owl:allValuesFrom linkml:String ; - owl:onProperty ], [ a owl:Restriction ; owl:maxCardinality 1 ; owl:onProperty ], - [ a owl:Restriction ; - owl:allValuesFrom linkml:String ; - owl:onProperty ], - [ a owl:Restriction ; - owl:minCardinality 0 ; - owl:onProperty ], data_sheets_schema:DatasetProperty ; skos:definition """Does the dataset identify any subpopulations (e.g., by age, gender)? If so, how are they identified and what are their distributions? """ ; @@ -937,44 +937,44 @@ data_sheets_schema:Software a owl:Class, linkml:ClassDefinition ; rdfs:label "ExportControlRegulatoryRestrictions" ; rdfs:subClassOf [ a owl:Restriction ; - owl:minCardinality 0 ; - owl:onProperty ], - [ a owl:Restriction ; - owl:allValuesFrom data_sheets_schema:ConfidentialityLevelEnum ; - owl:onProperty ], + owl:maxCardinality 1 ; + owl:onProperty ], [ a owl:Restriction ; owl:minCardinality 0 ; - owl:onProperty ], + owl:onProperty ], [ a owl:Restriction ; owl:maxCardinality 1 ; - owl:onProperty ], - [ a owl:Restriction ; - owl:maxCardinality 1 ; - owl:onProperty ], - [ a owl:Restriction ; - owl:allValuesFrom data_sheets_schema:ComplianceStatusEnum ; - owl:onProperty ], + owl:onProperty ], [ a owl:Restriction ; owl:allValuesFrom linkml:String ; owl:onProperty ], [ a owl:Restriction ; - owl:minCardinality 0 ; - owl:onProperty ], - [ a owl:Restriction ; - owl:minCardinality 0 ; + owl:allValuesFrom data_sheets_schema:Person ; owl:onProperty ], [ a owl:Restriction ; owl:maxCardinality 1 ; - owl:onProperty ], + owl:onProperty ], [ a owl:Restriction ; owl:minCardinality 0 ; - owl:onProperty ], + owl:onProperty ], [ a owl:Restriction ; - owl:allValuesFrom data_sheets_schema:Person ; + owl:allValuesFrom data_sheets_schema:ConfidentialityLevelEnum ; + owl:onProperty ], + [ a owl:Restriction ; + owl:minCardinality 0 ; owl:onProperty ], [ a owl:Restriction ; owl:allValuesFrom linkml:String ; owl:onProperty ], + [ a owl:Restriction ; + owl:minCardinality 0 ; + owl:onProperty ], + [ a owl:Restriction ; + owl:allValuesFrom data_sheets_schema:ComplianceStatusEnum ; + owl:onProperty ], + [ a owl:Restriction ; + owl:minCardinality 0 ; + owl:onProperty ], data_sheets_schema:DatasetProperty ; skos:definition """Do any export controls or other regulatory restrictions apply to the dataset or to individual instances? Includes compliance tracking for regulations like HIPAA and other US regulations. If so, please describe these restrictions and provide a link or copy of any supporting documentation. Maps to DUO terms related to ethics approval, geographic restrictions, and institutional requirements. """ ; @@ -998,25 +998,25 @@ data_sheets_schema:Software a owl:Class, linkml:ClassDefinition ; rdfs:label "LicenseAndUseTerms" ; rdfs:subClassOf [ a owl:Restriction ; + owl:allValuesFrom data_sheets_schema:Person ; + owl:onProperty ], + [ a owl:Restriction ; owl:maxCardinality 1 ; owl:onProperty ], [ a owl:Restriction ; - owl:minCardinality 0 ; + owl:allValuesFrom linkml:String ; owl:onProperty ], [ a owl:Restriction ; - owl:allValuesFrom data_sheets_schema:Person ; - owl:onProperty ], - [ a owl:Restriction ; - owl:allValuesFrom data_sheets_schema:DataUsePermissionEnum ; + owl:minCardinality 0 ; owl:onProperty ], [ a owl:Restriction ; - owl:allValuesFrom linkml:String ; + owl:minCardinality 0 ; owl:onProperty ], [ a owl:Restriction ; owl:minCardinality 0 ; owl:onProperty ], [ a owl:Restriction ; - owl:minCardinality 0 ; + owl:allValuesFrom data_sheets_schema:DataUsePermissionEnum ; owl:onProperty ], data_sheets_schema:DatasetProperty ; skos:definition """Will the dataset be distributed under a copyright or other IP license, and/or under applicable terms of use? Provide a link or copy of relevant licensing terms and any fees. @@ -1027,10 +1027,10 @@ data_sheets_schema:Software a owl:Class, linkml:ClassDefinition ; rdfs:label "DistributionDate" ; rdfs:subClassOf [ a owl:Restriction ; - owl:minCardinality 0 ; + owl:allValuesFrom linkml:String ; owl:onProperty ], [ a owl:Restriction ; - owl:allValuesFrom linkml:String ; + owl:minCardinality 0 ; owl:onProperty ], data_sheets_schema:DatasetProperty ; skos:definition """When will the dataset be distributed? @@ -1041,10 +1041,10 @@ data_sheets_schema:Software a owl:Class, linkml:ClassDefinition ; rdfs:label "DistributionFormat" ; rdfs:subClassOf [ a owl:Restriction ; - owl:allValuesFrom linkml:String ; + owl:minCardinality 0 ; owl:onProperty ], [ a owl:Restriction ; - owl:minCardinality 0 ; + owl:allValuesFrom linkml:String ; owl:onProperty ], data_sheets_schema:DatasetProperty ; skos:definition """How will the dataset be distributed (e.g., tarball on a website, API, GitHub)? @@ -1055,10 +1055,10 @@ data_sheets_schema:Software a owl:Class, linkml:ClassDefinition ; rdfs:label "DataProtectionImpact" ; rdfs:subClassOf [ a owl:Restriction ; - owl:allValuesFrom linkml:String ; + owl:minCardinality 0 ; owl:onProperty ], [ a owl:Restriction ; - owl:minCardinality 0 ; + owl:allValuesFrom linkml:String ; owl:onProperty ], data_sheets_schema:DatasetProperty ; skos:definition """Has an analysis of the potential impact of the dataset and its use on data subjects (e.g., a data protection impact analysis) been conducted? If so, please provide a description of this analysis, including the outcomes, and any supporting documentation. @@ -1069,28 +1069,28 @@ data_sheets_schema:Software a owl:Class, linkml:ClassDefinition ; rdfs:label "EthicalReview" ; rdfs:subClassOf [ a owl:Restriction ; - owl:allValuesFrom data_sheets_schema:Organization ; - owl:onProperty ], - [ a owl:Restriction ; owl:minCardinality 0 ; owl:onProperty ], - [ a owl:Restriction ; - owl:minCardinality 0 ; - owl:onProperty ], - [ a owl:Restriction ; - owl:minCardinality 0 ; - owl:onProperty ], [ a owl:Restriction ; owl:maxCardinality 1 ; owl:onProperty ], [ a owl:Restriction ; owl:maxCardinality 1 ; owl:onProperty ], + [ a owl:Restriction ; + owl:allValuesFrom data_sheets_schema:Person ; + owl:onProperty ], [ a owl:Restriction ; owl:allValuesFrom linkml:String ; owl:onProperty ], [ a owl:Restriction ; - owl:allValuesFrom data_sheets_schema:Person ; + owl:allValuesFrom data_sheets_schema:Organization ; + owl:onProperty ], + [ a owl:Restriction ; + owl:minCardinality 0 ; + owl:onProperty ], + [ a owl:Restriction ; + owl:minCardinality 0 ; owl:onProperty ], data_sheets_schema:DatasetProperty ; skos:definition """Were any ethical or compliance review processes conducted (e.g., by an institutional review board)? If so, please provide a description of these review processes, including the frequency of review and documentation of outcomes, as well as a link or other access point to any supporting documentation. @@ -1101,8 +1101,8 @@ data_sheets_schema:Software a owl:Class, linkml:ClassDefinition ; rdfs:label "AtRiskPopulations" ; rdfs:subClassOf [ a owl:Restriction ; - owl:minCardinality 0 ; - owl:onProperty ], + owl:maxCardinality 1 ; + owl:onProperty ], [ a owl:Restriction ; owl:allValuesFrom linkml:String ; owl:onProperty ], @@ -1110,23 +1110,23 @@ data_sheets_schema:Software a owl:Class, owl:allValuesFrom linkml:String ; owl:onProperty ], [ a owl:Restriction ; - owl:minCardinality 0 ; - owl:onProperty ], + owl:allValuesFrom linkml:String ; + owl:onProperty ], [ a owl:Restriction ; owl:allValuesFrom linkml:Boolean ; owl:onProperty ], [ a owl:Restriction ; owl:minCardinality 0 ; - owl:onProperty ], + owl:onProperty ], [ a owl:Restriction ; owl:minCardinality 0 ; - owl:onProperty ], - [ a owl:Restriction ; - owl:maxCardinality 1 ; - owl:onProperty ], + owl:onProperty ], [ a owl:Restriction ; - owl:allValuesFrom linkml:String ; + owl:minCardinality 0 ; owl:onProperty ], + [ a owl:Restriction ; + owl:minCardinality 0 ; + owl:onProperty ], data_sheets_schema:DatasetProperty ; skos:definition """Information about protections for at-risk populations in human subjects research. """ ; @@ -1136,32 +1136,32 @@ data_sheets_schema:Software a owl:Class, linkml:ClassDefinition ; rdfs:label "HumanSubjectCompensation" ; rdfs:subClassOf [ a owl:Restriction ; - owl:maxCardinality 1 ; - owl:onProperty ], + owl:allValuesFrom linkml:String ; + owl:onProperty ], [ a owl:Restriction ; owl:minCardinality 0 ; - owl:onProperty ], + owl:onProperty ], [ a owl:Restriction ; owl:minCardinality 0 ; - owl:onProperty ], + owl:onProperty ], [ a owl:Restriction ; - owl:allValuesFrom linkml:String ; - owl:onProperty ], + owl:allValuesFrom linkml:Boolean ; + owl:onProperty ], [ a owl:Restriction ; - owl:allValuesFrom linkml:String ; - owl:onProperty ], + owl:maxCardinality 1 ; + owl:onProperty ], [ a owl:Restriction ; owl:minCardinality 0 ; - owl:onProperty ], - [ a owl:Restriction ; - owl:allValuesFrom linkml:Boolean ; owl:onProperty ], [ a owl:Restriction ; owl:allValuesFrom linkml:String ; owl:onProperty ], + [ a owl:Restriction ; + owl:allValuesFrom linkml:String ; + owl:onProperty ], [ a owl:Restriction ; owl:minCardinality 0 ; - owl:onProperty ], + owl:onProperty ], data_sheets_schema:DatasetProperty ; skos:definition """Information about compensation or incentives provided to human research participants. """ ; @@ -1171,38 +1171,38 @@ data_sheets_schema:Software a owl:Class, linkml:ClassDefinition ; rdfs:label "HumanSubjectResearch" ; rdfs:subClassOf [ a owl:Restriction ; - owl:allValuesFrom linkml:String ; - owl:onProperty ], + owl:minCardinality 0 ; + owl:onProperty ], [ a owl:Restriction ; - owl:maxCardinality 1 ; + owl:allValuesFrom linkml:Boolean ; owl:onProperty ], [ a owl:Restriction ; owl:allValuesFrom linkml:String ; - owl:onProperty ], + owl:onProperty ], + [ a owl:Restriction ; + owl:maxCardinality 1 ; + owl:onProperty ], [ a owl:Restriction ; owl:minCardinality 0 ; owl:onProperty ], + [ a owl:Restriction ; + owl:minCardinality 0 ; + owl:onProperty ], [ a owl:Restriction ; owl:allValuesFrom linkml:String ; owl:onProperty ], [ a owl:Restriction ; - owl:allValuesFrom linkml:Boolean ; - owl:onProperty ], - [ a owl:Restriction ; - owl:minCardinality 0 ; + owl:allValuesFrom linkml:String ; owl:onProperty ], [ a owl:Restriction ; owl:allValuesFrom linkml:String ; - owl:onProperty ], - [ a owl:Restriction ; - owl:minCardinality 0 ; - owl:onProperty ], + owl:onProperty ], [ a owl:Restriction ; owl:minCardinality 0 ; - owl:onProperty ], + owl:onProperty ], [ a owl:Restriction ; owl:minCardinality 0 ; - owl:onProperty ], + owl:onProperty ], data_sheets_schema:DatasetProperty ; skos:definition """Information about whether the dataset involves human subjects research and what regulatory or ethical review processes were followed. """ ; @@ -1212,38 +1212,38 @@ data_sheets_schema:Software a owl:Class, linkml:ClassDefinition ; rdfs:label "InformedConsent" ; rdfs:subClassOf [ a owl:Restriction ; - owl:allValuesFrom linkml:String ; + owl:minCardinality 0 ; owl:onProperty ], [ a owl:Restriction ; - owl:allValuesFrom linkml:String ; + owl:minCardinality 0 ; owl:onProperty ], + [ a owl:Restriction ; + owl:allValuesFrom linkml:Boolean ; + owl:onProperty ], [ a owl:Restriction ; owl:allValuesFrom linkml:String ; owl:onProperty ], [ a owl:Restriction ; - owl:allValuesFrom linkml:Boolean ; - owl:onProperty ], + owl:minCardinality 0 ; + owl:onProperty ], [ a owl:Restriction ; owl:maxCardinality 1 ; owl:onProperty ], [ a owl:Restriction ; - owl:minCardinality 0 ; - owl:onProperty ], + owl:allValuesFrom linkml:String ; + owl:onProperty ], [ a owl:Restriction ; - owl:minCardinality 0 ; - owl:onProperty ], + owl:allValuesFrom linkml:String ; + owl:onProperty ], [ a owl:Restriction ; owl:minCardinality 0 ; - owl:onProperty ], + owl:onProperty ], [ a owl:Restriction ; owl:minCardinality 0 ; - owl:onProperty ], + owl:onProperty ], [ a owl:Restriction ; owl:allValuesFrom linkml:String ; - owl:onProperty ], - [ a owl:Restriction ; - owl:minCardinality 0 ; - owl:onProperty ], + owl:onProperty ], data_sheets_schema:DatasetProperty ; skos:definition """Details about informed consent procedures used in human subjects research. """ ; @@ -1253,29 +1253,29 @@ data_sheets_schema:Software a owl:Class, linkml:ClassDefinition ; rdfs:label "ParticipantPrivacy" ; rdfs:subClassOf [ a owl:Restriction ; - owl:allValuesFrom linkml:String ; - owl:onProperty ], - [ a owl:Restriction ; - owl:allValuesFrom linkml:String ; + owl:minCardinality 0 ; owl:onProperty ], [ a owl:Restriction ; owl:minCardinality 0 ; - owl:onProperty ], + owl:onProperty ], [ a owl:Restriction ; - owl:minCardinality 0 ; - owl:onProperty ], + owl:allValuesFrom linkml:String ; + owl:onProperty ], [ a owl:Restriction ; owl:allValuesFrom linkml:String ; - owl:onProperty ], + owl:onProperty ], [ a owl:Restriction ; owl:minCardinality 0 ; - owl:onProperty ], + owl:onProperty ], [ a owl:Restriction ; owl:minCardinality 0 ; - owl:onProperty ], + owl:onProperty ], [ a owl:Restriction ; owl:allValuesFrom linkml:String ; - owl:onProperty ], + owl:onProperty ], + [ a owl:Restriction ; + owl:allValuesFrom linkml:String ; + owl:onProperty ], data_sheets_schema:DatasetProperty ; skos:definition """Information about privacy protections and anonymization procedures for human research participants. """ ; @@ -1285,16 +1285,16 @@ data_sheets_schema:Software a owl:Class, linkml:ClassDefinition ; rdfs:label "Erratum" ; rdfs:subClassOf [ a owl:Restriction ; - owl:allValuesFrom linkml:Uri ; - owl:onProperty ], + owl:minCardinality 0 ; + owl:onProperty ], [ a owl:Restriction ; owl:maxCardinality 1 ; owl:onProperty ], [ a owl:Restriction ; - owl:allValuesFrom linkml:String ; - owl:onProperty ], + owl:allValuesFrom linkml:Uri ; + owl:onProperty ], [ a owl:Restriction ; - owl:minCardinality 0 ; + owl:allValuesFrom linkml:String ; owl:onProperty ], [ a owl:Restriction ; owl:minCardinality 0 ; @@ -1308,20 +1308,20 @@ data_sheets_schema:Software a owl:Class, linkml:ClassDefinition ; rdfs:label "ExtensionMechanism" ; rdfs:subClassOf [ a owl:Restriction ; - owl:minCardinality 0 ; - owl:onProperty ], - [ a owl:Restriction ; owl:allValuesFrom linkml:Uri ; owl:onProperty ], [ a owl:Restriction ; owl:minCardinality 0 ; owl:onProperty ], [ a owl:Restriction ; - owl:allValuesFrom linkml:String ; - owl:onProperty ], + owl:minCardinality 0 ; + owl:onProperty ], [ a owl:Restriction ; owl:maxCardinality 1 ; owl:onProperty ], + [ a owl:Restriction ; + owl:allValuesFrom linkml:String ; + owl:onProperty ], data_sheets_schema:DatasetProperty ; skos:definition """If others want to extend/augment/build on/contribute to the dataset, is there a mechanism for them to do so? If so, please describe how those contributions are validated and communicated. """ ; @@ -1331,17 +1331,17 @@ data_sheets_schema:Software a owl:Class, linkml:ClassDefinition ; rdfs:label "Maintainer" ; rdfs:subClassOf [ a owl:Restriction ; - owl:maxCardinality 1 ; - owl:onProperty ], + owl:allValuesFrom linkml:String ; + owl:onProperty ], [ a owl:Restriction ; owl:minCardinality 0 ; owl:onProperty ], [ a owl:Restriction ; - owl:allValuesFrom data_sheets_schema:CreatorOrMaintainerEnum ; + owl:maxCardinality 1 ; owl:onProperty ], [ a owl:Restriction ; - owl:allValuesFrom linkml:String ; - owl:onProperty ], + owl:allValuesFrom data_sheets_schema:CreatorOrMaintainerEnum ; + owl:onProperty ], [ a owl:Restriction ; owl:minCardinality 0 ; owl:onProperty ], @@ -1354,20 +1354,20 @@ data_sheets_schema:Software a owl:Class, linkml:ClassDefinition ; rdfs:label "RetentionLimits" ; rdfs:subClassOf [ a owl:Restriction ; - owl:allValuesFrom linkml:String ; + owl:minCardinality 0 ; owl:onProperty ], [ a owl:Restriction ; - owl:maxCardinality 1 ; + owl:allValuesFrom linkml:String ; owl:onProperty ], [ a owl:Restriction ; - owl:minCardinality 0 ; + owl:maxCardinality 1 ; owl:onProperty ], [ a owl:Restriction ; owl:allValuesFrom linkml:String ; - owl:onProperty ], + owl:onProperty ], [ a owl:Restriction ; owl:minCardinality 0 ; - owl:onProperty ], + owl:onProperty ], data_sheets_schema:DatasetProperty ; skos:definition """If the dataset relates to people, are there applicable limits on the retention of their data (e.g., were individuals told their data would be deleted after a certain time)? If so, please describe these limits and how they will be enforced. """ ; @@ -1386,10 +1386,10 @@ data_sheets_schema:Software a owl:Class, owl:allValuesFrom linkml:String ; owl:onProperty ], [ a owl:Restriction ; - owl:allValuesFrom linkml:String ; + owl:minCardinality 0 ; owl:onProperty ], [ a owl:Restriction ; - owl:minCardinality 0 ; + owl:allValuesFrom linkml:String ; owl:onProperty ], data_sheets_schema:DatasetProperty ; skos:definition """Will the dataset be updated (e.g., to correct labeling errors, add new instances, delete instances)? If so, how often, by whom, and how will these updates be communicated? @@ -1401,26 +1401,26 @@ data_sheets_schema:Software a owl:Class, linkml:ClassDefinition ; rdfs:label "VersionAccess" ; rdfs:subClassOf [ a owl:Restriction ; + owl:allValuesFrom linkml:String ; + owl:onProperty ], + [ a owl:Restriction ; owl:maxCardinality 1 ; owl:onProperty ], [ a owl:Restriction ; - owl:minCardinality 0 ; + owl:allValuesFrom linkml:String ; owl:onProperty ], [ a owl:Restriction ; - owl:minCardinality 0 ; - owl:onProperty ], + owl:allValuesFrom linkml:String ; + owl:onProperty ], [ a owl:Restriction ; owl:minCardinality 0 ; - owl:onProperty ], + owl:onProperty ], [ a owl:Restriction ; - owl:allValuesFrom linkml:String ; + owl:minCardinality 0 ; owl:onProperty ], [ a owl:Restriction ; - owl:allValuesFrom linkml:String ; + owl:minCardinality 0 ; owl:onProperty ], - [ a owl:Restriction ; - owl:allValuesFrom linkml:String ; - owl:onProperty ], data_sheets_schema:DatasetProperty ; skos:definition """Will older versions of the dataset continue to be supported/hosted/maintained? If so, how? If not, how will obsolescence be communicated to dataset consumers? """ ; @@ -1430,13 +1430,13 @@ data_sheets_schema:Software a owl:Class, linkml:ClassDefinition ; rdfs:label "AddressingGap" ; rdfs:subClassOf [ a owl:Restriction ; - owl:minCardinality 0 ; + owl:maxCardinality 1 ; owl:onProperty ], [ a owl:Restriction ; owl:allValuesFrom linkml:String ; owl:onProperty ], [ a owl:Restriction ; - owl:maxCardinality 1 ; + owl:minCardinality 0 ; owl:onProperty ], data_sheets_schema:DatasetProperty ; skos:definition "Was there a specific gap that needed to be filled by creation of the dataset?" ; @@ -1447,25 +1447,25 @@ data_sheets_schema:Software a owl:Class, rdfs:label "Creator" ; rdfs:subClassOf [ a owl:Restriction ; owl:minCardinality 0 ; - owl:onProperty ], + owl:onProperty ], + [ a owl:Restriction ; + owl:minCardinality 0 ; + owl:onProperty ], + [ a owl:Restriction ; + owl:allValuesFrom data_sheets_schema:CRediTRoleEnum ; + owl:onProperty ], [ a owl:Restriction ; owl:maxCardinality 1 ; owl:onProperty ], [ a owl:Restriction ; owl:minCardinality 0 ; - owl:onProperty ], + owl:onProperty ], [ a owl:Restriction ; owl:allValuesFrom data_sheets_schema:Person ; owl:onProperty ], - [ a owl:Restriction ; - owl:minCardinality 0 ; - owl:onProperty ], [ a owl:Restriction ; owl:allValuesFrom data_sheets_schema:Organization ; owl:onProperty ], - [ a owl:Restriction ; - owl:allValuesFrom data_sheets_schema:CRediTRoleEnum ; - owl:onProperty ], data_sheets_schema:DatasetProperty ; skos:definition """Who created the dataset (e.g., which team, research group) and on behalf of which entity (e.g., company, institution, organization)? This may also be considered a team. """ ; @@ -1475,20 +1475,20 @@ data_sheets_schema:Software a owl:Class, linkml:ClassDefinition ; rdfs:label "FundingMechanism" ; rdfs:subClassOf [ a owl:Restriction ; - owl:maxCardinality 1 ; - owl:onProperty ], - [ a owl:Restriction ; - owl:minCardinality 0 ; - owl:onProperty ], - [ a owl:Restriction ; owl:allValuesFrom ; owl:onProperty ], [ a owl:Restriction ; owl:minCardinality 0 ; owl:onProperty ], + [ a owl:Restriction ; + owl:minCardinality 0 ; + owl:onProperty ], [ a owl:Restriction ; owl:allValuesFrom ; owl:onProperty ], + [ a owl:Restriction ; + owl:maxCardinality 1 ; + owl:onProperty ], data_sheets_schema:DatasetProperty ; skos:definition """Who funded the creation of the dataset? If there is an associated grant, please provide the name of the grantor and the grant name and number. """ ; @@ -1498,10 +1498,10 @@ data_sheets_schema:Software a owl:Class, linkml:ClassDefinition ; rdfs:label "Grant" ; rdfs:subClassOf [ a owl:Restriction ; - owl:maxCardinality 1 ; + owl:allValuesFrom linkml:String ; owl:onProperty ], [ a owl:Restriction ; - owl:allValuesFrom linkml:String ; + owl:maxCardinality 1 ; owl:onProperty ], [ a owl:Restriction ; owl:minCardinality 0 ; @@ -1555,44 +1555,44 @@ data_sheets_schema:Software a owl:Class, linkml:ClassDefinition ; rdfs:label "AnnotationAnalysis" ; rdfs:subClassOf [ a owl:Restriction ; + owl:maxCardinality 1 ; + owl:onProperty ], + [ a owl:Restriction ; owl:minCardinality 0 ; owl:onProperty ], [ a owl:Restriction ; - owl:minCardinality 0 ; - owl:onProperty ], + owl:allValuesFrom linkml:String ; + owl:onProperty ], [ a owl:Restriction ; owl:minCardinality 0 ; - owl:onProperty ], + owl:onProperty ], [ a owl:Restriction ; owl:maxCardinality 1 ; owl:onProperty ], [ a owl:Restriction ; owl:allValuesFrom linkml:String ; - owl:onProperty ], - [ a owl:Restriction ; - owl:allValuesFrom linkml:Float ; - owl:onProperty ], + owl:onProperty ], [ a owl:Restriction ; owl:minCardinality 0 ; - owl:onProperty ], - [ a owl:Restriction ; - owl:allValuesFrom linkml:String ; - owl:onProperty ], + owl:onProperty ], [ a owl:Restriction ; owl:maxCardinality 1 ; - owl:onProperty ], + owl:onProperty ], [ a owl:Restriction ; owl:allValuesFrom linkml:String ; - owl:onProperty ], - [ a owl:Restriction ; - owl:maxCardinality 1 ; owl:onProperty ], + [ a owl:Restriction ; + owl:allValuesFrom linkml:Float ; + owl:onProperty ], [ a owl:Restriction ; owl:allValuesFrom linkml:String ; - owl:onProperty ], + owl:onProperty ], [ a owl:Restriction ; owl:minCardinality 0 ; - owl:onProperty ], + owl:onProperty ], + [ a owl:Restriction ; + owl:minCardinality 0 ; + owl:onProperty ], data_sheets_schema:DatasetProperty ; skos:definition """Analysis of annotation quality, inter-annotator agreement metrics, and systematic patterns in annotation disagreements. """ ; @@ -1603,10 +1603,10 @@ data_sheets_schema:Software a owl:Class, linkml:ClassDefinition ; rdfs:label "CleaningStrategy" ; rdfs:subClassOf [ a owl:Restriction ; - owl:minCardinality 0 ; + owl:allValuesFrom linkml:String ; owl:onProperty ], [ a owl:Restriction ; - owl:allValuesFrom linkml:String ; + owl:minCardinality 0 ; owl:onProperty ], data_sheets_schema:DatasetProperty ; skos:definition """Was any cleaning of the data done (e.g., removal of instances, processing of missing values)? @@ -1618,6 +1618,12 @@ data_sheets_schema:Software a owl:Class, linkml:ClassDefinition ; rdfs:label "ImputationProtocol" ; rdfs:subClassOf [ a owl:Restriction ; + owl:minCardinality 0 ; + owl:onProperty ], + [ a owl:Restriction ; + owl:allValuesFrom linkml:String ; + owl:onProperty ], + [ a owl:Restriction ; owl:maxCardinality 1 ; owl:onProperty ], [ a owl:Restriction ; @@ -1632,17 +1638,11 @@ data_sheets_schema:Software a owl:Class, [ a owl:Restriction ; owl:minCardinality 0 ; owl:onProperty ], - [ a owl:Restriction ; - owl:minCardinality 0 ; - owl:onProperty ], - [ a owl:Restriction ; - owl:minCardinality 0 ; - owl:onProperty ], [ a owl:Restriction ; owl:allValuesFrom linkml:String ; owl:onProperty ], [ a owl:Restriction ; - owl:allValuesFrom linkml:String ; + owl:minCardinality 0 ; owl:onProperty ], data_sheets_schema:DatasetProperty ; skos:definition """Description of data imputation methodology, including techniques used to handle missing values and rationale for chosen approaches. @@ -1655,49 +1655,49 @@ data_sheets_schema:Software a owl:Class, rdfs:label "LabelingStrategy" ; rdfs:subClassOf [ a owl:Restriction ; owl:minCardinality 0 ; - owl:onProperty ], + owl:onProperty ], [ a owl:Restriction ; owl:maxCardinality 1 ; owl:onProperty ], - [ a owl:Restriction ; - owl:allValuesFrom linkml:String ; - owl:onProperty ], [ a owl:Restriction ; owl:maxCardinality 1 ; owl:onProperty ], - [ a owl:Restriction ; - owl:minCardinality 0 ; - owl:onProperty ], [ a owl:Restriction ; owl:minCardinality 0 ; owl:onProperty ], [ a owl:Restriction ; - owl:allValuesFrom linkml:Integer ; - owl:onProperty ], + owl:allValuesFrom linkml:String ; + owl:onProperty ], [ a owl:Restriction ; owl:allValuesFrom linkml:String ; - owl:onProperty ], + owl:onProperty ], [ a owl:Restriction ; - owl:minCardinality 0 ; + owl:allValuesFrom linkml:String ; owl:onProperty ], [ a owl:Restriction ; - owl:minCardinality 0 ; + owl:allValuesFrom linkml:Integer ; owl:onProperty ], [ a owl:Restriction ; - owl:allValuesFrom linkml:String ; - owl:onProperty ], + owl:minCardinality 0 ; + owl:onProperty ], [ a owl:Restriction ; owl:maxCardinality 1 ; owl:onProperty ], [ a owl:Restriction ; - owl:allValuesFrom linkml:String ; + owl:minCardinality 0 ; owl:onProperty ], [ a owl:Restriction ; owl:allValuesFrom linkml:String ; - owl:onProperty ], + owl:onProperty ], + [ a owl:Restriction ; + owl:minCardinality 0 ; + owl:onProperty ], [ a owl:Restriction ; owl:minCardinality 0 ; owl:onProperty ], + [ a owl:Restriction ; + owl:allValuesFrom linkml:String ; + owl:onProperty ], data_sheets_schema:DatasetProperty ; skos:definition """Was any labeling of the data done (e.g., part-of-speech tagging)? This class documents the annotation process and quality metrics. """ ; @@ -1707,20 +1707,20 @@ data_sheets_schema:Software a owl:Class, linkml:ClassDefinition ; rdfs:label "MachineAnnotationTools" ; rdfs:subClassOf [ a owl:Restriction ; - owl:allValuesFrom linkml:String ; - owl:onProperty ], - [ a owl:Restriction ; owl:minCardinality 0 ; owl:onProperty ], [ a owl:Restriction ; owl:allValuesFrom linkml:String ; - owl:onProperty ], + owl:onProperty ], + [ a owl:Restriction ; + owl:allValuesFrom linkml:String ; + owl:onProperty ], [ a owl:Restriction ; owl:minCardinality 0 ; owl:onProperty ], [ a owl:Restriction ; owl:allValuesFrom linkml:String ; - owl:onProperty ], + owl:onProperty ], [ a owl:Restriction ; owl:minCardinality 0 ; owl:onProperty ], @@ -1749,6 +1749,9 @@ data_sheets_schema:Software a owl:Class, linkml:ClassDefinition ; rdfs:label "RawData" ; rdfs:subClassOf [ a owl:Restriction ; + owl:maxCardinality 1 ; + owl:onProperty ], + [ a owl:Restriction ; owl:allValuesFrom linkml:Uri ; owl:onProperty ], [ a owl:Restriction ; @@ -1757,9 +1760,6 @@ data_sheets_schema:Software a owl:Class, [ a owl:Restriction ; owl:minCardinality 0 ; owl:onProperty ], - [ a owl:Restriction ; - owl:maxCardinality 1 ; - owl:onProperty ], [ a owl:Restriction ; owl:allValuesFrom linkml:String ; owl:onProperty ], @@ -1772,10 +1772,10 @@ data_sheets_schema:Software a owl:Class, linkml:ClassDefinition ; rdfs:label "DiscouragedUse" ; rdfs:subClassOf [ a owl:Restriction ; - owl:allValuesFrom linkml:String ; + owl:minCardinality 0 ; owl:onProperty ], [ a owl:Restriction ; - owl:minCardinality 0 ; + owl:allValuesFrom linkml:String ; owl:onProperty ], data_sheets_schema:DatasetProperty ; skos:definition """Are there tasks for which the dataset should not be used? @@ -1786,10 +1786,10 @@ data_sheets_schema:Software a owl:Class, linkml:ClassDefinition ; rdfs:label "ExistingUse" ; rdfs:subClassOf [ a owl:Restriction ; - owl:minCardinality 0 ; + owl:allValuesFrom linkml:String ; owl:onProperty ], [ a owl:Restriction ; - owl:allValuesFrom linkml:String ; + owl:minCardinality 0 ; owl:onProperty ], data_sheets_schema:DatasetProperty ; skos:definition """Has the dataset been used for any tasks already? @@ -1800,10 +1800,10 @@ data_sheets_schema:Software a owl:Class, linkml:ClassDefinition ; rdfs:label "FutureUseImpact" ; rdfs:subClassOf [ a owl:Restriction ; - owl:minCardinality 0 ; + owl:allValuesFrom linkml:String ; owl:onProperty ], [ a owl:Restriction ; - owl:allValuesFrom linkml:String ; + owl:minCardinality 0 ; owl:onProperty ], data_sheets_schema:DatasetProperty ; skos:definition """Is there anything about the dataset's composition or collection that might impact future uses or create risks/harm (e.g., unfair treatment, legal or financial risks)? If so, describe these impacts and any mitigation strategies. @@ -1815,16 +1815,16 @@ data_sheets_schema:Software a owl:Class, linkml:ClassDefinition ; rdfs:label "IntendedUse" ; rdfs:subClassOf [ a owl:Restriction ; - owl:maxCardinality 1 ; - owl:onProperty ], + owl:minCardinality 0 ; + owl:onProperty ], [ a owl:Restriction ; owl:allValuesFrom linkml:String ; - owl:onProperty ], + owl:onProperty ], [ a owl:Restriction ; - owl:allValuesFrom linkml:String ; - owl:onProperty ], + owl:maxCardinality 1 ; + owl:onProperty ], [ a owl:Restriction ; - owl:minCardinality 0 ; + owl:allValuesFrom linkml:String ; owl:onProperty ], [ a owl:Restriction ; owl:minCardinality 0 ; @@ -1834,7 +1834,7 @@ data_sheets_schema:Software a owl:Class, owl:onProperty ], [ a owl:Restriction ; owl:allValuesFrom linkml:String ; - owl:onProperty ], + owl:onProperty ], data_sheets_schema:DatasetProperty ; skos:definition """Explicit statement of intended uses for this dataset. Complements FutureUseImpact by focusing on positive, recommended applications rather than risks. Aligns with RO-Crate "Intended Use" field. """ ; @@ -1859,10 +1859,10 @@ data_sheets_schema:Software a owl:Class, linkml:ClassDefinition ; rdfs:label "ProhibitedUse" ; rdfs:subClassOf [ a owl:Restriction ; - owl:allValuesFrom linkml:String ; + owl:minCardinality 0 ; owl:onProperty ], [ a owl:Restriction ; - owl:minCardinality 0 ; + owl:allValuesFrom linkml:String ; owl:onProperty ], data_sheets_schema:DatasetProperty ; skos:definition """Explicit statement of prohibited or forbidden uses for this dataset. Stronger than DiscouragedUse - these are uses that are explicitly not permitted by license, ethics, or policy. Aligns with RO-Crate "Prohibited Uses" field. @@ -1873,12 +1873,6 @@ data_sheets_schema:Software a owl:Class, linkml:ClassDefinition ; rdfs:label "UseRepository" ; rdfs:subClassOf [ a owl:Restriction ; - owl:minCardinality 0 ; - owl:onProperty ], - [ a owl:Restriction ; - owl:minCardinality 0 ; - owl:onProperty ], - [ a owl:Restriction ; owl:allValuesFrom linkml:String ; owl:onProperty ], [ a owl:Restriction ; @@ -1887,6 +1881,12 @@ data_sheets_schema:Software a owl:Class, [ a owl:Restriction ; owl:allValuesFrom linkml:Uri ; owl:onProperty ], + [ a owl:Restriction ; + owl:minCardinality 0 ; + owl:onProperty ], + [ a owl:Restriction ; + owl:minCardinality 0 ; + owl:onProperty ], data_sheets_schema:DatasetProperty ; skos:definition """Is there a repository that links to any or all papers or systems that use the dataset? If so, provide a link or other access point. """ ; @@ -1896,119 +1896,119 @@ data_sheets_schema:Software a owl:Class, linkml:ClassDefinition ; rdfs:label "VariableMetadata" ; rdfs:subClassOf [ a owl:Restriction ; + owl:allValuesFrom linkml:Boolean ; + owl:onProperty ], + [ a owl:Restriction ; owl:maxCardinality 1 ; - owl:onProperty ], + owl:onProperty ], [ a owl:Restriction ; owl:minCardinality 0 ; - owl:onProperty ], + owl:onProperty ], [ a owl:Restriction ; - owl:allValuesFrom linkml:Integer ; - owl:onProperty ], + owl:allValuesFrom linkml:String ; + owl:onProperty ], [ a owl:Restriction ; owl:minCardinality 0 ; - owl:onProperty ], + owl:onProperty ], [ a owl:Restriction ; - owl:minCardinality 0 ; - owl:onProperty ], + owl:maxCardinality 1 ; + owl:onProperty ], [ a owl:Restriction ; owl:minCardinality 0 ; - owl:onProperty ], - [ a owl:Restriction ; - owl:allValuesFrom linkml:String ; owl:onProperty ], [ a owl:Restriction ; - owl:allValuesFrom linkml:Float ; + owl:maxCardinality 1 ; owl:onProperty ], [ a owl:Restriction ; - owl:minCardinality 0 ; - owl:onProperty ], - [ a owl:Restriction ; - owl:minCardinality 0 ; - owl:onProperty ], + owl:maxCardinality 1 ; + owl:onProperty ], [ a owl:Restriction ; owl:maxCardinality 1 ; owl:onProperty ], [ a owl:Restriction ; - owl:allValuesFrom linkml:Boolean ; - owl:onProperty ], + owl:minCardinality 1 ; + owl:onProperty ], [ a owl:Restriction ; - owl:maxCardinality 1 ; - owl:onProperty ], + owl:allValuesFrom linkml:String ; + owl:onProperty ], [ a owl:Restriction ; owl:minCardinality 0 ; - owl:onProperty ], + owl:onProperty ], [ a owl:Restriction ; owl:minCardinality 0 ; - owl:onProperty ], + owl:onProperty ], [ a owl:Restriction ; - owl:minCardinality 1 ; - owl:onProperty ], + owl:allValuesFrom linkml:String ; + owl:onProperty ], [ a owl:Restriction ; owl:allValuesFrom linkml:String ; - owl:onProperty ], + owl:onProperty ], + [ a owl:Restriction ; + owl:allValuesFrom linkml:Integer ; + owl:onProperty ], [ a owl:Restriction ; owl:minCardinality 0 ; - owl:onProperty ], + owl:onProperty ], [ a owl:Restriction ; - owl:maxCardinality 1 ; - owl:onProperty ], + owl:minCardinality 0 ; + owl:onProperty ], [ a owl:Restriction ; owl:allValuesFrom linkml:String ; owl:onProperty ], [ a owl:Restriction ; - owl:allValuesFrom linkml:Uriorcurie ; - owl:onProperty ], + owl:allValuesFrom linkml:Float ; + owl:onProperty ], + [ a owl:Restriction ; + owl:allValuesFrom linkml:String ; + owl:onProperty ], [ a owl:Restriction ; owl:maxCardinality 1 ; - owl:onProperty ], + owl:onProperty ], [ a owl:Restriction ; - owl:allValuesFrom data_sheets_schema:VariableTypeEnum ; - owl:onProperty ], + owl:minCardinality 0 ; + owl:onProperty ], [ a owl:Restriction ; owl:minCardinality 0 ; - owl:onProperty ], + owl:onProperty ], [ a owl:Restriction ; owl:maxCardinality 1 ; owl:onProperty ], [ a owl:Restriction ; - owl:allValuesFrom linkml:String ; - owl:onProperty ], + owl:maxCardinality 1 ; + owl:onProperty ], [ a owl:Restriction ; - owl:allValuesFrom linkml:String ; - owl:onProperty ], + owl:allValuesFrom linkml:Uriorcurie ; + owl:onProperty ], + [ a owl:Restriction ; + owl:minCardinality 0 ; + owl:onProperty ], [ a owl:Restriction ; owl:allValuesFrom linkml:String ; owl:onProperty ], [ a owl:Restriction ; - owl:allValuesFrom linkml:Float ; - owl:onProperty ], - [ a owl:Restriction ; - owl:maxCardinality 1 ; - owl:onProperty ], - [ a owl:Restriction ; - owl:allValuesFrom linkml:Boolean ; - owl:onProperty ], - [ a owl:Restriction ; - owl:allValuesFrom linkml:String ; + owl:minCardinality 0 ; owl:onProperty ], - [ a owl:Restriction ; - owl:maxCardinality 1 ; - owl:onProperty ], - [ a owl:Restriction ; - owl:maxCardinality 1 ; - owl:onProperty ], [ a owl:Restriction ; owl:minCardinality 0 ; + owl:onProperty ], + [ a owl:Restriction ; + owl:allValuesFrom linkml:Float ; owl:onProperty ], [ a owl:Restriction ; - owl:maxCardinality 1 ; - owl:onProperty ], + owl:allValuesFrom linkml:Boolean ; + owl:onProperty ], [ a owl:Restriction ; owl:minCardinality 0 ; - owl:onProperty ], + owl:onProperty ], [ a owl:Restriction ; - owl:minCardinality 0 ; + owl:allValuesFrom data_sheets_schema:VariableTypeEnum ; + owl:onProperty ], + [ a owl:Restriction ; + owl:maxCardinality 1 ; owl:onProperty ], + [ a owl:Restriction ; + owl:maxCardinality 1 ; + owl:onProperty ], data_sheets_schema:DatasetProperty ; skos:definition "Metadata describing an individual variable, field, or column in a dataset. Variables may represent measurements, observations, derived values, or categorical attributes." ; skos:exactMatch schema1:PropertyValue ; @@ -2623,59 +2623,59 @@ data_sheets_schema:FileCollection a owl:Class, linkml:ClassDefinition ; rdfs:label "FileCollection" ; rdfs:subClassOf [ a owl:Restriction ; - owl:allValuesFrom data_sheets_schema:FileCollectionTypeEnum ; - owl:onProperty data_sheets_schema:collection_type ], + owl:allValuesFrom ; + owl:onProperty data_sheets_schema:external_resources ], [ a owl:Restriction ; - owl:minCardinality 0 ; + owl:allValuesFrom linkml:String ; + owl:onProperty data_sheets_schema:path ], + [ a owl:Restriction ; + owl:allValuesFrom linkml:Integer ; owl:onProperty data_sheets_schema:total_bytes ], [ a owl:Restriction ; - owl:maxCardinality 1 ; - owl:onProperty data_sheets_schema:file_count ], + owl:minCardinality 0 ; + owl:onProperty data_sheets_schema:collection_type ], [ a owl:Restriction ; owl:allValuesFrom linkml:Integer ; owl:onProperty data_sheets_schema:file_count ], [ a owl:Restriction ; owl:maxCardinality 1 ; - owl:onProperty data_sheets_schema:compression ], + owl:onProperty data_sheets_schema:file_count ], [ a owl:Restriction ; owl:minCardinality 0 ; - owl:onProperty data_sheets_schema:collection_type ], + owl:onProperty data_sheets_schema:external_resources ], [ a owl:Restriction ; owl:minCardinality 0 ; - owl:onProperty data_sheets_schema:external_resources ], + owl:onProperty data_sheets_schema:resources ], [ a owl:Restriction ; - owl:allValuesFrom ; - owl:onProperty data_sheets_schema:external_resources ], + owl:allValuesFrom [ owl:intersectionOf ( [ owl:unionOf ( data_sheets_schema:File data_sheets_schema:FileCollection ) ] data_sheets_schema:Dataset ) ] ; + owl:onProperty data_sheets_schema:resources ], + [ a owl:Restriction ; + owl:minCardinality 0 ; + owl:onProperty data_sheets_schema:path ], [ a owl:Restriction ; owl:minCardinality 0 ; owl:onProperty data_sheets_schema:file_count ], [ a owl:Restriction ; - owl:allValuesFrom linkml:String ; - owl:onProperty data_sheets_schema:path ], + owl:minCardinality 0 ; + owl:onProperty data_sheets_schema:compression ], [ a owl:Restriction ; - owl:maxCardinality 1 ; - owl:onProperty data_sheets_schema:path ], + owl:minCardinality 0 ; + owl:onProperty data_sheets_schema:total_bytes ], [ a owl:Restriction ; owl:maxCardinality 1 ; owl:onProperty data_sheets_schema:total_bytes ], [ a owl:Restriction ; - owl:allValuesFrom [ owl:intersectionOf ( [ owl:unionOf ( data_sheets_schema:File data_sheets_schema:FileCollection ) ] data_sheets_schema:Dataset ) ] ; - owl:onProperty data_sheets_schema:resources ], - [ a owl:Restriction ; - owl:minCardinality 0 ; + owl:maxCardinality 1 ; owl:onProperty data_sheets_schema:path ], [ a owl:Restriction ; - owl:allValuesFrom data_sheets_schema:CompressionEnum ; + owl:maxCardinality 1 ; owl:onProperty data_sheets_schema:compression ], [ a owl:Restriction ; - owl:minCardinality 0 ; - owl:onProperty data_sheets_schema:resources ], + owl:allValuesFrom data_sheets_schema:FileCollectionTypeEnum ; + owl:onProperty data_sheets_schema:collection_type ], [ a owl:Restriction ; - owl:minCardinality 0 ; + owl:allValuesFrom data_sheets_schema:CompressionEnum ; owl:onProperty data_sheets_schema:compression ], - [ a owl:Restriction ; - owl:allValuesFrom linkml:Integer ; - owl:onProperty data_sheets_schema:total_bytes ], data_sheets_schema:Information ; skos:altLabel "data files", "file collection", @@ -3186,29 +3186,29 @@ data_sheets_schema:collection_type a owl:ObjectProperty, linkml:ClassDefinition ; rdfs:label "ExternalResource" ; rdfs:subClassOf [ a owl:Restriction ; - owl:allValuesFrom linkml:Boolean ; + owl:minCardinality 0 ; owl:onProperty ], [ a owl:Restriction ; owl:minCardinality 0 ; owl:onProperty ], [ a owl:Restriction ; owl:allValuesFrom linkml:String ; + owl:onProperty data_sheets_schema:external_resources ], + [ a owl:Restriction ; + owl:minCardinality 0 ; owl:onProperty ], [ a owl:Restriction ; owl:allValuesFrom linkml:String ; owl:onProperty ], - [ a owl:Restriction ; - owl:minCardinality 0 ; - owl:onProperty data_sheets_schema:external_resources ], [ a owl:Restriction ; owl:allValuesFrom linkml:String ; - owl:onProperty data_sheets_schema:external_resources ], - [ a owl:Restriction ; - owl:minCardinality 0 ; owl:onProperty ], [ a owl:Restriction ; - owl:minCardinality 0 ; + owl:allValuesFrom linkml:Boolean ; owl:onProperty ], + [ a owl:Restriction ; + owl:minCardinality 0 ; + owl:onProperty data_sheets_schema:external_resources ], data_sheets_schema:DatasetProperty ; skos:definition """Is the dataset self-contained or does it rely on external resources (e.g., websites, other datasets)? If external, are there guarantees that those resources will remain available and unchanged? """ ; @@ -3218,47 +3218,47 @@ data_sheets_schema:collection_type a owl:ObjectProperty, linkml:ClassDefinition ; rdfs:label "SamplingStrategy" ; rdfs:subClassOf [ a owl:Restriction ; - owl:minCardinality 0 ; + owl:allValuesFrom linkml:String ; + owl:onProperty ], + [ a owl:Restriction ; + owl:allValuesFrom linkml:String ; owl:onProperty ], [ a owl:Restriction ; owl:minCardinality 0 ; + owl:onProperty ], + [ a owl:Restriction ; + owl:allValuesFrom linkml:String ; owl:onProperty ], [ a owl:Restriction ; owl:allValuesFrom linkml:Boolean ; owl:onProperty ], [ a owl:Restriction ; - owl:allValuesFrom linkml:String ; - owl:onProperty ], + owl:minCardinality 0 ; + owl:onProperty ], [ a owl:Restriction ; - owl:allValuesFrom linkml:Boolean ; + owl:minCardinality 0 ; owl:onProperty ], [ a owl:Restriction ; owl:minCardinality 0 ; - owl:onProperty ], - [ a owl:Restriction ; - owl:allValuesFrom linkml:String ; owl:onProperty ], [ a owl:Restriction ; owl:minCardinality 0 ; - owl:onProperty ], + owl:onProperty ], [ a owl:Restriction ; owl:allValuesFrom linkml:Boolean ; - owl:onProperty ], + owl:onProperty ], [ a owl:Restriction ; owl:minCardinality 0 ; - owl:onProperty ], + owl:onProperty ], [ a owl:Restriction ; - owl:minCardinality 0 ; - owl:onProperty ], + owl:allValuesFrom linkml:Boolean ; + owl:onProperty ], [ a owl:Restriction ; owl:allValuesFrom linkml:String ; - owl:onProperty ], - [ a owl:Restriction ; - owl:minCardinality 0 ; owl:onProperty ], [ a owl:Restriction ; - owl:allValuesFrom linkml:String ; - owl:onProperty ], + owl:minCardinality 0 ; + owl:onProperty ], data_sheets_schema:DatasetProperty ; skos:definition """Does the dataset contain all possible instances, or is it a sample (not necessarily random) of instances from a larger set? If so, how representative is it? """ ; @@ -3573,7 +3573,7 @@ data_sheets_schema:existing_uses a owl:ObjectProperty, data_sheets_schema:file_collections a owl:ObjectProperty, linkml:SlotDefinition ; rdfs:label "file_collections" ; - skos:definition "Collections of files within this dataset. Each collection represents a logical grouping of files with shared characteristics (e.g., all training data, all image files, all raw data files). Maps to nested RO-Crate Dataset entities via schema:hasPart." ; + skos:definition "Collections of files within this dataset. Each collection represents a logical grouping of files with shared characteristics (e.g., all training data, all image files, all raw data files). Maps to nested RO-Crate Dataset entities via schema:hasPart in RO-Crate converters." ; skos:exactMatch dcat:distribution ; skos:inScheme . @@ -4924,184 +4924,184 @@ data_sheets_schema:Information a owl:Class, linkml:ClassDefinition ; rdfs:label "Information" ; rdfs:subClassOf [ a owl:Restriction ; - owl:minCardinality 0 ; - owl:onProperty data_sheets_schema:publisher ], - [ a owl:Restriction ; owl:maxCardinality 1 ; - owl:onProperty data_sheets_schema:issued ], + owl:onProperty data_sheets_schema:compression ], [ a owl:Restriction ; owl:allValuesFrom linkml:String ; - owl:onProperty data_sheets_schema:page ], + owl:onProperty data_sheets_schema:language ], [ a owl:Restriction ; - owl:allValuesFrom data_sheets_schema:CompressionEnum ; - owl:onProperty data_sheets_schema:compression ], + owl:maxCardinality 1 ; + owl:onProperty data_sheets_schema:conforms_to_schema ], [ a owl:Restriction ; owl:maxCardinality 1 ; - owl:onProperty data_sheets_schema:version ], + owl:onProperty data_sheets_schema:created_by ], [ a owl:Restriction ; owl:allValuesFrom linkml:Datetime ; owl:onProperty data_sheets_schema:last_updated_on ], - [ a owl:Restriction ; - owl:allValuesFrom linkml:String ; - owl:onProperty data_sheets_schema:modified_by ], [ a owl:Restriction ; owl:minCardinality 0 ; - owl:onProperty data_sheets_schema:conforms_to_class ], + owl:onProperty data_sheets_schema:keywords ], [ a owl:Restriction ; - owl:allValuesFrom linkml:Uri ; - owl:onProperty data_sheets_schema:download_url ], + owl:minCardinality 0 ; + owl:onProperty data_sheets_schema:issued ], [ a owl:Restriction ; owl:maxCardinality 1 ; - owl:onProperty data_sheets_schema:modified_by ], + owl:onProperty data_sheets_schema:created_on ], [ a owl:Restriction ; - owl:allValuesFrom linkml:String ; + owl:minCardinality 0 ; owl:onProperty data_sheets_schema:language ], [ a owl:Restriction ; owl:minCardinality 0 ; - owl:onProperty data_sheets_schema:status ], + owl:onProperty data_sheets_schema:doi ], [ a owl:Restriction ; - owl:allValuesFrom linkml:String ; + owl:maxCardinality 1 ; owl:onProperty data_sheets_schema:title ], + [ a owl:Restriction ; + owl:minCardinality 0 ; + owl:onProperty data_sheets_schema:conforms_to_class ], [ a owl:Restriction ; owl:maxCardinality 1 ; - owl:onProperty data_sheets_schema:language ], + owl:onProperty data_sheets_schema:status ], [ a owl:Restriction ; owl:maxCardinality 1 ; - owl:onProperty data_sheets_schema:created_on ], + owl:onProperty data_sheets_schema:last_updated_on ], [ a owl:Restriction ; owl:maxCardinality 1 ; - owl:onProperty data_sheets_schema:created_by ], + owl:onProperty data_sheets_schema:conforms_to ], [ a owl:Restriction ; owl:minCardinality 0 ; - owl:onProperty data_sheets_schema:language ], + owl:onProperty data_sheets_schema:conforms_to ], [ a owl:Restriction ; owl:maxCardinality 1 ; - owl:onProperty data_sheets_schema:was_derived_from ], + owl:onProperty data_sheets_schema:download_url ], [ a owl:Restriction ; owl:maxCardinality 1 ; owl:onProperty data_sheets_schema:doi ], [ a owl:Restriction ; - owl:minCardinality 0 ; - owl:onProperty data_sheets_schema:created_on ], - [ a owl:Restriction ; - owl:allValuesFrom linkml:String ; - owl:onProperty data_sheets_schema:conforms_to_class ], + owl:maxCardinality 1 ; + owl:onProperty data_sheets_schema:license ], [ a owl:Restriction ; owl:maxCardinality 1 ; - owl:onProperty data_sheets_schema:last_updated_on ], + owl:onProperty data_sheets_schema:page ], [ a owl:Restriction ; owl:allValuesFrom linkml:Datetime ; - owl:onProperty data_sheets_schema:issued ], - [ a owl:Restriction ; - owl:minCardinality 0 ; - owl:onProperty data_sheets_schema:keywords ], + owl:onProperty data_sheets_schema:created_on ], [ a owl:Restriction ; owl:allValuesFrom linkml:String ; - owl:onProperty data_sheets_schema:keywords ], + owl:onProperty data_sheets_schema:version ], [ a owl:Restriction ; - owl:maxCardinality 1 ; - owl:onProperty data_sheets_schema:license ], + owl:minCardinality 0 ; + owl:onProperty data_sheets_schema:publisher ], [ a owl:Restriction ; - owl:maxCardinality 1 ; - owl:onProperty data_sheets_schema:conforms_to_schema ], + owl:allValuesFrom linkml:String ; + owl:onProperty data_sheets_schema:title ], [ a owl:Restriction ; - owl:maxCardinality 1 ; + owl:minCardinality 0 ; owl:onProperty data_sheets_schema:compression ], [ a owl:Restriction ; owl:allValuesFrom linkml:String ; - owl:onProperty data_sheets_schema:conforms_to_schema ], - [ a owl:Restriction ; - owl:allValuesFrom linkml:String ; - owl:onProperty data_sheets_schema:conforms_to ], + owl:onProperty data_sheets_schema:conforms_to_class ], [ a owl:Restriction ; - owl:minCardinality 0 ; + owl:allValuesFrom linkml:Uri ; owl:onProperty data_sheets_schema:download_url ], [ a owl:Restriction ; - owl:maxCardinality 1 ; - owl:onProperty data_sheets_schema:status ], + owl:allValuesFrom linkml:Uriorcurie ; + owl:onProperty data_sheets_schema:publisher ], [ a owl:Restriction ; - owl:maxCardinality 1 ; - owl:onProperty data_sheets_schema:conforms_to ], + owl:allValuesFrom linkml:String ; + owl:onProperty data_sheets_schema:created_by ], [ a owl:Restriction ; owl:minCardinality 0 ; - owl:onProperty data_sheets_schema:compression ], + owl:onProperty data_sheets_schema:title ], + [ a owl:Restriction ; + owl:allValuesFrom linkml:String ; + owl:onProperty data_sheets_schema:license ], [ a owl:Restriction ; owl:allValuesFrom [ a rdfs:Datatype ; owl:onDatatype xsd:string ; owl:withRestrictions ( [ xsd:pattern "10\\.\\d{4,}\\/.+" ] ) ] ; owl:onProperty data_sheets_schema:doi ], - [ a owl:Restriction ; - owl:minCardinality 0 ; - owl:onProperty data_sheets_schema:page ], [ a owl:Restriction ; owl:allValuesFrom linkml:String ; owl:onProperty data_sheets_schema:was_derived_from ], [ a owl:Restriction ; owl:maxCardinality 1 ; - owl:onProperty data_sheets_schema:download_url ], - [ a owl:Restriction ; - owl:minCardinality 0 ; owl:onProperty data_sheets_schema:version ], - [ a owl:Restriction ; - owl:allValuesFrom linkml:String ; - owl:onProperty data_sheets_schema:license ], - [ a owl:Restriction ; - owl:maxCardinality 1 ; - owl:onProperty data_sheets_schema:title ], - [ a owl:Restriction ; - owl:minCardinality 0 ; - owl:onProperty data_sheets_schema:created_by ], [ a owl:Restriction ; owl:minCardinality 0 ; owl:onProperty data_sheets_schema:license ], - [ a owl:Restriction ; - owl:maxCardinality 1 ; - owl:onProperty data_sheets_schema:page ], [ a owl:Restriction ; owl:allValuesFrom linkml:String ; - owl:onProperty data_sheets_schema:version ], + owl:onProperty data_sheets_schema:page ], [ a owl:Restriction ; - owl:allValuesFrom linkml:Datetime ; + owl:minCardinality 0 ; owl:onProperty data_sheets_schema:created_on ], [ a owl:Restriction ; - owl:minCardinality 0 ; - owl:onProperty data_sheets_schema:title ], + owl:allValuesFrom linkml:String ; + owl:onProperty data_sheets_schema:modified_by ], [ a owl:Restriction ; owl:minCardinality 0 ; owl:onProperty data_sheets_schema:conforms_to_schema ], [ a owl:Restriction ; - owl:maxCardinality 1 ; - owl:onProperty data_sheets_schema:conforms_to_class ], + owl:allValuesFrom linkml:Datetime ; + owl:onProperty data_sheets_schema:issued ], [ a owl:Restriction ; - owl:minCardinality 0 ; + owl:maxCardinality 1 ; + owl:onProperty data_sheets_schema:publisher ], + [ a owl:Restriction ; + owl:maxCardinality 1 ; + owl:onProperty data_sheets_schema:issued ], + [ a owl:Restriction ; + owl:maxCardinality 1 ; owl:onProperty data_sheets_schema:was_derived_from ], [ a owl:Restriction ; - owl:allValuesFrom linkml:String ; + owl:minCardinality 0 ; owl:onProperty data_sheets_schema:status ], [ a owl:Restriction ; owl:minCardinality 0 ; owl:onProperty data_sheets_schema:modified_by ], [ a owl:Restriction ; - owl:allValuesFrom linkml:Uriorcurie ; - owl:onProperty data_sheets_schema:publisher ], + owl:allValuesFrom linkml:String ; + owl:onProperty data_sheets_schema:keywords ], [ a owl:Restriction ; owl:minCardinality 0 ; - owl:onProperty data_sheets_schema:conforms_to ], - [ a owl:Restriction ; - owl:allValuesFrom linkml:String ; owl:onProperty data_sheets_schema:created_by ], [ a owl:Restriction ; owl:minCardinality 0 ; - owl:onProperty data_sheets_schema:issued ], + owl:onProperty data_sheets_schema:version ], + [ a owl:Restriction ; + owl:minCardinality 0 ; + owl:onProperty data_sheets_schema:download_url ], [ a owl:Restriction ; owl:maxCardinality 1 ; - owl:onProperty data_sheets_schema:publisher ], + owl:onProperty data_sheets_schema:language ], [ a owl:Restriction ; owl:minCardinality 0 ; - owl:onProperty data_sheets_schema:last_updated_on ], + owl:onProperty data_sheets_schema:was_derived_from ], + [ a owl:Restriction ; + owl:allValuesFrom linkml:String ; + owl:onProperty data_sheets_schema:status ], + [ a owl:Restriction ; + owl:maxCardinality 1 ; + owl:onProperty data_sheets_schema:conforms_to_class ], + [ a owl:Restriction ; + owl:allValuesFrom linkml:String ; + owl:onProperty data_sheets_schema:conforms_to ], + [ a owl:Restriction ; + owl:allValuesFrom data_sheets_schema:CompressionEnum ; + owl:onProperty data_sheets_schema:compression ], [ a owl:Restriction ; owl:minCardinality 0 ; - owl:onProperty data_sheets_schema:doi ], + owl:onProperty data_sheets_schema:page ], + [ a owl:Restriction ; + owl:minCardinality 0 ; + owl:onProperty data_sheets_schema:last_updated_on ], + [ a owl:Restriction ; + owl:maxCardinality 1 ; + owl:onProperty data_sheets_schema:modified_by ], + [ a owl:Restriction ; + owl:allValuesFrom linkml:String ; + owl:onProperty data_sheets_schema:conforms_to_schema ], data_sheets_schema:NamedThing ; skos:closeMatch schema1:CreativeWork ; skos:definition "Grouping for datasets and data files" ; @@ -5120,31 +5120,31 @@ data_sheets_schema:Person a owl:Class, rdfs:label "Person" ; rdfs:subClassOf [ a owl:Restriction ; owl:minCardinality 0 ; - owl:onProperty data_sheets_schema:email ], - [ a owl:Restriction ; - owl:allValuesFrom [ a rdfs:Datatype ; - owl:intersectionOf ( linkml:String [ a rdfs:Datatype ; - owl:onDatatype xsd:string ; - owl:withRestrictions ( [ xsd:pattern "^\\d{4}-\\d{4}-\\d{4}-\\d{3}[0-9X]$" ] ) ] ) ] ; owl:onProperty data_sheets_schema:orcid ], [ a owl:Restriction ; - owl:maxCardinality 1 ; + owl:minCardinality 0 ; + owl:onProperty data_sheets_schema:affiliation ], + [ a owl:Restriction ; + owl:allValuesFrom linkml:String ; owl:onProperty data_sheets_schema:email ], [ a owl:Restriction ; owl:maxCardinality 1 ; - owl:onProperty data_sheets_schema:orcid ], + owl:onProperty data_sheets_schema:email ], [ a owl:Restriction ; - owl:minCardinality 0 ; + owl:maxCardinality 1 ; owl:onProperty data_sheets_schema:orcid ], [ a owl:Restriction ; owl:minCardinality 0 ; - owl:onProperty data_sheets_schema:affiliation ], - [ a owl:Restriction ; - owl:allValuesFrom linkml:String ; owl:onProperty data_sheets_schema:email ], [ a owl:Restriction ; owl:allValuesFrom data_sheets_schema:Organization ; owl:onProperty data_sheets_schema:affiliation ], + [ a owl:Restriction ; + owl:allValuesFrom [ a rdfs:Datatype ; + owl:intersectionOf ( linkml:String [ a rdfs:Datatype ; + owl:onDatatype xsd:string ; + owl:withRestrictions ( [ xsd:pattern "^\\d{4}-\\d{4}-\\d{4}-\\d{3}[0-9X]$" ] ) ] ) ] ; + owl:onProperty data_sheets_schema:orcid ], data_sheets_schema:NamedThing ; skos:definition "An individual human being. This class represents a person in the context of a specific dataset. Attributes like affiliation and email represent the person's current or most relevant contact information for this dataset. For stable cross-dataset identification, use the ORCID field. Note that contributor roles (CRediT) are specified in the usage context (e.g., Creator class) rather than on the Person directly, since roles vary by dataset." ; skos:exactMatch schema1:Person ; @@ -5161,32 +5161,32 @@ data_sheets_schema:NamedThing a owl:Class, linkml:ClassDefinition ; rdfs:label "NamedThing" ; rdfs:subClassOf [ a owl:Restriction ; - owl:allValuesFrom linkml:String ; - owl:onProperty data_sheets_schema:name ], - [ a owl:Restriction ; - owl:allValuesFrom linkml:String ; - owl:onProperty data_sheets_schema:description ], + owl:allValuesFrom linkml:Uriorcurie ; + owl:onProperty data_sheets_schema:id ], [ a owl:Restriction ; owl:maxCardinality 1 ; owl:onProperty data_sheets_schema:id ], [ a owl:Restriction ; - owl:minCardinality 0 ; - owl:onProperty data_sheets_schema:name ], + owl:allValuesFrom linkml:String ; + owl:onProperty data_sheets_schema:description ], [ a owl:Restriction ; - owl:minCardinality 1 ; - owl:onProperty data_sheets_schema:id ], + owl:allValuesFrom linkml:String ; + owl:onProperty data_sheets_schema:name ], [ a owl:Restriction ; - owl:maxCardinality 1 ; + owl:minCardinality 0 ; owl:onProperty data_sheets_schema:description ], [ a owl:Restriction ; - owl:allValuesFrom linkml:Uriorcurie ; - owl:onProperty data_sheets_schema:id ], + owl:minCardinality 0 ; + owl:onProperty data_sheets_schema:name ], [ a owl:Restriction ; owl:maxCardinality 1 ; owl:onProperty data_sheets_schema:name ], [ a owl:Restriction ; - owl:minCardinality 0 ; - owl:onProperty data_sheets_schema:description ] ; + owl:maxCardinality 1 ; + owl:onProperty data_sheets_schema:description ], + [ a owl:Restriction ; + owl:minCardinality 1 ; + owl:onProperty data_sheets_schema:id ] ; skos:definition "A generic grouping for any identifiable entity." ; skos:exactMatch schema1:Thing ; skos:inScheme data_sheets_schema:base . @@ -5202,431 +5202,431 @@ data_sheets_schema:Dataset a owl:Class, linkml:ClassDefinition ; rdfs:label "Dataset" ; rdfs:subClassOf [ a owl:Restriction ; - owl:allValuesFrom ; - owl:onProperty data_sheets_schema:related_datasets ], - [ a owl:Restriction ; - owl:allValuesFrom ; - owl:onProperty data_sheets_schema:extension_mechanism ], - [ a owl:Restriction ; - owl:allValuesFrom ; - owl:onProperty data_sheets_schema:raw_sources ], + owl:allValuesFrom ; + owl:onProperty data_sheets_schema:external_resources ], [ a owl:Restriction ; owl:minCardinality 0 ; - owl:onProperty data_sheets_schema:parent_datasets ], - [ a owl:Restriction ; - owl:allValuesFrom ; - owl:onProperty data_sheets_schema:errata ], + owl:onProperty data_sheets_schema:informed_consent ], [ a owl:Restriction ; owl:minCardinality 0 ; - owl:onProperty data_sheets_schema:resources ], - [ a owl:Restriction ; - owl:allValuesFrom linkml:String ; - owl:onProperty data_sheets_schema:citation ], + owl:onProperty data_sheets_schema:cleaning_strategies ], [ a owl:Restriction ; owl:minCardinality 0 ; - owl:onProperty data_sheets_schema:related_datasets ], + owl:onProperty data_sheets_schema:is_tabular ], [ a owl:Restriction ; - owl:minCardinality 0 ; - owl:onProperty data_sheets_schema:ip_restrictions ], + owl:allValuesFrom ; + owl:onProperty data_sheets_schema:content_warnings ], [ a owl:Restriction ; owl:minCardinality 0 ; owl:onProperty data_sheets_schema:file_collections ], - [ a owl:Restriction ; - owl:maxCardinality 1 ; - owl:onProperty data_sheets_schema:updates ], - [ a owl:Restriction ; - owl:minCardinality 0 ; - owl:onProperty data_sheets_schema:participant_privacy ], [ a owl:Restriction ; owl:minCardinality 0 ; - owl:onProperty data_sheets_schema:data_collectors ], - [ a owl:Restriction ; - owl:allValuesFrom ; - owl:onProperty data_sheets_schema:collection_mechanisms ], + owl:onProperty data_sheets_schema:known_limitations ], [ a owl:Restriction ; owl:minCardinality 0 ; - owl:onProperty data_sheets_schema:raw_sources ], + owl:onProperty data_sheets_schema:distribution_formats ], [ a owl:Restriction ; owl:minCardinality 0 ; - owl:onProperty data_sheets_schema:errata ], + owl:onProperty data_sheets_schema:parent_datasets ], [ a owl:Restriction ; - owl:minCardinality 0 ; - owl:onProperty data_sheets_schema:retention_limit ], + owl:allValuesFrom ; + owl:onProperty data_sheets_schema:anomalies ], [ a owl:Restriction ; - owl:allValuesFrom linkml:Integer ; - owl:onProperty data_sheets_schema:total_file_count ], + owl:allValuesFrom ; + owl:onProperty data_sheets_schema:ethical_reviews ], [ a owl:Restriction ; - owl:minCardinality 0 ; - owl:onProperty data_sheets_schema:is_deidentified ], + owl:allValuesFrom ; + owl:onProperty data_sheets_schema:known_biases ], [ a owl:Restriction ; - owl:allValuesFrom ; - owl:onProperty data_sheets_schema:distribution_dates ], + owl:allValuesFrom ; + owl:onProperty data_sheets_schema:errata ], [ a owl:Restriction ; - owl:allValuesFrom ; - owl:onProperty data_sheets_schema:use_repository ], + owl:allValuesFrom ; + owl:onProperty data_sheets_schema:known_limitations ], [ a owl:Restriction ; owl:minCardinality 0 ; - owl:onProperty data_sheets_schema:maintainers ], + owl:onProperty data_sheets_schema:total_file_count ], [ a owl:Restriction ; - owl:allValuesFrom ; - owl:onProperty data_sheets_schema:confidential_elements ], + owl:allValuesFrom ; + owl:onProperty data_sheets_schema:distribution_formats ], [ a owl:Restriction ; - owl:minCardinality 0 ; - owl:onProperty data_sheets_schema:cleaning_strategies ], + owl:allValuesFrom ; + owl:onProperty data_sheets_schema:version_access ], [ a owl:Restriction ; owl:minCardinality 0 ; - owl:onProperty data_sheets_schema:instances ], - [ a owl:Restriction ; - owl:allValuesFrom ; owl:onProperty data_sheets_schema:existing_uses ], [ a owl:Restriction ; - owl:minCardinality 0 ; - owl:onProperty data_sheets_schema:content_warnings ], + owl:maxCardinality 1 ; + owl:onProperty data_sheets_schema:citation ], [ a owl:Restriction ; - owl:allValuesFrom ; - owl:onProperty data_sheets_schema:informed_consent ], + owl:maxCardinality 1 ; + owl:onProperty data_sheets_schema:total_size_bytes ], [ a owl:Restriction ; owl:minCardinality 0 ; - owl:onProperty data_sheets_schema:ethical_reviews ], + owl:onProperty data_sheets_schema:future_use_impacts ], + [ a owl:Restriction ; + owl:allValuesFrom ; + owl:onProperty data_sheets_schema:tasks ], [ a owl:Restriction ; owl:minCardinality 0 ; - owl:onProperty data_sheets_schema:labeling_strategies ], + owl:onProperty data_sheets_schema:ethical_reviews ], [ a owl:Restriction ; owl:maxCardinality 1 ; - owl:onProperty data_sheets_schema:at_risk_populations ], + owl:onProperty data_sheets_schema:human_subject_research ], [ a owl:Restriction ; - owl:allValuesFrom ; - owl:onProperty data_sheets_schema:regulatory_restrictions ], + owl:allValuesFrom ; + owl:onProperty data_sheets_schema:sensitive_elements ], [ a owl:Restriction ; - owl:minCardinality 0 ; - owl:onProperty data_sheets_schema:preprocessing_strategies ], + owl:allValuesFrom ; + owl:onProperty data_sheets_schema:human_subject_research ], [ a owl:Restriction ; - owl:allValuesFrom ; - owl:onProperty data_sheets_schema:instances ], + owl:allValuesFrom ; + owl:onProperty data_sheets_schema:ip_restrictions ], [ a owl:Restriction ; - owl:allValuesFrom ; - owl:onProperty data_sheets_schema:participant_compensation ], + owl:allValuesFrom ; + owl:onProperty data_sheets_schema:intended_uses ], [ a owl:Restriction ; owl:minCardinality 0 ; - owl:onProperty data_sheets_schema:creators ], - [ a owl:Restriction ; - owl:allValuesFrom ; - owl:onProperty data_sheets_schema:ethical_reviews ], - [ a owl:Restriction ; - owl:allValuesFrom ; - owl:onProperty data_sheets_schema:creators ], - [ a owl:Restriction ; - owl:allValuesFrom data_sheets_schema:FileCollection ; - owl:onProperty data_sheets_schema:file_collections ], + owl:onProperty data_sheets_schema:anomalies ], [ a owl:Restriction ; - owl:allValuesFrom ; - owl:onProperty data_sheets_schema:missing_data_documentation ], + owl:allValuesFrom ; + owl:onProperty data_sheets_schema:addressing_gaps ], [ a owl:Restriction ; - owl:allValuesFrom ; - owl:onProperty data_sheets_schema:sensitive_elements ], + owl:allValuesFrom ; + owl:onProperty data_sheets_schema:labeling_strategies ], [ a owl:Restriction ; owl:minCardinality 0 ; - owl:onProperty data_sheets_schema:sensitive_elements ], + owl:onProperty data_sheets_schema:version_access ], [ a owl:Restriction ; - owl:minCardinality 0 ; - owl:onProperty data_sheets_schema:funders ], + owl:maxCardinality 1 ; + owl:onProperty data_sheets_schema:regulatory_restrictions ], [ a owl:Restriction ; - owl:allValuesFrom ; - owl:onProperty data_sheets_schema:distribution_formats ], + owl:allValuesFrom ; + owl:onProperty data_sheets_schema:cleaning_strategies ], [ a owl:Restriction ; owl:minCardinality 0 ; - owl:onProperty data_sheets_schema:use_repository ], + owl:onProperty data_sheets_schema:known_biases ], [ a owl:Restriction ; owl:minCardinality 0 ; - owl:onProperty data_sheets_schema:existing_uses ], + owl:onProperty data_sheets_schema:collection_mechanisms ], [ a owl:Restriction ; - owl:allValuesFrom ; - owl:onProperty data_sheets_schema:raw_data_sources ], + owl:allValuesFrom ; + owl:onProperty data_sheets_schema:data_protection_impacts ], [ a owl:Restriction ; owl:minCardinality 0 ; - owl:onProperty data_sheets_schema:collection_timeframes ], - [ a owl:Restriction ; - owl:allValuesFrom linkml:Boolean ; - owl:onProperty data_sheets_schema:is_tabular ], + owl:onProperty data_sheets_schema:confidential_elements ], [ a owl:Restriction ; owl:minCardinality 0 ; - owl:onProperty data_sheets_schema:distribution_dates ], + owl:onProperty data_sheets_schema:license_and_use_terms ], [ a owl:Restriction ; owl:minCardinality 0 ; - owl:onProperty data_sheets_schema:subpopulations ], + owl:onProperty data_sheets_schema:retention_limit ], [ a owl:Restriction ; owl:minCardinality 0 ; - owl:onProperty data_sheets_schema:confidential_elements ], + owl:onProperty data_sheets_schema:participant_privacy ], [ a owl:Restriction ; - owl:minCardinality 0 ; - owl:onProperty data_sheets_schema:citation ], + owl:allValuesFrom ; + owl:onProperty data_sheets_schema:related_datasets ], [ a owl:Restriction ; - owl:allValuesFrom ; - owl:onProperty data_sheets_schema:intended_uses ], + owl:allValuesFrom ; + owl:onProperty data_sheets_schema:maintainers ], [ a owl:Restriction ; - owl:maxCardinality 1 ; - owl:onProperty data_sheets_schema:version_access ], + owl:allValuesFrom ; + owl:onProperty data_sheets_schema:annotation_analyses ], [ a owl:Restriction ; - owl:allValuesFrom ; - owl:onProperty data_sheets_schema:preprocessing_strategies ], + owl:allValuesFrom ; + owl:onProperty data_sheets_schema:use_repository ], [ a owl:Restriction ; owl:minCardinality 0 ; - owl:onProperty data_sheets_schema:known_biases ], - [ a owl:Restriction ; - owl:allValuesFrom ; - owl:onProperty data_sheets_schema:license_and_use_terms ], + owl:onProperty data_sheets_schema:tasks ], [ a owl:Restriction ; owl:minCardinality 0 ; - owl:onProperty data_sheets_schema:addressing_gaps ], + owl:onProperty data_sheets_schema:variables ], [ a owl:Restriction ; - owl:allValuesFrom ; - owl:onProperty data_sheets_schema:prohibited_uses ], + owl:minCardinality 0 ; + owl:onProperty data_sheets_schema:content_warnings ], [ a owl:Restriction ; owl:minCardinality 0 ; - owl:onProperty data_sheets_schema:discouraged_uses ], + owl:onProperty data_sheets_schema:resources ], + [ a owl:Restriction ; + owl:allValuesFrom ; + owl:onProperty data_sheets_schema:preprocessing_strategies ], [ a owl:Restriction ; owl:maxCardinality 1 ; - owl:onProperty data_sheets_schema:human_subject_research ], + owl:onProperty data_sheets_schema:is_tabular ], [ a owl:Restriction ; owl:minCardinality 0 ; - owl:onProperty data_sheets_schema:imputation_protocols ], + owl:onProperty data_sheets_schema:subsets ], [ a owl:Restriction ; - owl:minCardinality 0 ; - owl:onProperty data_sheets_schema:external_resources ], + owl:allValuesFrom ; + owl:onProperty data_sheets_schema:creators ], [ a owl:Restriction ; - owl:allValuesFrom ; - owl:onProperty data_sheets_schema:other_tasks ], + owl:allValuesFrom ; + owl:onProperty data_sheets_schema:at_risk_populations ], [ a owl:Restriction ; owl:minCardinality 0 ; - owl:onProperty data_sheets_schema:extension_mechanism ], + owl:onProperty data_sheets_schema:participant_compensation ], [ a owl:Restriction ; owl:minCardinality 0 ; - owl:onProperty data_sheets_schema:tasks ], - [ a owl:Restriction ; - owl:maxCardinality 1 ; owl:onProperty data_sheets_schema:ip_restrictions ], - [ a owl:Restriction ; - owl:allValuesFrom ; - owl:onProperty data_sheets_schema:addressing_gaps ], [ a owl:Restriction ; owl:minCardinality 0 ; - owl:onProperty data_sheets_schema:at_risk_populations ], - [ a owl:Restriction ; - owl:minCardinality 0 ; - owl:onProperty data_sheets_schema:future_use_impacts ], + owl:onProperty data_sheets_schema:annotation_analyses ], [ a owl:Restriction ; owl:minCardinality 0 ; owl:onProperty data_sheets_schema:missing_data_documentation ], - [ a owl:Restriction ; - owl:allValuesFrom ; - owl:onProperty data_sheets_schema:discouraged_uses ], [ a owl:Restriction ; owl:minCardinality 0 ; - owl:onProperty data_sheets_schema:is_tabular ], + owl:onProperty data_sheets_schema:creators ], [ a owl:Restriction ; owl:maxCardinality 1 ; - owl:onProperty data_sheets_schema:license_and_use_terms ], + owl:onProperty data_sheets_schema:total_file_count ], [ a owl:Restriction ; - owl:allValuesFrom ; - owl:onProperty data_sheets_schema:version_access ], + owl:minCardinality 0 ; + owl:onProperty data_sheets_schema:total_size_bytes ], [ a owl:Restriction ; - owl:allValuesFrom ; - owl:onProperty data_sheets_schema:acquisition_methods ], + owl:minCardinality 0 ; + owl:onProperty data_sheets_schema:external_resources ], [ a owl:Restriction ; - owl:allValuesFrom ; - owl:onProperty data_sheets_schema:sampling_strategies ], + owl:minCardinality 0 ; + owl:onProperty data_sheets_schema:other_tasks ], [ a owl:Restriction ; - owl:allValuesFrom ; - owl:onProperty data_sheets_schema:data_protection_impacts ], + owl:allValuesFrom data_sheets_schema:DataSubset ; + owl:onProperty data_sheets_schema:subsets ], [ a owl:Restriction ; - owl:allValuesFrom ; - owl:onProperty data_sheets_schema:cleaning_strategies ], + owl:allValuesFrom ; + owl:onProperty data_sheets_schema:distribution_dates ], [ a owl:Restriction ; - owl:allValuesFrom ; - owl:onProperty data_sheets_schema:annotation_analyses ], + owl:allValuesFrom ; + owl:onProperty data_sheets_schema:subpopulations ], [ a owl:Restriction ; owl:minCardinality 0 ; - owl:onProperty data_sheets_schema:data_protection_impacts ], + owl:onProperty data_sheets_schema:sensitive_elements ], [ a owl:Restriction ; - owl:minCardinality 0 ; - owl:onProperty data_sheets_schema:intended_uses ], + owl:allValuesFrom ; + owl:onProperty data_sheets_schema:participant_compensation ], [ a owl:Restriction ; owl:minCardinality 0 ; - owl:onProperty data_sheets_schema:anomalies ], + owl:onProperty data_sheets_schema:at_risk_populations ], [ a owl:Restriction ; - owl:allValuesFrom ; - owl:onProperty data_sheets_schema:is_deidentified ], + owl:allValuesFrom ; + owl:onProperty data_sheets_schema:funders ], [ a owl:Restriction ; - owl:allValuesFrom ; - owl:onProperty data_sheets_schema:human_subject_research ], + owl:minCardinality 0 ; + owl:onProperty data_sheets_schema:purposes ], + [ a owl:Restriction ; + owl:allValuesFrom linkml:Boolean ; + owl:onProperty data_sheets_schema:is_tabular ], [ a owl:Restriction ; owl:minCardinality 0 ; - owl:onProperty data_sheets_schema:total_size_bytes ], + owl:onProperty data_sheets_schema:instances ], [ a owl:Restriction ; owl:minCardinality 0 ; - owl:onProperty data_sheets_schema:acquisition_methods ], + owl:onProperty data_sheets_schema:imputation_protocols ], [ a owl:Restriction ; - owl:allValuesFrom ; - owl:onProperty data_sheets_schema:known_biases ], + owl:allValuesFrom linkml:Integer ; + owl:onProperty data_sheets_schema:total_size_bytes ], [ a owl:Restriction ; owl:maxCardinality 1 ; - owl:onProperty data_sheets_schema:is_tabular ], + owl:onProperty data_sheets_schema:ip_restrictions ], [ a owl:Restriction ; owl:minCardinality 0 ; - owl:onProperty data_sheets_schema:purposes ], + owl:onProperty data_sheets_schema:data_collectors ], + [ a owl:Restriction ; + owl:maxCardinality 1 ; + owl:onProperty data_sheets_schema:version_access ], [ a owl:Restriction ; owl:minCardinality 0 ; - owl:onProperty data_sheets_schema:license_and_use_terms ], + owl:onProperty data_sheets_schema:raw_sources ], [ a owl:Restriction ; - owl:allValuesFrom ; - owl:onProperty data_sheets_schema:known_limitations ], + owl:allValuesFrom data_sheets_schema:FileCollection ; + owl:onProperty data_sheets_schema:file_collections ], [ a owl:Restriction ; - owl:allValuesFrom ; - owl:onProperty data_sheets_schema:at_risk_populations ], + owl:allValuesFrom ; + owl:onProperty data_sheets_schema:updates ], [ a owl:Restriction ; - owl:minCardinality 0 ; - owl:onProperty data_sheets_schema:annotation_analyses ], + owl:maxCardinality 1 ; + owl:onProperty data_sheets_schema:updates ], [ a owl:Restriction ; - owl:allValuesFrom ; - owl:onProperty data_sheets_schema:imputation_protocols ], + owl:allValuesFrom ; + owl:onProperty data_sheets_schema:instances ], + [ a owl:Restriction ; + owl:maxCardinality 1 ; + owl:onProperty data_sheets_schema:extension_mechanism ], [ a owl:Restriction ; owl:allValuesFrom ; owl:onProperty data_sheets_schema:participant_privacy ], [ a owl:Restriction ; owl:minCardinality 0 ; - owl:onProperty data_sheets_schema:informed_consent ], + owl:onProperty data_sheets_schema:is_deidentified ], [ a owl:Restriction ; - owl:allValuesFrom ; - owl:onProperty data_sheets_schema:labeling_strategies ], + owl:allValuesFrom ; + owl:onProperty data_sheets_schema:collection_mechanisms ], [ a owl:Restriction ; owl:minCardinality 0 ; - owl:onProperty data_sheets_schema:machine_annotation_tools ], + owl:onProperty data_sheets_schema:updates ], [ a owl:Restriction ; owl:minCardinality 0 ; + owl:onProperty data_sheets_schema:human_subject_research ], + [ a owl:Restriction ; + owl:allValuesFrom ; + owl:onProperty data_sheets_schema:future_use_impacts ], + [ a owl:Restriction ; + owl:allValuesFrom ; + owl:onProperty data_sheets_schema:retention_limit ], + [ a owl:Restriction ; + owl:allValuesFrom ; owl:onProperty data_sheets_schema:raw_data_sources ], + [ a owl:Restriction ; + owl:allValuesFrom ; + owl:onProperty data_sheets_schema:imputation_protocols ], [ a owl:Restriction ; owl:minCardinality 0 ; - owl:onProperty data_sheets_schema:total_file_count ], + owl:onProperty data_sheets_schema:related_datasets ], [ a owl:Restriction ; - owl:maxCardinality 1 ; - owl:onProperty data_sheets_schema:extension_mechanism ], + owl:allValuesFrom ; + owl:onProperty data_sheets_schema:other_tasks ], [ a owl:Restriction ; - owl:allValuesFrom ; - owl:onProperty data_sheets_schema:data_collectors ], + owl:minCardinality 0 ; + owl:onProperty data_sheets_schema:labeling_strategies ], [ a owl:Restriction ; - owl:allValuesFrom ; - owl:onProperty data_sheets_schema:external_resources ], + owl:allValuesFrom ; + owl:onProperty data_sheets_schema:license_and_use_terms ], + [ a owl:Restriction ; + owl:allValuesFrom ; + owl:onProperty data_sheets_schema:confidential_elements ], + [ a owl:Restriction ; + owl:allValuesFrom ; + owl:onProperty data_sheets_schema:regulatory_restrictions ], + [ a owl:Restriction ; + owl:allValuesFrom linkml:String ; + owl:onProperty data_sheets_schema:citation ], [ a owl:Restriction ; owl:allValuesFrom data_sheets_schema:Dataset ; owl:onProperty data_sheets_schema:resources ], - [ a owl:Restriction ; - owl:allValuesFrom ; - owl:onProperty data_sheets_schema:content_warnings ], [ a owl:Restriction ; owl:maxCardinality 1 ; - owl:onProperty data_sheets_schema:retention_limit ], + owl:onProperty data_sheets_schema:at_risk_populations ], [ a owl:Restriction ; - owl:minCardinality 0 ; - owl:onProperty data_sheets_schema:variables ], + owl:allValuesFrom ; + owl:onProperty data_sheets_schema:informed_consent ], [ a owl:Restriction ; - owl:maxCardinality 1 ; + owl:allValuesFrom ; + owl:onProperty data_sheets_schema:discouraged_uses ], + [ a owl:Restriction ; + owl:minCardinality 0 ; owl:onProperty data_sheets_schema:regulatory_restrictions ], + [ a owl:Restriction ; + owl:allValuesFrom ; + owl:onProperty data_sheets_schema:purposes ], [ a owl:Restriction ; owl:minCardinality 0 ; - owl:onProperty data_sheets_schema:known_limitations ], + owl:onProperty data_sheets_schema:addressing_gaps ], [ a owl:Restriction ; owl:minCardinality 0 ; - owl:onProperty data_sheets_schema:collection_mechanisms ], + owl:onProperty data_sheets_schema:machine_annotation_tools ], [ a owl:Restriction ; - owl:allValuesFrom ; - owl:onProperty data_sheets_schema:tasks ], + owl:minCardinality 0 ; + owl:onProperty data_sheets_schema:acquisition_methods ], [ a owl:Restriction ; - owl:allValuesFrom ; - owl:onProperty data_sheets_schema:anomalies ], + owl:minCardinality 0 ; + owl:onProperty data_sheets_schema:distribution_dates ], [ a owl:Restriction ; - owl:allValuesFrom ; - owl:onProperty data_sheets_schema:funders ], + owl:allValuesFrom ; + owl:onProperty data_sheets_schema:extension_mechanism ], + [ a owl:Restriction ; + owl:minCardinality 0 ; + owl:onProperty data_sheets_schema:citation ], + [ a owl:Restriction ; + owl:allValuesFrom ; + owl:onProperty data_sheets_schema:raw_sources ], [ a owl:Restriction ; owl:allValuesFrom ; owl:onProperty data_sheets_schema:variables ], [ a owl:Restriction ; - owl:allValuesFrom data_sheets_schema:DataSubset ; - owl:onProperty data_sheets_schema:subsets ], + owl:maxCardinality 1 ; + owl:onProperty data_sheets_schema:is_deidentified ], + [ a owl:Restriction ; + owl:allValuesFrom ; + owl:onProperty data_sheets_schema:collection_timeframes ], + [ a owl:Restriction ; + owl:allValuesFrom ; + owl:onProperty data_sheets_schema:machine_annotation_tools ], [ a owl:Restriction ; owl:minCardinality 0 ; - owl:onProperty data_sheets_schema:subsets ], + owl:onProperty data_sheets_schema:maintainers ], [ a owl:Restriction ; owl:minCardinality 0 ; - owl:onProperty data_sheets_schema:human_subject_research ], + owl:onProperty data_sheets_schema:prohibited_uses ], [ a owl:Restriction ; - owl:maxCardinality 1 ; - owl:onProperty data_sheets_schema:total_size_bytes ], + owl:minCardinality 0 ; + owl:onProperty data_sheets_schema:sampling_strategies ], [ a owl:Restriction ; - owl:allValuesFrom ; - owl:onProperty data_sheets_schema:updates ], + owl:minCardinality 0 ; + owl:onProperty data_sheets_schema:errata ], [ a owl:Restriction ; - owl:allValuesFrom ; - owl:onProperty data_sheets_schema:retention_limit ], + owl:minCardinality 0 ; + owl:onProperty data_sheets_schema:use_repository ], [ a owl:Restriction ; - owl:allValuesFrom ; - owl:onProperty data_sheets_schema:subpopulations ], + owl:allValuesFrom ; + owl:onProperty data_sheets_schema:existing_uses ], [ a owl:Restriction ; owl:maxCardinality 1 ; - owl:onProperty data_sheets_schema:citation ], + owl:onProperty data_sheets_schema:retention_limit ], [ a owl:Restriction ; owl:minCardinality 0 ; - owl:onProperty data_sheets_schema:regulatory_restrictions ], + owl:onProperty data_sheets_schema:collection_timeframes ], [ a owl:Restriction ; owl:minCardinality 0 ; - owl:onProperty data_sheets_schema:sampling_strategies ], + owl:onProperty data_sheets_schema:discouraged_uses ], [ a owl:Restriction ; owl:minCardinality 0 ; - owl:onProperty data_sheets_schema:participant_compensation ], + owl:onProperty data_sheets_schema:preprocessing_strategies ], [ a owl:Restriction ; - owl:allValuesFrom ; - owl:onProperty data_sheets_schema:purposes ], + owl:allValuesFrom ; + owl:onProperty data_sheets_schema:missing_data_documentation ], [ a owl:Restriction ; owl:minCardinality 0 ; - owl:onProperty data_sheets_schema:distribution_formats ], - [ a owl:Restriction ; - owl:allValuesFrom ; - owl:onProperty data_sheets_schema:maintainers ], - [ a owl:Restriction ; - owl:maxCardinality 1 ; - owl:onProperty data_sheets_schema:total_file_count ], + owl:onProperty data_sheets_schema:raw_data_sources ], [ a owl:Restriction ; - owl:allValuesFrom data_sheets_schema:Dataset ; - owl:onProperty data_sheets_schema:parent_datasets ], + owl:allValuesFrom ; + owl:onProperty data_sheets_schema:acquisition_methods ], [ a owl:Restriction ; owl:minCardinality 0 ; - owl:onProperty data_sheets_schema:prohibited_uses ], + owl:onProperty data_sheets_schema:data_protection_impacts ], [ a owl:Restriction ; owl:minCardinality 0 ; - owl:onProperty data_sheets_schema:version_access ], + owl:onProperty data_sheets_schema:subpopulations ], [ a owl:Restriction ; - owl:allValuesFrom ; - owl:onProperty data_sheets_schema:ip_restrictions ], + owl:allValuesFrom ; + owl:onProperty data_sheets_schema:is_deidentified ], + [ a owl:Restriction ; + owl:allValuesFrom linkml:Integer ; + owl:onProperty data_sheets_schema:total_file_count ], [ a owl:Restriction ; owl:minCardinality 0 ; - owl:onProperty data_sheets_schema:other_tasks ], + owl:onProperty data_sheets_schema:extension_mechanism ], [ a owl:Restriction ; - owl:allValuesFrom ; - owl:onProperty data_sheets_schema:future_use_impacts ], + owl:allValuesFrom ; + owl:onProperty data_sheets_schema:data_collectors ], [ a owl:Restriction ; - owl:allValuesFrom ; - owl:onProperty data_sheets_schema:collection_timeframes ], + owl:allValuesFrom data_sheets_schema:Dataset ; + owl:onProperty data_sheets_schema:parent_datasets ], + [ a owl:Restriction ; + owl:allValuesFrom ; + owl:onProperty data_sheets_schema:prohibited_uses ], [ a owl:Restriction ; owl:minCardinality 0 ; - owl:onProperty data_sheets_schema:updates ], + owl:onProperty data_sheets_schema:intended_uses ], [ a owl:Restriction ; - owl:maxCardinality 1 ; - owl:onProperty data_sheets_schema:is_deidentified ], + owl:minCardinality 0 ; + owl:onProperty data_sheets_schema:funders ], [ a owl:Restriction ; - owl:allValuesFrom ; - owl:onProperty data_sheets_schema:machine_annotation_tools ], + owl:allValuesFrom ; + owl:onProperty data_sheets_schema:sampling_strategies ], [ a owl:Restriction ; - owl:allValuesFrom linkml:Integer ; - owl:onProperty data_sheets_schema:total_size_bytes ], + owl:maxCardinality 1 ; + owl:onProperty data_sheets_schema:license_and_use_terms ], data_sheets_schema:Information ; skos:altLabel "data file", "data package", @@ -5944,38 +5944,38 @@ data_sheets_schema:DatasetProperty a owl:Class, linkml:ClassDefinition ; rdfs:label "DatasetProperty" ; rdfs:subClassOf [ a owl:Restriction ; - owl:allValuesFrom data_sheets_schema:Software ; - owl:onProperty data_sheets_schema:used_software ], - [ a owl:Restriction ; owl:maxCardinality 1 ; owl:onProperty data_sheets_schema:name ], [ a owl:Restriction ; - owl:allValuesFrom linkml:String ; - owl:onProperty data_sheets_schema:name ], + owl:minCardinality 0 ; + owl:onProperty data_sheets_schema:id ], [ a owl:Restriction ; owl:minCardinality 0 ; - owl:onProperty data_sheets_schema:used_software ], + owl:onProperty data_sheets_schema:description ], [ a owl:Restriction ; owl:maxCardinality 1 ; owl:onProperty data_sheets_schema:id ], [ a owl:Restriction ; - owl:maxCardinality 1 ; - owl:onProperty data_sheets_schema:description ], + owl:minCardinality 0 ; + owl:onProperty data_sheets_schema:used_software ], [ a owl:Restriction ; owl:minCardinality 0 ; + owl:onProperty data_sheets_schema:name ], + [ a owl:Restriction ; + owl:maxCardinality 1 ; owl:onProperty data_sheets_schema:description ], [ a owl:Restriction ; owl:allValuesFrom linkml:String ; owl:onProperty data_sheets_schema:description ], [ a owl:Restriction ; - owl:minCardinality 0 ; - owl:onProperty data_sheets_schema:id ], - [ a owl:Restriction ; - owl:minCardinality 0 ; - owl:onProperty data_sheets_schema:name ], + owl:allValuesFrom data_sheets_schema:Software ; + owl:onProperty data_sheets_schema:used_software ], [ a owl:Restriction ; owl:allValuesFrom linkml:Uriorcurie ; - owl:onProperty data_sheets_schema:id ] ; + owl:onProperty data_sheets_schema:id ], + [ a owl:Restriction ; + owl:allValuesFrom linkml:String ; + owl:onProperty data_sheets_schema:name ] ; skos:definition "Represents a single property of a dataset, or a set of related properties." ; skos:inScheme data_sheets_schema:base . diff --git a/src/data_sheets_schema/datamodel/data_sheets_schema.py b/src/data_sheets_schema/datamodel/data_sheets_schema.py index d61c40f9..c92d2412 100644 --- a/src/data_sheets_schema/datamodel/data_sheets_schema.py +++ b/src/data_sheets_schema/datamodel/data_sheets_schema.py @@ -1,5 +1,5 @@ # Auto generated from data_sheets_schema.yaml by pythongen.py version: 0.0.1 -# Generation date: 2026-04-06T21:13:18 +# Generation date: 2026-04-07T13:03:28 # Schema: data-sheets-schema # # id: https://w3id.org/bridge2ai/data-sheets-schema @@ -3788,7 +3788,7 @@ class slots: slots.resources = Slot(uri=SCHEMA.hasPart, name="resources", curie=SCHEMA.curie('hasPart'), model_uri=DATA_SHEETS_SCHEMA.resources, domain=None, range=Optional[Union[Union[str, DatasetId], list[Union[str, DatasetId]]]]) -slots.dataset__file_collections = Slot(uri=SCHEMA.hasPart, name="dataset__file_collections", curie=SCHEMA.curie('hasPart'), +slots.dataset__file_collections = Slot(uri=D4D.fileCollections, name="dataset__file_collections", curie=D4D.curie('fileCollections'), model_uri=DATA_SHEETS_SCHEMA.dataset__file_collections, domain=None, range=Optional[Union[dict[Union[str, FileCollectionId], Union[dict, FileCollection]], list[Union[dict, FileCollection]]]]) slots.dataset__total_file_count = Slot(uri=D4D.totalFileCount, name="dataset__total_file_count", curie=D4D.curie('totalFileCount'), diff --git a/src/data_sheets_schema/schema/D4D_FileCollection.yaml b/src/data_sheets_schema/schema/D4D_FileCollection.yaml index 25813955..8bdfd70b 100644 --- a/src/data_sheets_schema/schema/D4D_FileCollection.yaml +++ b/src/data_sheets_schema/schema/D4D_FileCollection.yaml @@ -103,6 +103,10 @@ classes: - range: FileCollection multivalued: true inlined_as_list: true + # NOTE: LinkML generator limitation - Generated artifacts (Python datamodel, + # JSON Schema) do not fully reflect this union type constraint. The generated + # code still types resources as Dataset rather than (File | FileCollection). + # This is a known limitation of LinkML's union type handling. attributes: collection_type: description: >- diff --git a/src/data_sheets_schema/schema/data_sheets_schema.yaml b/src/data_sheets_schema/schema/data_sheets_schema.yaml index ccd416b3..e19f8861 100644 --- a/src/data_sheets_schema/schema/data_sheets_schema.yaml +++ b/src/data_sheets_schema/schema/data_sheets_schema.yaml @@ -120,8 +120,8 @@ classes: Collections of files within this dataset. Each collection represents a logical grouping of files with shared characteristics (e.g., all training data, all image files, all raw data files). Maps to nested - RO-Crate Dataset entities via schema:hasPart. - slot_uri: schema:hasPart + RO-Crate Dataset entities via schema:hasPart in RO-Crate converters. + slot_uri: d4d:fileCollections range: FileCollection multivalued: true inlined_as_list: true diff --git a/src/data_sheets_schema/schema/data_sheets_schema_all.yaml b/src/data_sheets_schema/schema/data_sheets_schema_all.yaml index c7edfb8a..e864172e 100644 --- a/src/data_sheets_schema/schema/data_sheets_schema_all.yaml +++ b/src/data_sheets_schema/schema/data_sheets_schema_all.yaml @@ -2171,11 +2171,11 @@ classes: description: Collections of files within this dataset. Each collection represents a logical grouping of files with shared characteristics (e.g., all training data, all image files, all raw data files). Maps to nested RO-Crate Dataset - entities via schema:hasPart. + entities via schema:hasPart in RO-Crate converters. from_schema: https://w3id.org/bridge2ai/data-sheets-schema exact_mappings: - dcat:distribution - slot_uri: schema:hasPart + slot_uri: d4d:fileCollections alias: file_collections owner: Dataset domain_of: @@ -3567,11 +3567,11 @@ classes: description: Collections of files within this dataset. Each collection represents a logical grouping of files with shared characteristics (e.g., all training data, all image files, all raw data files). Maps to nested RO-Crate Dataset - entities via schema:hasPart. + entities via schema:hasPart in RO-Crate converters. from_schema: https://w3id.org/bridge2ai/data-sheets-schema exact_mappings: - dcat:distribution - slot_uri: schema:hasPart + slot_uri: d4d:fileCollections alias: file_collections owner: DataSubset domain_of: diff --git a/src/fairscape_integration/d4d_to_fairscape.py b/src/fairscape_integration/d4d_to_fairscape.py index 442f41b7..d4b8a295 100644 --- a/src/fairscape_integration/d4d_to_fairscape.py +++ b/src/fairscape_integration/d4d_to_fairscape.py @@ -121,6 +121,15 @@ def _build_dataset(self, d4d_dict: Dict[str, Any], hasPart_ids: List[str] = None author_str = str(authors) # Build dataset params using JSON-LD field names (aliases) + # Collect all hasPart references: file collections + other resources + all_hasPart_ids = list(hasPart_ids or []) + + # Include Dataset.resources (non-file-collection nested datasets) in hasPart + if "resources" in d4d_dict and d4d_dict["resources"]: + for resource in d4d_dict["resources"]: + if isinstance(resource, dict) and "id" in resource: + all_hasPart_ids.append(resource["id"]) + dataset_params = { "@id": "./", "@type": ["Dataset", "https://w3id.org/EVI#ROCrate"], @@ -130,7 +139,7 @@ def _build_dataset(self, d4d_dict: Dict[str, Any], hasPart_ids: List[str] = None "version": d4d_dict.get("version", "1.0"), "author": author_str, "license": d4d_dict.get("license", "No license specified"), # Required field - "hasPart": [{"@id": id} for id in (hasPart_ids or [])] # Add file collection references + "hasPart": [{"@id": id} for id in all_hasPart_ids] } # Add optional Schema.org fields @@ -280,6 +289,11 @@ def _build_file_collections(self, d4d_dict: Dict[str, Any]) -> tuple[List[ROCrat if "file_count" in fc: collection_params["d4d:fileCount"] = fc["file_count"] + # TODO: Convert FileCollection.resources (File objects) to RO-Crate File entities + # Currently, file-level metadata in resources is not converted to RO-Crate. + # Future work: iterate fc.get('resources', []), create RO-Crate File entities, + # and add their @ids to hasPart. + # Create nested Dataset element collection_elem = ROCrateMetadataElem(**collection_params) file_collections.append(collection_elem) diff --git a/src/fairscape_integration/fairscape_to_d4d.py b/src/fairscape_integration/fairscape_to_d4d.py index e8dae984..be3121ca 100644 --- a/src/fairscape_integration/fairscape_to_d4d.py +++ b/src/fairscape_integration/fairscape_to_d4d.py @@ -286,6 +286,11 @@ def _build_file_collections(self, nested_datasets: List[Dict]) -> List[Dict[str, if 'd4d:fileCount' in dataset: collection['file_count'] = dataset['d4d:fileCount'] + # TODO: Parse nested Dataset's hasPart to build FileCollection.resources + # Currently, file-level information in RO-Crate File entities is not converted + # to FileCollection.resources (File objects). Future work: parse dataset['hasPart'], + # fetch referenced File entities, and convert to D4D File objects in resources. + # Only add non-empty collections if collection: file_collections.append(collection) diff --git a/src/validation/unified_validator.py b/src/validation/unified_validator.py index 15614f2c..7f68e293 100644 --- a/src/validation/unified_validator.py +++ b/src/validation/unified_validator.py @@ -187,7 +187,7 @@ def migrate_legacy_file_properties(data: Dict[str, Any]) -> tuple[Dict[str, Any] # Check if migration needed all_legacy_props = file_level_props + collection_props + ['bytes'] has_file_props = any(k in data for k in all_legacy_props) - has_collections = 'file_collections' in data and data['file_collections'] + has_collections = 'file_collections' in data if has_file_props and not has_collections: # Create default file collection diff --git a/tests/test_file_collection.py b/tests/test_file_collection.py index a469f11b..cd92d826 100644 --- a/tests/test_file_collection.py +++ b/tests/test_file_collection.py @@ -21,7 +21,7 @@ def test_filecollection_basic_validation(self): 'id': 'test-collection-1', 'name': 'Training Data', 'description': 'Training dataset files', - 'collection_type': 'training_split', + 'collection_type': ['training_split'], 'total_bytes': 1048576, 'file_count': 100 } @@ -29,7 +29,7 @@ def test_filecollection_basic_validation(self): # This should validate without errors when using linkml-validate # For now, just test the data structure is correct self.assertIn('id', filecollection_data) - self.assertEqual(filecollection_data['collection_type'], 'training_split') + self.assertEqual(filecollection_data['collection_type'], ['training_split']) def test_dataset_with_file_collections(self): """Test Dataset containing FileCollections.""" @@ -41,13 +41,13 @@ def test_dataset_with_file_collections(self): { 'id': 'collection-1', 'name': 'Training Files', - 'collection_type': 'training_split', + 'collection_type': ['training_split'], 'total_bytes': 1048576 }, { 'id': 'collection-2', 'name': 'Test Files', - 'collection_type': 'test_split', + 'collection_type': ['test_split'], 'total_bytes': 524288 } ], @@ -77,9 +77,9 @@ def test_filecollection_enum_values(self): collection = { 'id': f'collection-{collection_type}', 'name': f'{collection_type} files', - 'collection_type': collection_type + 'collection_type': [collection_type] } - self.assertEqual(collection['collection_type'], collection_type) + self.assertEqual(collection['collection_type'], [collection_type]) def test_filecollection_properties_complete(self): """Test FileCollection with all collection-level properties.""" @@ -87,7 +87,7 @@ def test_filecollection_properties_complete(self): 'id': 'complete-collection', 'name': 'Complete File Collection', 'description': 'A collection with all properties', - 'collection_type': 'processed_data', + 'collection_type': ['processed_data'], 'total_bytes': 2097152, 'file_count': 50, 'path': '/data/processed/', @@ -231,9 +231,17 @@ def test_write_and_read_filecollection_yaml(self): { 'id': 'test-collection', 'name': 'Test Files', - 'collection_type': 'test_split', - 'format': 'CSV', - 'bytes': 1024 + 'collection_type': ['test_split'], + 'total_bytes': 1024, + 'file_count': 1, + 'resources': [ + { + 'id': 'test001.csv', + 'file_type': 'data_file', + 'format': 'CSV', + 'bytes': 1024 + } + ] } ] } @@ -250,6 +258,7 @@ def test_write_and_read_filecollection_yaml(self): self.assertEqual(loaded_data['id'], 'test-dataset') self.assertEqual(loaded_data['file_collections'][0]['name'], 'Test Files') + self.assertEqual(loaded_data['file_collections'][0]['resources'][0]['format'], 'CSV') finally: Path(temp_path).unlink()