diff --git a/assessments/11_embed_metadata_add_license_fix_html.json b/assessments/11_embed_metadata_add_license_fix_html.json new file mode 100644 index 0000000..4315166 --- /dev/null +++ b/assessments/11_embed_metadata_add_license_fix_html.json @@ -0,0 +1,1699 @@ +{ + "test_id": "b8602b6752b1ecac585ea25af930be5fb4ee698e", + "request": { + "object_identifier": "https:\/\/sandbox.zenodo.org\/records\/502989", + "metadata_service_endpoint": "", + "metadata_service_type": "oai_pmh", + "test_debug": true, + "use_datacite": true, + "metric_version": "metrics_v0.8" + }, + "resolved_url": "https:\/\/sandbox.zenodo.org\/records\/502989", + "start_timestamp": "2026-05-21T16:34:08Z", + "end_timestamp": "2026-05-21T16:34:15Z", + "metric_specification": "https:\/\/doi.org\/10.5281\/zenodo.15045911", + "metric_version": "0.8", + "software_version": "3.5.1", + "total_metrics": 17, + "summary": { + "score_earned": { + "A": 6, + "F": 5, + "I": 2, + "R": 6, + "A1": 2, + "A1.1": 2, + "A1.2": 2, + "F1": 1, + "F2": 1, + "F3": 1, + "F4": 2, + "I1": 2, + "I2": 0, + "I3": 0, + "R1": 2, + "R1.1": 1, + "R1.2": 1, + "R1.3": 2, + "FAIR": 19 + }, + "score_total": { + "A": 7, + "F": 7, + "I": 6, + "R": 6, + "A1": 3, + "A1.1": 2, + "A1.2": 2, + "F1": 2, + "F2": 2, + "F3": 1, + "F4": 2, + "I1": 2, + "I2": 2, + "I3": 2, + "R1": 2, + "R1.1": 1, + "R1.2": 1, + "R1.3": 2, + "FAIR": 26 + }, + "score_percent": { + "A": 85.71, + "F": 71.43, + "I": 33.33, + "R": 100, + "A1": 66.67, + "A1.1": 100, + "A1.2": 100, + "F1": 50, + "F2": 50, + "F3": 100, + "F4": 100, + "I1": 100, + "I2": 0, + "I3": 0, + "R1": 100, + "R1.1": 100, + "R1.2": 100, + "R1.3": 100, + "FAIR": 73.08 + }, + "status_total": { + "A1": 2, + "A1.1": 1, + "A1.2": 1, + "F1": 2, + "F2": 1, + "F3": 1, + "F4": 1, + "I1": 1, + "I2": 1, + "I3": 1, + "R1": 1, + "R1.1": 1, + "R1.2": 1, + "R1.3": 2, + "A": 4, + "F": 5, + "I": 3, + "R": 5, + "FAIR": 17 + }, + "status_passed": { + "A1": 1, + "A1.1": 1, + "A1.2": 1, + "F1": 1, + "F2": 1, + "F3": 1, + 
"F4": 1, + "I1": 0, + "I2": 0, + "I3": 0, + "R1": 1, + "R1.1": 1, + "R1.2": 1, + "R1.3": 2, + "A": 3, + "F": 4, + "I": 0, + "R": 5, + "FAIR": 12 + }, + "maturity": { + "A": 2, + "F": 2, + "I": 1, + "R": 2, + "A1": 2, + "A1.1": 3, + "A1.2": 3, + "F1": 2, + "F2": 2, + "F3": 3, + "F4": 3, + "I1": 2, + "I2": 0, + "I3": 0, + "R1": 3, + "R1.1": 3, + "R1.2": 2, + "R1.3": 2, + "FAIR": 1.75 + } + }, + "results": [ + { + "output": { + "unique_identifiers": [ + { + "guid": "https:\/\/sandbox.zenodo.org\/records\/502989", + "guid_scheme": "url", + "target": "metadata" + }, + { + "guid": "https:\/\/sandbox.zenodo.org\/records\/502989\/files\/marirenab\/fair-hackathon_group2-v1.1.zip", + "guid_scheme": "url", + "target": "data" + } + ], + "guid": "https:\/\/sandbox.zenodo.org\/records\/502989", + "guid_scheme": [ + "url" + ] + }, + "test_debug": [ + "INFO: Using IDUTILS schemes to identify unique or persistent identifiers for metadata", + "INFO: Starting assessment on identifier: https:\/\/sandbox.zenodo.org\/records\/502989", + "SUCCESS: Unique identifier schemes found ['url']", + "INFO: Finalized unique identifier scheme - url", + "INFO: Using idutils schemes to identify unique or persistent identifiers for data", + "INFO: Starting assessment on data identifier: https:\/\/sandbox.zenodo.org\/records\/502989", + "SUCCESS: Unique data identifier schemes found: - ['url']" + ], + "id": 1, + "metric_identifier": "FsF-F1-01MD", + "metric_name": "Metadata and data are assigned a globally unique identifier.", + "metric_tests": { + "FsF-F1-01MD-1": { + "metric_test_name": "Metadata identifier follows a defined unique identifier syntax or scheme (IRI, URL, UUID, HASH or PID)", + "metric_test_requirements": [ + { + "modality": "any", + "required": null, + "tested_on": "https:\/\/f-uji.net\/vocab\/metadata\/property\/object_identifier", + "comment": "identifier can be given as user input", + "target": "https:\/\/f-uji.net\/vocab\/identifier\/unique" + } + ], + "metric_test_score": { + 
"earned": 1, + "total": 1 + }, + "metric_test_maturity": 3, + "metric_test_status": "pass" + }, + "FsF-F1-01MD-2": { + "metric_test_name": "Data identifier follows a defined unique identifier syntax (IRI, URL, UUID, HASH or PID)", + "metric_test_requirements": [ + { + "modality": "any", + "required": null, + "tested_on": "https:\/\/f-uji.net\/vocab\/metadata\/property\/object_identifier", + "comment": "For backwards compatibility reasons this test is not scored", + "target": "https:\/\/f-uji.net\/vocab\/identifier\/unique" + } + ], + "metric_test_score": { + "earned": 0, + "total": 0 + }, + "metric_test_maturity": 3, + "metric_test_status": "pass" + } + }, + "test_status": "pass", + "score": { + "earned": 1, + "total": 1 + }, + "maturity": 3 + }, + { + "id": 2, + "metric_identifier": "FsF-F1-02MD", + "metric_name": "Metadata and data are assigned a persistent identifier.", + "metric_tests": { + "FsF-F1-02MD-1": { + "metric_test_name": "Metadata identifier follows a defined persistent identifier syntax", + "metric_test_requirements": [ + { + "modality": "any", + "required": null, + "tested_on": "https:\/\/f-uji.net\/vocab\/metadata\/property\/object_identifier", + "comment": "Identifier can be given as user input", + "target": "https:\/\/f-uji.net\/vocab\/identifier\/persistent" + } + ], + "metric_test_score": { + "earned": 0, + "total": 0.5 + }, + "metric_test_maturity": 0, + "metric_test_status": "fail" + }, + "FsF-F1-02MD-2": { + "metric_test_name": "Persistent identifier for metadata is registered and maintained by a PID authority", + "metric_test_requirements": [ + { + "modality": null, + "required": null, + "tested_on": "https:\/\/f-uji.net\/vocab\/metadata\/property\/object_identifier", + "comment": "Identifier has to be redirected which verifies it is registered in a PID system", + "target": "https:\/\/f-uji.net\/vocab\/identifier\/persistent" + } + ], + "metric_test_score": { + "earned": 0, + "total": 0.5 + }, + "metric_test_maturity": 0, + 
"metric_test_status": "fail" + }, + "FsF-F1-02MD-4": { + "metric_test_name": "Data identifier follows a defined persistent identifier syntax", + "metric_test_requirements": [ + { + "modality": "any", + "required": null, + "tested_on": "https:\/\/f-uji.net\/vocab\/metadata\/property\/object_identifier", + "comment": "For backwards compatibility reasons this test is not scored", + "target": "https:\/\/f-uji.net\/vocab\/identifier\/persistent" + } + ], + "metric_test_score": { + "earned": 0, + "total": 0 + }, + "metric_test_maturity": 0, + "metric_test_status": "fail" + }, + "FsF-F1-02MD-5": { + "metric_test_name": "Persistent identifier for data is registered and maintained by a PID authority", + "metric_test_requirements": [ + { + "modality": null, + "required": null, + "tested_on": "https:\/\/f-uji.net\/vocab\/metadata\/property\/object_identifier", + "comment": "Identifier has to be redirected which verifies it is registered in a PID system; test is not scored", + "target": "https:\/\/f-uji.net\/vocab\/identifier\/persistent" + } + ], + "metric_test_score": { + "earned": 0, + "total": 0 + }, + "metric_test_maturity": 0, + "metric_test_status": "fail" + } + }, + "test_status": "fail", + "score": { + "earned": 0, + "total": 1 + }, + "maturity": 0, + "output": { + "persistent_identifiers": [ + { + "pid": "https:\/\/doi.org\/10.5072\/zenodo.502989", + "pid_scheme": "doi", + "resolvable_status": false, + "resolved_url": null, + "target": "metadata" + } + ] + }, + "test_debug": [ + "INFO: Retrieving page -: https:\/\/sandbox.zenodo.org\/records\/502989 as text\/html, *\/*", + "INFO: Content negotiation on https:\/\/sandbox.zenodo.org\/records\/502989 accept=text\/html, *\/*, status=200", + "INFO: Creating Cached response content", + "INFO: Found HTML page!", + "INFO: PID schemes-based assessment supported by the assessment service - dict_keys(['ark', 'arxiv', 'bioproject', 'biosample', 'doi', 'ensembl', 'genome', 'gnd', 'handle', 'lsid', 'pmid', 'pmcid', 'purl', 
'refseq', 'sra', 'uniprot', 'urn', 'identifiers.org', 'w3id'])", + "WARNING: PID syntax is OK but the PID seems to resolve to a different entity, will not use this PID for content negotiation", + "INFO: Could not find any persistent identifier for metadata which complies with a known PID syntax", + "WARNING: Could not find any persistent identifier for metadata which is registered", + "INFO: Could not find any persistent identifier for data which complies with a known PID syntax", + "INFO: Could not find any persistent identifier for data which is registered" + ] + }, + { + "id": 5, + "metric_identifier": "FsF-F2-01M", + "metric_name": "Metadata includes descriptive core elements (creator, title, data identifier, publisher, publication date, summary and keywords) to support data findability.", + "metric_tests": { + "FsF-F2-01M-2": { + "metric_test_name": "Core data citation metadata is available", + "metric_test_requirements": [ + { + "modality": "all", + "required": { + "name": [ + "creator", + "title", + "object_identifier", + "publication_date", + "publisher", + "object_type" + ] + }, + "tested_on": "https:\/\/f-uji.net\/vocab\/metadata\/property", + "comment": null, + "target": "https:\/\/f-uji.net\/vocab\/metadata\/property" + } + ], + "metric_test_score": { + "earned": 1, + "total": 1 + }, + "metric_test_maturity": 2, + "metric_test_status": "pass" + }, + "FsF-F2-01M-3": { + "metric_test_name": "Core descriptive metadata is available", + "metric_test_requirements": [ + { + "modality": "all", + "required": { + "name": [ + "creator", + "title", + "object_identifier", + "publication_date", + "publisher", + "object_type", + "summary", + "keywords" + ] + }, + "tested_on": "https:\/\/f-uji.net\/vocab\/metadata\/property", + "comment": null, + "target": "https:\/\/f-uji.net\/vocab\/metadata\/property" + } + ], + "metric_test_score": { + "earned": 0, + "total": 1 + }, + "metric_test_maturity": 0, + "metric_test_status": "fail" + } + }, + "test_status": "pass", + 
"score": { + "earned": 1, + "total": 2 + }, + "maturity": 2, + "output": { + "core_metadata_status": "partial metadata", + "core_metadata_found": { + "object_identifier": [ + "https:\/\/doi.org\/10.5072\/zenodo.502989", + "https:\/\/sandbox.zenodo.org\/records\/502989", + "10.5072\/zenodo.502989" + ], + "title": "marirenab\/fair-hackathon_group2: v1.1", + "summary": "FAIR-data hackathon: iteratively destroy then repair an open dataset, scored by F-UJI", + "publication_date": "2026-05-21", + "publisher": [ + "Zenodo" + ], + "creator": [ + "Marirena Bafaloukou", + "Mateus Harrington" + ], + "object_type": [ + "SoftwareSourceCode", + "http:\/\/schema.org\/WebPage" + ] + }, + "core_metadata_source": [ + [ + "DUBLINCORE_EMBEDDED", + "meta_tag" + ], + [ + "SCHEMAORG_EMBEDDED", + "json_in_html" + ], + [ + "MICRODATA_EMBEDDED", + "microdata" + ], + [ + "HIGHWIRE_EPRINTS_EMBEDDED", + "meta_tag" + ], + [ + "OPENGRAPH_EMBEDDED", + "rdfa" + ] + ] + }, + "test_debug": [ + "INFO: Trying to resolve input URL -: https:\/\/sandbox.zenodo.org\/records\/502989", + "INFO: Starting to analyse EMBEDDED metadata at -: https:\/\/sandbox.zenodo.org\/records\/502989", + "INFO: Trying to identify EMBEDDED Microdata, OpenGraph or Schema.org -: https:\/\/sandbox.zenodo.org\/records\/502989", + "INFO: Trying to retrieve schema.org JSON-LD metadata from html page", + "INFO: Try to parse RDF (JSON-LD) from -: https:\/\/sandbox.zenodo.org\/records\/502989", + "INFO: Try to parse JSON-LD using RDFLib retrieved as string from -: https:\/\/sandbox.zenodo.org\/records\/502989", + "INFO: Found RDF Graph which was sucessfully parsed", + "INFO: Trying to identify namespaces in RDF Graph", + "INFO: RDF Graph seems to contain schema.org metadata elements", + "INFO: Detected main entity found in RDF graph seems not to be a creative work type", + "INFO: Trying to get some core domain agnostic (DCAT, DC, schema.org) metadata from RDF graph", + "INFO: Found some core domain agnostic (DCAT, DC, schema.org) 
metadata from RDF graph -: {'object_identifier': ['https:\/\/doi.org\/10.5072\/zenodo.502989', 'https:\/\/sandbox.zenodo.org\/records\/502989'], 'title': 'marirenab\/fair-hackathon_group2: v1.1', 'summary': 'FAIR-data hackathon: iteratively destroy then repair an open dataset, scored by F-UJI', 'publication_date': '2026-05-21', 'publisher': ['Zenodo'], 'creator': ['Marirena Bafaloukou', 'Mateus Harrington', 'Marirena Bafaloukou', 'Mateus Harrington'], 'license': 'https:\/\/creativecommons.org\/licenses\/by\/4.0\/legalcode', 'object_type': ['SoftwareSourceCode']}", + "SUCCESS: Found embedded (schema.org) JSON-LD metadata in html page -: dict_keys(['object_identifier', 'title', 'summary', 'publication_date', 'publisher', 'creator', 'license', 'object_type', 'object_size'])", + "INFO: Trying to retrieve Dublin Core metadata from html page", + "SUCCESS: Found DublinCore metadata -: dict_keys(['summary'])", + "INFO: Trying to retrieve Microdata metadata from html page", + "INFO: Trying to extract Microdata metadata from -: MetadataSources.MICRODATA_EMBEDDED", + "SUCCESS: Found microdata metadata -: dict_keys(['object_type'])", + "INFO: Trying to retrieve RDFa metadata from html page", + "INFO: Found RDF Graph which was sucessfully parsed", + "INFO: Trying to identify namespaces in RDF Graph", + "INFO: Could not find DCAT, schema.org or SKOS\/OWL metadata, continuing with generic SPARQL", + "INFO: Trying to query generic SPARQL on RDF, found triples: -:25", + "INFO: Found RDFa like triples but at least some of them seem to be XHTML or OpenGraph properties which are excluded", + "INFO: Trying to retrieve Highwire and eprints metadata from html page", + "INFO: Metadata property differs from metadata previously offered in a different formats -: summary: FAIR-data hackathon: iteratively destroy then repa vs. 
https:\/\/sandbox.zenodo.org\/records\/502989", + "SUCCESS: Found Highwire or eprints metadata -: dict_keys(['title', 'object_identifier', 'summary'])", + "INFO: Trying to retrieve OpenGraph metadata from html page", + "INFO: Found OpenGraph metadata-: dict_keys(['title', 'object_identifier', 'summary', 'publisher'])", + "SUCCESS: Found OpenGraph metadata -: dict_keys(['title', 'object_identifier', 'summary', 'publisher'])", + "INFO: Trying to identify Typed Links to data items in html page", + "INFO: Starting to identify EXTERNAL metadata through content negotiation or typed (signposting) links", + "INFO: Trying to retrieve XML metadata through content negotiation from URL -: https:\/\/sandbox.zenodo.org\/records\/502989", + "INFO: Retrieving page -: https:\/\/sandbox.zenodo.org\/records\/502989 as application\/xml, text\/xml;q=0.5", + "INFO: Content negotiation on https:\/\/sandbox.zenodo.org\/records\/502989 accept=application\/xml, text\/xml;q=0.5, status=200", + "INFO: Using Cached response content", + "INFO: Trying to extract\/parse XML metadata from URL -: https:\/\/sandbox.zenodo.org\/records\/502989", + "INFO: Expected XML but content negotiation responded -: MetadataFormats.HTML", + "INFO: Could not identify metadata properties in XML", + "INFO: Trying to retrieve schema.org JSON-LD metadata through content negotiation from URL -: https:\/\/sandbox.zenodo.org\/records\/502989", + "INFO: Retrieving page -: https:\/\/sandbox.zenodo.org\/records\/502989 as application\/ld+json", + "INFO: Content negotiation on https:\/\/sandbox.zenodo.org\/records\/502989 accept=application\/ld+json, status=200", + "INFO: Using Cached response content", + "INFO: Schema.org metadata through content negotiation UNAVAILABLE", + "INFO: Trying to retrieve RDF metadata through content negotiation from URL -: https:\/\/sandbox.zenodo.org\/records\/502989", + "INFO: Retrieving page -: https:\/\/sandbox.zenodo.org\/records\/502989 as text\/turtle, application\/turtle, 
application\/x-turtle;q=0.8, application\/rdf+xml, text\/n3;q=0.9, text\/rdf+n3;q=0.9,application\/ld+json", + "INFO: Content negotiation on https:\/\/sandbox.zenodo.org\/records\/502989 accept=text\/turtle, application\/turtle, application\/x-turtle;q=0.8, application\/rdf+xml, text\/n3;q=0.9, text\/rdf+n3;q=0.9,application\/ld+json, status=200", + "INFO: Using Cached response content", + "INFO: Try to parse RDF from -: https:\/\/sandbox.zenodo.org\/records\/502989 as turtle", + "WARNING: Failed to parse RDF, trying to fix RDF string and retry parsing everything before line -: 9", + "INFO: Failed to parse RDF -: https:\/\/sandbox.zenodo.org\/records\/502989 at line 8 of <>:", + "INFO: Linked Data metadata UNAVAILABLE", + "INFO: Trying to retrieve datacite metadata", + "INFO: Retrieving page -: https:\/\/sandbox.zenodo.org\/records\/502989 as application\/vnd.datacite.datacite+json", + "INFO: Content negotiation on https:\/\/sandbox.zenodo.org\/records\/502989 accept=application\/vnd.datacite.datacite+json, status=200", + "INFO: Using Cached response content", + "WARNING: Failed to extract Datacite JSON -: 'bytes' object has no attribute 'get'", + "INFO: Datacite metadata UNAVAILABLE", + "INFO: Found typed link or signposting link but will ignore (can't handle) mime type -:application\/zip", + "INFO: Type of object described by the metadata -: None", + "INFO: Testing if any metadata has been made available via common web standards", + "SUCCESS: Found required core citation metadata elements -: ['creator', 'title', 'object_identifier', 'publication_date', 'publisher', 'object_type']", + "INFO: Will exclusively consider community specific metadata properties which are specified in metrics -: {'name': ['creator', 'title', 'object_identifier', 'publication_date', 'publisher', 'object_type', 'summary', 'keywords']}", + "WARNING: Not all required core descriptive metadata elements exist, missing -: ['keywords']" + ] + }, + { + "id": 6, + "metric_identifier": 
"FsF-F3-01M", + "metric_name": "Metadata includes the identifier of the data it describes.", + "metric_tests": { + "FsF-F3-01M-2": { + "metric_test_name": "Metadata contains a PID or URL which indicates the location of the downloadable data content", + "metric_test_requirements": [ + { + "modality": "any", + "required": { + "name": [ + "url" + ] + }, + "tested_on": "https:\/\/f-uji.net\/vocab\/metadata\/property\/object_content_identifier", + "comment": null, + "target": "https:\/\/f-uji.net\/vocab\/data\/property" + } + ], + "metric_test_score": { + "earned": 1, + "total": 1 + }, + "metric_test_maturity": 3, + "metric_test_status": "pass" + } + }, + "test_status": "pass", + "score": { + "earned": 1, + "total": 1 + }, + "maturity": 3, + "output": { + "object_identifier_included": null, + "object_content_identifier_included": [ + { + "content_identifier_included": { + "url": "https:\/\/sandbox.zenodo.org\/records\/502989\/files\/marirenab\/fair-hackathon_group2-v1.1.zip", + "scheme": null + } + } + ] + }, + "test_debug": [ + "INFO: Found data links in HTML head (link rel=item) -: 1", + "SUCCESS: Number of object content identifier found -: 1" + ] + }, + { + "id": 7, + "metric_identifier": "FsF-F4-01M", + "metric_name": "Metadata is offered in such a way that it can be registered or indexed by search engines.", + "metric_tests": { + "FsF-F4-01M-1": { + "metric_test_name": "Metadata is given in a way major search engines can ingest it for their catalogues (Dublin Core or schema.org or DCAT encoded in microdata, RDFa, embedded JSON-LD or meta tags see e.g. 
Google Dataset Search webmaster guidelines)", + "metric_test_requirements": [ + { + "modality": "any", + "required": { + "name": [ + "dublin-core", + "schemaorg", + "dcat-data-catalog-vocabulary" + ] + }, + "tested_on": "http:\/\/f-uji.net\/vocab\/metadata", + "comment": null, + "target": "http:\/\/f-uji.net\/vocab\/metadata\/standard" + }, + { + "modality": "any", + "required": { + "name": [ + "rdfa", + "microdata", + "meta_tag", + "json_in_html" + ] + }, + "tested_on": "http:\/\/f-uji.net\/vocab\/metadata", + "comment": null, + "target": "http:\/\/f-uji.net\/vocab\/metadata\/offering_method" + } + ], + "metric_test_score": { + "earned": 2, + "total": 2 + }, + "metric_test_maturity": 3, + "metric_test_status": "pass" + } + }, + "test_status": "pass", + "score": { + "earned": 2, + "total": 2 + }, + "maturity": 3, + "output": { + "search_mechanisms": [ + { + "mechanism": "structured data", + "mechanism_info": [ + "schemaorg via: json_in_html", + "dublin-core via: meta_tag", + "schemaorg via: microdata" + ] + } + ] + }, + "test_debug": [ + "INFO: Will exclusively consider community specific metadata standards for FsF-F4-01M-1 which are specified in metrics -: ['dublin-core', 'schemaorg', 'dcat-data-catalog-vocabulary']", + "INFO: Will exclusively consider community specific metadata offering methods for FsF-F4-01M-1 which are specified in metrics -: ['rdfa', 'microdata', 'meta_tag', 'json_in_html']", + "SUCCESS: Metadata is offered in a way major search engines can ingest it -: ['schemaorg via: json_in_html', 'dublin-core via: meta_tag', 'schemaorg via: microdata']" + ] + }, + { + "id": 8, + "metric_identifier": "FsF-A1-01M", + "metric_name": "Metadata contains access level and access conditions of the data.", + "metric_tests": { + "FsF-A1-01M-1": { + "metric_test_name": "Information about access restrictions or rights can be identified in metadata", + "metric_test_requirements": [ + { + "modality": "any", + "required": null, + "tested_on": null, + "comment": null, + 
"target": "http:\/\/f-uji.net\/vocab\/metadata\/property\/access_level" + } + ], + "metric_test_score": { + "earned": 0, + "total": 1 + }, + "metric_test_maturity": 0, + "metric_test_status": "fail" + } + }, + "test_status": "fail", + "score": { + "earned": 0, + "total": 1 + }, + "maturity": 0, + "output": { + "access_level": null, + "access_details": [] + }, + "test_debug": [ + "WARNING: NO access information is available in metadata", + "INFO: Skipping standard terms test since NO access information is available in metadata", + "INFO: Skipping standard terms test since NO access information is available in metadata", + "INFO: Skipping machine readablility test since NO access information is available in metadata", + "WARNING: Unable to determine the access level" + ] + }, + { + "output": { + "retrievable_objects": [ + { + "format": "http:\/\/schema.org", + "method": "json_in_html", + "resolved_url": "https:\/\/sandbox.zenodo.org\/records\/502989", + "target": "metadata" + }, + { + "format": null, + "method": "url", + "resolved_url": "https:\/\/sandbox.zenodo.org\/records\/502989\/files\/marirenab\/fair-hackathon_group2-v1.1.zip", + "target": "data" + } + ] + }, + "test_debug": [ + "SUCCESS: Found retrievable metadata using the given identifier", + "SUCCESS: Found retrievable data using the given identifier" + ], + "id": 9, + "metric_identifier": "FsF-A1-02MD", + "metric_name": "Metadata and data are retrievable by their identifier", + "metric_tests": { + "FsF-A1-02MD-1": { + "metric_test_name": "Metadata are retrievable via their specified identifier", + "metric_test_requirements": [ + { + "modality": null, + "required": null, + "tested_on": "https:\/\/f-uji.net\/vocab\/transport_protocol", + "comment": "expected is e.g. 
http code 20x", + "target": null + }, + { + "modality": "any", + "required": null, + "tested_on": "https:\/\/f-uji.net\/vocab\/metadata", + "comment": null, + "target": "https:\/\/f-uji.net\/vocab\/metadata\/property" + } + ], + "metric_test_score": { + "earned": 1, + "total": 1 + }, + "metric_test_maturity": 3, + "metric_test_status": "pass" + }, + "FsF-A1-02MD-2": { + "metric_test_name": "Data are retrievable via the identifiers given in metadata", + "metric_test_requirements": [ + { + "modality": null, + "required": null, + "tested_on": "https:\/\/f-uji.net\/vocab\/transport_protocol", + "comment": "expected is e.g. http code 20x", + "target": null + }, + { + "modality": "any", + "required": null, + "tested_on": "https:\/\/f-uji.net\/vocab\/data", + "comment": null, + "target": "https:\/\/f-uji.net\/vocab\/data\/property\/url" + } + ], + "metric_test_score": { + "earned": 1, + "total": 1 + }, + "metric_test_maturity": 3, + "metric_test_status": "pass" + } + }, + "test_status": "pass", + "score": { + "earned": 2, + "total": 2 + }, + "maturity": 3 + }, + { + "output": { + "standard_protocol": [ + { + "protocol_type": "https", + "auth_method": null, + "found_in": "https:\/\/sandbox.zenodo.org\/records\/502989", + "target": "metadata" + }, + { + "protocol_type": "https", + "auth_method": null, + "found_in": "https:\/\/sandbox.zenodo.org\/records\/502989\/files\/marirenab\/fair-hackathon_group2-v1.1.zip", + "target": "data" + } + ] + }, + "test_debug": [ + "SUCCESS: Standard protocol for access to metadata which is assumed to be present found in link -: https:\/\/sandbox.zenodo.org\/records\/502989https", + "SUCCESS: Standard protocol for access to data object found -: https" + ], + "id": 11, + "metric_identifier": "FsF-A1.1-01MD", + "metric_name": "A standardized communication protocol is used to access metadata and data.", + "metric_tests": { + "FsF-A1.1-01MD-1": { + "metric_test_name": "Identifier leading to metadata matches a scheme indicating a standardized web 
communication protocol.", + "metric_test_requirements": [ + { + "modality": "any", + "required": null, + "tested_on": null, + "comment": null, + "target": "https:\/\/f-uji.net\/vocab\/transport_protocol" + } + ], + "metric_test_score": { + "earned": 1, + "total": 1 + }, + "metric_test_maturity": 3, + "metric_test_status": "pass" + }, + "FsF-A1.1-01MD-2": { + "metric_test_name": "Identifier leading to data are matching a schema indicating a standardized web communication protocol.", + "metric_test_requirements": [ + { + "modality": "any", + "required": null, + "tested_on": null, + "comment": null, + "target": "https:\/\/f-uji.net\/vocab\/transport_protocol" + } + ], + "metric_test_score": { + "earned": 1, + "total": 1 + }, + "metric_test_maturity": 3, + "metric_test_status": "pass" + } + }, + "test_status": "pass", + "score": { + "earned": 2, + "total": 2 + }, + "maturity": 3 + }, + { + "output": { + "standard_protocol": [ + { + "protocol_type": "https", + "auth_method": "TLS, BASIC", + "found_in": "https:\/\/sandbox.zenodo.org\/records\/502989", + "target": "metadata" + }, + { + "protocol_type": "https", + "auth_method": "TLS, BASIC", + "found_in": "https:\/\/sandbox.zenodo.org\/records\/502989\/files\/marirenab\/fair-hackathon_group2-v1.1.zip", + "target": "data" + } + ] + }, + "test_debug": [ + "SUCCESS: Standard protocol which supports authentication to access metadata found -: ('https', 'TLS, BASIC')", + "SUCCESS: Standard protocol which supports authentication to access data object found -: ('https', 'TLS, BASIC')" + ], + "id": 12, + "metric_identifier": "FsF-A1.2-01MD", + "metric_name": "Metadata and data are accessible through a standardized communication protocol which supports authentication.", + "metric_tests": { + "FsF-A1.2-01MD-1": { + "metric_test_name": "The communication protocol found in identifiers (IRIs) leading to metadata supports authentication.", + "metric_test_requirements": [ + { + "modality": "any", + "required": null, + "tested_on": 
"https:\/\/f-uji.net\/vocab\/transport_protocol", + "comment": null, + "target": "https:\/\/f-uji.net\/vocab\/authentication_method" + } + ], + "metric_test_score": { + "earned": 1, + "total": 1 + }, + "metric_test_maturity": 3, + "metric_test_status": "pass" + }, + "FsF-A1.2-01MD-2": { + "metric_test_name": "The communication protocol identified in data links (IRIs) supports authentication.", + "metric_test_requirements": [ + { + "modality": "any", + "required": null, + "tested_on": "https:\/\/f-uji.net\/vocab\/transport_protocol", + "comment": null, + "target": "https:\/\/f-uji.net\/vocab\/authentication_method" + } + ], + "metric_test_score": { + "earned": 1, + "total": 1 + }, + "metric_test_maturity": 3, + "metric_test_status": "pass" + } + }, + "test_status": "pass", + "score": { + "earned": 2, + "total": 2 + }, + "maturity": 3 + }, + { + "id": 13, + "metric_identifier": "FsF-I1-01M", + "metric_name": "Metadata is represented using a formal knowledge representation language.", + "metric_tests": { + "FsF-I1-01M-1": { + "metric_test_name": "Parsable, structured metadata (JSON-LD, RDFa) is embedded in the landing page XHTML\/HTML code", + "metric_test_requirements": [ + { + "modality": "any", + "required": { + "name": [ + "RDF", + "JSON-LD", + "RDFa" + ] + }, + "tested_on": null, + "comment": null, + "target": "http:\/\/f-uji.net\/vocab\/metadata\/format" + }, + { + "modality": "any", + "required": { + "name": [ + "meta_tag", + "microdata", + "rdfa", + "json_in_html" + ] + }, + "tested_on": null, + "comment": null, + "target": "http:\/\/f-uji.net\/vocab\/metadata\/offering_method" + } + ], + "metric_test_score": { + "earned": 2, + "total": 2 + }, + "metric_test_maturity": 2, + "metric_test_status": "pass" + }, + "FsF-I1-01M-2": { + "metric_test_name": "Parsable, structured metadata (RDF, JSON-LD) is accessible through content negotiation, typed links or sparql endpoint", + "metric_test_requirements": [ + { + "modality": "any", + "required": { + "name": [ + "RDF", 
+ "JSON-LD", + "RDFa" + ] + }, + "tested_on": null, + "comment": null, + "target": "http:\/\/f-uji.net\/vocab\/metadata\/format" + }, + { + "modality": "any", + "required": { + "name": [ + "content_negotiation" + ] + }, + "tested_on": null, + "comment": null, + "target": "http:\/\/f-uji.net\/vocab\/metadata\/offering_method" + }, + { + "modality": "any", + "required": { + "name": [ + "sparql" + ] + }, + "tested_on": null, + "comment": null, + "target": "http:\/\/f-uji.net\/vocab\/metadata\/exchange_service" + } + ], + "metric_test_score": { + "earned": 0, + "total": 2 + }, + "metric_test_maturity": 0, + "metric_test_status": "fail" + } + }, + "test_status": "fail", + "score": { + "earned": 2, + "total": 2 + }, + "maturity": 2, + "output": [ + { + "serialization_format": "JSON-LD", + "source": "structured_data", + "is_metadata_found": true + }, + { + "serialization_format": "RDFa", + "source": "structured_data", + "is_metadata_found": true + } + ], + "test_debug": [ + "INFO: Check of structured data (RDF serialization) embedded in the data page", + "INFO: JSON-LD (schema.org) serialization found in the data page - JSON-LD", + "INFO: RDFa like (OpenGraph) serialization found in the data page - RDFa", + "SUCCESS: Found structured data (RDF serialization) in the data page", + "INFO: Check if RDF-based typed link included", + "INFO: NO RDF-based typed link found", + "INFO: Check if RDF metadata available through content negotiation", + "INFO: NO RDF metadata available through content negotiation", + "INFO: NO SPARQL endpoint found through re3data based on the object URI provided" + ] + }, + { + "id": 14, + "metric_identifier": "FsF-I2-01M", + "metric_name": "Metadata uses registered semantic resources", + "metric_tests": { + "FsF-I2-01M-2": { + "metric_test_name": "Metadata uses terms from registered vocabularies that are identified by their namespaces", + "metric_test_requirements": [ + { + "modality": "any", + "required": null, + "tested_on": null, + "comment": 
"Semantic resources listed here are registered or indexed", + "target": "http:\/\/f-uji.net\/vocab\/semantic_resource" + } + ], + "metric_test_score": { + "earned": 0, + "total": 2 + }, + "metric_test_maturity": 0, + "metric_test_status": "fail" + } + }, + "test_status": "fail", + "score": { + "earned": 0, + "total": 2 + }, + "maturity": 0, + "output": [], + "test_debug": [ + "INFO: Removing default namespaces from 10 vocabulary namespaces found in structured metadata", + "INFO: Default vocabulary namespace(s) excluded -: ['https:\/\/schema.org', 'http:\/\/schema.org', 'http:\/\/schema.org', 'http:\/\/ogp.me\/ns', 'https:\/\/schema.org', 'http:\/\/www.w3.org\/1999\/02\/22-rdf-syntax-ns', 'http:\/\/purl.org\/dc\/elements\/1.1']", + "INFO: Removing default namespaces from 1 vocabulary namespaces extracted from links found in metadata", + "INFO: Default vocabulary namespace(s) excluded -: ['http:\/\/schema.org']", + "INFO: Check if known namespace(s) are used in structured metadata (RDF, XML) which exist(s) in a LOD registry -: ['https:\/\/doi.org\/10.5072', 'https:\/\/creativecommons.org\/licenses\/by\/4.0', 'https:\/\/sandbox.zenodo.org\/records']", + "WARNING: NO known vocabulary namespace URI is found which is listed in the LOD registry" + ] + }, + { + "id": 15, + "metric_identifier": "FsF-I3-01M", + "metric_name": "Metadata includes qualified references between the data and its related entities.", + "metric_tests": { + "FsF-I3-01M-1": { + "metric_test_name": "Related resources are referenced in plain text within appropriate metadata properties indicating the relation type", + "metric_test_requirements": [ + { + "modality": "any", + "required": null, + "tested_on": "http:\/\/f-uji.net\/vocab\/metadata\/property\/related_resources", + "comment": "The presence of a (typed, default = related) related resource is checked which is expressed as plain text", + "target": "http:\/\/f-uji.net\/vocab\/relation_type" + } + ], + "metric_test_score": { + "earned": 0, + "total": 
2 + }, + "metric_test_maturity": 0, + "metric_test_status": "fail" + }, + "FsF-I3-01M-2": { + "metric_test_name": "Related resources are referenced by machine readable links or identifiers within appropriate metadata properties indicating the relation type", + "metric_test_requirements": [ + { + "modality": null, + "required": null, + "tested_on": null, + "comment": "same as above but relations have to be machine readable\/actionable", + "target": null + } + ], + "metric_test_score": { + "earned": 0, + "total": 2 + }, + "metric_test_maturity": 0, + "metric_test_status": "fail" + } + }, + "test_status": "fail", + "score": { + "earned": 0, + "total": 2 + }, + "maturity": 0, + "output": [], + "test_debug": [ + "INFO: No related resource(s) found in Dublin Core metadata", + "WARNING: Could not identify qualified related resources in metadata" + ] + }, + { + "id": 16, + "metric_identifier": "FsF-R1-01M", + "metric_name": "Metadata specifies the content of the data.", + "metric_tests": { + "FsF-R1-01M-1": { + "metric_test_name": "Minimum information (resource type) about the available data content is specified in the metadata", + "metric_test_requirements": [], + "metric_test_score": { + "earned": 1, + "total": 1 + }, + "metric_test_maturity": 1, + "metric_test_status": "pass" + }, + "FsF-R1-01M-2": { + "metric_test_name": "Information on the manner and form (file size and type or service (API) endpoint and protocol) in which data is delivered is provided", + "metric_test_requirements": [], + "metric_test_score": { + "earned": 1, + "total": 1 + }, + "metric_test_maturity": 3, + "metric_test_status": "pass" + }, + "FsF-R1-01M-3": { + "metric_test_name": "Measured variables or observation types are specified in metadata", + "metric_test_requirements": [ + { + "modality": null, + "required": null, + "tested_on": null, + "comment": "test is not scored", + "target": null + } + ], + "metric_test_score": { + "earned": 0, + "total": 0 + }, + "metric_test_maturity": 0, + 
"metric_test_status": "fail" + } + }, + "test_status": "pass", + "score": { + "earned": 2, + "total": 2 + }, + "maturity": 3, + "output": { + "object_type": "['SoftwareSourceCode', 'http:\/\/schema.org\/WebPage']", + "data_content_descriptor": [ + { + "descriptor": "file size", + "descriptor_value": 6680000, + "matches_content": false + }, + { + "descriptor": "file type", + "descriptor_value": "application\/zip", + "matches_content": true + } + ] + }, + "test_debug": [ + "INFO: File info about exactly one object found for which no size is given but since size at object level is given, will take this for file level testing", + "SUCCESS: Valid resource type (e.g. subtype of schema.org\/CreativeWork, DCMI Type or DataCite resourceType) specified -: ['softwaresourcecode', 'webpage']", + "ERROR: The evaluated resource does not identify itself as a \u201cdataset\u201d but as ['softwaresourcecode', 'webpage'], so F-UJI may not be the right tool for this type of resource", + "SUCCESS: Found file size and type specified in metadata for -: https:\/\/sandbox.zenodo.org\/records\/502989\/files\/marirenab\/fair-hackathon_group2-v1.1.zip", + "INFO: NO info about data service endpoint available in given metadata for -: https:\/\/sandbox.zenodo.org\/records\/502989\/files\/marirenab\/fair-hackathon_group2-v1.1.zip", + "INFO: Since file was truncated will rely on content size given in HTTP header -: 7008524", + "WARNING: Could not verify content size from downloaded file -: (expected: 6680000.0, found: 7008524)", + "INFO: Sucessfully verified content type from downloaded file -: (expected: application\/zip, found: via tika ['application\/zip', 'text\/x-web-markdown', 'text\/csv', 'application\/json', 'text\/plain', 'text\/web-markdown'] or via header application\/octet-stream)" + ] + }, + { + "id": 17, + "metric_identifier": "FsF-R1.1-01M", + "metric_name": "Metadata includes license information under which data can be reused.", + "metric_tests": { + "FsF-R1.1-01M-1": { + 
"metric_test_name": "Licence information is given in an appropriate metadata element", + "metric_test_requirements": [ + { + "modality": "all", + "required": { + "name": [ + "license" + ] + }, + "tested_on": "https:\/\/f-uji.net\/vocab\/metadata\/property", + "comment": null, + "target": "https:\/\/f-uji.net\/vocab\/metadata\/property" + } + ], + "metric_test_score": { + "earned": 1, + "total": 1 + }, + "metric_test_maturity": 3, + "metric_test_status": "pass" + } + }, + "test_status": "pass", + "score": { + "earned": 1, + "total": 1 + }, + "maturity": 3, + "output": [ + { + "license": "https:\/\/creativecommons.org\/licenses\/by\/4.0\/legalcode", + "osi_approved": true, + "details_url": "https:\/\/creativecommons.org\/licenses\/by\/4.0\/legalcode" + } + ], + "test_debug": [ + "INFO: Found CreativeCommons license -: https:\/\/creativecommons.org\/licenses\/by\/4.0\/legalcode", + "SUCCESS: Found SPDX license representation (spdx url, osi_approved)", + "SUCCESS: Found licence information in metadata" + ] + }, + { + "id": 18, + "metric_identifier": "FsF-R1.2-01M", + "metric_name": "Metadata includes provenance information about data creation or generation.", + "metric_tests": { + "FsF-R1.2-01M-1": { + "metric_test_name": "Metadata contains elements which hold provenance information which can be mapped to PROV based on PROV-DC.", + "metric_test_requirements": [ + { + "modality": "any", + "required": { + "name": [ + "contributor", + "creator-", + "publisher", + "right_holder", + "created_date", + "publication_date", + "accepted_date", + "submitted_date", + "modified_date", + "hasFormat", + "isFormatOf", + "isVersionOf", + "isNewVersionOf", + "isReferencedBy", + "isReplacedBy", + "References", + "IsDerivedFrom", + "isBasedOn", + "hasVersion", + "Obsoletes", + "Replaces" + ] + }, + "tested_on": "https:\/\/f-uji.net\/vocab\/metadata\/property", + "comment": "PROV-O mapping based on https:\/\/www.w3.org\/TR\/prov-dc\/", + "target": 
"https:\/\/f-uji.net\/vocab\/metadata\/property" + } + ], + "metric_test_score": { + "earned": 1, + "total": 1 + }, + "metric_test_maturity": 2, + "metric_test_status": "pass" + }, + "FsF-R1.2-01M-2": { + "metric_test_name": "Metadata contains elements which hold provenance information using formal provenance ontologies (PROV, PAV).", + "metric_test_requirements": [ + { + "modality": "any", + "required": { + "uri": [ + "http:\/\/www.w3.org\/ns\/prov", + "http:\/\/purl.org\/pav" + ] + }, + "tested_on": null, + "comment": null, + "target": "https:\/\/f-uji.net\/vocab\/semantic_resource" + } + ], + "metric_test_score": { + "earned": 0, + "total": 1 + }, + "metric_test_maturity": 0, + "metric_test_status": "fail" + } + }, + "test_status": "pass", + "score": { + "earned": 1, + "total": 1 + }, + "maturity": 2, + "output": { + "provenance_metadata_included": { + "is_available": true, + "provenance_metadata": [ + { + "prov_o_mapping": "prov:generatedAtTime", + "metadata_element": "publication_date", + "metadata_value": "2026-05-21" + }, + { + "prov_o_mapping": "prov:wasAttributedTo", + "metadata_element": "publisher", + "metadata_value": [ + "Zenodo" + ] + }, + { + "prov_o_mapping": "prov:wasAttributedTo", + "metadata_element": "creator", + "metadata_value": [ + "Marirena Bafaloukou", + "Mateus Harrington" + ] + } + ] + }, + "structured_provenance_available": { + "is_available": false, + "provenance_metadata": [] + } + }, + "test_debug": [ + "INFO: Check if provenance information is available in descriptive metadata", + "INFO: Check if provenance information is available in metadata about related resources", + "WARNING: No provenance information found in metadata about related resources", + "SUCCESS: Found data creation-related provenance information", + "INFO: Check if provenance specific namespaces are listed in metadata", + "WARNING: Formal provenance metadata is unavailable" + ] + }, + { + "id": 19, + "metric_identifier": "FsF-R1.3-01M", + "metric_name": "Metadata 
follows a standard recommended by the target research community of the data.", + "metric_tests": { + "FsF-R1.3-01M-1": { + "metric_test_name": "Community specific metadata standard is detected using namespaces or schemas found in provided metadata", + "metric_test_requirements": [ + { + "modality": "any except", + "required": { + "field_of_science": [ + "science", + "generic" + ] + }, + "tested_on": null, + "comment": "test performed on namespaces or schemas found in exposed metadata", + "target": "https:\/\/f-uji.net\/vocab\/metadata\/standards" + } + ], + "metric_test_score": { + "earned": 0, + "total": 1 + }, + "metric_test_maturity": 0, + "metric_test_status": "fail" + }, + "FsF-R1.3-01M-3": { + "metric_test_name": "Multidisciplinary but community endorsed metadata (RDA Metadata Standards Catalog, fairsharing) standard is detected by namespace", + "metric_test_requirements": [ + { + "modality": "any", + "required": { + "field_of_science": [ + "science", + "generic" + ], + "source": [ + "rd-alliance.org", + "fairsharing.org" + ] + }, + "tested_on": null, + "comment": null, + "target": "https:\/\/f-uji.net\/vocab\/metadata\/standards" + } + ], + "metric_test_score": { + "earned": 1, + "total": 1 + }, + "metric_test_maturity": 1, + "metric_test_status": "pass" + } + }, + "test_status": "pass", + "score": { + "earned": 1, + "total": 1 + }, + "maturity": 1, + "output": [ + { + "metadata_standard": "Schema.org", + "url": "https:\/\/schema.org\/", + "subject_areas": [ + "sciences" + ], + "type": "generic", + "source": [ + "https:\/\/doi.org\/10.25504\/FAIRsharing.hzdzq8", + "https:\/\/rdamsc.bath.ac.uk\/msc\/m101" + ] + }, + { + "metadata_standard": "Schema.org", + "url": "http:\/\/schema.org", + "subject_areas": [ + "sciences" + ], + "type": "generic", + "source": [ + "https:\/\/doi.org\/10.25504\/FAIRsharing.hzdzq8", + "https:\/\/rdamsc.bath.ac.uk\/msc\/m101" + ] + }, + { + "metadata_standard": "Schema.org", + "url": "http:\/\/schema.org\/", + "subject_areas": [ + 
"sciences" + ], + "type": "generic", + "source": [ + "https:\/\/doi.org\/10.25504\/FAIRsharing.hzdzq8", + "https:\/\/rdamsc.bath.ac.uk\/msc\/m101" + ] + }, + { + "metadata_standard": "Schema.org", + "url": "https:\/\/schema.org", + "subject_areas": [ + "sciences" + ], + "type": "generic", + "source": [ + "https:\/\/doi.org\/10.25504\/FAIRsharing.hzdzq8", + "https:\/\/rdamsc.bath.ac.uk\/msc\/m101" + ] + }, + { + "metadata_standard": "Dublin Core", + "url": "http:\/\/purl.org\/dc\/elements\/1.1\/", + "subject_areas": [ + "sciences" + ], + "type": "generic", + "source": [ + "https:\/\/rdamsc.bath.ac.uk\/msc\/m15", + "https:\/\/doi.org\/10.25504\/FAIRsharing.3nx7t", + "http:\/\/www.dcc.ac.uk\/resources\/metadata-standards\/dublin-core" + ] + } + ], + "test_debug": [ + "INFO: re3data\/datacite client id -: None", + "INFO: Namespaces included in the metadata -: ['https:\/\/schema.org\/', 'https:\/\/doi.org\/10.5072', 'http:\/\/schema.org', 'http:\/\/schema.org\/', 'http:\/\/ogp.me\/ns#', 'https:\/\/schema.org', 'http:\/\/www.w3.org\/1999\/02\/22-rdf-syntax-ns#', 'https:\/\/creativecommons.org\/licenses\/by\/4.0', 'https:\/\/sandbox.zenodo.org\/records', 'http:\/\/purl.org\/dc\/elements\/1.1\/']", + "INFO: Found non-disciplinary standard (but RDA listed) -: via ns: Schema.org - https:\/\/schema.org\/", + "INFO: Found non-disciplinary standard (but RDA listed) -: via ns: Schema.org - http:\/\/schema.org", + "INFO: Found non-disciplinary standard (but RDA listed) -: via ns: Schema.org - http:\/\/schema.org\/", + "INFO: Found disciplinary standard -: via ns : The Open Graph protocol metadata format - http:\/\/ogp.me\/ns#", + "INFO: Found non-disciplinary standard (but RDA listed) -: via ns: Schema.org - https:\/\/schema.org", + "INFO: Found non-disciplinary standard (but RDA listed) -: via ns: Dublin Core - http:\/\/purl.org\/dc\/elements\/1.1\/", + "INFO: Retrieving API and Standards", + "INFO: No Datacite client id found, therefore skipping re3data metadata retrieval", + 
"INFO: Found non-disciplinary standards (but RDA listed) using namespaces or schemas in provided metadata" + ] + }, + { + "id": 20, + "metric_identifier": "FsF-R1.3-02D", + "metric_name": "Data is available in a file format recommended by the target research community.", + "metric_tests": { + "FsF-R1.3-02D-1": { + "metric_test_name": "Data is available in a file format recommended by the research community (long term file formats, open file formats or scientific file format)", + "metric_test_requirements": [ + { + "modality": "any", + "required": null, + "tested_on": null, + "comment": "format has to be tagged as open, long term or scientific, including all text based formats (though some may not be listed here)", + "target": "https:\/\/f-uji.net\/vocab\/data\/format" + } + ], + "metric_test_score": { + "earned": 1, + "total": 1 + }, + "metric_test_maturity": 3, + "metric_test_status": "pass" + } + }, + "test_status": "pass", + "score": { + "earned": 1, + "total": 1 + }, + "maturity": 3, + "output": [ + { + "file_uri": "https:\/\/sandbox.zenodo.org\/records\/502989\/files\/marirenab\/fair-hackathon_group2-v1.1.zip", + "mime_type": "text\/x-web-markdown", + "is_preferred_format": true, + "preference_reason": [ + "open format", + "long term format", + "generic science format" + ], + "subject_areas": [ + "General" + ] + }, + { + "file_uri": "https:\/\/sandbox.zenodo.org\/records\/502989\/files\/marirenab\/fair-hackathon_group2-v1.1.zip", + "mime_type": "text\/csv", + "is_preferred_format": true, + "preference_reason": [ + "open format", + "long term format", + "generic science format" + ], + "subject_areas": [ + "General" + ] + }, + { + "file_uri": "https:\/\/sandbox.zenodo.org\/records\/502989\/files\/marirenab\/fair-hackathon_group2-v1.1.zip", + "mime_type": "application\/json", + "is_preferred_format": true, + "preference_reason": [ + "open format", + "long term format", + "generic science format" + ], + "subject_areas": [ + "General" + ] + }, + { + "file_uri": 
"https:\/\/sandbox.zenodo.org\/records\/502989\/files\/marirenab\/fair-hackathon_group2-v1.1.zip", + "mime_type": "text\/plain", + "is_preferred_format": true, + "preference_reason": [ + "open format", + "long term format", + "generic science format" + ], + "subject_areas": [ + "General" + ] + }, + { + "file_uri": "https:\/\/sandbox.zenodo.org\/records\/502989\/files\/marirenab\/fair-hackathon_group2-v1.1.zip", + "mime_type": "text\/web-markdown", + "is_preferred_format": true, + "preference_reason": [ + "open format", + "long term format", + "generic science format" + ], + "subject_areas": [ + "General" + ] + } + ], + "test_debug": [ + "INFO: Data content identifier provided -: ['https:\/\/sandbox.zenodo.org\/records\/502989\/files\/marirenab\/fair-hackathon_group2-v1.1.zip']", + "INFO: Archiving\/compression format specified -: application\/zip", + "INFO: Extracted file formats for selected data object (see FsF-R1-01MD) -: ['text\/x-web-markdown', 'text\/csv', 'application\/json', 'text\/plain', 'text\/web-markdown']", + "SUCCESS: Could identify a file format commonly used by the scientific community -:text\/x-web-markdown", + "SUCCESS: Could identify a file format commonly used by the scientific community -:text\/csv", + "SUCCESS: Could identify a file format commonly used by the scientific community -:application\/json", + "SUCCESS: Could identify a file format commonly used by the scientific community -:text\/plain", + "SUCCESS: Could identify a file format commonly used by the scientific community -:text\/web-markdown" + ] + } + ], + "harvested_metadata": [ + { + "method": "json_in_html", + "url": "https:\/\/sandbox.zenodo.org\/records\/502989", + "format": "json-ld", + "schema": "http:\/\/schema.org", + "namespaces": [ + "http:\/\/schema.org", + "https:\/\/schema.org\/", + "https:\/\/doi.org\/10.5072", + "http:\/\/schema.org\/", + "https:\/\/schema.org", + "http:\/\/www.w3.org\/1999\/02\/22-rdf-syntax-ns#", + 
"https:\/\/creativecommons.org\/licenses\/by\/4.0", + "https:\/\/sandbox.zenodo.org\/records", + "http:\/\/schema.org" + ], + "metadata": { + "object_identifier": [ + "https:\/\/doi.org\/10.5072\/zenodo.502989", + "https:\/\/sandbox.zenodo.org\/records\/502989" + ], + "title": "marirenab\/fair-hackathon_group2: v1.1", + "summary": "FAIR-data hackathon: iteratively destroy then repair an open dataset, scored by F-UJI", + "publication_date": "2026-05-21", + "publisher": [ + "Zenodo" + ], + "creator": [ + "Marirena Bafaloukou", + "Mateus Harrington" + ], + "license": [ + "https:\/\/creativecommons.org\/licenses\/by\/4.0\/legalcode" + ], + "object_type": [ + "SoftwareSourceCode" + ], + "object_size": "6.68 MB" + } + }, + { + "method": "meta_tag", + "url": "https:\/\/sandbox.zenodo.org\/records\/502989", + "format": "xhtml", + "schema": "http:\/\/purl.org\/dc\/elements\/1.1\/", + "namespaces": [ + "http:\/\/purl.org\/dc\/elements\/1.1\/", + "http:\/\/purl.org\/dc\/elements\/1.1\/" + ], + "metadata": { + "summary": "FAIR-data hackathon: iteratively destroy then repair an open dataset, scored by F-UJI" + } + }, + { + "method": "microdata", + "url": "https:\/\/sandbox.zenodo.org\/records\/502989", + "format": "microdata", + "schema": "http:\/\/www.w3.org\/TR\/microdata", + "namespaces": [ + "http:\/\/www.w3.org\/TR\/microdata", + "http:\/\/schema.org\/" + ], + "metadata": { + "object_type": [ + "http:\/\/schema.org\/WebPage" + ] + } + }, + { + "method": "meta_tag", + "url": "https:\/\/sandbox.zenodo.org\/records\/502989", + "format": "html", + "schema": "highwire_eprints", + "namespaces": [ + "highwire_eprints" + ], + "metadata": { + "title": "marirenab\/fair-hackathon_group2: v1.1", + "object_identifier": [ + "10.5072\/zenodo.502989" + ], + "summary": "https:\/\/sandbox.zenodo.org\/records\/502989" + } + }, + { + "method": "rdfa", + "url": "https:\/\/sandbox.zenodo.org\/records\/502989", + "format": "rdfa", + "schema": "https:\/\/ogp.me\/", + "namespaces": [ + 
"https:\/\/ogp.me\/", + "http:\/\/ogp.me\/ns#" + ], + "metadata": { + "title": "marirenab\/fair-hackathon_group2: v1.1", + "object_identifier": [ + "https:\/\/sandbox.zenodo.org\/records\/502989" + ], + "summary": "FAIR-data hackathon: iteratively destroy then repair an open dataset, scored by F-UJI", + "publisher": "Zenodo" + } + } + ] +} diff --git a/dataset/LICENSE b/dataset/LICENSE new file mode 100644 index 0000000..da6ab6c --- /dev/null +++ b/dataset/LICENSE @@ -0,0 +1,396 @@ +Attribution 4.0 International + +======================================================================= + +Creative Commons Corporation ("Creative Commons") is not a law firm and +does not provide legal services or legal advice. Distribution of +Creative Commons public licenses does not create a lawyer-client or +other relationship. Creative Commons makes its licenses and related +information available on an "as-is" basis. Creative Commons gives no +warranties regarding its licenses, any material licensed under their +terms and conditions, or any related information. Creative Commons +disclaims all liability for damages resulting from their use to the +fullest extent possible. + +Using Creative Commons Public Licenses + +Creative Commons public licenses provide a standard set of terms and +conditions that creators and other rights holders may use to share +original works of authorship and other material subject to copyright +and certain other rights specified in the public license below. The +following considerations are for informational purposes only, are not +exhaustive, and do not form part of our licenses. + + Considerations for licensors: Our public licenses are + intended for use by those authorized to give the public + permission to use material in ways otherwise restricted by + copyright and certain other rights. Our licenses are + irrevocable. Licensors should read and understand the terms + and conditions of the license they choose before applying it. 
+ Licensors should also secure all rights necessary before + applying our licenses so that the public can reuse the + material as expected. Licensors should clearly mark any + material not subject to the license. This includes other CC- + licensed material, or material used under an exception or + limitation to copyright. More considerations for licensors: + wiki.creativecommons.org/Considerations_for_licensors + + Considerations for the public: By using one of our public + licenses, a licensor grants the public permission to use the + licensed material under specified terms and conditions. If + the licensor's permission is not necessary for any reason--for + example, because of any applicable exception or limitation to + copyright--then that use is not regulated by the license. Our + licenses grant only permissions under copyright and certain + other rights that a licensor has authority to grant. Use of + the licensed material may still be restricted for other + reasons, including because others have copyright or other + rights in the material. A licensor may make special requests, + such as asking that all changes be marked or described. + Although not required by our licenses, you are encouraged to + respect those requests where reasonable. More considerations + for the public: + wiki.creativecommons.org/Considerations_for_licensees + +======================================================================= + +Creative Commons Attribution 4.0 International Public License + +By exercising the Licensed Rights (defined below), You accept and agree +to be bound by the terms and conditions of this Creative Commons +Attribution 4.0 International Public License ("Public License"). 
To the +extent this Public License may be interpreted as a contract, You are +granted the Licensed Rights in consideration of Your acceptance of +these terms and conditions, and the Licensor grants You such rights in +consideration of benefits the Licensor receives from making the +Licensed Material available under these terms and conditions. + + +Section 1 -- Definitions. + + a. Adapted Material means material subject to Copyright and Similar + Rights that is derived from or based upon the Licensed Material + and in which the Licensed Material is translated, altered, + arranged, transformed, or otherwise modified in a manner requiring + permission under the Copyright and Similar Rights held by the + Licensor. For purposes of this Public License, where the Licensed + Material is a musical work, performance, or sound recording, + Adapted Material is always produced where the Licensed Material is + synched in timed relation with a moving image. + + b. Adapter's License means the license You apply to Your Copyright + and Similar Rights in Your contributions to Adapted Material in + accordance with the terms and conditions of this Public License. + + c. Copyright and Similar Rights means copyright and/or similar rights + closely related to copyright including, without limitation, + performance, broadcast, sound recording, and Sui Generis Database + Rights, without regard to how the rights are labeled or + categorized. For purposes of this Public License, the rights + specified in Section 2(b)(1)-(2) are not Copyright and Similar + Rights. + + d. Effective Technological Measures means those measures that, in the + absence of proper authority, may not be circumvented under laws + fulfilling obligations under Article 11 of the WIPO Copyright + Treaty adopted on December 20, 1996, and/or similar international + agreements. + + e. 
Exceptions and Limitations means fair use, fair dealing, and/or + any other exception or limitation to Copyright and Similar Rights + that applies to Your use of the Licensed Material. + + f. Licensed Material means the artistic or literary work, database, + or other material to which the Licensor applied this Public + License. + + g. Licensed Rights means the rights granted to You subject to the + terms and conditions of this Public License, which are limited to + all Copyright and Similar Rights that apply to Your use of the + Licensed Material and that the Licensor has authority to license. + + h. Licensor means the individual(s) or entity(ies) granting rights + under this Public License. + + i. Share means to provide material to the public by any means or + process that requires permission under the Licensed Rights, such + as reproduction, public display, public performance, distribution, + dissemination, communication, or importation, and to make material + available to the public including in ways that members of the + public may access the material from a place and at a time + individually chosen by them. + + j. Sui Generis Database Rights means rights other than copyright + resulting from Directive 96/9/EC of the European Parliament and of + the Council of 11 March 1996 on the legal protection of databases, + as amended and/or succeeded, as well as other essentially + equivalent rights anywhere in the world. + + k. You means the individual or entity exercising the Licensed Rights + under this Public License. Your has a corresponding meaning. + + +Section 2 -- Scope. + + a. License grant. + + 1. Subject to the terms and conditions of this Public License, + the Licensor hereby grants You a worldwide, royalty-free, + non-sublicensable, non-exclusive, irrevocable license to + exercise the Licensed Rights in the Licensed Material to: + + a. reproduce and Share the Licensed Material, in whole or + in part; and + + b. 
produce, reproduce, and Share Adapted Material. + + 2. Exceptions and Limitations. For the avoidance of doubt, where + Exceptions and Limitations apply to Your use, this Public + License does not apply, and You do not need to comply with + its terms and conditions. + + 3. Term. The term of this Public License is specified in Section + 6(a). + + 4. Media and formats; technical modifications allowed. The + Licensor authorizes You to exercise the Licensed Rights in + all media and formats whether now known or hereafter created, + and to make technical modifications necessary to do so. The + Licensor waives and/or agrees not to assert any right or + authority to forbid You from making technical modifications + necessary to exercise the Licensed Rights, including + technical modifications necessary to circumvent Effective + Technological Measures. For purposes of this Public License, + simply making modifications authorized by this Section 2(a) + (4) never produces Adapted Material. + + 5. Downstream recipients. + + a. Offer from the Licensor -- Licensed Material. Every + recipient of the Licensed Material automatically + receives an offer from the Licensor to exercise the + Licensed Rights under the terms and conditions of this + Public License. + + b. No downstream restrictions. You may not offer or impose + any additional or different terms or conditions on, or + apply any Effective Technological Measures to, the + Licensed Material if doing so restricts exercise of the + Licensed Rights by any recipient of the Licensed + Material. + + 6. No endorsement. Nothing in this Public License constitutes or + may be construed as permission to assert or imply that You + are, or that Your use of the Licensed Material is, connected + with, or sponsored, endorsed, or granted official status by, + the Licensor or others designated to receive attribution as + provided in Section 3(a)(1)(A)(i). + + b. Other rights. + + 1. 
Moral rights, such as the right of integrity, are not + licensed under this Public License, nor are publicity, + privacy, and/or other similar personality rights; however, to + the extent possible, the Licensor waives and/or agrees not to + assert any such rights held by the Licensor to the limited + extent necessary to allow You to exercise the Licensed + Rights, but not otherwise. + + 2. Patent and trademark rights are not licensed under this + Public License. + + 3. To the extent possible, the Licensor waives any right to + collect royalties from You for the exercise of the Licensed + Rights, whether directly or through a collecting society + under any voluntary or waivable statutory or compulsory + licensing scheme. In all other cases the Licensor expressly + reserves any right to collect such royalties. + + +Section 3 -- License Conditions. + +Your exercise of the Licensed Rights is expressly made subject to the +following conditions. + + a. Attribution. + + 1. If You Share the Licensed Material (including in modified + form), You must: + + a. retain the following if it is supplied by the Licensor + with the Licensed Material: + + i. identification of the creator(s) of the Licensed + Material and any others designated to receive + attribution, in any reasonable manner requested by + the Licensor (including by pseudonym if + designated); + + ii. a copyright notice; + + iii. a notice that refers to this Public License; + + iv. a notice that refers to the disclaimer of + warranties; + + v. a URI or hyperlink to the Licensed Material to the + extent reasonably practicable; + + b. indicate if You modified the Licensed Material and + retain an indication of any previous modifications; and + + c. indicate the Licensed Material is licensed under this + Public License, and include the text of, or the URI or + hyperlink to, this Public License. + + 2. 
You may satisfy the conditions in Section 3(a)(1) in any + reasonable manner based on the medium, means, and context in + which You Share the Licensed Material. For example, it may be + reasonable to satisfy the conditions by providing a URI or + hyperlink to a resource that includes the required + information. + + 3. If requested by the Licensor, You must remove any of the + information required by Section 3(a)(1)(A) to the extent + reasonably practicable. + + 4. If You Share Adapted Material You produce, the Adapter's + License You apply must not prevent recipients of the Adapted + Material from complying with this Public License. + + +Section 4 -- Sui Generis Database Rights. + +Where the Licensed Rights include Sui Generis Database Rights that +apply to Your use of the Licensed Material: + + a. for the avoidance of doubt, Section 2(a)(1) grants You the right + to extract, reuse, reproduce, and Share all or a substantial + portion of the contents of the database; + + b. if You include all or a substantial portion of the database + contents in a database in which You have Sui Generis Database + Rights, then the database in which You have Sui Generis Database + Rights (but not its individual contents) is Adapted Material; and + + c. You must comply with the conditions in Section 3(a) if You Share + all or a substantial portion of the contents of the database. + +For the avoidance of doubt, this Section 4 supplements and does not +replace Your obligations under this Public License where the Licensed +Rights include other Copyright and Similar Rights. + + +Section 5 -- Disclaimer of Warranties and Limitation of Liability. + + a. UNLESS OTHERWISE SEPARATELY UNDERTAKEN BY THE LICENSOR, TO THE + EXTENT POSSIBLE, THE LICENSOR OFFERS THE LICENSED MATERIAL AS-IS + AND AS-AVAILABLE, AND MAKES NO REPRESENTATIONS OR WARRANTIES OF + ANY KIND CONCERNING THE LICENSED MATERIAL, WHETHER EXPRESS, + IMPLIED, STATUTORY, OR OTHER. 
THIS INCLUDES, WITHOUT LIMITATION, + WARRANTIES OF TITLE, MERCHANTABILITY, FITNESS FOR A PARTICULAR + PURPOSE, NON-INFRINGEMENT, ABSENCE OF LATENT OR OTHER DEFECTS, + ACCURACY, OR THE PRESENCE OR ABSENCE OF ERRORS, WHETHER OR NOT + KNOWN OR DISCOVERABLE. WHERE DISCLAIMERS OF WARRANTIES ARE NOT + ALLOWED IN FULL OR IN PART, THIS DISCLAIMER MAY NOT APPLY TO YOU. + + b. TO THE EXTENT POSSIBLE, IN NO EVENT WILL THE LICENSOR BE LIABLE + TO YOU ON ANY LEGAL THEORY (INCLUDING, WITHOUT LIMITATION, + NEGLIGENCE) OR OTHERWISE FOR ANY DIRECT, SPECIAL, INDIRECT, + INCIDENTAL, CONSEQUENTIAL, PUNITIVE, EXEMPLARY, OR OTHER LOSSES, + COSTS, EXPENSES, OR DAMAGES ARISING OUT OF THIS PUBLIC LICENSE OR + USE OF THE LICENSED MATERIAL, EVEN IF THE LICENSOR HAS BEEN + ADVISED OF THE POSSIBILITY OF SUCH LOSSES, COSTS, EXPENSES, OR + DAMAGES. WHERE A LIMITATION OF LIABILITY IS NOT ALLOWED IN FULL OR + IN PART, THIS LIMITATION MAY NOT APPLY TO YOU. + + c. The disclaimer of warranties and limitation of liability provided + above shall be interpreted in a manner that, to the extent + possible, most closely approximates an absolute disclaimer and + waiver of all liability. + + +Section 6 -- Term and Termination. + + a. This Public License applies for the term of the Copyright and + Similar Rights licensed here. However, if You fail to comply with + this Public License, then Your rights under this Public License + terminate automatically. + + b. Where Your right to use the Licensed Material has terminated under + Section 6(a), it reinstates: + + 1. automatically as of the date the violation is cured, provided + it is cured within 30 days of Your discovery of the + violation; or + + 2. upon express reinstatement by the Licensor. + + For the avoidance of doubt, this Section 6(b) does not affect any + right the Licensor may have to seek remedies for Your violations + of this Public License. + + c. 
For the avoidance of doubt, the Licensor may also offer the + Licensed Material under separate terms or conditions or stop + distributing the Licensed Material at any time; however, doing so + will not terminate this Public License. + + d. Sections 1, 5, 6, 7, and 8 survive termination of this Public + License. + + +Section 7 -- Other Terms and Conditions. + + a. The Licensor shall not be bound by any additional or different + terms or conditions communicated by You unless expressly agreed. + + b. Any arrangements, understandings, or agreements regarding the + Licensed Material not stated herein are separate from and + independent of the terms and conditions of this Public License. + + +Section 8 -- Interpretation. + + a. For the avoidance of doubt, this Public License does not, and + shall not be interpreted to, reduce, limit, restrict, or impose + conditions on any use of the Licensed Material that could lawfully + be made without permission under this Public License. + + b. To the extent possible, if any provision of this Public License is + deemed unenforceable, it shall be automatically reformed to the + minimum extent necessary to make it enforceable. If the provision + cannot be reformed, it shall be severed from this Public License + without affecting the enforceability of the remaining terms and + conditions. + + c. No term or condition of this Public License will be waived and no + failure to comply consented to unless expressly agreed to by the + Licensor. + + d. Nothing in this Public License constitutes or may be interpreted + as a limitation upon, or waiver of, any privileges and immunities + that apply to the Licensor or You, including from the legal + processes of any jurisdiction or authority. + + +======================================================================= + +Creative Commons is not a party to its public +licenses. 
Notwithstanding, Creative Commons may elect to apply one of +its public licenses to material it publishes and in those instances +will be considered the “Licensor.” The text of the Creative Commons +public licenses is dedicated to the public domain under the CC0 Public +Domain Dedication. Except for the limited purpose of indicating that +material is shared under a Creative Commons public license or as +otherwise permitted by the Creative Commons policies published at +creativecommons.org/policies, Creative Commons does not authorize the +use of the trademark "Creative Commons" or any other trademark or logo +of Creative Commons without its prior written consent including, +without limitation, in connection with any unauthorized modifications +to any of its public licenses or any other arrangements, +understandings, or agreements concerning use of licensed material. For +the avoidance of doubt, this paragraph does not form part of the +public licenses. + +Creative Commons may be contacted at creativecommons.org. + diff --git a/dataset/README.md b/dataset/README.md new file mode 100644 index 0000000..aca9eff --- /dev/null +++ b/dataset/README.md @@ -0,0 +1,71 @@ +# TIHM dataset + +This hosted copy contains the same tabular records as the reference `TIHM_Dataset` +package, exposed here with explicit `.csv` filenames and dataset-level +documentation so the files are easier to identify and reuse. + +## Provenance + +- Original dataset title: *TIHM: An open dataset for remote healthcare monitoring in dementia* +- Original DOI: https://doi.org/10.5281/zenodo.7622128 +- Coverage: 2019-04-01 to 2019-06-30 +- Resource type: tabular time-series dataset + +## Files + +| File | Rows | Columns | Description | +| --- | ---: | --- | --- | +| `data/Activity.csv` | 1,030,559 | `patient_id`, `location_name`, `date` | Room-level activity events per patient. | +| `data/Demographics.csv` | 56 | `patient_id`, `age`, `sex` | Patient sex and age band.
| +| `data/Labels.csv` | 608 | `patient_id`, `date`, `type` | Clinical labels such as agitation and blood pressure. | +| `data/Physiology.csv` | 17,679 | `patient_id`, `date`, `device_type`, `value`, `unit` | Physiology measurements including blood pressure, heart rate, and temperature. | +| `data/Sleep.csv` | 461,423 | `patient_id`, `date`, `state`, `heart_rate`, `respiratory_rate`, `snoring` | Sleep stage observations with associated vital signs. | + +## Column dictionary + +### Activity + +| Column | Type | Description | +| --- | --- | --- | +| `patient_id` | categorical | Participant hash code. | +| `location_name` | categorical | Room or sensor location, for example `Hallway`, `Lounge`, `Fridge Door`, `Bedroom`, or `Kitchen`. | +| `date` | datetime | Event timestamp from 2019-04-01 to 2019-06-30. | + +### Labels + +| Column | Type | Description | +| --- | --- | --- | +| `patient_id` | categorical | Participant hash code. | +| `date` | datetime | Label timestamp from 2019-04-04 to 2019-06-30. | +| `type` | categorical | Clinical label type, including `Agitation`, `Blood pressure`, and related observations. | + +### Physiology + +| Column | Type | Description | +| --- | --- | --- | +| `patient_id` | categorical | Participant hash code. | +| `date` | datetime | Measurement timestamp from 2019-04-01 to 2019-06-30. | +| `device_type` | categorical | Measurement source or modality, for example `Body Temperature`, `Heart rate`, or blood pressure devices. | +| `value` | float | Numeric measurement value. | +| `unit` | categorical | Measurement unit, for example `Cel`, `beats/min`, `%`, `kg`, or `mm[Hg]`. | + +### Sleep + +| Column | Type | Description | +| --- | --- | --- | +| `patient_id` | categorical | Participant hash code. | +| `date` | datetime | Sleep observation timestamp from 2019-04-01 to 2019-06-30. | +| `state` | categorical | Sleep state: `LIGHT`, `AWAKE`, `DEEP`, or `REM`. | +| `heart_rate` | float | Heart rate during the sleep observation. 
| +| `respiratory_rate` | float | Respiratory rate during the sleep observation. | +| `snoring` | boolean | Whether snoring was detected. | + +### Demographics + +| Column | Type | Description | +| --- | --- | --- | +| `patient_id` | categorical | Participant hash code. | +| `sex` | categorical | `Male` or `Female`. | +| `age` | categorical | Age band: `(70, 80]`, `(80, 90]`, or `(90, 110]`. | + + diff --git a/dataset/data/Activity.dat b/dataset/data/Activity.csv similarity index 100% rename from dataset/data/Activity.dat rename to dataset/data/Activity.csv diff --git a/dataset/data/Demographics.dat b/dataset/data/Demographics.csv similarity index 100% rename from dataset/data/Demographics.dat rename to dataset/data/Demographics.csv diff --git a/dataset/data/Labels.dat b/dataset/data/Labels.csv similarity index 100% rename from dataset/data/Labels.dat rename to dataset/data/Labels.csv diff --git a/dataset/data/Physiology.dat b/dataset/data/Physiology.csv similarity index 100% rename from dataset/data/Physiology.dat rename to dataset/data/Physiology.csv diff --git a/dataset/data/Sleep.dat b/dataset/data/Sleep.csv similarity index 100% rename from dataset/data/Sleep.dat rename to dataset/data/Sleep.csv diff --git a/dataset/index.html b/dataset/index.html index 1cfea08..32ef02a 100644 --- a/dataset/index.html +++ b/dataset/index.html @@ -2,7 +2,117 @@ -TIHM +TIHM: An open dataset for remote healthcare monitoring in dementia + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + +

TIHM: An open dataset for remote healthcare monitoring in dementia

@@ -15,14 +125,19 @@

TIHM: An open dataset for remote healthcare monitoring in dementia

TIHM is an open in-home remote-monitoring dataset for People Living with Dementia (PLWD), comprising per-patient time-series of activity, sleep, physiology, demographics and clinical labels collected between 2019-04-01 and 2019-06-30 by the UK DRI Care Research & Technology Centre at Imperial College London. This re-hosted copy is provided as a FAIR-by-design teaching dataset.

+

The hosted CSV files below preserve the same tabular content as the reference TIHM dataset while restoring meaningful filenames and dataset-level documentation for easier discovery and reuse.

+

Files

Provenance

diff --git a/dataset/metadata.jsonld b/dataset/metadata.jsonld new file mode 100644 index 0000000..24f9f7a --- /dev/null +++ b/dataset/metadata.jsonld @@ -0,0 +1,59 @@ +{ + "@context": { + "schema": "https://schema.org/", + "dcat": "http://www.w3.org/ns/dcat#", + "dcterms": "http://purl.org/dc/terms/", + "prov": "http://www.w3.org/ns/prov#", + "foaf": "http://xmlns.com/foaf/0.1/" + }, + "@id": "https://w3id.org/fair-hackathon/tihm/v1", + "@type": ["dcat:Dataset", "schema:Dataset"], + "dcterms:identifier": "https://w3id.org/fair-hackathon/tihm/v1", + "schema:identifier": [ + "https://w3id.org/fair-hackathon/tihm/v1", + "https://doi.org/10.5281/zenodo.7622128" + ], + "dcterms:title": "TIHM: An open dataset for remote healthcare monitoring in dementia", + "schema:name": "TIHM: An open dataset for remote healthcare monitoring in dementia", + "dcterms:description": "TIHM is an open in-home remote-monitoring dataset for People Living with Dementia (PLWD), comprising per-patient time-series of activity, sleep, physiology, demographics and clinical labels collected between 2019-04-01 and 2019-06-30 by the UK DRI Care Research & Technology Centre.", + "schema:description": "TIHM is an open in-home remote-monitoring dataset for People Living with Dementia (PLWD), comprising per-patient time-series of activity, sleep, physiology, demographics and clinical labels collected between 2019-04-01 and 2019-06-30 by the UK DRI Care Research & Technology Centre.", + "dcterms:issued": "2023-02-10", + "dcterms:modified": "2026-05-21", + "dcterms:language": "en", + "dcterms:publisher": { + "@type": "foaf:Organization", + "foaf:name": "UK DRI Care Research & Technology Centre, Imperial College London", + "foaf:homepage": "https://ukdri.ac.uk/centres/care-research-technology" + }, + "dcterms:creator": [ + {"@type":"foaf:Person","foaf:name":"Francesca Palermo"}, + {"@type":"foaf:Person","foaf:name":"Yu Chen"}, + {"@type":"foaf:Person","foaf:name":"Alexander Capstick"}, + 
{"@type":"foaf:Person","foaf:name":"Nan Fletcher-Lloyd"}, + {"@type":"foaf:Person","foaf:name":"Chloe Walsh"}, + {"@type":"foaf:Person","foaf:name":"Samaneh Kouchaki"}, + {"@type":"foaf:Person","foaf:name":"Jessica True"}, + {"@type":"foaf:Person","foaf:name":"Olga Balazikova"}, + {"@type":"foaf:Person","foaf:name":"Eyal Soreq"}, + {"@type":"foaf:Person","foaf:name":"Gregory Scott"}, + {"@type":"foaf:Person","foaf:name":"Helen Rostill"}, + {"@type":"foaf:Person","foaf:name":"Ramin Nilforooshan"}, + {"@type":"foaf:Person","foaf:name":"Payam Barnaghi"} + ], + "dcat:keyword": ["Time-Series","Machine Learning","Remote Healthcare","Monitoring","Dementia"], + "dcat:theme": ["http://eurovoc.europa.eu/4636","http://eurovoc.europa.eu/2476"], + "dcterms:rights": "https://creativecommons.org/licenses/by/4.0/", + "dcterms:license": "https://creativecommons.org/licenses/by/4.0/", + "dcterms:accessRights": "http://publications.europa.eu/resource/authority/access-right/PUBLIC", + "dcterms:conformsTo": "https://www.w3.org/TR/vocab-dcat-2/", + "prov:wasDerivedFrom": "https://doi.org/10.5281/zenodo.7622128", + "dcterms:source": "https://doi.org/10.5281/zenodo.7622128", + "dcat:distribution": [ + {"@type":"dcat:Distribution","dcat:accessURL":"data/Activity.csv", "dcat:mediaType":"text/csv","dcterms:title":"Activity.csv"}, + {"@type":"dcat:Distribution","dcat:accessURL":"data/Demographics.csv", "dcat:mediaType":"text/csv","dcterms:title":"Demographics.csv"}, + {"@type":"dcat:Distribution","dcat:accessURL":"data/Labels.csv", "dcat:mediaType":"text/csv","dcterms:title":"Labels.csv"}, + {"@type":"dcat:Distribution","dcat:accessURL":"data/Physiology.csv", "dcat:mediaType":"text/csv","dcterms:title":"Physiology.csv"}, + {"@type":"dcat:Distribution","dcat:accessURL":"data/Sleep.csv", "dcat:mediaType":"text/csv","dcterms:title":"Sleep.csv"} + ], + "dcterms:temporal": {"dcterms:start":"2019-04-01","dcterms:end":"2019-06-30"} +} diff --git a/dataset/metadata.xml b/dataset/metadata.xml new file
mode 100644 index 0000000..032610f --- /dev/null +++ b/dataset/metadata.xml @@ -0,0 +1,132 @@ + + + + https://w3id.org/fair-hackathon/tihm/v1 + TIHM: An open dataset for remote healthcare monitoring in dementia + TIHM is an open in-home remote-monitoring dataset for People Living with Dementia (PLWD), comprising per-patient time-series of activity, sleep, physiology, demographics and clinical labels collected between 2019-04-01 and 2019-06-30 by the UK DRI Care Research & Technology Centre. + 2023-02-10 + 2026-05-21 + + + Francesca Palermo + + + + + Yu Chen + + + + + Alexander Capstick + + + + + Nan Fletcher-Lloyd + + + + + Chloe Walsh + + + + + Samaneh Kouchaki + + + + + Jessica True + + + + + Olga Balazikova + + + + + Eyal Soreq + + + + + Gregory Scott + + + + + Helen Rostill + + + + + Ramin Nilforooshan + + + + + Payam Barnaghi + + + en + + + UK DRI Care Research & Technology Centre, Imperial College London + + + + Time-Series + Machine Learning + Remote Healthcare + Monitoring + Dementia + + + + + + + + + Activity.csv + + text/csv + + + + + Sleep.csv + + text/csv + + + + + Physiology.csv + + text/csv + + + + + Labels.csv + + text/csv + + + + + Demographics.csv + + text/csv + + + +