diff --git a/dataset/example01/README.md b/dataset/example01/README.md index ea76fbb..92ec7e5 100644 --- a/dataset/example01/README.md +++ b/dataset/example01/README.md @@ -20,8 +20,9 @@ Each record consists mostly of numerical data with some categorical data. The file `codebook.csv` contains the column names from the header of `data.csv`, together with their description, unit, and source. -The content of this example is an excerpt of Our World in Data CO2 and -Greenhouse Gas Emissions dataset, available in full, under Creative Commons -Attribution 4.0 International License, at <https://github.com/owid/co2-data/>. +The content of this example is an excerpt of the Our World in Data CO2 and +Greenhouse Gas Emissions dataset. It is available in full, under Creative +Commons Attribution 4.0 International License, at +<https://github.com/owid/co2-data/>. -[![A diagram of SPDX 3.0 of Dataset Example 01](./spdx3.0/example01.spdx3.png "A diagram of SPDX 3.0 of Dataset Example 01")](./spdx3.0/example01.spdx3.png) +[![A diagram of a bill of materials of Dataset Example 01](./spdx3.0/example01.png "A diagram of a bill of materials of Dataset Example 01")](./spdx3.0/example01.png) diff --git a/dataset/example01/spdx3.0/example01.png b/dataset/example01/spdx3.0/example01.png new file mode 100644 index 0000000..fe521d1 Binary files /dev/null and b/dataset/example01/spdx3.0/example01.png differ diff --git a/dataset/example01/spdx3.0/example01.spdx3.json b/dataset/example01/spdx3.0/example01.spdx3.json index 39fd747..351c814 100644 --- a/dataset/example01/spdx3.0/example01.spdx3.json +++ b/dataset/example01/spdx3.0/example01.spdx3.json @@ -19,7 +19,7 @@ { "type": "ExternalIdentifier", "externalIdentifierType": "email", - "identifier": "arthit@example.com" + "identifier": "suriyawa@tcd.ie" } ] }, @@ -27,7 +27,18 @@ "type": "Organization", "spdxId": "https://spdx.org/spdxdocs/Organization1-cb617656-1023-45e7-84c7-a9311644337b", "creationInfo": "_:creationinfo", - "name": "Our World in Data" + "name": "Our World in Data", + "externalIdentifier": [ + { 
+ "type": "ExternalIdentifier", + "externalIdentifierType": "other", + "issuingAuthority": "GitHub", + "identifier": "owid", + "identifierLocator": [ + "https://github.com/owid/" + ] + } + ] }, { "type": "SpdxDocument", @@ -66,7 +77,11 @@ "software_downloadLocation": "https://github.com/owid/co2-data/", "software_primaryPurpose": "data", "dataset_confidentialityLevel": "clear", + "dataset_dataPreprocessing": [ + "The dataset is built upon a number of datasets and processing steps. See: https://github.com/owid/co2-data/blob/master/README.md" + ], "dataset_datasetAvailability": "directDownload", + "dataset_dataCollectionProcess": "The data is collected from various sources, including international organizations and research institutions.", "dataset_datasetSize": 2689, "dataset_datasetType": [ "structured", @@ -77,14 +92,15 @@ "dataset_intendedUse": "To make the data about greenhouse gas emissions accessible.", "dataset_knownBias": [ "Data in some geographical areas are more completed than the others." - ] + ], + "comment": "This is a small excerpt of the full dataset." }, { "type": "software_File", "spdxId": "https://spdx.org/spdxdocs/File1-d029fccb-7ee9-42be-a445-5e2066db0de8", "creationInfo": "_:creationinfo", "name": "data.csv", - "software_contentType": "text/csv", + "software_contentType": "text/csv;charset=UTF-8", "software_primaryPurpose": "data", "releaseTime": "2024-04-15T08:10:00Z", "originatedBy": [ @@ -96,12 +112,13 @@ "spdxId": "https://spdx.org/spdxdocs/File2-caf55baf-cd02-406a-b7ec-838842ca869f", "creationInfo": "_:creationinfo", "name": "codebook.csv", - "software_contentType": "text/csv", + "software_contentType": "text/csv;charset=UTF-8", "software_primaryPurpose": "data", "releaseTime": "2024-04-15T08:10:00Z", "originatedBy": [ "https://spdx.org/spdxdocs/Organization1-cb617656-1023-45e7-84c7-a9311644337b" - ] + ], + "description": "A description of each column in data.csv." 
}, { "type": "Relationship", @@ -112,7 +129,19 @@ "to": [ "https://spdx.org/spdxdocs/File1-d029fccb-7ee9-42be-a445-5e2066db0de8", "https://spdx.org/spdxdocs/File2-caf55baf-cd02-406a-b7ec-838842ca869f" - ] + ], + "description": "DatasetPackage1 contains data.csv and codebook.csv." + }, + { + "type": "Relationship", + "spdxId": "https://spdx.org/spdxdocs/Relationship/describes-de3f5855-bd5a-403f-9aa6-95dd97599c32", + "creationInfo": "_:creationinfo", + "relationshipType": "describes", + "from": "https://spdx.org/spdxdocs/File2-caf55baf-cd02-406a-b7ec-838842ca869f", + "to": [ + "https://spdx.org/spdxdocs/File1-d029fccb-7ee9-42be-a445-5e2066db0de8" + ], + "description": "codebook.csv describes data.csv." }, { "type": "Relationship", @@ -122,7 +151,8 @@ "from": "https://spdx.org/spdxdocs/DatasetPackage1-035470d9-3ede-4952-91c8-c2abb943c90b", "to": [ "https://spdx.org/licenses/CC-BY-4.0" - ] + ], + "description": "DatasetPackage1 has a concluded license as CC-BY-4.0." }, { "type": "Relationship", @@ -132,14 +162,16 @@ "from": "https://spdx.org/spdxdocs/DatasetPackage1-035470d9-3ede-4952-91c8-c2abb943c90b", "to": [ "https://spdx.org/licenses/CC-BY-4.0" - ] + ], + "description": "DatasetPackage1 has a declared license as CC-BY-4.0." }, { "type": "simplelicensing_LicenseExpression", "spdxId": "https://spdx.org/licenses/CC-BY-4.0", "creationInfo": "_:creationinfo", "simplelicensing_licenseExpression": "CC-BY-4.0", - "simplelicensing_licenseListVersion": "3.24.0" + "simplelicensing_licenseListVersion": "3.24.0", + "comment": "Added as a workaround for the lack of https://spdx.org/licenses/CC-BY-4.0 as a valid ListedLicense in SPDX 3.0.0 RDF. This will be removed once https://github.com/spdx/LicenseListPublisher/issues/183 is implemented." 
} ] } \ No newline at end of file diff --git a/dataset/example01/spdx3.0/example01.spdx3.png b/dataset/example01/spdx3.0/example01.spdx3.png deleted file mode 100644 index 74fc3b1..0000000 Binary files a/dataset/example01/spdx3.0/example01.spdx3.png and /dev/null differ