Unverified Commit 382af8c9 authored by Hailey Schoelkopf, committed by GitHub
Browse files

Merge pull request #948 from glerzing/licenses

Dataset licenses - PR 2
parents cc9778fb b0686dd9
...@@ -43,8 +43,8 @@ level (for indicating the level of difficulty). ...@@ -43,8 +43,8 @@ level (for indicating the level of difficulty).
_HOMEPAGE = "https://github.com/chaochun/nlu-asdiv-dataset" _HOMEPAGE = "https://github.com/chaochun/nlu-asdiv-dataset"
# TODO: Add the licence for the dataset here if you can find it # License declared at https://github.com/chaochun/nlu-asdiv-dataset/blob/master/README.md
_LICENSE = "" _LICENSE = "CC BY-NC 4.0"
_URLS = "https://github.com/chaochun/nlu-asdiv-dataset/archive/55790e5270bb91ccfa5053194b25732534696b50.zip" _URLS = "https://github.com/chaochun/nlu-asdiv-dataset/archive/55790e5270bb91ccfa5053194b25732534696b50.zip"
......
...@@ -44,8 +44,7 @@ appear in a conversation. ...@@ -44,8 +44,7 @@ appear in a conversation.
_HOMEPAGE = "https://stanfordnlp.github.io/coqa/" _HOMEPAGE = "https://stanfordnlp.github.io/coqa/"
# TODO: Add the licence for the dataset here if you can find it _LICENSE = "Different licenses depending on the content (see https://stanfordnlp.github.io/coqa/ for details)"
_LICENSE = ""
_URLS = { _URLS = {
"train": "https://nlp.stanford.edu/data/coqa/coqa-train-v1.0.json", "train": "https://nlp.stanford.edu/data/coqa/coqa-train-v1.0.json",
......
...@@ -43,8 +43,8 @@ and perform discrete operations over them (such as addition, counting, or sortin ...@@ -43,8 +43,8 @@ and perform discrete operations over them (such as addition, counting, or sortin
_HOMEPAGE = "https://allenai.org/data/drop" _HOMEPAGE = "https://allenai.org/data/drop"
# TODO: Add the licence for the dataset here if you can find it # License declared at https://allenai.org/data/drop
_LICENSE = "" _LICENSE = "CC BY"
_URLS = { _URLS = {
"drop": "https://s3-us-west-2.amazonaws.com/allennlp/datasets/drop/drop_dataset.zip", "drop": "https://s3-us-west-2.amazonaws.com/allennlp/datasets/drop/drop_dataset.zip",
......
...@@ -51,7 +51,10 @@ The dataset contains questions about the following topics: medicine, nursing, ps ...@@ -51,7 +51,10 @@ The dataset contains questions about the following topics: medicine, nursing, ps
_HOMEPAGE = "https://aghie.github.io/head-qa/" _HOMEPAGE = "https://aghie.github.io/head-qa/"
_LICENSE = "MIT License" # The Spanish data comes from the "Ministerio de Sanidad, Consumo y Bienestar Social", as indicated here: https://github.com/aghie/head-qa
# This Spanish data seems to follow the intellectual property rights stated here: https://www.sanidad.gob.es/avisoLegal/home.htm
# The English data was translated by the authors of head-qa (https://arxiv.org/pdf/1906.04701.pdf).
_LICENSE = "Custom license"
_URL = "https://drive.google.com/uc?export=download&confirm=t&id=1a_95N5zQQoUCq8IBNVZgziHbeM-QxG2t" _URL = "https://drive.google.com/uc?export=download&confirm=t&id=1a_95N5zQQoUCq8IBNVZgziHbeM-QxG2t"
......
...@@ -41,8 +41,10 @@ learning agents. ...@@ -41,8 +41,10 @@ learning agents.
_HOMEPAGE = "https://github.com/hendrycks/ethics" _HOMEPAGE = "https://github.com/hendrycks/ethics"
# TODO: Add the licence for the dataset here if you can find it # The authors declared that the dataset is not distributed under a copyright or intellectual property (https://arxiv.org/pdf/2008.02275.pdf)
_LICENSE = "" # On Hugging Face, the dataset is distributed under the MIT license (https://huggingface.co/datasets/hendrycks/ethics)
# The common sense portion is from Reddit and might incur some licensing complications.
_LICENSE = "Ambiguous"
_URLS = "https://people.eecs.berkeley.edu/~hendrycks/ethics.tar" _URLS = "https://people.eecs.berkeley.edu/~hendrycks/ethics.tar"
......
...@@ -38,8 +38,8 @@ models to generate answer derivations and explanations. ...@@ -38,8 +38,8 @@ models to generate answer derivations and explanations.
_HOMEPAGE = "https://github.com/hendrycks/math" _HOMEPAGE = "https://github.com/hendrycks/math"
# TODO: Add the licence for the dataset here if you can find it # License declared at https://arxiv.org/pdf/2103.03874.pdf
_LICENSE = "" _LICENSE = "MIT License"
_URLS = "https://people.eecs.berkeley.edu/~hendrycks/MATH.tar" _URLS = "https://people.eecs.berkeley.edu/~hendrycks/MATH.tar"
......
...@@ -38,8 +38,7 @@ NLP setting. ...@@ -38,8 +38,7 @@ NLP setting.
_HOMEPAGE = "https://github.com/lgw863/LogiQA-dataset" _HOMEPAGE = "https://github.com/lgw863/LogiQA-dataset"
# TODO: Add the licence for the dataset here if you can find it _LICENSE = "No license found"
_LICENSE = ""
_URLS = { _URLS = {
"train": "https://raw.githubusercontent.com/lgw863/LogiQA-dataset/master/Train.txt", "train": "https://raw.githubusercontent.com/lgw863/LogiQA-dataset/master/Train.txt",
......
...@@ -38,8 +38,7 @@ modified from Chinese high school English listening comprehension test data. ...@@ -38,8 +38,7 @@ modified from Chinese high school English listening comprehension test data.
_HOMEPAGE = "https://github.com/Nealcly/MuTual" _HOMEPAGE = "https://github.com/Nealcly/MuTual"
# TODO: Add the licence for the dataset here if you can find it _LICENSE = "No license found"
_LICENSE = ""
_URLS = "https://github.com/Nealcly/MuTual/archive/master.zip" _URLS = "https://github.com/Nealcly/MuTual/archive/master.zip"
......
...@@ -38,8 +38,8 @@ math, computer science, and philosophy papers. ...@@ -38,8 +38,8 @@ math, computer science, and philosophy papers.
_HOMEPAGE = "https://pile.eleuther.ai/" _HOMEPAGE = "https://pile.eleuther.ai/"
# TODO: Add the licence for the dataset here if you can find it # More details at https://arxiv.org/pdf/2201.07311.pdf
_LICENSE = "" _LICENSE = "Multiple licenses"
_URLS = { _URLS = {
"validation": "https://the-eye.eu/public/AI/pile/val.jsonl.zst", "validation": "https://the-eye.eu/public/AI/pile/val.jsonl.zst",
......
...@@ -39,8 +39,8 @@ a teacher who answers the questions by providing short excerpts (spans) from the ...@@ -39,8 +39,8 @@ a teacher who answers the questions by providing short excerpts (spans) from the
_HOMEPAGE = "https://quac.ai/" _HOMEPAGE = "https://quac.ai/"
# TODO: Add the licence for the dataset here if you can find it # License declared at https://quac.ai/
_LICENSE = "" _LICENSE = "CC BY-SA 4.0"
_URLS = { _URLS = {
"train": "https://s3.amazonaws.com/my89public/quac/train_v0.2.json", "train": "https://s3.amazonaws.com/my89public/quac/train_v0.2.json",
......
...@@ -39,8 +39,7 @@ multiple-choice analogy questions; 5 choices per question. ...@@ -39,8 +39,7 @@ multiple-choice analogy questions; 5 choices per question.
_HOMEPAGE = "https://aclweb.org/aclwiki/SAT_Analogy_Questions_(State_of_the_art)" _HOMEPAGE = "https://aclweb.org/aclwiki/SAT_Analogy_Questions_(State_of_the_art)"
# TODO: Add the licence for the dataset here if you can find it _LICENSE = "No license found"
_LICENSE = ""
class SatAnalogies(datasets.GeneratorBasedBuilder): class SatAnalogies(datasets.GeneratorBasedBuilder):
......
...@@ -42,8 +42,7 @@ addition, or deletion of characters, and asking it to recover the original word. ...@@ -42,8 +42,7 @@ addition, or deletion of characters, and asking it to recover the original word.
_HOMEPAGE = "https://github.com/openai/gpt-3/tree/master/data" _HOMEPAGE = "https://github.com/openai/gpt-3/tree/master/data"
# TODO: Add the licence for the dataset here if you can find it _LICENSE = "No license found"
_LICENSE = ""
_BASE_URL = "https://raw.githubusercontent.com/openai/gpt-3/master/data" _BASE_URL = "https://raw.githubusercontent.com/openai/gpt-3/master/data"
......
Markdown is supported
0% Try again or attach a new file.
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment