import nlp
import numpy as np
import random

from ..base import Dataset


class HFNLPTask(Dataset):
    """Base class for tasks whose documents are loaded via ``nlp.load_dataset``.

    ``NLP_PATH`` and ``NLP_NAME`` are forwarded as the ``path`` and ``name``
    arguments of ``nlp.load_dataset``; both default to ``None`` here.

    NOTE(review): ``has_training_docs``, ``has_validation_docs`` and
    ``has_test_docs`` are called below but not defined in this class --
    presumably they come from ``Dataset`` or a concrete subclass; confirm.
    """

    # Arguments passed to nlp.load_dataset by _load_nlp_dataset().
    NLP_PATH = None
    NLP_NAME = None

    def __init__(self):
        super().__init__()
        # Filled on the first successful training_docs() call.
        self._training_docs = None

    def _load_nlp_dataset(self):
        """Return ``nlp.load_dataset(path=NLP_PATH, name=NLP_NAME)``."""
        return nlp.load_dataset(path=self.NLP_PATH, name=self.NLP_NAME)

    def training_docs(self):
        """Return the ``"train"`` split as a list, cached on the instance.

        Returns ``None`` when ``has_training_docs()`` is falsy.
        """
        # Cache training for faster few-shot.
        # If data is too large to fit in memory, override this method.
        if not self.has_training_docs():
            return None
        if self._training_docs is None:
            self._training_docs = list(self._load_nlp_dataset()["train"])
        return self._training_docs

    def validation_docs(self):
        """Return the ``"validation"`` split, or ``None`` if unavailable.

        The split is returned as indexed from the loaded dataset (not copied
        into a list) and the dataset is loaded again on every call.
        """
        if not self.has_validation_docs():
            return None
        return self._load_nlp_dataset()["validation"]

    def test_docs(self):
        """Return the ``"test"`` split, or ``None`` if unavailable.

        The split is returned as indexed from the loaded dataset (not copied
        into a list) and the dataset is loaded again on every call.
        """
        if not self.has_test_docs():
            return None
        return self._load_nlp_dataset()["test"]

    def fewshot_examples(self, k):
        """Return ``k`` distinct training documents chosen at random.

        Indices are drawn without replacement using the module-level
        ``random`` generator, so ``random.sample`` raises ``ValueError`` when
        ``k`` exceeds the number of training documents.  If
        ``training_docs()`` returns ``None`` the ``len`` call raises
        ``TypeError``.
        """
        training_docs = self.training_docs()
        n = len(training_docs)
        indices = random.sample(range(n), k)
        return [training_docs[i] for i in indices]

def simple_accuracy_metric(preds, golds):
    """Compute accuracy as the mean of elementwise ``preds == golds``.

    Both arguments are converted with ``np.array`` before comparison.

    Returns:
        A dict with the accuracy as a Python ``float`` under ``"major"`` and
        under ``"minor"["acc"]``, plus ``"higher_is_better": True``.
    """
    matches = np.array(preds) == np.array(golds)
    accuracy = float(matches.mean())
    return dict(
        major=accuracy,
        minor=dict(acc=accuracy),
        higher_is_better=True,
    )


def yesno(x):
    """Return ``'yes'`` if ``x`` is truthy, otherwise ``'no'``."""
    return 'yes' if x else 'no'