Commit 1ff4e07f authored by Leo Gao

Add gpt3 chunking

parent f3bf1c07
@@ -37,7 +37,7 @@ def oa_completion(**kwargs):
 class GPT3LM(LM):
     MAX_LENGTH = 2048
-    REQ_CHUNK_SIZE = 64
+    REQ_CHUNK_SIZE = 20
     MAX_GEN_TOKS = 256

     def __init__(self, engine, truncate=False):
@@ -101,28 +101,46 @@ class GPT3LM(LM):
         return res

     def greedy_until(self, requests):
+        if not requests: return []
         import openai
         res = []

-        for context, until in tqdm(requests):
-            context_enc = self.tokenizer.encode(context)
-            inp = context_enc[-(self.MAX_LENGTH - self.MAX_GEN_TOKS):]
-            ctxlen = len(context_enc) - max(0, len(context_enc) - (self.MAX_LENGTH - self.MAX_GEN_TOKS))
+        def sameuntil_chunks(xs, size):
+            ret = []
+            lastuntil = xs[0][1]
+            for x in xs:
+                if len(ret) >= size or x[1] != lastuntil:
+                    yield ret, lastuntil
+                    ret = []
+                    lastuntil = x[1]
+                ret.append(x)
+
+            if ret: yield ret, lastuntil
+
+        # todo: more intelligent batching for heterogeneous `until`
+        for chunk, until in tqdm(list(sameuntil_chunks(requests, self.REQ_CHUNK_SIZE))):
+            inps = []
+            for context, _ in chunk:
+                context_enc = self.tokenizer.encode(context)
+                inp = context_enc[-(self.MAX_LENGTH - self.MAX_GEN_TOKS):]
+                inps.append(inp)

             response = oa_completion(
                 engine=self.engine,
-                prompt=[inp],
+                prompt=inps,
                 max_tokens=self.MAX_GEN_TOKS,
                 temperature=0.,
                 logprobs=10,
                 stop=until
             )
-            s = response.choices[0]['text']
-
-            for term in until:
-                s = s.split(term)[0]
-
-            res.append(s)
+            for resp in response.choices:
+                s = resp['text']
+
+                for term in until:
+                    s = s.split(term)[0]
+
+                res.append(s)

         return res
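For reference, a minimal standalone sketch of the chunking helper introduced above: consecutive requests that share the same `until` stop sequence are grouped into chunks of at most REQ_CHUNK_SIZE, so each batched completion call can use a single stop value. The sample requests and the size argument are illustrative assumptions, not part of the commit.

def sameuntil_chunks(xs, size):
    # xs is a list of (context, until) pairs; yield (chunk, until) groups where
    # every request in a chunk shares the same `until` and chunks hold <= size items
    ret = []
    lastuntil = xs[0][1]
    for x in xs:
        if len(ret) >= size or x[1] != lastuntil:
            yield ret, lastuntil
            ret = []
            lastuntil = x[1]
        ret.append(x)
    if ret:
        yield ret, lastuntil

# hypothetical requests: two share the "\n" stop sequence, one uses "."
requests = [
    ("Question: 2+2=\nAnswer:", ["\n"]),
    ("Question: 3+3=\nAnswer:", ["\n"]),
    ("Translate to French: hello ->", ["."]),
]

for chunk, until in sameuntil_chunks(requests, size=2):
    print(len(chunk), until)   # -> 2 ['\n'] then 1 ['.']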
@@ -8,4 +8,5 @@ transformers>=4.1
 sqlitedict==1.6.0
 pytablewriter==0.58.0
 sacrebleu==1.5.0
-pycountry==20.7.3
\ No newline at end of file
+pycountry==20.7.3
+numexpr==2.7.2
\ No newline at end of file