rename to ggml

ac9f4be2 · Matt Hoffner · 3ee4c2e2 · ac9f4be2 · ac9f4be2 · ac9f4be2
Commit ac9f4be2 authored Jun 26, 2023 by Matt Hoffner
Hide whitespace changes
Inline Side-by-side

Showing with 19 additions and 19 deletions

lm_eval/models/__init__.py lm_eval/models/__init__.py +2 -2

lm_eval/models/ggml.py lm_eval/models/ggml.py +4 -4

tests/test_ggml.py tests/test_ggml.py +13 -13

No files found.
--- a/lm_eval/models/__init__.py
+++ b/lm_eval/models/__init__.py
@@ -4,7 +4,7 @@ from . import anthropic_llms
 from . import huggingface
 from . import textsynth
 from . import dummy
-from . import llama
+from . import ggml

 MODEL_REGISTRY = {
    "hf": gpt2.HFLM,
@@ -16,7 +16,7 @@ MODEL_REGISTRY = {
    "anthropic": anthropic_llms.AnthropicLM,
    "textsynth": textsynth.TextSynthLM,
    "dummy": dummy.DummyLM,
-    "llama": llama.LlamaCppLM
+    "ggml": ggml.GGMLLM
 }



--- a/lm_eval/models/llama.py
+++ b/lm_eval/models/ggml.py
@@ -9,7 +9,7 @@ import time

 logger = logging.getLogger(__name__)

-def llama_completion(base_url, prompt, **kwargs):
+def ggml_completion(base_url, prompt, **kwargs):
    try:
        response = requests.post(f"{base_url}/v1/completions", json=kwargs)
        response.raise_for_status()
@@ -18,7 +18,7 @@ def llama_completion(base_url, prompt, **kwargs):
        print(f"RequestException: {e}")
        return None

-class LlamaCppLM(BaseLM):
+class GGMLLM(BaseLM):
    def __init__(self, base_url, truncate=False):
        super().__init__()
        self.base_url = base_url
@@ -27,7 +27,7 @@ class LlamaCppLM(BaseLM):
    def loglikelihood(self, requests):
        res = []
        for context, continuation in tqdm(requests):
-            response = llama_completion(self.base_url, context, continuation=continuation)
+            response = ggml_completion(self.base_url, context, continuation=continuation)
            print(f"Loglikelihood response: {response}")
            if response and "choices" in response and response["choices"]:
                choice = response["choices"][0]
@@ -49,7 +49,7 @@ class LlamaCppLM(BaseLM):
            inp = request[0]
            request_args = request[1]
            until = request_args["until"]
-            response = self.llama_completion(inp, context=res, stop=until)  # Pass the context
+            response = self.ggml_completion(inp, context=res, stop=until)  # Pass the context
            print(f"Greedy_until response: {response}")
            if response and "text" in response:
                generated_text = response["text"].strip()

--- a/tests/test_llama.py
+++ b/tests/test_ggml.py
 import unittest
 from unittest.mock import MagicMock
-from lm_eval.models.llama import LlamaCppLM
+from lm_eval.models.ggml import GGMLLM

-class LlamaCppLMTest(unittest.TestCase):
+class GGMLLMTest(unittest.TestCase):
    def test_loglikelihood(self):
        base_url = "https://matthoffner-ggml-llm-api.hf.space"
-        lm = LlamaCppLM(base_url)
+        lm = GGMLLM(base_url)

-        # Create a MagicMock object to mock llama_completion
-        llama_completion_mock = MagicMock()
+        # Create a MagicMock object to mock ggml_completion
+        ggml_completion_mock = MagicMock()

        # Set the return value for the mocked function
-        llama_completion_mock.return_value = {
+        ggml_completion_mock.return_value = {
            "logprob": -1.2345,
            "is_greedy": True
        }

-        # Patch the llama_completion function with the mocked function
-        lm.llama_completion = llama_completion_mock
+        # Patch the ggml_completion function with the mocked function
+        lm.ggml_completion = ggml_completion_mock

        # Test loglikelihood
        requests = [("context1", "continuation1"), ("context2", "continuation2")]
@@ -29,16 +29,16 @@ class LlamaCppLMTest(unittest.TestCase):

    def test_greedy_until(self):
        base_url = "https://matthoffner-ggml-llm-api.hf.space"
-        lm = LlamaCppLM(base_url)
+        lm = GGMLLM(base_url)

-        # Define the llama_completion method with the desired behavior
-        def llama_completion_mock(url, context, stop=None):
+        # Define the ggml_completion method with the desired behavior
+        def ggml_completion_mock(url, context, stop=None):
            if stop is not None:
                return {"text": f"generated_text{stop[-1]}"}
            return {"text": "generated_text"}

-        # Set the llama_completion method to the defined mock
-        lm.llama_completion = llama_completion_mock
+        # Set the ggml_completion method to the defined mock
+        lm.ggml_completion = ggml_completion_mock

        # Test greedy_until
        requests = [("input1", {"until": "stop1"}), ("input2", {"until": "stop2"})]