gaoqiong / lm-evaluation-harness

Commit 8335e43a
authored Sep 17, 2024 by Baber
parent fb963f0f

add batch_size to `get_sample_size`
Showing 2 changed files with 12 additions and 2 deletions (+12 -2)
lm_eval/evaluator.py        +1   -1
lm_eval/evaluator_utils.py  +11  -1
lm_eval/evaluator.py

@@ -436,7 +436,7 @@ def evaluate(

     for task_output in eval_tasks:
         task: Task = task_output.task
-        limit = get_sample_size(task, limit)
+        limit = get_sample_size(task, limit, getattr(lm, "batch_size", None))
         task.build_all_requests(
             limit=limit,
             rank=lm.rank,
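The call site guards the new argument with getattr because not every LM backend defines a batch_size attribute. A minimal standalone sketch of that fallback (the APILikeLM class below is hypothetical, not code from the repo):

class APILikeLM:
    # deliberately no batch_size attribute, like an API-style backend
    rank = 0

lm = APILikeLM()
print(getattr(lm, "batch_size", None))  # -> None, so get_sample_size skips the rounding branch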
lm_eval/evaluator_utils.py

@@ -4,6 +4,8 @@ import pathlib

 import sys
 from typing import List, Optional, Tuple, Union

+from pandas.core.dtypes.inference import is_float
+
 from lm_eval.api.group import ConfigurableGroup
 from lm_eval.api.metrics import (
     aggregate_subtask_metrics,

@@ -200,8 +202,16 @@ def print_writeout(task) -> None:

         eval_logger.info(f"Request: {str(inst)}")


-def get_sample_size(task, limit: Optional[int]) -> Union[int, None]:
+def get_sample_size(
+    task, limit: Optional[int], batch_size: Optional[int]
+) -> Union[int, None]:
     if limit is not None:
+        if batch_size is not None and is_float(limit) and limit == 1.0:
+            eval_logger.warning(
+                "Limit is 1.0, adjusting the sample size to be a multiple of the batch size"
+            )
+            return (len(task.eval_docs) // batch_size) * batch_size
+        elif limit is not None:
             limit = (
                 int(math.ceil(len(task.eval_docs) * limit)) if limit < 1.0 else int(limit)
             )
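When the limit is exactly 1.0 (the full dataset) and a batch size is known, the new branch truncates the sample count to the largest multiple of batch_size; is_float comes from pandas' internal inference helpers and returns True only for float values, so an integer limit should not trigger this branch. A standalone sketch of the arithmetic (not code from the repo, just the formula used in the diff):

def rounded_sample_size(n_docs: int, batch_size: int) -> int:
    # mirrors (len(task.eval_docs) // batch_size) * batch_size
    return (n_docs // batch_size) * batch_size

print(rounded_sample_size(1043, 16))  # -> 1040, the last 3 docs are dropped
print(rounded_sample_size(1043, 32))  # -> 1024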