test_misc.py 342 Bytes
Newer Older
Leo Gao's avatar
Leo Gao committed
1
import pytest
haileyschoelkopf's avatar
haileyschoelkopf committed
2
import lm_eval.api.metrics as metrics
Leo Gao's avatar
Leo Gao committed
3
import random
Leo Gao's avatar
Leo Gao committed
4
5
6


def test_bootstrapping():
    """Compare ``metrics.bootstrap_stderr`` against ``metrics.mean_stderr``.

    Draws 1000 values from ``random.random()`` under a fixed seed, then
    asserts that the bootstrap result for ``metrics.mean`` (100000
    iterations) matches ``metrics.mean_stderr`` on the same data to within
    an absolute tolerance of 1e-4.
    """
    # Fixed seed so the sample data is identical on every run.
    random.seed(42)
    samples = [random.random() for _ in range(1000)]

    # Reference value computed directly by the metrics module.
    reference_stderr = metrics.mean_stderr(samples)

    # Resampling-based value for the same statistic and data.
    # NOTE(review): presumably a large iteration count is needed to land
    # within the 1e-4 tolerance below -- confirm before lowering it.
    bootstrap_estimate = metrics.bootstrap_stderr(
        metrics.mean, samples, iters=100000
    )

    assert bootstrap_estimate == pytest.approx(reference_stderr, abs=1e-4)