description="Upload your data to the Zeno AI evaluation platform to visualize results. This requires a ZENO_API_KEY in your environment variables. The eleuther harness must be run with log_samples=True and an output_path set for data to be written to disk."
description="Upload your data to the Zeno AI evaluation platform to visualize results. This requires a ZENO_API_KEY in your environment variables. The eleuther harness must be run with log_samples=True and an output_path set for data to be written to disk."
# NOTE(jinwei): EleutherAI/pythia-70m is not supported by SGLang yet, so we use a Qwen model instead.
cls.LM=SGLangLM(
pretrained="Qwen/Qwen2-1.5B-Instruct",
batch_size=1,
tp_size=1,
max_model_len=1024,
)
exceptExceptionase:
pytest.fail(f"🔥 SGLangLM failed to initialize: {e}")
deftest_logliklihood(self)->None:
res=self.LM.loglikelihood(self.MULTIPLE_CH)
assertlen(res)==len(self.MULTIPLE_CH)
forxinres:
assertisinstance(x[0],float)
deftest_generate_until(self)->None:
res=self.LM.generate_until(self.generate_until)
assertlen(res)==len(self.generate_until)
forxinres:
assertisinstance(x,str)
# NOTE(Jinwei): An A100 80GB is enough for our tests. If the last test, "test_logliklihood_rolling", runs out of memory (OOM), reduce "max_model_len".