"fair_dev/testing/testing.py" did not exist on "543d56935ee39c9b288d78f577eae8a2199bca7d"
Unverified commit fc9c3153, authored by Daniël de Kok, committed by GitHub
Browse files

Add pytest release marker (#2114)

* Add pytest release marker

Annotate a test with `@pytest.mark.release` and it is only run when
pytest is invoked with the flag: `pytest integration-tests --release`.

* Mark many models as `release` to speed up CI
parent e563983d
...@@ -13,6 +13,7 @@ async def flash_santacoder(flash_santacoder_handle): ...@@ -13,6 +13,7 @@ async def flash_santacoder(flash_santacoder_handle):
return flash_santacoder_handle.client return flash_santacoder_handle.client
@pytest.mark.release
@pytest.mark.asyncio @pytest.mark.asyncio
async def test_flash_santacoder(flash_santacoder, response_snapshot): async def test_flash_santacoder(flash_santacoder, response_snapshot):
response = await flash_santacoder.generate( response = await flash_santacoder.generate(
...@@ -23,6 +24,7 @@ async def test_flash_santacoder(flash_santacoder, response_snapshot): ...@@ -23,6 +24,7 @@ async def test_flash_santacoder(flash_santacoder, response_snapshot):
assert response == response_snapshot assert response == response_snapshot
@pytest.mark.release
@pytest.mark.asyncio @pytest.mark.asyncio
async def test_flash_santacoder_load( async def test_flash_santacoder_load(
flash_santacoder, generate_load, response_snapshot flash_santacoder, generate_load, response_snapshot
......
...@@ -13,6 +13,7 @@ async def flash_starcoder(flash_starcoder_handle): ...@@ -13,6 +13,7 @@ async def flash_starcoder(flash_starcoder_handle):
return flash_starcoder_handle.client return flash_starcoder_handle.client
@pytest.mark.release
@pytest.mark.asyncio @pytest.mark.asyncio
@pytest.mark.private @pytest.mark.private
async def test_flash_starcoder(flash_starcoder, response_snapshot): async def test_flash_starcoder(flash_starcoder, response_snapshot):
...@@ -24,6 +25,7 @@ async def test_flash_starcoder(flash_starcoder, response_snapshot): ...@@ -24,6 +25,7 @@ async def test_flash_starcoder(flash_starcoder, response_snapshot):
assert response == response_snapshot assert response == response_snapshot
@pytest.mark.release
@pytest.mark.asyncio @pytest.mark.asyncio
@pytest.mark.private @pytest.mark.private
async def test_flash_starcoder_default_params(flash_starcoder, response_snapshot): async def test_flash_starcoder_default_params(flash_starcoder, response_snapshot):
...@@ -40,6 +42,7 @@ async def test_flash_starcoder_default_params(flash_starcoder, response_snapshot ...@@ -40,6 +42,7 @@ async def test_flash_starcoder_default_params(flash_starcoder, response_snapshot
assert response == response_snapshot assert response == response_snapshot
@pytest.mark.release
@pytest.mark.asyncio @pytest.mark.asyncio
@pytest.mark.private @pytest.mark.private
async def test_flash_starcoder_load(flash_starcoder, generate_load, response_snapshot): async def test_flash_starcoder_load(flash_starcoder, generate_load, response_snapshot):
......
...@@ -13,6 +13,7 @@ async def flash_starcoder2(flash_starcoder2_handle): ...@@ -13,6 +13,7 @@ async def flash_starcoder2(flash_starcoder2_handle):
return flash_starcoder2_handle.client return flash_starcoder2_handle.client
@pytest.mark.release
@pytest.mark.asyncio @pytest.mark.asyncio
@pytest.mark.private @pytest.mark.private
async def test_flash_starcoder2(flash_starcoder2, response_snapshot): async def test_flash_starcoder2(flash_starcoder2, response_snapshot):
...@@ -24,6 +25,7 @@ async def test_flash_starcoder2(flash_starcoder2, response_snapshot): ...@@ -24,6 +25,7 @@ async def test_flash_starcoder2(flash_starcoder2, response_snapshot):
assert response == response_snapshot assert response == response_snapshot
@pytest.mark.release
@pytest.mark.asyncio @pytest.mark.asyncio
@pytest.mark.private @pytest.mark.private
async def test_flash_starcoder2_default_params(flash_starcoder2, response_snapshot): async def test_flash_starcoder2_default_params(flash_starcoder2, response_snapshot):
...@@ -40,6 +42,7 @@ async def test_flash_starcoder2_default_params(flash_starcoder2, response_snapsh ...@@ -40,6 +42,7 @@ async def test_flash_starcoder2_default_params(flash_starcoder2, response_snapsh
assert response == response_snapshot assert response == response_snapshot
@pytest.mark.release
@pytest.mark.asyncio @pytest.mark.asyncio
@pytest.mark.private @pytest.mark.private
async def test_flash_starcoder2_load( async def test_flash_starcoder2_load(
......
...@@ -13,6 +13,7 @@ async def flash_starcoder_gptq(flash_starcoder_gptq_handle): ...@@ -13,6 +13,7 @@ async def flash_starcoder_gptq(flash_starcoder_gptq_handle):
return flash_starcoder_gptq_handle.client return flash_starcoder_gptq_handle.client
@pytest.mark.release
@pytest.mark.asyncio @pytest.mark.asyncio
async def test_flash_starcoder_gptq(flash_starcoder_gptq, generous_response_snapshot): async def test_flash_starcoder_gptq(flash_starcoder_gptq, generous_response_snapshot):
response = await flash_starcoder_gptq.generate( response = await flash_starcoder_gptq.generate(
...@@ -24,6 +25,7 @@ async def test_flash_starcoder_gptq(flash_starcoder_gptq, generous_response_snap ...@@ -24,6 +25,7 @@ async def test_flash_starcoder_gptq(flash_starcoder_gptq, generous_response_snap
assert response == generous_response_snapshot assert response == generous_response_snapshot
@pytest.mark.release
@pytest.mark.asyncio @pytest.mark.asyncio
async def test_flash_starcoder_gptq_default_params( async def test_flash_starcoder_gptq_default_params(
flash_starcoder_gptq, generous_response_snapshot flash_starcoder_gptq, generous_response_snapshot
...@@ -40,6 +42,7 @@ async def test_flash_starcoder_gptq_default_params( ...@@ -40,6 +42,7 @@ async def test_flash_starcoder_gptq_default_params(
assert response == generous_response_snapshot assert response == generous_response_snapshot
@pytest.mark.release
@pytest.mark.asyncio @pytest.mark.asyncio
async def test_flash_starcoder_gptq_load( async def test_flash_starcoder_gptq_load(
flash_starcoder_gptq, generate_load, generous_response_snapshot flash_starcoder_gptq, generate_load, generous_response_snapshot
......
...@@ -21,6 +21,7 @@ async def non_flash_llama_grammar(non_flash_llama_grammar_handle): ...@@ -21,6 +21,7 @@ async def non_flash_llama_grammar(non_flash_llama_grammar_handle):
return non_flash_llama_grammar_handle.client return non_flash_llama_grammar_handle.client
@pytest.mark.release
@pytest.mark.skip @pytest.mark.skip
@pytest.mark.asyncio @pytest.mark.asyncio
async def test_non_flash_llama_grammar_json(non_flash_llama_grammar, response_snapshot): async def test_non_flash_llama_grammar_json(non_flash_llama_grammar, response_snapshot):
......
...@@ -22,6 +22,7 @@ async def llama_grammar(llama_grammar_handle): ...@@ -22,6 +22,7 @@ async def llama_grammar(llama_grammar_handle):
return llama_grammar_handle.client return llama_grammar_handle.client
@pytest.mark.release
@pytest.mark.asyncio @pytest.mark.asyncio
async def test_grammar_response_format_llama_json(llama_grammar, response_snapshot): async def test_grammar_response_format_llama_json(llama_grammar, response_snapshot):
...@@ -62,6 +63,7 @@ async def test_grammar_response_format_llama_json(llama_grammar, response_snapsh ...@@ -62,6 +63,7 @@ async def test_grammar_response_format_llama_json(llama_grammar, response_snapsh
assert chat_completion == response_snapshot assert chat_completion == response_snapshot
@pytest.mark.release
@pytest.mark.asyncio @pytest.mark.asyncio
async def test_grammar_response_format_llama_error_if_tools_not_installed( async def test_grammar_response_format_llama_error_if_tools_not_installed(
llama_grammar, llama_grammar,
......
...@@ -45,6 +45,7 @@ async def test_idefics(idefics, response_snapshot): ...@@ -45,6 +45,7 @@ async def test_idefics(idefics, response_snapshot):
assert response == response_snapshot assert response == response_snapshot
@pytest.mark.release
@pytest.mark.asyncio @pytest.mark.asyncio
@pytest.mark.private @pytest.mark.private
async def test_idefics_two_images(idefics, response_snapshot): async def test_idefics_two_images(idefics, response_snapshot):
...@@ -60,6 +61,7 @@ async def test_idefics_two_images(idefics, response_snapshot): ...@@ -60,6 +61,7 @@ async def test_idefics_two_images(idefics, response_snapshot):
assert response == response_snapshot assert response == response_snapshot
@pytest.mark.release
@pytest.mark.asyncio @pytest.mark.asyncio
async def test_idefics_load(idefics, generate_load, response_snapshot): async def test_idefics_load(idefics, generate_load, response_snapshot):
chicken = get_chicken() chicken = get_chicken()
......
...@@ -26,6 +26,7 @@ async def flash_llava_next(flash_llava_next_handle): ...@@ -26,6 +26,7 @@ async def flash_llava_next(flash_llava_next_handle):
return flash_llava_next_handle.client return flash_llava_next_handle.client
@pytest.mark.release
@pytest.mark.asyncio @pytest.mark.asyncio
@pytest.mark.private @pytest.mark.private
async def test_flash_llava_next_simple(flash_llava_next, response_snapshot): async def test_flash_llava_next_simple(flash_llava_next, response_snapshot):
...@@ -41,6 +42,7 @@ async def test_flash_llava_next_simple(flash_llava_next, response_snapshot): ...@@ -41,6 +42,7 @@ async def test_flash_llava_next_simple(flash_llava_next, response_snapshot):
assert response == response_snapshot assert response == response_snapshot
@pytest.mark.release
@pytest.mark.asyncio @pytest.mark.asyncio
@pytest.mark.private @pytest.mark.private
async def test_flash_llava_next_all_params(flash_llava_next, response_snapshot): async def test_flash_llava_next_all_params(flash_llava_next, response_snapshot):
...@@ -64,6 +66,7 @@ async def test_flash_llava_next_all_params(flash_llava_next, response_snapshot): ...@@ -64,6 +66,7 @@ async def test_flash_llava_next_all_params(flash_llava_next, response_snapshot):
assert response == response_snapshot assert response == response_snapshot
@pytest.mark.release
@pytest.mark.asyncio @pytest.mark.asyncio
@pytest.mark.private @pytest.mark.private
async def test_flash_llava_next_load( async def test_flash_llava_next_load(
......
...@@ -13,6 +13,7 @@ async def fused_kernel_mamba(fused_kernel_mamba_handle): ...@@ -13,6 +13,7 @@ async def fused_kernel_mamba(fused_kernel_mamba_handle):
return fused_kernel_mamba_handle.client return fused_kernel_mamba_handle.client
@pytest.mark.release
@pytest.mark.asyncio @pytest.mark.asyncio
async def test_mamba(fused_kernel_mamba, response_snapshot): async def test_mamba(fused_kernel_mamba, response_snapshot):
response = await fused_kernel_mamba.generate( response = await fused_kernel_mamba.generate(
...@@ -24,6 +25,7 @@ async def test_mamba(fused_kernel_mamba, response_snapshot): ...@@ -24,6 +25,7 @@ async def test_mamba(fused_kernel_mamba, response_snapshot):
assert response == response_snapshot assert response == response_snapshot
@pytest.mark.release
@pytest.mark.asyncio @pytest.mark.asyncio
async def test_mamba_all_params(fused_kernel_mamba, response_snapshot): async def test_mamba_all_params(fused_kernel_mamba, response_snapshot):
response = await fused_kernel_mamba.generate( response = await fused_kernel_mamba.generate(
...@@ -50,6 +52,7 @@ async def test_mamba_all_params(fused_kernel_mamba, response_snapshot): ...@@ -50,6 +52,7 @@ async def test_mamba_all_params(fused_kernel_mamba, response_snapshot):
assert response == response_snapshot assert response == response_snapshot
@pytest.mark.release
@pytest.mark.asyncio @pytest.mark.asyncio
async def test_mamba_load( async def test_mamba_load(
fused_kernel_mamba, generate_load, generous_response_snapshot fused_kernel_mamba, generate_load, generous_response_snapshot
......
...@@ -13,6 +13,7 @@ async def mpt_sharded(mpt_sharded_handle): ...@@ -13,6 +13,7 @@ async def mpt_sharded(mpt_sharded_handle):
return mpt_sharded_handle.client return mpt_sharded_handle.client
@pytest.mark.release
@pytest.mark.asyncio @pytest.mark.asyncio
async def test_mpt(mpt_sharded, response_snapshot): async def test_mpt(mpt_sharded, response_snapshot):
response = await mpt_sharded.generate( response = await mpt_sharded.generate(
...@@ -29,6 +30,7 @@ async def test_mpt(mpt_sharded, response_snapshot): ...@@ -29,6 +30,7 @@ async def test_mpt(mpt_sharded, response_snapshot):
assert response == response_snapshot assert response == response_snapshot
@pytest.mark.release
@pytest.mark.asyncio @pytest.mark.asyncio
async def test_mpt_load(mpt_sharded, generate_load, response_snapshot): async def test_mpt_load(mpt_sharded, generate_load, response_snapshot):
responses = await generate_load( responses = await generate_load(
......
...@@ -13,6 +13,7 @@ async def mt0_base(mt0_base_handle): ...@@ -13,6 +13,7 @@ async def mt0_base(mt0_base_handle):
return mt0_base_handle.client return mt0_base_handle.client
@pytest.mark.release
@pytest.mark.asyncio @pytest.mark.asyncio
async def test_mt0_base(mt0_base, response_snapshot): async def test_mt0_base(mt0_base, response_snapshot):
response = await mt0_base.generate( response = await mt0_base.generate(
...@@ -27,6 +28,7 @@ async def test_mt0_base(mt0_base, response_snapshot): ...@@ -27,6 +28,7 @@ async def test_mt0_base(mt0_base, response_snapshot):
assert response == response_snapshot assert response == response_snapshot
@pytest.mark.release
@pytest.mark.asyncio @pytest.mark.asyncio
async def test_mt0_base_all_params(mt0_base, response_snapshot): async def test_mt0_base_all_params(mt0_base, response_snapshot):
response = await mt0_base.generate( response = await mt0_base.generate(
...@@ -49,6 +51,7 @@ async def test_mt0_base_all_params(mt0_base, response_snapshot): ...@@ -49,6 +51,7 @@ async def test_mt0_base_all_params(mt0_base, response_snapshot):
assert response == response_snapshot assert response == response_snapshot
@pytest.mark.release
@pytest.mark.asyncio @pytest.mark.asyncio
async def test_mt0_base_load(mt0_base, generate_load, response_snapshot): async def test_mt0_base_load(mt0_base, generate_load, response_snapshot):
responses = await generate_load( responses = await generate_load(
......
...@@ -15,6 +15,7 @@ async def neox(neox_handle): ...@@ -15,6 +15,7 @@ async def neox(neox_handle):
return neox_handle.client return neox_handle.client
@pytest.mark.release
@pytest.mark.skip @pytest.mark.skip
@pytest.mark.asyncio @pytest.mark.asyncio
async def test_neox(neox, response_snapshot): async def test_neox(neox, response_snapshot):
...@@ -28,6 +29,7 @@ async def test_neox(neox, response_snapshot): ...@@ -28,6 +29,7 @@ async def test_neox(neox, response_snapshot):
assert response == response_snapshot assert response == response_snapshot
@pytest.mark.release
@pytest.mark.skip @pytest.mark.skip
@pytest.mark.asyncio @pytest.mark.asyncio
async def test_neox_load(neox, generate_load, response_snapshot): async def test_neox_load(neox, generate_load, response_snapshot):
......
...@@ -15,6 +15,7 @@ async def neox_sharded(neox_sharded_handle): ...@@ -15,6 +15,7 @@ async def neox_sharded(neox_sharded_handle):
return neox_sharded_handle.client return neox_sharded_handle.client
@pytest.mark.release
@pytest.mark.skip @pytest.mark.skip
@pytest.mark.asyncio @pytest.mark.asyncio
async def test_neox(neox_sharded, response_snapshot): async def test_neox(neox_sharded, response_snapshot):
...@@ -28,6 +29,7 @@ async def test_neox(neox_sharded, response_snapshot): ...@@ -28,6 +29,7 @@ async def test_neox(neox_sharded, response_snapshot):
assert response == response_snapshot assert response == response_snapshot
@pytest.mark.release
@pytest.mark.skip @pytest.mark.skip
@pytest.mark.asyncio @pytest.mark.asyncio
async def test_neox_load(neox_sharded, generate_load, response_snapshot): async def test_neox_load(neox_sharded, generate_load, response_snapshot):
......
...@@ -13,6 +13,7 @@ async def t5_sharded(t5_sharded_handle): ...@@ -13,6 +13,7 @@ async def t5_sharded(t5_sharded_handle):
return t5_sharded_handle.client return t5_sharded_handle.client
@pytest.mark.release
@pytest.mark.asyncio @pytest.mark.asyncio
async def test_t5_sharded(t5_sharded, response_snapshot): async def test_t5_sharded(t5_sharded, response_snapshot):
response = await t5_sharded.generate( response = await t5_sharded.generate(
...@@ -24,6 +25,7 @@ async def test_t5_sharded(t5_sharded, response_snapshot): ...@@ -24,6 +25,7 @@ async def test_t5_sharded(t5_sharded, response_snapshot):
assert response == response_snapshot assert response == response_snapshot
@pytest.mark.release
@pytest.mark.asyncio @pytest.mark.asyncio
async def test_t5_sharded_load(t5_sharded, generate_load, response_snapshot): async def test_t5_sharded_load(t5_sharded, generate_load, response_snapshot):
responses = await generate_load( responses = await generate_load(
......
Markdown is supported
0% Try again or attach a new file.
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment