Unverified commit bea23536, authored by Andreas Karatzas, committed by GitHub
Browse files

[CI] Add temperature=0.0, reduce max_tokens, and add debug prints to audio_in_video tests (#38492)


Signed-off-by: Andreas Karatzas <akaratza@amd.com>
parent c133f337
...@@ -64,11 +64,12 @@ async def test_online_audio_in_video( ...@@ -64,11 +64,12 @@ async def test_online_audio_in_video(
] ]
# multi-turn to test mm processor cache as well # multi-turn to test mm processor cache as well
for _ in range(2): for turn in range(2):
chat_completion = await client.chat.completions.create( chat_completion = await client.chat.completions.create(
model=MODEL_NAME, model=MODEL_NAME,
messages=messages, messages=messages,
max_tokens=16, max_tokens=8,
temperature=0.0,
extra_body={ extra_body={
"mm_processor_kwargs": { "mm_processor_kwargs": {
"use_audio_in_video": True, "use_audio_in_video": True,
...@@ -78,6 +79,12 @@ async def test_online_audio_in_video( ...@@ -78,6 +79,12 @@ async def test_online_audio_in_video(
assert len(chat_completion.choices) == 1 assert len(chat_completion.choices) == 1
choice = chat_completion.choices[0] choice = chat_completion.choices[0]
print(
f"[DEBUG][single-video] turn={turn} "
f"finish_reason={choice.finish_reason!r} "
f"content={choice.message.content!r} "
f"usage={chat_completion.usage}"
)
assert choice.finish_reason == "length" assert choice.finish_reason == "length"
...@@ -111,11 +118,12 @@ async def test_online_audio_in_video_multi_videos( ...@@ -111,11 +118,12 @@ async def test_online_audio_in_video_multi_videos(
] ]
# multi-turn to test mm processor cache as well # multi-turn to test mm processor cache as well
for _ in range(2): for turn in range(2):
chat_completion = await client.chat.completions.create( chat_completion = await client.chat.completions.create(
model=MODEL_NAME, model=MODEL_NAME,
messages=messages, messages=messages,
max_tokens=16, max_tokens=8,
temperature=0.0,
extra_body={ extra_body={
"mm_processor_kwargs": { "mm_processor_kwargs": {
"use_audio_in_video": True, "use_audio_in_video": True,
...@@ -125,6 +133,12 @@ async def test_online_audio_in_video_multi_videos( ...@@ -125,6 +133,12 @@ async def test_online_audio_in_video_multi_videos(
assert len(chat_completion.choices) == 1 assert len(chat_completion.choices) == 1
choice = chat_completion.choices[0] choice = chat_completion.choices[0]
print(
f"[DEBUG][multi-video] turn={turn} "
f"finish_reason={choice.finish_reason!r} "
f"content={choice.message.content!r} "
f"usage={chat_completion.usage}"
)
assert choice.finish_reason == "length" assert choice.finish_reason == "length"
......
Markdown is supported
0% or .
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment