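[Bugfix] Fix broken vision language example (#14292)

Wrap each question's chat message in its own list so that
`tokenizer.apply_chat_template` receives one conversation per question
(a list of conversations) rather than a single flat list of messages.
`run_mllama` and `run_nvlm_d` previously passed the flat list; `run_h2ovl`
and `run_internvl` now build the same nested `messages` list and make one
batched call instead of calling the template once per question.

Signed-off-by: Isotr0py <2037008807@qq.com>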

[Bugfix] Fix broken vision language example (#14292)
Signed-off-by: Isotr0py <2037008807@qq.com>
f71b00a1 · Isotr0py · GitHub · 8f808cf8 · f71b00a1
Unverified commit f71b00a1 — authored Mar 05, 2025 by Isotr0py; committed by GitHub Mar 05, 2025
Show whitespace changes
Inline Side-by-side

Showing 1 changed file with 18 additions and 22 deletions

examples/offline_inference/vision_language.py (+18 -22)

No files found.
--- a/examples/offline_inference/vision_language.py
+++ b/examples/offline_inference/vision_language.py
@@ -152,15 +152,13 @@ def run_h2ovl(questions: list[str], modality: str):
    tokenizer = AutoTokenizer.from_pretrained(model_name,
                                              trust_remote_code=True)
-    prompts = [
+    messages = [[{
-        tokenizer.apply_chat_template([{
        'role': 'user',
        'content': f"<image>\n{question}"
-        }],
+    }] for question in questions]
+    prompts = tokenizer.apply_chat_template(messages,
                                            tokenize=False,
                                            add_generation_prompt=True)
-        for question in questions
-    ]
    # Stop tokens for H2OVL-Mississippi
    # https://huggingface.co/h2oai/h2ovl-mississippi-800m
@@ -209,15 +207,13 @@ def run_internvl(questions: list[str], modality: str):
    tokenizer = AutoTokenizer.from_pretrained(model_name,
                                              trust_remote_code=True)
-    prompts = [
+    messages = [[{
-        tokenizer.apply_chat_template([{
        'role': 'user',
        'content': f"<image>\n{question}"
-        }],
+    }] for question in questions]
+    prompts = tokenizer.apply_chat_template(messages,
                                            tokenize=False,
                                            add_generation_prompt=True)
-        for question in questions
-    ]
    # Stop tokens for InternVL
    # models variants may have different stop tokens
@@ -399,7 +395,7 @@ def run_mllama(questions: list[str], modality: str):
    )
    tokenizer = AutoTokenizer.from_pretrained(model_name)
-    messages = [{
+    messages = [[{
        "role":
        "user",
        "content": [{
@@ -408,7 +404,7 @@ def run_mllama(questions: list[str], modality: str):
            "type": "text",
            "text": f"{question}"
        }]
-    } for question in questions]
+    }] for question in questions]
    prompts = tokenizer.apply_chat_template(messages,
                                            add_generation_prompt=True,
                                            tokenize=False)
@@ -454,10 +450,10 @@ def run_nvlm_d(questions: list[str], modality: str):
    tokenizer = AutoTokenizer.from_pretrained(model_name,
                                              trust_remote_code=True)
-    messages = [{
+    messages = [[{
        'role': 'user',
        'content': f"<image>\n{question}"
-    } for question in questions]
+    }] for question in questions]
    prompts = tokenizer.apply_chat_template(messages,
                                            tokenize=False,
                                            add_generation_prompt=True)