from scripts.inference import inference_once import time # model_path = "mtgv/MobileVLM-1.7B" # MobileVLM model_path = "mtgv/MobileVLM_V2-1.7B" # MobileVLM V2 image_file = "assets/samples/demo.jpg" prompt_str = "Who is the author of this book?\nAnswer the question using a single word or phrase." # (or) What is the title of this book? # (or) Is this book related to Education & Teaching? args = type('Args', (), { "model_path": model_path, "image_file": image_file, "prompt": prompt_str, "conv_mode": "v1", "temperature": 0, "top_p": None, "num_beams": 1, "max_new_tokens": 512, "load_8bit": False, "load_4bit": False, })() start_time = time.time() inference_once(args) print("infer time:", time.time() - start_time, "秒")