Fix typing in AsyncLLMEngine & add toml to requirements-dev (#2100)

6774bd50 · mezuzza · GitHub · 31c1f325 · 6774bd50 · 6774bd50
Unverified commit 6774bd50, authored by mezuzza on Dec 14, 2023; committed by GitHub on Dec 14, 2023.
Hide whitespace changes
Inline Side-by-side

Showing 2 changed files with 8 additions and 6 deletions

requirements-dev.txt requirements-dev.txt +1 -0

vllm/engine/async_llm_engine.py vllm/engine/async_llm_engine.py +7 -6

No files found.
--- a/requirements-dev.txt
+++ b/requirements-dev.txt
 # formatting
 yapf==0.32.0
+toml==0.10.2
 ruff==0.1.5

 # type checking

--- a/vllm/engine/async_llm_engine.py
+++ b/vllm/engine/async_llm_engine.py
@@ -2,7 +2,7 @@ import asyncio
 import time
 from functools import partial
 from typing import (Any, Dict, Iterable, List, Optional, Set, Tuple, Type,
-                    Union)
+                    Union, AsyncIterator)

 from vllm.config import ModelConfig
 from vllm.engine.arg_utils import AsyncEngineArgs
@@ -401,11 +401,12 @@ class AsyncLLMEngine:
        return stream

    async def generate(
-            self,
-            prompt: Optional[str],
-            sampling_params: SamplingParams,
-            request_id: str,
-            prompt_token_ids: Optional[List[int]] = None) -> RequestOutput:
+        self,
+        prompt: Optional[str],
+        sampling_params: SamplingParams,
+        request_id: str,
+        prompt_token_ids: Optional[List[int]] = None
+    ) -> AsyncIterator[RequestOutput]:
        """Generate outputs for a request.

        Generate outputs for a request. This method is a coroutine. It adds the