Fix typing in AsyncLLMEngine & add toml to requirements-dev (#2100)

2023-12-14 03:19:41 -05:00 · 2023-12-14 03:19:41 -05:00 · 6774bd50b0
commit 6774bd50b0
parent 31c1f3255e
2 changed files with 8 additions and 6 deletions
--- a/requirements-dev.txt
+++ b/requirements-dev.txt
@@ -1,5 +1,6 @@
 # formatting
 yapf==0.32.0
+toml==0.10.2
 ruff==0.1.5
 # type checking
--- a/vllm/engine/async_llm_engine.py
+++ b/vllm/engine/async_llm_engine.py
@@ -2,7 +2,7 @@ import asyncio
 import time
 from functools import partial
 from typing import (Any, Dict, Iterable, List, Optional, Set, Tuple, Type,
-                    Union)
+                    Union, AsyncIterator)
 from vllm.config import ModelConfig
 from vllm.engine.arg_utils import AsyncEngineArgs
@@ -405,7 +405,8 @@ class AsyncLLMEngine:
        prompt: Optional[str],
        sampling_params: SamplingParams,
        request_id: str,
-            prompt_token_ids: Optional[List[int]] = None) -> RequestOutput:
+        prompt_token_ids: Optional[List[int]] = None
+    ) -> AsyncIterator[RequestOutput]:
        """Generate outputs for a request.
        Generate outputs for a request. This method is a coroutine. It adds the