Revert "[Core] Rename PromptInputs to PromptType, and inputs to prompt" (#8750)

2024-09-23 22:45:20 -07:00
parent 0250dd68c5
commit 3185fb0cca
18 changed files with 162 additions and 157 deletions
--- a/vllm/engine/async_llm_engine.py
+++ b/vllm/engine/async_llm_engine.py
@@ -17,7 +17,7 @@ from vllm.engine.metrics_types import StatLoggerBase
 from vllm.executor.executor_base import ExecutorAsyncBase
 from vllm.executor.gpu_executor import GPUExecutorAsync
 from vllm.executor.ray_utils import initialize_ray_cluster
-from vllm.inputs import PromptType
+from vllm.inputs import PromptInputs
 from vllm.logger import init_logger
 from vllm.lora.request import LoRARequest
 from vllm.model_executor.layers.sampler import SamplerOutput
@@ -405,7 +405,7 @@ class _AsyncLLMEngine(LLMEngine):
    async def add_request_async(
        self,
        request_id: str,
-        prompt: PromptType,
+        inputs: PromptInputs,
        params: Union[SamplingParams, PoolingParams],
        arrival_time: Optional[float] = None,
        lora_request: Optional[LoRARequest] = None,
@@ -420,7 +420,7 @@ class _AsyncLLMEngine(LLMEngine):
            arrival_time = time.time()

        preprocessed_inputs = await self.input_preprocessor.preprocess_async(
-            prompt,
+            inputs,
            request_id=request_id,
            lora_request=lora_request,
            prompt_adapter_request=prompt_adapter_request,
@@ -777,7 +777,7 @@ class AsyncLLMEngine:
    async def add_request(
        self,
        request_id: str,
-        prompt: PromptType,
+        inputs: PromptInputs,
        params: Union[SamplingParams, PoolingParams],
        arrival_time: Optional[float] = None,
        lora_request: Optional[LoRARequest] = None,
@@ -797,7 +797,7 @@ class AsyncLLMEngine:
        stream = self._request_tracker.add_request(
            request_id,
            verbose=self.log_requests,
-            prompt=prompt,
+            inputs=inputs,
            params=params,
            arrival_time=arrival_time or time.time(),
            lora_request=lora_request,
@@ -808,7 +808,7 @@ class AsyncLLMEngine:

    async def generate(
        self,
-        prompt: PromptType,
+        inputs: PromptInputs,
        sampling_params: SamplingParams,
        request_id: str,
        lora_request: Optional[LoRARequest] = None,
@@ -822,7 +822,8 @@ class AsyncLLMEngine:
        from the LLMEngine to the caller.

        Args:
-            prompt: The prompt to the LLM. See :class:`~vllm.inputs.PromptType`
+            inputs: The inputs to the LLM. See
+                :class:`~vllm.inputs.PromptInputs`
                for more details about the format of each input.
            sampling_params: The sampling parameters of the request.
            request_id: The unique id of the request.
@@ -880,7 +881,7 @@ class AsyncLLMEngine:
        """
        async for output in await self.add_request(
                request_id,
-                prompt,
+                inputs,
                sampling_params,
                lora_request=lora_request,
                trace_headers=trace_headers,
@@ -890,7 +891,7 @@ class AsyncLLMEngine:

    async def encode(
        self,
-        prompt: PromptType,
+        inputs: PromptInputs,
        pooling_params: PoolingParams,
        request_id: str,
        lora_request: Optional[LoRARequest] = None,
@@ -903,7 +904,8 @@ class AsyncLLMEngine:
        from the LLMEngine to the caller.

        Args:
-            prompt: The prompt to the LLM. See :class:`~vllm.inputs.PromptType`
+            inputs: The inputs to the LLM. See
+                :class:`~vllm.inputs.PromptInputs`
                for more details about the format of each input.
            pooling_params: The pooling parameters of the request.
            request_id: The unique id of the request.
@@ -957,7 +959,7 @@ class AsyncLLMEngine:
        """
        async for output in await self.add_request(
                request_id,
-                prompt,
+                inputs,
                pooling_params,
                lora_request=lora_request,
                trace_headers=trace_headers,