Fix vLLM CPU /chat endpoint (#11748)

2024-08-09 10:33:52 +08:00 · 2024-08-09 10:33:52 +08:00 · 044e486480
commit 044e486480
parent 27b4b104ed
1 changed file with 0 additions and 1 deletion
--- a/python/llm/src/ipex_llm/vllm/cpu/entrypoints/openai/api_server.py
+++ b/python/llm/src/ipex_llm/vllm/cpu/entrypoints/openai/api_server.py
@@ -114,7 +114,6 @@ async def create_chat_completion(request: ChatCompletionRequest,
        return StreamingResponse(content=generator,
                                 media_type="text/event-stream")
    else:
        invalidInputError(isinstance(generator, ChatCompletionResponse))
        return JSONResponse(content=generator.model_dump())