From 1683d673d26a5ca7a82646c22e22ec9d431453e8 Mon Sep 17 00:00:00 2001 From: zR <2448370773@qq.com> Date: Thu, 6 Jun 2024 10:14:15 +0800 Subject: [PATCH] fix #60 and #51 --- basic_demo/openai_api_server.py | 3 +-- 1 file changed, 1 insertion(+), 2 deletions(-) diff --git a/basic_demo/openai_api_server.py b/basic_demo/openai_api_server.py index 806d59e..6d8499c 100644 --- a/basic_demo/openai_api_server.py +++ b/basic_demo/openai_api_server.py @@ -314,7 +314,7 @@ async def create_chat_completion(request: ChatCompletionRequest): if request.stream: predict_stream_generator = predict_stream(request.model, gen_params) output = await anext(predict_stream_generator) - if not output and 'get_' in output: + if output: return EventSourceResponse(predict_stream_generator, media_type="text/event-stream") logger.debug(f"First result output:\n{output}") @@ -535,7 +535,6 @@ if __name__ == "__main__": engine_args = AsyncEngineArgs( model=MODEL_PATH, tokenizer=MODEL_PATH, - tokenizer_mode="slow", tensor_parallel_size=1, dtype="bfloat16", trust_remote_code=True,