Update openai_api_server.py

Changed vllm’s gpu memory utilization
This commit is contained in:
Lao 2024-06-05 11:48:20 +08:00 committed by GitHub
parent d95f131b03
commit 205b7db3cc
No known key found for this signature in database
GPG Key ID: B5690EEEBB952194
1 changed files with 1 additions and 1 deletions

View File

@ -533,7 +533,7 @@ if __name__ == "__main__":
tensor_parallel_size=1,
dtype="bfloat16",
trust_remote_code=True,
gpu_memory_utilization=0.3,
gpu_memory_utilization=0.9,
enforce_eager=True,
worker_use_ray=True,
engine_use_ray=False,