diff --git a/fastdeploy/entrypoints/openai/api_server.py b/fastdeploy/entrypoints/openai/api_server.py
index f7856086e8..3a79ab743d 100644
--- a/fastdeploy/entrypoints/openai/api_server.py
+++ b/fastdeploy/entrypoints/openai/api_server.py
@@ -660,6 +660,7 @@ def launch_api_server() -> None:
     api_server_logger.info(f"args: {args.__dict__}")
     # fd_start_span("FD_START")
 
+    # set control_socket_disable=True to avoid conflicts when running multiple instances
     options = {
         "bind": f"{args.host}:{args.port}",
         "workers": args.workers,
@@ -667,6 +668,7 @@ def launch_api_server() -> None:
         "loglevel": "info",
         "graceful_timeout": args.timeout_graceful_shutdown,
         "timeout": args.timeout,
+        "control_socket_disable": True,
     }
 
     try:
diff --git a/requirements.txt b/requirements.txt
index d3af47625c..b3ccc8475d 100644
--- a/requirements.txt
+++ b/requirements.txt
@@ -28,7 +28,7 @@ moviepy
 triton
 crcmod
 msgpack
-gunicorn==25.0.3
+gunicorn>=25.1.0
 modelscope
 safetensors>=0.7.0
 opentelemetry-api>=1.24.0