mirror of
https://github.com/PaddlePaddle/FastDeploy.git
synced 2026-04-23 00:17:25 +08:00
[CI] Fix tests and docs to resolve failure (#6572)
This commit is contained in:
@@ -1,4 +1,4 @@
|
||||
[English](../../best_practices/DeepSeek-V3-V3.1.md)
|
||||
[English](../../best_practices/DeepSeek-V3.md)
|
||||
|
||||
# DeepSeek-V3/V3.1 模型
|
||||
|
||||
|
||||
@@ -37,12 +37,6 @@ from e2e.utils.serving_utils import (
|
||||
os.environ.setdefault("DG_NVCC_OVERRIDE_CPP_STANDARD", "17")
|
||||
|
||||
W4AFP8_CONFIGS = [
|
||||
{
|
||||
"id": "w4afp8_default_v1",
|
||||
"load_choices": "default_v1",
|
||||
"model_name": "ernie-4_5-21b-a3b-bf16-paddle",
|
||||
"model_subdir": None,
|
||||
},
|
||||
{
|
||||
"id": "w4afp8_default_v1",
|
||||
"load_choices": "default_v1",
|
||||
|
||||
@@ -1540,7 +1540,7 @@ class TestFastDeployBatch(unittest.TestCase):
|
||||
|
||||
def test_completions(self):
|
||||
"""测试正常的批量chat请求"""
|
||||
return_code, contents, proc = self.run_fastdeploy_command(INPUT_BATCH, port="2235")
|
||||
return_code, contents, proc = self.run_fastdeploy_command(INPUT_BATCH, port=str(FD_CACHE_QUEUE_PORT))
|
||||
print(f"进程输出: {return_code}")
|
||||
|
||||
self.assertEqual(return_code, 0, f"进程返回非零码: {return_code}, 进程信息: {proc}")
|
||||
|
||||
Reference in New Issue
Block a user