diff --git a/docs/zh/best_practices/DeepSeek-V3.md b/docs/zh/best_practices/DeepSeek-V3.md index e8907132c3..ad0dc38b07 100644 --- a/docs/zh/best_practices/DeepSeek-V3.md +++ b/docs/zh/best_practices/DeepSeek-V3.md @@ -1,4 +1,4 @@ -[English](../../best_practices/DeepSeek-V3-V3.1.md) +[English](../../best_practices/DeepSeek-V3.md) # DeepSeek-V3/V3.1 模型 diff --git a/tests/ci_use/w4afp8/test_moe_w4afp8_online_quant.py b/tests/ci_use/w4afp8/test_moe_w4afp8_online_quant.py index acff7fc548..bd2edbf84d 100644 --- a/tests/ci_use/w4afp8/test_moe_w4afp8_online_quant.py +++ b/tests/ci_use/w4afp8/test_moe_w4afp8_online_quant.py @@ -37,12 +37,6 @@ from e2e.utils.serving_utils import ( os.environ.setdefault("DG_NVCC_OVERRIDE_CPP_STANDARD", "17") W4AFP8_CONFIGS = [ - { - "id": "w4afp8_default_v1", - "load_choices": "default_v1", - "model_name": "ernie-4_5-21b-a3b-bf16-paddle", - "model_subdir": None, - }, { "id": "w4afp8_default_v1", "load_choices": "default_v1", diff --git a/tests/entrypoints/openai/test_run_batch.py b/tests/entrypoints/openai/test_run_batch.py index 22b8f2f925..50410ccf23 100644 --- a/tests/entrypoints/openai/test_run_batch.py +++ b/tests/entrypoints/openai/test_run_batch.py @@ -1540,7 +1540,7 @@ class TestFastDeployBatch(unittest.TestCase): def test_completions(self): """测试正常的批量chat请求""" - return_code, contents, proc = self.run_fastdeploy_command(INPUT_BATCH, port="2235") + return_code, contents, proc = self.run_fastdeploy_command(INPUT_BATCH, port=str(FD_CACHE_QUEUE_PORT)) print(f"进程输出: {return_code}") self.assertEqual(return_code, 0, f"进程返回非零码: {return_code}, 进程信息: {proc}")