[BugFix] fix cpu prefix cache bug (#5544)
CE Compile Job / ce_job_pre_check (push) Has been cancelled
CE Compile Job / print_ce_job_pre_check_outputs (push) Has been cancelled
CE Compile Job / FD-Clone-Linux (push) Has been cancelled
CE Compile Job / Show Code Archive Output (push) Has been cancelled
CE Compile Job / BUILD_SM8090 (push) Has been cancelled
CE Compile Job / BUILD_SM8689 (push) Has been cancelled
CE Compile Job / CE_UPLOAD (push) Has been cancelled
Deploy GitHub Pages / deploy (push) Has been cancelled

* fix_dy_c8_bug

* add block_num check

* fix test case

* update ci case
This commit is contained in:
kevin
2025-12-16 14:21:42 +08:00
committed by GitHub
parent 5d2b16e6f3
commit c9b47f90ce
5 changed files with 23 additions and 8 deletions
+3 -2
View File
@@ -253,8 +253,9 @@ class TestCommonEngineAdditionalCoverage(unittest.TestCase):
with patch("fastdeploy.engine.args_utils.envs.ENABLE_V1_KVCACHE_SCHEDULER", 0):
cfg = self._make_cfg(
splitwise_role="prefill",
-num_gpu_blocks_override=3,
+num_gpu_blocks_override=4,
 router="0.0.0.0:30000",
+kv_cache_ratio=1,
)
# Patch EngineWorkerQueue before EngineService ctor to avoid real IPC
@@ -337,7 +338,7 @@ class TestCommonEngineAdditionalCoverage(unittest.TestCase):
def test_start_mixed_branch_cache_after_load_and_zmq(self):
"""Cover lines 215-217 and 231 in start()."""
-cfg = self._make_cfg(splitwise_role="mixed", num_gpu_blocks_override=2)
+cfg = self._make_cfg(splitwise_role="mixed", num_gpu_blocks_override=4)
class DummyQ:
def __init__(self, *a, **k):