Simplify available_blocks assignment logic (#6819)

This commit is contained in:
Jiang-Jia-Jun
2026-03-16 20:12:30 +08:00
committed by GitHub
parent 5c92f4d0cd
commit d113397b09
+1 -5
View File
@@ -842,11 +842,7 @@ class EngineService:
# In multimodal scenarios, use available_block_num when pulling requests to prevent heavy,
# frequent rescheduling caused by insufficient blocks
if self.cfg.model_config.enable_mm:
self.resource_manager.check_and_free_block_tables()
available_blocks = self.resource_manager.available_block_num()
else:
available_blocks = self.cfg.cache_config.max_block_num_per_seq
available_blocks = self.cfg.cache_config.max_block_num_per_seq
tasks = self.scheduler.get_requests(
available_blocks=available_blocks,