mirror of
https://github.com/PaddlePaddle/FastDeploy.git
synced 2026-04-23 00:17:25 +08:00
Simplify available_blocks assignment logic (#6819)
This commit is contained in:
@@ -842,11 +842,7 @@ class EngineService:
|
||||
|
||||
# In multimodal scenarios, use available_block_num when pulling requests to prevent frequent
|
||||
# heavy rescheduling caused by insufficient blocks
|
||||
if self.cfg.model_config.enable_mm:
|
||||
self.resource_manager.check_and_free_block_tables()
|
||||
available_blocks = self.resource_manager.available_block_num()
|
||||
else:
|
||||
available_blocks = self.cfg.cache_config.max_block_num_per_seq
|
||||
available_blocks = self.cfg.cache_config.max_block_num_per_seq
|
||||
|
||||
tasks = self.scheduler.get_requests(
|
||||
available_blocks=available_blocks,
|
||||
|
||||
Reference in New Issue
Block a user