mirror of
https://github.com/PaddlePaddle/FastDeploy.git
synced 2026-04-23 00:17:25 +08:00
[BugFix] fix multi-step mtp bug (#6754)
This commit is contained in:
@@ -541,7 +541,6 @@ class TestResourceManagerV1Additional(unittest.TestCase):
|
||||
manager.cache_manager.get_required_block_num.return_value = 0
|
||||
success = manager.get_prefix_cached_blocks(request)
|
||||
self.assertTrue(success)
|
||||
self.assertTrue(request.skip_allocate)
|
||||
self.assertEqual(request.num_cached_tokens, 8)
|
||||
self.assertEqual(request.metrics.gpu_cache_token_num, 4)
|
||||
self.assertEqual(request.metrics.cpu_cache_token_num, 0)
|
||||
|
||||
Reference in New Issue
Block a user