mirror of
https://github.com/PaddlePaddle/FastDeploy.git
synced 2026-04-23 00:17:25 +08:00
Split enable_mm (#7183)
Co-authored-by: liuruian <liuruian@MacBook-Pro.local>
This commit is contained in:
@@ -92,6 +92,7 @@ class MockFDConfig:
|
||||
model_config = MockModelConfig()
|
||||
cache_config = MockCacheConfig()
|
||||
speculative_config = MockSpecaulativeConfig()
|
||||
+ enable_mm_runtime = MockModelConfig.enable_mm
|
||||
|
||||
def get_max_chunk_tokens(self, mm_max_tokens_per_item=None):
|
||||
return 8192
|
||||
@@ -139,7 +140,7 @@ class TestChunkedMoE(unittest.TestCase):
|
||||
model_runner.model_config = mock_model_config
|
||||
model_runner.cache_config = mock_cache_config
|
||||
model_runner.attn_backends = [MockAttentionBackend()]
|
||||
- model_runner.enable_mm = True
|
||||
+ model_runner.enable_mm = mock_fd_config.enable_mm_runtime
|
||||
model_runner.cudagraph_only_prefill = False
|
||||
model_runner.use_cudagraph = False
|
||||
model_runner.speculative_decoding = False
|
||||
|
||||
Reference in New Issue
Block a user