mirror of
https://github.com/PaddlePaddle/FastDeploy.git
synced 2026-04-23 00:17:25 +08:00
[Metax][CI] e2e ci tests enable cuda graph (#6401)
This commit is contained in:
@@ -31,7 +31,7 @@ class TestErnie21B(unittest.TestCase):
|
||||
load_choices="default_v1",
|
||||
# enable_prefix_caching=False,
|
||||
disable_custom_all_reduce=True,
|
||||
graph_optimization_config={"use_cudagraph": False, "graph_opt_level": 0},
|
||||
# graph_optimization_config={"use_cudagraph": False, "graph_opt_level": 0},
|
||||
)
|
||||
|
||||
cls.sampling_params = fastdeploy.SamplingParams(top_p=0.95, max_tokens=256, temperature=0.6)
|
||||
|
||||
@@ -37,7 +37,7 @@ class TestErnie28BVL(unittest.TestCase):
|
||||
quantization="wint8",
|
||||
disable_custom_all_reduce=True,
|
||||
# enable_prefix_caching=False,
|
||||
graph_optimization_config={"use_cudagraph": False, "graph_opt_level": 0},
|
||||
# graph_optimization_config={"use_cudagraph": False, "graph_opt_level": 0},
|
||||
limit_mm_per_prompt={"image": 100},
|
||||
reasoning_parser="ernie-45-vl",
|
||||
load_choices="default_v1",
|
||||
|
||||
Reference in New Issue
Block a user