mirror of
https://github.com/PaddlePaddle/FastDeploy.git
synced 2026-04-23 17:11:21 +08:00
native top_p_sampling (#2901)
This commit is contained in:
@@ -20,7 +20,7 @@ import paddle
 
 from fastdeploy.platforms import current_platform
 
-if current_platform.is_cuda() and not current_platform.is_dcu():
+if current_platform.is_cuda():
     from fastdeploy.model_executor.ops.gpu import (
         append_attention as append_attention_gpu,
     )
Reference in New Issue
Block a user