mirror of
https://github.com/PaddlePaddle/FastDeploy.git
synced 2026-04-23 00:17:25 +08:00
fix fa4 test (#6408)
This commit is contained in:
@@ -118,9 +118,9 @@ def flash_attn_func(
|
||||
head_dim: int = 128,
|
||||
version: Optional[int] = None,
|
||||
):
|
||||
if FLASH_ATTN_VERSION is None:
|
||||
init_flash_attn_version()
|
||||
if version is None:
|
||||
if FLASH_ATTN_VERSION is None:
|
||||
init_flash_attn_version()
|
||||
version = FLASH_ATTN_VERSION
|
||||
if version == 4:
|
||||
assert (
|
||||
|
||||
Reference in New Issue
Block a user