【Hackathon 9th No.86】autogen MultiQueryDecoderAttention template_instantiation -part (#4383)

* split MultiQueryDecoderAttention template_instantiation

* update comment

* CI
This commit is contained in:
Zhenghai Zhang
2025-10-16 17:08:19 +08:00
committed by GitHub
parent f72be7a2c8
commit 6adfbe07ad
27 changed files with 3975 additions and 3836 deletions
+2
View File
@@ -353,6 +353,8 @@ elif paddle.is_compiled_with_cuda():
"-Igpu_ops",
"-Ithird_party/nlohmann_json/include",
]
# Ask nvcc to execute its compilation steps in parallel via the "-t" flag.
# os.cpu_count() returns None when the CPU count cannot be determined; fall
# back to a single thread so the flag never becomes the literal string "None".
worker_threads = os.cpu_count() or 1
nvcc_compile_args += ["-t", str(worker_threads)]
# NOTE(review): "-t/--threads" appears to require a reasonably recent nvcc
# (presumably CUDA 11.2+); the flag is appended before the version is
# queried below — confirm the minimum supported toolkit.
nvcc_version = get_nvcc_version()
print(f"nvcc_version = {nvcc_version}")