【Hackathon 9th No.86】autogen MultiQueryDecoderAttention template_instantiation -part (#4383)

* split MultiQueryDecoderAttention template_instantiation * update comment * CI
2026-04-23 00:17:25 +08:00 · 2025-10-16 17:08:19 +08:00
parent f72be7a2c8
commit 6adfbe07ad
27 changed files with 3975 additions and 3836 deletions
@@ -353,6 +353,8 @@ elif paddle.is_compiled_with_cuda():
        "-Igpu_ops",
        "-Ithird_party/nlohmann_json/include",
    ]
+    worker_threads = os.cpu_count()
+    nvcc_compile_args += ["-t", str(worker_threads)]

    nvcc_version = get_nvcc_version()
    print(f"nvcc_version = {nvcc_version}")