FastDeploy

mirror of https://github.com/PaddlePaddle/FastDeploy.git synced 2026-05-01 12:56:36 +08:00

Files

T

bukejiyu 598cce8545 [RL] Support SM100 FP8 quantization in RL (#6601)

* RL SM100 Fix

* update

2026-03-04 04:55:04 -08:00

__init__.py

2025-08-25 11:27:45 +08:00

ep.py

2026-03-02 10:35:51 +08:00

fused_moe_backend_base.py

2026-01-09 17:13:24 +08:00

fused_moe_cutlass_backend.py

2026-03-02 14:07:17 +08:00

fused_moe_deepgemm_backend.py

2026-03-03 11:32:35 +08:00

fused_moe_marlin_backend.py

2026-02-26 21:08:46 -08:00

fused_moe_triton_backend.py

2026-03-04 04:55:04 -08:00

fused_moe_wint2_backend.py

2026-02-08 22:42:36 -08:00

moe.py

2026-02-08 22:42:36 -08:00

routing_indices_cache.py

2026-02-03 04:13:16 -08:00

triton_moe_kernels.py

2025-09-24 16:39:51 +08:00