mirror of
https://github.com/PaddlePaddle/FastDeploy.git
synced 2026-04-23 00:17:25 +08:00
FA3 support qwen3 (#5441)
This commit is contained in:
@@ -190,6 +190,7 @@ std::vector<paddle::Tensor> GQARopeWriteCacheKernel(
|
||||
const int kv_token_num,
|
||||
const int max_seq_len,
|
||||
const float rms_norm_eps,
|
||||
const bool use_neox_rotary_style,
|
||||
const std::string& cache_quant_type,
|
||||
const bool rope_3d);
|
||||
|
||||
|
||||
Reference in New Issue
Block a user