mirror of
https://github.com/PaddlePaddle/FastDeploy.git
synced 2026-04-23 00:17:25 +08:00
[Optimization] Update Deepseekv3.2 model and dsa-indexer networking and add some unit tests (#6762)
* add deepseek model doc * update deepseek model doc * update deepseek model doc * update deepseek model doc * cwb support DSK_V32 Model * update DSK_V32_DSA modeling * Ibin Support DSK_DSA * update kernel * update yaml * update requirements * update pre_commit * update model-runner * fix CI bug * del start.sh * fix iluvatar_model_runner * update DSA & add unit tests * update import deep_gemm
This commit is contained in:
@@ -75,7 +75,7 @@ void RadixTopkRaggedTransform(
|
||||
unsigned int num_rows = input.dims()[0];
|
||||
unsigned int max_len = input.dims()[1];
|
||||
|
||||
static cudaStream_t stream = input.stream();
|
||||
cudaStream_t stream = input.stream();
|
||||
cudaError_t status;
|
||||
auto input_dtype = input.dtype();
|
||||
|
||||
@@ -129,6 +129,8 @@ void RadixTopkRaggedTransform(
|
||||
max_len,
|
||||
row_states_ptr,
|
||||
stream);
|
||||
} else {
|
||||
PD_THROW("input_dtype should be one of [bf16, float]");
|
||||
}
|
||||
}
|
||||
|
||||
|
||||
Reference in New Issue
Block a user