mirror of
https://github.com/PaddlePaddle/FastDeploy.git
synced 2026-04-23 00:17:25 +08:00
router support divided rollout (#6150)
This commit is contained in:
@@ -73,6 +73,11 @@ void SwapCacheImpLayout(
|
||||
copy_kind,
|
||||
stream);
|
||||
|
||||
PADDLE_ENFORCE_EQ(status,
|
||||
cudaSuccess,
|
||||
phi::errors::External("cudaMemcpyAsync failed: %s",
|
||||
cudaGetErrorString(status)));
|
||||
|
||||
#ifdef SWAP_DEBUG
|
||||
cudaStreamSynchronize(stream);
|
||||
std::cout << "mode:" << mode << ", layer_idx:" << layer_idx
|
||||
@@ -81,7 +86,11 @@ void SwapCacheImpLayout(
|
||||
#endif
|
||||
}
|
||||
}
|
||||
cudaStreamSynchronize(stream);
|
||||
cudaError_t sync_status = cudaStreamSynchronize(stream);
|
||||
PADDLE_ENFORCE_EQ(sync_status,
|
||||
cudaSuccess,
|
||||
phi::errors::External("cudaStreamSynchronize failed: %s",
|
||||
cudaGetErrorString(sync_status)));
|
||||
}
|
||||
|
||||
void SwapCacheLayout(
|
||||
|
||||
Reference in New Issue
Block a user