mirror of
https://github.com/PaddlePaddle/FastDeploy.git
synced 2026-04-23 00:17:25 +08:00
39dc4b0c2e
* fix(examples): comment out stop.sh to avoid error when script is missing * feat: add file_store support for cache manager * [fix] fix multi gpu transfer * [fix] fix global kvcache transfer * [Feature] [KVCache] support file_store kv cache backend * chore: update FileStore according to PR comments * fix: remove comments * fix: add swap_cache_layout for file store * fix: remove rank key * fix: Switch KV cache storage to pure file mode * Temporarily disable support for Tensor types * fix: remove args --kvcache_file_path & add envs FILE_BACKEND_STORAGE_DIR * fixx: Simplify cache_transfer_manager.py * fix: fix syntax bug * fix: Simplify file_store.py * fix: Use the key directly as the filename * fix: Simplify set() * fix: Simplify cache_transfer_manager.py & file_store.py * fix: Only support load to cpu buffer * feat: add FileStore backend for cache transfer * fix: guard zmq import
38 lines
1.1 KiB
Python
38 lines
1.1 KiB
Python
"""
|
|
# Copyright (c) 2025 PaddlePaddle Authors. All Rights Reserved.
|
|
#
|
|
# Licensed under the Apache License, Version 2.0 (the "License");
|
|
# you may not use this file except in compliance with the License.
|
|
# You may obtain a copy of the License at
|
|
#
|
|
# http://www.apache.org/licenses/LICENSE-2.0
|
|
#
|
|
# Unless required by applicable law or agreed to in writing, software
|
|
# distributed under the License is distributed on an "AS IS" BASIS,
|
|
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
|
# See the License for the specific language governing permissions and
|
|
# limitations under the License.
|
|
"""
|
|
|
|
from fastdeploy.platforms import current_platform
|
|
|
|
from .file_store import FileStore
|
|
from .kvcache_storage import KVCacheStorage
|
|
from .mooncake_store import AttentionStore, MooncakeStore
|
|
from .rdma_cache_transfer import RDMACommManager
|
|
|
|
# The IPC transfer manager is imported only when the current platform reports
# CUDA; on every other platform the name is bound to None so that it still
# exists at package level (it is listed in `__all__`).
# NOTE(review): presumably the IPC module needs CUDA-only functionality --
# confirm against ipc_cache_transfer.
if not current_platform.is_cuda():
    IPCCommManager = None
else:
    from .ipc_cache_transfer import IPCCommManager
|
|
|
|
|
|
# Public names re-exported by this package.
__all__ = [
    # Communication managers (from the *_cache_transfer modules).
    # "IPCCommManager" may be bound to None when the platform is not CUDA.
    "IPCCommManager",
    "RDMACommManager",
    # Storage classes (from kvcache_storage, mooncake_store and file_store).
    "KVCacheStorage",
    "MooncakeStore",
    "AttentionStore",
    "FileStore",
]
|