mirror of
https://github.com/PaddlePaddle/FastDeploy.git
synced 2026-04-23 00:17:25 +08:00
only update self.exist_prefill_task_signal in v0 (#6064)
* commit * commit * commit --------- Co-authored-by: xiaoluomi <1037819816@qq.com>
This commit is contained in:
@@ -542,7 +542,9 @@ class PaddleDisWorkerProc:
|
||||
# These generated tokens can be obtained through get_output op.
|
||||
start_execute_time = time.time()
|
||||
self.worker.execute_model(req_dicts, max_occupied_batch_index)
|
||||
self.exist_prefill_task_signal.value[0] = self.worker.exist_prefill()
|
||||
# Only v0 use this signal
|
||||
if not envs.ENABLE_V1_KVCACHE_SCHEDULER:
|
||||
self.exist_prefill_task_signal.value[0] = self.worker.exist_prefill()
|
||||
logger.debug(f"execute model cost: {time.time()-start_execute_time:.5f} s")
|
||||
|
||||
def initialize_kv_cache(self) -> None:
|
||||
|
||||
Reference in New Issue
Block a user