mirror of
https://github.com/PaddlePaddle/FastDeploy.git
synced 2026-04-23 00:17:25 +08:00
[Optimization] Improve perf for fd response token with internal adapter (#4992)
* [Optimize] Improve perf for fd response token with internal adapter
* fix
* fix bug
* fix ci
* fix ci
* fix ci
* fix ci
This commit is contained in:
@@ -71,6 +71,7 @@ class MockScheduledResponse:
|
||||
def __init__(self, request_output):
    """Build a mock scheduled response from a request output.

    Copies ``request_id`` and ``finished`` from ``request_output`` onto
    this object.

    Args:
        request_output: Any object exposing ``request_id`` and
            ``finished`` attributes.
    """
    self.request_id = request_output.request_id
    self.finished = request_output.finished
    # The mock is its own ``raw`` payload.
    # NOTE(review): presumably so callers that read ``response.raw`` get
    # this object back -- confirm against the scheduler code under test.
    self.raw = self
|
||||
|
||||
|
||||
# Mock LocalScheduler base class
|
||||
@@ -93,6 +94,7 @@ class MockLocalScheduler:
|
||||
self.ids_read_cursor = 0
|
||||
self.requests_not_empty = threading.Condition()
|
||||
self.responses_not_empty = threading.Condition()
|
||||
self.batch_responses_per_step = list()
|
||||
|
||||
def calc_required_blocks(self, token_len, block_size):
    """Return how many blocks of ``block_size`` are needed for ``token_len``.

    Computes the ceiling of ``token_len / block_size`` using integer
    arithmetic, so a partially filled last block still counts as one.

    Args:
        token_len: Number of tokens to store.
        block_size: Capacity of one block; a value of 0 raises
            ``ZeroDivisionError``.

    Returns:
        ``(token_len + block_size - 1) // block_size``.
    """
    return (token_len + block_size - 1) // block_size
|
||||
|
||||
Reference in New Issue
Block a user