[Optimization] Improve perf for fd response token with internal adapter (#4992)

* [Optimization] Improve perf for fd response token with internal adapter

* fix

* fix bug

* fix ci

* fix ci

* fix ci

* fix ci
This commit is contained in:
chenjian
2025-11-21 19:02:03 +08:00
committed by GitHub
parent 5bcf79d780
commit 3ea1b44a58
15 changed files with 202 additions and 67 deletions
+2
View File
@@ -69,6 +69,8 @@ class MockTask:
self.prefill_chunk_num = 0
self.pooling_params = None
self.llm_engine_recv_req_timestamp = time.time()
self.ic_req_data = {}
self.prompt_token_ids_len = 0
def get(self, key: str, default_value=None):
if hasattr(self, key):
@@ -63,6 +63,8 @@ class MockTask:
self.prefill_chunk_info = None
self.prefill_chunk_num = 0
self.llm_engine_recv_req_timestamp = time.time()
self.ic_req_data = {}
self.prompt_token_ids_len = 0
def get(self, key: str, default_value=None):
if hasattr(self, key):
@@ -38,6 +38,9 @@ class TestTokenProcessorLogprobs(unittest.TestCase):
self.task_mock.preprocess_end_time = 95.0
self.task_mock.preprocess_start_time = 90.0
self.task_mock.schedule_start_time = 95.0
self.task_mock.llm_engine_recv_req_timestamp = 95.0
self.task_mock.ic_req_data = {}
self.task_mock.prompt_token_ids_len = 0
self.processor.resource_manager.tasks_list = [self.task_mock]