mirror of
https://github.com/PaddlePaddle/FastDeploy.git
synced 2026-04-23 00:17:25 +08:00
[Speculative Decoding] Optimize draft logprob (#5842)
* Optimize draft logprob
* Fix unit test
This commit is contained in:
@@ -740,6 +740,8 @@ class SpeculativeConfig:
|
||||
|
||||
self.num_extra_cache_layer = 0
|
||||
|
||||
self.enable_draft_logprob: bool = False
|
||||
|
||||
for key, value in args.items():
|
||||
if hasattr(self, key):
|
||||
setattr(self, key, value)
|
||||
|
||||
Reference in New Issue
Block a user