mirror of
https://github.com/PaddlePaddle/FastDeploy.git
synced 2026-04-23 17:11:21 +08:00
WINT4/WINT8 dense gemm default use Machete (#4451)
This commit is contained in:
@@ -167,7 +167,7 @@ def machete_quantize_and_pack(
|
||||
atype,
|
||||
quant_type,
|
||||
scale_type,
|
||||
)[0]
|
||||
)
|
||||
return w_q_prepack, w_s
|
||||
|
||||
|
||||
@@ -194,5 +194,5 @@ def machete_wint_mm(
|
||||
out_dtype, # out_dtype
|
||||
group_size, # group_size
|
||||
scheduler, # scheduler
|
||||
)[0]
|
||||
)
|
||||
return out
|
||||
|
||||
Reference in New Issue
Block a user