[Other] Adjust GPUModelRunner to enhance compatibility (#6851)

This commit is contained in:
ming1753
2026-03-16 14:49:19 +08:00
committed by GitHub
parent 04fde3b227
commit bb925c605f
25 changed files with 224 additions and 248 deletions
@@ -326,7 +326,6 @@ class AppendAttentionBackend(AttentionBackend):
cache_v_scales = getattr(layer, "cache_v_scale", None)
if layer.layer_id == 0:
# print(forward_meta.seq_lens_this_time)
get_block_shape_and_split_kv_block(
forward_meta.seq_lens_encoder,
forward_meta.seq_lens_decoder,