mirror of
https://github.com/huggingface/text-generation-inference.git
synced 2025-06-19 07:42:06 +00:00
Fix crash
Signed-off-by: yuanwu <yuan.wu@intel.com>
This commit is contained in:
parent
512eca7f8f
commit
91c40e6c58
@ -185,7 +185,6 @@ class Qwen3MoeAttention(nn.Module):
|
||||
seqlen=seqlen,
|
||||
softmax_scale=self.scaling,
|
||||
window_size_left=self.max_past,
|
||||
num_key_value_groups=self.num_key_value_groups,
|
||||
)
|
||||
# Decode
|
||||
else:
|
||||
|
Loading…
Reference in New Issue
Block a user