mirror of
https://github.com/huggingface/text-generation-inference.git
synced 2025-06-19 15:52:08 +00:00
Fix crash
Signed-off-by: yuanwu <yuan.wu@intel.com>
This commit is contained in:
parent
512eca7f8f
commit
91c40e6c58
@ -185,7 +185,6 @@ class Qwen3MoeAttention(nn.Module):
|
|||||||
seqlen=seqlen,
|
seqlen=seqlen,
|
||||||
softmax_scale=self.scaling,
|
softmax_scale=self.scaling,
|
||||||
window_size_left=self.max_past,
|
window_size_left=self.max_past,
|
||||||
num_key_value_groups=self.num_key_value_groups,
|
|
||||||
)
|
)
|
||||||
# Decode
|
# Decode
|
||||||
else:
|
else:
|
||||||
|
Loading…
Reference in New Issue
Block a user