mirror of
https://github.com/huggingface/text-generation-inference.git
synced 2025-09-10 11:54:52 +00:00
chore: fix typo in mpt_modeling.py
implemetation -> implementation
This commit is contained in:
parent
3ef5ffbc64
commit
a1cec743ee
@@ -297,7 +297,7 @@ def triton_flash_attn_fn(
|
|||||||
class MultiheadAttention(nn.Module):
|
class MultiheadAttention(nn.Module):
|
||||||
"""Multi-head self attention.
|
"""Multi-head self attention.
|
||||||
|
|
||||||
Using torch or triton attention implemetation enables user to also use
|
Using torch or triton attention implementation enables user to also use
|
||||||
additive bias.
|
additive bias.
|
||||||
"""
|
"""
|
||||||
|
|
||||||
@@ -386,7 +386,7 @@ class MultiheadAttention(nn.Module):
|
|||||||
class MultiQueryAttention(nn.Module):
|
class MultiQueryAttention(nn.Module):
|
||||||
"""Multi-Query self attention.
|
"""Multi-Query self attention.
|
||||||
|
|
||||||
Using torch or triton attention implemetation enables user to also use
|
Using torch or triton attention implementation enables user to also use
|
||||||
additive bias.
|
additive bias.
|
||||||
"""
|
"""
|
||||||
|
|
||||||
|
Loading…
Reference in New Issue
Block a user