mirror of
https://github.com/huggingface/text-generation-inference.git
synced 2025-05-24 04:22:10 +00:00
Fix the crash in default ATTENTION path for Gaudi backend (#3235)
Signed-off-by: Wang, Yi A <yi.a.wang@intel.com>
This commit is contained in:
parent
000e313a92
commit
43b1b07fb9
@ -31,6 +31,7 @@ def main(args):
|
|||||||
trust_remote_code=args.trust_remote_code,
|
trust_remote_code=args.trust_remote_code,
|
||||||
uds_path=args.uds_path,
|
uds_path=args.uds_path,
|
||||||
max_input_tokens=args.max_input_tokens,
|
max_input_tokens=args.max_input_tokens,
|
||||||
|
kv_cache_dtype="auto",
|
||||||
)
|
)
|
||||||
|
|
||||||
|
|
||||||
|
Loading…
Reference in New Issue
Block a user