mirror of
https://github.com/huggingface/text-generation-inference.git
synced 2025-09-11 04:14:52 +00:00
Remove outdated TODO
This commit is contained in:
parent
df582a1842
commit
fc3ac8075b
@ -23,7 +23,6 @@ else:
|
||||
quantization = None
|
||||
|
||||
try:
|
||||
# TODO: needs to be ported over to MoE and used on CUDA.
|
||||
from moe_kernels.fp8_utils import w8a8_block_fp8_matmul, per_token_group_quant_fp8
|
||||
except ImportError:
|
||||
w8a8_block_fp8_matmul = None
|
||||
|
Loading…
Reference in New Issue
Block a user