mirror of
https://github.com/huggingface/text-generation-inference.git
synced 2025-09-11 04:14:52 +00:00
Remove outdated TODO
This commit is contained in:
parent
df582a1842
commit
fc3ac8075b
@ -23,7 +23,6 @@ else:
|
|||||||
quantization = None
|
quantization = None
|
||||||
|
|
||||||
try:
|
try:
|
||||||
# TODO: needs to be ported over to MoE and used on CUDA.
|
|
||||||
from moe_kernels.fp8_utils import w8a8_block_fp8_matmul, per_token_group_quant_fp8
|
from moe_kernels.fp8_utils import w8a8_block_fp8_matmul, per_token_group_quant_fp8
|
||||||
except ImportError:
|
except ImportError:
|
||||||
w8a8_block_fp8_matmul = None
|
w8a8_block_fp8_matmul = None
|
||||||
|
Loading…
Reference in New Issue
Block a user