mirror of
https://github.com/huggingface/text-generation-inference.git
synced 2025-09-11 12:24:53 +00:00
Do not fail on missing moe-kernels (Intel-cpu).
This commit is contained in:
parent
b73aec7fa3
commit
b2a13b92f9
@@ -10,7 +10,11 @@ from text_generation_server.layers.fp8 import (
|
|||||||
quant_dtype,
|
quant_dtype,
|
||||||
normalize_e4m3fn_to_native_float8,
|
normalize_e4m3fn_to_native_float8,
|
||||||
)
|
)
|
||||||
from moe_kernels.fused_moe import fused_moe
|
|
||||||
|
try:
|
||||||
|
from moe_kernels.fused_moe import fused_moe
|
||||||
|
except Exception:
|
||||||
|
fused_moe = None
|
||||||
|
|
||||||
|
|
||||||
class FP8SparseMoELayer(nn.Module):
|
class FP8SparseMoELayer(nn.Module):
|
||||||
|
Loading…
Reference in New Issue
Block a user