..
attention
fix(gaudi): refactor server and implement requested changes
2025-02-27 12:59:28 +00:00
awq
wip(gaudi): import server and dockerfile from tgi-gaudi fork
2025-02-25 12:08:42 +00:00
gptq
wip(gaudi): import server and dockerfile from tgi-gaudi fork
2025-02-25 12:08:42 +00:00
marlin
wip(gaudi): import server and dockerfile from tgi-gaudi fork
2025-02-25 12:08:42 +00:00
moe
wip(gaudi): import server and dockerfile from tgi-gaudi fork
2025-02-25 12:08:42 +00:00
__init__.py
wip(gaudi): import server and dockerfile from tgi-gaudi fork
2025-02-25 12:08:42 +00:00
bnb.py
wip(gaudi): import server and dockerfile from tgi-gaudi fork
2025-02-25 12:08:42 +00:00
conv.py
wip(gaudi): import server and dockerfile from tgi-gaudi fork
2025-02-25 12:08:42 +00:00
eetq.py
wip(gaudi): import server and dockerfile from tgi-gaudi fork
2025-02-25 12:08:42 +00:00
exl2.py
wip(gaudi): import server and dockerfile from tgi-gaudi fork
2025-02-25 12:08:42 +00:00
fp8.py
wip(gaudi): import server and dockerfile from tgi-gaudi fork
2025-02-25 12:08:42 +00:00
layernorm.py
wip(gaudi): import server and dockerfile from tgi-gaudi fork
2025-02-25 12:08:42 +00:00
linear.py
wip(gaudi): import server and dockerfile from tgi-gaudi fork
2025-02-25 12:08:42 +00:00
lora.py
wip(gaudi): import server and dockerfile from tgi-gaudi fork
2025-02-25 12:08:42 +00:00
medusa.py
wip(gaudi): import server and dockerfile from tgi-gaudi fork
2025-02-25 12:08:42 +00:00
mlp.py
wip(gaudi): import server and dockerfile from tgi-gaudi fork
2025-02-25 12:08:42 +00:00
rotary.py
wip(gaudi): import server and dockerfile from tgi-gaudi fork
2025-02-25 12:08:42 +00:00
speculative.py
wip(gaudi): import server and dockerfile from tgi-gaudi fork
2025-02-25 12:08:42 +00:00
tensor_parallel.py
wip(gaudi): import server and dockerfile from tgi-gaudi fork
2025-02-25 12:08:42 +00:00