.. |
attention
|
wip(gaudi): import server and dockerfile from tgi-gaudi fork
|
2025-02-25 12:08:42 +00:00 |
awq
|
wip(gaudi): import server and dockerfile from tgi-gaudi fork
|
2025-02-25 12:08:42 +00:00 |
gptq
|
wip(gaudi): import server and dockerfile from tgi-gaudi fork
|
2025-02-25 12:08:42 +00:00 |
marlin
|
wip(gaudi): import server and dockerfile from tgi-gaudi fork
|
2025-02-25 12:08:42 +00:00 |
moe
|
wip(gaudi): import server and dockerfile from tgi-gaudi fork
|
2025-02-25 12:08:42 +00:00 |
__init__.py
|
wip(gaudi): import server and dockerfile from tgi-gaudi fork
|
2025-02-25 12:08:42 +00:00 |
bnb.py
|
wip(gaudi): import server and dockerfile from tgi-gaudi fork
|
2025-02-25 12:08:42 +00:00 |
conv.py
|
wip(gaudi): import server and dockerfile from tgi-gaudi fork
|
2025-02-25 12:08:42 +00:00 |
eetq.py
|
wip(gaudi): import server and dockerfile from tgi-gaudi fork
|
2025-02-25 12:08:42 +00:00 |
exl2.py
|
wip(gaudi): import server and dockerfile from tgi-gaudi fork
|
2025-02-25 12:08:42 +00:00 |
fp8.py
|
wip(gaudi): import server and dockerfile from tgi-gaudi fork
|
2025-02-25 12:08:42 +00:00 |
layernorm.py
|
wip(gaudi): import server and dockerfile from tgi-gaudi fork
|
2025-02-25 12:08:42 +00:00 |
linear.py
|
wip(gaudi): import server and dockerfile from tgi-gaudi fork
|
2025-02-25 12:08:42 +00:00 |
lora.py
|
wip(gaudi): import server and dockerfile from tgi-gaudi fork
|
2025-02-25 12:08:42 +00:00 |
medusa.py
|
wip(gaudi): import server and dockerfile from tgi-gaudi fork
|
2025-02-25 12:08:42 +00:00 |
mlp.py
|
wip(gaudi): import server and dockerfile from tgi-gaudi fork
|
2025-02-25 12:08:42 +00:00 |
rotary.py
|
wip(gaudi): import server and dockerfile from tgi-gaudi fork
|
2025-02-25 12:08:42 +00:00 |
speculative.py
|
wip(gaudi): import server and dockerfile from tgi-gaudi fork
|
2025-02-25 12:08:42 +00:00 |
tensor_parallel.py
|
wip(gaudi): import server and dockerfile from tgi-gaudi fork
|
2025-02-25 12:08:42 +00:00 |