mirror of
https://github.com/huggingface/text-generation-inference.git
synced 2025-09-11 04:14:52 +00:00
Use a generous snapshot for the load test because of accumulation errors in the
logprobs.
This commit is contained in:
parent
d9000a2bcb
commit
b9ac720d1e
@ -54,7 +54,7 @@ async def test_mamba_all_params(fused_kernel_mamba, response_snapshot):
|
||||
|
||||
@pytest.mark.asyncio
|
||||
@pytest.mark.private
|
||||
async def test_mamba_load(fused_kernel_mamba, generate_load, response_snapshot):
|
||||
async def test_mamba_load(fused_kernel_mamba, generate_load, generous_response_snapshot):
|
||||
responses = await generate_load(
|
||||
fused_kernel_mamba, "What is Deep Learning?", max_new_tokens=10, n=4
|
||||
)
|
||||
|
Loading…
Reference in New Issue
Block a user