mirror of
https://github.com/huggingface/text-generation-inference.git
synced 2025-09-11 12:24:53 +00:00
feat: skip long running tests
This commit is contained in:
parent
1eff07c0e4
commit
57a5766848
@ -28,6 +28,7 @@ async def test_flash_llama_grammar(flash_llama_grammar, response_snapshot):
|
|||||||
assert response == response_snapshot
|
assert response == response_snapshot
|
||||||
|
|
||||||
|
|
||||||
|
@pytest.mark.skip
|
||||||
@pytest.mark.asyncio
|
@pytest.mark.asyncio
|
||||||
async def test_flash_llama_grammar_regex(flash_llama_grammar, response_snapshot):
|
async def test_flash_llama_grammar_regex(flash_llama_grammar, response_snapshot):
|
||||||
response = await flash_llama_grammar.generate(
|
response = await flash_llama_grammar.generate(
|
||||||
@ -46,6 +47,7 @@ async def test_flash_llama_grammar_regex(flash_llama_grammar, response_snapshot)
|
|||||||
assert response == response_snapshot
|
assert response == response_snapshot
|
||||||
|
|
||||||
|
|
||||||
|
@pytest.mark.skip
|
||||||
@pytest.mark.asyncio
|
@pytest.mark.asyncio
|
||||||
async def test_flash_llama_grammar_json(flash_llama_grammar, response_snapshot):
|
async def test_flash_llama_grammar_json(flash_llama_grammar, response_snapshot):
|
||||||
response = await flash_llama_grammar.generate(
|
response = await flash_llama_grammar.generate(
|
||||||
@ -94,6 +96,7 @@ async def test_flash_llama_grammar_json(flash_llama_grammar, response_snapshot):
|
|||||||
assert response == response_snapshot
|
assert response == response_snapshot
|
||||||
|
|
||||||
|
|
||||||
|
@pytest.mark.skip
|
||||||
@pytest.mark.asyncio
|
@pytest.mark.asyncio
|
||||||
async def test_flash_llama_grammar_load(
|
async def test_flash_llama_grammar_load(
|
||||||
flash_llama_grammar, generate_load, response_snapshot
|
flash_llama_grammar, generate_load, response_snapshot
|
||||||
@ -125,6 +128,7 @@ async def test_flash_llama_grammar_load(
|
|||||||
|
|
||||||
# this is the same as the above test, but only fires off a single request
|
# this is the same as the above test, but only fires off a single request
|
||||||
# this is only to ensure that the parallel and single inference produce the same result
|
# this is only to ensure that the parallel and single inference produce the same result
|
||||||
|
@pytest.mark.skip
|
||||||
@pytest.mark.asyncio
|
@pytest.mark.asyncio
|
||||||
async def test_flash_llama_grammar_single_load_instance(
|
async def test_flash_llama_grammar_single_load_instance(
|
||||||
flash_llama_grammar, generate_load, response_snapshot
|
flash_llama_grammar, generate_load, response_snapshot
|
||||||
|
@ -21,6 +21,7 @@ async def non_flash_llama_grammar(non_flash_llama_grammar_handle):
|
|||||||
return non_flash_llama_grammar_handle.client
|
return non_flash_llama_grammar_handle.client
|
||||||
|
|
||||||
|
|
||||||
|
@pytest.mark.skip
|
||||||
@pytest.mark.asyncio
|
@pytest.mark.asyncio
|
||||||
async def test_non_flash_llama_grammar_json(non_flash_llama_grammar, response_snapshot):
|
async def test_non_flash_llama_grammar_json(non_flash_llama_grammar, response_snapshot):
|
||||||
response = await non_flash_llama_grammar.generate(
|
response = await non_flash_llama_grammar.generate(
|
||||||
|
@ -98,6 +98,7 @@ async def test_flash_llama_grammar_no_tools(
|
|||||||
assert response == response_snapshot
|
assert response == response_snapshot
|
||||||
|
|
||||||
|
|
||||||
|
@pytest.mark.skip
|
||||||
@pytest.mark.asyncio
|
@pytest.mark.asyncio
|
||||||
@pytest.mark.private
|
@pytest.mark.private
|
||||||
async def test_flash_llama_grammar_tools(flash_llama_grammar_tools, response_snapshot):
|
async def test_flash_llama_grammar_tools(flash_llama_grammar_tools, response_snapshot):
|
||||||
@ -134,6 +135,7 @@ async def test_flash_llama_grammar_tools(flash_llama_grammar_tools, response_sna
|
|||||||
assert response == response_snapshot
|
assert response == response_snapshot
|
||||||
|
|
||||||
|
|
||||||
|
@pytest.mark.skip
|
||||||
@pytest.mark.asyncio
|
@pytest.mark.asyncio
|
||||||
@pytest.mark.private
|
@pytest.mark.private
|
||||||
async def test_flash_llama_grammar_tools_auto(
|
async def test_flash_llama_grammar_tools_auto(
|
||||||
@ -173,6 +175,7 @@ async def test_flash_llama_grammar_tools_auto(
|
|||||||
assert response == response_snapshot
|
assert response == response_snapshot
|
||||||
|
|
||||||
|
|
||||||
|
@pytest.mark.skip
|
||||||
@pytest.mark.asyncio
|
@pytest.mark.asyncio
|
||||||
@pytest.mark.private
|
@pytest.mark.private
|
||||||
async def test_flash_llama_grammar_tools_choice(
|
async def test_flash_llama_grammar_tools_choice(
|
||||||
@ -208,6 +211,7 @@ async def test_flash_llama_grammar_tools_choice(
|
|||||||
assert response == response_snapshot
|
assert response == response_snapshot
|
||||||
|
|
||||||
|
|
||||||
|
@pytest.mark.skip
|
||||||
@pytest.mark.asyncio
|
@pytest.mark.asyncio
|
||||||
@pytest.mark.private
|
@pytest.mark.private
|
||||||
async def test_flash_llama_grammar_tools_stream(
|
async def test_flash_llama_grammar_tools_stream(
|
||||||
|
Loading…
Reference in New Issue
Block a user