diff --git a/integration-tests/models/__snapshots__/test_flash_deepseek_v2/test_flash_deepseek_v2_all_params.json b/integration-tests/models/__snapshots__/test_flash_deepseek_v2/test_flash_deepseek_v2_all_params.json index 6b45cf6b..3ac8d050 100644 --- a/integration-tests/models/__snapshots__/test_flash_deepseek_v2/test_flash_deepseek_v2_all_params.json +++ b/integration-tests/models/__snapshots__/test_flash_deepseek_v2/test_flash_deepseek_v2_all_params.json @@ -11,7 +11,7 @@ }, { "id": 3533, - "logprob": -9.625, + "logprob": -9.5625, "text": "Test" }, { @@ -24,13 +24,13 @@ "tokens": [ { "id": 2143, - "logprob": -1.828125, + "logprob": -1.8203125, "special": false, "text": " sent" }, { "id": 10081, - "logprob": -0.41210938, + "logprob": -0.55078125, "special": false, "text": " successfully" }, @@ -42,7 +42,7 @@ }, { "id": 100001, - "logprob": -0.16015625, + "logprob": -0.12695312, "special": true, "text": "<|end▁of▁sentence|>" } diff --git a/integration-tests/models/__snapshots__/test_flash_gemma/test_flash_gemma.json b/integration-tests/models/__snapshots__/test_flash_gemma/test_flash_gemma.json index 8829f9fe..96f2ce17 100644 --- a/integration-tests/models/__snapshots__/test_flash_gemma/test_flash_gemma.json +++ b/integration-tests/models/__snapshots__/test_flash_gemma/test_flash_gemma.json @@ -24,13 +24,13 @@ "tokens": [ { "id": 1736, - "logprob": -2.03125, + "logprob": -2.046875, "special": false, "text": " form" }, { "id": 109, - "logprob": -1.8671875, + "logprob": -1.8828125, "special": false, "text": "\n\n" }, @@ -42,48 +42,48 @@ }, { "id": 2121, - "logprob": -1.8125, + "logprob": -1.78125, "special": false, "text": " test" }, { "id": 3853, - "logprob": -0.24121094, + "logprob": -0.23632812, "special": false, "text": " request" }, { "id": 1736, - "logprob": -0.100097656, + "logprob": -0.09326172, "special": false, "text": " form" }, { "id": 603, - "logprob": -0.9453125, + "logprob": -0.8828125, "special": false, "text": " is" }, { - "id": 476, - "logprob": -1.703125, + "id": 1671, + "logprob": -1.6171875, "special": false, - "text": " a" + "text": " used" }, { - "id": 4551, - "logprob": -2.453125, + "id": 577, + "logprob": -0.390625, "special": false, - "text": " document" + "text": " to" }, { - "id": 674, - "logprob": -0.796875, + "id": 3853, + "logprob": -1.2265625, "special": false, - "text": " that" + "text": " request" } ], "top_tokens": null }, - "generated_text": " form\n\nThe test request form is a document that" + "generated_text": " form\n\nThe test request form is used to request" } diff --git a/integration-tests/models/test_flash_deepseek_v2.py b/integration-tests/models/test_flash_deepseek_v2.py index 010e08c9..edebda21 100644 --- a/integration-tests/models/test_flash_deepseek_v2.py +++ b/integration-tests/models/test_flash_deepseek_v2.py @@ -13,7 +13,7 @@ async def flash_deepseek_v2(flash_deepseek_v2_handle): return flash_deepseek_v2_handle.client -@pytest.mark.release +# @pytest.mark.release @pytest.mark.asyncio @pytest.mark.private async def test_flash_deepseek_v2(flash_deepseek_v2, response_snapshot): @@ -24,7 +24,7 @@ async def test_flash_deepseek_v2(flash_deepseek_v2, response_snapshot): assert response == response_snapshot -@pytest.mark.release +# @pytest.mark.release @pytest.mark.asyncio @pytest.mark.private async def test_flash_deepseek_v2_all_params(flash_deepseek_v2, response_snapshot): @@ -47,7 +47,7 @@ async def test_flash_deepseek_v2_all_params(flash_deepseek_v2, response_snapshot assert response == response_snapshot -@pytest.mark.release +# @pytest.mark.release @pytest.mark.asyncio @pytest.mark.private async def test_flash_deepseek_v2_load( diff --git a/integration-tests/models/test_flash_gemma.py b/integration-tests/models/test_flash_gemma.py index 7bee8dea..ad342dfb 100644 --- a/integration-tests/models/test_flash_gemma.py +++ b/integration-tests/models/test_flash_gemma.py @@ -13,7 +13,7 @@ async def flash_gemma(flash_gemma_handle): return flash_gemma_handle.client -@pytest.mark.release +# @pytest.mark.release @pytest.mark.asyncio @pytest.mark.private async def test_flash_gemma(flash_gemma, response_snapshot): @@ -25,7 +25,7 @@ async def test_flash_gemma(flash_gemma, response_snapshot): assert response == response_snapshot -@pytest.mark.release +# @pytest.mark.release @pytest.mark.asyncio @pytest.mark.private async def test_flash_gemma_all_params(flash_gemma, response_snapshot): @@ -49,7 +49,7 @@ async def test_flash_gemma_all_params(flash_gemma, response_snapshot): assert response == response_snapshot -@pytest.mark.release +# @pytest.mark.release @pytest.mark.asyncio @pytest.mark.private async def test_flash_gemma_load(flash_gemma, generate_load, response_snapshot):