diff --git a/integration-tests/models/test_idefics2.py b/integration-tests/models/test_idefics2.py index 9aaf6d8a..b4f6d8cf 100644 --- a/integration-tests/models/test_idefics2.py +++ b/integration-tests/models/test_idefics2.py @@ -1,6 +1,7 @@ import pytest import base64 +from testing_utils import require_backend_async, SYSTEM # TODO fix the server parsser to count inline image tokens correctly def get_chicken(): @@ -41,7 +42,10 @@ async def test_flash_idefics2_next_simple(flash_idefics2_next, response_snapshot response.generated_text == " A chicken is sitting on a pile of money." ), f"{repr(response.generated_text)}" assert response.details.generated_tokens == 10 - assert response == response_snapshot + + if SYSTEM != "rocm": + # Snapshot logprobs are not close enough on ROCm. + assert response == response_snapshot @pytest.mark.asyncio @@ -64,6 +68,7 @@ async def test_flash_idefics2_two_images(flash_idefics2_next, response_snapshot) @pytest.mark.asyncio @pytest.mark.private async def test_flash_idefics2_next_all_params(flash_idefics2_next, response_snapshot): + # TODO: not passing on ROCm (not even simple generated_text comparison). response = await flash_idefics2_next.generate( "Test request", max_new_tokens=10, @@ -100,5 +105,7 @@ async def test_flash_idefics2_next_load( assert generated_texts[0] == " A chicken is sitting on a pile of money." assert len(generated_texts) == 4 assert all([r.generated_text == generated_texts[0] for r in responses]) - - assert responses == response_snapshot + + if SYSTEM != "rocm": + # Snapshot logprobs are not close enough on ROCm. + assert responses == response_snapshot