mirror of https://github.com/huggingface/text-generation-inference.git (synced 2025-09-11 12:24:53 +00:00)
fix: update tests for streaming tools
This commit is contained in:
parent 0fc7237380
commit b5cacca1dc
@@ -24,6 +24,7 @@ from text_generation.types import (
    BestOfSequence,
    Grammar,
    ChatComplete,
    ChatCompletionChunk,
)

DOCKER_IMAGE = os.getenv("DOCKER_IMAGE", None)
@@ -61,7 +62,15 @@ class ResponseComparator(JSONSnapshotExtension):
        def convert_data(data):
            data = json.loads(data)
            if isinstance(data, Dict) and "choices" in data:
                choices = data["choices"]
                if (
                    isinstance(choices, List)
                    and len(choices) >= 1
                    and "delta" in choices[0]
                ):
                    return ChatCompletionChunk(**data)
                return ChatComplete(**data)

            if isinstance(data, Dict):
                return Response(**data)
            if isinstance(data, List):
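For readers following the change, here is a minimal, self-contained sketch of the detection rule this hunk introduces: a streamed chunk carries a "delta" field in its first choice, while a finished completion carries a "message". The JSON payloads below are illustrative, not taken from the repository's snapshots.

import json

def looks_like_chunk(raw: str) -> bool:
    # Mirrors the check above: at least one choice, and the first one has a "delta".
    data = json.loads(raw)
    choices = data.get("choices", [])
    return isinstance(choices, list) and len(choices) >= 1 and "delta" in choices[0]

streamed = '{"choices": [{"index": 0, "delta": {"content": "Hel"}}]}'
complete = '{"choices": [{"index": 0, "message": {"content": "Hello"}}]}'

assert looks_like_chunk(streamed) is True
assert looks_like_chunk(complete) is False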
@@ -151,6 +160,11 @@ class ResponseComparator(JSONSnapshotExtension):
                response.choices[0].message.content == other.choices[0].message.content
            )

        def eq_chat_complete_chunk(
            response: ChatCompletionChunk, other: ChatCompletionChunk
        ) -> bool:
            return response.choices[0].delta.content == other.choices[0].delta.content

        def eq_response(response: Response, other: Response) -> bool:
            return response.generated_text == other.generated_text and eq_details(
                response.details, other.details
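Note that the new eq_chat_complete_chunk compares only the first choice's delta content. A hypothetical example of what that does (and does not) check, using stand-in dataclasses rather than the real client models:

from dataclasses import dataclass
from typing import List, Optional

@dataclass
class Delta:
    content: Optional[str]

@dataclass
class Choice:
    delta: Delta
    finish_reason: Optional[str] = None

@dataclass
class Chunk:
    choices: List[Choice]

def eq_chunk(a: Chunk, b: Chunk) -> bool:
    # Same rule as eq_chat_complete_chunk: only the first choice's delta content.
    return a.choices[0].delta.content == b.choices[0].delta.content

a = Chunk([Choice(Delta("Hello"))])
b = Chunk([Choice(Delta("Hello"), finish_reason="length")])
assert eq_chunk(a, b)  # equal despite differing finish_reason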
@@ -169,6 +183,14 @@ class ResponseComparator(JSONSnapshotExtension):
                [eq_chat_complete(r, o) for r, o in zip(serialized_data, snapshot_data)]
            )

        if isinstance(serialized_data[0], ChatCompletionChunk):
            return len(snapshot_data) == len(serialized_data) and all(
                [
                    eq_chat_complete_chunk(r, o)
                    for r, o in zip(serialized_data, snapshot_data)
                ]
            )

        return len(snapshot_data) == len(serialized_data) and all(
            [eq_response(r, o) for r, o in zip(serialized_data, snapshot_data)]
        )
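The branch added to matches() follows the same pattern as the existing ones: pick a comparison function from the type of the first serialized element, then require equal lengths plus elementwise equality. A rough sketch of that pattern with hypothetical stand-in data; the explicit length check matters because zip() silently stops at the shorter list.

from typing import Any, Callable, List

def compare_lists(a: List[Any], b: List[Any], eq: Callable[[Any, Any], bool]) -> bool:
    # Same shape as the returns above: equal length and pairwise equality.
    return len(a) == len(b) and all(eq(x, y) for x, y in zip(a, b))

same = lambda x, y: x == y
assert compare_lists([1, 2], [1, 2], same)
assert not compare_lists([1, 2], [1, 2, 3], same)  # zip alone would miss the extra element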
@@ -234,7 +234,6 @@ async def test_flash_llama_grammar_tools_stream(

    count = 0
    async for response in responses:
        print(response)
        count += 1

    assert count == 20
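The streaming test simply drains the async iterator returned by the client and counts the chunks. A self-contained sketch of that pattern, with a fake generator standing in for the real client call and the expected count of 20 taken from the assertion above:

import asyncio

async def fake_stream(n: int):
    # Stand-in for the client's streaming chat response.
    for i in range(n):
        yield {"choices": [{"delta": {"content": f"tok{i}"}}]}

async def main():
    count = 0
    async for chunk in fake_stream(20):
        count += 1
    assert count == 20

asyncio.run(main())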