diff --git a/Cargo.lock b/Cargo.lock index 165cb590..cfe19dcd 100644 --- a/Cargo.lock +++ b/Cargo.lock @@ -4650,7 +4650,7 @@ dependencies = [ [[package]] name = "text-generation-backends-trtllm" -version = "3.3.5-dev0" +version = "3.3.6-dev0" dependencies = [ "async-trait", "clap 4.5.32", @@ -4671,7 +4671,7 @@ dependencies = [ [[package]] name = "text-generation-benchmark" -version = "3.3.5-dev0" +version = "3.3.6-dev0" dependencies = [ "average", "clap 4.5.32", @@ -4691,7 +4691,7 @@ dependencies = [ [[package]] name = "text-generation-client" -version = "3.3.5-dev0" +version = "3.3.6-dev0" dependencies = [ "async-trait", "base64 0.22.1", @@ -4709,7 +4709,7 @@ dependencies = [ [[package]] name = "text-generation-launcher" -version = "3.3.5-dev0" +version = "3.3.6-dev0" dependencies = [ "clap 4.5.32", "ctrlc", @@ -4730,7 +4730,7 @@ dependencies = [ [[package]] name = "text-generation-router" -version = "3.3.5-dev0" +version = "3.3.6-dev0" dependencies = [ "anyhow", "async-stream", @@ -4782,7 +4782,7 @@ dependencies = [ [[package]] name = "text-generation-router-llamacpp" -version = "3.3.5-dev0" +version = "3.3.6-dev0" dependencies = [ "async-trait", "bindgen 0.71.1", @@ -4800,7 +4800,7 @@ dependencies = [ [[package]] name = "text-generation-router-v2" -version = "3.3.5-dev0" +version = "3.3.6-dev0" dependencies = [ "async-stream", "async-trait", @@ -4849,7 +4849,7 @@ dependencies = [ [[package]] name = "text-generation-router-v3" -version = "3.3.5-dev0" +version = "3.3.6-dev0" dependencies = [ "async-stream", "async-trait", diff --git a/Cargo.toml b/Cargo.toml index a32d8e7f..f985d0a1 100644 --- a/Cargo.toml +++ b/Cargo.toml @@ -21,7 +21,7 @@ default-members = [ resolver = "2" [workspace.package] -version = "3.3.5-dev0" +version = "3.3.6-dev0" edition = "2021" authors = ["Olivier Dehaene"] homepage = "https://github.com/huggingface/text-generation-inference" diff --git a/docs/openapi.json b/docs/openapi.json index 6225f5e7..89172386 100644 --- a/docs/openapi.json +++ b/docs/openapi.json @@ -10,7 +10,7 @@ "name": "Apache 2.0", "url": "https://www.apache.org/licenses/LICENSE-2.0" }, - "version": "3.3.5-dev0" + "version": "3.3.6-dev0" }, "paths": { "/": { diff --git a/integration-tests/models/__snapshots__/test_flash_gemma3/test_flash_gemma3_image_base64_rgb_jpg.json b/integration-tests/models/__snapshots__/test_flash_gemma3/test_flash_gemma3_image_base64_rgb_jpg.json index b9803da8..2448b0b5 100644 --- a/integration-tests/models/__snapshots__/test_flash_gemma3/test_flash_gemma3_image_base64_rgb_jpg.json +++ b/integration-tests/models/__snapshots__/test_flash_gemma3/test_flash_gemma3_image_base64_rgb_jpg.json @@ -17,7 +17,7 @@ "id": "", "model": "google/gemma-3-4b-it", "object": "chat.completion", - "system_fingerprint": "3.3.5-dev0-native", + "system_fingerprint": "3.3.6-dev0-native", "usage": { "completion_tokens": 42, "prompt_tokens": 277, diff --git a/integration-tests/models/__snapshots__/test_flash_gemma3/test_flash_gemma3_image_base64_rgb_png.json b/integration-tests/models/__snapshots__/test_flash_gemma3/test_flash_gemma3_image_base64_rgb_png.json index a91f01f7..625db0a0 100644 --- a/integration-tests/models/__snapshots__/test_flash_gemma3/test_flash_gemma3_image_base64_rgb_png.json +++ b/integration-tests/models/__snapshots__/test_flash_gemma3/test_flash_gemma3_image_base64_rgb_png.json @@ -17,7 +17,7 @@ "id": "", "model": "google/gemma-3-4b-it", "object": "chat.completion", - "system_fingerprint": "3.3.5-dev0-native", + "system_fingerprint": "3.3.6-dev0-native", "usage": { "completion_tokens": 62, "prompt_tokens": 277, diff --git a/integration-tests/models/__snapshots__/test_flash_gemma3/test_flash_gemma3_image_base64_rgba.json b/integration-tests/models/__snapshots__/test_flash_gemma3/test_flash_gemma3_image_base64_rgba.json index d8104c9a..e34a9bad 100644 --- a/integration-tests/models/__snapshots__/test_flash_gemma3/test_flash_gemma3_image_base64_rgba.json +++ b/integration-tests/models/__snapshots__/test_flash_gemma3/test_flash_gemma3_image_base64_rgba.json @@ -17,7 +17,7 @@ "id": "", "model": "google/gemma-3-4b-it", "object": "chat.completion", - "system_fingerprint": "3.3.5-dev0-native", + "system_fingerprint": "3.3.6-dev0-native", "usage": { "completion_tokens": 67, "prompt_tokens": 277, diff --git a/integration-tests/models/__snapshots__/test_flash_gemma3/test_flash_gemma3_image_cow.json b/integration-tests/models/__snapshots__/test_flash_gemma3/test_flash_gemma3_image_cow.json index 0a712cc7..7eca16db 100644 --- a/integration-tests/models/__snapshots__/test_flash_gemma3/test_flash_gemma3_image_cow.json +++ b/integration-tests/models/__snapshots__/test_flash_gemma3/test_flash_gemma3_image_cow.json @@ -17,7 +17,7 @@ "id": "", "model": "google/gemma-3-4b-it", "object": "chat.completion", - "system_fingerprint": "3.3.5-dev0-native", + "system_fingerprint": "3.3.6-dev0-native", "usage": { "completion_tokens": 72, "prompt_tokens": 275, diff --git a/integration-tests/models/__snapshots__/test_flash_gemma3/test_flash_gemma3_image_cow_dog.json b/integration-tests/models/__snapshots__/test_flash_gemma3/test_flash_gemma3_image_cow_dog.json index 6d4ee727..a64bb4fb 100644 --- a/integration-tests/models/__snapshots__/test_flash_gemma3/test_flash_gemma3_image_cow_dog.json +++ b/integration-tests/models/__snapshots__/test_flash_gemma3/test_flash_gemma3_image_cow_dog.json @@ -17,7 +17,7 @@ "id": "", "model": "google/gemma-3-4b-it", "object": "chat.completion", - "system_fingerprint": "3.3.5-dev0-native", + "system_fingerprint": "3.3.6-dev0-native", "usage": { "completion_tokens": 80, "prompt_tokens": 279, diff --git a/integration-tests/models/__snapshots__/test_json_schema_constrain/test_json_schema_basic.json b/integration-tests/models/__snapshots__/test_json_schema_constrain/test_json_schema_basic.json index 3310bdcd..35cdbe01 100644 --- a/integration-tests/models/__snapshots__/test_json_schema_constrain/test_json_schema_basic.json +++ b/integration-tests/models/__snapshots__/test_json_schema_constrain/test_json_schema_basic.json @@ -14,7 +14,7 @@ "id": "", "model": "google/gemma-3-4b-it", "object": "chat.completion", - "system_fingerprint": "3.3.5-dev0-native", + "system_fingerprint": "3.3.6-dev0-native", "usage": { "completion_tokens": 35, "prompt_tokens": 32, diff --git a/integration-tests/models/__snapshots__/test_json_schema_constrain/test_json_schema_complex.json b/integration-tests/models/__snapshots__/test_json_schema_constrain/test_json_schema_complex.json index e627b2be..c12d8605 100644 --- a/integration-tests/models/__snapshots__/test_json_schema_constrain/test_json_schema_complex.json +++ b/integration-tests/models/__snapshots__/test_json_schema_constrain/test_json_schema_complex.json @@ -14,7 +14,7 @@ "id": "", "model": "google/gemma-3-4b-it", "object": "chat.completion", - "system_fingerprint": "3.3.5-dev0-native", + "system_fingerprint": "3.3.6-dev0-native", "usage": { "completion_tokens": 44, "prompt_tokens": 37, diff --git a/integration-tests/models/__snapshots__/test_mllama/test_mllama_load.json b/integration-tests/models/__snapshots__/test_mllama/test_mllama_load.json index 58f5ada8..bd4595a6 100644 --- a/integration-tests/models/__snapshots__/test_mllama/test_mllama_load.json +++ b/integration-tests/models/__snapshots__/test_mllama/test_mllama_load.json @@ -18,7 +18,7 @@ "id": "", "model": "unsloth/Llama-3.2-11B-Vision-Instruct", "object": "chat.completion", - "system_fingerprint": "3.3.5-dev0-native", + "system_fingerprint": "3.3.6-dev0-native", "usage": { "completion_tokens": 10, "prompt_tokens": 45, @@ -44,7 +44,7 @@ "id": "", "model": "unsloth/Llama-3.2-11B-Vision-Instruct", "object": "chat.completion", - "system_fingerprint": "3.3.5-dev0-native", + "system_fingerprint": "3.3.6-dev0-native", "usage": { "completion_tokens": 10, "prompt_tokens": 45, diff --git a/integration-tests/models/__snapshots__/test_mllama/test_mllama_simpl.json b/integration-tests/models/__snapshots__/test_mllama/test_mllama_simpl.json index 6830b36b..175887a8 100644 --- a/integration-tests/models/__snapshots__/test_mllama/test_mllama_simpl.json +++ b/integration-tests/models/__snapshots__/test_mllama/test_mllama_simpl.json @@ -17,7 +17,7 @@ "id": "", "model": "unsloth/Llama-3.2-11B-Vision-Instruct", "object": "chat.completion", - "system_fingerprint": "3.3.5-dev0-native", + "system_fingerprint": "3.3.6-dev0-native", "usage": { "completion_tokens": 10, "prompt_tokens": 45,