diff --git a/Cargo.lock b/Cargo.lock index d006267e..f686bdb5 100644 --- a/Cargo.lock +++ b/Cargo.lock @@ -1888,7 +1888,7 @@ dependencies = [ [[package]] name = "text-generation-client" -version = "0.1.0" +version = "0.2.0" dependencies = [ "futures", "prost", @@ -1903,7 +1903,7 @@ dependencies = [ [[package]] name = "text-generation-launcher" -version = "0.1.0" +version = "0.2.0" dependencies = [ "clap 4.0.22", "ctrlc", @@ -1918,7 +1918,7 @@ dependencies = [ [[package]] name = "text-generation-router" -version = "0.1.0" +version = "0.2.0" dependencies = [ "async-stream", "axum", diff --git a/Cargo.toml b/Cargo.toml index 684a5da4..3720af32 100644 --- a/Cargo.toml +++ b/Cargo.toml @@ -4,9 +4,6 @@ members = [ "router/client", "launcher" ] -exclude = [ - "server/safetensors", -] [profile.release] debug = 1 diff --git a/Makefile b/Makefile index 39017944..08217730 100644 --- a/Makefile +++ b/Makefile @@ -15,6 +15,12 @@ server-dev: router-dev: cd router && cargo run +integration-tests: install-router install-launcher + cargo test + +python-tests: + cd server && pytest tests + run-bloom-560m: text-generation-launcher --model-id bigscience/bloom-560m --num-shard 2 diff --git a/README.md b/README.md index 74d7a988..49713ecc 100644 --- a/README.md +++ b/README.md @@ -33,6 +33,7 @@ to power LLMs api-inference widgets. - [Run](#run) - [Quantization](#quantization) - [Develop](#develop) +- [Testing](#testing) ## Features @@ -145,4 +146,11 @@ make run-bloom-quantize # Requires 8xA100 40GB ```shell make server-dev make router-dev +``` + +## Testing + +```shell +make python-tests +make integration-tests ``` \ No newline at end of file diff --git a/docs/openapi.json b/docs/openapi.json index d885b97f..4735c8df 100644 --- a/docs/openapi.json +++ b/docs/openapi.json @@ -11,7 +11,7 @@ "name": "Apache 2.0", "url": "https://www.apache.org/licenses/LICENSE-2.0" }, - "version": "0.1.0" + "version": "0.2.0" }, "paths": { "/generate": { diff --git a/launcher/Cargo.toml b/launcher/Cargo.toml index 58df28d9..f62fc804 100644 --- a/launcher/Cargo.toml +++ b/launcher/Cargo.toml @@ -1,6 +1,6 @@ [package] name = "text-generation-launcher" -version = "0.1.0" +version = "0.2.0" edition = "2021" authors = ["Olivier Dehaene"] description = "Text Generation Launcher" diff --git a/router/Cargo.toml b/router/Cargo.toml index 56d6b4f5..20f032b1 100644 --- a/router/Cargo.toml +++ b/router/Cargo.toml @@ -1,6 +1,6 @@ [package] name = "text-generation-router" -version = "0.1.0" +version = "0.2.0" edition = "2021" authors = ["Olivier Dehaene"] description = "Text Generation Webserver" diff --git a/router/client/Cargo.toml b/router/client/Cargo.toml index fdd32494..f4a900a4 100644 --- a/router/client/Cargo.toml +++ b/router/client/Cargo.toml @@ -1,6 +1,6 @@ [package] name = "text-generation-client" -version = "0.1.0" +version = "0.2.0" edition = "2021" [dependencies] diff --git a/server/README.md b/server/README.md index c7054b8d..8efd80ac 100644 --- a/server/README.md +++ b/server/README.md @@ -1,6 +1,6 @@ -# BLOOM Inference Python gRPC Server +# Text Generation Inference Python gRPC Server -A Python gRPC server for BLOOM Inference +A Python gRPC server for Text Generation Inference ## Install diff --git a/server/pyproject.toml b/server/pyproject.toml index 98d91125..87aa8cfb 100644 --- a/server/pyproject.toml +++ b/server/pyproject.toml @@ -1,7 +1,7 @@ [tool.poetry] name = "text-generation" -version = "0.1.0" -description = "BLOOM Inference Python gRPC Server" +version = "0.2.0" +description = "Text Generation Inference Python gRPC Server" authors = ["Olivier Dehaene "] [tool.poetry.scripts]