mirror of
https://github.com/huggingface/text-generation-inference.git
synced 2025-09-11 04:14:52 +00:00
feat: conditionally toggle chat
This commit is contained in:
parent
0eabc83541
commit
90541fba07
@ -856,25 +856,32 @@ pub async fn run(
|
|||||||
docker_label: option_env!("DOCKER_LABEL"),
|
docker_label: option_env!("DOCKER_LABEL"),
|
||||||
};
|
};
|
||||||
|
|
||||||
// Create router
|
// Configure Swagger UI
|
||||||
let app = Router::new()
|
let swagger_ui = SwaggerUi::new("/docs").url("/api-doc/openapi.json", ApiDoc::openapi());
|
||||||
.merge(SwaggerUi::new("/docs").url("/api-doc/openapi.json", ApiDoc::openapi()))
|
|
||||||
// Base routes
|
// Define base and health routes
|
||||||
|
let base_routes = Router::new()
|
||||||
.route("/", post(compat_generate))
|
.route("/", post(compat_generate))
|
||||||
.route("/info", get(get_model_info))
|
.route("/info", get(get_model_info))
|
||||||
.route("/generate", post(generate))
|
.route("/generate", post(generate))
|
||||||
.route("/generate_stream", post(generate_stream))
|
.route("/generate_stream", post(generate_stream))
|
||||||
.route("/v1/chat/completions", post(chat_completions))
|
.route("/v1/chat/completions", post(chat_completions))
|
||||||
// AWS Sagemaker route
|
|
||||||
.route("/invocations", post(compat_generate))
|
|
||||||
// Base Health route
|
|
||||||
.route("/health", get(health))
|
.route("/health", get(health))
|
||||||
// Inference API health route
|
|
||||||
.route("/", get(health))
|
|
||||||
// AWS Sagemaker health route
|
|
||||||
.route("/ping", get(health))
|
.route("/ping", get(health))
|
||||||
// Prometheus metrics route
|
.route("/metrics", get(metrics));
|
||||||
.route("/metrics", get(metrics))
|
|
||||||
|
// Conditional AWS Sagemaker route
|
||||||
|
let aws_sagemaker_route = if std::env::var("OAI_ENABLED").map_or(false, |val| val == "true") {
|
||||||
|
Router::new().route("/invocations", post(chat_completions)) // Use 'chat_completions' for OAI_ENABLED
|
||||||
|
} else {
|
||||||
|
Router::new().route("/invocations", post(compat_generate)) // Use 'compat_generate' otherwise
|
||||||
|
};
|
||||||
|
|
||||||
|
// Combine routes and layers
|
||||||
|
let app = Router::new()
|
||||||
|
.merge(swagger_ui)
|
||||||
|
.merge(base_routes)
|
||||||
|
.merge(aws_sagemaker_route)
|
||||||
.layer(Extension(info))
|
.layer(Extension(info))
|
||||||
.layer(Extension(health_ext.clone()))
|
.layer(Extension(health_ext.clone()))
|
||||||
.layer(Extension(compat_return_full_text))
|
.layer(Extension(compat_return_full_text))
|
||||||
|
Loading…
Reference in New Issue
Block a user