text-generation-inference/router/src/main.rs

32 lines
698 B
Rust
Raw Normal View History

2022-10-08 10:30:12 +00:00
use bloom_inference_client::ShardedClient;
2022-10-11 08:36:51 +00:00
use poem;
use poem::listener::TcpListener;
2022-10-08 10:30:12 +00:00
use std::time::Duration;
2022-10-11 08:36:51 +00:00
mod server;
2022-10-08 10:30:12 +00:00
2022-10-11 08:36:51 +00:00
mod db;
2022-10-08 10:30:12 +00:00
use db::Db;
2022-10-11 08:36:51 +00:00
mod batcher;
use batcher::Batcher;
2022-10-08 10:30:12 +00:00
#[tokio::main]
async fn main() -> Result<(), std::io::Error> {
tracing_subscriber::fmt::init();
let sharded_client =
ShardedClient::connect_uds("/tmp/bloom-inference-0".to_string(), Duration::from_secs(5))
.await;
sharded_client
.clear_cache()
.await
.expect("Unable to clear cache");
tracing::info!("Connected");
2022-10-11 08:36:51 +00:00
let addr = "127.0.0.1:3000".to_string();
let listener = TcpListener::bind(addr);
2022-10-08 10:30:12 +00:00
2022-10-11 08:36:51 +00:00
server::run(sharded_client, listener).await
2022-10-08 10:30:12 +00:00
}