Integrate create_inference_router from inference-engine into predict-otron-9000, simplify server routing, and update dependencies to unify versions.

This commit is contained in:
geoffsee
2025-08-16 19:53:21 -04:00
parent 411ad78026
commit b8ba994783
4 changed files with 86 additions and 168 deletions

129
Cargo.lock generated
View File

@@ -354,17 +354,6 @@ dependencies = [
"syn 2.0.106",
]
[[package]]
name = "async-trait"
version = "0.1.89"
source = "registry+https://github.com/rust-lang/crates.io-index"
checksum = "9035ad2d096bed7955a320ee7e2230574d28fd3c3a0f186cbea1ff3c7eed5dbb"
dependencies = [
"proc-macro2",
"quote",
"syn 2.0.106",
]
[[package]]
name = "atoi"
version = "2.0.0"
@@ -409,47 +398,13 @@ dependencies = [
"arrayvec",
]
[[package]]
name = "axum"
version = "0.7.9"
source = "registry+https://github.com/rust-lang/crates.io-index"
checksum = "edca88bc138befd0323b20752846e6587272d3b03b0343c8ea28a6f819e6e71f"
dependencies = [
"async-trait",
"axum-core 0.4.5",
"bytes",
"futures-util",
"http",
"http-body",
"http-body-util",
"hyper",
"hyper-util",
"itoa",
"matchit 0.7.3",
"memchr",
"mime",
"percent-encoding",
"pin-project-lite",
"rustversion",
"serde",
"serde_json",
"serde_path_to_error",
"serde_urlencoded",
"sync_wrapper",
"tokio",
"tower 0.5.2",
"tower-layer",
"tower-service",
"tracing",
]
[[package]]
name = "axum"
version = "0.8.4"
source = "registry+https://github.com/rust-lang/crates.io-index"
checksum = "021e862c184ae977658b36c4500f7feac3221ca5da43e3f25bd04ab6c79a29b5"
dependencies = [
"axum-core 0.5.2",
"axum-core",
"bytes",
"form_urlencoded",
"futures-util",
@@ -459,7 +414,7 @@ dependencies = [
"hyper",
"hyper-util",
"itoa",
"matchit 0.8.4",
"matchit",
"memchr",
"mime",
"percent-encoding",
@@ -471,28 +426,7 @@ dependencies = [
"serde_urlencoded",
"sync_wrapper",
"tokio",
"tower 0.5.2",
"tower-layer",
"tower-service",
"tracing",
]
[[package]]
name = "axum-core"
version = "0.4.5"
source = "registry+https://github.com/rust-lang/crates.io-index"
checksum = "09f2bd6146b97ae3359fa0cc6d6b376d9539582c7b4220f041a33ec24c226199"
dependencies = [
"async-trait",
"bytes",
"futures-util",
"http",
"http-body",
"http-body-util",
"mime",
"pin-project-lite",
"rustversion",
"sync_wrapper",
"tower",
"tower-layer",
"tower-service",
"tracing",
@@ -1416,14 +1350,14 @@ name = "embeddings-engine"
version = "0.1.0"
dependencies = [
"async-openai",
"axum 0.8.4",
"axum",
"fastembed",
"rand 0.8.5",
"serde",
"serde_json",
"tokio",
"tower 0.5.2",
"tower-http 0.6.6",
"tower",
"tower-http",
"tracing",
"tracing-subscriber",
]
@@ -2526,7 +2460,7 @@ dependencies = [
"ab_glyph",
"accelerate-src",
"anyhow",
"axum 0.7.9",
"axum",
"bindgen_cuda",
"byteorder",
"candle-core",
@@ -2561,8 +2495,8 @@ dependencies = [
"symphonia",
"tokenizers",
"tokio",
"tower 0.4.13",
"tower-http 0.5.2",
"tower",
"tower-http",
"tracing",
"tracing-chrome",
"tracing-subscriber",
@@ -2946,12 +2880,6 @@ dependencies = [
"regex-automata 0.1.10",
]
[[package]]
name = "matchit"
version = "0.7.3"
source = "registry+https://github.com/rust-lang/crates.io-index"
checksum = "0e7465ac9959cc2b1404e8e2367b43684a6d13790fe23056cc8c6c5a6b7bcb94"
[[package]]
name = "matchit"
version = "0.8.4"
@@ -3785,14 +3713,14 @@ dependencies = [
name = "predict-otron-9000"
version = "0.1.0"
dependencies = [
"axum 0.8.4",
"axum",
"embeddings-engine",
"inference-engine",
"serde",
"serde_json",
"tokio",
"tower 0.5.2",
"tower-http 0.6.6",
"tower",
"tower-http",
"tracing",
"tracing-subscriber",
"uuid",
@@ -4439,8 +4367,8 @@ dependencies = [
"tokio-native-tls",
"tokio-rustls",
"tokio-util",
"tower 0.5.2",
"tower-http 0.6.6",
"tower",
"tower-http",
"tower-service",
"url",
"wasm-bindgen",
@@ -5549,17 +5477,6 @@ dependencies = [
"num-traits",
]
[[package]]
name = "tower"
version = "0.4.13"
source = "registry+https://github.com/rust-lang/crates.io-index"
checksum = "b8fa9be0de6cf49e536ce1851f987bd21a43b771b09473c3549a6c853db37c1c"
dependencies = [
"tower-layer",
"tower-service",
"tracing",
]
[[package]]
name = "tower"
version = "0.5.2"
@@ -5576,22 +5493,6 @@ dependencies = [
"tracing",
]
[[package]]
name = "tower-http"
version = "0.5.2"
source = "registry+https://github.com/rust-lang/crates.io-index"
checksum = "1e9cd434a998747dd2c4276bc96ee2e0c7a2eadf3cae88e52be55a05fa9053f5"
dependencies = [
"bitflags 2.9.2",
"bytes",
"http",
"http-body",
"http-body-util",
"pin-project-lite",
"tower-layer",
"tower-service",
]
[[package]]
name = "tower-http"
version = "0.6.6"
@@ -5605,7 +5506,7 @@ dependencies = [
"http-body",
"iri-string",
"pin-project-lite",
"tower 0.5.2",
"tower",
"tower-layer",
"tower-service",
"tracing",