# Mirror of https://github.com/geoffsee/predict-otron-9001.git (synced 2025-09-08 22:46:44 +00:00)

# Latest commit: increase the default maximum tokens in the CLI configuration to 256; refactor and reorganize the CLI [summary truncated in the source listing].
# File size: 36 lines, 977 B (TOML).
# Crate identity. Edition 2024 needs a toolchain that supports it (Rust 1.85 or newer).
[package]
name = "predict-otron-9000"
version = "0.1.0"
edition = "2024"

# Explicit binary target: the executable is named after the package and is
# built from src/main.rs.
[[bin]]
name = "predict-otron-9000"
path = "src/main.rs"

[dependencies]
# Axum web framework and the supporting crates pulled from crates.io
# (kept in alphabetical order).
axum = "0.8.4"
serde = { version = "1.0.219", features = ["derive"] }
serde_json = "1.0.140"
tokio = { version = "1.45.1", features = ["full"] }
tower = "0.5.2"
tower-http = { version = "0.6.6", features = ["trace", "cors"] }
tracing = "0.1"
tracing-subscriber = { version = "0.3", features = ["env-filter"] }
uuid = { version = "1.7.0", features = ["v4"] }

# Dependencies for embeddings functionality (sibling crate, resolved by path)
embeddings-engine = { path = "../embeddings-engine" }

# Dependencies for inference functionality (sibling crate, resolved by path)
inference-engine = { path = "../inference-engine" }

# Deployment settings for external tooling. Cargo itself ignores everything
# under `package.metadata`, so these keys only matter to whatever tool reads
# the `kube` table.
# NOTE(review): the cpu/memory values look like Kubernetes resource
# quantities ("500m" = half a core, "256Mi" = 256 mebibytes) — confirm
# against the consuming tool.
[package.metadata.kube]
image = "ghcr.io/geoffsee/predict-otron-9000:latest"
replicas = 1
port = 8080
resources.cpu = "500m"
resources.memory = "256Mi"
# Optional settings, disabled by default:
# ingress.host = "my-service.example.com"
# env = { RUST_LOG = "info", DATABASE_URL = "postgres://..." }