2022-10-18 07:19:03 -06:00
|
|
|
# Cargo workspace definition: the crates listed below are built and
# versioned together from this manifest.
[workspace]
|
|
|
|
# Every crate that belongs to the workspace. Paths are relative to the
# directory containing this manifest.
members = [
|
2024-12-12 06:34:30 -07:00
|
|
|
"benchmark",
|
|
|
|
"backends/v2",
|
|
|
|
"backends/v3",
|
|
|
|
"backends/grpc-metadata",
|
|
|
|
"backends/trtllm",
|
|
|
|
"launcher",
|
|
|
|
"router"
|
2024-07-31 02:33:10 -06:00
|
|
|
]
|
|
|
|
# Crates that Cargo operates on when a command is run from the workspace
# root without an explicit package selection (`-p` / `--workspace`).
# This is the `members` list minus "backends/trtllm", which is commented
# out below and must therefore be selected explicitly to be built.
default-members = [
|
2024-12-12 06:34:30 -07:00
|
|
|
"benchmark",
|
|
|
|
"backends/v2",
|
|
|
|
"backends/v3",
|
|
|
|
"backends/grpc-metadata",
|
|
|
|
# "backends/trtllm",
|
|
|
|
"launcher",
|
|
|
|
"router"
|
2022-10-18 07:19:03 -06:00
|
|
|
]
|
2024-01-22 07:22:54 -07:00
|
|
|
# Use version 2 of Cargo's feature resolver for the whole workspace.
# NOTE(review): presumably set explicitly because this is a virtual
# manifest with no root package edition to infer it from; confirm.
resolver = "2"
|
2023-05-09 05:19:31 -06:00
|
|
|
|
|
|
|
# Package metadata shared across the workspace. A member crate opts in
# per key with `<key>.workspace = true` in its own `[package]` table.
[workspace.package]
|
2024-11-22 10:26:15 -07:00
|
|
|
# Single version number for every crate that inherits it.
version = "2.4.2-dev0"
|
2023-05-09 05:19:31 -06:00
|
|
|
edition = "2021"
|
|
|
|
authors = ["Olivier Dehaene"]
|
|
|
|
homepage = "https://github.com/huggingface/text-generation-inference"
|
2022-10-18 07:19:03 -06:00
|
|
|
|
2024-04-18 09:17:40 -06:00
|
|
|
# Dependency versions and features declared once for the workspace.
# Member crates reference an entry with `<name> = { workspace = true }`
# instead of repeating the version requirement.
[workspace.dependencies]
|
2024-06-03 01:27:22 -06:00
|
|
|
base64 = "0.22.0"
|
2024-09-11 14:41:56 -06:00
|
|
|
tokenizers = { version = "0.20.0", features = ["http"] }
|
2024-04-18 09:17:40 -06:00
|
|
|
hf-hub = { version = "0.3.1", features = ["tokio"] }
|
2024-07-31 02:33:10 -06:00
|
|
|
metrics = { version = "0.23.0" }
|
|
|
|
# The empty `features` list adds nothing beyond the crate's defaults;
# default features stay enabled because `default-features` is not set.
metrics-exporter-prometheus = { version = "0.15.1", features = [] }
|
2024-08-27 11:31:08 -06:00
|
|
|
minijinja = { version = "2.2.0", features = ["json"] }
|
|
|
|
minijinja-contrib = { version = "2.0.2", features = ["pycompat"] }
|
2024-09-27 08:19:42 -06:00
|
|
|
pyo3 = { version = "0.22.2", features = ["auto-initialize"] }
|
2024-04-18 09:17:40 -06:00
|
|
|
|
2022-10-18 07:19:03 -06:00
|
|
|
# Overrides for Cargo's built-in `release` profile. The two custom
# profiles defined in this file both inherit from it.
[profile.release]
|
2024-06-04 11:38:46 -06:00
|
|
|
# Turn on incremental compilation, which Cargo disables by default for
# release builds.
incremental = true
|
|
|
|
|
|
|
|
# Custom profile, selected with `--profile release-binary`.
[profile.release-binary]
|
|
|
|
inherits = "release"
|
2022-10-18 07:19:03 -06:00
|
|
|
# Limited debug info (Cargo level 1).
debug = 1
|
|
|
|
incremental = true
|
2024-06-05 04:18:38 -06:00
|
|
|
# Abort the process on panic instead of unwinding the stack.
panic = "abort"
|
|
|
|
|
|
|
|
# Custom profile, selected with `--profile release-opt`. Every setting
# below trades longer build time for a more optimized binary.
[profile.release-opt]
|
|
|
|
inherits = "release"
|
|
|
|
# No debug info.
debug = 0
|
|
|
|
# Overrides the `incremental = true` inherited from `release`.
incremental = false
|
2024-04-12 04:34:13 -06:00
|
|
|
# "Fat" link-time optimization across all crates in the dependency graph.
lto = "fat"
|
|
|
|
opt-level = 3
|
|
|
|
# One codegen unit per crate: no parallel codegen splitting, slower to
# compile.
codegen-units = 1
|