fix formatting

This commit is contained in:
Mohit Sharma 2024-07-02 13:08:56 +00:00
parent f34560f74a
commit 6d6b0bdcc4
1 changed file with 7 additions and 1 deletion

View File

@@ -29,6 +29,12 @@ class Dtype(str, Enum):
bloat16 = "bfloat16"
class KVDtype(str, Enum):
    """Closed set of values accepted for the ``kv_cache_dtype`` option.

    Mixing in ``str`` makes every member compare equal to its plain string
    value, so code that previously received a raw string keeps working.
    """

    # NOTE(review): "auto" presumably defers the choice to the model/runtime
    # default — confirm against the code that consumes this value.
    auto = "auto"
    fp8 = "fp8"
    fp8_e5m2 = "fp8_e5m2"
@app.command()
def serve(
model_id: str,
@@ -37,7 +43,7 @@ def serve(
quantize: Optional[Quantization] = None,
speculate: Optional[int] = None,
dtype: Optional[Dtype] = None,
kv_cache_dtype: str = "auto",
kv_cache_dtype: KVDtype = "auto",
trust_remote_code: bool = False,
uds_path: Path = "/tmp/text-generation-server",
logger_level: str = "INFO",