fix formatting
This commit is contained in:
parent
f34560f74a
commit
6d6b0bdcc4
|
@ -29,6 +29,12 @@ class Dtype(str, Enum):
|
||||||
bloat16 = "bfloat16"
|
bloat16 = "bfloat16"
|
||||||
|
|
||||||
|
|
||||||
|
class KVDtype(str, Enum):
|
||||||
|
auto = "auto"
|
||||||
|
fp8 = "fp8"
|
||||||
|
fp8_e5m2 = "fp8_e5m2"
|
||||||
|
|
||||||
|
|
||||||
@app.command()
|
@app.command()
|
||||||
def serve(
|
def serve(
|
||||||
model_id: str,
|
model_id: str,
|
||||||
|
@ -37,7 +43,7 @@ def serve(
|
||||||
quantize: Optional[Quantization] = None,
|
quantize: Optional[Quantization] = None,
|
||||||
speculate: Optional[int] = None,
|
speculate: Optional[int] = None,
|
||||||
dtype: Optional[Dtype] = None,
|
dtype: Optional[Dtype] = None,
|
||||||
kv_cache_dtype: str = "auto",
|
kv_cache_dtype: KVDtype = "auto",
|
||||||
trust_remote_code: bool = False,
|
trust_remote_code: bool = False,
|
||||||
uds_path: Path = "/tmp/text-generation-server",
|
uds_path: Path = "/tmp/text-generation-server",
|
||||||
logger_level: str = "INFO",
|
logger_level: str = "INFO",
|
||||||
|
|
Loading…
Reference in New Issue