diff --git a/launcher/src/main.rs b/launcher/src/main.rs
index d690a7c..113877f 100644
--- a/launcher/src/main.rs
+++ b/launcher/src/main.rs
@@ -41,6 +41,7 @@ impl std::fmt::Display for Quantization {
 #[derive(Clone, Copy, Debug, ValueEnum)]
 enum Dtype {
     Float16,
+    #[clap(name = "bfloat16")]
     BFloat16,
 }
 