Fixing linters. (#2650)

2024-10-15 12:43:49 +02:00 · 2024-10-15 12:43:49 +02:00 · cf04a43fb1
parent 58848cb471
commit cf04a43fb1
3 changed files with 4 additions and 15 deletions
--- a/docs/openapi.json
+++ b/docs/openapi.json
@@ -2186,4 +2186,4 @@
      "description": "Hugging Face Text Generation Inference API"
    }
  ]
-}
+}
--- a/server/text_generation_server/models/causal_lm.py
+++ b/server/text_generation_server/models/causal_lm.py
@@ -619,18 +619,11 @@ class CausalLM(Model):
            model_id,
            revision=revision,
            torch_dtype=dtype,
-            device_map=(
+            device_map=("auto" if device_count > 1 else None),
-                "auto"
-                if device_count > 1
-                else None
-            ),
            load_in_8bit=quantize == "bitsandbytes",
            trust_remote_code=trust_remote_code,
        )
-        if (
+        if device_count == 1 and quantize != "bitsandbytes":
-            device_count == 1
-            and quantize != "bitsandbytes"
-        ):
            model = model.to(device)
        if tokenizer.pad_token_id is None:
--- a/server/text_generation_server/models/seq2seq_lm.py
+++ b/server/text_generation_server/models/seq2seq_lm.py
@@ -649,11 +649,7 @@ class Seq2SeqLM(Model):
            model_id,
            revision=revision,
            torch_dtype=dtype,
-            device_map=(
+            device_map=("auto" if device_count > 1 else None),
-                "auto"
-                if device_count > 1
-                else None
-            ),
            load_in_8bit=quantize == "bitsandbytes",
            trust_remote_code=trust_remote_code,
        )