
Commit 532d1f0

Authored by kmaherx, schraderSimon, and pre-commit-ci[bot]
Gemma default device fix (#161)
* Add max_memory parameter to run config
* Use configurable max_memory for offline explainer
* Fix breaking change in prompt input formatting from vLLM
* [pre-commit.ci] auto fixes from pre-commit.com hooks (for more information, see https://pre-commit.ci)
* Fix bug in gemmascope device type check
* [pre-commit.ci] auto fixes from pre-commit.com hooks (for more information, see https://pre-commit.ci)

Co-authored-by: Simon Schrader <[email protected]>
Co-authored-by: pre-commit-ci[bot] <66853113+pre-commit-ci[bot]@users.noreply.github.com>
1 parent: 0837a97

1 file changed (+3, −1 lines)


delphi/sparse_coders/custom/gemmascope.py

Lines changed: 3 additions & 1 deletion
@@ -104,6 +104,8 @@ def from_pretrained(cls, model_name_or_path, position, device):
         pt_params = {k: torch.from_numpy(v) for k, v in params.items()}
         model = cls(params["W_enc"].shape[0], params["W_enc"].shape[1])
         model.load_state_dict(pt_params)
-        if device == "cuda":
+        if device == "cuda" or (
+            isinstance(device, torch.device) and device.type == "cuda"
+        ):
             model.cuda()
         return model
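
Before this fix, passing a torch.device object rather than the literal string "cuda" skipped the .cuda() move, because the equality check only matched the string. A minimal sketch of the corrected predicate, pulled out as a standalone helper for illustration (the name is_cuda_device is not from the repo):

    import torch

    def is_cuda_device(device) -> bool:
        # Mirrors the patched check in gemmascope.py: a plain string
        # comparison misses torch.device("cuda") and torch.device("cuda:0"),
        # whose .type attribute is "cuda" regardless of device index.
        return device == "cuda" or (
            isinstance(device, torch.device) and device.type == "cuda"
        )

    # Both forms now trigger model.cuda():
    assert is_cuda_device("cuda")
    assert is_cuda_device(torch.device("cuda:0"))
    assert not is_cuda_device("cpu")

Note that a bare string like "cuda:0" still falls through both branches; the call sites evidently pass either the plain string "cuda" or a torch.device object.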
