squash: address comments

Signed-off-by: Michael Dawson <mdawson@devrus.com>
2025-07-31 16:01:46 +00:00 · 2025-05-26 13:40:35 -04:00 · 2025-05-26 13:40:35 -04:00 · 7b9a6eda63
commit 7b9a6eda63
parent f316dffe80
2 changed files with 3 additions and 15 deletions
--- a/llama_stack/providers/inline/safety/prompt_guard/config.py
+++ b/llama_stack/providers/inline/safety/prompt_guard/config.py
@@ -15,14 +15,8 @@ class PromptGuardType(Enum):
    jailbreak = "jailbreak"


-class PromptGuardExecutionType(Enum):
-    cpu = "cpu"
-    cuda = "cuda"
-
-
 class PromptGuardConfig(BaseModel):
    guard_type: str = PromptGuardType.injection.value
-    guard_execution_type: str = PromptGuardExecutionType.cuda.value

    @classmethod
    @field_validator("guard_type")
@@ -31,16 +25,8 @@ class PromptGuardConfig(BaseModel):
            raise ValueError(f"Unknown prompt guard type: {v}")
        return v

-    @classmethod
-    @field_validator("guard_execution_type")
-    def validate_guard_execution_type(cls, v):
-        if v not in [t.value for t in PromptGuardExecutionType]:
-            raise ValueError(f"Unknown prompt guard execution type: {v}")
-        return v
-
    @classmethod
    def sample_run_config(cls, __distro_dir__: str, **kwargs: Any) -> dict[str, Any]:
        return {
            "guard_type": "injection",
-            "guard_execution_type": "cuda",
        }
--- a/llama_stack/providers/inline/safety/prompt_guard/prompt_guard.py
+++ b/llama_stack/providers/inline/safety/prompt_guard/prompt_guard.py
@@ -75,7 +75,9 @@ class PromptGuardShield:
        self.temperature = temperature
        self.threshold = threshold

-        self.device = self.config.guard_execution_type
+        self.device = "cpu"
+        if torch.cuda.is_available():
+            self.device = "cuda"

        # load model and tokenizer
        self.tokenizer = AutoTokenizer.from_pretrained(model_dir)