UserLM

Sleeping

pszemraj committed on Oct 12

Commit

c368985

verified ·

1 Parent(s): 9dd80f6

Update app.py

Files changed (1) hide show

app.py CHANGED Viewed

@@ -27,7 +27,7 @@ def load_model(model_id: str = MODEL_ID):
     mdl = AutoModelForCausalLM.from_pretrained(
         model_id,
         trust_remote_code=True,
-        torch_dtype="auto",
         device_map="auto",
     )
@@ -138,7 +138,7 @@ def generate_reply(
     max_new_tokens: int = 128,
     temperature: float = 1.0,
     top_p: float = 0.8,
-    max_retries: int = 5,
 ) -> str:
     """Implements the 4 guardrails from Appendix C.1."""
     messages = build_hf_messages(system_prompt, history_pairs)

     mdl = AutoModelForCausalLM.from_pretrained(
         model_id,
         trust_remote_code=True,
+        torch_dtype=torch.bfloat16,
         device_map="auto",
     )
     max_new_tokens: int = 128,
     temperature: float = 1.0,
     top_p: float = 0.8,
+    max_retries: int = 10,
 ) -> str:
     """Implements the 4 guardrails from Appendix C.1."""
     messages = build_hf_messages(system_prompt, history_pairs)