jalonso24 committed on
Commit
2029bcf
·
verified ·
1 Parent(s): a845a1d

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +3 -2
app.py CHANGED
@@ -18,11 +18,12 @@ tokenizer = AutoTokenizer.from_pretrained(base_model_id, use_fast=False)
18
  tokenizer.pad_token = tokenizer.eos_token
19
 
20
  def predict_risk(prompt):
21
- inputs = tokenizer(prompt, return_tensors="pt").to(model.device)
 
22
  with torch.no_grad():
23
  outputs = model.generate(
24
  **inputs,
25
- max_new_tokens=50, # keeps output fast but complete
26
  temperature=0.7,
27
  do_sample=True,
28
  pad_token_id=tokenizer.eos_token_id
 
18
  tokenizer.pad_token = tokenizer.eos_token
19
 
20
  def predict_risk(prompt):
21
+ inputs = tokenizer(prompt, return_tensors="pt")
22
+ inputs = {k: v.to("cpu") for k, v in inputs.items()}
23
  with torch.no_grad():
24
  outputs = model.generate(
25
  **inputs,
26
+ max_new_tokens=50,
27
  temperature=0.7,
28
  do_sample=True,
29
  pad_token_id=tokenizer.eos_token_id