eslamirad committed on
Commit
0fca800
·
verified ·
1 Parent(s): fa5e4da

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +2 -3
app.py CHANGED
@@ -8,13 +8,12 @@ MODEL_NAME = "Qwen/Qwen2.5-7B-Instruct"
8
  tokenizer = AutoTokenizer.from_pretrained(MODEL_NAME)
9
  model = AutoModelForCausalLM.from_pretrained(
10
  MODEL_NAME,
11
- torch_dtype=torch.float16,
12
- device_map="auto"
13
  )
14
 
15
  # تابع چت‌بات
16
  def chat_with_qwen(prompt):
17
- inputs = tokenizer(prompt, return_tensors="pt").to("cuda")
18
  output = model.generate(**inputs, max_new_tokens=200)
19
  response = tokenizer.decode(output[0], skip_special_tokens=True)
20
  return response
 
8
  tokenizer = AutoTokenizer.from_pretrained(MODEL_NAME)
9
  model = AutoModelForCausalLM.from_pretrained(
10
  MODEL_NAME,
11
+ torch_dtype=torch.float32, # از float32 استفاده کن تا روی CPU اجرا بشه
 
12
  )
13
 
14
  # تابع چت‌بات
15
  def chat_with_qwen(prompt):
16
+ inputs = tokenizer(prompt, return_tensors="pt")
17
  output = model.generate(**inputs, max_new_tokens=200)
18
  response = tokenizer.decode(output[0], skip_special_tokens=True)
19
  return response