nikravan committed on
Commit
0cd51ce
·
verified ·
1 Parent(s): 15c5cc5

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +20 -0
app.py CHANGED
@@ -26,6 +26,26 @@ def respond(
26
  messages.append({"role": "user", "content": message})
27
 
28
  response = ""
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
29
 
30
  for message in client.chat_completion(
31
  messages,
 
26
  messages.append({"role": "user", "content": message})
27
 
28
  response = ""
29
+
30
+ from transformers import AutoModelForCausalLM, AutoTokenizer
31
+
32
+ MODEL_PATH = "THUDM/GLM-4-Z1-32B-0414"
33
+
34
+ tokenizer = AutoTokenizer.from_pretrained(MODEL_PATH)
35
+ model = AutoModelForCausalLM.from_pretrained(MODEL_PATH, device_map="auto")
36
+
37
+ message = [{"role": "user", "content": "Let a, b be positive real numbers such that ab = a + b + 3. Determine the range of possible values for a + b."}]
38
+
39
+ .device)
40
+
41
+ generate_kwargs = {
42
+ "input_ids": inputs["input_ids"],
43
+ "attention_mask": inputs["attention_mask"],
44
+ "max_new_tokens": 4096,
45
+ "do_sample": False,
46
+ }
47
+ out = model.generate(**generate_kwargs)
48
+ print(tokenizer.decode(out[0][inputs["input_ids"].shape[1]:], skip_special_tokens=True))
49
 
50
  for message in client.chat_completion(
51
  messages,