bobber committed on
Commit
1db4a17
·
verified ·
1 Parent(s): 7a50100

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +5 -3
app.py CHANGED
@@ -8,20 +8,22 @@ import torch
8
  # model_name = "bartowski/simplescaling_s1-32B-GGUF"
9
  # subfolder = "Qwen-0.5B-GRPO/checkpoint-1868"
10
  # filename = "simplescaling_s1-32B-Q4_K_S.gguf"
11
- model_name = "simplescaling/s1.1-32B"
 
 
12
  torch_dtype = torch.bfloat16 # could be torch.float16 or torch.bfloat16 torch.float32 too
13
  cache_dir = "/data"
14
 
15
  model = AutoModelForCausalLM.from_pretrained(
16
  model_name,
17
  # subfolder=subfolder,
18
- # gguf_file=filename,
19
  torch_dtype=torch_dtype,
20
  device_map="auto",
21
  cache_dir = cache_dir,
22
  )
23
  tokenizer = AutoTokenizer.from_pretrained(model_name
24
- # , gguf_file=filename
25
  # , subfolder=subfolder
26
  )
27
  SYSTEM_PROMPT = """
 
8
  # model_name = "bartowski/simplescaling_s1-32B-GGUF"
9
  # subfolder = "Qwen-0.5B-GRPO/checkpoint-1868"
10
  # filename = "simplescaling_s1-32B-Q4_K_S.gguf"
11
+ # model_name = "simplescaling/s1.1-32B"
12
+ model_name = "unsloth/Llama-4-Scout-17B-16E-Instruct-GGUF"
13
+ filename = "Llama-4-Scout-17B-16E-Instruct-UD-IQ2_XXS.gguf"
14
  torch_dtype = torch.bfloat16 # could be torch.float16 or torch.bfloat16 torch.float32 too
15
  cache_dir = "/data"
16
 
17
  model = AutoModelForCausalLM.from_pretrained(
18
  model_name,
19
  # subfolder=subfolder,
20
+ gguf_file=filename,
21
  torch_dtype=torch_dtype,
22
  device_map="auto",
23
  cache_dir = cache_dir,
24
  )
25
  tokenizer = AutoTokenizer.from_pretrained(model_name
26
+ , gguf_file=filename
27
  # , subfolder=subfolder
28
  )
29
  SYSTEM_PROMPT = """