Spaces:

spuun
/

nagaluv

Sleeping

spuun committed on Apr 15

Commit

a00ca2c

verified ·

1 Parent(s): 5ccda69

fix: bump up rate limits wkw

Files changed (1) hide show

app.py CHANGED Viewed

@@ -99,14 +99,14 @@ def respond(
     response = ""
     for msg in client.chat_completion(
         messages,
-        model="meta-llama/llama-4-scout:free",
         max_tokens=max_tokens,
         stream=True,
         temperature=temperature,
         seed=random.randint(1, 1000),
         top_p=top_p,
         extra_body={
-            "models": ["meta-llama/llama-4-maverick:free", "google/gemma-3-1b-it:free"]
         },
     ):
         token = msg.choices[0].delta.content

     response = ""
     for msg in client.chat_completion(
         messages,
+        model="meta-llama/llama-4-scout",
         max_tokens=max_tokens,
         stream=True,
         temperature=temperature,
         seed=random.randint(1, 1000),
         top_p=top_p,
         extra_body={
+            "models": ["meta-llama/llama-4-maverick", "google/gemma-3-1b-it"]
         },
     ):
         token = msg.choices[0].delta.content