Final_Assignment_Template

Runtime error

0r0b0r0s committed 13 days ago

Commit

9c1383b

verified ·

1 Parent(s): 594a71c

Update app.py

Files changed (1) hide show

app.py CHANGED Viewed

@@ -17,26 +17,41 @@ from huggingface_hub import InferenceClient, login
 class BasicAgent:
     def __init__(self, hf_token: str):
-        # Validate authentication
         login(token=hf_token, add_to_git_credential=False)
-        # Initialize client with production endpoint
         self.client = InferenceClient(
             model="meta-llama/Meta-Llama-3-70B-Instruct",
             token=hf_token,
-            timeout=45
         )
     def __call__(self, question: str) -> str:
         try:
             response = self.client.text_generation(
-                prompt=f"GAIA Question: {question}\nAnswer:",
-                temperature=0.3,
-                max_new_tokens=512
             )
-            return response.split("Answer:")[-1].strip()
-        except Exception as e:
-            return f"Model Error: {str(e)}"
 def run_and_submit_all( profile: gr.OAuthProfile | None):

 class BasicAgent:
     def __init__(self, hf_token: str):
+        # Required for gated models
         login(token=hf_token, add_to_git_credential=False)
+        # Verify model access
+        try:
+            model_info = HfApi().model_info(
+                repo_id="meta-llama/Meta-Llama-3-70B-Instruct",
+                token=hf_token
+            )
+            if model_info.gated:
+                print("Verified model access")
+        except Exception as e:
+            raise RuntimeError(f"Model access denied: {str(e)}")
+        # Initialize client
         self.client = InferenceClient(
             model="meta-llama/Meta-Llama-3-70B-Instruct",
             token=hf_token,
+            timeout=60
         )
     def __call__(self, question: str) -> str:
         try:
             response = self.client.text_generation(
+                prompt=f"""GAIA RESPONSE PROTOCOL
+                        Question: {question}
+                        Answer: [EXACT ANSWER ONLY, NO EXPLANATION]""",
+                temperature=0.1,
+                max_new_tokens=50
             )
+            # Extract only the answer portion
+            return response.split("Answer:")[-1].strip().split("\n")[0]
+        except Exception:
+            # Return empty string instead of error message
+            return ""
 def run_and_submit_all( profile: gr.OAuthProfile | None):