0r0b0r0s committed on
Commit
63affe0
·
verified ·
1 Parent(s): 6eaf9f8

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +12 -16
app.py CHANGED
@@ -16,40 +16,36 @@ DEFAULT_API_URL = "https://agents-course-unit4-scoring.hf.space"
16
  from huggingface_hub import InferenceClient, login
17
 
18
  class BasicAgent:
19
-
20
  def __init__(self, hf_token: str):
21
- # Required for gated models
22
  login(token=hf_token, add_to_git_credential=False)
23
-
24
- # Initialize HfApi client
25
  self.hf_api = HfApi(token=hf_token)
26
 
27
  # Verify model access
28
  try:
29
- model_info = self.hf_api.model_info(
30
- repo_id="meta-llama/Meta-Llama-3-70B-Instruct"
31
- )
32
- if model_info.gated:
33
- print("Verified Llama-3 access")
34
  except Exception as e:
35
- raise RuntimeError(f"Model access denied: {str(e)}")
36
-
 
 
 
 
 
 
 
37
  def __call__(self, question: str) -> str:
38
  try:
39
  response = self.client.text_generation(
40
- prompt=f"""GAIA RESPONSE PROTOCOL
41
- Question: {question}
42
- Answer: [EXACT ANSWER ONLY, NO EXPLANATION]""",
43
  temperature=0.1,
44
  max_new_tokens=50
45
  )
46
- # Extract only the answer portion
47
  return response.split("Answer:")[-1].strip().split("\n")[0]
48
  except Exception:
49
- # Return empty string instead of error message
50
  return ""
51
 
52
 
 
53
  def run_and_submit_all( profile: gr.OAuthProfile | None):
54
  """
55
  Fetches all questions, runs the BasicAgent on them, submits all answers,
 
16
  from huggingface_hub import InferenceClient, login
17
 
18
class BasicAgent:
    """Minimal GAIA agent that answers questions via a hosted Llama-3 model.

    NOTE(review): the methods below use ``login``, ``HfApi`` and
    ``InferenceClient`` from ``huggingface_hub``; only ``InferenceClient``
    and ``login`` are visibly imported in this file — confirm ``HfApi`` is
    imported elsewhere.
    """

    def __init__(self, hf_token: str):
        """Authenticate with the Hub and build the inference client.

        Args:
            hf_token: Hugging Face access token with permission to use the
                gated meta-llama/Meta-Llama-3-70B-Instruct model.

        Raises:
            RuntimeError: if the gated model's metadata cannot be fetched,
                i.e. the token lacks access to the model.
        """
        login(token=hf_token, add_to_git_credential=False)
        self.hf_api = HfApi(token=hf_token)

        # Verify model access up front so a bad token fails loudly at
        # construction time instead of silently at inference time.
        try:
            self.hf_api.model_info("meta-llama/Meta-Llama-3-70B-Instruct")
        except Exception as e:
            # Chain the original exception so the root cause is preserved.
            raise RuntimeError(f"Model access failed: {e}") from e

        # Initialize inference client
        self.client = InferenceClient(
            model="meta-llama/Meta-Llama-3-70B-Instruct",
            token=hf_token,
            timeout=60,
        )

    def __call__(self, question: str) -> str:
        """Return the model's one-line answer to *question*, or "" on failure."""
        try:
            response = self.client.text_generation(
                prompt=f"Question: {question}\nAnswer:",
                temperature=0.1,
                max_new_tokens=50,
            )
            # Keep only the first line following the final "Answer:" marker.
            return response.split("Answer:")[-1].strip().split("\n")[0]
        except Exception:
            # Deliberate best-effort: the scoring harness expects a string
            # answer, so swallow errors and submit an empty answer.
            return ""
46
 
47
 
48
+
49
  def run_and_submit_all( profile: gr.OAuthProfile | None):
50
  """
51
  Fetches all questions, runs the BasicAgent on them, submits all answers,