Spaces:
Runtime error
Runtime error
Update app.py
Browse files
app.py
CHANGED
@@ -3,7 +3,7 @@ import gradio as gr
|
|
3 |
import requests
|
4 |
import inspect
|
5 |
import pandas as pd
|
6 |
-
from huggingface_hub import InferenceClient, login
|
7 |
|
8 |
|
9 |
# (Keep Constants as is)
|
@@ -16,27 +16,23 @@ DEFAULT_API_URL = "https://agents-course-unit4-scoring.hf.space"
|
|
16 |
from huggingface_hub import InferenceClient, login
|
17 |
|
18 |
class BasicAgent:
|
|
|
19 |
def __init__(self, hf_token: str):
|
20 |
# Required for gated models
|
21 |
login(token=hf_token, add_to_git_credential=False)
|
22 |
|
|
|
|
|
|
|
23 |
# Verify model access
|
24 |
try:
|
25 |
-
model_info =
|
26 |
-
repo_id="meta-llama/Meta-Llama-3-70B-Instruct"
|
27 |
-
token=hf_token
|
28 |
)
|
29 |
if model_info.gated:
|
30 |
-
print("Verified
|
31 |
except Exception as e:
|
32 |
raise RuntimeError(f"Model access denied: {str(e)}")
|
33 |
-
|
34 |
-
# Initialize client
|
35 |
-
self.client = InferenceClient(
|
36 |
-
model="meta-llama/Meta-Llama-3-70B-Instruct",
|
37 |
-
token=hf_token,
|
38 |
-
timeout=60
|
39 |
-
)
|
40 |
|
41 |
def __call__(self, question: str) -> str:
|
42 |
try:
|
|
|
3 |
import requests
|
4 |
import inspect
|
5 |
import pandas as pd
|
6 |
+
from huggingface_hub import HfApi, InferenceClient, login
|
7 |
|
8 |
|
9 |
# (Keep Constants as is)
|
|
|
16 |
from huggingface_hub import InferenceClient, login
|
17 |
|
18 |
class BasicAgent:
|
19 |
+
|
20 |
def __init__(self, hf_token: str):
|
21 |
# Required for gated models
|
22 |
login(token=hf_token, add_to_git_credential=False)
|
23 |
|
24 |
+
# Initialize HfApi client
|
25 |
+
self.hf_api = HfApi(token=hf_token)
|
26 |
+
|
27 |
# Verify model access
|
28 |
try:
|
29 |
+
model_info = self.hf_api.model_info(
|
30 |
+
repo_id="meta-llama/Meta-Llama-3-70B-Instruct"
|
|
|
31 |
)
|
32 |
if model_info.gated:
|
33 |
+
print("Verified Llama-3 access")
|
34 |
except Exception as e:
|
35 |
raise RuntimeError(f"Model access denied: {str(e)}")
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
36 |
|
37 |
def __call__(self, question: str) -> str:
|
38 |
try:
|