Xueqing committed on
Commit
15e85b4
·
verified ·
1 Parent(s): f09b25a

Update backend/utils/analyze_prod_models.py

Browse files
backend/utils/analyze_prod_models.py CHANGED
@@ -5,7 +5,7 @@ from datetime import datetime
5
  from pathlib import Path
6
  from huggingface_hub import HfApi
7
  from dotenv import load_dotenv
8
- from app.config.hf_config import HF_ORGANIZATION
9
 
10
  # Get the backend directory path
11
  BACKEND_DIR = Path(__file__).parent.parent
@@ -22,22 +22,22 @@ logging.basicConfig(
22
  logger = logging.getLogger(__name__)
23
 
24
  # Initialize Hugging Face API
25
- HF_TOKEN = os.getenv("HF_TOKEN")
26
- if not HF_TOKEN:
27
- raise ValueError("HF_TOKEN not found in environment variables")
28
  api = HfApi(token=HF_TOKEN)
29
 
30
  def count_evaluated_models():
31
  """Count the number of evaluated models"""
32
  try:
33
  # Get dataset info
34
- dataset_info = api.dataset_info(repo_id=f"{HF_ORGANIZATION}/greek-contents", repo_type="dataset")
35
 
36
  # Get file list
37
- files = api.list_repo_files(f"{HF_ORGANIZATION}/greek-contents", repo_type="dataset")
38
 
39
  # Get last commit info
40
- commits = api.list_repo_commits(f"{HF_ORGANIZATION}/greek-contents", repo_type="dataset")
41
  last_commit = next(commits, None)
42
 
43
  # Count lines in jsonl files
@@ -47,7 +47,7 @@ def count_evaluated_models():
47
  try:
48
  # Download file content
49
  content = api.hf_hub_download(
50
- repo_id=f"{HF_ORGANIZATION}/greek-contents",
51
  filename=file,
52
  repo_type="dataset"
53
  )
 
5
  from pathlib import Path
6
  from huggingface_hub import HfApi
7
  from dotenv import load_dotenv
8
+ from app.config.hf_config import HF_TOKEN, HF_ORGANIZATION, HF_AGGREGATED
9
 
10
  # Get the backend directory path
11
  BACKEND_DIR = Path(__file__).parent.parent
 
22
  logger = logging.getLogger(__name__)
23
 
24
  # Initialize Hugging Face API
25
+ # HF_TOKEN = os.getenv("HF_TOKEN")
26
+ # if not HF_TOKEN:
27
+ # raise ValueError("HF_TOKEN not found in environment variables")
28
  api = HfApi(token=HF_TOKEN)
29
 
30
  def count_evaluated_models():
31
  """Count the number of evaluated models"""
32
  try:
33
  # Get dataset info
34
+ dataset_info = api.dataset_info(repo_id=f"{HF_ORGANIZATION}/{HF_AGGREGATED}", repo_type="dataset")
35
 
36
  # Get file list
37
+ files = api.list_repo_files(f"{HF_ORGANIZATION}/{HF_AGGREGATED}", repo_type="dataset")
38
 
39
  # Get last commit info
40
+ commits = api.list_repo_commits(f"{HF_ORGANIZATION}/{HF_AGGREGATED}", repo_type="dataset")
41
  last_commit = next(commits, None)
42
 
43
  # Count lines in jsonl files
 
47
  try:
48
  # Download file content
49
  content = api.hf_hub_download(
50
+ repo_id=f"{HF_ORGANIZATION}/{HF_AGGREGATED}",
51
  filename=file,
52
  repo_type="dataset"
53
  )