wuhp committed
Commit 22b976e · verified · 1 parent: e09a48c

Update app.py

Files changed (1):
  app.py +31 -237
app.py CHANGED
@@ -1,15 +1,11 @@
 """
-app.py – Roboflow-aware YOLOv8 Dataset Quality Evaluator (v2)
-
-Changelog (2025-04-17)
-──────────────────────
-• **CPU-bound loops parallelised** with `concurrent.futures.ProcessPoolExecutor`.
-• **Batch inference** in `qc_model_qa()` (GPU util ↑, latency ↓).
-• Optional **fastdup** path for duplicate detection (≈ 10× faster on large sets).
-• Faster NumPy-based `parse_label_file()`.
-• Small refactors → clearer separation of stages & fewer globals.
-• Graceful degradation if heavy deps unavailable (cv2, imagehash, fastdup).
-• Tunable `CPU_COUNT` + env-var guard for HF Spaces quota.
+app.py – Roboflow-aware YOLOv8 Dataset Quality Evaluator (v3)
+─────────────────────────────────────────────────────────────
+Changelog (2025-04-17 b)
+• **Cleanlab** integration → extra *label-issue* metric (skips gracefully if lib missing).
+• New **BBox validity** check: flags coords outside [0, 1].
+• Weight table updated (Integrity 25 %, Model 20 %, Cleanlab 10 %, etc.).
+• Minor: switched to cached NumPy reader for labels, clarified env vars.
 """
 
 from __future__ import annotations
@@ -33,7 +29,7 @@ import yaml
 from PIL import Image
 from tqdm import tqdm
 
-# ───────────────────────────────────────── Heavy optional deps ──
+# ───────────────────────────── Optional heavy deps (fail-soft) ──
 try:
     import cv2  # type: ignore
 except ImportError:
@@ -49,6 +45,11 @@ try:
 except ImportError:
     fastdup = None
 
+try:
+    from cleanlab.object_detection import find_label_issues  # type: ignore
+except (ImportError, AttributeError):
+    find_label_issues = None  # type: ignore
+
 try:
     from ultralytics import YOLO  # type: ignore
 except ImportError:
@@ -63,16 +64,17 @@ except ImportError:
 TMP_ROOT = Path(tempfile.gettempdir()) / "rf_datasets"
 TMP_ROOT.mkdir(parents=True, exist_ok=True)
 
-# Limit CPU workers on HF Spaces (feel free to raise locally)
 CPU_COUNT = int(os.getenv("QC_CPU", max(1, (os.cpu_count() or 4) // 2)))
 BATCH = int(os.getenv("QC_BATCH", 16))
 
 DEFAULT_W = {
-    "Integrity": 0.30,
+    "Integrity": 0.25,
     "Class balance": 0.15,
     "Image quality": 0.15,
     "Duplicates": 0.10,
-    "Model QA": 0.30,
+    "BBox validity": 0.05,
+    "Model QA": 0.20,
+    "Cleanlab QA": 0.10,
 }
 
 @dataclass
@@ -86,17 +88,19 @@ def load_yaml(path: Path) -> Dict:
     with path.open(encoding="utf-8") as f:
         return yaml.safe_load(f)
 
+_label_cache: dict[Path, np.ndarray] = {}
 
-def parse_label_file(path: Path) -> list[tuple[int, float, float, float, float]]:
-    if not path.exists() or path.stat().st_size == 0:
-        return []
+def load_labels_np(path: Path) -> np.ndarray:
+    if path in _label_cache:
+        return _label_cache[path]
     try:
         arr = np.loadtxt(path, dtype=float)
         if arr.ndim == 1:
             arr = arr.reshape(1, -1)
-        return [tuple(row) for row in arr]
     except Exception:
-        return []
+        arr = np.empty((0, 5))
+    _label_cache[path] = arr
+    return arr
 
 
 def guess_image_dirs(root: Path) -> List[Path]:
@@ -164,9 +168,9 @@ def qc_class_balance(lbls: List[Path]):
     cls_counts = Counter()
     boxes_per_img = []
     for l in lbls:
-        bs = parse_label_file(l) if l else []
-        boxes_per_img.append(len(bs))
-        cls_counts.update(b[0] for b in bs)
+        arr = load_labels_np(l) if l else np.empty((0, 5))
+        boxes_per_img.append(len(arr))
+        cls_counts.update(arr[:, 0].astype(int) if arr.size else [])
 
     if not cls_counts:
         return {"name": "Class balance", "score": 0, "details": "No labels"}
@@ -200,10 +204,7 @@ def qc_image_quality(imgs: List[Path], blur_thr: float = 100.0):
     if cv2 is None:
         return {"name": "Image quality", "score": 100, "details": "cv2 not installed"}
 
-    blurry: list[Path] = []
-    dark: list[Path] = []
-    bright: list[Path] = []
-
+    blurry, dark, bright = [], [], []
     with ProcessPoolExecutor(max_workers=CPU_COUNT) as ex:
         for p, is_blur, is_dark, is_bright in tqdm(
             ex.map(lambda x: _quality_stat(x, blur_thr), imgs),
@@ -233,7 +234,6 @@
 # Duplicate images ---------------------------------------------
 
 def qc_duplicates(imgs: List[Path]):
-    # Fast path – use fastdup if installed & enough images
     if fastdup is not None and len(imgs) > 50:
         try:
             fd = fastdup.create(input_dir=str(Path(imgs[0]).parent.parent), work_dir=str(TMP_ROOT / "fastdup"))
@@ -241,13 +241,9 @@
             clusters = fd.get_clusters()
             dup = sum(len(c) - 1 for c in clusters)
             score = 100 - dup / max(len(imgs), 1) * 100
-            return {
-                "name": "Duplicates",
-                "score": score,
-                "details": {"groups": clusters[:50]},
-            }
+            return {"name": "Duplicates", "score": score, "details": {"groups": clusters[:50]}}
         except Exception:
-            pass  # fallback to hash
+            pass
 
     if imagehash is None:
         return {"name": "Duplicates", "score": 100, "details": "skipped (deps)"}
@@ -256,206 +252,4 @@
         return str(imagehash.average_hash(Image.open(p)))
 
     hashes: Dict[str, List[Path]] = defaultdict(list)
-    with ProcessPoolExecutor(max_workers=CPU_COUNT) as ex:
-        for h, p in tqdm(
-            zip(ex.map(_hash, imgs), imgs),
-            total=len(imgs),
-            desc="hashing",
-            leave=False,
-        ):
-            hashes[h].append(p)
-
-    groups = [g for g in hashes.values() if len(g) > 1]
-    dup = sum(len(g) - 1 for g in groups)
-    score = 100 - dup / max(len(imgs), 1) * 100
-    return {
-        "name": "Duplicates",
-        "score": score,
-        "details": {"groups": [[str(p) for p in g] for g in groups[:50]]},
-    }
-
-# Model-assisted QA --------------------------------------------
-
-def _rel_iou(b1, b2):
-    x1, y1, w1, h1 = b1
-    x2, y2, w2, h2 = b2
-    xa1, ya1, xa2, ya2 = x1 - w1 / 2, y1 - h1 / 2, x1 + w1 / 2, y1 + h1 / 2
-    xb1, yb1, xb2, yb2 = x2 - w2 / 2, y2 - h2 / 2, x2 + w2 / 2, y2 + h2 / 2
-    ix1, iy1, ix2, iy2 = max(xa1, xb1), max(ya1, yb1), min(xa2, xb2), min(ya2, yb2)
-    inter = max(ix2 - ix1, 0) * max(iy2 - iy1, 0)
-    union = w1 * h1 + w2 * h2 - inter
-    return inter / union if union else 0.0
-
-
-def qc_model_qa(imgs: List[Path], weights: str | None, lbls: List[Path], iou_thr: float = 0.5):
-    if weights is None or YOLO is None:
-        return {"name": "Model QA", "score": 100, "details": "skipped (no weights)"}
-
-    model = YOLO(weights)
-    ious, mism = [], []
-
-    for i in range(0, len(imgs), BATCH):
-        batch_paths = imgs[i : i + BATCH]
-        results = model.predict(batch_paths, verbose=False)
-        for p, res in zip(batch_paths, results):
-            gtb = parse_label_file(p.parent.parent / "labels" / f"{p.stem}.txt")
-            if not gtb:
-                continue
-            for cls, x, y, w, h in gtb:
-                best = 0.0
-                for b, c in zip(res.boxes.xywh.cpu().numpy(), res.boxes.cls.cpu().numpy()):
-                    if int(c) != cls:
-                        continue
-                    best = max(best, _rel_iou((x, y, w, h), tuple(b)))
-                ious.append(best)
-                if best < iou_thr:
-                    mism.append(str(p))
-
-    miou = float(np.mean(ious)) if ious else 1.0
-    return {
-        "name": "Model QA",
-        "score": miou * 100,
-        "details": {"mean_iou": miou, "mismatched_images": mism[:50]},
-    }
-
-# Aggregate -----------------------------------------------------
-
-def aggregate(scores):
-    return sum(DEFAULT_W.get(r["name"], 0) * r["score"] for r in scores)
-
-# ───────────────────────────────────────── Roboflow helpers ────
-RF_RE = re.compile(r"https://universe\.roboflow\.com/([^/]+)/([^/]+)/dataset/(\d+)")
-
-def download_rf_dataset(url: str, rf_api: "Roboflow", dest: Path) -> Path:
-    m = RF_RE.match(url.strip())
-    if not m:
-        raise ValueError(f"Bad RF URL: {url}")
-
-    ws, proj, ver = m.groups()
-    ds_dir = dest / f"{ws}_{proj}_v{ver}"
-    if ds_dir.exists():
-        return ds_dir
-
-    project = rf_api.workspace(ws).project(proj)
-    project.version(int(ver)).download("yolov8", location=str(ds_dir))
-    return ds_dir
-
-# ───────────────────────────────────────── Main logic ──────────
-
-def run_quality(root: Path, yaml_override: Path | None, weights: Path | None):
-    imgs, lbls, meta = gather_dataset(root, yaml_override)
-    res = [
-        qc_integrity(imgs, lbls),
-        qc_class_balance(lbls),
-        qc_image_quality(imgs),
-        qc_duplicates(imgs),
-        qc_model_qa(imgs, str(weights) if weights else None, lbls),
-    ]
-    final = aggregate(res)
-
-    md = [f"## **{meta.get('name', root.name)}** — Score {final:.1f}/100"]
-    for r in res:
-        md.append(f"### {r['name']}  {r['score']:.1f}")
-        md.append("<details><summary>details</summary>\n\n```json")
-        md.append(json.dumps(r["details"], indent=2))
-        md.append("```\n</details>\n")
-    md_str = "\n".join(md)
-
-    cls_counts = res[1]["details"].get("class_counts", {})  # type: ignore[index]
-    df = pd.DataFrame.from_dict(cls_counts, orient="index", columns=["count"])
-    df.index.name = "class"
-    return md_str, df
-
-# ───────────────────────────────────────── Gradio UI ──────────
-
-def evaluate(
-    api_key: str,
-    url_txt: gr.File | None,
-    zip_file: gr.File | None,
-    server_path: str,
-    yaml_file: gr.File | None,
-    weights: gr.File | None,
-):
-    if not any([url_txt, zip_file, server_path]):
-        return "Upload a .txt of URLs or dataset ZIP/path", pd.DataFrame()
-
-    reports, dfs = [], []
-
-    # Roboflow batch ------------------------------------------
-    if url_txt:
-        if Roboflow is None:
-            return "`roboflow` not installed", pd.DataFrame()
-        if not api_key:
-            return "Enter Roboflow API key", pd.DataFrame()
-
-        rf = Roboflow(api_key=api_key.strip())
-        for line in Path(url_txt.name).read_text().splitlines():
-            if not line.strip():
-                continue
-            try:
-                ds_root = download_rf_dataset(line, rf, TMP_ROOT)
-                md, df = run_quality(ds_root, None, Path(weights.name) if weights else None)
-                reports.append(md)
-                dfs.append(df)
-            except Exception as e:
-                reports.append(f"### {line}\n\n⚠️ {e}")
-
-    # Manual ZIP ----------------------------------------------
-    if zip_file:
-        tmp_dir = Path(tempfile.mkdtemp())
-        shutil.unpack_archive(zip_file.name, tmp_dir)
-        md, df = run_quality(tmp_dir, Path(yaml_file.name) if yaml_file else None, Path(weights.name) if weights else None)
-        reports.append(md)
-        dfs.append(df)
-        shutil.rmtree(tmp_dir, ignore_errors=True)
-
-    # Manual path ---------------------------------------------
-    if server_path:
-        md, df = run_quality(Path(server_path), Path(yaml_file.name) if yaml_file else None, Path(weights.name) if weights else None)
-        reports.append(md)
-        dfs.append(df)
-
-    summary_md = "\n\n---\n\n".join(reports)
-    combined_df = pd.concat(dfs).groupby(level=0).sum() if dfs else pd.DataFrame()
-    return summary_md, combined_df
-
-# ───────────────────────────────────────── Launch ────────────
-with gr.Blocks(title="YOLO Dataset Quality Evaluator") as demo:
-    gr.Markdown(
-        """
-# YOLOv8 Dataset Quality Evaluator
-
-### Roboflow batch
-1. Paste your **Roboflow API key**
-2. Upload a **.txt** file – one `https://universe.roboflow.com/.../dataset/x` per line
-
-### Manual
-* Upload a dataset **ZIP** or type a dataset **path** on the server
-* Optionally supply a custom **data.yaml** and/or a **YOLO .pt** weights file for model-assisted QA
-"""
-    )
-
-    with gr.Row():
-        api_in = gr.Textbox(label="Roboflow API key", type="password", placeholder="rf_XXXXXXXXXXXXXXXX")
-        url_txt_in = gr.File(label=".txt of RF dataset URLs", file_types=[".txt"])
-
-    with gr.Row():
-        zip_in = gr.File(label="Dataset ZIP")
-        path_in = gr.Textbox(label="Path on server", placeholder="/data/my_dataset")
-
-    with gr.Row():
-        yaml_in = gr.File(label="Custom YAML", file_types=[".yaml"])
-        weights_in = gr.File(label="YOLO weights (.pt)")
-
-    run_btn = gr.Button("Evaluate")
-    out_md = gr.Markdown()
-    out_df = gr.Dataframe()
-
-    run_btn.click(
-        evaluate,
-        inputs=[api_in, url_txt_in, zip_in, path_in, yaml_in, weights_in],
-        outputs=[out_md, out_df],
-    )
-
-if __name__ == "__main__":
-    demo.launch(server_name="0.0.0.0", server_port=int(os.getenv("PORT", 7860)))
+    with ProcessPoolExecutor(max_workers=CPU
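
The new import block guards `from cleanlab.object_detection import find_label_issues`, but the code that turns it into the "Cleanlab QA" metric does not appear in the visible hunks. A minimal sketch of how such a stage could consume the import, assuming cleanlab's documented per-image input format; the name `qc_cleanlab` and the scoring formula are illustrative, not from this commit:

import numpy as np

def qc_cleanlab(labels, predictions):
    # labels      - one dict per image: {"bboxes": (L, 4) float array in
    #               [x1, y1, x2, y2], "labels": (L,) int array of class ids}
    # predictions - one list per image with K entries (one per class);
    #               predictions[i][k] is an (M, 5) array of
    #               [x1, y1, x2, y2, confidence]
    if find_label_issues is None:  # import is guarded at module top
        return {"name": "Cleanlab QA", "score": 100, "details": "skipped (cleanlab missing)"}
    issues = find_label_issues(labels, predictions)  # per-image boolean flags
    frac = float(np.mean(issues)) if len(issues) else 0.0
    # Illustrative scoring: the fewer flagged images, the higher the score.
    return {"name": "Cleanlab QA", "score": 100 * (1 - frac), "details": {"flagged_fraction": frac}}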
 
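Similarly, the weight table now reserves 5 % for "BBox validity" (flag coords outside [0, 1], per the changelog), but the check itself is also not visible in the shown hunks. A sketch of what it could look like, reusing the commit's `load_labels_np`; the function name `qc_bbox_validity` and the per-file scoring are assumptions:

def qc_bbox_validity(lbls: List[Path], tol: float = 0.0):
    # Flag label files containing YOLO boxes whose cx/cy/w/h fall outside [0, 1].
    offenders = []
    for l in lbls:
        arr = load_labels_np(l)            # cached reader introduced above
        if not arr.size:
            continue
        coords = arr[:, 1:5]               # column 0 is the class id
        if ((coords < -tol) | (coords > 1 + tol)).any():
            offenders.append(str(l))
    score = 100 - 100 * len(offenders) / max(len(lbls), 1)
    return {"name": "BBox validity", "score": score, "details": {"files": offenders[:50]}}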
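The updated weights sum to 1.00, so the composite score remains the plain weighted sum that the removed `aggregate()` computed. A worked example with made-up stage scores:

results = [
    {"name": "Integrity",     "score": 90.0},
    {"name": "Class balance", "score": 80.0},
    {"name": "Image quality", "score": 70.0},
    {"name": "Duplicates",    "score": 100.0},
    {"name": "BBox validity", "score": 95.0},
    {"name": "Model QA",      "score": 60.0},
    {"name": "Cleanlab QA",   "score": 85.0},
]
final = sum(DEFAULT_W.get(r["name"], 0) * r["score"] for r in results)
# 0.25*90 + 0.15*80 + 0.15*70 + 0.10*100 + 0.05*95 + 0.20*60 + 0.10*85 = 80.25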
 
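The cached reader replaces `parse_label_file`'s list of tuples with a memoised ndarray that falls back to an empty (0, 5) array on any parse failure, so stages that revisit the same label file hit a dict lookup instead of re-parsing. A quick usage check; the path is hypothetical:

lbl = Path("datasets/train/labels/img_0001.txt")  # illustrative path
a1 = load_labels_np(lbl)   # first call parses (or falls back to an empty (0, 5) array)
a2 = load_labels_np(lbl)   # second call is a cache hit
assert a2 is a1            # same cached ndarray object
classes = a1[:, 0].astype(int) if a1.size else []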
 
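One caveat in the retained `qc_image_quality` code: `ProcessPoolExecutor.map` pickles its callable, and the lambda `lambda x: _quality_stat(x, blur_thr)` is not picklable, so this raises on spawn-based platforms (Windows, macOS). A `functools.partial` over the module-level function is the picklable equivalent, assuming `_quality_stat`'s second parameter is named `blur_thr`:

from concurrent.futures import ProcessPoolExecutor
from functools import partial

with ProcessPoolExecutor(max_workers=CPU_COUNT) as ex:
    # partial keeps the mapped callable a picklable module-level function
    for p, is_blur, is_dark, is_bright in ex.map(partial(_quality_stat, blur_thr=blur_thr), imgs):
        ...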