PhotoshopRequest-Arena

Sleeping

App Files Files Community

taesiri committed on Feb 20

Commit

c628077

1 Parent(s): aa72fc4

backup

Browse files

Files changed (2) hide show

app.py +472 -0
photoexp_filtered.csv +0 -0

app.py ADDED Viewed

	@@ -0,0 +1,472 @@

+import gradio as gr
+import random
+from datasets import load_dataset
+import csv
+from datetime import datetime
+import os
+import pandas as pd
+import json
+from huggingface_hub import CommitScheduler, HfApi, snapshot_download
+import shutil
+import uuid
+import git
+from pathlib import Path
+# Hub API client authenticated with the HF_TOKEN environment variable
+# (os.environ[...] raises KeyError at import time if the variable is unset).
+api = HfApi(token=os.environ["HF_TOKEN"])
+# Dataset repo that the CommitScheduler below pushes the ./data folder to.
+RESULTS_BACKUP_REPO = "taesiri/PhotoEditBattleResults"
+# Load the experimental dataset
+dataset = load_dataset("taesiri/IERv2-BattleResults_exp", split="train")
+# Unique post_id values of the same dataset: only the "post_id" column is
+# loaded, then de-duplicated through a set (so the list order is arbitrary).
+dataset_post_ids = list(
+    set(
+        load_dataset(
+            "taesiri/IERv2-BattleResults_exp", columns=["post_id"], split="train"
+        )
+        .to_pandas()
+        .post_id.tolist()
+    )
+)
+# Table of alternative edits; get_random_sample() looks rows up by post_id and
+# reads their "edited_image", "model" and "comment_id" fields.
+photoexp = pd.read_csv("./photoexp_filtered.csv")
+# Download existing data from hub
+def sync_with_hub():
+    """
+    Synchronize local data with the hub by cloning the dataset repo
+    """
+    print("Starting sync with hub...")
+    data_dir = Path("./data")
+    if data_dir.exists():
+        # Backup existing data
+        backup_dir = Path("./data_backup")
+        if backup_dir.exists():
+            shutil.rmtree(backup_dir)
+        shutil.copytree(data_dir, backup_dir)
+    # Clone/pull latest data from hub
+    # Use token in the URL for authentication following HF's new format
+    token = os.environ["HF_TOKEN"]
+    username = "taesiri"  # Extract from DATASET_REPO
+    repo_url = (
+        f"https://{username}:{token}@huggingface.co/datasets/{RESULTS_BACKUP_REPO}"
+    )
+    hub_data_dir = Path("hub_data")
+    if hub_data_dir.exists():
+        # If repo exists, do a git pull
+        print("Pulling latest changes...")
+        repo = git.Repo(hub_data_dir)
+        origin = repo.remotes.origin
+        # Set the new URL with token
+        if "https://" in origin.url:
+            origin.set_url(repo_url)
+        origin.pull()
+    else:
+        # Clone the repo with token
+        print("Cloning repository...")
+        git.Repo.clone_from(repo_url, hub_data_dir)
+    # Merge hub data with local data
+    hub_data_source = hub_data_dir / "data"
+    if hub_data_source.exists():
+        # Create data dir if it doesn't exist
+        data_dir.mkdir(exist_ok=True)
+        # Copy files from hub
+        for item in hub_data_source.glob("*"):
+            if item.is_dir():
+                dest = data_dir / item.name
+                if not dest.exists():  # Only copy if doesn't exist locally
+                    shutil.copytree(item, dest)
+    # Clean up cloned repo
+    if hub_data_dir.exists():
+        shutil.rmtree(hub_data_dir)
+    print("Finished syncing with hub!")
+# Scheduler that uploads the local ./data folder to the "data" folder of the
+# RESULTS_BACKUP_REPO dataset repo.
+# NOTE(review): `every=1` is presumably an interval in minutes - confirm against
+# the huggingface_hub CommitScheduler documentation.
+scheduler = CommitScheduler(
+    repo_id=RESULTS_BACKUP_REPO,
+    repo_type="dataset",
+    folder_path="./data",
+    path_in_repo="data",
+    every=1,
+)
+def save_evaluation(post_id, model_a, model_b, verdict):
+    """Save evaluation results to CSV. Multiple evaluations per image/model are allowed."""
+    timestamp = datetime.now().strftime("%Y-%m-%d %H:%M:%S")
+    # Create data directory if it doesn't exist
+    os.makedirs("data", exist_ok=True)
+    filename = "data/evaluation_results_exp.csv"
+    # Create file with headers if it doesn't exist
+    if not os.path.exists(filename):
+        with open(filename, "w", newline="") as f:
+            writer = csv.writer(f)
+            writer.writerow(["timestamp", "post_id", "model_a", "model_b", "verdict"])
+    # Append the new evaluation - multiple entries per image/model are allowed
+    with open(filename, "a", newline="") as f:
+        writer = csv.writer(f)
+        writer.writerow([timestamp, post_id, model_a, model_b, verdict])
+    print(
+        f"Saved evaluation: {post_id} - Model A: {model_a} - Model B: {model_b} - Verdict: {verdict}"
+    )
+def get_random_sample():
+    """Get a random sample from the dataset. Sampling with replacement is allowed."""
+    idx = random.randint(0, len(dataset) - 1)
+    sample = dataset[idx]
+    # Filter photoexp to get entries with the same post_id
+    matching_photoexp_entries = photoexp[photoexp.post_id == sample["post_id"]]
+    # Randomly select one entry from the matching entries
+    if not matching_photoexp_entries.empty:
+        random_photoexp_entry = matching_photoexp_entries.sample(n=1).iloc[0]
+        additional_edited_image = random_photoexp_entry["edited_image"]
+        # Add REDDIT_ prefix when using comment_id instead of model
+        model_b = random_photoexp_entry.get("model")
+        if model_b is None:
+            model_b = f"REDDIT_{random_photoexp_entry['comment_id']}"
+    else:
+        additional_edited_image = None
+        model_b = None
+    # Randomly assign images to A and B
+    if random.choice([True, False]):
+        image_a = sample["edited_image"]
+        model_a = sample["model"]
+        image_b = additional_edited_image
+    else:
+        image_a = additional_edited_image
+        model_a = model_b
+        image_b = sample["edited_image"]
+        model_b = sample["model"]
+    print(f"Selected sample {idx}: {sample['post_id']} - {sample['model']}")
+    return {
+        "post_id": sample["post_id"],
+        "instruction": '## User Request: "' + sample["instruction"] + '"',
+        "simplified_instruction": '## User Request: "'
+        + sample["simplified_instruction"]
+        + '"',
+        "source_image": sample["source_image"],
+        "image_a": image_a,
+        "image_b": image_b,
+        "model_a": model_a,
+        "model_b": model_b,
+    }
+def evaluate(verdict, state):
+    """Handle evaluation button clicks"""
+    if state is None:
+        return (
+            None,
+            None,
+            None,
+            None,
+            None,
+            None,
+            None,
+            False,
+            False,
+            False,
+            None,
+            None,
+            None,
+            None,
+            None,
+            None,
+            None,
+        )
+    # Save the evaluation
+    save_evaluation(state["post_id"], state["model_a"], state["model_b"], verdict)
+    # Get next sample
+    next_sample = get_random_sample()
+    # Reset button styles
+    a_better_reset = gr.update(variant="secondary")
+    b_better_reset = gr.update(variant="secondary")
+    neither_reset = gr.update(variant="secondary")
+    tie_reset = gr.update(variant="secondary")
+    return (
+        next_sample["source_image"],
+        next_sample["image_a"],
+        next_sample["image_b"],
+        next_sample["instruction"],
+        next_sample["simplified_instruction"],
+        f"Model A: {next_sample['model_a']} | Model B: {next_sample['model_b']}",
+        next_sample,
+        None,  # selected_verdict
+        False,
+        False,
+        False,
+        False,  # reset all button states
+        a_better_reset,  # reset A is better button style
+        b_better_reset,  # reset B is better button style
+        neither_reset,  # reset neither is good button style
+        tie_reset,  # reset tie button style
+        next_sample["post_id"],
+    )
+def select_verdict(verdict, state):
+    """Handle first step selection"""
+    if state is None:
+        return None, False, False, False, False  # Ensure it returns 5 values
+    return (
+        verdict,
+        verdict == "A is better",
+        verdict == "B is better",
+        verdict == "Neither is good",
+        verdict == "Tie",
+    )
+def initialize():
+    """Initialize the interface with first sample"""
+    sample = get_random_sample()
+    return (
+        sample["source_image"],
+        sample["image_a"],
+        sample["image_b"],
+        sample["instruction"],
+        sample["simplified_instruction"],
+        f"Model A: {sample['model_a']} | Model B: {sample['model_b']}",
+        sample,
+        None,  # selected_verdict
+        False,  # a_better_selected
+        False,  # b_better_selected
+        False,  # neither_selected
+        False,  # tie_selected
+        sample["post_id"],
+    )
+def update_button_styles(verdict):
+    """Update button styles based on selection"""
+    # Update button labels to use emojis
+    a_better_style = gr.update(
+        value="👈 A is better" if verdict == "A is better" else "👈 A is better"
+    )
+    b_better_style = gr.update(
+        value="👉 B is better" if verdict == "B is better" else "👉 B is better"
+    )
+    neither_style = gr.update(
+        value="👎 Both are bad" if verdict == "Neither is good" else "👎 Both are bad"
+    )
+    tie_style = gr.update(value="🤝 Tie" if verdict == "Tie" else "🤝 Tie")
+    return a_better_style, b_better_style, neither_style, tie_style
+# Create Gradio interface
+with gr.Blocks() as demo:
+    # Add instruction panel at the top
+    gr.HTML(
+        """
+        <div style="padding: 0.8rem; margin-bottom: 0.8rem; background-color: #2c3e50; border-radius: 0.5rem; color: white; text-align: center;">
+            <div style="font-size: 1.1rem; margin-bottom: 0.5rem;">Read the user instruction, look at the source image, then evaluate which edit (A or B) best satisfies the request better.</div>
+            <div style="font-size: 1rem;">
+                <strong>🤝 Tie</strong> &nbsp;&nbsp;|&nbsp;&nbsp;
+                <strong>👈 A is better</strong> &nbsp;&nbsp;|&nbsp;&nbsp;
+                <strong>👉 B is better</strong>
+            </div>
+        </div>
+    """
+    )
+    # Request text: the original instruction is rendered as Markdown, the
+    # simplified one is kept in a hidden textbox (visible=False).
+    with gr.Row():
+        simplified_instruction = gr.Textbox(
+            label="Simplified Instruction", show_label=True, visible=False
+        )
+        instruction = gr.Markdown(label="Original Instruction", show_label=True)
+    # Three columns: source image, edit A, edit B. Each column has one verdict
+    # button under its image (Tie sits under the source image).
+    with gr.Row():
+        with gr.Column():
+            source_image = gr.Image(label="Source Image", show_label=True, height=500)
+            tie_btn = gr.Button("🤝 Tie", variant="secondary")
+        with gr.Column():
+            image_a = gr.Image(label="Image A", show_label=True, height=500)
+            a_better_btn = gr.Button("👈 A is better", variant="secondary")
+        with gr.Column():
+            image_b = gr.Image(label="Image B", show_label=True, height=500)
+            b_better_btn = gr.Button("👉 B is better", variant="secondary")
+    # Add confirmation button in new row
+    # (created hidden; update_confirm_visibility decides when it is shown)
+    with gr.Row():
+        confirm_btn = gr.Button("Confirm Selection", variant="primary", visible=False)
+    # The "Both are bad" button is created but hidden (visible=False).
+    with gr.Row():
+        neither_btn = gr.Button("👎 Both are bad", variant="secondary", visible=False)
+    # Collapsed panel exposing the post id and the models behind A and B.
+    with gr.Accordion("DEBUG", open=False):
+        with gr.Row():
+            post_id_display = gr.Textbox(
+                label="Post ID", show_label=True, interactive=False
+            )
+            model_info = gr.Textbox(label="Model Information", show_label=True)
+    # `state` holds the current sample dict; `selected_verdict` holds the
+    # verdict string chosen but not yet confirmed.
+    state = gr.State()
+    selected_verdict = gr.State()
+    # Add states for button selection
+    # (hidden checkboxes, one per verdict option)
+    a_better_selected = gr.Checkbox(visible=False)
+    b_better_selected = gr.Checkbox(visible=False)
+    neither_selected = gr.Checkbox(visible=False)
+    tie_selected = gr.Checkbox(visible=False)
+    def update_confirm_visibility(a_better, b_better, neither, tie):
+        # Update button text based on selection
+        if a_better:
+            return gr.update(visible=True, value="Confirm A is better")
+        elif b_better:
+            return gr.update(visible=True, value="Confirm B is better")
+        elif neither:
+            return gr.update(visible=True, value="Confirm Neither is good")
+        elif tie:
+            return gr.update(visible=True, value="Confirm Tie")
+        return gr.update(visible=False)
+    # Initialize the interface
+    demo.load(
+        initialize,
+        outputs=[
+            source_image,
+            image_a,
+            image_b,
+            instruction,
+            simplified_instruction,
+            model_info,
+            state,
+            selected_verdict,
+            a_better_selected,
+            b_better_selected,
+            neither_selected,
+            tie_selected,
+            post_id_display,
+        ],
+    )
+    # Handle first step button clicks
+    a_better_btn.click(
+        lambda state: select_verdict("A is better", state),
+        inputs=[state],
+        outputs=[
+            selected_verdict,
+            a_better_selected,
+            b_better_selected,
+            neither_selected,
+            tie_selected,
+        ],
+    ).then(
+        update_button_styles,
+        inputs=[selected_verdict],
+        outputs=[a_better_btn, b_better_btn, neither_btn, tie_btn],
+    )
+    b_better_btn.click(
+        lambda state: select_verdict("B is better", state),
+        inputs=[state],
+        outputs=[
+            selected_verdict,
+            a_better_selected,
+            b_better_selected,
+            neither_selected,
+            tie_selected,
+        ],
+    ).then(
+        update_button_styles,
+        inputs=[selected_verdict],
+        outputs=[a_better_btn, b_better_btn, neither_btn, tie_btn],
+    )
+    neither_btn.click(
+        lambda state: select_verdict("Neither is good", state),
+        inputs=[state],
+        outputs=[
+            selected_verdict,
+            a_better_selected,
+            b_better_selected,
+            neither_selected,
+            tie_selected,
+        ],
+    ).then(
+        update_button_styles,
+        inputs=[selected_verdict],
+        outputs=[a_better_btn, b_better_btn, neither_btn, tie_btn],
+    )
+    tie_btn.click(
+        lambda state: select_verdict("Tie", state),
+        inputs=[state],
+        outputs=[
+            selected_verdict,
+            a_better_selected,
+            b_better_selected,
+            neither_selected,
+            tie_selected,
+        ],
+    ).then(
+        update_button_styles,
+        inputs=[selected_verdict],
+        outputs=[a_better_btn, b_better_btn, neither_btn, tie_btn],
+    )
+    # Update confirm button visibility when selection changes
+    for checkbox in [
+        a_better_selected,
+        b_better_selected,
+        neither_selected,
+        tie_selected,
+    ]:
+        checkbox.change(
+            update_confirm_visibility,
+            inputs=[
+                a_better_selected,
+                b_better_selected,
+                neither_selected,
+                tie_selected,
+            ],
+            outputs=[confirm_btn],
+        )
+    # Handle confirmation button click
+    confirm_btn.click(
+        lambda verdict, state: evaluate(verdict, state),
+        inputs=[selected_verdict, state],
+        outputs=[
+            source_image,
+            image_a,
+            image_b,
+            instruction,
+            simplified_instruction,
+            model_info,
+            state,
+            selected_verdict,
+            a_better_selected,
+            b_better_selected,
+            neither_selected,
+            tie_selected,
+            a_better_btn,
+            b_better_btn,
+            neither_btn,
+            tie_btn,
+            post_id_display,
+        ],
+    )
+# Launch the Gradio app only when this file is executed as a script.
+if __name__ == "__main__":
+    demo.launch()

photoexp_filtered.csv ADDED Viewed

The diff for this file is too large to render. See raw diff