Spaces:

2dogey
/

VenusFactory

Runtime error

App Files Files Community

VenusFactory / src /web /predict_tab.py

2dogey

Upload folder using huggingface_hub

8918ac7 verified about 1 month ago

raw

history blame contribute delete

94.7 kB

	import gradio as gr
	import json
	import os
	import subprocess
	import sys
	import signal
	import threading
	import queue
	import time
	import pandas as pd
	import tempfile
	import csv
	from pathlib import Path
	import traceback
	import re
	from web.utils.command import preview_predict_command
	import select

	def create_predict_tab(constant):
	plm_models = constant["plm_models"]
	is_predicting = False
	current_process = None
	output_queue = queue.Queue()
	stop_thread = False
	process_aborted = False # Flag indicating if the process was manually terminated

	def process_output(process, queue):
	"""Process output from subprocess and put it in queue"""
	nonlocal stop_thread
	while True:
	if stop_thread:
	break
	output = process.stdout.readline()
	if output == '' and process.poll() is not None:
	break
	if output:
	queue.put(output.strip())
	process.stdout.close()

	def generate_status_html(status_info):
	"""Generate HTML for single sequence prediction status"""
	stage = status_info.get("current_step", "Preparing")
	status = status_info.get("status", "running")

	# Determine status color and icon
	if status == "running":
	status_color = "#4285f4" # Blue
	icon = "⏳"
	animation = """
	@keyframes pulse {
	0% { transform: scale(1); }
	50% { transform: scale(1.05); }
	100% { transform: scale(1); }
	}
	"""
	animation_style = "animation: pulse 1.5s infinite ease-in-out;"
	elif status == "completed":
	status_color = "#2ecc71" # Green
	icon = "✅"
	animation = ""
	animation_style = ""
	else: # failed
	status_color = "#e74c3c" # Red
	icon = "❌"
	animation = ""
	animation_style = ""

	# Create a clean, centered notification
	return f"""
	<div style="text-align: center; background-color: white; padding: 30px; border-radius: 8px; box-shadow: 0 2px 4px rgba(0,0,0,0.1); margin: 20px 0;">
	<div style="display: inline-block; background-color: {status_color}; color: white; border-radius: 50%; width: 60px; height: 60px; line-height: 60px; font-size: 24px; margin-bottom: 15px; {animation_style}">
	{icon}
	</div>
	<h2 style="color: #2c3e50; margin: 10px 0; font-size: 20px;">{stage}</h2>
	<p style="color: #7f8c8d; font-size: 16px;">{status.capitalize()}</p>
	<style>
	{animation}
	</style>
	</div>
	"""

	def predict_sequence(plm_model, model_path, aa_seq, eval_method, eval_structure_seq, pooling_method, problem_type, num_labels):
	"""Predict for a single protein sequence"""
	nonlocal is_predicting, current_process, stop_thread, process_aborted

	# Check if we're already predicting
	if is_predicting:
	return gr.HTML("""
	<div style="padding: 10px; background-color: #fff8e1; border-radius: 5px;">
	<p style="margin: 0; color: #f57f17; font-weight: bold;">A prediction is already running. Please wait or abort it.</p>
	</div>
	""")

	# If the process was aborted but not reset properly, ensure we're in a clean state
	if process_aborted:
	process_aborted = False

	# Set the prediction flag
	is_predicting = True
	stop_thread = False # Ensure this is reset

	# Create a status info object, similar to batch prediction
	status_info = {
	"status": "running",
	"current_step": "Starting prediction"
	}

	# Show initial status
	yield generate_status_html(status_info)

	try:
	# Validate inputs
	if not model_path:
	is_predicting = False
	return gr.HTML("""
	<div class="error-container">
	<div class="error-icon">❌</div>
	<div class="error-message">Please provide a model path</div>
	</div>
	<style>
	.error-container {
	background-color: #fff5f5;
	border-left: 5px solid #f56565;
	padding: 15px;
	border-radius: 5px;
	margin: 10px 0;
	}
	.error-icon {
	font-size: 20px;
	margin-bottom: 8px;
	}
	.error-message {
	font-weight: 500;
	}
	</style>
	""")

	if not os.path.exists(os.path.dirname(model_path)):
	is_predicting = False
	return gr.HTML("""
	<div class="error-container">
	<div class="error-icon">❌</div>
	<div class="error-message">Invalid model path - directory does not exist</div>
	</div>
	<style>
	.error-container {
	background-color: #fff5f5;
	border-left: 5px solid #f56565;
	padding: 15px;
	border-radius: 5px;
	margin: 10px 0;
	}
	.error-icon {
	font-size: 20px;
	margin-bottom: 8px;
	}
	.error-message {
	font-weight: 500;
	}
	</style>
	""")

	if not aa_seq:
	is_predicting = False
	return gr.HTML("""
	<div class="error-container">
	<div class="error-icon">❌</div>
	<div class="error-message">Amino acid sequence is required</div>
	</div>
	<style>
	.error-container {
	background-color: #fff5f5;
	border-left: 5px solid #f56565;
	padding: 15px;
	border-radius: 5px;
	margin: 10px 0;
	}
	.error-icon {
	font-size: 20px;
	margin-bottom: 8px;
	}
	.error-message {
	font-weight: 500;
	}
	</style>
	""")

	# Update status
	status_info["current_step"] = "Preparing model and parameters"
	yield generate_status_html(status_info)

	# Prepare command
	args_dict = {
	"model_path": model_path,
	"plm_model": plm_models[plm_model],
	"aa_seq": aa_seq,
	"pooling_method": pooling_method,
	"problem_type": problem_type,
	"num_labels": num_labels,
	"eval_method": eval_method
	}

	if eval_method == "ses-adapter":
	# Handle structure sequence selection from multi-select dropdown
	args_dict["structure_seq"] = ",".join(eval_structure_seq) if eval_structure_seq else None

	# Set flags based on selected structure sequences
	if eval_structure_seq:
	if "foldseek_seq" in eval_structure_seq:
	args_dict["use_foldseek"] = True
	if "ss8_seq" in eval_structure_seq:
	args_dict["use_ss8"] = True
	else:
	args_dict["structure_seq"] = None
	args_dict["use_foldseek"] = False
	args_dict["use_ss8"] = False

	# Build command line
	final_cmd = [sys.executable, "src/predict.py"]
	for k, v in args_dict.items():
	if v is True:
	final_cmd.append(f"--{k}")
	elif v is not False and v is not None:
	final_cmd.append(f"--{k}")
	final_cmd.append(str(v))

	# Update status
	status_info["current_step"] = "Starting prediction process"
	yield generate_status_html(status_info)

	# Start prediction process
	try:
	current_process = subprocess.Popen(
	final_cmd,
	stdout=subprocess.PIPE,
	stderr=subprocess.STDOUT,
	text=True,
	bufsize=1,
	universal_newlines=True,
	preexec_fn=os.setsid if hasattr(os, "setsid") else None
	)
	except Exception as e:
	is_predicting = False
	return gr.HTML(f"""
	<div class="error-container">
	<div class="error-icon">❌</div>
	<div class="error-message">Error starting prediction process: {str(e)}</div>
	</div>
	<style>
	"""+"""
	.error-container {
	background-color: #fff5f5;
	border-left: 5px solid #f56565;
	padding: 15px;
	border-radius: 5px;
	margin: 10px 0;
	}
	.error-icon {
	font-size: 20px;
	margin-bottom: 8px;
	}
	.error-message {
	font-weight: 500;
	}
	</style>
	""")

	output_thread = threading.Thread(target=process_output, args=(current_process, output_queue))
	output_thread.daemon = True
	output_thread.start()

	# Collect output
	result_output = ""
	prediction_data = None
	json_str = ""
	in_json_block = False
	json_lines = []

	# Update status
	status_info["current_step"] = "Processing sequence"
	yield generate_status_html(status_info)

	while current_process.poll() is None:
	# Check if the process was aborted
	if process_aborted or stop_thread:
	break

	try:
	while not output_queue.empty():
	line = output_queue.get_nowait()
	result_output += line + "\n"

	# Update status with more meaningful messages
	if "Loading model" in line:
	status_info["current_step"] = "Loading model and tokenizer"
	elif "Processing sequence" in line:
	status_info["current_step"] = "Processing protein sequence"
	elif "Tokenizing" in line:
	status_info["current_step"] = "Tokenizing sequence"
	elif "Forward pass" in line:
	status_info["current_step"] = "Running model inference"
	elif "Making prediction" in line:
	status_info["current_step"] = "Calculating final prediction"
	elif "Prediction Results" in line:
	status_info["current_step"] = "Finalizing results"

	# Update status display
	yield generate_status_html(status_info)

	# Detect start of JSON results block
	if "---------- Prediction Results ----------" in line:
	in_json_block = True
	json_lines = []
	continue

	# If in JSON block, collect JSON lines
	if in_json_block and line.strip():
	json_lines.append(line.strip())

	# Try to parse the complete JSON when we have multiple lines
	if line.strip() == "}": # Potential end of JSON object
	try:
	complete_json = " ".join(json_lines)
	# Clean up the JSON string by removing line breaks and extra spaces
	complete_json = re.sub(r'\s+', ' ', complete_json).strip()
	prediction_data = json.loads(complete_json)
	print(f"Successfully parsed complete JSON: {prediction_data}")
	except json.JSONDecodeError as e:
	print(f"Failed to parse complete JSON: {e}")

	time.sleep(0.1)
	except Exception as e:
	yield gr.HTML(f"""
	<div class="warning-container">
	<div class="warning-icon">⚠️</div>
	<div class="warning-message">Warning reading output: {str(e)}</div>
	</div>
	<style>"""+"""
	.warning-container {
	background-color: #fffbea;
	border-left: 5px solid #ecc94b;
	padding: 15px;
	border-radius: 5px;
	margin: 10px 0;
	}
	.warning-icon {
	font-size: 20px;
	margin-bottom: 8px;
	}
	.warning-message {
	font-weight: 500;
	}
	</style>
	""")

	# Check if the process was aborted
	if process_aborted:
	# Show aborted message
	abort_html = """
	<div style="padding: 10px; background-color: #fff8e1; border-radius: 5px;">
	<p style="margin: 0; color: #f57f17; font-weight: bold;">Prediction was aborted by user</p>
	</div>
	"""
	yield gr.HTML(abort_html)
	is_predicting = False
	return

	# Process has completed
	if current_process and current_process.returncode == 0:
	# Update status
	status_info["status"] = "completed"
	status_info["current_step"] = "Prediction completed successfully"
	yield generate_status_html(status_info)

	# If no prediction data found, try to parse from complete output
	if not prediction_data:
	try:
	# Find the JSON block in the output
	results_marker = "---------- Prediction Results ----------"
	if results_marker in result_output:
	json_part = result_output.split(results_marker)[1].strip()

	# Try to extract the JSON object
	json_match = re.search(r'(\{.*?\})', json_part.replace('\n', ' '), re.DOTALL)
	if json_match:
	try:
	json_str = json_match.group(1)
	# Clean up the JSON string
	json_str = re.sub(r'\s+', ' ', json_str).strip()
	prediction_data = json.loads(json_str)
	print(f"Parsed prediction data from regex: {prediction_data}")
	except json.JSONDecodeError as e:
	print(f"JSON parse error from regex: {e}")
	except Exception as e:
	print(f"Error parsing JSON from complete output: {e}")

	if prediction_data:
	# Create styled HTML table based on problem type
	if problem_type == "regression":
	html_result = f"""
	<div class="results-container">
	<h2>Regression Prediction Results</h2>
	<table class='styled-table'>
	<thead>
	<tr><th style="width:50%; text-align:center">Output</th><th style="width:50%; text-align:center">Value</th></tr>
	</thead>
	<tbody>
	<tr><td style="text-align:center">Predicted Value</td><td style="text-align:center">{prediction_data['prediction']:.4f}</td></tr>
	</tbody>
	</table>
	</div>
	"""
	elif problem_type == "single_label_classification":
	# Create probability table
	prob_rows = ""
	if isinstance(prediction_data.get('probabilities'), list):
	prob_rows = "".join([
	f"<tr><td style='text-align:center'>Class {i}</td><td style='text-align:center'>{prob:.4f}</td></tr>"
	for i, prob in enumerate(prediction_data['probabilities'])
	])
	elif isinstance(prediction_data.get('probabilities'), dict):
	prob_rows = "".join([
	f"<tr><td style='text-align:center'>Class {label}</td><td style='text-align:center'>{prob:.4f}</td></tr>"
	for label, prob in prediction_data['probabilities'].items()
	])
	else:
	# Handle case where probabilities is not a list or dict
	prob_value = prediction_data.get('probabilities', 0)
	prob_rows = f"<tr><td style='text-align:center'>Class 0</td><td style='text-align:center'>{prob_value:.4f}</td></tr>"

	html_result = f"""
	<div class="results-container">
	<h2>Single-Label Classification Results</h2>
	<table class='styled-table'>
	<thead>
	<tr><th style="width:50%; text-align:center">Output</th><th style="width:50%; text-align:center">Value</th></tr>
	</thead>
	<tbody>
	<tr><td style="text-align:center">Predicted Class</td><td style="text-align:center">{prediction_data['predicted_class']}</td></tr>
	</tbody>
	</table>
	<h3 style='margin-top: 25px; margin-bottom: 15px;'>Class Probabilities</h3>
	<table class='styled-table'>
	<thead>
	<tr><th style="width:50%; text-align:center">Class</th><th style="width:50%; text-align:center">Probability</th></tr>
	</thead>
	<tbody>
	{prob_rows}
	</tbody>
	</table>
	</div>
	"""
	else: # multi_label_classification
	# Create prediction table
	pred_rows = ""
	if 'predictions' in prediction_data and 'probabilities' in prediction_data:
	# Handle different formats of predictions and probabilities
	if (isinstance(prediction_data['predictions'], list) and
	isinstance(prediction_data['probabilities'], list)):
	pred_rows = "".join([
	f"<tr><td style='width:33.33%; text-align:center'>Label {i}</td><td style='width:33.33%; text-align:center'>{pred}</td><td style='width:33.33%; text-align:center'>{prob:.4f}</td></tr>"
	for i, (pred, prob) in enumerate(zip(prediction_data['predictions'], prediction_data['probabilities']))
	])
	elif (isinstance(prediction_data['predictions'], dict) and
	isinstance(prediction_data['probabilities'], dict)):
	pred_rows = "".join([
	f"<tr><td style='width:33.33%; text-align:center'>Label {label}</td><td style='width:33.33%; text-align:center'>{pred}</td><td style='width:33.33%; text-align:center'>{prediction_data['probabilities'].get(label, 0):.4f}</td></tr>"
	for label, pred in prediction_data['predictions'].items()
	])
	else:
	# Handle case where predictions or probabilities is not a list or dict
	pred = prediction_data['predictions'] if 'predictions' in prediction_data else "N/A"
	prob = prediction_data['probabilities'] if 'probabilities' in prediction_data else 0.0
	pred_rows = f"<tr><td style='width:33.33%; text-align:center'>Label 0</td><td style='width:33.33%; text-align:center'>{pred}</td><td style='width:33.33%; text-align:center'>{prob:.4f}</td></tr>"
	else:
	# Handle other prediction data formats
	for key, value in prediction_data.items():
	if 'label' in key.lower() or 'class' in key.lower():
	label_name = key
	label_value = value
	prob_value = prediction_data.get(f"{key}_prob", 0.0)
	pred_rows += f"<tr><td style='width:33.33%; text-align:center'>{label_name}</td><td style='width:33.33%; text-align:center'>{label_value}</td><td style='width:33.33%; text-align:center'>{prob_value:.4f}</td></tr>"

	html_result = f"""
	<div class="results-container">
	<h2>Multi-Label Classification Results</h2>
	<table class='styled-table'>
	<thead>
	<tr><th style="width:33.33%; text-align:center">Label</th><th style="width:33.33%; text-align:center">Prediction</th><th style="width:33.33%; text-align:center">Probability</th></tr>
	</thead>
	<tbody>
	{pred_rows}
	</tbody>
	</table>
	</div>
	"""

	# Add CSS styling
	html_result += """
	<style>
	.results-container {
	background-color: white;
	border-radius: 8px;
	box-shadow: 0 2px 4px rgba(0, 0, 0, 0.1);
	padding: 20px;
	margin-bottom: 20px;
	}

	.results-container h2 {
	color: #2c3e50;
	text-align: center;
	margin-bottom: 20px;
	font-size: 20px;
	}

	.results-container h3 {
	color: #2c3e50;
	text-align: center;
	margin-bottom: 15px;
	font-size: 18px;
	}

	.styled-table {
	border-collapse: collapse;
	margin: 25px auto;
	font-size: 14px;
	font-family: sans-serif;
	min-width: 400px;
	box-shadow: 0 2px 4px rgba(0, 0, 0, 0.1);
	border-radius: 6px;
	overflow: hidden;
	}
	.styled-table thead tr {
	background-color: #e0e0e0;
	color: #2c3e50;
	text-align: center;
	}
	.styled-table th {
	padding: 8px;
	font-size: 14px;
	border: 1px solid #ddd;
	font-weight: bold;
	border-bottom: 1px solid #ccc;
	}
	.styled-table td {
	padding: 15px;
	font-size: 14px;
	border: 1px solid #ddd;
	text-align: center;
	}
	.styled-table tbody tr {
	border-bottom: 1px solid #ddd;
	}
	.styled-table tbody tr:nth-of-type(even) {
	background-color: #f9f9f9;
	}
	.styled-table tbody tr:hover {
	background-color: #f0f0f0;
	}
	</style>
	"""
	yield gr.HTML(html_result)
	else:
	# If no prediction data found, display raw output
	yield gr.HTML(f"""
	<div style='text-align:center; background-color: white; padding: 30px; border-radius: 8px;'>
	<h2 style='margin-bottom: 20px;'>Prediction Completed</h2>
	<p>No prediction results found in output.</p>
	<div style='text-align:left; max-height: 400px; overflow-y: auto; background-color: white; padding: 10px; border: 1px solid #dddddd; border-radius: 5px;'>
	<pre>{result_output}</pre>
	</div>
	</div>
	""")
	else:
	# Update status
	status_info["status"] = "failed"
	status_info["current_step"] = "Prediction failed"
	yield generate_status_html(status_info)

	stderr_output = ""
	if current_process and hasattr(current_process, 'stderr') and current_process.stderr:
	stderr_output = current_process.stderr.read()
	yield gr.HTML(f"""
	<div style='text-align:center; background-color: white; padding: 30px; border-radius: 8px;'>
	<h2 style='margin-bottom: 20px;'>Prediction Failed</h2>
	<p>Error code: {current_process.returncode if current_process else 'Unknown'}</p>
	<div style='text-align:left; max-height: 400px; overflow-y: auto; background-color: white; padding: 10px; border: 1px solid #dddddd; border-radius: 5px;'>
	<pre>{stderr_output}\n{result_output}</pre>
	</div>
	</div>
	""")
	except Exception as e:
	# Update status
	status_info["status"] = "failed"
	status_info["current_step"] = "Error occurred"
	yield generate_status_html(status_info)

	yield gr.HTML(f"""
	<div style='text-align:center; background-color: white; padding: 30px; border-radius: 8px;'>
	<h2 style='margin-bottom: 20px;'>Error</h2>
	<p>{str(e)}</p>
	<div style='text-align:left; max-height: 400px; overflow-y: auto; background-color: white; padding: 10px; border: 1px solid #dddddd; border-radius: 5px;'>
	<pre>{traceback.format_exc()}</pre>
	</div>
	</div>
	""")
	finally:
	# Reset state
	is_predicting = False

	# Properly clean up the process
	if current_process and current_process.poll() is None:
	try:
	# Use process group ID to kill all related processes if possible
	if hasattr(os, "killpg") and hasattr(os, "getpgid"):
	os.killpg(os.getpgid(current_process.pid), signal.SIGTERM)
	else:
	# On Windows or if killpg is not available
	current_process.terminate()

	# Wait briefly for termination
	try:
	current_process.wait(timeout=1)
	except subprocess.TimeoutExpired:
	# Force kill if necessary
	if hasattr(os, "killpg") and hasattr(os, "getpgid"):
	os.killpg(os.getpgid(current_process.pid), signal.SIGKILL)
	else:
	current_process.kill()
	except Exception as e:
	# Ignore errors during process cleanup
	print(f"Error cleaning up process: {e}")

	# Reset process reference
	current_process = None
	stop_thread = False

	def predict_batch(plm_model, model_path, eval_method, input_file, eval_structure_seq, pooling_method, problem_type, num_labels, batch_size):
	"""Batch predict multiple protein sequences"""
	nonlocal is_predicting, current_process, stop_thread, process_aborted

	# Check if we're already predicting (this check is performed first)
	if is_predicting:
	return gr.HTML("""
	<div style="padding: 10px; background-color: #fff8e1; border-radius: 5px;">
	<p style="margin: 0; color: #f57f17; font-weight: bold;">A prediction is already running. Please wait or abort it.</p>
	</div>
	"""), gr.update(visible=False)

	# If the process was aborted but not reset properly, ensure we're in a clean state
	if process_aborted:
	process_aborted = False

	# Reset all state completely
	is_predicting = True
	stop_thread = False

	# Clear the output queue
	while not output_queue.empty():
	try:
	output_queue.get_nowait()
	except queue.Empty:
	break

	# Initialize progress tracking with completely fresh state
	progress_info = {
	"total": 0,
	"completed": 0,
	"current_step": "Initializing",
	"status": "running",
	"lines": [] # Store lines for error handling
	}

	# Generate completely empty initial progress display
	initial_progress_html = """
	<div style="max-width: 100%; margin: 0 auto; font-family: system-ui, -apple-system, BlinkMacSystemFont, 'Segoe UI', Roboto, sans-serif;">
	<div style="padding: 20px; background-color: #f8f9fa; border-radius: 10px; box-shadow: 0 2px 5px rgba(0,0,0,0.05);">
	<div style="display: flex; justify-content: space-between; margin-bottom: 12px; align-items: center;">
	<div style="display: flex; align-items: center;">
	<span style="display: inline-block; width: 12px; height: 12px; border-radius: 50%; background-color: #3498db; margin-right: 10px; animation: pulse 1s infinite;"></span>
	<span style="font-weight: 600; font-size: 16px;">Initializing prediction environment...</span>
	</div>
	<span style="font-weight: 500; color: #3498db;">0%</span>
	</div>
	<div style="width: 100%; height: 8px; background-color: #e0e0e0; border-radius: 4px; overflow: hidden;">
	<div style="width: 0%; height: 100%; background-color: #3498db; border-radius: 4px;"></div>
	</div>
	<div style="margin-top: 10px; font-size: 14px; color: #666;">
	<p style="margin: 5px 0;">Sequences: 0/0</p>
	</div>
	</div>
	</div>
	<style>
	@keyframes pulse {
	0% { opacity: 0.4; }
	50% { opacity: 1; }
	100% { opacity: 0.4; }
	}
	</style>
	"""

	# Always ensure the download button is hidden when starting a new prediction
	yield gr.HTML(initial_progress_html), gr.update(visible=False)

	try:
	# Check abort state before continuing
	if process_aborted:
	is_predicting = False
	return gr.HTML("""
	<div style="padding: 10px; background-color: #e8f5e9; border-radius: 5px;">
	<p style="margin: 0; color: #2e7d32; font-weight: bold;">Process was aborted.</p>
	</div>
	"""), gr.update(visible=False)

	# Validate inputs
	if not model_path:
	is_predicting = False
	yield gr.HTML("""
	<div style="padding: 10px; background-color: #ffebee; border-radius: 5px;">
	<p style="margin: 0; color: #c62828; font-weight: bold;">Error: Model path is required</p>
	</div>
	"""), gr.update(visible=False)
	return

	if not os.path.exists(os.path.dirname(model_path)):
	is_predicting = False
	yield gr.HTML("""
	<div style="padding: 10px; background-color: #ffebee; border-radius: 5px;">
	<p style="margin: 0; color: #c62828; font-weight: bold;">Error: Invalid model path - directory does not exist</p>
	</div>
	"""), gr.update(visible=False)
	return

	if not input_file:
	is_predicting = False
	yield gr.HTML("""
	<div style="padding: 10px; background-color: #ffebee; border-radius: 5px;">
	<p style="margin: 0; color: #c62828; font-weight: bold;">Error: Input file is required</p>
	</div>
	"""), gr.update(visible=False)
	return

	# Update progress
	progress_info["current_step"] = "Preparing input file"
	yield generate_progress_html(progress_info), gr.update(visible=False)

	# Create temporary file to save uploaded file
	temp_dir = tempfile.mkdtemp()
	input_path = os.path.join(temp_dir, "input.csv")
	output_dir = temp_dir # Use the same temporary directory as output directory
	output_file = "predictions.csv"
	output_path = os.path.join(output_dir, output_file)

	# Save uploaded file
	try:
	with open(input_path, "wb") as f:
	# Fix file upload error, correctly handle files uploaded through gradio
	if hasattr(input_file, "name"):
	# If it's a NamedString object, read the file content
	with open(input_file.name, "rb") as uploaded:
	f.write(uploaded.read())
	else:
	# If it's a bytes object, write directly
	f.write(input_file)

	# Verify file was saved correctly
	if not os.path.exists(input_path):
	is_predicting = False
	yield gr.HTML("""
	<div style="padding: 10px; background-color: #ffebee; border-radius: 5px;">
	<p style="margin: 0; color: #c62828; font-weight: bold;">Error: Failed to save input file</p>
	</div>
	"""), gr.update(visible=False)
	progress_info["status"] = "failed"
	progress_info["current_step"] = "Failed to save input file"
	return

	# Count sequences in input file
	try:
	df = pd.read_csv(input_path)
	progress_info["total"] = len(df)
	progress_info["current_step"] = f"Found {len(df)} sequences to process"
	yield generate_progress_html(progress_info), gr.update(visible=False)
	except Exception as e:
	is_predicting = False
	yield gr.HTML(f"""
	<div style="padding: 10px; background-color: #ffebee; border-radius: 5px;">
	<p style="margin: 0; color: #c62828; font-weight: bold;">Error reading CSV file:</p>
	<pre style="margin: 5px 0 0; white-space: pre-wrap; max-height: 300px; overflow-y: auto;">{str(e)}</pre>
	</div>
	"""), gr.update(visible=False)
	progress_info["status"] = "failed"
	progress_info["current_step"] = "Error reading CSV file"
	return

	except Exception as e:
	is_predicting = False
	yield gr.HTML(f"""
	<div style="padding: 10px; background-color: #ffebee; border-radius: 5px;">
	<p style="margin: 0; color: #c62828; font-weight: bold;">Error saving input file:</p>
	<pre style="margin: 5px 0 0; white-space: pre-wrap; max-height: 300px; overflow-y: auto;">{str(e)}</pre>
	</div>
	"""), gr.update(visible=False)
	progress_info["status"] = "failed"
	progress_info["current_step"] = "Failed to save input file"
	return

	# Update progress
	progress_info["current_step"] = "Preparing model and parameters"
	yield generate_progress_html(progress_info), gr.update(visible=False)

	# Prepare command
	args_dict = {
	"model_path": model_path,
	"plm_model": plm_models[plm_model],
	"input_file": input_path,
	"output_dir": output_dir, # Update to output directory
	"output_file": output_file, # Output filename
	"pooling_method": pooling_method,
	"problem_type": problem_type,
	"num_labels": num_labels,
	"eval_method": eval_method,
	"batch_size": batch_size
	}

	if eval_method == "ses-adapter":
	args_dict["structure_seq"] = ",".join(eval_structure_seq) if eval_structure_seq else None
	if eval_structure_seq:
	if "foldseek_seq" in eval_structure_seq:
	args_dict["use_foldseek"] = True
	if "ss8_seq" in eval_structure_seq:
	args_dict["use_ss8"] = True
	else:
	args_dict["structure_seq"] = None

	# Build command line
	final_cmd = [sys.executable, "src/predict_batch.py"]
	for k, v in args_dict.items():
	if v is True:
	final_cmd.append(f"--{k}")
	elif v is not False and v is not None:
	final_cmd.append(f"--{k}")
	final_cmd.append(str(v))

	# Update progress
	progress_info["current_step"] = "Starting batch prediction process"
	yield generate_progress_html(progress_info), gr.update(visible=False)

	# Start prediction process
	try:
	current_process = subprocess.Popen(
	final_cmd,
	stdout=subprocess.PIPE,
	stderr=subprocess.STDOUT,
	text=True,
	bufsize=1,
	universal_newlines=True,
	preexec_fn=os.setsid if hasattr(os, "setsid") else None
	)
	except Exception as e:
	is_predicting = False
	yield gr.HTML(f"""
	<div style="padding: 10px; background-color: #ffebee; border-radius: 5px;">
	<p style="margin: 0; color: #c62828; font-weight: bold;">Error starting prediction process:</p>
	<pre style="margin: 5px 0 0; white-space: pre-wrap; max-height: 300px; overflow-y: auto;">{str(e)}</pre>
	</div>
	"""), gr.update(visible=False)
	return

	output_thread = threading.Thread(target=process_output, args=(current_process, output_queue))
	output_thread.daemon = True
	output_thread.start()

	# Start monitoring loop
	last_update_time = time.time()
	result_output = ""

	# Modified processing loop with abort check
	while True:
	# Check if process was aborted or completed
	if process_aborted or current_process is None or current_process.poll() is not None:
	break

	# Check for new output
	try:
	# Get new lines
	new_lines = []
	for _ in range(10): # Process up to 10 lines at once
	try:
	line = output_queue.get_nowait()
	new_lines.append(line)
	result_output += line + "\n"
	progress_info["lines"].append(line)

	# Update progress based on output
	if "Predicting:" in line:
	try:
	# Extract progress from tqdm output
	match = re.search(r'(\d+)/(\d+)', line)
	if match:
	current, total = map(int, match.groups())
	progress_info["completed"] = current
	progress_info["total"] = total
	progress_info["current_step"] = f"Processing sequence {current}/{total}"
	except:
	pass
	elif "Loading Model and Tokenizer" in line:
	progress_info["current_step"] = "Loading model and tokenizer"
	elif "Processing sequences" in line:
	progress_info["current_step"] = "Processing sequences"
	elif "Saving results" in line:
	progress_info["current_step"] = "Saving results"
	except queue.Empty:
	break

	# Check if the process has been aborted before updating UI
	if process_aborted:
	break

	# Check if we need to update the UI
	current_time = time.time()
	if new_lines or (current_time - last_update_time >= 0.5):
	yield generate_progress_html(progress_info), gr.update(visible=False)
	last_update_time = current_time

	# Small sleep to avoid busy waiting
	if not new_lines:
	time.sleep(0.1)

	except Exception as e:
	# Check if the process has been aborted before showing error
	if process_aborted:
	break

	error_html = f"""
	<div style="padding: 10px; background-color: #fff8e1; border-radius: 5px;">
	<p style="margin: 0; color: #f57f17; font-weight: bold;">Warning reading output:</p>
	<pre style="margin: 5px 0 0; white-space: pre-wrap; max-height: 300px; overflow-y: auto;">{str(e)}</pre>
	</div>
	"""
	yield gr.HTML(error_html), gr.update(visible=False)

	# Check if aborted instead of completed
	if process_aborted:
	is_predicting = False
	aborted_html = """
	<div style="padding: 10px; background-color: #e8f5e9; border-radius: 5px;">
	<p style="margin: 0; color: #2e7d32; font-weight: bold;">Prediction was manually terminated.</p>
	<p style="margin: 5px 0 0; color: #388e3c;">All prediction state has been reset.</p>
	</div>
	"""
	yield gr.HTML(aborted_html), gr.update(visible=False)
	return

	# Process has completed
	if os.path.exists(output_path):
	if current_process and current_process.returncode == 0:
	progress_info["status"] = "completed"
	# Generate final success HTML
	success_html = f"""
	<div style="padding: 15px; background-color: #e8f5e9; border-radius: 5px; margin-bottom: 10px;">
	<p style="margin: 0; color: #2e7d32; font-weight: bold;">Prediction completed successfully!</p>
	<p style="margin: 5px 0 0;">Results saved to: {output_path}</p>
	<p style="margin: 5px 0 0;">Total sequences processed: {progress_info.get('total', 0)}</p>
	</div>
	"""

	# Read prediction results
	try:
	df = pd.read_csv(output_path)

	# Create summary statistics based on problem type
	summary_html = ""
	if problem_type == "regression":
	summary_html = f"""
	<div class="summary-stats">
	<div class="stat-item">
	<div class="stat-value">{len(df)}</div>
	<div class="stat-label">Predictions</div>
	</div>
	<div class="stat-item">
	<div class="stat-value">{df['prediction'].mean():.4f}</div>
	<div class="stat-label">Mean</div>
	</div>
	<div class="stat-item">
	<div class="stat-value">{df['prediction'].min():.4f}</div>
	<div class="stat-label">Min</div>
	</div>
	<div class="stat-item">
	<div class="stat-value">{df['prediction'].max():.4f}</div>
	<div class="stat-label">Max</div>
	</div>
	</div>
	"""
	elif problem_type == "single_label_classification":
	if 'predicted_class' in df.columns:
	class_counts = df['predicted_class'].value_counts()
	class_stats = "".join([
	f"""
	<div class="stat-item">
	<div class="stat-value">{count}</div>
	<div class="stat-label">Class {class_label}</div>
	</div>
	"""
	for class_label, count in class_counts.items()
	])

	summary_html = f"""
	<div class="summary-stats">
	<div class="stat-item">
	<div class="stat-value">{len(df)}</div>
	<div class="stat-label">Predictions</div>
	</div>
	{class_stats}
	</div>
	"""
	elif problem_type == "multi_label_classification":
	label_cols = [col for col in df.columns if col.startswith('label_') and not col.endswith('_prob')]
	if label_cols:
	label_stats = "".join([
	f"""
	<div class="stat-item">
	<div class="stat-value">{df[col].sum()}</div>
	<div class="stat-label">{col}</div>
	</div>
	"""
	for col in label_cols
	])

	summary_html = f"""
	<div class="summary-stats">
	<div class="stat-item">
	<div class="stat-value">{len(df)}</div>
	<div class="stat-label">Predictions</div>
	</div>
	{label_stats}
	</div>
	"""

	# Create table preview with style consistent with dataset preview
	html_table = f"""
	<div class="results-container">
	<h2>Batch Prediction Results Preview</h2>
	{summary_html}
	<div class="table-wrapper">
	<table class="dataset-preview-table">
	<thead>
	<tr>
	{' '.join([f'<th style="text-align: center;">{col}</th>' for col in df.columns])}
	</tr>
	</thead>
	<tbody>
	{generate_table_rows(df)}
	</tbody>
	</table>
	</div>
	<div class="download-hint">
	<p>You can download the complete prediction results using the button below.</p>
	</div>
	</div>
	"""

	# Add CSS styles
	final_html = success_html + f"""
	{html_table}
	<style>
	.results-container {{
	background-color: white;
	border-radius: 8px;
	box-shadow: 0 2px 4px rgba(0, 0, 0, 0.1);
	padding: 20px;
	margin-bottom: 20px;
	}}

	.results-container h2 {{
	color: #2c3e50;
	text-align: center;
	margin-bottom: 20px;
	font-size: 20px;
	}}

	.results-container h3 {{
	color: #2c3e50;
	text-align: center;
	margin-bottom: 15px;
	font-size: 18px;
	}}

	.summary-stats {{
	display: flex;
	flex-wrap: wrap;
	justify-content: center;
	gap: 15px;
	margin-bottom: 25px;
	}}

	.stat-item {{
	background-color: #f8f9fa;
	border-radius: 6px;
	padding: 12px;
	min-width: 100px;
	text-align: center;
	box-shadow: 0 1px 3px rgba(0, 0, 0, 0.05);
	}}

	.stat-value {{
	font-size: 20px;
	font-weight: bold;
	color: #3498db;
	margin-bottom: 4px;
	text-align: center;
	}}

	.stat-label {{
	font-size: 12px;
	color: #7f8c8d;
	text-align: center;
	}}

	.table-wrapper {{
	max-height: 400px;
	overflow-y: auto;
	margin-bottom: 15px;
	border: 1px solid #ddd;
	border-radius: 6px;
	}}

	/* Match dataset-preview-table style from eval_tab */
	.dataset-preview-table {{
	width: 100%;
	border-collapse: collapse;
	font-size: 14px;
	background-color: white;
	table-layout: fixed;
	}}

	.dataset-preview-table th {{
	padding: 8px;
	font-size: 14px;
	border: 1px solid #ddd;
	background-color: #e0e0e0;
	font-weight: bold;
	border-bottom: 1px solid #ccc;
	text-align: center;
	width: auto;
	}}

	.dataset-preview-table td {{
	padding: 15px;
	font-size: 14px;
	border: 1px solid #ddd;
	text-align: center;
	width: auto;
	}}

	.dataset-preview-table tr:nth-child(even) {{
	background-color: #f9f9f9;
	}}

	.dataset-preview-table tr:hover {{
	background-color: #f0f0f0;
	}}

	.download-hint {{
	text-align: center;
	color: #7f8c8d;
	font-style: italic;
	margin-top: 10px;
	font-size: 12px;
	}}
	</style>
	"""

	# Return results preview and download link
	yield gr.HTML(final_html), gr.update(value=output_path, visible=True)
	except Exception as e:
	# If reading results file fails, show error but still provide download link
	error_html = f"""
	{success_html}
	<div style="padding: 10px; background-color: #fff8e1; border-radius: 5px; margin-top: 10px;">
	<p style="margin: 0; color: #f57f17; font-weight: bold;">Unable to load preview results: {str(e)}</p>
	<p style="margin: 5px 0 0;">You can still download the complete prediction results file.</p>
	</div>
	"""
	yield gr.HTML(error_html), gr.update(value=output_path, visible=True)
	else:
	# Process failed
	error_html = f"""
	<div style="padding: 10px; background-color: #ffebee; border-radius: 5px;">
	<p style="margin: 0; color: #c62828; font-weight: bold;">Prediction failed to complete</p>
	<p style="margin: 5px 0 0;">Process return code: {current_process.returncode if current_process else 'Unknown'}</p>
	<pre style="margin: 5px 0 0; white-space: pre-wrap; max-height: 300px; overflow-y: auto;">{result_output}</pre>
	</div>
	"""
	yield gr.HTML(error_html), gr.update(visible=False)
	else:
	progress_info["status"] = "failed"
	error_html = f"""
	<div style="padding: 10px; background-color: #ffebee; border-radius: 5px;">
	<p style="margin: 0; color: #c62828; font-weight: bold;">Prediction completed, but output file not found at {output_path}</p>
	<pre style="margin: 5px 0 0; white-space: pre-wrap; max-height: 300px; overflow-y: auto;">{result_output}</pre>
	</div>
	"""
	yield gr.HTML(error_html), gr.update(visible=False)
	except Exception as e:
	# Capture the full error with traceback
	error_traceback = traceback.format_exc()

	# Display error with traceback in UI
	error_html = f"""
	<div style="padding: 10px; background-color: #ffebee; border-radius: 5px;">
	<p style="margin: 0; color: #c62828; font-weight: bold;">Error during batch prediction: {str(e)}</p>
	<pre style="margin: 5px 0 0; white-space: pre-wrap; max-height: 300px; overflow-y: auto; background-color: #f8f9fa; padding: 10px; border-radius: 5px; font-family: monospace; font-size: 12px;">{error_traceback}</pre>
	</div>
	"""
	yield gr.HTML(error_html), gr.update(visible=False)
	finally:
	# Always reset prediction state
	is_predicting = False
	if current_process:
	current_process = None
	process_aborted = False # Reset abort flag

	def generate_progress_html(progress_info):
	"""Generate HTML progress bar similar to eval_tab"""
	current = progress_info.get("completed", 0)
	total = max(progress_info.get("total", 1), 1) # Avoid division by zero
	percentage = min(100, int((current / total) * 100))
	stage = progress_info.get("current_step", "Preparing")

	# 确保进度在0-100之间
	percentage = max(0, min(100, percentage))

	# 准备详细信息
	details = []
	if total > 0:
	details.append(f"Total sequences: {total}")
	if current > 0 and total > 0:
	details.append(f"Current progress: {current}/{total}")

	details_text = ", ".join(details)

	# 创建更现代化的进度条 - 完全匹配eval_tab的样式
	return f"""
	<div style="background-color: #f8f9fa; border-radius: 10px; padding: 20px; margin-bottom: 15px; box-shadow: 0 2px 5px rgba(0,0,0,0.05);">
	<div style="display: flex; justify-content: space-between; margin-bottom: 12px;">
	<div>
	<span style="font-weight: 600; font-size: 16px;">Prediction Status: </span>
	<span style="color: #1976d2; font-weight: 500; font-size: 16px;">{stage}</span>
	</div>
	<div>
	<span style="font-weight: 600; color: #333;">{percentage:.1f}%</span>
	</div>
	</div>

	<div style="margin-bottom: 15px; background-color: #e9ecef; height: 10px; border-radius: 5px; overflow: hidden;">
	<div style="background-color: #4285f4; width: {percentage}%; height: 100%; border-radius: 5px; transition: width 0.3s ease;"></div>
	</div>

	<div style="display: flex; flex-wrap: wrap; gap: 10px; font-size: 14px; color: #555;">
	{f'<div style="background-color: #e3f2fd; padding: 5px 10px; border-radius: 4px;"><span style="font-weight: 500;">Total sequences:</span> {total}</div>' if total > 0 else ''}
	{f'<div style="background-color: #e8f5e9; padding: 5px 10px; border-radius: 4px;"><span style="font-weight: 500;">Progress:</span> {current}/{total}</div>' if current > 0 and total > 0 else ''}
	{f'<div style="background-color: #fff8e1; padding: 5px 10px; border-radius: 4px;"><span style="font-weight: 500;">Status:</span> {progress_info.get("status", "").capitalize()}</div>' if "status" in progress_info else ''}
	</div>
	</div>
	"""

	def generate_table_rows(df, max_rows=100):
	"""Generate HTML table rows with special handling for sequence data, maintaining consistent style with eval_tab"""
	rows = []
	for i, row in df.iterrows():
	if i >= max_rows:
	break

	cells = []
	for col in df.columns:
	value = row[col]
	# Special handling for sequence type columns
	if col in ['aa_seq', 'foldseek_seq', 'ss8_seq'] and isinstance(value, str) and len(value) > 30:
	# Add title attribute to show full sequence on hover
	cell = f'<td title="{value}" style="padding: 15px; font-size: 14px; border: 1px solid #ddd; font-family: monospace; text-align: center; vertical-align: middle; display: table-cell; text-align: center;">{value[:30]}...</td>'
	# Format numeric values to 4 decimal places
	elif isinstance(value, (int, float)) and not isinstance(value, bool):
	formatted_value = f"{value:.4f}" if isinstance(value, float) else value
	cell = f'<td style="padding: 15px; font-size: 14px; border: 1px solid #ddd; text-align: center;">{formatted_value}</td>'
	else:
	cell = f'<td style="padding: 15px; font-size: 14px; border: 1px solid #ddd; text-align: center;">{value}</td>'
	cells.append(cell)

	# Add alternating row background color
	bg_color = "#f9f9f9" if i % 2 == 1 else "white"
	rows.append(f'<tr style="background-color: {bg_color};">{" ".join(cells)}</tr>')

	if len(df) > max_rows:
	cols_count = len(df.columns)
	rows.append(f'<tr><td colspan="{cols_count}" style="text-align:center; font-style:italic; padding: 15px; font-size: 14px; border: 1px solid #ddd;">Showing {max_rows} of {len(df)} rows</td></tr>')

	return '\n'.join(rows)

	def handle_abort():
	"""Handle abortion of the prediction process for both single and batch prediction"""
	nonlocal is_predicting, current_process, stop_thread, process_aborted

	if not is_predicting or current_process is None:
	empty_html = """
	<div style="padding: 10px; background-color: #f5f5f5; border-radius: 5px;">
	<p style="margin: 0;">No prediction process is currently running.</p>
	</div>
	"""
	# Return full HTML value (not gr.HTML component)
	return empty_html

	try:
	# Set the abort flag before terminating the process
	process_aborted = True
	stop_thread = True

	# Kill the process group
	if hasattr(os, "killpg"):
	os.killpg(os.getpgid(current_process.pid), signal.SIGTERM)
	else:
	current_process.terminate()

	# Wait for process to terminate (with timeout)
	try:
	current_process.wait(timeout=5)
	except subprocess.TimeoutExpired:
	if hasattr(os, "killpg"):
	os.killpg(os.getpgid(current_process.pid), signal.SIGKILL)
	else:
	current_process.kill()

	# Reset state
	is_predicting = False
	current_process = None

	# Clear output queue
	while not output_queue.empty():
	try:
	output_queue.get_nowait()
	except queue.Empty:
	break

	success_html = """
	<div style="padding: 10px; background-color: #e8f5e9; border-radius: 5px;">
	<p style="margin: 0; color: #2e7d32; font-weight: bold;">Prediction successfully terminated!</p>
	<p style="margin: 5px 0 0; color: #388e3c;">All prediction state has been reset.</p>
	</div>
	"""

	# Return full HTML value (not gr.HTML component)
	return success_html

	except Exception as e:
	# Reset states even on error
	is_predicting = False
	current_process = None
	process_aborted = False

	# Clear queue
	while not output_queue.empty():
	try:
	output_queue.get_nowait()
	except queue.Empty:
	break

	error_html = f"""
	<div style="padding: 10px; background-color: #ffebee; border-radius: 5px;">
	<p style="margin: 0; color: #c62828; font-weight: bold;">Failed to terminate prediction: {str(e)}</p>
	<p style="margin: 5px 0 0; color: #c62828;">Prediction state has been reset.</p>
	</div>
	"""

	# Return full HTML value (not gr.HTML component)
	return error_html

	# Create handler functions for each tab
	def handle_abort_single():
	"""Handle abort for single sequence prediction tab"""
	# Flag the process for abortion first
	nonlocal stop_thread, process_aborted, is_predicting, current_process

	# Only proceed if there's an active prediction
	if not is_predicting or current_process is None:
	return gr.HTML("""
	<div style="padding: 10px; background-color: #f5f5f5; border-radius: 5px;">
	<p style="margin: 0;">No prediction process is currently running.</p>
	</div>
	""")

	# Set the abort flags
	process_aborted = True
	stop_thread = True

	# Terminate the process
	try:
	if hasattr(os, "killpg"):
	os.killpg(os.getpgid(current_process.pid), signal.SIGTERM)
	else:
	current_process.terminate()

	# Wait briefly for termination
	try:
	current_process.wait(timeout=1)
	except subprocess.TimeoutExpired:
	# Force kill if necessary
	if hasattr(os, "killpg"):
	os.killpg(os.getpgid(current_process.pid), signal.SIGKILL)
	else:
	current_process.kill()
	except Exception as e:
	pass # Catch any termination errors

	# Reset state
	is_predicting = False
	current_process = None

	# Return the success message
	return gr.HTML("""
	<div style="padding: 10px; background-color: #e8f5e9; border-radius: 5px;">
	<p style="margin: 0; color: #2e7d32; font-weight: bold;">Prediction successfully terminated!</p>
	<p style="margin: 5px 0 0; color: #388e3c;">All prediction state has been reset.</p>
	</div>
	""")

	def handle_abort_batch():
	"""Handle abort for batch prediction tab"""
	# Flag the process for abortion first
	nonlocal stop_thread, process_aborted, is_predicting, current_process

	# Only proceed if there's an active prediction
	if not is_predicting or current_process is None:
	return gr.HTML("""
	<div style="padding: 10px; background-color: #f5f5f5; border-radius: 5px;">
	<p style="margin: 0;">No prediction process is currently running.</p>
	</div>
	"""), gr.update(visible=False)

	# Set the abort flags
	process_aborted = True
	stop_thread = True

	# Terminate the process
	try:
	if hasattr(os, "killpg"):
	os.killpg(os.getpgid(current_process.pid), signal.SIGTERM)
	else:
	current_process.terminate()

	# Wait briefly for termination
	try:
	current_process.wait(timeout=1)
	except subprocess.TimeoutExpired:
	# Force kill if necessary
	if hasattr(os, "killpg"):
	os.killpg(os.getpgid(current_process.pid), signal.SIGKILL)
	else:
	current_process.kill()
	except Exception as e:
	pass # Catch any termination errors

	# Reset state
	is_predicting = False
	current_process = None

	# Clear output queue
	while not output_queue.empty():
	try:
	output_queue.get_nowait()
	except queue.Empty:
	break

	# Return the success message and hide the download button
	return gr.HTML("""
	<div style="padding: 10px; background-color: #e8f5e9; border-radius: 5px;">
	<p style="margin: 0; color: #2e7d32; font-weight: bold;">Prediction successfully terminated!</p>
	<p style="margin: 5px 0 0; color: #388e3c;">All prediction state has been reset.</p>
	</div>
	"""), gr.update(visible=False)

	def handle_preview(plm_model, model_path, eval_method, aa_seq, foldseek_seq, ss8_seq, eval_structure_seq, pooling_method, problem_type, num_labels):
	"""处理单序列预测命令预览"""
	# 构建参数字典
	args_dict = {
	"model_path": model_path,
	"plm_model": plm_models[plm_model],
	"aa_seq": aa_seq,
	"foldseek_seq": foldseek_seq if foldseek_seq else "",
	"ss8_seq": ss8_seq if ss8_seq else "",
	"pooling_method": pooling_method,
	"problem_type": problem_type,
	"num_labels": num_labels,
	"eval_method": eval_method
	}

	if eval_method == "ses-adapter":
	args_dict["structure_seq"] = ",".join(eval_structure_seq) if eval_structure_seq else None
	if eval_structure_seq:
	if "foldseek_seq" in eval_structure_seq:
	args_dict["use_foldseek"] = True
	if "ss8_seq" in eval_structure_seq:
	args_dict["use_ss8"] = True

	# 生成预览命令
	preview_text = preview_predict_command(args_dict, is_batch=False)
	return gr.update(value=preview_text, visible=True)

	def handle_batch_preview(plm_model, model_path, eval_method, input_file, eval_structure_seq, pooling_method, problem_type, num_labels, batch_size):
	"""处理批量预测命令预览"""
	if not input_file:
	return gr.update(value="Please upload a file first", visible=True)

	# 创建临时目录作为输出目录
	temp_dir = "temp_predictions"
	output_file = "predictions.csv"

	args_dict = {
	"model_path": model_path,
	"plm_model": plm_models[plm_model],
	"input_file": input_file.name if hasattr(input_file, "name") else "input.csv",
	"output_dir": temp_dir, # 新增输出目录参数
	"output_file": output_file, # 输出文件名
	"pooling_method": pooling_method,
	"problem_type": problem_type,
	"num_labels": num_labels,
	"eval_method": eval_method,
	"batch_size": batch_size
	}

	if eval_method == "ses-adapter":
	args_dict["structure_seq"] = ",".join(eval_structure_seq) if eval_structure_seq else None
	if eval_structure_seq:
	if "foldseek_seq" in eval_structure_seq:
	args_dict["use_foldseek"] = True
	if "ss8_seq" in eval_structure_seq:
	args_dict["use_ss8"] = True

	# 生成预览命令
	preview_text = preview_predict_command(args_dict, is_batch=True)
	return gr.update(value=preview_text, visible=True)

	with gr.Tab("Prediction"):
	with gr.Row():
	with gr.Column():
	gr.Markdown("## Protein Function Prediction")

	gr.Markdown("### Model Configuration")
	with gr.Group():

	with gr.Row():
	model_path = gr.Textbox(
	label="Model Path",
	value="ckpt/demo/demo_provided.pt",
	placeholder="Path to the trained model"
	)
	plm_model = gr.Dropdown(
	choices=list(plm_models.keys()),
	label="Protein Language Model"
	)

	with gr.Row():
	eval_method = gr.Dropdown(
	choices=["full", "freeze", "ses-adapter", "plm-lora", "plm-qlora", "plm_adalora", "plm_dora", "plm_ia3"],
	label="Evaluation Method",
	value="freeze"
	)
	pooling_method = gr.Dropdown(
	choices=["mean", "attention1d", "light_attention"],
	label="Pooling Method",
	value="mean"
	)

	# Settings for different training methods
	with gr.Row(visible=False) as structure_seq_row:
	structure_seq = gr.Dropdown(
	choices=["foldseek_seq", "ss8_seq"],
	label="Structure Sequences",
	multiselect=True,
	value=["foldseek_seq", "ss8_seq"],
	info="Select the structure sequences to use for prediction"
	)


	with gr.Row():
	problem_type = gr.Dropdown(
	choices=["single_label_classification", "multi_label_classification", "regression"],
	label="Problem Type",
	value="single_label_classification"
	)
	num_labels = gr.Number(
	value=2,
	label="Number of Labels",
	precision=0,
	minimum=1
	)

	with gr.Tabs():
	with gr.Tab("Sequence Prediction"):
	gr.Markdown("### Input Sequences")
	with gr.Row():
	aa_seq = gr.Textbox(
	label="Amino Acid Sequence",
	placeholder="Enter protein sequence",
	lines=3
	)
	# Put the structure input rows in a row with controllable visibility
	with gr.Row(visible=False) as structure_input_row:
	foldseek_seq = gr.Textbox(
	label="Foldseek Sequence",
	placeholder="Enter foldseek sequence if available",
	lines=3
	)
	ss8_seq = gr.Textbox(
	label="SS8 Sequence",
	placeholder="Enter secondary structure sequence if available",
	lines=3
	)

	with gr.Row():
	preview_single_button = gr.Button("Preview Command")
	predict_button = gr.Button("Predict", variant="primary")
	abort_button = gr.Button("Abort", variant="stop")

	# 添加命令预览区域
	command_preview = gr.Code(
	label="Command Preview",
	language="shell",
	interactive=False,
	visible=False
	)
	predict_output = gr.HTML(label="Prediction Results")




	predict_button.click(
	fn=predict_sequence,
	inputs=[
	plm_model,
	model_path,
	aa_seq,
	eval_method,
	structure_seq,
	pooling_method,
	problem_type,
	num_labels
	],
	outputs=predict_output
	)

	abort_button.click(
	fn=handle_abort_single,
	inputs=[],
	outputs=[predict_output]
	)

	with gr.Tab("Batch Prediction"):
	gr.Markdown("### Batch Prediction")
	# Display CSV format information with improved styling
	gr.HTML("""
	<div class="csv-format-info">
	<h4>CSV File Format Requirements</h4>
	<p class="format-description">Please prepare your input CSV file with the following columns:</p>
	<div class="csv-columns">
	<div class="column-item required">
	<div class="column-name">aa_seq (required)</div>
	<div class="column-desc">Amino acid sequence</div>
	</div>
	<div class="column-item optional">
	<div class="column-name">id (optional)</div>
	<div class="column-desc">Unique identifier for each sequence</div>
	</div>
	<div class="column-item optional">
	<div class="column-name">foldseek_seq (optional)</div>
	<div class="column-desc">Foldseek structure sequence</div>
	</div>
	<div class="column-item optional">
	<div class="column-name">ss8_seq (optional)</div>
	<div class="column-desc">Secondary structure sequence</div>
	</div>
	</div>
	</div>
	<style>
	.csv-format-info {
	background-color: #ffffff;
	border-radius: 8px;
	padding: 15px;
	margin: 0 0 15px 0;
	}
	.csv-format-info h4 {
	margin: 0 0 10px 0;
	color: #2c3e50;
	font-size: 16px;
	}
	.format-description {
	margin-bottom: 12px;
	color: #555;
	font-size: 14px;
	}
	.csv-columns {
	display: flex;
	flex-wrap: wrap;
	gap: 10px;
	margin-bottom: 10px;
	}
	.column-item {
	background-color: white;
	border-radius: 6px;
	padding: 10px;
	flex: 1 1 200px;
	box-shadow: 0 1px 3px rgba(0,0,0,0.1);
	transition: transform 0.2s ease;
	}
	.column-item:hover {
	transform: translateY(-2px);
	}
	.column-item.required {
	border-left: 3px solid #3498db;
	}
	.column-item.optional {
	border-left: 3px solid #27ae60;
	}
	.column-name {
	font-family: monospace;
	font-weight: bold;
	margin-bottom: 5px;
	color: #2c3e50;
	font-size: 14px;
	}
	.column-desc {
	font-size: 13px;
	color: #7f8c8d;
	line-height: 1.3;
	}
	.csv-example {
	background-color: #e9ecef;
	border-radius: 6px;
	padding: 10px;
	margin-top: 8px;
	}
	</style>
	""")

	with gr.Row():
	input_file = gr.UploadButton(
	label="Upload CSV File",
	file_types=[".csv"],
	file_count="single"
	)

	# File preview accordion
	with gr.Accordion("File Preview", open=False) as file_preview_accordion:
	# File info area
	with gr.Row():
	file_info = gr.HTML("", elem_classes=["dataset-stats"])

	# Table area
	with gr.Row():
	file_preview = gr.Dataframe(
	headers=["name", "sequence"],
	value=[["No file uploaded", "-"]],
	wrap=True,
	interactive=False,
	row_count=5,
	elem_classes=["preview-table"]
	)

	# Add file preview function
	def update_file_preview(file):
	if file is None:
	return gr.update(value="<div class='file-info'>No file uploaded</div>"), gr.update(value=[["No file uploaded", "-"]], headers=["name", "sequence"]), gr.update(open=False)
	try:
	df = pd.read_csv(file.name)
	info_html = f"""
	<div style="text-align: center; margin: 20px 0;">
	<table style="width: 100%; border-collapse: collapse; margin: 0 auto;">
	<tr>
	<th style="padding: 8px; font-size: 14px; border: 1px solid #ddd; background-color: #e0e0e0; font-weight: bold; border-bottom: 1px solid #ccc; text-align: center;">File</th>
	<th style="padding: 8px; font-size: 14px; border: 1px solid #ddd; background-color: #e0e0e0; font-weight: bold; border-bottom: 1px solid #ccc; text-align: center;">Total Sequences</th>
	<th style="padding: 8px; font-size: 14px; border: 1px solid #ddd; background-color: #e0e0e0; font-weight: bold; border-bottom: 1px solid #ccc; text-align: center;">Columns</th>
	</tr>
	<tr>
	<td style="padding: 15px; font-size: 14px; border: 1px solid #ddd; text-align: center;">{file.name.split('/')[-1]}</td>
	<td style="padding: 15px; font-size: 14px; border: 1px solid #ddd; text-align: center;">{len(df)}</td>
	<td style="padding: 15px; font-size: 14px; border: 1px solid #ddd; text-align: center;">{', '.join(df.columns.tolist())}</td>
	</tr>
	</table>
	</div>
	"""
	return gr.update(value=info_html), gr.update(value=df.head(5).values.tolist(), headers=df.columns.tolist()), gr.update(open=True)
	except Exception as e:
	error_html = f"""
	<div>
	<h2>Error reading file</h2>
	<p style="color: #c62828;">{str(e)}</p>
	</div>
	"""
	return gr.update(value=error_html), gr.update(value=[["Error", str(e)]], headers=["Error", "Message"]), gr.update(open=True)

	# Use upload event instead of click event
	input_file.upload(
	fn=update_file_preview,
	inputs=[input_file],
	outputs=[file_info, file_preview, file_preview_accordion]
	)
	with gr.Row():
	with gr.Column(scale=1):
	batch_size = gr.Slider(
	minimum=1,
	maximum=32,
	value=8,
	step=1,
	label="Batch Size",
	info="Number of sequences to process at once"
	)

	with gr.Row():
	preview_batch_button = gr.Button("Preview Command")
	batch_predict_button = gr.Button("Start Batch Prediction", variant="primary")
	batch_abort_button = gr.Button("Abort", variant="stop")

	# 添加命令预览区域
	batch_command_preview = gr.Code(
	label="Command Preview",
	language="shell",
	interactive=False,
	visible=False
	)
	batch_predict_output = gr.HTML(label="Prediction Progress")
	result_file = gr.DownloadButton(label="Download Predictions", visible=False)

	# 在UI部分添加命令预览的可见性控制
	def toggle_preview(button_text):
	"""切换命令预览的可见性"""
	if "Preview" in button_text:
	return gr.update(visible=True)
	return gr.update(visible=False)

	# 连接预览按钮
	preview_single_button.click(
	fn=toggle_preview,
	inputs=[preview_single_button],
	outputs=[command_preview]
	).then(
	fn=handle_preview,
	inputs=[
	plm_model,
	model_path,
	eval_method,
	aa_seq,
	foldseek_seq,
	ss8_seq,
	structure_seq,
	pooling_method,
	problem_type,
	num_labels
	],
	outputs=[command_preview]
	)

	# 连接预览按钮
	preview_batch_button.click(
	fn=toggle_preview,
	inputs=[preview_batch_button],
	outputs=[batch_command_preview]
	).then(
	fn=handle_batch_preview,
	inputs=[
	plm_model,
	model_path,
	eval_method,
	input_file,
	structure_seq,
	pooling_method,
	problem_type,
	num_labels,
	batch_size
	],
	outputs=[batch_command_preview]
	)

	batch_predict_button.click(
	fn=predict_batch,
	inputs=[
	plm_model,
	model_path,
	eval_method,
	input_file,
	structure_seq,
	pooling_method,
	problem_type,
	num_labels,
	batch_size
	],
	outputs=[batch_predict_output, result_file]
	)

	batch_abort_button.click(
	fn=handle_abort_batch,
	inputs=[],
	outputs=[batch_predict_output, result_file]
	)

	# Add this code after all UI components are defined
	def update_eval_method(method):
	return {
	structure_seq_row: gr.update(visible=method == "ses-adapter"),
	structure_input_row: gr.update(visible=method == "ses-adapter")
	}

	eval_method.change(
	fn=update_eval_method,
	inputs=[eval_method],
	outputs=[structure_seq_row, structure_input_row]
	)

	# Add a new function to control the visibility of the structure sequence input boxes
	def update_structure_inputs(structure_seq_choices):
	return {
	foldseek_seq: gr.update(visible="foldseek_seq" in structure_seq_choices),
	ss8_seq: gr.update(visible="ss8_seq" in structure_seq_choices)
	}

	# Add event handling to the UI definition section
	structure_seq.change(
	fn=update_structure_inputs,
	inputs=[structure_seq],
	outputs=[foldseek_seq, ss8_seq]
	)



	return {
	"predict_sequence": predict_sequence,
	"predict_batch": predict_batch,
	"handle_abort": handle_abort
	}