Spaces:

2dogey
/

VenusFactory

Runtime error

App Files Files Community

VenusFactory / src /web /train_tab.py

2dogey

Upload folder using huggingface_hub

8918ac7 verified about 1 month ago

raw

history blame contribute delete

80.7 kB

	import os
	import json
	import gradio as gr
	import time
	from datasets import load_dataset
	import pandas as pd
	from typing import Any, Dict, Union, Optional, Generator, List
	from dataclasses import dataclass
	from .utils.command import preview_command, save_arguments, build_command_list
	from .utils.monitor import TrainingMonitor
	import traceback
	import base64
	import tempfile
	import numpy as np
	import queue
	import subprocess
	import sys
	import threading

	@dataclass
	class TrainingArgs:
	    """Training configuration parsed from the positional values of the training form.

	    ``args`` is indexed positionally:

	    ====== =============================================================
	    index  meaning
	    ====== =============================================================
	    0      key into ``plm_models``
	    1      dataset selection ("Use Custom Dataset" / "Use Pre-defined Dataset")
	    2      key into ``dataset_configs`` (pre-defined dataset only)
	    3-6    custom dataset path, problem type, number of labels, metrics
	    7-8    training method, pooling method
	    9-11   batch mode, batch size, batch token budget
	    12-17  learning rate, epochs, max sequence length,
	           gradient accumulation steps, warmup steps, scheduler
	    18-19  output model name, output directory
	    20-22  wandb enabled flag, wandb project, wandb entity
	    23-26  patience, number of workers, max gradient norm, structure sequences
	    27-30  LoRA rank, alpha, dropout, comma-separated target modules
	    ====== =============================================================

	    NOTE: the class is decorated with ``@dataclass`` but declares no fields and
	    supplies its own ``__init__``; the decorator therefore only contributes the
	    generated ``__repr__``/``__eq__`` and is kept for backward compatibility.
	    """

	    # Training methods for which the LoRA hyper-parameters are exported by to_dict().
	    _LORA_METHODS = ("plm-lora", "plm-qlora", "plm_adalora", "plm_dora", "plm_ia3")

	    def __init__(self, args: list, plm_models: dict, dataset_configs: dict):
	        """Populate the configuration from ``args``.

	        Args:
	            args: positional form values, laid out as described on the class.
	            plm_models: maps the model name in ``args[0]`` to the stored model value.
	            dataset_configs: maps the name in ``args[2]`` to a JSON config file path.

	        Raises:
	            KeyError: if ``args[0]`` (or ``args[2]`` for a pre-defined dataset)
	                is not a key of the corresponding mapping.
	            OSError / json.JSONDecodeError: if the dataset config file cannot be
	                read or parsed.
	        """
	        # Basic parameters
	        self.plm_model = plm_models[args[0]]

	        # Custom dataset vs. pre-defined dataset
	        self.dataset_selection = args[1]  # "Use Custom Dataset" or "Use Pre-defined Dataset"
	        if self.dataset_selection == "Use Pre-defined Dataset":
	            self.dataset_config = dataset_configs[args[2]]
	            self.dataset_custom = None
	            # Problem type, label count and metrics come from the config file.
	            with open(self.dataset_config, "r", encoding="utf-8") as f:
	                config = json.load(f)
	            self.problem_type = config.get("problem_type", "single_label_classification")
	            self.num_labels = config.get("num_labels", 2)
	            self.metrics = config.get("metrics", "accuracy,mcc,f1,precision,recall,auroc")
	        else:
	            self.dataset_config = None
	            self.dataset_custom = args[3]  # Custom dataset path
	            self.problem_type = args[4]
	            self.num_labels = args[5]
	            self.metrics = args[6]

	        # Metrics are exported as one comma-separated string regardless of
	        # whether they arrived as a list (form multiselect or JSON array).
	        if isinstance(self.metrics, (list, tuple)):
	            self.metrics = ",".join(str(metric) for metric in self.metrics)

	        # Training method parameters
	        self.training_method = args[7]
	        self.pooling_method = args[8]

	        # Batch processing parameters: both attributes always exist; the one
	        # that does not belong to the active mode is None.
	        self.batch_mode = args[9]
	        if self.batch_mode == "Batch Size Mode":
	            self.batch_size = args[10]
	            self.batch_token = None
	        else:
	            self.batch_size = None
	            self.batch_token = args[11]

	        # Training parameters
	        self.learning_rate = args[12]
	        self.num_epochs = args[13]
	        self.max_seq_len = args[14]
	        self.gradient_accumulation_steps = args[15]
	        self.warmup_steps = args[16]
	        self.scheduler = args[17]

	        # Output parameters
	        self.output_model_name = args[18]
	        self.output_dir = args[19]

	        # Wandb parameters: always defined so attribute access never fails.
	        self.wandb_enabled = args[20]
	        self.wandb_project = args[21] if self.wandb_enabled else None
	        self.wandb_entity = args[22] if self.wandb_enabled else None

	        # Other parameters
	        self.patience = args[23]
	        self.num_workers = args[24]
	        self.max_grad_norm = args[25]
	        self.structure_seq = args[26]

	        # LoRA parameters
	        self.lora_r = args[27]
	        self.lora_alpha = args[28]
	        self.lora_dropout = args[29]
	        # Drop blank entries so "a,,b," does not yield empty module names.
	        raw_modules = args[30] or ""
	        self.lora_target_modules = [
	            name.strip() for name in raw_modules.split(",") if name.strip()
	        ]

	    def to_dict(self) -> Dict[str, Any]:
	        """Return the settings as a flat dict, including only the options that apply.

	        Dataset, LoRA, batch and wandb keys are added conditionally, mirroring
	        the selections stored by ``__init__``.
	        """
	        args_dict = {
	            "plm_model": self.plm_model,
	            "training_method": self.training_method,
	            "pooling_method": self.pooling_method,
	            "learning_rate": self.learning_rate,
	            "num_epochs": self.num_epochs,
	            "max_seq_len": self.max_seq_len,
	            "gradient_accumulation_steps": self.gradient_accumulation_steps,
	            "warmup_steps": self.warmup_steps,
	            "scheduler": self.scheduler,
	            "output_model_name": self.output_model_name,
	            "output_dir": self.output_dir,
	            "patience": self.patience,
	            "num_workers": self.num_workers,
	            "max_grad_norm": self.max_grad_norm,
	        }

	        if self.training_method == "ses-adapter" and self.structure_seq:
	            if isinstance(self.structure_seq, str):
	                # A bare string must not be joined character by character.
	                args_dict["structure_seq"] = self.structure_seq
	            else:
	                args_dict["structure_seq"] = ",".join(self.structure_seq)

	        # Dataset-related parameters
	        if self.dataset_selection == "Use Pre-defined Dataset":
	            args_dict["dataset_config"] = self.dataset_config
	        else:
	            args_dict["dataset"] = self.dataset_custom
	            args_dict["problem_type"] = self.problem_type
	            args_dict["num_labels"] = self.num_labels
	            args_dict["metrics"] = self.metrics

	        # LoRA parameters
	        if self.training_method in self._LORA_METHODS:
	            args_dict.update({
	                "lora_r": self.lora_r,
	                "lora_alpha": self.lora_alpha,
	                "lora_dropout": self.lora_dropout,
	                "lora_target_modules": self.lora_target_modules,
	            })

	        # Batch processing parameters
	        if self.batch_mode == "Batch Size Mode":
	            args_dict["batch_size"] = self.batch_size
	        else:
	            args_dict["batch_token"] = self.batch_token

	        # Wandb parameters
	        if self.wandb_enabled:
	            args_dict["wandb"] = True
	            if self.wandb_project:
	                args_dict["wandb_project"] = self.wandb_project
	            if self.wandb_entity:
	                args_dict["wandb_entity"] = self.wandb_entity

	        return args_dict

	def create_train_tab(constant: Dict[str, Any]) -> Dict[str, Any]:
	# Create training monitor
	monitor = TrainingMonitor()

	# Add missing variable declarations
	is_training = False
	current_process = None
	stop_thread = False
	process_aborted = False

	plm_models = constant["plm_models"]
	dataset_configs = constant["dataset_configs"]

	with gr.Tab("Training"):
	# Model and Dataset Selection
	gr.Markdown("### Model and Dataset Configuration")

	# Original training interface components
	with gr.Group():
	with gr.Row():
	with gr.Column(scale=4):
	with gr.Row():
	plm_model = gr.Dropdown(
	choices=list(plm_models.keys()),
	label="Protein Language Model",
	value=list(plm_models.keys())[0],
	scale=2
	)

	# Dataset selection mode: custom dataset vs. pre-defined dataset
	is_custom_dataset = gr.Radio(
	choices=["Use Custom Dataset", "Use Pre-defined Dataset"],
	label="Dataset Selection",
	value="Use Pre-defined Dataset",
	scale=3
	)

	dataset_config = gr.Dropdown(
	choices=list(dataset_configs.keys()),
	label="Dataset Configuration",
	value=list(dataset_configs.keys())[0],
	visible=True,
	scale=2
	)

	dataset_custom = gr.Textbox(
	label="Custom Dataset Path",
	placeholder="Huggingface Dataset eg: user/dataset",
	visible=False,
	scale=2
	)

	# Put the preview button in its own column and give it dedicated styling
	with gr.Column(scale=1, min_width=120, elem_classes="preview-button-container"):
	dataset_preview_button = gr.Button(
	"Preview Dataset",
	variant="primary",
	size="lg",
	elem_classes="preview-button"
	)

	# Extra configuration options for custom datasets (on their own row)
	with gr.Row(visible=True) as custom_dataset_settings:
	problem_type = gr.Dropdown(
	choices=["single_label_classification", "multi_label_classification", "regression"],
	label="Problem Type",
	value="single_label_classification",
	scale=23,
	interactive=False
	)
	num_labels = gr.Number(
	value=2,
	label="Number of Labels",
	scale=11,
	interactive=False
	)
	metrics = gr.Dropdown(
	choices=["accuracy", "recall", "precision", "f1", "mcc", "auroc", "f1max", "spearman_corr", "mse"],
	label="Metrics",
	value=["accuracy", "mcc", "f1", "precision", "recall", "auroc"],
	scale=101,
	multiselect=True,
	interactive=False
	)

	with gr.Row():
	structure_seq = gr.Dropdown(
	label="Structure Sequence",
	choices=["foldseek_seq", "ss8_seq"],
	value=["foldseek_seq", "ss8_seq"],
	multiselect=True,
	visible=False
	)

	# ! add for plm-lora, plm-qlora, plm_adalora, plm_dora, plm_ia3
	with gr.Row(visible=False) as lora_params_row:
	# gr.Markdown("#### LoRA Parameters")
	with gr.Column():
	lora_r = gr.Number(
	value=8,
	label="LoRA Rank",
	precision=0,
	minimum=1,
	maximum=128,
	)
	with gr.Column():
	lora_alpha = gr.Number(
	value=32,
	label="LoRA Alpha",
	precision=0,
	minimum=1,
	maximum=128
	)
	with gr.Column():
	lora_dropout = gr.Number(
	value=0.1,
	label="LoRA Dropout",
	minimum=0.0,
	maximum=1.0
	)
	with gr.Column():
	lora_target_modules = gr.Textbox(
	value="query,key,value",
	label="LoRA Target Modules",
	placeholder="Comma-separated list of target modules",
	# info="LoRA will be applied to these modules"
	)

	# Put both the dataset statistics and the preview table inside a collapsible panel
	with gr.Row():
	with gr.Accordion("Dataset Preview", open=False) as preview_accordion:
	# Dataset statistics area
	with gr.Row():
	dataset_stats_md = gr.HTML("", elem_classes=["dataset-stats"])

	# Preview table area
	with gr.Row():
	preview_table = gr.Dataframe(
	headers=["Name", "Sequence", "Label"],
	value=[["No dataset selected", "-", "-"]],
	wrap=True,
	interactive=False,
	row_count=3,
	elem_classes=["preview-table"]
	)

	# Add CSS styles
	gr.HTML("""
	<style>
	/* 数据统计样式 */
	.dataset-stats {
	margin: 0 0 15px 0;
	padding: 0;
	}

	.dataset-stats table {
	width: 100%;
	border-collapse: collapse;
	font-size: 0.9em;
	box-shadow: 0 2px 4px rgba(0,0,0,0.05);
	border-radius: 8px;
	overflow: hidden;
	table-layout: fixed;
	}

	.dataset-stats th {
	background-color: #e0e0e0;
	font-weight: bold;
	padding: 6px 10px;
	text-align: center;
	border: 1px solid #ddd;
	font-size: 0.95em;
	white-space: nowrap;
	overflow: hidden;
	min-width: 120px;
	}

	.dataset-stats td {
	padding: 6px 10px;
	text-align: center;
	border: 1px solid #ddd;
	}

	.dataset-stats h2 {
	font-size: 1.1em;
	margin: 0 0 10px 0;
	text-align: center;
	}

	/* 表格样式 */
	.preview-table table {
	background-color: white !important;
	font-size: 0.9em !important;
	width: 100%;
	table-layout: fixed !important;
	}

	.preview-table .gr-block.gr-box {
	background-color: transparent !important;
	}

	.preview-table .gr-input-label {
	background-color: transparent !important;
	}

	/* 表格外观增强 */
	.preview-table table {
	margin-top: 0;
	border-radius: 8px;
	overflow: hidden;
	box-shadow: 0 2px 4px rgba(0,0,0,0.05);
	}

	/* 表头样式 */
	.preview-table th {
	background-color: #e0e0e0 !important;
	font-weight: bold !important;
	padding: 6px !important;
	border-bottom: 1px solid #ccc !important;
	font-size: 0.95em !important;
	text-align: center !important;
	white-space: nowrap !important;
	min-width: 120px !important;
	}

	/* 单元格样式 */
	.preview-table td {
	padding: 4px 6px !important;
	max-width: 300px !important;
	overflow: hidden;
	text-overflow: ellipsis;
	white-space: nowrap;
	text-align: left !important;
	}

	/* 悬停效果 */
	.preview-table tr:hover {
	background-color: #f0f0f0 !important;
	}

	/* 折叠面板样式 */
	.gr-accordion {
	border: 1px solid #e0e0e0;
	border-radius: 8px;
	overflow: hidden;
	margin-bottom: 15px;
	}

	/* 折叠面板标题样式 */
	.gr-accordion .label-wrap {
	background-color: #f5f5f5;
	padding: 8px 15px;
	font-weight: bold;
	}

	.preview-button {
	height: 86px !important;
	}

	/* Center Model Statistics Table */
	.center-table-content td, .center-table-content th {
	text-align: center !important;
	font-family: 'Segoe UI', Tahoma, Geneva, Verdana, sans-serif !important;
	padding: 10px !important;
	}

	.center-table-content table {
	width: 100% !important;
	border-collapse: collapse !important;
	margin-bottom: 20px !important;
	box-shadow: 0 2px 8px rgba(0,0,0,0.1) !important;
	border-radius: 8px !important;
	overflow: hidden !important;
	}

	.center-table-content th {
	background-color: #f0f4f8 !important;
	color: #2c3e50 !important;
	font-weight: 600 !important;
	border-bottom: 2px solid #ddd !important;
	}

	.center-table-content tr:nth-child(even) {
	background-color: #f9f9f9 !important;
	}

	.center-table-content tr:hover {
	background-color: #f0f7ff !important;
	}

	/* Improve readability of progress bars */
	.progress-container {
	margin-bottom: 20px !important;
	}

	.progress-bar {
	transition: width 0.5s ease-in-out !important;
	}

	.status-message {
	margin-bottom: 8px !important;
	font-weight: 500 !important;
	}
	</style>
	""", visible=True)

	# Batch Processing Configuration
	gr.Markdown("### Batch Processing Configuration")
	with gr.Group():
	with gr.Row(equal_height=True):
	with gr.Column(scale=1):
	batch_mode = gr.Radio(
	choices=["Batch Size Mode", "Batch Token Mode"],
	label="Batch Processing Mode",
	value="Batch Size Mode"
	)

	with gr.Column(scale=2):
	batch_size = gr.Slider(
	minimum=1,
	maximum=128,
	value=16,
	step=1,
	label="Batch Size",
	visible=True
	)

	batch_token = gr.Slider(
	minimum=1000,
	maximum=50000,
	value=10000,
	step=1000,
	label="Tokens per Batch",
	visible=False
	)

	def update_batch_inputs(mode):
	    """Show only the batch control that matches the selected batch mode.

	    Returns a dict keyed by the ``batch_size`` and ``batch_token`` components,
	    each mapped to a visibility update.
	    """
	    size_mode_selected = mode == "Batch Size Mode"
	    token_mode_selected = mode == "Batch Token Mode"

	    visibility_updates = {}
	    visibility_updates[batch_size] = gr.update(visible=size_mode_selected)
	    visibility_updates[batch_token] = gr.update(visible=token_mode_selected)
	    return visibility_updates

	# Update visibility when mode changes
	batch_mode.change(
	fn=update_batch_inputs,
	inputs=[batch_mode],
	outputs=[batch_size, batch_token]
	)

	# Training Parameters
	gr.Markdown("### Training Parameters")
	with gr.Group():
	# First row: Basic training parameters
	with gr.Row(equal_height=True):
	with gr.Column(scale=1, min_width=150):
	training_method = gr.Dropdown(
	choices=["full", "freeze", "ses-adapter", "plm-lora", "plm-qlora", "plm_adalora", "plm_dora", "plm_ia3"],
	label="Training Method",
	value="freeze"
	)
	with gr.Column(scale=1, min_width=150):
	learning_rate = gr.Slider(
	minimum=1e-8, maximum=1e-2, value=5e-4, step=1e-6,
	label="Learning Rate"
	)
	with gr.Column(scale=1, min_width=150):
	num_epochs = gr.Slider(
	minimum=1, maximum=200, value=20, step=1,
	label="Number of Epochs"
	)
	with gr.Column(scale=1, min_width=150):
	patience = gr.Slider(
	minimum=1, maximum=50, value=10, step=1,
	label="Early Stopping Patience"
	)
	with gr.Column(scale=1, min_width=150):
	max_seq_len = gr.Slider(
	minimum=-1, maximum=2048, value=None, step=32,
	label="Max Sequence Length (-1 for unlimited)"
	)

	def update_training_method(method):
	    """Toggle the method-specific inputs for the chosen training method.

	    The structure-sequence selector is shown only for "ses-adapter"; the LoRA
	    parameter row is shown only for the LoRA-family methods listed below.
	    """
	    lora_family = ["plm-lora", "plm-qlora", "plm_adalora", "plm_dora", "plm_ia3"]
	    show_structure_seq = method == "ses-adapter"
	    show_lora_params = method in lora_family

	    return {
	        structure_seq: gr.update(visible=show_structure_seq),
	        lora_params_row: gr.update(visible=show_lora_params),
	    }

	# Add training_method change event
	training_method.change(
	fn=update_training_method,
	inputs=[training_method],
	outputs=[structure_seq, lora_params_row]
	)

	# Second row: Advanced training parameters
	with gr.Row(equal_height=True):
	with gr.Column(scale=1, min_width=150):
	pooling_method = gr.Dropdown(
	choices=["mean", "attention1d", "light_attention"],
	label="Pooling Method",
	value="mean"
	)

	with gr.Column(scale=1, min_width=150):
	scheduler_type = gr.Dropdown(
	choices=["linear", "cosine", "step", None],
	label="Scheduler Type",
	value=None
	)
	with gr.Column(scale=1, min_width=150):
	warmup_steps = gr.Slider(
	minimum=0, maximum=1000, value=0, step=10,
	label="Warmup Steps"
	)
	with gr.Column(scale=1, min_width=150):
	gradient_accumulation_steps = gr.Slider(
	minimum=1, maximum=32, value=1, step=1,
	label="Gradient Accumulation Steps"
	)
	with gr.Column(scale=1, min_width=150):
	max_grad_norm = gr.Slider(
	minimum=0.1, maximum=10.0, value=-1, step=0.1,
	label="Max Gradient Norm (-1 for no clipping)"
	)
	with gr.Column(scale=1, min_width=150):
	num_workers = gr.Slider(
	minimum=0, maximum=16, value=4, step=1,
	label="Number of Workers"
	)

	# Output and Logging Settings
	gr.Markdown("### Output and Logging Settings")
	with gr.Row():
	with gr.Column():
	output_dir = gr.Textbox(
	label="Save Directory",
	value="demo",
	placeholder="Path to save training results"
	)

	output_model_name = gr.Textbox(
	label="Output Model Name",
	value="demo.pt",
	placeholder="Name of the output model file"
	)

	with gr.Column():
	wandb_logging = gr.Checkbox(
	label="Enable W&B Logging",
	value=False
	)

	wandb_project = gr.Textbox(
	label="W&B Project Name",
	value=None,
	visible=False
	)

	wandb_entity = gr.Textbox(
	label="W&B Entity",
	value=None,
	visible=False
	)

	# Training Control and Output
	gr.Markdown("### Training Control")
	with gr.Row():
	preview_button = gr.Button("Preview Command")
	abort_button = gr.Button("Abort", variant="stop")
	train_button = gr.Button("Start", variant="primary")

	with gr.Row():
	command_preview = gr.Code(
	label="Command Preview",
	language="shell",
	interactive=False,
	visible=False
	)

	# Model Statistics Section
	gr.Markdown("### Model Statistics")
	with gr.Row():
	model_stats = gr.Dataframe(
	headers=["Model Type", "Total Parameters", "Trainable Parameters", "Percentage"],
	value=[
	["Training Model", "-", "-", "-"],
	["Pre-trained Model", "-", "-", "-"],
	["Combined Model", "-", "-", "-"]
	],
	interactive=False,
	elem_classes=["center-table-content"]
	)

	def update_model_stats(stats: Dict[str, str]) -> List[List[str]]:
	    """Build the three-row model statistics table from a stats mapping.

	    Missing keys are rendered as "-"; an empty or missing ``stats`` yields the
	    all-placeholder table. Only the combined row carries the percentage.
	    """
	    if not stats:
	        row_labels = ("Training Model", "Pre-trained Model", "Combined Model")
	        return [[label, "-", "-", "-"] for label in row_labels]

	    def cell(key):
	        # Stringify the value, falling back to the placeholder when absent.
	        return str(stats.get(key, '-'))

	    training_row = ["Training Model", cell('adapter_total'), cell('adapter_trainable'), "-"]
	    pretrained_row = ["Pre-trained Model", cell('pretrain_total'), cell('pretrain_trainable'), "-"]
	    combined_row = [
	        "Combined Model",
	        cell('combined_total'),
	        cell('combined_trainable'),
	        cell('trainable_percentage'),
	    ]
	    return [training_row, pretrained_row, combined_row]

	# Training Progress
	gr.Markdown("### Training Progress")
	with gr.Row():
	progress_status = gr.HTML(
	value="""
	<div style="background-color: #f8f9fa; border-radius: 10px; padding: 20px; margin-bottom: 15px; box-shadow: 0 2px 5px rgba(0,0,0,0.05);">
	<div style="display: flex; justify-content: space-between; margin-bottom: 12px;">
	<div>
	<span style="font-weight: 600; font-size: 16px;">Training Status: </span>
	<span style="color: #1976d2; font-weight: 500; font-size: 16px;">Click Start to train your model</span>
	</div>
	</div>
	</div>
	""",
	label="Status"
	)

	with gr.Row():
	best_model_info = gr.Textbox(
	value="Best Model: None",
	label="Best Performance",
	interactive=False
	)

	# Add test results HTML display
	with gr.Row():
	test_results_html = gr.HTML(
	value="",
	label="Test Results",
	visible=True
	)

	with gr.Row():
	with gr.Column(scale=4):
	pass
	with gr.Column(scale=1): # 限制列的最大宽度
	download_csv_btn = gr.DownloadButton(
	"Download CSV",
	visible=False,
	size="lg"
	)
	# Add an empty column to take up the remaining space
	with gr.Column(scale=4):
	pass

	# Training plot in a separate row for full width
	with gr.Row():
	with gr.Column():
	loss_plot = gr.Plot(
	label="Training and Validation Loss",
	elem_id="loss_plot"
	)
	with gr.Column():
	metrics_plot = gr.Plot(
	label="Validation Metrics",
	elem_id="metrics_plot"
	)

	def update_progress(progress_info):
	    """Turn a progress snapshot into updates for the training-progress widgets.

	    Args:
	        progress_info: mapping of progress fields (read with ``.get`` below:
	            stage, current, total, epoch, loss, test_metrics, ...). May be
	            empty or None, in which case the idle state is returned.

	    Returns:
	        A 6-tuple ``(status_html, best_model_text, test_results_update,
	        loss_figure, metrics_figure, download_button_update)``.

	    Side effects:
	        When test metrics are present, writes them to a temporary CSV file for
	        the download button. The file is reused across calls as long as the
	        metrics are unchanged, so repeated polling does not pile up temp files.
	    """
	    import html  # local import: used to escape text interpolated into HTML

	    # Empty snapshot (or all values falsy): show the fresh idle card.
	    if not progress_info or not any(progress_info.values()):
	        fresh_status_html = """
	<div style="background-color: #f8f9fa; border-radius: 10px; padding: 20px; margin-bottom: 15px; box-shadow: 0 2px 5px rgba(0,0,0,0.05);">
	<div style="display: flex; justify-content: space-between; margin-bottom: 12px;">
	<div>
	<span style="font-weight: 600; font-size: 16px;">Training Status: </span>
	<span style="color: #1976d2; font-weight: 500; font-size: 16px;">Click Start to train your model</span>
	</div>
	</div>
	</div>
	"""
	        return (
	            fresh_status_html,
	            "Best Model: None",
	            gr.update(value="", visible=False),
	            None,
	            None,
	            gr.update(visible=False)
	        )

	    # "Error" and "Waiting" stages reset every widget and show a plain card.
	    reported_stage = progress_info.get('stage', '')
	    if reported_stage == 'Error':
	        error_status_html = """
	<div style="background-color: #ffebee; border-radius: 10px; padding: 20px; margin-bottom: 15px; box-shadow: 0 2px 5px rgba(0,0,0,0.05);">
	<div style="display: flex; justify-content: space-between; margin-bottom: 12px;">
	<div>
	<span style="font-weight: 600; font-size: 16px;">Training Status: </span>
	<span style="color: #c62828; font-weight: 500; font-size: 16px;">Failed</span>
	</div>
	</div>
	</div>
	"""
	        return (
	            error_status_html,
	            "Training failed",
	            gr.update(value="", visible=False),
	            None,
	            None,
	            gr.update(visible=False)
	        )
	    if reported_stage == 'Waiting':
	        waiting_status_html = """
	<div style="background-color: #f8f9fa; border-radius: 10px; padding: 20px; margin-bottom: 15px; box-shadow: 0 2px 5px rgba(0,0,0,0.05);">
	<div style="display: flex; justify-content: space-between; margin-bottom: 12px;">
	<div>
	<span style="font-weight: 600; font-size: 16px;">Training Status: </span>
	<span style="color: #1976d2; font-weight: 500; font-size: 16px;">Waiting to start...</span>
	</div>
	</div>
	</div>
	"""
	        return (
	            waiting_status_html,
	            "Best Model: None",
	            gr.update(value="", visible=False),
	            None,
	            None,
	            gr.update(visible=False)
	        )

	    current = progress_info.get('current', 0)
	    total = progress_info.get('total', 100)
	    epoch = progress_info.get('epoch', 0)
	    stage = progress_info.get('stage', 'Waiting')
	    best_epoch = progress_info.get('best_epoch', 0)
	    best_metric_name = progress_info.get('best_metric_name', 'accuracy')
	    best_metric_value = progress_info.get('best_metric_value', 0.0)
	    elapsed_time = progress_info.get('elapsed_time', '')
	    remaining_time = progress_info.get('remaining_time', '')
	    it_per_sec = progress_info.get('it_per_sec', 0.0)
	    grad_step = progress_info.get('grad_step', 0)
	    loss = progress_info.get('loss', 0.0)
	    total_epochs = progress_info.get('total_epochs', 0)  # total number of epochs
	    # Named test_html to avoid shadowing the enclosing test_results_html component.
	    test_html = progress_info.get('test_results_html', '')  # rendered test results
	    test_metrics = progress_info.get('test_metrics', {})  # test metric values
	    is_completed = progress_info.get('is_completed', False)  # training finished?

	    # The test-results panel is always visible; show a placeholder while empty.
	    if not test_html and stage == 'Testing':
	        test_html = """
	<div style="text-align: center; padding: 20px; color: #666;">
	<p>Testing in progress, please wait for results...</p>
	</div>
	"""
	    elif not test_html:
	        test_html = """
	<div style="text-align: center; padding: 20px; color: #666;">
	<p>Test results will be displayed after testing phase completes</p>
	</div>
	"""

	    test_html_update = gr.update(value=test_html, visible=True)

	    # CSV download button
	    if test_metrics:
	        # Well-known metrics come first, in this order; the rest keep dict order.
	        priority_metrics = ['loss', 'accuracy', 'f1', 'precision', 'recall', 'auroc', 'mcc']

	        def get_priority(item):
	            name = item[0]
	            if name in priority_metrics:
	                return priority_metrics.index(name)
	            return len(priority_metrics)

	        csv_rows = ["Metric,Value\n"]
	        for metric_name, metric_value in sorted(test_metrics.items(), key=get_priority):
	            # Upper-case the abbreviations, capitalize every other name.
	            if metric_name.lower() in ['f1', 'mcc', 'auroc']:
	                display_name = metric_name.upper()
	            else:
	                display_name = metric_name.capitalize()
	            # A non-numeric value must not abort the whole UI update.
	            try:
	                value_text = f"{float(metric_value):.6f}"
	            except (TypeError, ValueError):
	                value_text = str(metric_value)
	            csv_rows.append(f"{display_name},{value_text}\n")
	        csv_text = "".join(csv_rows)

	        # This function is polled repeatedly; reuse the previously written
	        # file when the content is unchanged instead of leaking a new
	        # delete=False temp file on every call.
	        cached = getattr(update_progress, "_csv_cache", None)
	        if cached is not None and cached[0] == csv_text and os.path.exists(cached[1]):
	            file_path = cached[1]
	        else:
	            with tempfile.NamedTemporaryFile(mode='w', delete=False, suffix='.csv', prefix='metrics_results_', encoding='utf-8') as temp_file:
	                temp_file.write(csv_text)
	                file_path = temp_file.name
	            update_progress._csv_cache = (csv_text, file_path)

	        download_btn_update = gr.update(value=file_path, visible=True)
	    else:
	        download_btn_update = gr.update(visible=False)

	    # Progress percentage, clamped so a stale total cannot show more than 100%.
	    progress_percentage = max(0.0, min(100.0, (current / total) * 100)) if total > 0 else 0

	    # Status card with progress bar
	    if is_completed:
	        # Training finished
	        status_html = """
	<div style="background-color: #f8f9fa; border-radius: 10px; padding: 20px; margin-bottom: 15px; box-shadow: 0 2px 5px rgba(0,0,0,0.05);">
	<div style="display: flex; justify-content: space-between; margin-bottom: 12px;">
	<div>
	<span style="font-weight: 600; font-size: 16px;">Training Status: </span>
	<span style="color: #4caf50; font-weight: 500; font-size: 16px;">Training complete!</span>
	</div>
	<div>
	<span style="font-weight: 600; color: #333;">100%</span>
	</div>
	</div>

	<div style="margin-bottom: 15px; background-color: #e9ecef; height: 10px; border-radius: 5px; overflow: hidden;">
	<div style="background-color: #4caf50; width: 100%; height: 100%; border-radius: 5px;"></div>
	</div>
	</div>
	"""
	    else:
	        # Training or validation stage
	        epoch_total = total_epochs if total_epochs > 0 else 100

	        # Optional info chips. The timing text contains literal '<' and '>'
	        # characters, which must be escaped before being embedded in HTML.
	        time_chip = ''
	        if elapsed_time and remaining_time:
	            timing_text = html.escape(f"{elapsed_time}<{remaining_time}, {it_per_sec:.2f}it/s>")
	            time_chip = f'<div style="background-color: #fff8e1; padding: 5px 10px; border-radius: 4px;"><span style="font-weight: 500;">Time:</span> {timing_text}</div>'
	        loss_chip = ''
	        if stage == 'Training' and loss > 0:
	            loss_chip = f'<div style="background-color: #e3f2fd; padding: 5px 10px; border-radius: 4px;"><span style="font-weight: 500;">Loss:</span> {loss:.4f}</div>'
	        grad_chip = ''
	        if stage == 'Training' and grad_step > 0:
	            grad_chip = f'<div style="background-color: #f3e5f5; padding: 5px 10px; border-radius: 4px;"><span style="font-weight: 500;">Grad steps:</span> {grad_step}</div>'

	        status_html = f"""
	<div style="background-color: #f8f9fa; border-radius: 10px; padding: 20px; margin-bottom: 15px; box-shadow: 0 2px 5px rgba(0,0,0,0.05);">
	<div style="display: flex; justify-content: space-between; margin-bottom: 12px;">
	<div>
	<span style="font-weight: 600; font-size: 16px;">Training Status: </span>
	<span style="color: #1976d2; font-weight: 500; font-size: 16px;">{stage} (Epoch {epoch}/{epoch_total})</span>
	</div>
	<div>
	<span style="font-weight: 600; color: #333;">{progress_percentage:.1f}%</span>
	</div>
	</div>

	<div style="margin-bottom: 15px; background-color: #e9ecef; height: 10px; border-radius: 5px; overflow: hidden;">
	<div style="background-color: #4285f4; width: {progress_percentage}%; height: 100%; border-radius: 5px; transition: width 0.3s ease;"></div>
	</div>

	<div style="display: flex; flex-wrap: wrap; gap: 10px; font-size: 14px; color: #555;">
	<div style="background-color: #e8f5e9; padding: 5px 10px; border-radius: 4px;"><span style="font-weight: 500;">Progress:</span> {current}/{total}</div>
	{time_chip}
	{loss_chip}
	{grad_chip}
	</div>
	</div>
	"""

	    # Best-model summary
	    if best_epoch >= 0 and best_metric_value > 0:
	        best_info = f"Best model: Epoch {best_epoch} ({best_metric_name}: {best_metric_value:.4f})"
	    else:
	        best_info = "No best model found yet"

	    # Fetch the current figures from the monitor
	    loss_fig = monitor.get_loss_plot()
	    metrics_fig = monitor.get_metrics_plot()

	    return status_html, best_info, test_html_update, loss_fig, metrics_fig, download_btn_update

	def handle_train(*args) -> Generator:
	nonlocal is_training, current_process, stop_thread, process_aborted, monitor

	# If already training, return
	if is_training:
	yield None, None, None, None, None, None, None
	return

	# Force explicit state reset first thing
	monitor._reset_tracking()
	monitor._reset_stats()

	# Explicitly ensure stats are reset
	if hasattr(monitor, "stats"):
	monitor.stats = {}

	# Force override any cached state in monitor
	monitor.current_progress = {
	"current": 0,
	"total": 0,
	"epoch": 0,
	"stage": "Waiting",
	"progress_detail": "",
	"best_epoch": -1,
	"best_metric_name": "",
	"best_metric_value": 0.0,
	"elapsed_time": "",
	"remaining_time": "",
	"it_per_sec": 0.0,
	"grad_step": 0,
	"loss": 0.0,
	"test_results_html": "",
	"test_metrics": {},
	"is_completed": False,
	"lines": []
	}

	# Reset all monitoring data structures
	monitor.train_losses = []
	monitor.val_losses = []
	monitor.metrics = {}
	monitor.epochs = []
	if hasattr(monitor, "stats"):
	monitor.stats = {}

	# Reset flags for new training session
	process_aborted = False
	stop_thread = False

	# Initialize table state
	initial_stats = [
	["Training Model", "-", "-", "-"],
	["Pre-trained Model", "-", "-", "-"],
	["Combined Model", "-", "-", "-"]
	]

	# Initial UI state with "Initializing" message
	initial_status_html = """
	<div style="background-color: #f8f9fa; border-radius: 10px; padding: 20px; margin-bottom: 15px; box-shadow: 0 2px 5px rgba(0,0,0,0.05);">
	<div style="display: flex; justify-content: space-between; margin-bottom: 12px;">
	<div>
	<span style="font-weight: 600; font-size: 16px;">Training Status: </span>
	<span style="color: #1976d2; font-weight: 500; font-size: 16px;">Initializing training environment...</span>
	</div>
	</div>
	<div style="font-size: 14px; color: #555; margin-top: 10px;">
	<p>• Parsing configuration parameters</p>
	<p>• Preparing training environment</p>
	<p>• This may take a few moments...</p>
	</div>
	</div>
	"""

	# First yield to update UI with "initializing" state
	yield initial_stats, initial_status_html, "Best Model: None", gr.update(value="", visible=False), None, None, gr.update(visible=False)

	try:
	# Parse training arguments
	training_args = TrainingArgs(args, plm_models, dataset_configs)

	if training_args.training_method != "ses-adapter":
	training_args.structure_seq = None

	args_dict = training_args.to_dict()

	# Save total epochs to monitor for use in progress_info
	total_epochs = args_dict.get('num_epochs', 100)
	monitor.current_progress['total_epochs'] = total_epochs

	# Update status to "Preparing dataset"
	preparing_status_html = """
	<div style="background-color: #f8f9fa; border-radius: 10px; padding: 20px; margin-bottom: 15px; box-shadow: 0 2px 5px rgba(0,0,0,0.05);">
	<div style="display: flex; justify-content: space-between; margin-bottom: 12px;">
	<div>
	<span style="font-weight: 600; font-size: 16px;">Training Status: </span>
	<span style="color: #1976d2; font-weight: 500; font-size: 16px;">Preparing dataset and model...</span>
	</div>
	</div>
	<div style="font-size: 14px; color: #555; margin-top: 10px;">
	<p>• Loading dataset</p>
	<p>• Initializing model architecture</p>
	<p>• Setting up training environment</p>
	</div>
	</div>
	"""
	yield initial_stats, preparing_status_html, "Best Model: None", gr.update(value="", visible=False), None, None, gr.update(visible=False)

	# Save arguments to file
	save_arguments(args_dict, args_dict.get('output_dir', 'ckpt'))

	# Start training
	is_training = True
	process_aborted = False # Reset abort flag
	monitor.start_training(args_dict)
	current_process = monitor.process # Store the process reference

	starting_status_html = """
	<div style="background-color: #f8f9fa; border-radius: 10px; padding: 20px; margin-bottom: 15px; box-shadow: 0 2px 5px rgba(0,0,0,0.05);">
	<div style="display: flex; justify-content: space-between; margin-bottom: 12px;">
	<div>
	<span style="font-weight: 600; font-size: 16px;">Training Status: </span>
	<span style="color: #1976d2; font-weight: 500; font-size: 16px;">Starting training process...</span>
	</div>
	</div>
	<div style="font-size: 14px; color: #555; margin-top: 10px;">
	<p>• Training process launched</p>
	<p>• Waiting for first statistics to appear</p>
	<p>• This may take a moment for large models</p>
	</div>
	</div>
	"""

	yield initial_stats, starting_status_html, "Best Model: None", gr.update(value="", visible=False), None, None, gr.update(visible=False)

	# Add delay to ensure enough time for parsing initial statistics
	for i in range(3):
	time.sleep(1)
	# Check if statistics are already available
	stats = monitor.get_stats()
	if stats and len(stats) > 0:
	break

	update_count = 0
	while True:
	# Check if the process still exists and hasn't been aborted
	if process_aborted or not monitor.is_training or current_process is None or (current_process and current_process.poll() is not None):
	break

	try:
	update_count += 1
	time.sleep(0.5)

	# Check process status
	monitor.check_process_status()

	# Get latest progress info
	progress_info = monitor.get_progress()

	# If process has ended, check if it's normal end or error
	if not monitor.is_training:
	# Check both monitor.process and current_process since they might be different objects
	if (monitor.process and monitor.process.returncode != 0) or (current_process and current_process.poll() is not None and current_process.returncode != 0):
	# Get the return code from whichever process object is available
	return_code = monitor.process.returncode if monitor.process else current_process.returncode
	# Get complete output log
	error_output = "\n".join(progress_info.get("lines", []))
	if not error_output:
	error_output = "No output captured from the training process"

	# Ensure we set the is_completed flag to False for errors
	progress_info['is_completed'] = False
	monitor.current_progress['is_completed'] = False

	# Also set the stage to Error
	progress_info['stage'] = 'Error'
	monitor.current_progress['stage'] = 'Error'

	error_status_html = f"""
	<div style="padding: 10px; background-color: #ffebee; border-radius: 5px; margin-bottom: 10px;">
	<p style="margin: 0; color: #c62828; font-weight: bold;">Training failed with error code {return_code}:</p>
	<pre style="margin: 5px 0 0; white-space: pre-wrap; max-height: 300px; overflow-y: auto; background-color: #f5f5f5; padding: 10px; border-radius: 4px; font-family: monospace;">{error_output}</pre>
	</div>
	"""
	yield (
	initial_stats,
	error_status_html,
	"Training failed",
	gr.update(value="", visible=False),
	None,
	None,
	gr.update(visible=False)
	)
	return
	else:
	# Only set is_completed to True if there was a successful exit code
	progress_info['is_completed'] = True
	monitor.current_progress['is_completed'] = True

	# Update UI
	stats = monitor.get_stats()
	if stats:
	model_stats = update_model_stats(stats)
	else:
	model_stats = initial_stats

	status_html, best_info, test_html_update, loss_fig, metrics_fig, download_btn_update = update_progress(progress_info)

	yield model_stats, status_html, best_info, test_html_update, loss_fig, metrics_fig, download_btn_update

	except Exception as e:
	# Get complete output log
	error_output = "\n".join(progress_info.get("lines", []))
	if not error_output:
	error_output = "No output captured from the training process"

	error_status_html = f"""
	<div style="padding: 10px; background-color: #ffebee; border-radius: 5px; margin-bottom: 10px;">
	<p style="margin: 0; color: #c62828; font-weight: bold;">Error during training:</p>
	<p style="margin: 5px 0; color: #c62828;">{str(e)}</p>
	<pre style="margin: 5px 0 0; white-space: pre-wrap; max-height: 300px; overflow-y: auto; background-color: #f5f5f5; padding: 10px; border-radius: 4px; font-family: monospace;">{error_output}</pre>
	</div>
	"""
	print(f"Error updating UI: {str(e)}")
	traceback.print_exc()
	yield initial_stats, error_status_html, "Training error", gr.update(value="", visible=False), None, None, gr.update(visible=False)
	return

	# Check if aborted
	if process_aborted:
	is_training = False
	current_process = None
	aborted_status_html = """
	<div style="padding: 10px; background-color: #e8f5e9; border-radius: 5px;">
	<p style="margin: 0; color: #2e7d32; font-weight: bold;">Training was manually terminated.</p>
	</div>
	"""
	yield initial_stats, aborted_status_html, "Training aborted", gr.update(value="", visible=False), None, None, gr.update(visible=False)
	return

	# Final update after training ends (only for normal completion)
	if monitor.process and monitor.process.returncode == 0:
	try:
	progress_info = monitor.get_progress()
	progress_info['is_completed'] = True
	monitor.current_progress['is_completed'] = True

	stats = monitor.get_stats()
	if stats:
	model_stats = update_model_stats(stats)
	else:
	model_stats = initial_stats

	status_html, best_info, test_html_update, loss_fig, metrics_fig, download_btn_update = update_progress(progress_info)

	yield model_stats, status_html, best_info, test_html_update, loss_fig, metrics_fig, download_btn_update
	except Exception as e:
	error_output = "\n".join(progress_info.get("lines", []))
	if not error_output:
	error_output = "No output captured from the training process"

	error_status_html = f"""
	<div style="padding: 10px; background-color: #ffebee; border-radius: 5px; margin-bottom: 10px;">
	<p style="margin: 0; color: #c62828; font-weight: bold;">Error in final update:</p>
	<p style="margin: 5px 0; color: #c62828;">{str(e)}</p>
	<pre style="margin: 5px 0 0; white-space: pre-wrap; max-height: 300px; overflow-y: auto; background-color: #f5f5f5; padding: 10px; border-radius: 4px; font-family: monospace;">{error_output}</pre>
	</div>
	"""
	yield initial_stats, error_status_html, "Error in final update", gr.update(value="", visible=False), None, None, gr.update(visible=False)

	except Exception as e:
	# Initialization error, may not have output log
	error_status_html = f"""
	<div style="padding: 10px; background-color: #ffebee; border-radius: 5px; margin-bottom: 10px;">
	<p style="margin: 0; color: #c62828; font-weight: bold;">Training initialization failed:</p>
	<p style="margin: 5px 0; color: #c62828;">{str(e)}</p>
	</div>
	"""
	yield initial_stats, error_status_html, "Training failed", gr.update(value="", visible=False), None, None, gr.update(visible=False)
	finally:
	is_training = False
	current_process = None

	def handle_abort():
	"""Handle abortion of the training process"""
	nonlocal is_training, current_process, stop_thread, process_aborted

	if not is_training or current_process is None:
	return (gr.HTML("""
	<div style="padding: 10px; background-color: #f5f5f5; border-radius: 5px;">
	<p style="margin: 0;">No training process is currently running.</p>
	</div>
	"""),
	[["Training Model", "-", "-", "-"],
	["Pre-trained Model", "-", "-", "-"],
	["Combined Model", "-", "-", "-"]],
	"Best Model: None",
	gr.update(value="", visible=False),
	None,
	None,
	gr.update(visible=False))

	try:
	# Set the abort flag before terminating the process
	process_aborted = True
	stop_thread = True

	# Use process.terminate() instead of os.killpg for safer termination
	# This avoids accidentally killing the parent WebUI process
	current_process.terminate()

	# Wait for process to terminate (with timeout)
	try:
	current_process.wait(timeout=5)
	except subprocess.TimeoutExpired:
	# Only if terminate didn't work, use a stronger method
	# But do NOT use killpg which might kill the parent WebUI
	current_process.kill()

	# Create a completely fresh state - not just resetting
	monitor.is_training = False

	# Explicitly create a new dictionary instead of modifying the existing one
	monitor.current_progress = {
	"current": 0,
	"total": 0,
	"epoch": 0,
	"stage": "Waiting",
	"progress_detail": "",
	"best_epoch": -1,
	"best_metric_name": "",
	"best_metric_value": 0.0,
	"elapsed_time": "",
	"remaining_time": "",
	"it_per_sec": 0.0,
	"grad_step": 0,
	"loss": 0.0,
	"test_results_html": "",
	"test_metrics": {},
	"is_completed": False,
	"lines": []
	}

	# Explicitly clear stats by creating a new dictionary
	monitor.stats = {}

	if hasattr(monitor, "process") and monitor.process:
	monitor.process = None

	# Reset state variables
	is_training = False
	current_process = None

	# Explicitly reset tracking to clear all state
	monitor._reset_tracking()
	monitor._reset_stats()

	# Reset all plots and statistics with new empty lists
	monitor.train_losses = []
	monitor.val_losses = []
	monitor.metrics = {}
	monitor.epochs = []

	# Create entirely fresh UI components
	empty_model_stats = [["Training Model", "-", "-", "-"],
	["Pre-trained Model", "-", "-", "-"],
	["Combined Model", "-", "-", "-"]]

	success_html = """
	<div style="padding: 10px; background-color: #e8f5e9; border-radius: 5px;">
	<p style="margin: 0; color: #2e7d32; font-weight: bold;">Training successfully terminated!</p>
	<p style="margin: 5px 0 0; color: #388e3c;">All training state has been reset. You can start a new training session.</p>
	</div>
	"""

	# Return updates for all relevant components
	return (gr.HTML(success_html),
	empty_model_stats,
	"Best Model: None",
	gr.update(value="", visible=False),
	None,
	None,
	gr.update(visible=False))
	except Exception as e:
	# Still need to reset states even if there's an error
	is_training = False
	current_process = None
	process_aborted = False

	# Reset monitor state regardless of error
	monitor.is_training = False
	monitor.stats = {}
	if hasattr(monitor, "process") and monitor.process:
	monitor.process = None
	monitor._reset_tracking()
	monitor._reset_stats()

	# Fresh empty components
	empty_model_stats = [["Training Model", "-", "-", "-"],
	["Pre-trained Model", "-", "-", "-"],
	["Combined Model", "-", "-", "-"]]

	error_html = f"""
	<div style="padding: 10px; background-color: #ffebee; border-radius: 5px;">
	<p style="margin: 0; color: #c62828; font-weight: bold;">Failed to terminate training: {str(e)}</p>
	<p style="margin: 5px 0 0; color: #c62828;">Training state has been reset.</p>
	</div>
	"""

	# Return updates for all relevant components including empty model stats
	return (gr.HTML(error_html),
	empty_model_stats,
	"Best Model: None",
	gr.update(value="", visible=False),
	None,
	None,
	gr.update(visible=False))

	def update_wandb_visibility(checkbox):
	    """Show or hide the W&B project/entity fields to match the checkbox value."""
	    visibility_updates = {}
	    for wandb_field in (wandb_project, wandb_entity):
	        visibility_updates[wandb_field] = gr.update(visible=checkbox)
	    return visibility_updates

	# Ordered list of every input component handed to the button handlers.
	# The values arrive positionally (as *args) and TrainingArgs reads them by
	# index, so the trailing "#n" on each entry is the index it is read at
	# (e.g. args[0] is the PLM model key, args[12] the learning rate).
	# Reordering or inserting entries requires updating TrainingArgs as well.
	input_components = [
	plm_model, #0
	is_custom_dataset, #1
	dataset_config, #2
	dataset_custom, #3
	problem_type, #4
	num_labels, #5
	metrics, #6
	training_method, #7
	pooling_method, #8
	batch_mode, #9
	batch_size, #10
	batch_token, #11
	learning_rate, #12
	num_epochs, #13
	max_seq_len, #14
	gradient_accumulation_steps, #15
	warmup_steps, #16
	scheduler_type, #17
	output_model_name, #18
	output_dir, #19
	wandb_logging, #20
	wandb_project, #21
	wandb_entity, #22
	patience, #23
	num_workers, #24
	max_grad_norm, #25
	structure_seq, #26
	lora_r, #27
	lora_alpha, #28
	lora_dropout, #29
	lora_target_modules, #30
	]

	# Handlers for the preview and train buttons (bound to the buttons further below)
	def handle_preview(*args):
	    """Toggle the command preview box.

	    Args:
	        *args: Current values of ``input_components``, in list order.

	    Returns:
	        A ``gr.update`` that hides the preview when it is flagged visible,
	        otherwise one that shows it filled with the generated command text.
	    """
	    # NOTE(review): this reads ``visible`` from the component object itself;
	    # confirm it tracks the live UI state and not only the constructor value.
	    if not command_preview.visible:
	        parsed_args = TrainingArgs(args, plm_models, dataset_configs)
	        command_text = preview_command(parsed_args.to_dict())
	        return gr.update(value=command_text, visible=True)
	    return gr.update(visible=False)

	def reset_train_ui():
	    """Clear the monitor and blank the training widgets before a new run.

	    Returns:
	        tuple: Seven values, one per output component, in the order
	        (model stats rows, progress HTML, best-model text, test-results
	        update, loss plot, metrics plot, download-button update).
	    """
	    # Let the monitor clear its own bookkeeping first
	    monitor._reset_tracking()
	    monitor._reset_stats()

	    # Then overwrite the stats container explicitly, if the monitor has one
	    if hasattr(monitor, "stats"):
	        monitor.stats = {}

	    # Brand-new progress record (never a mutated copy of the old one)
	    monitor.current_progress = dict(
	        current=0,
	        total=0,
	        epoch=0,
	        stage="Waiting",
	        progress_detail="",
	        best_epoch=-1,
	        best_metric_name="",
	        best_metric_value=0.0,
	        elapsed_time="",
	        remaining_time="",
	        it_per_sec=0.0,
	        grad_step=0,
	        loss=0.0,
	        test_results_html="",
	        test_metrics={},
	        is_completed=False,
	        lines=[],
	    )

	    # Empty histories for the plots
	    monitor.train_losses, monitor.val_losses = [], []
	    monitor.metrics = {}
	    monitor.epochs = []

	    # Placeholder rows for the model statistics table
	    row_labels = ("Training Model", "Pre-trained Model", "Combined Model")
	    blank_rows = [[label, "-", "-", "-"] for label in row_labels]

	    preparing_banner = """
	<div style="background-color: #f8f9fa; border-radius: 10px; padding: 20px; margin-bottom: 15px; box-shadow: 0 2px 5px rgba(0,0,0,0.05);">
	<div style="display: flex; justify-content: space-between; margin-bottom: 12px;">
	<div>
	<span style="font-weight: 600; font-size: 16px;">Training Status: </span>
	<span style="color: #1976d2; font-weight: 500; font-size: 16px;">Preparing to start training...</span>
	</div>
	</div>
	</div>
	"""

	    hidden_test_results = gr.update(value="", visible=False)
	    hidden_download_button = gr.update(visible=False)

	    # Both plot slots must be None (not strings) to clear them
	    return (
	        blank_rows,
	        preparing_banner,
	        "Best Model: None",
	        hidden_test_results,
	        None,
	        None,
	        hidden_download_button,
	    )

	# Preview button: handle_preview receives every input value and returns a
	# single update for the command preview box.
	preview_button.click(
	fn=handle_preview,
	inputs=input_components,
	outputs=[command_preview]
	)

	# Train button: first reset_train_ui (no inputs), then handle_train with the
	# full input list. Both steps write to the same seven output components,
	# in this order.
	train_button.click(
	fn=reset_train_ui,
	outputs=[model_stats, progress_status, best_model_info, test_results_html, loss_plot, metrics_plot, download_csv_btn]
	).then(
	fn=handle_train,
	inputs=input_components,
	outputs=[model_stats, progress_status, best_model_info, test_results_html, loss_plot, metrics_plot, download_csv_btn]
	)

	# Abort button: note the output order starts with progress_status, matching
	# handle_abort, which returns the status HTML first and the stats rows second.
	abort_button.click(
	fn=handle_abort,
	outputs=[progress_status, model_stats, best_model_info, test_results_html, loss_plot, metrics_plot, download_csv_btn]
	)

	# W&B checkbox: toggles visibility of the project and entity fields.
	wandb_logging.change(
	fn=update_wandb_visibility,
	inputs=[wandb_logging],
	outputs=[wandb_project, wandb_entity]
	)

	def update_dataset_preview(dataset_type=None, dataset_name=None, custom_dataset=None):
	    """Build the dataset preview: split sizes plus up to three sample rows.

	    Args:
	        dataset_type: "Use Custom Dataset" or "Use Pre-defined Dataset".
	        dataset_name: Key into ``dataset_configs`` (pre-defined mode).
	        custom_dataset: Identifier passed to ``load_dataset`` (custom mode).

	    Returns:
	        tuple: Three ``gr.update`` objects for (stats HTML, preview table,
	        accordion). Loading errors are caught and rendered in the stats
	        HTML and the table instead of being raised.
	    """
	    import html  # local import: escape text before embedding it in HTML

	    def _placeholder(stats_value, first_cell, second_cell="-"):
	        # One-row table used when there is nothing real to show.
	        return (gr.update(value=stats_value),
	                gr.update(value=[[first_cell, second_cell, "-"]], headers=["Name", "Sequence", "Label"]),
	                gr.update(open=True))

	    def _split_size(dataset, split_name):
	        # Number of rows in a split, or 0 when the split does not exist.
	        return len(dataset[split_name]) if split_name in dataset else 0

	    def _error_preview(exc):
	        # Exception text is escaped so markup-like characters in the
	        # message are displayed literally instead of being parsed as HTML.
	        error_html = f"""
	<div>
	<h2>Error loading dataset</h2>
	<p style="color: #c62828;">{html.escape(str(exc))}</p>
	</div>
	"""
	        return _placeholder(error_html, "Error", str(exc))

	    def _render_preview(dataset, display_name):
	        # Shared rendering for custom and pre-defined datasets.
	        stats_html = f"""
	<div style="text-align: center; margin: 20px 0;">
	<table style="width: 100%; border-collapse: collapse; margin: 0 auto;">
	<tr>
	<th style="padding: 8px; font-size: 14px; border: 1px solid #ddd; background-color: #e0e0e0; font-weight: bold; border-bottom: 1px solid #ccc; text-align: center;">Dataset</th>
	<th style="padding: 8px; font-size: 14px; border: 1px solid #ddd; background-color: #e0e0e0; font-weight: bold; border-bottom: 1px solid #ccc; text-align: center;">Train Samples</th>
	<th style="padding: 8px; font-size: 14px; border: 1px solid #ddd; background-color: #e0e0e0; font-weight: bold; border-bottom: 1px solid #ccc; text-align: center;">Val Samples</th>
	<th style="padding: 8px; font-size: 14px; border: 1px solid #ddd; background-color: #e0e0e0; font-weight: bold; border-bottom: 1px solid #ccc; text-align: center;">Test Samples</th>
	</tr>
	<tr>
	<td style="padding: 15px; font-size: 14px; border: 1px solid #ddd; text-align: center;">{html.escape(str(display_name))}</td>
	<td style="padding: 15px; font-size: 14px; border: 1px solid #ddd; text-align: center;">{_split_size(dataset, "train")}</td>
	<td style="padding: 15px; font-size: 14px; border: 1px solid #ddd; text-align: center;">{_split_size(dataset, "validation")}</td>
	<td style="padding: 15px; font-size: 14px; border: 1px solid #ddd; text-align: center;">{_split_size(dataset, "test")}</td>
	</tr>
	</table>
	</div>
	"""

	        # Prefer the train split; fall back to the first available split so
	        # datasets without a "train" split can still be previewed.
	        split = "train" if "train" in dataset else list(dataset.keys())[0]
	        samples = dataset[split].select(range(min(3, len(dataset[split]))))
	        if len(samples) == 0:
	            return _placeholder(stats_html, "No data available")

	        # Use whatever fields the dataset actually has; values are shown
	        # in full (no truncation) as strings.
	        available_fields = list(samples[0].keys())
	        sample_data = [
	            {field: str(sample[field]) for field in available_fields}
	            for sample in samples
	        ]

	        df = pd.DataFrame(sample_data)
	        return (gr.update(value=stats_html),
	                gr.update(value=df.values.tolist(), headers=df.columns.tolist()),
	                gr.update(open=True))

	    if dataset_type == "Use Custom Dataset" and custom_dataset:
	        try:
	            return _render_preview(load_dataset(custom_dataset), custom_dataset)
	        except Exception as e:
	            return _error_preview(e)

	    elif dataset_type == "Use Pre-defined Dataset" and dataset_name:
	        try:
	            config_path = dataset_configs[dataset_name]
	            with open(config_path, 'r') as f:
	                config = json.load(f)
	            return _render_preview(load_dataset(config["dataset"]), config["dataset"])
	        except Exception as e:
	            return _error_preview(e)

	    # No usable dataset selection was provided
	    return _placeholder("", "No dataset selected")

	# Dataset preview button: passes the dataset mode, the selected pre-defined
	# dataset and the custom dataset value (matching the parameter order of
	# update_dataset_preview) and refreshes the stats HTML, the sample table
	# and the accordion.
	dataset_preview_button.click(
	fn=update_dataset_preview,
	inputs=[is_custom_dataset, dataset_config, dataset_custom],
	outputs=[dataset_stats_md, preview_table, preview_accordion]
	)

	# Handler that updates the dataset-related settings widgets
	def update_dataset_settings(choice, dataset_name=None):
	    """Return widget updates for the selected dataset mode.

	    Args:
	        choice: Dataset mode; "Use Pre-defined Dataset" selects the
	            pre-defined branch, any other value the custom branch.
	        dataset_name: Key into ``dataset_configs``; when present, its JSON
	            config supplies problem type, label count and metrics.

	    Returns:
	        dict: Maps components to ``gr.update`` objects. In pre-defined mode
	        without a known dataset only the three visibility updates are
	        returned.
	    """
	    if choice != "Use Pre-defined Dataset":
	        # Custom dataset: restore defaults and make the fields editable.
	        # The metrics widget is multi-select, so its default is a list.
	        default_metrics = ["accuracy", "mcc", "f1", "precision", "recall", "auroc"]
	        return {
	            dataset_config: gr.update(visible=False),
	            dataset_custom: gr.update(visible=True),
	            custom_dataset_settings: gr.update(visible=True),
	            problem_type: gr.update(value="single_label_classification", interactive=True),
	            num_labels: gr.update(value=2, interactive=True),
	            metrics: gr.update(value=default_metrics, interactive=True)
	        }

	    # Pre-defined dataset: show the dataset selector, hide the custom input
	    result = {
	        dataset_config: gr.update(visible=True),
	        dataset_custom: gr.update(visible=False),
	        custom_dataset_settings: gr.update(visible=True)
	    }

	    # When a known dataset is selected, load its config and lock the fields
	    if dataset_name and dataset_name in dataset_configs:
	        with open(dataset_configs[dataset_name], 'r') as f:
	            config = json.load(f)

	        # Convert the comma-separated metrics string into a list for the
	        # multi-select widget. Entries are trimmed and empty ones dropped so
	        # "accuracy, mcc" does not yield values with stray spaces.
	        metrics_value = config.get("metrics", "accuracy,mcc,f1,precision,recall,auroc")
	        if isinstance(metrics_value, str):
	            metrics_value = [name.strip() for name in metrics_value.split(",") if name.strip()]

	        result.update({
	            problem_type: gr.update(value=config.get("problem_type", "single_label_classification"), interactive=False),
	            num_labels: gr.update(value=config.get("num_labels", 2), interactive=False),
	            metrics: gr.update(value=metrics_value, interactive=False),
	        })
	    return result

	# Bind the dataset-settings update events.
	# Switching the dataset mode passes both the mode and the currently selected
	# pre-defined dataset to update_dataset_settings.
	is_custom_dataset.change(
	fn=update_dataset_settings,
	inputs=[is_custom_dataset, dataset_config],
	outputs=[dataset_config, dataset_custom, custom_dataset_settings, problem_type, num_labels, metrics]
	)

	# Changing the pre-defined dataset always calls update_dataset_settings with
	# the mode fixed to "Use Pre-defined Dataset", so the selected dataset's
	# config is loaded.
	dataset_config.change(
	fn=lambda x: update_dataset_settings("Use Pre-defined Dataset", x),
	inputs=[dataset_config],
	outputs=[dataset_config, dataset_custom, custom_dataset_settings, problem_type, num_labels, metrics]
	)

	# Return the components that need to be accessed from outside this tab:
	# the main output widgets, the train button, the shared monitor, and a
	# name -> component map of the training inputs.
	# NOTE(review): is_custom_dataset, dataset_custom, problem_type, num_labels
	# and metrics are not part of the "components" map — confirm this is intended.
	return {
	"output_text": progress_status,
	"loss_plot": loss_plot,
	"metrics_plot": metrics_plot,
	"train_button": train_button,
	"monitor": monitor,
	"test_results_html": test_results_html, # test results HTML component
	"components": {
	"plm_model": plm_model,
	"dataset_config": dataset_config,
	"training_method": training_method,
	"pooling_method": pooling_method,
	"batch_mode": batch_mode,
	"batch_size": batch_size,
	"batch_token": batch_token,
	"learning_rate": learning_rate,
	"num_epochs": num_epochs,
	"max_seq_len": max_seq_len,
	"gradient_accumulation_steps": gradient_accumulation_steps,
	"warmup_steps": warmup_steps,
	"scheduler_type": scheduler_type,
	"output_model_name": output_model_name,
	"output_dir": output_dir,
	"wandb_logging": wandb_logging,
	"wandb_project": wandb_project,
	"wandb_entity": wandb_entity,
	"patience": patience,
	"num_workers": num_workers,
	"max_grad_norm": max_grad_norm,
	"structure_seq": structure_seq,
	"lora_r": lora_r,
	"lora_alpha": lora_alpha,
	"lora_dropout": lora_dropout,
	"lora_target_modules": lora_target_modules,
	}
	}