Spaces:

SemViQA
/

semviqa-demo

Sleeping

App Files Files Community

xuandin committed on Mar 19

Commit

270b4c0

verified ·

1 Parent(s): 7c117db

Update app.py

Browse files

Files changed (1) hide show

app.py +169 -14

app.py CHANGED Viewed

@@ -10,6 +10,9 @@ import pandas as pd
 import os
 import psutil
 import gc
 # Set environment variables to optimize CPU performance
 os.environ["OMP_NUM_THREADS"] = str(psutil.cpu_count(logical=False))
@@ -80,6 +83,69 @@ def perform_verification(claim, context, model_qatc, tokenizer_qatc, model_tc, t
         "pred_bc": pred_bc
     }
 # Set page configuration
 st.set_page_config(
@@ -234,6 +300,34 @@ st.markdown("""
         background-color: var(--primary-color);
         color: white;
     }
     </style>
 """, unsafe_allow_html=True)
@@ -319,7 +413,7 @@ with st.sidebar:
     os.environ["MKL_NUM_THREADS"] = str(num_threads)
 # Main content
-tabs = st.tabs(["🔍 Kiểm chứng", "📊 Lịch sử", "ℹ️ Thông tin"])
 tokenizer_qatc, model_qatc = load_model(qatc_model_name, QATCForQuestionAnswering, device=DEVICE)
 tokenizer_bc, model_bc = load_model(bc_model_name, ClaimModelForClassification, is_bc=True, device=DEVICE)
@@ -440,9 +534,22 @@ with tabs[0]:
 # --- Tab History ---
 with tabs[1]:
     st.markdown("### 📊 Lịch sử Kiểm chứng")
     if 'history' in st.session_state and st.session_state.history:
         # Download full history
-        history_df = pd.DataFrame(st.session_state.history)
         st.download_button(
             "📥 Tải toàn bộ lịch sử",
             data=history_df.to_csv(index=False).encode('utf-8'),
@@ -450,21 +557,61 @@ with tabs[1]:
             mime="text/csv"
         )
-        # Display history
-        for idx, record in enumerate(reversed(st.session_state.history), 1):
-            st.markdown(f"""
-                <div class="result-box">
-                    <h4>Kiểm chứng #{idx}</h4>
-                    <p><strong>Câu khẳng định:</strong> {record['claim']}</p>
-                    <p><strong>Kết luận:</strong> {verdict_icons.get(record['verdict'], '')} {record['verdict']}</p>
-                    <p><strong>Thời gian:</strong> {record['total_time']:.2f} giây</p>
-                </div>
-            """, unsafe_allow_html=True)
     else:
-        st.info("Chưa có lịch sử kiểm chứng.")
 # --- Tab Info ---
-with tabs[2]:
     st.markdown("""
         <div class="result-box">
             <h3>ℹ️ Thông tin về SemViQA</h3>
@@ -491,5 +638,13 @@ with tabs[2]:
                 <li><strong>REFUTED:</strong> Câu khẳng định bị bác bỏ bởi bằng chứng</li>
                 <li><strong>NEI:</strong> Không đủ bằng chứng để kết luận</li>
             </ul>
         </div>
     """, unsafe_allow_html=True)

 import os
 import psutil
 import gc
+import plotly.express as px
+import plotly.graph_objects as go
+from datetime import datetime
 # Set environment variables to optimize CPU performance
 os.environ["OMP_NUM_THREADS"] = str(psutil.cpu_count(logical=False))
         "pred_bc": pred_bc
     }
+# Add new functions for analysis
def analyze_verdict_distribution(history):
    """Build a pie chart of how often each verdict occurs in the history.

    Args:
        history: Sequence of verification records (dicts). Only the
            ``'verdict'`` key of each record is read.

    Returns:
        A Plotly figure, or ``None`` when there is nothing to plot (empty
        history, or no record carries a ``'verdict'`` value).
    """
    if not history:
        return None
    df = pd.DataFrame(history)
    if 'verdict' not in df.columns:
        return None
    verdict_counts = df['verdict'].value_counts()
    if verdict_counts.empty:
        return None
    # Pin every verdict to a fixed colour. A bare colour sequence is handed
    # out in slice order (most frequent verdict first), so REFUTED would be
    # drawn in green whenever it happened to be the most common verdict.
    verdict_colors = {
        'SUPPORTED': '#2ecc71',
        'REFUTED': '#e74c3c',
        'NEI': '#f1c40f',
    }
    return px.pie(
        values=verdict_counts.values,
        names=verdict_counts.index,
        color=verdict_counts.index,
        color_discrete_map=verdict_colors,
        title='Phân bố Kết quả Kiểm chứng',
    )
def analyze_processing_time(history):
    """Build a line chart of processing times against record timestamps.

    Args:
        history: Sequence of verification records (dicts). Reads the
            ``'timestamp'`` key and whichever of ``'evidence_time'``,
            ``'verdict_time'`` and ``'total_time'`` are present.

    Returns:
        A Plotly figure, or ``None`` when there is nothing to plot (empty
        history, no timestamps, or no timing columns).
    """
    if not history:
        return None
    df = pd.DataFrame(history)
    time_columns = [
        column
        for column in ('evidence_time', 'verdict_time', 'total_time')
        if column in df.columns
    ]
    # Records without the needed fields would otherwise raise KeyError;
    # callers already treat None as "no chart".
    if 'timestamp' not in df.columns or not time_columns:
        return None
    df['timestamp'] = pd.to_datetime(df['timestamp'])
    # The line is drawn in row order, so sort chronologically; the stable sort
    # keeps insertion order for records that share a timestamp.
    df = df.dropna(subset=['timestamp']).sort_values('timestamp', kind='stable')
    if df.empty:
        return None
    return px.line(
        df,
        x='timestamp',
        y=time_columns,
        title='Thời gian Xử lý theo Thời gian',
        labels={'value': 'Thời gian (giây)', 'timestamp': 'Thời điểm'},
    )
def generate_report(result):
    """Render one verification result as a plain-text report.

    Args:
        result: Mapping with the keys ``'claim'``, ``'verdict'``,
            ``'evidence'``, ``'details'``, ``'qatc_model'``, ``'bc_model'``,
            ``'tc_model'`` and the numeric ``'evidence_time'``,
            ``'verdict_time'`` and ``'total_time'``.

    Returns:
        The report text, one item per line, stamped with the current local
        time.

    Raises:
        KeyError: If ``result`` lacks one of the keys listed above.
    """
    generated_at = datetime.now().strftime('%d/%m/%Y %H:%M:%S')
    # Assemble the report line by line: an indented triple-quoted template
    # would leak the function-body indentation into every output line (and
    # leave multi-line evidence/details misaligned with the rest).
    lines = [
        "BÁO CÁO KIỂM CHỨNG THÔNG TIN",
        f"Thời gian: {generated_at}",
        "1. THÔNG TIN CƠ BẢN",
        "-------------------",
        f"Câu khẳng định: {result['claim']}",
        f"Kết luận: {result['verdict']}",
        "2. BẰNG CHỨNG",
        "-------------",
        f"{result['evidence']}",
        "3. THỐNG KÊ THỜI GIAN",
        "---------------------",
        f"- Thời gian trích xuất bằng chứng: {result['evidence_time']:.2f} giây",
        f"- Thời gian phân loại: {result['verdict_time']:.2f} giây",
        f"- Tổng thời gian xử lý: {result['total_time']:.2f} giây",
        "4. CHI TIẾT KỸ THUẬT",
        "-------------------",
        f"{result['details']}",
        "5. MÔ HÌNH SỬ DỤNG",
        "------------------",
        f"- QATC Model: {result['qatc_model']}",
        f"- Binary Classification Model: {result['bc_model']}",
        f"- 3-Class Classification Model: {result['tc_model']}",
    ]
    return "\n".join(lines) + "\n"
 # Set page configuration
 st.set_page_config(
         background-color: var(--primary-color);
         color: white;
     }
+    /* Analysis box styling */
+    .analysis-box {
+        background-color: white;
+        border-radius: 12px;
+        padding: 1.5rem;
+        margin: 1rem 0;
+        box-shadow: 0 2px 4px rgba(0, 0, 0, 0.05);
+    }
+    /* Search box styling */
+    .search-box {
+        background-color: white;
+        border-radius: 8px;
+        padding: 1rem;
+        margin-bottom: 1rem;
+        box-shadow: 0 2px 4px rgba(0, 0, 0, 0.05);
+    }
+    /* Comparison box styling */
+    .comparison-box {
+        background-color: white;
+        border-radius: 12px;
+        padding: 1.5rem;
+        margin: 1rem 0;
+        box-shadow: 0 2px 4px rgba(0, 0, 0, 0.05);
+        border-left: 4px solid var(--primary-color);
+    }
     </style>
 """, unsafe_allow_html=True)
     os.environ["MKL_NUM_THREADS"] = str(num_threads)
 # Main content
+tabs = st.tabs(["🔍 Kiểm chứng", "📊 Lịch sử", "📈 Phân tích", "ℹ️ Thông tin"])
 tokenizer_qatc, model_qatc = load_model(qatc_model_name, QATCForQuestionAnswering, device=DEVICE)
 tokenizer_bc, model_bc = load_model(bc_model_name, ClaimModelForClassification, is_bc=True, device=DEVICE)
 # --- Tab History ---
 with tabs[1]:
     st.markdown("### 📊 Lịch sử Kiểm chứng")
+    # Add search functionality
+    search_query = st.text_input("🔍 Tìm kiếm trong lịch sử", "")
     if 'history' in st.session_state and st.session_state.history:
+        # Filter history based on search query
+        filtered_history = st.session_state.history
+        if search_query:
+            filtered_history = [
+                record for record in st.session_state.history
+                if search_query.lower() in record['claim'].lower() or
+                   search_query.lower() in record['evidence'].lower()
+            ]
         # Download full history
+        history_df = pd.DataFrame(filtered_history)
         st.download_button(
             "📥 Tải toàn bộ lịch sử",
             data=history_df.to_csv(index=False).encode('utf-8'),
             mime="text/csv"
         )
+        # Display history with comparison option
+        for idx, record in enumerate(reversed(filtered_history), 1):
+            col1, col2 = st.columns([3, 1])
+            with col1:
+                st.markdown(f"""
+                    <div class="result-box">
+                        <h4>Kiểm chứng #{idx}</h4>
+                        <p><strong>Câu khẳng định:</strong> {record['claim']}</p>
+                        <p><strong>Kết luận:</strong> {verdict_icons.get(record['verdict'], '')} {record['verdict']}</p>
+                        <p><strong>Thời gian:</strong> {record['total_time']:.2f} giây</p>
+                    </div>
+                """, unsafe_allow_html=True)
+            with col2:
+                if st.button("🔄 So sánh", key=f"compare_{idx}"):
+                    st.session_state.selected_for_comparison = record
+# --- Tab Analysis ---
+with tabs[2]:
+    st.markdown("### 📈 Phân tích Chi tiết")
+    if 'history' in st.session_state and st.session_state.history:
+        # Add timestamp to history records
+        for record in st.session_state.history:
+            if 'timestamp' not in record:
+                record['timestamp'] = datetime.now()
+        # Distribution analysis
+        st.markdown("#### 📊 Phân bố Kết quả")
+        verdict_fig = analyze_verdict_distribution(st.session_state.history)
+        if verdict_fig:
+            st.plotly_chart(verdict_fig, use_container_width=True)
+        # Processing time analysis
+        st.markdown("#### ⏱️ Phân tích Thời gian Xử lý")
+        time_fig = analyze_processing_time(st.session_state.history)
+        if time_fig:
+            st.plotly_chart(time_fig, use_container_width=True)
+        # Model performance analysis
+        st.markdown("#### 🧠 Phân tích Hiệu suất Mô hình")
+        model_stats = pd.DataFrame(st.session_state.history)
+        if not model_stats.empty:
+            st.markdown("##### Thống kê theo Mô hình")
+            model_performance = model_stats.groupby(['qatc_model', 'bc_model', 'tc_model']).agg({
+                'total_time': ['mean', 'count'],
+                'verdict': lambda x: (x == 'SUPPORTED').mean()
+            }).round(2)
+            st.dataframe(model_performance)
     else:
+        st.info("Chưa có dữ liệu để phân tích.")
 # --- Tab Info ---
+with tabs[3]:
     st.markdown("""
         <div class="result-box">
             <h3>ℹ️ Thông tin về SemViQA</h3>
                 <li><strong>REFUTED:</strong> Câu khẳng định bị bác bỏ bởi bằng chứng</li>
                 <li><strong>NEI:</strong> Không đủ bằng chứng để kết luận</li>
             </ul>
+            <h4>🆕 Tính năng Mới</h4>
+            <ul>
+                <li><strong>Phân tích Chi tiết:</strong> Xem thống kê và biểu đồ về kết quả kiểm chứng</li>
+                <li><strong>Tìm kiếm Lịch sử:</strong> Dễ dàng tìm kiếm trong lịch sử kiểm chứng</li>
+                <li><strong>So sánh Kết quả:</strong> So sánh các kết quả kiểm chứng với nhau</li>
+                <li><strong>Báo cáo Chi tiết:</strong> Xuất báo cáo chi tiết về kết quả kiểm chứng</li>
+            </ul>
         </div>
     """, unsafe_allow_html=True)