Spaces:

kfkas
/

Tip

Runtime error

App Files Files Community

kfkas committed on Apr 2

Commit

f1454c7

1 Parent(s): 25bd246

z

Browse files

Files changed (3) hide show

app.py +11 -150
requirements.txt +4 -0
space.yaml +4 -0

app.py CHANGED Viewed

@@ -3,18 +3,13 @@ import shutil
 import cv2
 import base64
 import uuid
 from flask import Flask
 import gradio as gr
-import re
-# -----------------------------------------------------------------------------
-# Config: 앱 설정 (Gemma와 GPT4o 관련 설정은 제거)
-# -----------------------------------------------------------------------------
 class Config:
     """애플리케이션 설정 및 상수"""
-    # 음식 메뉴 데이터
     FOOD_ITEMS = [
         {"name": "짜장면", "image": "images/food1.jpg", "price": 7.00},
         {"name": "짬뽕", "image": "images/food2.jpg", "price": 8.50},
@@ -25,11 +20,9 @@ class Config:
         {"name": "콜라", "image": "images/food6.jpg", "price": 12.00},
         {"name": "사이다", "image": "images/food6.jpg", "price": 12.00},
     ]
     # 알리바바 Qwen API 키 (기본값은 빈 문자열)
     QWEN_API_KEY = ""
-    # 기본 프롬프트 템플릿
     DEFAULT_PROMPT_TEMPLATE = (
         "### Persona ###\n"
         "You are an expert tip calculation assistant focusing on service quality observed in a video.\n\n"
@@ -65,7 +58,6 @@ class Config:
         "Total Bill: $[Subtotal + Tip]"
     )
-    # Gradio UI용 CSS
     CUSTOM_CSS = """
     #food-container {
         display: grid;
@@ -74,21 +66,17 @@ class Config:
         overflow-y: auto;
         height: 600px;
     }
-    /* Qwen 버튼을 보라색으로 */
     #qwen-button {
         background-color: #8A2BE2 !important;
         color: white !important;
         border-color: #8A2BE2 !important;
     }
     #qwen-button:hover {
         background-color: #7722CC !important;
     }
     """
     def __init__(self):
-        # 이미지 디렉토리 확인
         if not os.path.exists("images"):
             print("경고: 'images' 폴더를 찾을 수 없습니다. 음식 이미지가 표시되지 않을 수 있습니다.")
         for item in self.FOOD_ITEMS:
@@ -96,12 +84,8 @@ class Config:
                 print(f"경고: 이미지 파일을 찾을 수 없습니다 - {item['image']}")
-# -----------------------------------------------------------------------------
-# ModelClients: 알리바바 Qwen API 클라이언트만 사용
-# -----------------------------------------------------------------------------
 class ModelClients:
-    """알리바바 Qwen API 클라이언트 관리"""
     def __init__(self, config: Config):
         self.config = config
         from openai import OpenAI as QwenOpenAI
@@ -111,56 +95,40 @@ class ModelClients:
         )
     def encode_video_qwen(self, video_path):
-        """Qwen API용 비디오 인코딩"""
         with open(video_path, "rb") as video_file:
             return base64.b64encode(video_file.read()).decode("utf-8")
-# -----------------------------------------------------------------------------
-# VideoProcessor: 비디오 처리 및 프레임 추출 기능 제공 (변경 없음)
-# -----------------------------------------------------------------------------
 class VideoProcessor:
-    """비디오 처리 및 프레임 추출 기능 제공"""
     def extract_video_frames(self, video_path, output_folder=None, fps=1):
-        """비디오 파일에서 프레임 추출"""
         if not video_path:
             return [], None
         if output_folder is None:
             output_folder = f"frames_list/frames_{uuid.uuid4().hex}"
         os.makedirs(output_folder, exist_ok=True)
         cap = cv2.VideoCapture(video_path)
         if not cap.isOpened():
             print(f"오류: 비디오 파일을 열 수 없습니다 - {video_path}")
             return [], None
         frame_paths = []
         frame_rate = cap.get(cv2.CAP_PROP_FPS)
         if not frame_rate or frame_rate == 0:
             print("경고: FPS를 읽을 수 없습니다, 기본값 4으로 설정합니다.")
             frame_rate = 4.0
         frame_interval = int(frame_rate / fps) if fps > 0 else 1
         if frame_interval <= 0:
             frame_interval = 1
         frame_count = 0
         saved_frame_count = 0
         while cap.isOpened():
             ret, frame = cap.read()
             if not ret:
                 break
             if frame is None:
                 print(f"경고: {frame_count}번째 프레임이 비어있습니다.")
                 frame_count += 1
                 continue
             if frame_count % frame_interval == 0:
                 frame_path = os.path.join(output_folder, f"frame_{saved_frame_count}.jpg")
                 try:
@@ -171,28 +139,22 @@ class VideoProcessor:
                         print(f"경고: {frame_path} 저장 실패.")
                 except Exception as e:
                     print(f"경고: 프레임 저장 오류 ({frame_path}): {e}")
             frame_count += 1
         cap.release()
         if not frame_paths:
             print("경고: 프레임 추출 실패.")
             if os.path.exists(output_folder):
                 shutil.rmtree(output_folder)
             return [], None
         return frame_paths, output_folder
     def cleanup_temp_files(self, video_path, frame_folder):
-        """임시 비디오 파일 및 프레임 폴더 정리"""
         if video_path and "temp_video_" in video_path and os.path.exists(video_path):
             try:
                 os.remove(video_path)
                 print(f"임시 비디오 파일 삭제: {video_path}")
             except OSError as e:
                 print(f"임시 비디오 파일 삭제 오류: {e}")
         if frame_folder and os.path.exists(frame_folder):
             try:
                 shutil.rmtree(frame_folder)
@@ -201,24 +163,18 @@ class VideoProcessor:
                 print(f"프레임 폴더 삭제 오류: {e}")
-# -----------------------------------------------------------------------------
-# TipCalculator: 팁 계산 핵심 로직 (알리바바 Qwen만 사용)
-# -----------------------------------------------------------------------------
 class TipCalculator:
-    """팁 계산 핵심 로직 (Alibaba Qwen만 사용)"""
     def __init__(self, config: Config, model_clients: ModelClients, video_processor: VideoProcessor):
         self.config = config
         self.model_clients = model_clients
         self.video_processor = video_processor
     def parse_llm_output(self, output_text):
-        """LLM 출력을 파싱하여 팁 계산 결과 추출"""
         analysis = "Analysis not found."
         tip_percentage = 0.0
         tip_amount = 0.0
         total_bill = 0.0
         analysis_match = re.search(r"Analysis:\s*(.*?)Tip Percentage:", output_text, re.DOTALL | re.IGNORECASE)
         if analysis_match:
             analysis = analysis_match.group(1).strip()
@@ -226,7 +182,6 @@ class TipCalculator:
             analysis_match_alt = re.search(r"Analysis:\s*(.*)", output_text, re.DOTALL | re.IGNORECASE)
             if analysis_match_alt:
                 analysis = analysis_match_alt.group(1).strip()
         percentage_match = re.search(r"Tip Percentage:\s*\*{0,2}(\d+(?:\.\d+)?)%\*{0,2}", output_text,
                                      re.DOTALL | re.IGNORECASE)
         if percentage_match:
@@ -235,7 +190,6 @@ class TipCalculator:
             except ValueError:
                 print(f"경고: Tip Percentage 변환 실패 - {percentage_match.group(1)}")
                 tip_percentage = 0.0
         tip_match = re.search(r"Tip Amount:\s*\$?\s*([0-9.]+)", output_text, re.IGNORECASE)
         if tip_match:
             try:
@@ -245,32 +199,24 @@ class TipCalculator:
                 tip_amount = 0.0
         else:
             print(f"경고: 출력에서 Tip Amount를 찾을 수 없습니다:\n{output_text}")
         total_match = re.search(r"Total Bill:\s*\$?\s*([0-9.]+)", output_text, re.IGNORECASE)
         if total_match:
             try:
                 total_bill = float(total_match.group(1))
             except ValueError:
                 print(f"경고: Total Bill 변환 실패 - {total_match.group(1)}")
         if len(analysis) < 20 and analysis == "Analysis not found.":
             analysis = output_text
         return analysis, tip_percentage, tip_amount, output_text
     def process_tip_qwen(self, video_file_path, star_rating, user_review, calculated_subtotal, custom_prompt=None):
-        """Qwen API를 사용한 팁 계산 처리 (비디오 캡션 생성 및 팁 산출)"""
         if not os.path.exists(video_file_path):
             return "Error: 비디오 파일 경로가 유효하지 않습니다.", 0.0, 0.0, [], None, ""
-        # 비디오 -> base64 인코딩
         base64_video = self.model_clients.encode_video_qwen(video_file_path)
-        # Omni 프롬프트
         omni_caption_prompt = '''
 Task 1: Describe the waiters' actions in these restaurant video frames. Please check for mistakes or negative behaviors.
 Task 2: Provide a short chronological summary of the entire scene.
 '''
-        # Omni 스트리밍 호출
         omni_result = self.model_clients.qwen_client.chat.completions.create(
             model="qwen2.5-omni-7b",
             messages=[
@@ -281,10 +227,7 @@ Task 2: Provide a short chronological summary of the entire scene.
                 {
                     "role": "user",
                     "content": [
-                        {
-                            "type": "video_url",
-                            "video_url": {"url": f"data:;base64,{base64_video}"},
-                        },
                         {"type": "text", "text": omni_caption_prompt},
                     ],
                 },
@@ -293,7 +236,6 @@ Task 2: Provide a short chronological summary of the entire scene.
             stream=True,
             stream_options={"include_usage": True},
         )
-        # 캡션 추출
         all_omni_chunks = list(omni_result)
         caption_text = ""
         for chunk in all_omni_chunks[:-1]:
@@ -303,8 +245,6 @@ Task 2: Provide a short chronological summary of the entire scene.
                 caption_text += chunk.choices[0].delta.content
         if not caption_text.strip():
             caption_text = "(No caption from Omni)"
-        # --- 2) qvq-max로 팁 계산 ---
         user_review = user_review.strip() if user_review else "(No user review)"
         if custom_prompt is None:
             prompt = self.config.DEFAULT_PROMPT_TEMPLATE.format(
@@ -325,22 +265,12 @@ Task 2: Provide a short chronological summary of the entire scene.
                     star_rating=star_rating,
                     user_review=user_review
                 )
         final_prompt = prompt.replace("{caption_text}", caption_text)
         qvq_result = self.model_clients.qwen_client.chat.completions.create(
             model="qwen2.5-vl-32b-instruct",
             messages=[
-                {
-                    "role": "system",
-                    "content": [{"type": "text", "text": "You are a helpful assistant."}],
-                },
-                {
-                    "role": "user",
-                    "content": [
-                        {"type": "text", "text": final_prompt}
-                    ],
-                },
             ],
             modalities=["text"],
             stream=True,
@@ -360,13 +290,11 @@ Task 2: Provide a short chronological summary of the entire scene.
                     print("\n" + "=" * 20 + "Complete Response" + "=" * 20 + "\n")
                     is_answering = True
                 final_answer += d.content
         final_text = final_reasoning + "\n" + final_answer
         analysis, tip_percentage, tip_amount, output_text = self.parse_llm_output(final_text)
         return analysis, tip_percentage, tip_amount, [], None, output_text
     def calculate_manual_tip(self, tip_percent, subtotal):
-        """백분율에 따른 수동 팁 계산"""
         tip_amount = subtotal * (tip_percent / 100)
         total_bill = subtotal + tip_amount
         analysis_output = f"Manual calculation using fixed tip percentage of {tip_percent}%."
@@ -375,51 +303,38 @@ Task 2: Provide a short chronological summary of the entire scene.
         return analysis_output, tip_output, total_bill_output
-# -----------------------------------------------------------------------------
-# UIHandler: Gradio UI 이벤트 및 콜백 처리 (Qwen만 사용, 알리바바 API 키 입력 필드 추가)
-# -----------------------------------------------------------------------------
 class UIHandler:
-    """Gradio UI 이벤트 및 콜백 처리"""
     def __init__(self, config: Config, tip_calculator: TipCalculator, video_processor: VideoProcessor):
         self.config = config
         self.tip_calculator = tip_calculator
         self.video_processor = video_processor
     def update_subtotal_and_prompt(self, *args):
-        """사용자 입력에 따라 소계 및 프롬프트 업데이트"""
         num_food_items = len(self.config.FOOD_ITEMS)
         quantities = args[:num_food_items]
         star_rating = args[num_food_items]
         user_review = args[num_food_items + 1]
         calculated_subtotal = 0.0
         for i in range(num_food_items):
             calculated_subtotal += self.config.FOOD_ITEMS[i]['price'] * quantities[i]
         user_review_text = user_review.strip() if user_review and user_review.strip() else "(No user review provided)"
         updated_prompt = self.config.DEFAULT_PROMPT_TEMPLATE.format(
             calculated_subtotal=calculated_subtotal,
             star_rating=star_rating,
             user_review=user_review_text
         )
         updated_prompt = updated_prompt.replace("{caption_text}", "{{caption_text}}")
         return calculated_subtotal, updated_prompt
     def compute_tip(self, alibaba_key, video_file_obj, subtotal, star_rating, user_review, custom_prompt_text):
-        """알리바바 Qwen 모델을 사용하여 팁 계산"""
         analysis_output = "계산을 시작합니다..."
         tip_percentage = 0.0
         tip_output = "$0.00"
         total_bill_output = f"${subtotal:.2f}"
         if video_file_obj is None:
             return "오류: 비디오 파일을 업로드해주세요.", "$0.00", total_bill_output, custom_prompt_text, gr.update(value=None)
         try:
-            # 입력받은 알리바바 API 키가 있으면 Qwen 클라이언트를 재설정
             if alibaba_key and alibaba_key.strip():
                 from openai import OpenAI as QwenOpenAI
                 self.tip_calculator.model_clients.qwen_client = QwenOpenAI(
@@ -433,7 +348,6 @@ class UIHandler:
         except Exception as e:
             print(f"임시 비디오 파일 생성 오류: {e}")
             return f"오류: 비디오 파일을 처리할 수 없습니다: {e}", "$0.00", total_bill_output, custom_prompt_text, None
         frame_folder = None
         try:
             analysis, tip_percentage, tip_amount, _, _, output_text = self.tip_calculator.process_tip_qwen(
@@ -454,11 +368,9 @@ class UIHandler:
             total_bill_output = f"${subtotal:.2f}"
         finally:
             self.video_processor.cleanup_temp_files(temp_video_path, frame_folder)
         return analysis_output, tip_output, total_bill_output, custom_prompt_text, gr.update(value=None)
     def auto_tip_and_invoice(self, alibaba_key, video_file_obj, subtotal, star_rating, review, prompt, *quantities):
-        """AI 모델을 사용한 자동 팁 계산 및 청구서 업데이트 (알리바바 Qwen만 사용)"""
         analysis, tip_disp, total_bill_disp, prompt_out, vid_out = self.compute_tip(
             alibaba_key, video_file_obj, subtotal, star_rating, review, prompt
         )
@@ -466,72 +378,54 @@ class UIHandler:
         return analysis, tip_disp, total_bill_disp, prompt_out, vid_out, invoice
     def update_invoice_summary(self, *args):
-        """수량 및 팁에 따라 청구서 요약 업데이트"""
         num_items = len(self.config.FOOD_ITEMS)
         quantities = args[:num_items]
         if len(args) >= num_items + 2:
             tip_str = args[num_items]
             total_bill_str = args[num_items + 1]
         else:
             tip_str = "$0.00"
             total_bill_str = "$0.00"
         summary = ""
         for i, q in enumerate(quantities):
             try:
                 q_val = float(q)
             except:
                 q_val = 0
             if q_val > 0:
                 item = self.config.FOOD_ITEMS[i]
                 total_price = item['price'] * q_val
                 summary += f"{item['name']} x{int(q_val)} : ${total_price:.2f}\n"
         if summary == "":
             summary = "주문한 메뉴가 없습니다."
         summary += f"\nTip: {tip_str}\nTotal Bill: {total_bill_str}"
         return summary
     def manual_tip_and_invoice(self, tip_percent, subtotal, *quantities):
-        """수동 팁 계산 및 청구서 업데이트"""
         analysis, tip_disp, total_bill_disp = self.tip_calculator.calculate_manual_tip(tip_percent, subtotal)
         invoice = self.update_invoice_summary(*quantities, tip_disp, total_bill_disp)
         return analysis, tip_disp, total_bill_disp, invoice
     def process_payment(self, total_bill):
-        """총 청구액에 대한 결제 처리"""
         return f"{total_bill} 결제되었습니다."
-# -----------------------------------------------------------------------------
-# App: 모든 것을 연결하는 메인 애플리케이션 클래스
-# -----------------------------------------------------------------------------
 class App:
-    """메인 애플리케이션 클래스"""
     def __init__(self):
         self.config = Config()
         self.model_clients = ModelClients(self.config)
         self.video_processor = VideoProcessor()
         self.tip_calculator = TipCalculator(self.config, self.model_clients, self.video_processor)
         self.ui_handler = UIHandler(self.config, self.tip_calculator, self.video_processor)
-        # Flask 앱 (필요 시 사용)
         self.flask_app = Flask(__name__)
     def create_gradio_blocks(self):
-        """Gradio Blocks 인터페이스 구성"""
         with gr.Blocks(title="Video Tip Calculation Interface", theme=gr.themes.Soft(),
                        css=self.config.CUSTOM_CSS) as interface:
             gr.Markdown("## Video Tip Calculation Interface (Structured)")
             quantity_inputs = []
             subtotal_display = gr.Number(label="Subtotal ($)", value=0.0, interactive=False, visible=False)
             with gr.Row():
                 with gr.Column(scale=2):
                     gr.Markdown("### 1. Select Food Items")
@@ -556,13 +450,10 @@ class App:
                                     elem_id=f"qty_{item['name'].replace(' ', '_')}"
                                 )
                                 quantity_inputs.append(q_input)
                     subtotal_visible_display = gr.Textbox(label="Subtotal", value="$0.00", interactive=False)
                     gr.Markdown("### 2. Service Feedback")
                     review_input = gr.Textbox(label="Review", placeholder="서비스 리뷰를 작성해주세요.", lines=3)
                     rating_input = gr.Radio(choices=[1, 2, 3, 4, 5], value=3, label="⭐Star Rating (1-5)⭐", type="value")
                     gr.Markdown("### 3. Calculate Tip")
                     with gr.Row():
                         btn_5 = gr.Button("5%")
@@ -570,21 +461,15 @@ class App:
                         btn_15 = gr.Button("15%")
                         btn_20 = gr.Button("20%")
                         btn_25 = gr.Button("25%")
-                    # Qwen 모델 버튼만 남김
                     with gr.Row():
                         qwen_btn = gr.Button("Alibaba-Qwen", variant="tertiary", elem_id="qwen-button")
                     gr.Markdown("### 4. Results")
                     tip_display = gr.Textbox(label="Calculated Tip", value="$0.00", interactive=False)
-                    total_bill_display = gr.Textbox(label="Total Bill (Subtotal + Tip)", value="$0.00",
-                                                    interactive=False)
                     payment_btn = gr.Button("결제하기")
                     payment_result = gr.Textbox(label="Payment Result", value="", interactive=False)
                 with gr.Column(scale=1):
                     gr.Markdown("### 5. Upload & Prompt")
-                    # 알리바바 API 키 입력 필드 추가
                     alibaba_key_input = gr.Textbox(label="Alibaba API Key", placeholder="Enter your Alibaba API Key", lines=1)
                     video_input = gr.Video(label="Upload Service Video")
                     prompt_display = gr.Textbox(
@@ -598,21 +483,15 @@ class App:
                             user_review="(No user review provided)"
                         ).replace("{caption_text}", "{{caption_text}}")
                     )
                     gr.Markdown("### 6. AI Analysis")
                     analysis_display = gr.Textbox(label="AI Analysis", lines=10, max_lines=15, interactive=True)
                     gr.Markdown("### 7. 청구서")
                     order_summary_display = gr.Textbox(label="청구서", value="주문한 메뉴가 없습니다.", interactive=True)
-            # Subtotal 값 업데이트 시 $ 표시 갱신
             subtotal_display.change(
                 fn=lambda x: f"${x:.2f}",
                 inputs=[subtotal_display],
                 outputs=[subtotal_visible_display]
             )
-            # 음식 수량, 별점, 리뷰가 바뀔 때마다 Subtotal, Prompt 업데이트
             inputs_for_prompt_update = quantity_inputs + [rating_input, review_input]
             outputs_for_prompt_update = [subtotal_display, prompt_display]
             for comp in inputs_for_prompt_update:
@@ -621,21 +500,16 @@ class App:
                     inputs=inputs_for_prompt_update,
                     outputs=outputs_for_prompt_update
                 )
-            # 수량 변화 시 청구서 텍스트 업데이트
             for comp in quantity_inputs:
                 comp.change(
                     fn=self.ui_handler.update_invoice_summary,
                     inputs=quantity_inputs,
                     outputs=order_summary_display
                 )
-            # 모델 호출 후 결과 업데이트 (알리바바 API 키 포함)
             compute_inputs = [alibaba_key_input, video_input, subtotal_display, rating_input, review_input, prompt_display] + quantity_inputs
             compute_outputs = [
                 analysis_display, tip_display, total_bill_display, prompt_display, video_input, order_summary_display
             ]
             qwen_btn.click(
                 fn=lambda alibaba_key, vid, sub, rat, rev, prom, *qty: self.ui_handler.auto_tip_and_invoice(
                     alibaba_key, vid, sub, rat, rev, prom, *qty
@@ -643,8 +517,6 @@ class App:
                 inputs=compute_inputs,
                 outputs=compute_outputs
             )
-            # 수동 팁 계산 버튼들
             btn_5.click(
                 fn=lambda sub, *qty: self.ui_handler.manual_tip_and_invoice(5, sub, *qty),
                 inputs=[subtotal_display] + quantity_inputs,
@@ -670,35 +542,24 @@ class App:
                 inputs=[subtotal_display] + quantity_inputs,
                 outputs=[analysis_display, tip_display, total_bill_display, order_summary_display]
             )
-            # 결제 버튼
             payment_btn.click(
                 fn=self.ui_handler.process_payment,
                 inputs=[total_bill_display],
                 outputs=[payment_result]
             )
             return interface
     def run_gradio(self):
-        """Gradio 서버 실행"""
         interface = self.create_gradio_blocks()
         interface.launch(share=True)
     def run_flask(self):
-        """Flask 서버 실행 (원한다면)"""
         @self.flask_app.route("/")
         def index():
             return "Hello Flask"
         self.flask_app.run(host="0.0.0.0", port=5000, debug=True)
 if __name__ == "__main__":
     app = App()
-    # Gradio UI 실행
     app.run_gradio()
-    # Flask 서버 실행 (원하면 아래 주석 해제)
-    # app.run_flask()

 import cv2
 import base64
 import uuid
+import re
 from flask import Flask
 import gradio as gr
+# --- Config 클래스 (Gemma, GPT4o 제거, Qwen만 사용) ---
 class Config:
     """애플리케이션 설정 및 상수"""
     FOOD_ITEMS = [
         {"name": "짜장면", "image": "images/food1.jpg", "price": 7.00},
         {"name": "짬뽕", "image": "images/food2.jpg", "price": 8.50},
         {"name": "콜라", "image": "images/food6.jpg", "price": 12.00},
         {"name": "사이다", "image": "images/food6.jpg", "price": 12.00},
     ]
     # 알리바바 Qwen API 키 (기본값은 빈 문자열)
     QWEN_API_KEY = ""
     DEFAULT_PROMPT_TEMPLATE = (
         "### Persona ###\n"
         "You are an expert tip calculation assistant focusing on service quality observed in a video.\n\n"
         "Total Bill: $[Subtotal + Tip]"
     )
     CUSTOM_CSS = """
     #food-container {
         display: grid;
         overflow-y: auto;
         height: 600px;
     }
     #qwen-button {
         background-color: #8A2BE2 !important;
         color: white !important;
         border-color: #8A2BE2 !important;
     }
     #qwen-button:hover {
         background-color: #7722CC !important;
     }
     """
     def __init__(self):
         if not os.path.exists("images"):
             print("경고: 'images' 폴더를 찾을 수 없습니다. 음식 이미지가 표시되지 않을 수 있습니다.")
         for item in self.FOOD_ITEMS:
                 print(f"경고: 이미지 파일을 찾을 수 없습니다 - {item['image']}")
+# --- ModelClients (알리바바 Qwen API만 사용) ---
 class ModelClients:
     def __init__(self, config: Config):
         self.config = config
         from openai import OpenAI as QwenOpenAI
         )
     def encode_video_qwen(self, video_path):
         """Return the contents of the file at ``video_path`` as a base64 string.

         The file is opened in binary mode and read in full; the base64
         bytes are then decoded as UTF-8 so the caller receives a ``str``.
         """
         with open(video_path, "rb") as stream:
             raw_bytes = stream.read()
         encoded = base64.b64encode(raw_bytes)
         return encoded.decode("utf-8")
+# --- VideoProcessor: 비디오 프레임 추출 ---
 class VideoProcessor:
     def extract_video_frames(self, video_path, output_folder=None, fps=1):
         if not video_path:
             return [], None
         if output_folder is None:
             output_folder = f"frames_list/frames_{uuid.uuid4().hex}"
         os.makedirs(output_folder, exist_ok=True)
         cap = cv2.VideoCapture(video_path)
         if not cap.isOpened():
             print(f"오류: 비디오 파일을 열 수 없습니다 - {video_path}")
             return [], None
         frame_paths = []
         frame_rate = cap.get(cv2.CAP_PROP_FPS)
         if not frame_rate or frame_rate == 0:
             print("경고: FPS를 읽을 수 없습니다, 기본값 4으로 설정합니다.")
             frame_rate = 4.0
         frame_interval = int(frame_rate / fps) if fps > 0 else 1
         if frame_interval <= 0:
             frame_interval = 1
         frame_count = 0
         saved_frame_count = 0
         while cap.isOpened():
             ret, frame = cap.read()
             if not ret:
                 break
             if frame is None:
                 print(f"경고: {frame_count}번째 프레임이 비어있습니다.")
                 frame_count += 1
                 continue
             if frame_count % frame_interval == 0:
                 frame_path = os.path.join(output_folder, f"frame_{saved_frame_count}.jpg")
                 try:
                         print(f"경고: {frame_path} 저장 실패.")
                 except Exception as e:
                     print(f"경고: 프레임 저장 오류 ({frame_path}): {e}")
             frame_count += 1
         cap.release()
         if not frame_paths:
             print("경고: 프레임 추출 실패.")
             if os.path.exists(output_folder):
                 shutil.rmtree(output_folder)
             return [], None
         return frame_paths, output_folder
     def cleanup_temp_files(self, video_path, frame_folder):
         if video_path and "temp_video_" in video_path and os.path.exists(video_path):
             try:
                 os.remove(video_path)
                 print(f"임시 비디오 파일 삭제: {video_path}")
             except OSError as e:
                 print(f"임시 비디오 파일 삭제 오류: {e}")
         if frame_folder and os.path.exists(frame_folder):
             try:
                 shutil.rmtree(frame_folder)
                 print(f"프레임 폴더 삭제 오류: {e}")
+# --- TipCalculator (알리바바 Qwen API를 사용한 팁 계산) ---
 class TipCalculator:
     def __init__(self, config: Config, model_clients: ModelClients, video_processor: VideoProcessor):
         """Store the collaborators this calculator works with.

         Args:
             config: Application configuration object.
             model_clients: Holder of the model API client(s).
             video_processor: Helper used for video/frame handling.
         """
         # The three assignments are independent; each argument is kept
         # as-is on the instance under the same name.
         self.video_processor = video_processor
         self.model_clients = model_clients
         self.config = config
     def parse_llm_output(self, output_text):
         analysis = "Analysis not found."
         tip_percentage = 0.0
         tip_amount = 0.0
         total_bill = 0.0
         analysis_match = re.search(r"Analysis:\s*(.*?)Tip Percentage:", output_text, re.DOTALL | re.IGNORECASE)
         if analysis_match:
             analysis = analysis_match.group(1).strip()
             analysis_match_alt = re.search(r"Analysis:\s*(.*)", output_text, re.DOTALL | re.IGNORECASE)
             if analysis_match_alt:
                 analysis = analysis_match_alt.group(1).strip()
         percentage_match = re.search(r"Tip Percentage:\s*\*{0,2}(\d+(?:\.\d+)?)%\*{0,2}", output_text,
                                      re.DOTALL | re.IGNORECASE)
         if percentage_match:
             except ValueError:
                 print(f"경고: Tip Percentage 변환 실패 - {percentage_match.group(1)}")
                 tip_percentage = 0.0
         tip_match = re.search(r"Tip Amount:\s*\$?\s*([0-9.]+)", output_text, re.IGNORECASE)
         if tip_match:
             try:
                 tip_amount = 0.0
         else:
             print(f"경고: 출력에서 Tip Amount를 찾을 수 없습니다:\n{output_text}")
         total_match = re.search(r"Total Bill:\s*\$?\s*([0-9.]+)", output_text, re.IGNORECASE)
         if total_match:
             try:
                 total_bill = float(total_match.group(1))
             except ValueError:
                 print(f"경고: Total Bill 변환 실패 - {total_match.group(1)}")
         if len(analysis) < 20 and analysis == "Analysis not found.":
             analysis = output_text
         return analysis, tip_percentage, tip_amount, output_text
     def process_tip_qwen(self, video_file_path, star_rating, user_review, calculated_subtotal, custom_prompt=None):
         if not os.path.exists(video_file_path):
             return "Error: 비디오 파일 경로가 유효하지 않습니다.", 0.0, 0.0, [], None, ""
         base64_video = self.model_clients.encode_video_qwen(video_file_path)
         omni_caption_prompt = '''
 Task 1: Describe the waiters' actions in these restaurant video frames. Please check for mistakes or negative behaviors.
 Task 2: Provide a short chronological summary of the entire scene.
 '''
         omni_result = self.model_clients.qwen_client.chat.completions.create(
             model="qwen2.5-omni-7b",
             messages=[
                 {
                     "role": "user",
                     "content": [
+                        {"type": "video_url", "video_url": {"url": f"data:;base64,{base64_video}"}},
                         {"type": "text", "text": omni_caption_prompt},
                     ],
                 },
             stream=True,
             stream_options={"include_usage": True},
         )
         all_omni_chunks = list(omni_result)
         caption_text = ""
         for chunk in all_omni_chunks[:-1]:
                 caption_text += chunk.choices[0].delta.content
         if not caption_text.strip():
             caption_text = "(No caption from Omni)"
         user_review = user_review.strip() if user_review else "(No user review)"
         if custom_prompt is None:
             prompt = self.config.DEFAULT_PROMPT_TEMPLATE.format(
                     star_rating=star_rating,
                     user_review=user_review
                 )
         final_prompt = prompt.replace("{caption_text}", caption_text)
         qvq_result = self.model_clients.qwen_client.chat.completions.create(
             model="qwen2.5-vl-32b-instruct",
             messages=[
+                {"role": "system", "content": [{"type": "text", "text": "You are a helpful assistant."}]},
+                {"role": "user", "content": [{"type": "text", "text": final_prompt}]},
             ],
             modalities=["text"],
             stream=True,
                     print("\n" + "=" * 20 + "Complete Response" + "=" * 20 + "\n")
                     is_answering = True
                 final_answer += d.content
         final_text = final_reasoning + "\n" + final_answer
         analysis, tip_percentage, tip_amount, output_text = self.parse_llm_output(final_text)
         return analysis, tip_percentage, tip_amount, [], None, output_text
     def calculate_manual_tip(self, tip_percent, subtotal):
         tip_amount = subtotal * (tip_percent / 100)
         total_bill = subtotal + tip_amount
         analysis_output = f"Manual calculation using fixed tip percentage of {tip_percent}%."
         return analysis_output, tip_output, total_bill_output
+# --- UIHandler: Gradio 인터페이스 이벤트 처리 (알리바바 API 키 입력 포함) ---
 class UIHandler:
     def __init__(self, config: Config, tip_calculator: TipCalculator, video_processor: VideoProcessor):
         """Store the collaborators the UI callbacks rely on.

         Args:
             config: Application configuration object.
             tip_calculator: Object that performs the tip computations.
             video_processor: Helper used for video/frame handling.
         """
         # The three assignments are independent; each argument is kept
         # as-is on the instance under the same name.
         self.video_processor = video_processor
         self.tip_calculator = tip_calculator
         self.config = config
     def update_subtotal_and_prompt(self, *args):
         """Recompute the order subtotal and rebuild the prompt text.

         Args:
             *args: One quantity per entry of ``self.config.FOOD_ITEMS`` (in
                 the same order), followed by the star rating and then the
                 user review text.

         Returns:
             A ``(calculated_subtotal, updated_prompt)`` tuple. The subtotal
             is the sum of ``price * quantity`` over the menu items; the
             prompt is ``DEFAULT_PROMPT_TEMPLATE`` formatted with the
             subtotal, rating and review, with the caption placeholder left
             in place as ``{{caption_text}}``.
         """
         food_items = self.config.FOOD_ITEMS
         num_food_items = len(food_items)
         quantities = args[:num_food_items]
         star_rating = args[num_food_items]
         user_review = args[num_food_items + 1]

         calculated_subtotal = 0.0
         for item, quantity in zip(food_items, quantities):
             # A quantity can arrive as None (presumably from a cleared
             # numeric input -- verify against the UI wiring); count it as
             # zero instead of raising TypeError on the multiplication.
             calculated_subtotal += item['price'] * (quantity or 0)

         # A missing or whitespace-only review is replaced by a fixed notice.
         stripped_review = user_review.strip() if user_review else ""
         user_review_text = stripped_review or "(No user review provided)"

         updated_prompt = self.config.DEFAULT_PROMPT_TEMPLATE.format(
             calculated_subtotal=calculated_subtotal,
             star_rating=star_rating,
             user_review=user_review_text
         )
         # Re-escape the caption placeholder so the returned text can be
         # filled in later.
         updated_prompt = updated_prompt.replace("{caption_text}", "{{caption_text}}")
         return calculated_subtotal, updated_prompt
     def compute_tip(self, alibaba_key, video_file_obj, subtotal, star_rating, user_review, custom_prompt_text):
         """Run the Qwen-based tip calculation for an uploaded service video.

         Args:
             alibaba_key: API key typed into the UI; when non-blank, a new
                 OpenAI-compatible client is created and stored on
                 ``tip_calculator.model_clients.qwen_client``.
             video_file_obj: Uploaded video; ``None`` yields an error result.
             subtotal: Bill amount before tip, used for the "$x.xx" total string.
             star_rating: Star rating selected in the UI.
             user_review: Review text entered in the UI.
             custom_prompt_text: Prompt text from the UI; returned unchanged as
                 the fourth element of every result.

         Returns:
             A 5-tuple ``(analysis_output, tip_output, total_bill_output,
             custom_prompt_text, video_update)``. The last element is
             ``gr.update(value=None)``, except on the temp-file error path,
             which returns a plain ``None``.
         """
         # Defaults shown if nothing below overrides them
         # (the message means "Starting calculation...").
         analysis_output = "계산을 시작합니다..."
         tip_percentage = 0.0
         tip_output = "$0.00"
         total_bill_output = f"${subtotal:.2f}"
         # Without a video there is nothing to analyse: report the error and
         # show the subtotal as the total.
         if video_file_obj is None:
             return "오류: 비디오 파일을 업로드해주세요.", "$0.00", total_bill_output, custom_prompt_text, gr.update(value=None)
         try:
             if alibaba_key and alibaba_key.strip():
                 # Imported lazily, only when a key was actually supplied.
                 from openai import OpenAI as QwenOpenAI
                 self.tip_calculator.model_clients.qwen_client = QwenOpenAI(
         except Exception as e:
             # Any failure in this setup step is logged and reported to the UI.
             print(f"임시 비디오 파일 생성 오류: {e}")
             return f"오류: 비디오 파일을 처리할 수 없습니다: {e}", "$0.00", total_bill_output, custom_prompt_text, None
         frame_folder = None
         try:
             analysis, tip_percentage, tip_amount, _, _, output_text = self.tip_calculator.process_tip_qwen(
             total_bill_output = f"${subtotal:.2f}"
         finally:
             # Always remove the temporary video (and frame folder, if any).
             self.video_processor.cleanup_temp_files(temp_video_path, frame_folder)
         return analysis_output, tip_output, total_bill_output, custom_prompt_text, gr.update(value=None)
     def auto_tip_and_invoice(self, alibaba_key, video_file_obj, subtotal, star_rating, review, prompt, *quantities):
         """Compute the AI-based tip and build the matching invoice text.

         Args:
             alibaba_key: API key forwarded to ``compute_tip``.
             video_file_obj: Uploaded service video forwarded to ``compute_tip``.
             subtotal: Bill amount before tip.
             star_rating: Star rating selected in the UI.
             review: Review text entered in the UI.
             prompt: Prompt text forwarded to ``compute_tip``.
             *quantities: One ordered quantity per menu item.

         Returns:
             The five values returned by ``compute_tip`` followed by the invoice
             summary string.
         """
         analysis, tip_disp, total_bill_disp, prompt_out, vid_out = self.compute_tip(
             alibaba_key, video_file_obj, subtotal, star_rating, review, prompt
         )
         # Build the invoice from the quantities plus the freshly computed tip
         # and total, the same way manual_tip_and_invoice does.
         invoice = self.update_invoice_summary(*quantities, tip_disp, total_bill_disp)
         return analysis, tip_disp, total_bill_disp, prompt_out, vid_out, invoice
     def update_invoice_summary(self, *args):
         """Render the invoice text for the current order.

         Args:
             *args: One quantity per entry of ``config.FOOD_ITEMS`` (in menu
                 order), optionally followed by the tip string and the total
                 bill string. When those two are absent, both default to
                 ``"$0.00"``.

         Returns:
             A multi-line string with one ``"<name> x<qty> : $<price>"`` line per
             item ordered (quantity > 0), or a "no items ordered" message,
             followed by the tip and total bill lines.
         """
         menu = self.config.FOOD_ITEMS
         num_items = len(menu)
         quantities = args[:num_items]
         if len(args) >= num_items + 2:
             tip_str = args[num_items]
             total_bill_str = args[num_items + 1]
         else:
             tip_str = "$0.00"
             total_bill_str = "$0.00"

         item_lines = []
         for item, raw_quantity in zip(menu, quantities):
             # Empty or non-numeric fields count as "not ordered". Only the
             # conversion errors are caught, so unrelated failures still surface.
             try:
                 q_val = float(raw_quantity)
             except (TypeError, ValueError):
                 q_val = 0.0
             if q_val > 0:
                 total_price = item['price'] * q_val
                 item_lines.append(f"{item['name']} x{int(q_val)} : ${total_price:.2f}\n")

         # The fallback message means "No menu items have been ordered."
         summary = "".join(item_lines) or "주문한 메뉴가 없습니다."
         return f"{summary}\nTip: {tip_str}\nTotal Bill: {total_bill_str}"
     def manual_tip_and_invoice(self, tip_percent, subtotal, *quantities):
         """Apply a fixed tip percentage and rebuild the invoice text.

         Returns the analysis text, tip string and total bill string from
         ``tip_calculator.calculate_manual_tip`` followed by the invoice summary.
         """
         manual_result = self.tip_calculator.calculate_manual_tip(tip_percent, subtotal)
         analysis_text, tip_text, total_text = manual_result
         summary_args = (*quantities, tip_text, total_text)
         invoice_text = self.update_invoice_summary(*summary_args)
         return analysis_text, tip_text, total_text, invoice_text
     def process_payment(self, total_bill):
         """Return the payment confirmation message for ``total_bill``."""
         # The suffix means "has been paid."
         confirmation = "{} 결제되었습니다.".format(total_bill)
         return confirmation
+# --- App: 모든 컴포넌트 연결 및 Gradio 인터페이스 실행 ---
 class App:
     def __init__(self):
         """Create the config, model clients, processors, UI handler and Flask app."""
         config = Config()
         clients = ModelClients(config)
         processor = VideoProcessor()
         calculator = TipCalculator(config, clients, processor)
         handler = UIHandler(config, calculator, processor)

         self.config = config
         self.model_clients = clients
         self.video_processor = processor
         self.tip_calculator = calculator
         self.ui_handler = handler
         self.flask_app = Flask(__name__)
     def create_gradio_blocks(self):
         """Lay out the Gradio components, wire their events and return the Blocks.

         Returns:
             The ``gr.Blocks`` interface created by this method.
         """
         with gr.Blocks(title="Video Tip Calculation Interface", theme=gr.themes.Soft(),
                        css=self.config.CUSTOM_CSS) as interface:
             gr.Markdown("## Video Tip Calculation Interface (Structured)")
             quantity_inputs = []
             subtotal_display = gr.Number(label="Subtotal ($)", value=0.0, interactive=False, visible=False)
             with gr.Row():
                 with gr.Column(scale=2):
                     gr.Markdown("### 1. Select Food Items")
                                     elem_id=f"qty_{item['name'].replace(' ', '_')}"
                                 )
                                 quantity_inputs.append(q_input)
                     subtotal_visible_display = gr.Textbox(label="Subtotal", value="$0.00", interactive=False)
                     gr.Markdown("### 2. Service Feedback")
                     review_input = gr.Textbox(label="Review", placeholder="서비스 리뷰를 작성해주세요.", lines=3)
                     rating_input = gr.Radio(choices=[1, 2, 3, 4, 5], value=3, label="⭐Star Rating (1-5)⭐", type="value")
                     gr.Markdown("### 3. Calculate Tip")
                     with gr.Row():
                         btn_5 = gr.Button("5%")
                         btn_15 = gr.Button("15%")
                         btn_20 = gr.Button("20%")
                         btn_25 = gr.Button("25%")
                     with gr.Row():
                         qwen_btn = gr.Button("Alibaba-Qwen", variant="tertiary", elem_id="qwen-button")
                     gr.Markdown("### 4. Results")
                     tip_display = gr.Textbox(label="Calculated Tip", value="$0.00", interactive=False)
+                    total_bill_display = gr.Textbox(label="Total Bill (Subtotal + Tip)", value="$0.00", interactive=False)
                     payment_btn = gr.Button("결제하기")
                     payment_result = gr.Textbox(label="Payment Result", value="", interactive=False)
                 with gr.Column(scale=1):
                     gr.Markdown("### 5. Upload & Prompt")
                     alibaba_key_input = gr.Textbox(label="Alibaba API Key", placeholder="Enter your Alibaba API Key", lines=1)
                     video_input = gr.Video(label="Upload Service Video")
                     prompt_display = gr.Textbox(
                             user_review="(No user review provided)"
                         ).replace("{caption_text}", "{{caption_text}}")
                     )
                     gr.Markdown("### 6. AI Analysis")
                     analysis_display = gr.Textbox(label="AI Analysis", lines=10, max_lines=15, interactive=True)
                     gr.Markdown("### 7. 청구서")
                     order_summary_display = gr.Textbox(label="청구서", value="주문한 메뉴가 없습니다.", interactive=True)
             # Mirror the hidden numeric subtotal into the visible textbox as "$x.xx".
             subtotal_display.change(
                 fn=lambda x: f"${x:.2f}",
                 inputs=[subtotal_display],
                 outputs=[subtotal_visible_display]
             )
             # Quantities first, then rating and review: the positional order
             # update_subtotal_and_prompt unpacks from *args.
             inputs_for_prompt_update = quantity_inputs + [rating_input, review_input]
             outputs_for_prompt_update = [subtotal_display, prompt_display]
             for comp in inputs_for_prompt_update:
                     inputs=inputs_for_prompt_update,
                     outputs=outputs_for_prompt_update
                 )
             # Any quantity change refreshes the invoice text. Only quantities are
             # passed, so update_invoice_summary falls back to "$0.00" for tip and total.
             for comp in quantity_inputs:
                 comp.change(
                     fn=self.ui_handler.update_invoice_summary,
                     inputs=quantity_inputs,
                     outputs=order_summary_display
                 )
             # Input order follows auto_tip_and_invoice's parameters: key, video,
             # subtotal, rating, review, prompt, then the quantities.
             compute_inputs = [alibaba_key_input, video_input, subtotal_display, rating_input, review_input, prompt_display] + quantity_inputs
             compute_outputs = [
                 analysis_display, tip_display, total_bill_display, prompt_display, video_input, order_summary_display
             ]
             qwen_btn.click(
                 fn=lambda alibaba_key, vid, sub, rat, rev, prom, *qty: self.ui_handler.auto_tip_and_invoice(
                     alibaba_key, vid, sub, rat, rev, prom, *qty
                 inputs=compute_inputs,
                 outputs=compute_outputs
             )
             # Fixed-percentage button: 5% manual tip plus refreshed invoice.
             btn_5.click(
                 fn=lambda sub, *qty: self.ui_handler.manual_tip_and_invoice(5, sub, *qty),
                 inputs=[subtotal_display] + quantity_inputs,
                 inputs=[subtotal_display] + quantity_inputs,
                 outputs=[analysis_display, tip_display, total_bill_display, order_summary_display]
             )
             # The payment button passes the displayed total bill text to process_payment.
             payment_btn.click(
                 fn=self.ui_handler.process_payment,
                 inputs=[total_bill_display],
                 outputs=[payment_result]
             )
             return interface
     def run_gradio(self):
         """Build the Gradio interface and launch it with a public share link."""
         self.create_gradio_blocks().launch(share=True)
     def run_flask(self, host="0.0.0.0", port=5000, debug=False):
         """Register the index route and start Flask's built-in server.

         Args:
             host: Interface to bind to; defaults to all interfaces.
             port: TCP port to listen on.
             debug: Enable Flask debug mode. Off by default because the
                 interactive debugger allows arbitrary code execution and must
                 not be reachable from the network; pass ``True`` only for
                 local development.
         """
         @self.flask_app.route("/")
         def index():
             return "Hello Flask"

         self.flask_app.run(host=host, port=port, debug=debug)
 if __name__ == "__main__":
     # Script entry point: build the application and start the Gradio UI only.
     app = App()
     App.run_gradio(app)

requirements.txt ADDED Viewed

	@@ -0,0 +1,4 @@

+gradio
+opencv-python
+flask
+openai

space.yaml ADDED Viewed

	@@ -0,0 +1,4 @@

+runtime: python
+python_version: "3.10"
+hardware:
+  gpu: false