Spaces:

Hieucyber2208
/

know-flow

Running

App Files Community

hieu-nguyen2208 committed on Mar 3

Commit

091b090

1 Parent(s): c9a39eb

"LOL"

Browse files

Files changed (3) hide show

app.py +2 -1
main.py +2 -2
src/text_processing.py +5 -5

app.py CHANGED Viewed

@@ -47,6 +47,7 @@ if uploaded_file:
     with open(file_path, "wb") as f:
         f.write(uploaded_file.getbuffer())  # Lưu file thực tế
 number_of_images = st.slider("🖼️ Nhập số ảnh",1,10,3)
 # Cấu hình đầu vào
 gender = st.radio("🗣️ Select Voice Gender", options=["female", "male"])
@@ -98,7 +99,7 @@ def convert_audio_format(video_input, video_output):
 if st.button("🚀 Generate Video"):
     if file_path and os.path.exists(file_path):
         st.success("⏳ Processing started...")
-        main(file_path, analysis_level, writting_style, word_lower_limit, word_upper_limit, gender, speed, number_of_images, detail_level, perspective, emotion, time_setting, art_style, style, color_palette)
         # Kiểm tra xem video đã được tạo chưa
         if os.path.exists(OUTPUT_VIDEO_PATH):

     with open(file_path, "wb") as f:
         f.write(uploaded_file.getbuffer())  # Lưu file thực tế
 number_of_images = st.slider("🖼️ Nhập số ảnh",1,10,3)
+chunks = st.slider("📄 Number of chunks", min_value=1, max_value=10, value=3)
 # Cấu hình đầu vào
 gender = st.radio("🗣️ Select Voice Gender", options=["female", "male"])
 if st.button("🚀 Generate Video"):
     if file_path and os.path.exists(file_path):
         st.success("⏳ Processing started...")
+        main(file_path, chunks, analysis_level, writting_style, word_lower_limit, word_upper_limit, gender, speed, number_of_images, detail_level, perspective, emotion, time_setting, art_style, style, color_palette)
         # Kiểm tra xem video đã được tạo chưa
         if os.path.exists(OUTPUT_VIDEO_PATH):

main.py CHANGED Viewed

@@ -5,7 +5,7 @@ from src.text_to_video import text_to_video
 import os
 import glob
-def main(file_path, analysis_level='basic', writting_style='academic', word_lower_limit=100, word_upper_limit = 150, gender = "female", speed = "fast", number_of_images = 3, detail_level="short", perspective="neutral", emotion="sad", time_setting="classic", art_style="realistic", style="anime", color_palette="monochrome"):
     # Lấy danh sách tất cả các tệp .txt và .mp3 trong thư mục hiện tại
     files_to_delete = glob.glob("*.txt") + glob.glob("*.mp3") + glob.glob("*.png")
@@ -14,7 +14,7 @@ def main(file_path, analysis_level='basic', writting_style='academic', word_lowe
         if file != "requirements.txt":
             os.remove(file)
             print(f"Deleted: {file}")
-    text_processing(file_path = file_path, analysis_level=analysis_level, writting_style=writting_style, word_lower_limit = word_lower_limit, word_upper_limit=word_upper_limit )
     text_to_speech(gender = gender, speed = speed)
     image_gen(number_of_images = number_of_images, detail_level=detail_level, perspective=perspective, emotion=emotion, time_setting=time_setting, art_style=art_style, style=style, color_palette=color_palette)
     text_to_video()

 import os
 import glob
+def main(file_path, chunks = 3, analysis_level='basic', writting_style='academic', word_lower_limit=100, word_upper_limit = 150, gender = "female", speed = "fast", number_of_images = 3, detail_level="short", perspective="neutral", emotion="sad", time_setting="classic", art_style="realistic", style="anime", color_palette="monochrome"):
     # Lấy danh sách tất cả các tệp .txt và .mp3 trong thư mục hiện tại
     files_to_delete = glob.glob("*.txt") + glob.glob("*.mp3") + glob.glob("*.png")
         if file != "requirements.txt":
             os.remove(file)
             print(f"Deleted: {file}")
+    text_processing(file_path = file_path, chunks = chunks, analysis_level=analysis_level, writting_style=writting_style, word_lower_limit = word_lower_limit, word_upper_limit=word_upper_limit )
     text_to_speech(gender = gender, speed = speed)
     image_gen(number_of_images = number_of_images, detail_level=detail_level, perspective=perspective, emotion=emotion, time_setting=time_setting, art_style=art_style, style=style, color_palette=color_palette)
     text_to_video()

src/text_processing.py CHANGED Viewed

@@ -40,9 +40,9 @@ def extract_text_from_file(file_path):
     else:
         raise ValueError("Unsupported file format. Only PDF and DOCX are supported.")
 ####################### - SEMANTIC CHUNKING - #######################
-def split_text_by_semantics(text, client):
     prompt = f"""
-    Bạn là một chuyên gia xử lý văn bản. Hãy chia văn bản sau thành một số đoạn có ý nghĩa sao cho mỗi đoạn vừa đủ để giải thích trong khoảng 3 đến 5 câu.
     Văn bản:
     {text}
@@ -68,7 +68,7 @@ def split_text_by_semantics(text, client):
         return []
 ####################### - CONTENT GENERATION - #######################
-def generate_explaination_for_chunks(chunks, client, analysis_level='basic', writting_style='academic', word_lower_limit=100, word_upper_limit=150):
     """
     Phân tích nội dung của văn bản theo mức độ và phong cách mong muốn.
@@ -127,14 +127,14 @@ def generate_explaination_for_chunks(chunks, client, analysis_level='basic', wri
     except Exception as e:
         print(f"Lỗi khi gọi API Gemini: {e}")
         return []
-def text_processing(file_path, analysis_level='basic', writting_style='academic', word_lower_limit = 100, word_upper_limit = 150):
     client = set_up_api()
     # Trích xuất văn bản từ file PDF
     text = extract_text_from_file(file_path=file_path)
     with open("./text.txt", "w", encoding="utf-8") as f:
         f.write(text)
     # Tách văn bản theo ngữ nghĩa
-    semantic_chunks = split_text_by_semantics(text, client)
     # Tạo thuyết minh cho từng phần semantic chunk
     explanations = generate_explaination_for_chunks(semantic_chunks, client, analysis_level=analysis_level, writting_style = writting_style, word_lower_limit = word_lower_limit, word_upper_limit=word_upper_limit)

     else:
         raise ValueError("Unsupported file format. Only PDF and DOCX are supported.")
 ####################### - SEMANTIC CHUNKING - #######################
+def split_text_by_semantics(text, chunks, client):
     prompt = f"""
+    Bạn là một chuyên gia xử lý văn bản. Hãy chia văn bản sau thành {chunks} số đoạn có ý nghĩa sao cho mỗi đoạn vừa đủ để giải thích trong khoảng 3 đến 5 câu.
     Văn bản:
     {text}
         return []
 ####################### - CONTENT GENERATION - #######################
+def generate_explaination_for_chunks(chunks, client, analysis_level='basic', writting_style='academic', word_lower_limit=50, word_upper_limit=100):
     """
     Phân tích nội dung của văn bản theo mức độ và phong cách mong muốn.
     except Exception as e:
         print(f"Lỗi khi gọi API Gemini: {e}")
         return []
+def text_processing(file_path, chunks = 3, analysis_level='basic', writting_style='academic', word_lower_limit = 100, word_upper_limit = 150):
     client = set_up_api()
     # Trích xuất văn bản từ file PDF
     text = extract_text_from_file(file_path=file_path)
     with open("./text.txt", "w", encoding="utf-8") as f:
         f.write(text)
     # Tách văn bản theo ngữ nghĩa
+    semantic_chunks = split_text_by_semantics(text, chunks, client)
     # Tạo thuyết minh cho từng phần semantic chunk
     explanations = generate_explaination_for_chunks(semantic_chunks, client, analysis_level=analysis_level, writting_style = writting_style, word_lower_limit = word_lower_limit, word_upper_limit=word_upper_limit)