Spaces:

awacke1
/

PDF-Paper-Maker-AI-UI-UX

Running

App Files Files Community

awacke1 committed 28 days ago

Commit

7d76447

verified ·

1 Parent(s): 6786aba

Update app.py

Browse files

Files changed (1) hide show

app.py +50 -3

app.py CHANGED Viewed

@@ -20,13 +20,17 @@ import pytz
 st.set_page_config(layout="wide", initial_sidebar_state="collapsed")
 def get_timestamp_prefix():
     central = pytz.timezone("US/Central")
     now = datetime.now(central)
     # Format: three-letter day, MMDD, HHMM + AM/PM (all uppercase)
     return now.strftime("%a %m%d %I%M%p").upper()
 def clean_for_speech(text):
     # Remove hash marks
     text = text.replace("#", "")
     # Remove emojis using a regex pattern that covers a wide range
@@ -45,12 +49,20 @@ def clean_for_speech(text):
     text = emoji_pattern.sub('', text)
     return text
 async def generate_audio(text, voice, filename):
     communicate = edge_tts.Communicate(text, voice)
     await communicate.save(filename)
     return filename
 def apply_emoji_font(text, emoji_font):
     emoji_pattern = re.compile(
         r"([\U0001F300-\U0001F5FF"
         r"\U0001F600-\U0001F64F"
@@ -65,40 +77,69 @@ def apply_emoji_font(text, emoji_font):
         r"\u2600-\u26FF"
         r"\u2700-\u27BF]+)"
     )
     def replace_emoji(match):
         emoji = match.group(1)
         emoji = unicodedata.normalize('NFC', emoji)
         return f'<font face="{emoji_font}">{emoji}</font>'
     segments = []
     last_pos = 0
     for match in emoji_pattern.finditer(text):
         start, end = match.span()
         if last_pos < start:
             segments.append(f'<font face="DejaVuSans">{text[last_pos:start]}</font>')
         segments.append(replace_emoji(match))
         last_pos = end
     if last_pos < len(text):
         segments.append(f'<font face="DejaVuSans">{text[last_pos:]}</font>')
-    return ''.join(segments)
 def markdown_to_pdf_content(markdown_text, render_with_bold, auto_bold_numbers):
     lines = markdown_text.strip().split('\n')
     pdf_content = []
     number_pattern = re.compile(r'^\d+\.\s')
     for line in lines:
         line = line.strip()
         if not line or line.startswith('# '):
             continue
         if render_with_bold:
             line = re.sub(r'\*\*(.*?)\*\*', r'<b>\1</b>', line)
         if auto_bold_numbers and number_pattern.match(line):
             if not (line.startswith("<b>") and line.endswith("</b>")):
-                line = f"<b>{line}</b>"
         pdf_content.append(line)
     total_lines = len(pdf_content)
     return pdf_content, total_lines
 def create_pdf(markdown_text, base_font_size, render_with_bold, auto_bold_numbers, enlarge_numbered, num_columns):
     buffer = io.BytesIO()
     page_width = A4[0] * 2
     page_height = A4[1]
@@ -179,7 +220,9 @@ def create_pdf(markdown_text, base_font_size, render_with_bold, auto_bold_number
     buffer.seek(0)
     return buffer.getvalue()
 def pdf_to_image(pdf_bytes):
     try:
         doc = fitz.open(stream=pdf_bytes, filetype="pdf")
         images = []
@@ -197,6 +240,7 @@ def pdf_to_image(pdf_bytes):
 md_files = [f for f in glob.glob("*.md") if os.path.basename(f) != "README.md"]
 md_options = [os.path.splitext(os.path.basename(f))[0] for f in md_files]
 with st.sidebar:
     st.markdown("### PDF Options")
     if md_options:
@@ -256,9 +300,11 @@ with st.sidebar:
             mime="audio/mpeg"
         )
 with st.spinner("Generating PDF..."):
     pdf_bytes = create_pdf(st.session_state.markdown_content, base_font_size, render_with_bold, auto_bold_numbers, enlarge_numbered, num_columns)
 with st.container():
     pdf_images = pdf_to_image(pdf_bytes)
     if pdf_images:
@@ -267,10 +313,11 @@ with st.container():
     else:
         st.info("Download the PDF to view it locally.")
 with st.sidebar:
     st.download_button(
         label="💾📄 Save PDF",
         data=pdf_bytes,
         file_name=f"{prefix} {selected_md}.pdf" if selected_md else f"{prefix} output.pdf",
         mime="application/pdf"
-    )

 st.set_page_config(layout="wide", initial_sidebar_state="collapsed")
+# 🕒 Time flies when you're having function calls
 def get_timestamp_prefix():
+    """🕰️ Gets a timestamp that's more reliable than your coworker's ETA estimates"""
     central = pytz.timezone("US/Central")
     now = datetime.now(central)
     # Format: three-letter day, MMDD, HHMM + AM/PM (all uppercase)
     return now.strftime("%a %m%d %I%M%p").upper()
+# 🧹 Because text needs a bath before being spoken
 def clean_for_speech(text):
+    """🧼 Scrubs your text cleaner than your bathroom will ever be"""
     # Remove hash marks
     text = text.replace("#", "")
     # Remove emojis using a regex pattern that covers a wide range
     text = emoji_pattern.sub('', text)
     return text
+# 🎤 Making robots talk so you don't have to
 async def generate_audio(text, voice, filename):
+    """🔊 Turn text into speech, because reading is so last century"""
     communicate = edge_tts.Communicate(text, voice)
     await communicate.save(filename)
     return filename
+# 🎭 Making emojis wear the right font costume
 def apply_emoji_font(text, emoji_font):
+    """🦄 Because emojis deserve their own font fashion show"""
+    # First, handle any bold formatting to avoid tag nesting issues
+    text = re.sub(r'<b>(.*?)</b>', lambda m: f'###BOLD_START###{m.group(1)}###BOLD_END###', text)
+    # Apply emoji font replacement
     emoji_pattern = re.compile(
         r"([\U0001F300-\U0001F5FF"
         r"\U0001F600-\U0001F64F"
         r"\u2600-\u26FF"
         r"\u2700-\u27BF]+)"
     )
     def replace_emoji(match):
         emoji = match.group(1)
         emoji = unicodedata.normalize('NFC', emoji)
         return f'<font face="{emoji_font}">{emoji}</font>'
     segments = []
     last_pos = 0
     for match in emoji_pattern.finditer(text):
         start, end = match.span()
         if last_pos < start:
             segments.append(f'<font face="DejaVuSans">{text[last_pos:start]}</font>')
         segments.append(replace_emoji(match))
         last_pos = end
     if last_pos < len(text):
         segments.append(f'<font face="DejaVuSans">{text[last_pos:]}</font>')
+    combined_text = ''.join(segments)
+    # Restore bold tags
+    combined_text = combined_text.replace('###BOLD_START###', '</font><b><font face="DejaVuSans">')
+    combined_text = combined_text.replace('###BOLD_END###', '</font></b><font face="DejaVuSans">')
+    return combined_text
+# 📝 Converting markdown to PDF content, because PDFs never go out of style
 def markdown_to_pdf_content(markdown_text, render_with_bold, auto_bold_numbers):
+    """📋 Transforms your disorganized thoughts into structured PDF content"""
     lines = markdown_text.strip().split('\n')
     pdf_content = []
     number_pattern = re.compile(r'^\d+\.\s')
     for line in lines:
         line = line.strip()
         if not line or line.startswith('# '):
             continue
+        # Handle bold formatting before any other processing
         if render_with_bold:
             line = re.sub(r'\*\*(.*?)\*\*', r'<b>\1</b>', line)
         if auto_bold_numbers and number_pattern.match(line):
+            # Only apply bold if not already entirely bold
             if not (line.startswith("<b>") and line.endswith("</b>")):
+                # If there's already some bold formatting inside, we need to handle carefully
+                if "<b>" in line and "</b>" in line:
+                    # Complex case - for simplicity, just make the whole line bold
+                    # but remove any existing bold tags first
+                    line = re.sub(r'</?b>', '', line)
+                    line = f"<b>{line}</b>"
+                else:
+                    line = f"<b>{line}</b>"
         pdf_content.append(line)
     total_lines = len(pdf_content)
     return pdf_content, total_lines
+# 🏗️ Building PDFs like it's your second job
 def create_pdf(markdown_text, base_font_size, render_with_bold, auto_bold_numbers, enlarge_numbered, num_columns):
+    """🔨 Constructs a PDF with the precision of a sleep-deprived architect"""
     buffer = io.BytesIO()
     page_width = A4[0] * 2
     page_height = A4[1]
     buffer.seek(0)
     return buffer.getvalue()
+# 🖼️ Converting PDFs to images, because we can't leave well enough alone
 def pdf_to_image(pdf_bytes):
+    """🔎 Turns your PDF into pictures because some people just want to see the world rendered"""
     try:
         doc = fitz.open(stream=pdf_bytes, filetype="pdf")
         images = []
 md_files = [f for f in glob.glob("*.md") if os.path.basename(f) != "README.md"]
 md_options = [os.path.splitext(os.path.basename(f))[0] for f in md_files]
+# 🎪 The main Streamlit show begins here
 with st.sidebar:
     st.markdown("### PDF Options")
     if md_options:
             mime="audio/mpeg"
         )
+# 🚀 Generating the PDF with more complexity than a rocket launch
 with st.spinner("Generating PDF..."):
     pdf_bytes = create_pdf(st.session_state.markdown_content, base_font_size, render_with_bold, auto_bold_numbers, enlarge_numbered, num_columns)
+# 📺 Displaying the preview, because everyone loves to window shop
 with st.container():
     pdf_images = pdf_to_image(pdf_bytes)
     if pdf_images:
     else:
         st.info("Download the PDF to view it locally.")
+# 💾 Last chance to save your masterpiece before it's gone forever
 with st.sidebar:
     st.download_button(
         label="💾📄 Save PDF",
         data=pdf_bytes,
         file_name=f"{prefix} {selected_md}.pdf" if selected_md else f"{prefix} output.pdf",
         mime="application/pdf"
+    )