Spaces:

awacke1
/

PDF-Paper-Maker-AI-UI-UX

Running

App Files

xet

Community

awacke1 committed on Apr 15

Commit

e393e33

verified ·

1 Parent(s): 698df1e

Update app.py

Browse files

Files changed (1) hide show

app.py +17 -43

app.py CHANGED Viewed

@@ -82,48 +82,23 @@ async def generate_audio(text, voice, filename):
 def detect_and_convert_links(text):
     # Convert Markdown links [text](url) to HTML <a> tags
     md_link_pattern = re.compile(r'\[(.*?)\]\((https?://[^\s\[\]()<>{}]+)\)')
-    def replace_md_link(match):
-        text = match.group(1)
-        url = match.group(2)
-        return f'<a href="{url}" color="blue">{text}</a>'
-    text = md_link_pattern.sub(replace_md_link, text)
     # Convert plain URLs to HTML <a> tags, avoiding already tagged links
     url_pattern = re.compile(
-        r'(?<!href=")(https?://[^\s\[\]()<>{}]+)',
         re.IGNORECASE
     )
-    def replace_url(match):
-        url = match.group(1)
-        return f'<a href="{url}" color="blue">{url}</a>'
-    text = url_pattern.sub(replace_url, text)
     return text
 def apply_emoji_font(text, emoji_font):
-    # Preserve links and bold tags
-    link_pattern = re.compile(r'(<a\s+href="[^"]+"[^>]*>.*?</a>)')
-    bold_pattern = re.compile(r'(<b>.*?</b>)')
-    # Split text around links and bold tags
-    segments = []
-    last_pos = 0
-    for match in link_pattern.finditer(text):
-        start, end = match.span()
-        if last_pos < start:
-            segments.append(('text', text[last_pos:start]))
-        segments.append(('link', match.group(0)))
-        last_pos = end
-    for match in bold_pattern.finditer(text[last_pos:]):
-        start, end = match.span()
-        if last_pos < start + last_pos:
-            segments.append(('text', text[last_pos:start + last_pos]))
-        segments.append(('bold', match.group(0)))
-        last_pos = start + end
-    if last_pos < len(text):
-        segments.append(('text', text[last_pos:]))
-    # Apply emoji font to text segments only
     emoji_pattern = re.compile(
         r"([\U0001F300-\U0001F5FF"
         r"\U0001F600-\U0001F64F"
@@ -144,24 +119,23 @@ def apply_emoji_font(text, emoji_font):
         emoji = unicodedata.normalize('NFC', emoji)
         return f'<font face="{emoji_font}">{emoji}</font>'
-    result = []
-    for seg_type, content in segments:
-        if seg_type == 'text':
             # Apply font to non-emoji text and emoji separately
             parts = []
             last_pos = 0
-            for match in emoji_pattern.finditer(content):
                 start, end = match.span()
                 if last_pos < start:
-                    parts.append(f'<font face="DejaVuSans">{content[last_pos:start]}</font>')
                 parts.append(replace_emoji(match))
                 last_pos = end
-            if last_pos < len(content):
-                parts.append(f'<font face="DejaVuSans">{content[last_pos:]}</font>')
             result.append(''.join(parts))
-        else:
-            # Keep links and bold tags unchanged
-            result.append(content)
     return ''.join(result)

 def detect_and_convert_links(text):
     # Convert Markdown links [text](url) to HTML <a> tags
     md_link_pattern = re.compile(r'\[(.*?)\]\((https?://[^\s\[\]()<>{}]+)\)')
+    text = md_link_pattern.sub(r'<a href="\2" color="blue">\1</a>', text)
     # Convert plain URLs to HTML <a> tags, avoiding already tagged links
     url_pattern = re.compile(
+        r'(?<!href=")(https?://[^\s<>{}]+)',
         re.IGNORECASE
     )
+    text = url_pattern.sub(r'<a href="\1" color="blue">\1</a>', text)
     return text
 def apply_emoji_font(text, emoji_font):
+    # Protect existing tags
+    tag_pattern = re.compile(r'(<[^>]+>)')
+    segments = tag_pattern.split(text)
+    result = []
+    # Apply emoji font only to non-tag text
     emoji_pattern = re.compile(
         r"([\U0001F300-\U0001F5FF"
         r"\U0001F600-\U0001F64F"
         emoji = unicodedata.normalize('NFC', emoji)
         return f'<font face="{emoji_font}">{emoji}</font>'
+    for segment in segments:
+        if tag_pattern.match(segment):
+            # Keep tags unchanged
+            result.append(segment)
+        else:
             # Apply font to non-emoji text and emoji separately
             parts = []
             last_pos = 0
+            for match in emoji_pattern.finditer(segment):
                 start, end = match.span()
                 if last_pos < start:
+                    parts.append(f'<font face="DejaVuSans">{segment[last_pos:start]}</font>')
                 parts.append(replace_emoji(match))
                 last_pos = end
+            if last_pos < len(segment):
+                parts.append(f'<font face="DejaVuSans">{segment[last_pos:]}</font>')
             result.append(''.join(parts))
     return ''.join(result)