Spaces:

mihalykiss
/

test

Running

App Files Files Community

mihalykiss committed on 18 days ago

Commit

c1d5432

verified ·

1 Parent(s): e40cdcc

Update app.py

Browse files

Files changed (1) hide show

app.py +10 -5

app.py CHANGED Viewed

@@ -59,11 +59,11 @@ def clean_text(text: str) -> str:
     text = re.sub(r'\s+([,.;:?!])', r'\1', text)
     return text
-if tokenizer: # Only set normalizer if tokenizer loaded successfully
     newline_to_space = Replace(Regex(r'\s*\n\s*'), " ")
-    join_hyphen_break = Replace(Regex(r'(\w+)[--]\s*\n\s*(\w+)'), r"\1\2") # Corrected hyphen regex
     tokenizer.backend_tokenizer.normalizer = Sequence([
-        tokenizer.backend_tokenizer.normalizer, # Keep existing normalizers
         join_hyphen_break,
         newline_to_space,
         Strip()
@@ -82,7 +82,7 @@ description = """
         <li><span class="icon">✅</span> <strong>Human Verification: </strong> Clearly identifies human-written content.</li>
         <li><span class="icon">🔍</span> <strong>Model Detection: </strong> Capable of identifying content from over 40 AI models.</li>
         <li><span class="icon">📈</span> <strong>Accuracy: </strong> Performs optimally with more extensive text inputs.</li>
-        <li><span class="icon">📄</span> <strong>Read more: </strong> Our methodology is detailed in our research paper:
             <a href="https://aclanthology.org/2025.genaidetect-1.15/" target="_blank" class="learn-more-link"> <b> LINK </b></a>.
         </li>
     </ul>
@@ -175,7 +175,11 @@ modern_css = """
     --border-radius-md: 8px;
     --border-radius-lg: 12px;
 }
 body {
     font-family: 'Inter', sans-serif;
     background: linear-gradient(135deg, #f5f7fa 0%, #eef2f7 100%);
@@ -372,6 +376,7 @@ h1 {
     font-size: clamp(13px, 2vw, 14px);
     color: var(--text-secondary);
 }
 #bottom_text p {
     margin: 0;
 }

     text = re.sub(r'\s+([,.;:?!])', r'\1', text)
     return text
+if tokenizer:
     newline_to_space = Replace(Regex(r'\s*\n\s*'), " ")
+    join_hyphen_break = Replace(Regex(r'(\w+)[--]\s*\n\s*(\w+)'), r"\1\2")
     tokenizer.backend_tokenizer.normalizer = Sequence([
+        tokenizer.backend_tokenizer.normalizer,
         join_hyphen_break,
         newline_to_space,
         Strip()
         <li><span class="icon">✅</span> <strong>Human Verification: </strong> Clearly identifies human-written content.</li>
         <li><span class="icon">🔍</span> <strong>Model Detection: </strong> Capable of identifying content from over 40 AI models.</li>
         <li><span class="icon">📈</span> <strong>Accuracy: </strong> Performs optimally with more extensive text inputs.</li>
+        <li><span class="icon">📄</span> <strong>Read more: </strong> Our methodology is detailed in our research paper: &nbsp;
             <a href="https://aclanthology.org/2025.genaidetect-1.15/" target="_blank" class="learn-more-link"> <b> LINK </b></a>.
         </li>
     </ul>
     --border-radius-md: 8px;
     --border-radius-lg: 12px;
 }
+.features-list strong::after {
+  content: " ";
+  display: inline-block;
+  width: 0.2em;
+}
 body {
     font-family: 'Inter', sans-serif;
     background: linear-gradient(135deg, #f5f7fa 0%, #eef2f7 100%);
     font-size: clamp(13px, 2vw, 14px);
     color: var(--text-secondary);
 }
 #bottom_text p {
     margin: 0;
 }