mihalykiss committed on
Commit
c1d5432
·
verified ·
1 Parent(s): e40cdcc

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +10 -5
app.py CHANGED
@@ -59,11 +59,11 @@ def clean_text(text: str) -> str:
59
  text = re.sub(r'\s+([,.;:?!])', r'\1', text)
60
  return text
61
 
62
- if tokenizer: # Only set normalizer if tokenizer loaded successfully
63
  newline_to_space = Replace(Regex(r'\s*\n\s*'), " ")
64
- join_hyphen_break = Replace(Regex(r'(\w+)[--]\s*\n\s*(\w+)'), r"\1\2") # Corrected hyphen regex
65
  tokenizer.backend_tokenizer.normalizer = Sequence([
66
- tokenizer.backend_tokenizer.normalizer, # Keep existing normalizers
67
  join_hyphen_break,
68
  newline_to_space,
69
  Strip()
@@ -82,7 +82,7 @@ description = """
82
  <li><span class="icon">✅</span> <strong>Human Verification: </strong> Clearly identifies human-written content.</li>
83
  <li><span class="icon">🔍</span> <strong>Model Detection: </strong> Capable of identifying content from over 40 AI models.</li>
84
  <li><span class="icon">📈</span> <strong>Accuracy: </strong> Performs optimally with more extensive text inputs.</li>
85
- <li><span class="icon">📄</span> <strong>Read more: </strong> Our methodology is detailed in our research paper:
86
  <a href="https://aclanthology.org/2025.genaidetect-1.15/" target="_blank" class="learn-more-link"> <b> LINK </b></a>.
87
  </li>
88
  </ul>
@@ -175,7 +175,11 @@ modern_css = """
175
  --border-radius-md: 8px;
176
  --border-radius-lg: 12px;
177
  }
178
-
 
 
 
 
179
  body {
180
  font-family: 'Inter', sans-serif;
181
  background: linear-gradient(135deg, #f5f7fa 0%, #eef2f7 100%);
@@ -372,6 +376,7 @@ h1 {
372
  font-size: clamp(13px, 2vw, 14px);
373
  color: var(--text-secondary);
374
  }
 
375
  #bottom_text p {
376
  margin: 0;
377
  }
 
59
  text = re.sub(r'\s+([,.;:?!])', r'\1', text)
60
  return text
61
 
62
+ if tokenizer:
63
  newline_to_space = Replace(Regex(r'\s*\n\s*'), " ")
64
+ join_hyphen_break = Replace(Regex(r'(\w+)[--]\s*\n\s*(\w+)'), r"\1\2")
65
  tokenizer.backend_tokenizer.normalizer = Sequence([
66
+ tokenizer.backend_tokenizer.normalizer,
67
  join_hyphen_break,
68
  newline_to_space,
69
  Strip()
 
82
  <li><span class="icon">✅</span> <strong>Human Verification: </strong> Clearly identifies human-written content.</li>
83
  <li><span class="icon">🔍</span> <strong>Model Detection: </strong> Capable of identifying content from over 40 AI models.</li>
84
  <li><span class="icon">📈</span> <strong>Accuracy: </strong> Performs optimally with more extensive text inputs.</li>
85
+ <li><span class="icon">📄</span> <strong>Read more: </strong> Our methodology is detailed in our research paper: &nbsp;
86
  <a href="https://aclanthology.org/2025.genaidetect-1.15/" target="_blank" class="learn-more-link"> <b> LINK </b></a>.
87
  </li>
88
  </ul>
 
175
  --border-radius-md: 8px;
176
  --border-radius-lg: 12px;
177
  }
178
+ .features-list strong::after {
179
+ content: " ";
180
+ display: inline-block;
181
+ width: 0.2em;
182
+ }
183
  body {
184
  font-family: 'Inter', sans-serif;
185
  background: linear-gradient(135deg, #f5f7fa 0%, #eef2f7 100%);
 
376
  font-size: clamp(13px, 2vw, 14px);
377
  color: var(--text-secondary);
378
  }
379
+
380
  #bottom_text p {
381
  margin: 0;
382
  }