changcheng967 committed on
Commit
8826e0b
·
verified ·
1 Parent(s): c712a46

Update src/streamlit_app.py

Browse files
Files changed (1) hide show
  1. src/streamlit_app.py +44 -36
src/streamlit_app.py CHANGED
@@ -1,55 +1,63 @@
1
- from transformers import pipeline
2
  import streamlit as st
3
  import torch
4
  import time
5
 
6
- # Limit CPU threads for better responsiveness
7
  torch.set_num_threads(2)
8
 
9
- st.title("AI Humanizer Lite (CPU Friendly)")
10
-
11
- # Load pipelines once per session
12
- if "detect_pipe" not in st.session_state or "humanizer_pipe" not in st.session_state:
13
- with st.spinner("Loading models (takes ~10s on CPU)..."):
14
- st.session_state.detect_pipe = pipeline(
15
- "text-classification",
16
- model="roberta-base-openai-detector",
17
- device=-1,
18
- )
19
- st.session_state.humanizer_pipe = pipeline(
20
- "text2text-generation",
21
- model="sshleifer/distilbart-cnn-12-6",
22
- device=-1,
23
- )
24
-
25
- def detect_ai(text: str) -> float:
26
- try:
27
- outputs = st.session_state.detect_pipe(text[:256])
 
 
 
 
 
 
 
28
  for out in outputs:
29
  if out["label"].lower() == "ai":
30
- return out["score"]
31
- except Exception as e:
32
- st.error(f"Error during AI detection: {e}")
33
- return 0.0
 
34
 
35
- def humanize_text(text: str) -> str:
 
 
36
  prompt = f"Rewrite this text naturally: {text}"
37
- try:
38
- result = st.session_state.humanizer_pipe(prompt, max_length=128, num_beams=3)
39
- return result[0]["generated_text"]
40
- except Exception as e:
41
- st.error(f"Error during text rewriting: {e}")
42
- return text
43
 
44
- text = st.text_area("Paste AI-generated text here", height=200)
45
 
46
- if st.button("Humanize"):
47
  if not text.strip():
48
  st.warning("Please enter some text!")
49
  else:
50
- with st.spinner("Detecting AI content..."):
 
51
  score = detect_ai(text)
52
- st.write(f"AI detection score: {score:.2%}")
 
53
 
54
  if score < 0.5:
55
  st.success("This text looks human already! No need to rewrite.")
 
1
+ from transformers import pipeline, AutoTokenizer
2
  import streamlit as st
3
  import torch
4
  import time
5
 
6
# Limit CPU threads for performance (caps torch's intra-op parallelism so the
# Streamlit app stays responsive on a small shared CPU host).
torch.set_num_threads(2)

st.title("AI Humanizer Lite (CPU Friendly) — Unlimited Text Detection")
10
+
11
@st.cache_resource(show_spinner=False)
def load_models():
    """Build and cache the AI-detection pipeline and its tokenizer.

    Decorated with ``st.cache_resource`` so the slow model load runs only
    once per Streamlit process; every rerun reuses the same objects.

    Returns:
        tuple: ``(detection_pipeline, tokenizer)`` for the
        ``roberta-base-openai-detector`` checkpoint, running on CPU.
    """
    model_name = "roberta-base-openai-detector"
    tok = AutoTokenizer.from_pretrained(model_name)
    classifier = pipeline("text-classification", model=model_name, device=-1)
    return classifier, tok
16
+
17
# Materialize the (cached) detection pipeline and tokenizer once at import time.
detect_pipe, tokenizer = load_models()
18
+
19
def chunk_text(text, max_tokens=256, tok=None):
    """Split *text* into pieces of at most *max_tokens* tokenizer tokens.

    Args:
        text: Raw input string.
        max_tokens: Maximum tokens per chunk (default 256, below the
            detector model's context limit).
        tok: Optional tokenizer exposing ``tokenize`` and
            ``convert_tokens_to_string``; defaults to the module-level
            ``tokenizer``. Injectable so the function can be tested in
            isolation.

    Returns:
        list[str]: Detokenized chunks; an empty list for empty input.
    """
    if tok is None:
        tok = tokenizer  # module-level tokenizer loaded by load_models()
    tokens = tok.tokenize(text)
    # The original bound a local named `chunk_text`, shadowing this very
    # function; renamed and folded into a comprehension.
    return [
        tok.convert_tokens_to_string(tokens[i:i + max_tokens])
        for i in range(0, len(tokens), max_tokens)
    ]
27
+
28
def detect_ai(text):
    """Score *text* for AI-likeness.

    The text is split into tokenizer-sized chunks, each chunk is classified
    by the detection pipeline, and the highest per-chunk "AI" probability is
    returned — so any single AI-like chunk flags the whole text.

    Returns:
        float: Maximum per-chunk AI score, or 0.0 when no chunks (or no
        "ai"-labelled prediction) are produced.
    """
    per_chunk_scores = []
    for piece in chunk_text(text):
        # Pipeline output is a list of {"label", "score"} dicts; keep the
        # score of the entry labelled "ai" (case-insensitive), else 0.0.
        ai_score = 0.0
        for prediction in detect_pipe(piece):
            if prediction["label"].lower() == "ai":
                ai_score = prediction["score"]
        per_chunk_scores.append(ai_score)
    if not per_chunk_scores:
        return 0.0
    return max(per_chunk_scores)
42
 
43
@st.cache_resource(show_spinner=False)
def _load_humanizer():
    """Load the rewriting pipeline once per process (cached by Streamlit)."""
    return pipeline(
        "text2text-generation",
        model="sshleifer/distilbart-cnn-12-6",
        device=-1,  # CPU
    )


def humanize_text(text):
    """Rewrite *text* so it reads more naturally.

    Uses a small distilled BART text2text model. The pipeline is loaded
    lazily and cached via ``st.cache_resource`` — the previous code rebuilt
    the pipeline (a full model load) on every call, which is prohibitively
    slow on CPU.

    Args:
        text: Input string to rewrite.

    Returns:
        str: The model's rewritten text.
    """
    humanizer_pipe = _load_humanizer()
    prompt = f"Rewrite this text naturally: {text}"
    result = humanizer_pipe(prompt, max_length=128, num_beams=3)
    return result[0]["generated_text"]
 
 
 
 
49
 
50
+ text = st.text_area("Paste AI-generated text here", height=300)
51
 
52
+ if st.button("Detect & Humanize"):
53
  if not text.strip():
54
  st.warning("Please enter some text!")
55
  else:
56
+ with st.spinner("Detecting AI content on chunks..."):
57
+ start = time.time()
58
  score = detect_ai(text)
59
+ duration = time.time() - start
60
+ st.write(f"AI detection score: {score:.2%} (Processed in {duration:.1f}s)")
61
 
62
  if score < 0.5:
63
  st.success("This text looks human already! No need to rewrite.")