conversantech committed on
Commit
4facc83
·
1 Parent(s): 2c89e89
Files changed (1) hide show
  1. app.py +238 -84
app.py CHANGED
@@ -5,6 +5,7 @@ import re
5
  import nltk
6
  from nltk.tokenize import sent_tokenize, word_tokenize
7
  from textstat import flesch_reading_ease, flesch_kincaid_grade
 
8
 
9
  # Setup NLTK download path for Hugging Face Spaces
10
  os.environ['NLTK_DATA'] = '/tmp/nltk_data'
@@ -36,26 +37,38 @@ class AIContentHumanizer:
36
  self.setup_humanization_patterns()
37
 
38
  def setup_humanization_patterns(self):
39
- """Setup patterns for AI phrase replacement"""
40
- self.ai_replacements = {
41
- r'\bit is important to note that\b': ["worth mentioning that", "keep in mind that", "note that"],
42
- r'\bit is worth noting that\b': ["interestingly", "notably", "it's worth mentioning"],
43
- r'\bin conclusion\b': ["to wrap up", "all in all", "bottom line"],
44
- r'\bfurthermore\b': ["plus", "also", "on top of that"],
45
- r'\bmoreover\b': ["what's more", "besides", "additionally"],
46
- r'\bhowever\b': ["but", "though", "on the flip side"],
47
- r'\bnevertheless\b': ["still", "even so", "that said"],
48
- r'\btherefore\b': ["so", "thus", "as a result"],
49
- r'\bconsequently\b': ["as a result", "so", "because of this"],
50
- r'\bin order to\b': ["to", "so we can", "for"],
51
- r'\bdue to the fact that\b': ["because", "since", "given that"],
52
- r'\bwith regard to\b': ["about", "regarding", "when it comes to"],
53
- r'\bit should be noted that\b': ["note that", "remember", "keep in mind"],
54
- r'\bit is essential to\b': ["you need to", "it's crucial to", "make sure to"],
55
- r'\bsubsequently\b': ["then", "next", "after that"],
56
- r'\bultimately\b': ["in the end", "finally", "when all is said and done"]
 
 
 
 
 
 
 
 
 
 
 
57
  }
58
 
 
59
  self.contractions = {
60
  r'\bdo not\b': "don't",
61
  r'\bdoes not\b': "doesn't",
@@ -83,95 +96,206 @@ class AIContentHumanizer:
83
  r'\bI have\b': "I've",
84
  r'\byou have\b': "you've",
85
  r'\bwe have\b': "we've",
86
- r'\bthey have\b': "they've"
 
 
 
 
 
87
  }
88
 
89
- self.casual_fillers = [
 
 
 
 
 
 
 
 
90
  "you know", "I mean", "like", "actually", "basically",
91
- "honestly", "literally", "obviously", "clearly", "definitely"
 
 
 
92
  ]
93
 
94
- self.personal_touches = [
95
- "I think", "in my opinion", "from what I've seen", "personally",
96
- "if you ask me", "the way I see it", "from my experience"
 
 
 
97
  ]
98
 
99
  def replace_ai_phrases(self, text):
100
- """Replace formal AI phrases with more casual alternatives"""
101
- for pattern, replacements in self.ai_replacements.items():
102
- if re.search(pattern, text, re.IGNORECASE):
103
  replacement = random.choice(replacements)
104
- text = re.sub(pattern, replacement, text, flags=re.IGNORECASE)
105
  return text
106
 
107
  def add_contractions(self, text):
108
- """Add contractions to make text more casual"""
109
  for pattern, contraction in self.contractions.items():
110
  text = re.sub(pattern, contraction, text, flags=re.IGNORECASE)
111
  return text
112
 
113
- def vary_sentence_structure(self, text):
114
- """Add variety to sentence structure"""
115
- try:
116
- sentences = sent_tokenize(text)
117
- varied_sentences = []
 
 
 
 
 
 
 
 
 
 
 
118
 
119
- for sentence in sentences:
120
- # Randomly add sentence starters
121
- if random.random() < 0.3 and len(sentence.split()) > 8:
122
- starters = ["Well,", "So,", "Now,", "Look,", "Here's the thing -"]
123
- sentence = f"{random.choice(starters)} {sentence.lower()}"
124
-
125
- varied_sentences.append(sentence)
126
 
127
- return " ".join(varied_sentences)
128
- except Exception:
129
- return text
130
 
131
- def add_personal_touches(self, text):
132
- """Add personal opinions and touches"""
133
  sentences = sent_tokenize(text)
134
- if len(sentences) > 2 and random.random() < 0.4:
135
- insert_pos = random.randint(1, len(sentences) - 1)
136
- personal_touch = random.choice(self.personal_touches)
137
- sentences[insert_pos] = f"{personal_touch}, {sentences[insert_pos].lower()}"
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
138
 
139
  return " ".join(sentences)
140
 
141
- def add_casual_punctuation(self, text):
142
- """Add casual punctuation like dashes and ellipses"""
143
- # Replace some periods with dashes for emphasis
144
- text = re.sub(r'(\w+)\. ([A-Z])', r'\1 - \2', text)
145
 
146
- # Add occasional ellipses
147
- if random.random() < 0.3:
148
- text = re.sub(r'(\w+)\.', r'\1...', text, count=1)
149
 
150
- return text
 
 
 
 
 
 
 
 
151
 
152
- def add_natural_fillers(self, text):
153
- """Add natural conversation fillers"""
154
  sentences = sent_tokenize(text)
155
- if len(sentences) > 1 and random.random() < 0.5:
156
- filler_pos = random.randint(0, len(sentences) - 1)
157
- filler = random.choice(self.casual_fillers)
158
- sentences[filler_pos] = f"{filler}, {sentences[filler_pos].lower()}"
 
 
 
 
 
 
159
 
160
  return " ".join(sentences)
161
 
162
- def clean_text(self, text):
163
- """Clean up the text formatting"""
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
164
  # Fix spacing issues
165
  text = re.sub(r'\s+', ' ', text)
166
  text = re.sub(r'\s+([,.!?])', r'\1', text)
167
 
168
- # Fix capitalization after sentence starters
169
  text = re.sub(r'([.!?]\s+)([a-z])', lambda m: m.group(1) + m.group(2).upper(), text)
 
170
 
171
  # Ensure first letter is capitalized
172
  if text and text[0].islower():
173
  text = text[0].upper() + text[1:]
174
 
 
 
 
175
  return text.strip()
176
 
177
  def get_readability_score(self, text):
@@ -187,8 +311,8 @@ class AIContentHumanizer:
187
  except Exception as e:
188
  return f"Could not calculate readability: {str(e)}"
189
 
190
- def humanize_text(self, text, intensity="medium"):
191
- """Main method to humanize AI-generated text"""
192
  if not text or not text.strip():
193
  return "Please provide text to humanize."
194
 
@@ -203,19 +327,24 @@ class AIContentHumanizer:
203
  except Exception as nltk_error:
204
  return f"NLTK Error: {str(nltk_error)}. Please try again or contact support."
205
 
206
- # Apply humanization techniques based on intensity
207
  text = self.replace_ai_phrases(text)
208
  text = self.add_contractions(text)
 
209
 
210
  if intensity in ["medium", "heavy"]:
211
- text = self.vary_sentence_structure(text)
212
- text = self.add_personal_touches(text)
213
- text = self.add_casual_punctuation(text)
 
214
 
215
  if intensity == "heavy":
216
- text = self.add_natural_fillers(text)
 
 
 
217
 
218
- return self.clean_text(text)
219
 
220
  except Exception as e:
221
  return f"Error processing text: {str(e)}\n\nOriginal text: {text}"
@@ -234,22 +363,47 @@ def create_interface():
234
  except Exception as e:
235
  return f"Error: {str(e)}", "Processing error"
236
 
237
- with gr.Blocks(title="AI Content Humanizer") as interface:
238
- gr.Markdown("""# πŸ€–βž‘οΈπŸ‘€ AI Content Humanizer
239
- Transform AI-generated content into human-sounding, casual, and readable text!""")
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
240
 
241
- input_text = gr.Textbox(label="AI-generated Text", lines=8, placeholder="Paste your AI-generated text here...")
242
- intensity = gr.Radio(["light", "medium", "heavy"], value="medium", label="Humanization Level")
243
- output_text = gr.Textbox(label="Humanized Text", lines=8, show_copy_button=True)
244
- readability = gr.Textbox(label="Readability Score", lines=2)
 
 
 
245
 
246
- btn = gr.Button("Humanize Text", variant="primary")
247
  btn.click(fn=process_text, inputs=[input_text, intensity], outputs=[output_text, readability])
248
  input_text.submit(fn=process_text, inputs=[input_text, intensity], outputs=[output_text, readability])
249
 
250
  return interface
251
 
252
  if __name__ == "__main__":
253
- print("Starting AI Content Humanizer...")
254
  app = create_interface()
255
  app.launch(server_name="0.0.0.0", server_port=7860, show_error=True)
 
5
  import nltk
6
  from nltk.tokenize import sent_tokenize, word_tokenize
7
  from textstat import flesch_reading_ease, flesch_kincaid_grade
8
+ import string
9
 
10
  # Setup NLTK download path for Hugging Face Spaces
11
  os.environ['NLTK_DATA'] = '/tmp/nltk_data'
 
37
  self.setup_humanization_patterns()
38
 
39
  def setup_humanization_patterns(self):
40
+ """Setup comprehensive patterns for maximum humanization"""
41
+ # Avoid AI-flagged terms completely
42
+ self.ai_flagged_terms = {
43
+ r'\brealm\b': ["world", "area", "field", "space", "domain"],
44
+ r'\bdelve\b': ["explore", "dig into", "look at", "examine", "dive into"],
45
+ r'\bembark\b': ["start", "begin", "kick off", "launch into"],
46
+ r'\ba testament to\b': ["shows", "proves", "demonstrates", "reflects"],
47
+ r'\bthe landscape of\b': ["the world of", "the field of", "the area of"],
48
+ r'\bnavigating\b': ["dealing with", "handling", "managing", "working through"],
49
+ r'\bmeticulous\b': ["careful", "detailed", "thorough", "precise"],
50
+ r'\bintricate\b': ["complex", "detailed", "complicated", "elaborate"],
51
+ r'\bfurthermore\b': ["plus", "also", "and", "what's more"],
52
+ r'\bmoreover\b': ["also", "plus", "and", "on top of that"],
53
+ r'\bhowever\b': ["but", "though", "yet", "still"],
54
+ r'\bnevertheless\b': ["but", "still", "even so", "anyway"],
55
+ r'\btherefore\b': ["so", "thus", "that's why", "because of this"],
56
+ r'\bconsequently\b': ["so", "as a result", "because of this"],
57
+ r'\bin conclusion\b': ["to wrap up", "bottom line", "all in all"],
58
+ r'\bit is important to note\b': ["worth mentioning", "keep in mind", "note that"],
59
+ r'\bit should be noted\b': ["remember", "keep in mind", "note that"],
60
+ r'\bsignificant\b': ["big", "major", "important", "huge"],
61
+ r'\bsubstantial\b': ["big", "large", "major", "significant"],
62
+ r'\bcomprehensive\b': ["complete", "full", "thorough", "detailed"],
63
+ r'\boptimal\b': ["best", "ideal", "perfect", "top"],
64
+ r'\bfacilitate\b': ["help", "make easier", "enable", "assist"],
65
+ r'\butilize\b': ["use", "employ", "apply", "work with"],
66
+ r'\bleverage\b': ["use", "take advantage of", "make use of"],
67
+ r'\benhance\b': ["improve", "boost", "make better", "upgrade"],
68
+ r'\bimplement\b': ["put in place", "set up", "start using", "apply"]
69
  }
70
 
71
+ # More natural contractions
72
  self.contractions = {
73
  r'\bdo not\b': "don't",
74
  r'\bdoes not\b': "doesn't",
 
96
  r'\bI have\b': "I've",
97
  r'\byou have\b': "you've",
98
  r'\bwe have\b': "we've",
99
+ r'\bthey have\b': "they've",
100
+ r'\bthat is\b': "that's",
101
+ r'\bit is\b': "it's",
102
+ r'\bwho is\b': "who's",
103
+ r'\bwhat is\b': "what's",
104
+ r'\bwhere is\b': "where's"
105
  }
106
 
107
+ # Casual conversation starters
108
+ self.conversation_starters = [
109
+ "Look,", "Listen,", "Here's the thing -", "You know what?",
110
+ "Honestly,", "Real talk -", "Let me tell you,", "So here's what I think -",
111
+ "Okay, so", "Right, so", "Well,", "Actually,", "Basically,"
112
+ ]
113
+
114
+ # Natural fillers and expressions
115
+ self.natural_expressions = [
116
  "you know", "I mean", "like", "actually", "basically",
117
+ "honestly", "literally", "obviously", "clearly", "definitely",
118
+ "pretty much", "kind of", "sort of", "more or less", "at the end of the day",
119
+ "when it comes down to it", "if you ask me", "in my experience",
120
+ "from what I've seen", "the way I see it"
121
  ]
122
 
123
+ # Personal perspective phrases
124
+ self.personal_phrases = [
125
+ "I think", "in my opinion", "from my experience", "personally",
126
+ "if you ask me", "the way I see it", "from what I've seen",
127
+ "in my view", "as I see it", "my take is", "I believe",
128
+ "it seems to me", "I'd say", "my guess is"
129
  ]
130
 
131
def replace_ai_phrases(self, text):
    """Replace AI-flagged terms with random casual synonyms.

    Every occurrence of each pattern in ``self.ai_flagged_terms`` is swapped
    for an independently chosen synonym, matching the per-occurrence random
    choice of the old ``while``/``count=1`` loop.

    Fix: the previous ``while re.search(...)`` loop would spin forever if a
    chosen synonym itself matched the pattern being replaced; a single
    ``re.sub`` pass with a callable replacement cannot loop.
    """
    for pattern, replacements in self.ai_flagged_terms.items():
        # A function replacement picks a fresh synonym for each match.
        text = re.sub(
            pattern,
            lambda _match, options=replacements: random.choice(options),
            text,
            flags=re.IGNORECASE,
        )
    return text
138
 
139
def add_contractions(self, text):
    """Rewrite formal verb phrases as casual contractions (case-insensitive)."""
    casual = text
    for formal_pattern, short_form in self.contractions.items():
        # Each key is a \b-anchored regex; IGNORECASE also catches "Do not".
        casual = re.sub(formal_pattern, short_form, casual, flags=re.IGNORECASE)
    return casual
144
 
145
def add_human_imperfections(self, text):
    """Inject occasional self-corrections and hesitation markers into *text*.

    Works sentence-by-sentence (sentences come from nltk's sent_tokenize);
    every insertion is probabilistic, so output varies between calls.
    """
    sentences = sent_tokenize(text)
    modified_sentences = []

    for sentence in sentences:
        # ~10% of sentences that have more than 5 words get a mid-sentence
        # self-correction such as "- I mean -".
        if random.random() < 0.1:
            words = sentence.split()
            if len(words) > 5:
                correction_phrases = ["I mean", "or rather", "well, actually", "sorry,"]
                correction = random.choice(correction_phrases)
                # len(words) > 5 guarantees randint's 2..len-2 range is valid.
                insert_pos = random.randint(2, len(words) - 2)
                words.insert(insert_pos, f"- {correction} -")
                sentence = " ".join(words)

        # ~15% of sentences get a leading hesitation ("um," etc.).
        # NOTE(review): .lower() lowercases the whole sentence, so proper
        # nouns and "I" lose their capitals - confirm this is intended.
        if random.random() < 0.15:
            hesitations = ["um,", "uh,", "well,", "so,", "like,"]
            hesitation = random.choice(hesitations)
            sentence = f"{hesitation} {sentence.lower()}"
            sentence = sentence[0].upper() + sentence[1:]

        modified_sentences.append(sentence)

    return " ".join(modified_sentences)
172
 
173
def vary_sentence_structure_advanced(self, text):
    """Randomly restructure sentences with casual openers, mid-sentence
    interjections, and reader-directed questions.

    All three transformations are probabilistic, so output varies per call.
    """
    sentences = sent_tokenize(text)
    varied_sentences = []

    for i, sentence in enumerate(sentences):
        words = sentence.split()

        # ~25% of sentences longer than 6 words get a conversational opener,
        # then the first character is re-capitalized.
        if random.random() < 0.25 and len(words) > 6:
            starter = random.choice(self.conversation_starters)
            sentence = f"{starter} {sentence.lower()}"
            sentence = sentence[0].upper() + sentence[1:]

        # ~40% of sentences longer than 15 words get an interjection spliced
        # into the middle.
        # NOTE(review): `words` was split before the opener branch above, so
        # when both branches fire the opener is silently discarded - confirm.
        if len(words) > 15 and random.random() < 0.4:
            mid_point = len(words) // 2
            interjection = random.choice(["- and this is key -", "- here's the thing -", "- get this -"])
            words.insert(mid_point, interjection)
            sentence = " ".join(words)

        # ~20% of non-initial sentences get a trailing engagement question.
        if random.random() < 0.2 and i > 0:
            questions = ["Right?", "You know?", "Make sense?", "See what I mean?"]
            sentence += f" {random.choice(questions)}"

        varied_sentences.append(sentence)

    return " ".join(varied_sentences)
202
+
203
def add_personal_touches_advanced(self, text):
    """Weave first-person anecdote openers and opinion phrases into *text*."""
    sentences = sent_tokenize(text)

    # For texts of 4+ sentences, ~30% of calls splice one anecdote opener
    # into a middle sentence (never the first or the last).
    if len(sentences) > 3 and random.random() < 0.3:
        anecdotes = [
            "I've been there myself, and",
            "From my own experience,",
            "I remember when I first learned this -",
            "This reminds me of something that happened to me -"
        ]
        insert_pos = random.randint(1, len(sentences) - 2)
        anecdote = random.choice(anecdotes)
        sentences[insert_pos] = f"{anecdote} {sentences[insert_pos].lower()}"

    # Independently, each sentence has a ~30% chance of gaining a leading
    # opinion phrase ("I think, ..."), after which it is re-capitalized.
    for i in range(len(sentences)):
        if random.random() < 0.3:
            personal_phrase = random.choice(self.personal_phrases)
            sentences[i] = f"{personal_phrase}, {sentences[i].lower()}"
            sentences[i] = sentences[i][0].upper() + sentences[i][1:]

    return " ".join(sentences)
227
 
228
def add_casual_punctuation_advanced(self, text):
    """Make punctuation look informal: em dashes, ellipses, and asides.

    Fix: the em-dash replacement string contained the mojibake sequence
    "β€”" (a UTF-8 em dash mis-decoded through a legacy codec); it is
    restored here to a real U+2014 em dash.
    """
    # Join "word. Next" into "word — Next" for emphasis.
    # NOTE(review): this rewrites EVERY sentence boundary, which weakens
    # sent_tokenize's splitting below - confirm that is intended.
    text = re.sub(r'(\w+)\. ([A-Z])', r'\1 — \2', text)

    # ~40% of calls turn the first one or two remaining periods into "...".
    if random.random() < 0.4:
        text = re.sub(r'(\w+)\.', r'\1...', text, count=random.randint(1, 2))

    # ~30% of calls append one parenthetical aside to a non-initial sentence.
    sentences = sent_tokenize(text)
    if len(sentences) > 2 and random.random() < 0.3:
        asides = ["(trust me on this)", "(I know, I know)", "(bear with me)", "(you'll see why)"]
        insert_pos = random.randint(1, len(sentences) - 1)
        aside = random.choice(asides)
        sentences[insert_pos] += f" {aside}"

    return " ".join(sentences)
246
 
247
def add_natural_fillers_advanced(self, text):
    """Drop conversational fillers ("you know", "I mean", ...) into sentences."""
    sentences = sent_tokenize(text)

    for i in range(len(sentences)):
        # Each sentence independently has a ~40% chance of one filler.
        if random.random() < 0.4:
            filler = random.choice(self.natural_expressions)
            # Insert near the front (word position 1-3) so it reads like a
            # spoken aside; sentences of 4 words or fewer are left untouched.
            words = sentences[i].split()
            if len(words) > 4:
                insert_pos = random.randint(1, min(3, len(words) - 1))
                words.insert(insert_pos, f"{filler},")
                sentences[i] = " ".join(words)

    return " ".join(sentences)
262
 
263
def add_colloquialisms(self, text):
    """Swap stiff intensifier phrases for colloquial equivalents."""
    # Pattern -> candidate slang rewrites; one candidate is picked per
    # pattern and applied to every occurrence of that pattern.
    slang_map = {
        r'\bvery good\b': ["pretty great", "really solid", "super good"],
        r'\bvery bad\b': ["pretty awful", "really rough", "super bad"],
        r'\bvery important\b': ["super important", "really key", "pretty crucial"],
        r'\ba lot of\b': ["tons of", "loads of", "plenty of", "heaps of"],
        r'\bmany people\b': ["lots of folks", "tons of people", "loads of people"],
        r'\bquickly\b': ["fast", "in a flash", "super quick"],
        r'\bslowly\b': ["at a snail's pace", "pretty slow", "taking forever"]
    }

    for pattern, candidates in slang_map.items():
        if re.search(pattern, text, re.IGNORECASE):
            chosen = random.choice(candidates)
            text = re.sub(pattern, chosen, text, flags=re.IGNORECASE)

    return text
281
+
282
def clean_text_advanced(self, text):
    """Normalize whitespace, punctuation spacing, and sentence capitalization."""
    # Collapse any whitespace run to one space, then pull stray spaces back
    # off the front of punctuation ("word ," -> "word,").
    text = re.sub(r'\s+', ' ', text)
    text = re.sub(r'\s+([,.!?])', r'\1', text)

    # Upper-case the first letter after a sentence terminator, plus the very
    # start of the string / after ". ".
    def _capitalize(match):
        return match.group(1) + match.group(2).upper()

    text = re.sub(r'([.!?]\s+)([a-z])', _capitalize, text)
    text = re.sub(r'(^|\. )([a-z])', _capitalize, text)

    # Guarantee a capital first character even when no regex fired.
    if text and text[0].islower():
        text = text[0].upper() + text[1:]

    # Squash runs of terminal punctuation ("!!", "...") down to one mark.
    text = re.sub(r'([.!?]){2,}', r'\1', text)

    return text.strip()
300
 
301
  def get_readability_score(self, text):
 
311
  except Exception as e:
312
  return f"Could not calculate readability: {str(e)}"
313
 
314
+ def humanize_text(self, text, intensity="heavy"):
315
+ """Main method to humanize AI-generated text with maximum effectiveness"""
316
  if not text or not text.strip():
317
  return "Please provide text to humanize."
318
 
 
327
  except Exception as nltk_error:
328
  return f"NLTK Error: {str(nltk_error)}. Please try again or contact support."
329
 
330
+ # Apply aggressive humanization for 0% AI detection
331
  text = self.replace_ai_phrases(text)
332
  text = self.add_contractions(text)
333
+ text = self.add_colloquialisms(text)
334
 
335
  if intensity in ["medium", "heavy"]:
336
+ text = self.vary_sentence_structure_advanced(text)
337
+ text = self.add_personal_touches_advanced(text)
338
+ text = self.add_casual_punctuation_advanced(text)
339
+ text = self.add_natural_fillers_advanced(text)
340
 
341
  if intensity == "heavy":
342
+ text = self.add_human_imperfections(text)
343
+ # Apply multiple passes for maximum humanization
344
+ text = self.replace_ai_phrases(text) # Second pass
345
+ text = self.add_natural_fillers_advanced(text) # Second pass
346
 
347
+ return self.clean_text_advanced(text)
348
 
349
  except Exception as e:
350
  return f"Error processing text: {str(e)}\n\nOriginal text: {text}"
 
363
  except Exception as e:
364
  return f"Error: {str(e)}", "Processing error"
365
 
366
+ with gr.Blocks(title="AI Content Humanizer - 0% Detection", theme=gr.themes.Soft()) as interface:
367
+ gr.Markdown("""# 🤖➡️👤 Advanced AI Content Humanizer
368
+ **Achieve 0% AI Detection Score** - Transform AI content into completely human-sounding text!""")
369
+
370
+ with gr.Row():
371
+ with gr.Column():
372
+ input_text = gr.Textbox(
373
+ label="AI-generated Text",
374
+ lines=10,
375
+ placeholder="Paste your AI-generated text here for maximum humanization..."
376
+ )
377
+ intensity = gr.Radio(
378
+ ["light", "medium", "heavy"],
379
+ value="heavy",
380
+ label="Humanization Level",
381
+ info="Heavy mode recommended for 0% AI detection"
382
+ )
383
+ btn = gr.Button("🚀 Humanize for 0% AI Detection", variant="primary", size="lg")
384
+
385
+ with gr.Column():
386
+ output_text = gr.Textbox(
387
+ label="Humanized Text (0% AI Detection)",
388
+ lines=10,
389
+ show_copy_button=True
390
+ )
391
+ readability = gr.Textbox(label="Readability Score", lines=3)
392
 
393
+ gr.Markdown("""
394
+ ### 💡 Tips for 0% AI Detection:
395
+ - Use **Heavy** mode for maximum humanization
396
+ - The tool adds natural conversation patterns, personal touches, and human imperfections
397
+ - Removes all AI-flagged terms and phrases
398
+ - Test your output with multiple AI detectors for verification
399
+ """)
400
 
 
401
  btn.click(fn=process_text, inputs=[input_text, intensity], outputs=[output_text, readability])
402
  input_text.submit(fn=process_text, inputs=[input_text, intensity], outputs=[output_text, readability])
403
 
404
  return interface
405
 
406
# Script entry point: build the Gradio UI and serve it.
if __name__ == "__main__":
    print("Starting Advanced AI Content Humanizer for 0% Detection...")
    app = create_interface()
    # 0.0.0.0:7860 is the standard bind address/port for Hugging Face Spaces.
    app.launch(server_name="0.0.0.0", server_port=7860, show_error=True)