Spaces:

conversantech
/

humanizer-ai

Running

App Files Files Community

conversantech commited on Jun 25

Commit

f974a84

verified ·

1 Parent(s): 2958018

Create app.py

Browse files

Files changed (1) hide show

app.py +354 -0

app.py ADDED Viewed

	@@ -0,0 +1,354 @@

+import gradio as gr
+import random
+import re
+import nltk
+from nltk.tokenize import sent_tokenize, word_tokenize
+from nltk.corpus import stopwords
+from nltk.tag import pos_tag
+import string
+from textstat import flesch_reading_ease, flesch_kincaid_grade
+import spacy
+from transformers import pipeline, AutoTokenizer, AutoModelForSequenceClassification
+import torch
+# Download required NLTK data
+try:
+    nltk.download('punkt', quiet=True)
+    nltk.download('averaged_perceptron_tagger', quiet=True)
+    nltk.download('stopwords', quiet=True)
+    nltk.download('wordnet', quiet=True)
+except:
+    pass
+class AIContentHumanizer:
+    def __init__(self):
+        self.setup_models()
+        self.setup_humanization_patterns()
+    def setup_models(self):
+        """Initialize AI detection and paraphrasing models"""
+        try:
+            # Load spaCy model
+            self.nlp = spacy.load("en_core_web_sm")
+        except:
+            # Fallback if spaCy model not available
+            self.nlp = None
+        # Paraphrasing patterns and synonyms
+        self.synonyms = {
+            'however': ['but', 'yet', 'though', 'nevertheless', 'still'],
+            'therefore': ['so', 'thus', 'hence', 'as a result', 'consequently'],
+            'furthermore': ['also', 'moreover', 'additionally', 'besides', 'plus'],
+            'nevertheless': ['however', 'yet', 'still', 'but', 'though'],
+            'consequently': ['therefore', 'so', 'thus', 'as a result', 'hence'],
+            'significant': ['important', 'major', 'notable', 'considerable', 'substantial'],
+            'utilize': ['use', 'employ', 'apply', 'make use of', 'take advantage of'],
+            'demonstrate': ['show', 'prove', 'display', 'exhibit', 'reveal'],
+            'numerous': ['many', 'several', 'various', 'countless', 'multiple'],
+            'substantial': ['significant', 'considerable', 'large', 'major', 'important']
+        }
+    def setup_humanization_patterns(self):
+        """Setup patterns for humanizing text"""
+        self.ai_phrases = [
+            r'\b(it is important to note that|it should be noted that|it is worth noting that)\b',
+            r'\b(in conclusion|to conclude|in summary|to summarize)\b',
+            r'\b(furthermore|moreover|additionally|in addition)\b',
+            r'\b(however|nevertheless|nonetheless|on the other hand)\b',
+            r'\b(therefore|consequently|as a result|thus)\b',
+            r'\b(various|numerous|several|multiple)\b',
+            r'\b(significant|substantial|considerable|notable)\b',
+            r'\b(utilize|implement|demonstrate|facilitate)\b'
+        ]
+        self.human_replacements = {
+            'it is important to note that': ['worth mentioning', 'notably', 'interestingly'],
+            'it should be noted that': ['keep in mind', 'remember', 'note that'],
+            'furthermore': ['also', 'plus', 'what\'s more', 'on top of that'],
+            'moreover': ['also', 'besides', 'what\'s more', 'and'],
+            'however': ['but', 'though', 'yet', 'still'],
+            'therefore': ['so', 'that\'s why', 'which means'],
+            'consequently': ['so', 'as a result', 'that\'s why'],
+            'numerous': ['many', 'lots of', 'plenty of', 'tons of'],
+            'significant': ['big', 'major', 'important', 'key'],
+            'utilize': ['use', 'make use of', 'work with'],
+            'demonstrate': ['show', 'prove', 'make clear'],
+            'facilitate': ['help', 'make easier', 'enable']
+        }
+        self.contraction_map = {
+            'it is': 'it\'s', 'that is': 'that\'s', 'there is': 'there\'s',
+            'we are': 'we\'re', 'they are': 'they\'re', 'you are': 'you\'re',
+            'i am': 'I\'m', 'he is': 'he\'s', 'she is': 'she\'s',
+            'will not': 'won\'t', 'cannot': 'can\'t', 'do not': 'don\'t',
+            'does not': 'doesn\'t', 'did not': 'didn\'t', 'have not': 'haven\'t',
+            'has not': 'hasn\'t', 'had not': 'hadn\'t', 'would not': 'wouldn\'t',
+            'should not': 'shouldn\'t', 'could not': 'couldn\'t'
+        }
+    def add_human_errors(self, text):
+        """Add subtle human-like imperfections"""
+        sentences = sent_tokenize(text)
+        humanized_sentences = []
+        for sentence in sentences:
+            # Occasionally add filler words
+            if random.random() < 0.3:
+                fillers = ['actually', 'basically', 'really', 'pretty much', 'kind of', 'sort of']
+                filler = random.choice(fillers)
+                words = sentence.split()
+                if len(words) > 3:
+                    insert_pos = random.randint(1, min(3, len(words)-1))
+                    words.insert(insert_pos, filler)
+                    sentence = ' '.join(words)
+            # Occasionally use more casual phrasing
+            if random.random() < 0.2:
+                sentence = sentence.replace(' and ', ' & ')
+            humanized_sentences.append(sentence)
+        return ' '.join(humanized_sentences)
+    def vary_sentence_structure(self, text):
+        """Vary sentence structures to appear more human"""
+        sentences = sent_tokenize(text)
+        varied_sentences = []
+        for i, sentence in enumerate(sentences):
+            # Randomly combine short sentences
+            if i < len(sentences) - 1 and len(sentence.split()) < 8 and len(sentences[i+1].split()) < 8:
+                if random.random() < 0.4:
+                    connectors = [' and ', ', ', ' - ', ' but ']
+                    connector = random.choice(connectors)
+                    combined = sentence.rstrip('.') + connector + sentences[i+1].lower()
+                    varied_sentences.append(combined)
+                    sentences[i+1] = ""  # Skip next sentence
+                    continue
+            if sentence:  # Only add non-empty sentences
+                varied_sentences.append(sentence)
+        return ' '.join(varied_sentences)
+    def replace_formal_words(self, text):
+        """Replace formal words with casual alternatives"""
+        for formal, casual_options in self.human_replacements.items():
+            if formal in text.lower():
+                replacement = random.choice(casual_options)
+                text = re.sub(r'\b' + re.escape(formal) + r'\b', replacement, text, flags=re.IGNORECASE)
+        return text
+    def add_contractions(self, text):
+        """Add contractions to make text more conversational"""
+        for full_form, contraction in self.contraction_map.items():
+            text = re.sub(r'\b' + re.escape(full_form) + r'\b', contraction, text, flags=re.IGNORECASE)
+        return text
+    def adjust_punctuation(self, text):
+        """Adjust punctuation for more natural flow"""
+        # Replace some periods with commas for flow
+        sentences = sent_tokenize(text)
+        if len(sentences) > 2:
+            # Occasionally use semicolons
+            if random.random() < 0.3:
+                idx = random.randint(0, len(sentences)-2)
+                if len(sentences[idx].split()) > 6:
+                    sentences[idx] = sentences[idx].rstrip('.') + ';'
+                    sentences[idx+1] = sentences[idx+1][0].lower() + sentences[idx+1][1:]
+        return ' '.join(sentences)
+    def add_personal_touches(self, text):
+        """Add personal touches and opinions"""
+        personal_phrases = [
+            "I think", "In my opinion", "From what I've seen", "Personally,",
+            "I believe", "It seems to me", "From my experience"
+        ]
+        sentences = sent_tokenize(text)
+        if len(sentences) > 1 and random.random() < 0.4:
+            # Add personal phrase to a random sentence
+            idx = random.randint(0, len(sentences)-1)
+            personal_phrase = random.choice(personal_phrases)
+            sentences[idx] = personal_phrase + " " + sentences[idx].lower()
+        return ' '.join(sentences)
+    def paraphrase_with_synonyms(self, text):
+        """Replace words with synonyms"""
+        words = word_tokenize(text)
+        new_words = []
+        for word in words:
+            lower_word = word.lower()
+            if lower_word in self.synonyms and random.random() < 0.3:
+                synonym = random.choice(self.synonyms[lower_word])
+                new_words.append(synonym)
+            else:
+                new_words.append(word)
+        return ' '.join(new_words)
+    def humanize_text(self, text, intensity="medium"):
+        """Main humanization function"""
+        if not text or not text.strip():
+            return "Please provide text to humanize."
+        # Clean input
+        text = text.strip()
+        # Apply humanization techniques based on intensity
+        if intensity == "light":
+            text = self.add_contractions(text)
+            text = self.replace_formal_words(text)
+        elif intensity == "medium":
+            text = self.replace_formal_words(text)
+            text = self.add_contractions(text)
+            text = self.paraphrase_with_synonyms(text)
+            text = self.vary_sentence_structure(text)
+        else:  # heavy
+            text = self.replace_formal_words(text)
+            text = self.add_contractions(text)
+            text = self.paraphrase_with_synonyms(text)
+            text = self.vary_sentence_structure(text)
+            text = self.add_human_errors(text)
+            text = self.adjust_punctuation(text)
+            text = self.add_personal_touches(text)
+        return text
+    def get_readability_score(self, text):
+        """Calculate readability metrics"""
+        try:
+            flesch_score = flesch_reading_ease(text)
+            fk_grade = flesch_kincaid_grade(text)
+            if flesch_score >= 90:
+                level = "Very Easy"
+            elif flesch_score >= 80:
+                level = "Easy"
+            elif flesch_score >= 70:
+                level = "Fairly Easy"
+            elif flesch_score >= 60:
+                level = "Standard"
+            elif flesch_score >= 50:
+                level = "Fairly Difficult"
+            elif flesch_score >= 30:
+                level = "Difficult"
+            else:
+                level = "Very Difficult"
+            return f"Flesch Score: {flesch_score:.1f} ({level})\nGrade Level: {fk_grade:.1f}"
+        except:
+            return "Could not calculate readability"
+def create_interface():
+    humanizer = AIContentHumanizer()
+    def process_text(input_text, intensity):
+        if not input_text:
+            return "Please enter some text to humanize.", ""
+        humanized = humanizer.humanize_text(input_text, intensity)
+        readability = humanizer.get_readability_score(humanized)
+        return humanized, readability
+    # Custom CSS for better UI
+    css = """
+    .gradio-container {
+        font-family: 'Inter', sans-serif;
+    }
+    .main-header {
+        text-align: center;
+        margin-bottom: 30px;
+    }
+    .feature-box {
+        border: 1px solid #e1e5e9;
+        border-radius: 8px;
+        padding: 15px;
+        margin: 10px 0;
+        background: #f8f9fa;
+    }
+    """
+    with gr.Blocks(css=css, title="AI Content Humanizer") as interface:
+        gr.HTML("""
+        <div class="main-header">
+            <h1>🤖➡️👤 AI Content Humanizer</h1>
+            <p>Transform AI-generated content into natural, human-like text</p>
+        </div>
+        """)
+        with gr.Row():
+            with gr.Column(scale=2):
+                input_text = gr.Textbox(
+                    label="📝 Enter AI-generated text",
+                    placeholder="Paste your AI-generated content here...",
+                    lines=10,
+                    max_lines=20
+                )
+                intensity = gr.Radio(
+                    choices=["light", "medium", "heavy"],
+                    value="medium",
+                    label="🎛️ Humanization Intensity",
+                    info="Light: Basic changes | Medium: Moderate restructuring | Heavy: Extensive humanization"
+                )
+                humanize_btn = gr.Button("✨ Humanize Text", variant="primary", size="lg")
+            with gr.Column(scale=2):
+                output_text = gr.Textbox(
+                    label="✅ Humanized Text",
+                    lines=10,
+                    max_lines=20,
+                    interactive=False
+                )
+                readability_info = gr.Textbox(
+                    label="📊 Readability Analysis",
+                    lines=3,
+                    interactive=False
+                )
+        gr.HTML("""
+        <div class="feature-box">
+            <h3>🎯 Features:</h3>
+            <ul>
+                <li><strong>Smart Paraphrasing:</strong> Replaces formal AI language with natural expressions</li>
+                <li><strong>Sentence Restructuring:</strong> Varies sentence patterns for human-like flow</li>
+                <li><strong>Casual Contractions:</strong> Adds natural contractions and informal language</li>
+                <li><strong>Personal Touch:</strong> Incorporates personal opinions and experiences</li>
+                <li><strong>Readability Analysis:</strong> Provides readability scores and grade levels</li>
+            </ul>
+        </div>
+        """)
+        # Example texts
+        examples = [
+            ["Artificial intelligence has numerous applications in various industries. It is important to note that AI can significantly enhance productivity and efficiency. Furthermore, machine learning algorithms can process vast amounts of data to generate valuable insights.", "medium"],
+            ["The implementation of sustainable practices is crucial for environmental conservation. Organizations must utilize innovative technologies to facilitate eco-friendly operations. Moreover, it is essential to demonstrate commitment to reducing carbon footprint.", "heavy"],
+            ["In conclusion, the research demonstrates that renewable energy sources are becoming increasingly viable. Therefore, governments should implement policies that promote clean energy adoption. It is worth noting that this transition requires substantial investment.", "light"]
+        ]
+        gr.Examples(
+            examples=examples,
+            inputs=[input_text, intensity],
+            label="📚 Try these examples:"
+        )
+        humanize_btn.click(
+            fn=process_text,
+            inputs=[input_text, intensity],
+            outputs=[output_text, readability_info]
+        )
+    return interface
+if __name__ == "__main__":
+    interface = create_interface()
+    interface.launch()