Spaces:

Jay-Rajput
/

AIDetector

Sleeping

App Files Files Community

Jay-Rajput committed on Sep 14

Commit

5234a81

1 Parent(s): 59f5880

fix detect

Browse files

Files changed (2) hide show

app.py +108 -31
test_detector.py +76 -0

app.py CHANGED Viewed

@@ -192,6 +192,16 @@ class AdvancedAITextDetector:
             starters = [s.split()[0].lower() for s in sentences if s.split()]
             starter_diversity = len(set(starters)) / len(starters) if starters else 0
             scores['starter_diversity'] = starter_diversity
         # 2. N-gram analysis
         words = text.lower().split()
@@ -210,6 +220,7 @@ class AdvancedAITextDetector:
         # 3. ChatGPT-specific patterns
         chatgpt_score = 0
         # Common ChatGPT phrases (weighted by specificity)
         high_confidence_phrases = [
@@ -229,6 +240,15 @@ class AdvancedAITextDetector:
             "in other words", "that being said", "that said"
         ]
         text_lower = text.lower()
         # Check high confidence phrases
@@ -241,6 +261,11 @@ class AdvancedAITextDetector:
             if phrase in text_lower:
                 chatgpt_score += 0.08
         # Check for structured lists (very common in ChatGPT)
         has_numbered = bool(re.search(r'\n\s*\d+[\.\)]\s', text))
         has_bullets = bool(re.search(r'\n\s*[-•*]\s', text))
@@ -253,13 +278,26 @@ class AdvancedAITextDetector:
         if has_colons:
             chatgpt_score += 0.10
-        # Formal tone indicators
         formal_words = ['utilize', 'implement', 'facilitate', 'enhance', 'optimize',
                        'comprehensive', 'significant', 'substantial', 'various', 'numerous']
         formal_count = sum(1 for word in formal_words if word in text_lower)
         chatgpt_score += min(formal_count * 0.05, 0.25)
         scores['chatgpt_patterns'] = min(chatgpt_score, 1.0)
         # 4. Complexity uniformity (AI has uniform complexity)
         if len(sentences) > 2:
@@ -283,15 +321,18 @@ class AdvancedAITextDetector:
             scores['paragraph_consistency'] = 1 - min(para_cv, 1.0)
         # Calculate final statistical score
-        # Weight the features based on their importance for ChatGPT detection
         weights = {
-            'chatgpt_patterns': 0.35,
-            'sent_length_std': -0.15,  # Lower std = more AI
-            'starter_diversity': -0.10,  # Lower diversity = more AI
-            'trigram_repetition': 0.15,
-            'bigram_diversity': -0.10,
-            'complexity_variance': -0.10,
-            'paragraph_consistency': 0.15
         }
         final_score = 0.5  # Start neutral
@@ -299,10 +340,19 @@ class AdvancedAITextDetector:
             if feature in weights:
                 weight = weights[feature]
                 if weight < 0:
-                    # Inverse relationship
                     final_score += abs(weight) * (1 - value)
                 else:
                     final_score += weight * value
         return min(max(final_score, 0), 1), scores
@@ -361,28 +411,33 @@ class AdvancedAITextDetector:
             # Weighted average
             final_score = sum(s * w for s, w in zip(all_scores, normalized_weights))
-            # Boost score if multiple models agree strongly
-            agreement_scores = [s for s in all_scores if s > 0.7 or s < 0.3]
             if len(agreement_scores) >= 2:
                 avg_agreement = np.mean(agreement_scores)
-                if avg_agreement > 0.7:
-                    final_score = min(final_score * 1.1, 0.95)
-                elif avg_agreement < 0.3:
-                    final_score = max(final_score * 0.9, 0.05)
         else:
             final_score = 0.5
-        # 4. Classification with better thresholds for ChatGPT
-        if final_score >= 0.70:
             classification = "AI-Generated (High Confidence)"
             confidence = "HIGH"
-        elif final_score >= 0.55:
             classification = "Likely AI-Generated"
             confidence = "MEDIUM-HIGH"
-        elif final_score >= 0.45:
             classification = "Uncertain"
             confidence = "LOW"
-        elif final_score >= 0.30:
             classification = "Likely Human-Written"
             confidence = "MEDIUM"
         else:
@@ -405,30 +460,30 @@ class AdvancedAITextDetector:
         """Create detailed explanation"""
         exp = []
-        # Overall assessment
-        if score >= 0.70:
             exp.append("🤖 STRONG AI INDICATORS: The text exhibits multiple characteristics typical of AI-generated content.")
-        elif score >= 0.55:
             exp.append("⚠️ PROBABLE AI: Several AI patterns detected, suggesting machine generation.")
-        elif score >= 0.45:
             exp.append("❓ INCONCLUSIVE: Mixed signals - could be AI-assisted or edited content.")
-        elif score >= 0.30:
             exp.append("✍️ PROBABLE HUMAN: More human-like characteristics than AI patterns.")
         else:
             exp.append("👤 STRONG HUMAN INDICATORS: Text shows natural human writing patterns.")
         # Model consensus
         if model_results:
-            high_ai = [name for name, s in model_results.items() if s > 0.65]
-            high_human = [name for name, s in model_results.items() if s < 0.35]
             if len(high_ai) >= 2:
                 exp.append(f"\n\n✓ Multiple models detect AI: {', '.join(high_ai)}")
             elif len(high_human) >= 2:
                 exp.append(f"\n\n✓ Multiple models detect human writing: {', '.join(high_human)}")
-        # Specific indicators
-        if stat_details.get('chatgpt_patterns', 0) > 0.5:
             exp.append("\n\n⚡ High density of ChatGPT-style phrases and structures detected")
         if stat_details.get('sent_length_std', 1) < 0.3:
@@ -436,6 +491,16 @@ class AdvancedAITextDetector:
         if stat_details.get('trigram_repetition', 0) > 0.1:
             exp.append("\n🔁 Repeated phrase patterns detected")
         return " ".join(exp)
@@ -493,6 +558,7 @@ def analyze_text(text):
         analysis = result['statistical_analysis']
         if 'chatgpt_patterns' in analysis:
             output += f"\n- **ChatGPT Pattern Score:** {analysis['chatgpt_patterns']:.2f}/1.00"
         if 'sent_length_std' in analysis:
@@ -501,6 +567,14 @@ def analyze_text(text):
             output += f"\n- **Phrase Repetition:** {analysis['trigram_repetition']:.3f}"
         if 'starter_diversity' in analysis:
             output += f"\n- **Sentence Starter Diversity:** {analysis['starter_diversity']:.3f}"
     # Visual representation
     ai_prob = result['ai_probability']
@@ -561,9 +635,12 @@ interface = gr.Interface(
         # ChatGPT example
         ["Artificial intelligence has revolutionized numerous industries in recent years. It's important to note that this technology offers both opportunities and challenges. Machine learning algorithms can process vast amounts of data, identify patterns, and make predictions with remarkable accuracy. Furthermore, AI applications span various domains including healthcare, finance, and transportation. However, it's crucial to consider the ethical implications. Issues such as bias in algorithms, job displacement, and privacy concerns require careful consideration. Additionally, the development of AI must be guided by responsible practices. In conclusion, while AI presents tremendous potential for innovation and progress, we must approach its implementation thoughtfully and ethically."],
-        # Human example
         ["So yesterday I'm at the coffee shop, right? And this guy next to me is having the LOUDEST phone conversation about his crypto investments. Like, dude, we get it, you bought Dogecoin. But here's the thing - he kept saying he was gonna be a millionaire by next week. Next week! I almost choked on my latte. The barista and I made eye contact and we both just tried not to laugh. I mean, good luck to him and all, but maybe don't count those chickens yet? Anyway, that's my coffee shop drama for the week. Still better than working from home where my cat judges me all day."],
         # Mixed/edited example
         ["The impact of social media on society has been profound. Studies show that people spend an average of 2.5 hours daily on social platforms. But honestly, I think it's probably way more than that - I know I'm constantly checking my phone! These platforms have transformed how we communicate, share information, and even how we see ourselves. There are definitely benefits, like staying connected with friends and family across distances. However, we're also seeing rises in anxiety and depression linked to social media use, especially among teenagers. It's a complex issue that deserves our attention."]
     ],

             starters = [s.split()[0].lower() for s in sentences if s.split()]
             starter_diversity = len(set(starters)) / len(starters) if starters else 0
             scores['starter_diversity'] = starter_diversity
+            # Human writing indicators - sentence length variety
+            short_sentences = sum(1 for length in sent_lengths if length < 8)
+            long_sentences = sum(1 for length in sent_lengths if length > 20)
+            scores['sentence_variety'] = (short_sentences + long_sentences) / len(sent_lengths)
+            # Conversational patterns (human indicators)
+            conversational_starters = ['so', 'well', 'actually', 'basically', 'like', 'you know', 'i mean', 'anyway']
+            conv_count = sum(1 for starter in starters if starter in conversational_starters)
+            scores['conversational_patterns'] = conv_count / len(starters) if starters else 0
         # 2. N-gram analysis
         words = text.lower().split()
         # 3. ChatGPT-specific patterns
         chatgpt_score = 0
+        human_score = 0
         # Common ChatGPT phrases (weighted by specificity)
         high_confidence_phrases = [
             "in other words", "that being said", "that said"
         ]
+        # Human writing indicators
+        human_indicators = [
+            "i think", "i feel", "i believe", "i guess", "i suppose",
+            "honestly", "frankly", "personally", "in my opinion",
+            "you know", "right", "like", "um", "uh", "well",
+            "actually", "basically", "literally", "totally", "really",
+            "so", "anyway", "btw", "lol", "haha", "omg"
+        ]
         text_lower = text.lower()
         # Check high confidence phrases
             if phrase in text_lower:
                 chatgpt_score += 0.08
+        # Check human indicators
+        for phrase in human_indicators:
+            if phrase in text_lower:
+                human_score += 0.1
         # Check for structured lists (very common in ChatGPT)
         has_numbered = bool(re.search(r'\n\s*\d+[\.\)]\s', text))
         has_bullets = bool(re.search(r'\n\s*[-•*]\s', text))
         if has_colons:
             chatgpt_score += 0.10
+        # Formal tone indicators (AI) vs informal (human)
         formal_words = ['utilize', 'implement', 'facilitate', 'enhance', 'optimize',
                        'comprehensive', 'significant', 'substantial', 'various', 'numerous']
+        informal_words = ['gonna', 'wanna', 'gotta', 'kinda', 'sorta', 'yeah', 'nah',
+                         'awesome', 'cool', 'sucks', 'crazy', 'insane', 'ridiculous']
         formal_count = sum(1 for word in formal_words if word in text_lower)
+        informal_count = sum(1 for word in informal_words if word in text_lower)
         chatgpt_score += min(formal_count * 0.05, 0.25)
+        human_score += min(informal_count * 0.08, 0.3)
+        # Contractions and casual language
+        contractions = ['don\'t', 'won\'t', 'can\'t', 'isn\'t', 'aren\'t', 'wasn\'t', 'weren\'t',
+                       'i\'m', 'you\'re', 'he\'s', 'she\'s', 'it\'s', 'we\'re', 'they\'re']
+        contraction_count = sum(1 for word in contractions if word in text_lower)
+        human_score += min(contraction_count * 0.05, 0.2)
         scores['chatgpt_patterns'] = min(chatgpt_score, 1.0)
+        scores['human_patterns'] = min(human_score, 1.0)
         # 4. Complexity uniformity (AI has uniform complexity)
         if len(sentences) > 2:
             scores['paragraph_consistency'] = 1 - min(para_cv, 1.0)
         # Calculate final statistical score
+        # Weight the features based on their importance for detection
         weights = {
+            'chatgpt_patterns': 0.25,      # AI patterns
+            'human_patterns': -0.20,       # Human patterns (negative weight)
+            'sent_length_std': -0.10,      # Lower std = more AI
+            'starter_diversity': -0.08,    # Lower diversity = more AI
+            'sentence_variety': -0.12,     # More variety = more human
+            'conversational_patterns': -0.15,  # More conversational = more human
+            'trigram_repetition': 0.10,    # More repetition = more AI
+            'bigram_diversity': -0.08,     # Lower diversity = more AI
+            'complexity_variance': -0.08,  # Lower variance = more AI
+            'paragraph_consistency': 0.10  # More consistency = more AI
         }
         final_score = 0.5  # Start neutral
             if feature in weights:
                 weight = weights[feature]
                 if weight < 0:
+                    # Inverse relationship - human indicators reduce AI score
                     final_score += abs(weight) * (1 - value)
                 else:
+                    # Direct relationship - AI indicators increase AI score
                     final_score += weight * value
+        # Apply confidence boost for strong human indicators
+        if scores.get('human_patterns', 0) > 0.3 and scores.get('conversational_patterns', 0) > 0.2:
+            final_score *= 0.7  # Reduce AI probability for strong human indicators
+        # Apply confidence boost for strong AI indicators
+        if scores.get('chatgpt_patterns', 0) > 0.4 and scores.get('paragraph_consistency', 0) > 0.7:
+            final_score = min(final_score * 1.2, 0.95)  # Increase AI probability
         return min(max(final_score, 0), 1), scores
             # Weighted average
             final_score = sum(s * w for s, w in zip(all_scores, normalized_weights))
+            # Apply model agreement boost with more conservative thresholds
+            agreement_scores = [s for s in all_scores if s > 0.75 or s < 0.25]
             if len(agreement_scores) >= 2:
                 avg_agreement = np.mean(agreement_scores)
+                if avg_agreement > 0.75:
+                    final_score = min(final_score * 1.05, 0.90)  # More conservative boost
+                elif avg_agreement < 0.25:
+                    final_score = max(final_score * 0.95, 0.10)  # More conservative reduction
+            # Additional human text protection - if statistical analysis strongly suggests human
+            if stat_score < 0.3 and len([s for s in all_scores if s < 0.4]) >= 2:
+                final_score = max(final_score * 0.8, 0.15)  # Strong protection for human text
         else:
             final_score = 0.5
+        # 4. Classification with improved thresholds to reduce false positives
+        if final_score >= 0.75:
             classification = "AI-Generated (High Confidence)"
             confidence = "HIGH"
+        elif final_score >= 0.60:
             classification = "Likely AI-Generated"
             confidence = "MEDIUM-HIGH"
+        elif final_score >= 0.40:
             classification = "Uncertain"
             confidence = "LOW"
+        elif final_score >= 0.25:
             classification = "Likely Human-Written"
             confidence = "MEDIUM"
         else:
         """Create detailed explanation"""
         exp = []
+        # Overall assessment with improved thresholds
+        if score >= 0.75:
             exp.append("🤖 STRONG AI INDICATORS: The text exhibits multiple characteristics typical of AI-generated content.")
+        elif score >= 0.60:
             exp.append("⚠️ PROBABLE AI: Several AI patterns detected, suggesting machine generation.")
+        elif score >= 0.40:
             exp.append("❓ INCONCLUSIVE: Mixed signals - could be AI-assisted or edited content.")
+        elif score >= 0.25:
             exp.append("✍️ PROBABLE HUMAN: More human-like characteristics than AI patterns.")
         else:
             exp.append("👤 STRONG HUMAN INDICATORS: Text shows natural human writing patterns.")
         # Model consensus
         if model_results:
+            high_ai = [name for name, s in model_results.items() if s > 0.70]
+            high_human = [name for name, s in model_results.items() if s < 0.30]
             if len(high_ai) >= 2:
                 exp.append(f"\n\n✓ Multiple models detect AI: {', '.join(high_ai)}")
             elif len(high_human) >= 2:
                 exp.append(f"\n\n✓ Multiple models detect human writing: {', '.join(high_human)}")
+        # AI-specific indicators
+        if stat_details.get('chatgpt_patterns', 0) > 0.4:
             exp.append("\n\n⚡ High density of ChatGPT-style phrases and structures detected")
         if stat_details.get('sent_length_std', 1) < 0.3:
         if stat_details.get('trigram_repetition', 0) > 0.1:
             exp.append("\n🔁 Repeated phrase patterns detected")
+        # Human-specific indicators
+        if stat_details.get('human_patterns', 0) > 0.3:
+            exp.append("\n\n💬 Strong human conversational patterns detected")
+        if stat_details.get('conversational_patterns', 0) > 0.2:
+            exp.append("\n🗣️ Conversational language and casual expressions found")
+        if stat_details.get('sentence_variety', 0) > 0.4:
+            exp.append("\n📝 Natural sentence length variation (human characteristic)")
         return " ".join(exp)
         analysis = result['statistical_analysis']
+        # AI indicators
         if 'chatgpt_patterns' in analysis:
             output += f"\n- **ChatGPT Pattern Score:** {analysis['chatgpt_patterns']:.2f}/1.00"
         if 'sent_length_std' in analysis:
             output += f"\n- **Phrase Repetition:** {analysis['trigram_repetition']:.3f}"
         if 'starter_diversity' in analysis:
             output += f"\n- **Sentence Starter Diversity:** {analysis['starter_diversity']:.3f}"
+        # Human indicators
+        if 'human_patterns' in analysis:
+            output += f"\n- **Human Pattern Score:** {analysis['human_patterns']:.2f}/1.00"
+        if 'conversational_patterns' in analysis:
+            output += f"\n- **Conversational Patterns:** {analysis['conversational_patterns']:.3f}"
+        if 'sentence_variety' in analysis:
+            output += f"\n- **Sentence Variety:** {analysis['sentence_variety']:.3f} (higher = more human-like)"
     # Visual representation
     ai_prob = result['ai_probability']
         # ChatGPT example
         ["Artificial intelligence has revolutionized numerous industries in recent years. It's important to note that this technology offers both opportunities and challenges. Machine learning algorithms can process vast amounts of data, identify patterns, and make predictions with remarkable accuracy. Furthermore, AI applications span various domains including healthcare, finance, and transportation. However, it's crucial to consider the ethical implications. Issues such as bias in algorithms, job displacement, and privacy concerns require careful consideration. Additionally, the development of AI must be guided by responsible practices. In conclusion, while AI presents tremendous potential for innovation and progress, we must approach its implementation thoughtfully and ethically."],
+        # Human example - conversational
         ["So yesterday I'm at the coffee shop, right? And this guy next to me is having the LOUDEST phone conversation about his crypto investments. Like, dude, we get it, you bought Dogecoin. But here's the thing - he kept saying he was gonna be a millionaire by next week. Next week! I almost choked on my latte. The barista and I made eye contact and we both just tried not to laugh. I mean, good luck to him and all, but maybe don't count those chickens yet? Anyway, that's my coffee shop drama for the week. Still better than working from home where my cat judges me all day."],
+        # Human example - personal reflection
+        ["I've been thinking about this whole social media thing lately. You know, I used to post everything - what I ate for breakfast, random thoughts, selfies. But now I'm kinda over it? Like, I still check Instagram and stuff, but I don't feel the need to share every little thing anymore. Maybe I'm getting old, or maybe I just realized that most people don't actually care about my lunch. It's weird how we went from sharing everything to being more private. I think it's actually healthier this way, but I miss the old days sometimes when social media felt more fun and less performative."],
         # Mixed/edited example
         ["The impact of social media on society has been profound. Studies show that people spend an average of 2.5 hours daily on social platforms. But honestly, I think it's probably way more than that - I know I'm constantly checking my phone! These platforms have transformed how we communicate, share information, and even how we see ourselves. There are definitely benefits, like staying connected with friends and family across distances. However, we're also seeing rises in anxiety and depression linked to social media use, especially among teenagers. It's a complex issue that deserves our attention."]
     ],

test_detector.py ADDED Viewed

	@@ -0,0 +1,76 @@

+#!/usr/bin/env python3
+"""
+Test script for the improved AI text detector
+"""
+import sys
+import os
+sys.path.append(os.path.dirname(os.path.abspath(__file__)))
+from app import AdvancedAITextDetector
+def test_detector():  # Runs four labelled samples through detector.detect() and prints a report; nothing is asserted or returned
+    """Test the detector with various text samples"""
+    print("Initializing detector...")
+    detector = AdvancedAITextDetector()  # NOTE(review): constructor presumably loads the detection models — confirm in app.py
+    # Test cases: each entry has a display "name", the sample "text", and the
+    # "expected" label ("human" or "ai") that the verdict below is checked against
+    test_cases = [
+        {
+            "name": "Human - Conversational",
+            "text": "So yesterday I'm at the coffee shop, right? And this guy next to me is having the LOUDEST phone conversation about his crypto investments. Like, dude, we get it, you bought Dogecoin. But here's the thing - he kept saying he was gonna be a millionaire by next week. Next week! I almost choked on my latte.",
+            "expected": "human"
+        },
+        {
+            "name": "AI - ChatGPT Style",
+            "text": "Artificial intelligence has revolutionized numerous industries in recent years. It's important to note that this technology offers both opportunities and challenges. Machine learning algorithms can process vast amounts of data, identify patterns, and make predictions with remarkable accuracy. Furthermore, AI applications span various domains including healthcare, finance, and transportation.",
+            "expected": "ai"
+        },
+        {
+            "name": "Human - Personal Reflection",
+            "text": "I've been thinking about this whole social media thing lately. You know, I used to post everything - what I ate for breakfast, random thoughts, selfies. But now I'm kinda over it? Like, I still check Instagram and stuff, but I don't feel the need to share every little thing anymore.",
+            "expected": "human"
+        },
+        {
+            "name": "AI - Formal Academic",
+            "text": "The implementation of machine learning algorithms requires careful consideration of various factors. It is essential to understand that these systems must be designed with robust error handling mechanisms. Additionally, the development process should incorporate comprehensive testing protocols to ensure optimal performance.",
+            "expected": "ai"
+        }
+    ]
+    print("\n" + "="*80)
+    print("TESTING IMPROVED AI TEXT DETECTOR")
+    print("="*80)
+    for i, test_case in enumerate(test_cases, 1):  # number the samples from 1 for the printed report
+        print(f"\n{i}. {test_case['name']}")
+        print("-" * 50)
+        result = detector.detect(test_case['text'])  # result is read below via 'ai_probability', 'classification', 'confidence'
+        print(f"AI Probability: {result['ai_probability']}%")
+        print(f"Classification: {result['classification']}")
+        print(f"Confidence: {result['confidence']}")
+        # Check if result matches expectation: "human" samples pass below 40,
+        # "ai" samples pass above 60; the outcome is only printed, never asserted
+        ai_prob = result['ai_probability']  # NOTE(review): presumably a 0-100 percentage (printed with '%' above) — confirm against detect()
+        if test_case['expected'] == 'human' and ai_prob < 40:
+            print("✅ CORRECT - Human text correctly identified")
+        elif test_case['expected'] == 'ai' and ai_prob > 60:
+            print("✅ CORRECT - AI text correctly identified")
+        else:  # also reached for any score from 40 to 60 inclusive, whatever the expected label
+            print("❌ INCORRECT - Misclassification detected")
+        # Show key indicators from the statistical analysis; a missing indicator prints as 0.00
+        if 'statistical_analysis' in result:  # the key is treated as optional in the result
+            stats = result['statistical_analysis']
+            print(f"Human Patterns: {stats.get('human_patterns', 0):.2f}")
+            print(f"ChatGPT Patterns: {stats.get('chatgpt_patterns', 0):.2f}")
+            print(f"Conversational: {stats.get('conversational_patterns', 0):.2f}")
+    print("\n" + "="*80)
+    print("TEST COMPLETE")
+    print("="*80)
+if __name__ == "__main__":  # run the report only when executed as a script, not when imported
+    test_detector()