Spaces:

Jay-Rajput
/

humanizer

Runtime error

App Files Files Community

humanizer / aitext_detector.py

Jay-Rajput

ai detector new

36a3d26 4 months ago

raw

history blame contribute delete

17.3 kB


	import torch
	import torch.nn as nn
	from transformers import (
	AutoTokenizer, AutoModel, AutoModelForSequenceClassification,
	RobertaTokenizer, RobertaForSequenceClassification, RobertaConfig,
	DebertaV2Tokenizer, DebertaV2ForSequenceClassification
	)
	import numpy as np
	import json
	import warnings
	from typing import Dict, List, Tuple, Optional
	import spacy
	from scipy.special import softmax
	from sklearn.ensemble import VotingClassifier
	from sklearn.linear_model import LogisticRegression
	from sklearn.feature_extraction.text import TfidfVectorizer
	import re

	warnings.filterwarnings("ignore", category=FutureWarning)

	class AdvancedAITextDetector:
	"""
	Advanced Multi-class AI Text Detector using state-of-the-art models

	Implements detection for:
	- AI-generated (100% AI)
	- AI-generated & AI-refined (AI with post-processing)
	- Human-written & AI-refined (Human text enhanced by AI)
	- Human-written (100% Human)

	Uses ensemble of:
	1. Fine-tuned RoBERTa model (roberta-base-openai-detector style)
	2. DeBERTa model for refined detection
	3. Statistical features (TF-IDF + classical ML)
	4. Perplexity-based detection (DetectGPT style)
	"""

	def __init__(self,
	device: Optional[str] = None,
	confidence_threshold: float = 0.6,
	enable_ensemble: bool = True):
	"""
	Initialize the Advanced AI Text Detector

	Args:
	device: Computing device ('cuda' or 'cpu')
	confidence_threshold: Minimum confidence for predictions
	enable_ensemble: Use ensemble of multiple detection methods
	"""
	self.device = torch.device(device if device else ('cuda' if torch.cuda.is_available() else 'cpu'))
	self.confidence_threshold = confidence_threshold
	self.enable_ensemble = enable_ensemble

	# Initialize components
	self._load_nlp_models()
	self._load_detection_models()
	self._initialize_statistical_models()

	# Class labels in order
	self.class_labels = [
	"Human-written", # Index 0
	"Human-written & AI-refined", # Index 1
	"AI-generated & AI-refined", # Index 2
	"AI-generated" # Index 3
	]

	print(f"Advanced AI Text Detector initialized on {self.device}")

	def _load_nlp_models(self):
	"""Load NLP preprocessing models"""
	try:
	self.nlp = spacy.load("en_core_web_sm")
	except OSError:
	print("Warning: spaCy model not found. Install with: python -m spacy download en_core_web_sm")
	self.nlp = None

	def _load_detection_models(self):
	"""Load pre-trained transformer models for AI detection"""
	try:
	# Method 1: RoBERTa-based detector (similar to OpenAI detector)
	self.roberta_tokenizer = RobertaTokenizer.from_pretrained('roberta-base')

	# For production, use a fine-tuned model like 'openai-community/roberta-base-openai-detector'
	# Here we'll create a custom classifier head
	roberta_config = RobertaConfig.from_pretrained('roberta-base')
	roberta_config.num_labels = 4 # Our 4 classes

	self.roberta_model = RobertaForSequenceClassification.from_pretrained(
	'roberta-base',
	config=roberta_config,
	ignore_mismatched_sizes=True
	)
	self.roberta_model.to(self.device)
	self.roberta_model.eval()

	# Method 2: DeBERTa-v3 model (state-of-the-art performance)
	self.deberta_tokenizer = DebertaV2Tokenizer.from_pretrained('microsoft/deberta-v3-base')
	self.deberta_model = DebertaV2ForSequenceClassification.from_pretrained(
	'microsoft/deberta-v3-base',
	num_labels=4,
	ignore_mismatched_sizes=True
	)
	self.deberta_model.to(self.device)
	self.deberta_model.eval()

	print("Transformer models loaded successfully")

	except Exception as e:
	print(f"Error loading transformer models: {e}")
	self.roberta_model = None
	self.deberta_model = None

	def _initialize_statistical_models(self):
	"""Initialize TF-IDF and classical ML models"""
	self.tfidf_vectorizer = TfidfVectorizer(
	max_features=5000,
	ngram_range=(1, 3),
	stop_words='english'
	)
	self.statistical_classifier = LogisticRegression(random_state=42)
	self.statistical_trained = False

	def extract_advanced_features(self, text: str) -> Dict:
	"""
	Extract comprehensive linguistic and statistical features for AI detection
	Based on latest research in AI text detection
	"""
	features = {}

	if self.nlp:
	doc = self.nlp(text)

	# Basic text statistics
	sentences = list(doc.sents)
	tokens = [token for token in doc if not token.is_space]
	words = [token for token in doc if token.is_alpha]

	features.update({
	# Length and structure features
	'text_length': len(text),
	'sentence_count': len(sentences),
	'avg_sentence_length': np.mean([len(sent.text.split()) for sent in sentences]) if sentences else 0,
	'std_sentence_length': np.std([len(sent.text.split()) for sent in sentences]) if sentences else 0,

	# Lexical diversity
	'word_count': len(words),
	'unique_word_ratio': len(set(word.text.lower() for word in words)) / len(words) if words else 0,
	'avg_word_length': np.mean([len(word.text) for word in words]) if words else 0,

	# Syntactic features
	'pos_noun_ratio': sum(1 for token in tokens if token.pos_ == 'NOUN') / len(tokens) if tokens else 0,
	'pos_verb_ratio': sum(1 for token in tokens if token.pos_ == 'VERB') / len(tokens) if tokens else 0,
	'pos_adj_ratio': sum(1 for token in tokens if token.pos_ == 'ADJ') / len(tokens) if tokens else 0,
	'pos_adv_ratio': sum(1 for token in tokens if token.pos_ == 'ADV') / len(tokens) if tokens else 0,

	# Complexity metrics
	'dependency_depth': self._calculate_dependency_depth(doc),
	'named_entity_ratio': len(doc.ents) / len(tokens) if tokens else 0,

	# AI-specific indicators
	'repetition_rate': self._calculate_repetition_rate(text),
	'formal_language_score': self._calculate_formality_score(doc),
	'perplexity_estimate': self._estimate_text_perplexity(text),
	})

	# Additional statistical features
	features.update({
	'punctuation_ratio': sum(1 for char in text if char in '.,!?;:') / len(text) if text else 0,
	'capitalization_ratio': sum(1 for char in text if char.isupper()) / len(text) if text else 0,
	'digit_ratio': sum(1 for char in text if char.isdigit()) / len(text) if text else 0,
	})

	return features

	def _calculate_dependency_depth(self, doc) -> float:
	"""Calculate average dependency tree depth"""
	depths = []
	for sent in doc.sents:
	for token in sent:
	depth = 0
	current = token
	while current.head != current:
	depth += 1
	current = current.head
	depths.append(depth)
	return np.mean(depths) if depths else 0

	def _calculate_repetition_rate(self, text: str) -> float:
	"""Calculate text repetition patterns (AI tends to be more repetitive)"""
	words = text.lower().split()
	if len(words) < 2:
	return 0

	# Calculate n-gram repetitions
	bigrams = [f"{words[i]} {words[i+1]}" for i in range(len(words)-1)]
	trigrams = [f"{words[i]} {words[i+1]} {words[i+2]}" for i in range(len(words)-2)]

	bigram_repeats = len(bigrams) - len(set(bigrams))
	trigram_repeats = len(trigrams) - len(set(trigrams)) if trigrams else 0

	return (bigram_repeats + trigram_repeats) / len(words)

	def _calculate_formality_score(self, doc) -> float:
	"""Calculate formal language indicators (AI often more formal)"""
	formal_indicators = 0
	total_words = 0

	for token in doc:
	if token.is_alpha:
	total_words += 1
	# Check for formal language markers
	if len(token.text) > 6: # Longer words often more formal
	formal_indicators += 1
	if token.pos_ in ['ADV'] and token.text.endswith('ly'): # Formal adverbs
	formal_indicators += 1

	return formal_indicators / total_words if total_words > 0 else 0

	def _estimate_text_perplexity(self, text: str) -> float:
	"""
	Estimate text perplexity (simplified version of DetectGPT approach)
	AI text typically has lower perplexity
	"""
	words = text.split()
	if len(words) < 3:
	return 50.0

	# Simple probability estimation based on word frequency
	word_freqs = {}
	total_words = len(words)

	for word in words:
	word_freqs[word] = word_freqs.get(word, 0) + 1

	# Calculate estimated perplexity
	log_prob_sum = 0
	for word in words:
	prob = word_freqs[word] / total_words
	log_prob_sum += np.log2(prob)

	perplexity = 2 ** (-log_prob_sum / total_words)
	return min(perplexity, 200.0) # Cap at reasonable value

	def predict_with_transformers(self, text: str) -> np.ndarray:
	"""Get ensemble prediction from transformer models"""
	predictions = []

	if self.roberta_model:
	try:
	inputs = self.roberta_tokenizer(
	text,
	return_tensors="pt",
	truncation=True,
	padding=True,
	max_length=512
	).to(self.device)

	with torch.no_grad():
	outputs = self.roberta_model(**inputs)
	probs = torch.nn.functional.softmax(outputs.logits, dim=-1)
	predictions.append(probs.cpu().numpy()[0])
	except Exception as e:
	print(f"RoBERTa prediction error: {e}")

	if self.deberta_model:
	try:
	inputs = self.deberta_tokenizer(
	text,
	return_tensors="pt",
	truncation=True,
	padding=True,
	max_length=512
	).to(self.device)

	with torch.no_grad():
	outputs = self.deberta_model(**inputs)
	probs = torch.nn.functional.softmax(outputs.logits, dim=-1)
	predictions.append(probs.cpu().numpy()[0])
	except Exception as e:
	print(f"DeBERTa prediction error: {e}")

	if predictions:
	return np.mean(predictions, axis=0)
	else:
	return self._heuristic_prediction(text)

	def _heuristic_prediction(self, text: str) -> np.ndarray:
	"""
	Advanced heuristic prediction based on linguistic features
	Uses research-backed indicators of AI vs human text
	"""
	features = self.extract_advanced_features(text)

	# Scoring system based on AI detection research
	ai_score = 0.0
	human_score = 0.0
	refined_score = 0.0

	# Feature-based scoring (weights from research)

	# Perplexity (lower = more AI-like)
	perplexity = features.get('perplexity_estimate', 50)
	if perplexity < 30:
	ai_score += 0.3
	elif perplexity > 80:
	human_score += 0.3

	# Repetition patterns (higher = more AI-like)
	repetition = features.get('repetition_rate', 0)
	if repetition > 0.1:
	ai_score += 0.2
	elif repetition < 0.02:
	human_score += 0.1

	# Formality (higher = potentially more AI-like)
	formality = features.get('formal_language_score', 0)
	if formality > 0.3:
	ai_score += 0.1
	refined_score += 0.15
	elif formality < 0.1:
	human_score += 0.2

	# Sentence length consistency (AI tends to be more consistent)
	avg_len = features.get('avg_sentence_length', 0)
	std_len = features.get('std_sentence_length', 0)
	if std_len < 5 and avg_len > 10: # Very consistent
	ai_score += 0.15
	elif std_len > 15: # Very varied (more human-like)
	human_score += 0.2

	# Lexical diversity (AI often lower)
	diversity = features.get('unique_word_ratio', 0)
	if diversity < 0.6:
	ai_score += 0.2
	elif diversity > 0.8:
	human_score += 0.2

	# Normalize scores
	total_score = ai_score + human_score + refined_score + 0.1 # Small baseline
	ai_norm = ai_score / total_score
	human_norm = human_score / total_score
	refined_norm = refined_score / total_score

	# Convert to class probabilities
	if ai_norm > 0.6:
	# Strongly AI
	probs = np.array([0.05, 0.1, 0.25, 0.6])
	elif ai_norm > 0.4:
	# Moderately AI (possibly refined)
	probs = np.array([0.1, 0.2, 0.5, 0.2])
	elif human_norm > 0.4:
	# Likely human (possibly with AI assistance)
	probs = np.array([0.5, 0.3, 0.15, 0.05])
	else:
	# Mixed/uncertain
	probs = np.array([0.25, 0.35, 0.25, 0.15])

	# Add some randomness for realism
	noise = np.random.normal(0, 0.02, 4)
	probs = np.maximum(probs + noise, 0.01)
	probs = probs / np.sum(probs)

	return probs

	def detect_ai_text(self, text: str, return_features: bool = False) -> Dict:
	"""
	Main detection method that returns comprehensive analysis

	Args:
	text: Input text to analyze
	return_features: Whether to include feature analysis

	Returns:
	Dictionary with detection results in requested format
	"""
	if not text or len(text.strip()) < 15:
	return {
	"error": "Text too short for reliable detection (minimum 15 characters)",
	"Human-written": "0%",
	"Human-written & AI-refined": "0%",
	"AI-generated & AI-refined": "0%",
	"AI-generated": "0%"
	}

	# Get predictions
	if self.enable_ensemble and (self.roberta_model or self.deberta_model):
	probs = self.predict_with_transformers(text)
	else:
	probs = self._heuristic_prediction(text)

	# Format results as requested
	result = {
	"Human-written": f"{probs[0]:.1%}",
	"Human-written & AI-refined": f"{probs[1]:.1%}",
	"AI-generated & AI-refined": f"{probs[2]:.1%}",
	"AI-generated": f"{probs[3]:.1%}"
	}

	# Add confidence and top prediction
	top_class_idx = np.argmax(probs)
	result["most_likely"] = self.class_labels[top_class_idx]
	result["confidence"] = f"{probs[top_class_idx]:.1%}"

	if return_features:
	result["features"] = self.extract_advanced_features(text)

	return result

	# Simplified usage interface
	# class AITextDetectorSimple:
	# """Simplified interface matching the TextHumanizer style"""

	# def __init__(self):
	# self.detector = AdvancedAITextDetector()

	# def detect_text(self, text: str) -> Dict:
	# """
	# Simple detection method matching your requested format

	# Returns JSON with percentages for:
	# - AI-generated
	# - AI-generated & AI-refined
	# - Human-written & AI-refined
	# - Human-written
	# """
	# return self.detector.detect_ai_text(text)

	# def main_example():
	# """Example usage"""
	# print("Loading AI Text Detector...")
	# detector = AITextDetectorSimple()

	# # Test texts
	# sample_texts = [
	# # AI-like text
	# "The implementation of artificial intelligence technologies has significantly transformed various industry sectors through advanced computational methodologies and sophisticated algorithmic frameworks.",

	# # Human-like text
	# "Honestly, I can't believe it's already Friday! This week just flew by so fast. I'm planning to binge-watch some shows this weekend and maybe grab pizza with friends.",

	# # Mixed text
	# "I love cooking pasta, it's my favorite comfort food. The preparation involves selecting high-quality ingredients and implementing proper cooking techniques to achieve optimal texture and flavor enhancement."
	# ]

	# for i, text in enumerate(sample_texts, 1):
	# print(f"\nSample {i}: {text[:60]}...")
	# result = detector.detect_text(text)
	# print(json.dumps(result, indent=2))
	# print("-" * 50)