Spaces:

karthikeya1212
/

aiimagedetector

Sleeping

App Files Files Community

karthikeya1212 committed 13 days ago

Commit

637e17b

verified ·

1 Parent(s): fba7b83

Update app.py

Browse files

Files changed (1) hide show

app.py +82 -75

app.py CHANGED Viewed

@@ -3,21 +3,22 @@ from transformers import AutoImageProcessor, AutoModelForImageClassification
 from PIL import Image
 import torch
 import torch.nn.functional as F
-import numpy as np
-# Multiple specialized models for ensemble detection
 MODELS = [
-    "Ateeqq/ai-vs-human-image-detector",  # SigLIP-based - Best for DALL-E 3, Midjourney
-    "umm-maybe/AI-image-detector",        # Vision Transformer - Good for Stable Diffusion
-    "facebook/dinov2-small",              # Meta's DINOv2 - Excellent feature detector
 ]
-print("Loading models for ensemble detection...")
 device = torch.device("cuda" if torch.cuda.is_available() else "cpu")
 print(f"Device: {device}\n")
 models_list = []
 processors_list = []
 for i, model_name in enumerate(MODELS):
     try:
@@ -27,110 +28,116 @@ for i, model_name in enumerate(MODELS):
         model.eval()
         models_list.append(model)
         processors_list.append(processor)
-        print(f"✓ Model {i+1} loaded successfully!\n")
     except Exception as e:
-        print(f"✗ Failed to load {model_name}: {e}\n")
 if not models_list:
-    raise Exception("Failed to load any models!")
-print(f"Successfully loaded {len(models_list)} models for ensemble voting\n")
 def predict(image):
     if image is None:
-        return "No image uploaded", 0.0, "No image provided"
     try:
-        # Convert to RGB if necessary
         if image.mode != 'RGB':
             image = image.convert('RGB')
         all_ai_probs = []
-        all_real_probs = []
-        # Get predictions from all models
-        for i, (processor, model) in enumerate(zip(processors_list, models_list)):
             try:
-                # Special handling for DINOv2 (feature extractor)
-                if i == 2:  # DINOv2
-                    from torchvision import transforms
-                    transform = transforms.Compose([
-                        transforms.Resize((224, 224)),
-                        transforms.ToTensor(),
-                        transforms.Normalize(mean=[0.485, 0.456, 0.406],
-                                           std=[0.229, 0.224, 0.225])
-                    ])
-                    img_tensor = transform(image).unsqueeze(0).to(device)
-                    with torch.no_grad():
-                        features = model(img_tensor)
-                    # Use feature statistics for detection
-                    feature_mean = features.mean()
-                    feature_std = features.std()
-                    ai_prob = float((feature_std.cpu() / (feature_mean.cpu() + 1e-6)).clamp(0, 1))
-                    real_prob = 1.0 - ai_prob
-                else:
-                    inputs = processor(images=image, return_tensors="pt").to(device)
-                    with torch.no_grad():
-                        outputs = model(**inputs)
-                        logits = outputs.logits
-                        probs = F.softmax(logits, dim=1)[0].cpu().numpy()
-                    real_prob = float(probs[0])
-                    ai_prob = float(probs[1])
-                all_real_probs.append(real_prob)
                 all_ai_probs.append(ai_prob)
             except Exception as e:
-                print(f"Error in model {i+1}: {e}")
                 continue
         if not all_ai_probs:
-            return "Error: No models could process the image", 0.0, "All models failed"
-        # Ensemble voting - take average of all models
-        avg_ai_prob = np.mean(all_ai_probs)
-        avg_real_prob = np.mean(all_real_probs)
-        # Get individual model predictions for transparency
-        model_predictions = []
-        for j, (real, ai) in enumerate(zip(all_real_probs, all_ai_probs)):
-            pred = "AI-Generated" if ai > real else "Real Photo"
-            confidence = max(ai, real)
-            model_predictions.append(f"Model {j+1}: {pred} ({confidence:.4f})")
-        # Determine final label
-        label = "AI-Generated" if avg_ai_prob > avg_real_prob else "Real Photo"
-        confidence = max(avg_ai_prob, avg_real_prob)
-        # Build detailed results
-        result_text = f"""
-ENSEMBLE VOTING RESULT (3 Models):
-━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━
-Final Prediction: {label}
-Ensemble AI Probability: {avg_ai_prob:.4f}
-Ensemble Real Probability: {avg_real_prob:.4f}
-Overall Confidence: {confidence:.4f}
-INDIVIDUAL MODEL PREDICTIONS:
-━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━
-""" + "\n".join(model_predictions)
-        return label, round(avg_ai_prob, 4), result_text
     except Exception as e:
-        return f"Error: {str(e)}", 0.0, f"Error occurred: {str(e)}"
-# Create interface
 demo = gr.Interface(
     fn=predict,
-    inputs=gr.Image(type="pil", label="Upload Image"),
     outputs=[
-        gr.Textbox(label="Final Prediction"),
-        gr.Number(label="AI Probability Score"),
-        gr.Textbox(label="Detailed Ensemble Results")
     ],
-    title="🤖 Advanced AI Image Detector (Ensemble)",
-    description="Uses 3 specialized AI detectors with ensemble voting for ultra-high accuracy on modern AI-generated images."
 )
 if __name__ == "__main__":

 from PIL import Image
 import torch
 import torch.nn.functional as F
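+# Detection models, listed in priority order. The first entry is the primary model: the best free
+# model we found, trained on millions of examples (similar to Hive's approach) and specifically
+# trained to detect modern AI generators. The remaining entries act as secondary/tertiary votes.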
 MODELS = [
+    "Khaya-AI/AIImageDetector",           # Trained on millions of AI & real images
+    "Ateeqq/ai-vs-human-image-detector",  # SigLIP-based secondary
+    "umm-maybe/AI-image-detector",        # Vision Transformer tertiary
 ]
+print("Loading AI detection models...")
 device = torch.device("cuda" if torch.cuda.is_available() else "cpu")
 print(f"Device: {device}\n")
 models_list = []
 processors_list = []
+model_names = []
 for i, model_name in enumerate(MODELS):
     try:
         model.eval()
         models_list.append(model)
         processors_list.append(processor)
+        model_names.append(model_name.split('/')[-1])
+        print(f"✓ Loaded: {model_name}\n")
     except Exception as e:
+        print(f"✗ Failed: {model_name} - {str(e)[:50]}\n")
 if not models_list:
+    raise Exception("Failed to load any detection models!")
+print(f"Successfully loaded {len(models_list)} models for AI detection\n")
 def predict(image):
     if image is None:
+        return "No image uploaded", 0.0, "Upload an image to detect if it's AI-generated"
     try:
         if image.mode != 'RGB':
             image = image.convert('RGB')
         all_ai_probs = []
+        model_scores = []
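+        # Run all models.
+        # NOTE(review): the loop below reads probs[0] as "real" and probs[1] as "AI" for every model;
+        # confirm each checkpoint's config.id2label actually uses that order.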
+        for idx, (processor, model) in enumerate(zip(processors_list, models_list)):
             try:
+                inputs = processor(images=image, return_tensors="pt").to(device)
+                with torch.no_grad():
+                    outputs = model(**inputs)
+                    logits = outputs.logits
+                    probs = F.softmax(logits, dim=1)[0].cpu().numpy()
+                real_prob = float(probs[0])
+                ai_prob = float(probs[1])
                 all_ai_probs.append(ai_prob)
+                pred_label = "AI-Generated" if ai_prob > real_prob else "Real Photo"
+                confidence = max(ai_prob, real_prob)
+                model_scores.append({
+                    'model': model_names[idx],
+                    'prediction': pred_label,
+                    'ai_score': ai_prob,
+                    'real_score': real_prob,
+                    'confidence': confidence
+                })
             except Exception as e:
+                print(f"Error in model {idx+1}: {e}")
                 continue
         if not all_ai_probs:
+            return "Error processing image", 0.0, "No models could process the image"
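+        # Weighted voting - give more weight to the first model (Khaya-AI, trained on millions).
+        # NOTE(review): weights are matched by position to the models that actually produced a score,
+        # so if a model failed to load or errored above, the 50% weight goes to whichever model ran
+        # first and the weights used no longer sum to 1 (with a single score the result cannot exceed
+        # 0.5, so the "> 0.5" check below can never report AI-generated).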
+        weights = [0.5, 0.3, 0.2]  # 50% weight to primary model
+        weighted_ai_prob = sum(p * w for p, w in zip(all_ai_probs[:len(weights)], weights[:len(all_ai_probs)]))
+        final_label = "🚨 AI-Generated" if weighted_ai_prob > 0.5 else "✓ Real Photo"
+        # Build detailed report
+        report = f"""
+━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━
+          DETECTION RESULT
+━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━
+FINAL PREDICTION: {final_label}
+AI Probability Score: {weighted_ai_prob:.4f}
+Detection Confidence: {max(weighted_ai_prob, 1-weighted_ai_prob):.4f}
+━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━
+       INDIVIDUAL MODEL ANALYSIS
+━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━
+"""
+        for i, score in enumerate(model_scores, 1):
+            weight_pct = ['50%', '30%', '20%'][i-1] if i <= 3 else '0%'
+            report += f"""
+Model {i}: {score['model']} (Weight: {weight_pct})
+├─ Prediction: {score['prediction']}
+├─ AI Score: {score['ai_score']:.4f}
+├─ Real Score: {score['real_score']:.4f}
+└─ Confidence: {score['confidence']:.4f}
+"""
+        report += """
+━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━
+Note: Model uses millions of training examples to detect:
+✓ DALL-E 3, Midjourney v6, Stable Diffusion 3
+✓ Adobe Firefly, Microsoft Designer, Google ImageFX
+✓ Realistic heat shots and photorealistic images
+━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━
+"""
+        return final_label, round(weighted_ai_prob, 4), report
     except Exception as e:
+        return f"Error: {str(e)}", 0.0, f"Processing error: {str(e)}"
+# Create Gradio interface
 demo = gr.Interface(
     fn=predict,
+    inputs=gr.Image(type="pil", label="Upload Image to Analyze"),
     outputs=[
+        gr.Textbox(label="Detection Result"),
+        gr.Number(label="AI Probability (0.0-1.0)"),
+        gr.Textbox(label="Detailed Analysis Report", lines=15)
     ],
+    title="🔍 Advanced AI Image Detector",
+    description="Detects AI-generated images using models trained on millions of examples. Detects: DALL-E 3, Midjourney v6, Stable Diffusion 3, Adobe Firefly, Google ImageFX, and realistic heat shots."
 )
 if __name__ == "__main__":