Mirror of https://github.com/RVC-Boss/GPT-SoVITS.git (synced 2025-08-07 15:33:29 +08:00)

Commit fdfab8972c (parent 972c98bce5): add age and gender detector

api.py (+150 lines)
@@ -30,6 +30,24 @@ import config as global_config
import logging
import subprocess

from fastapi import FastAPI, WebSocket, WebSocketDisconnect, UploadFile, File, HTTPException
from fastapi.middleware.cors import CORSMiddleware
import cv2
import numpy as np
import asyncio
import json
import time
import logging
from datetime import datetime
from typing import Dict

from face_detector import AgeGenderDetector
from utils import decode_base64_image

# Configure logging
logging.basicConfig(level=logging.INFO)
logger = logging.getLogger(__name__)

import nltk
nltk.download('averaged_perceptron_tagger_eng')

@@ -871,6 +889,45 @@ change_gpt_sovits_weights(gpt_path = gpt_path, sovits_path = sovits_path)
# API section
# --------------------------------
app = FastAPI()

# CORS middleware
app.add_middleware(
    CORSMiddleware,
    allow_origins=["*"],
    allow_credentials=True,
    allow_methods=["*"],
    allow_headers=["*"],
)


# Global detector instance
detector = AgeGenderDetector()

# WebSocket connection manager
class ConnectionManager:
    def __init__(self):
        self.active_connections: Dict[str, WebSocket] = {}

    async def connect(self, websocket: WebSocket, session_id: str):
        await websocket.accept()
        self.active_connections[session_id] = websocket
        logger.info(f"🔌 Connected: {session_id}")

    def disconnect(self, session_id: str):
        self.active_connections.pop(session_id, None)
        logger.info(f"🔌 Disconnected: {session_id}")

    async def send_message(self, session_id: str, message: dict):
        websocket = self.active_connections.get(session_id)
        if websocket:
            try:
                await websocket.send_text(json.dumps(message))
            except:
                self.disconnect(session_id)

manager = ConnectionManager()


@app.post("/")
async def tts_endpoint(request: Request):
@@ -1101,6 +1158,99 @@ async def tts_endpoint(
    print(f"the base path is {refer_wav_path}")
    return handle(refer_wav_path, prompt_text, prompt_language, text, text_language, cut_punc, top_k, top_p, temperature, speed, inp_refs, sample_steps, if_sr)

@app.post("/analyze_image")
async def analyze_image(file: UploadFile = File(...)):
    """Analyze uploaded image"""
    try:
        # Read image
        image_data = await file.read()

        # Convert to OpenCV format
        nparr = np.frombuffer(image_data, np.uint8)
        image = cv2.imdecode(nparr, cv2.IMREAD_COLOR)

        if image is None:
            raise HTTPException(status_code=400, detail="Invalid image format")

        # Process image
        start_time = time.time()
        results = detector.process_image(image)
        processing_time = time.time() - start_time

        # Cleanup periodically
        if len(detector.face_results) > 50:
            detector.cleanup_old_results()

        return {
            "success": True,
            "processing_time": round(processing_time, 2),
            "people": results,
            "total_people": len(results),
            "timestamp": datetime.now().isoformat()
        }

    except Exception as e:
        logger.error(f"Image analysis error: {e}")
        raise HTTPException(status_code=500, detail=str(e))

@app.websocket("/ws/{session_id}")
async def websocket_endpoint(websocket: WebSocket, session_id: str):
    """WebSocket endpoint for real-time processing"""
    await manager.connect(websocket, session_id)
    loop = asyncio.get_running_loop()

    def result_callback(person_id: str, result: dict):
        """Callback for when analysis is complete (runs on the detector's worker thread)"""
        asyncio.run_coroutine_threadsafe(manager.send_message(session_id, {
            "type": "analysis_complete",
            "person_id": person_id,
            "result": result,
            "timestamp": datetime.now().isoformat()
        }), loop)

    try:
        while True:
            # Receive data
            data = await websocket.receive_text()
            message = json.loads(data)

            if message.get("type") == "frame":
                # Process frame
                base64_image = message.get("image")
                if base64_image:
                    image = decode_base64_image(base64_image)
                    if image is not None:
                        results = detector.process_image(image, callback=result_callback)

                        # Send immediate response
                        await manager.send_message(session_id, {
                            "type": "frame_processed",
                            "people": results,
                            "total_people": len(results),
                            "timestamp": datetime.now().isoformat()
                        })

            elif message.get("type") == "ping":
                await manager.send_message(session_id, {
                    "type": "pong",
                    "timestamp": datetime.now().isoformat()
                })

    except WebSocketDisconnect:
        manager.disconnect(session_id)
    except Exception as e:
        logger.error(f"WebSocket error: {e}")
        manager.disconnect(session_id)

@app.get("/stats")
async def get_stats():
    """Get system statistics"""
    return {
        "active_connections": len(manager.active_connections),
        "known_persons": len(detector.face_encodings),
        "cached_results": len(detector.face_results),
        "analysis_queue_size": detector.analysis_queue.qsize(),
        "system_time": datetime.now().isoformat()
    }

if __name__ == "__main__":
    logging.info("the server is running")
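
The new endpoints can be exercised with a small client. The sketch below is illustrative only (not part of this commit) and assumes the server from api.py is reachable at http://127.0.0.1:9880, its default port; adjust the URL and file name for your setup.

import requests

BASE_URL = "http://127.0.0.1:9880"  # assumed default api.py port

# Upload a still image for age/gender analysis
with open("frame.jpg", "rb") as f:
    resp = requests.post(f"{BASE_URL}/analyze_image",
                         files={"file": ("frame.jpg", f, "image/jpeg")})
resp.raise_for_status()
report = resp.json()
for person in report["people"]:
    print(person["person_id"], person["status"], person["age"], person["gender"])

# Check detector/server statistics
print(requests.get(f"{BASE_URL}/stats").json())
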
detectors.py (new file, +528 lines)
@@ -0,0 +1,528 @@
"""
detectors.py - Face Detection Algorithms and Validators
Contains different face detection methods and quality validation
"""

import cv2
import numpy as np
import logging
from typing import List, Tuple

logger = logging.getLogger(__name__)

class EnhancedFaceDetector:
    """Enhanced face detector using multiple detection methods"""

    def __init__(self):
        self.detectors = {}
        self.load_detectors()

    def load_detectors(self):
        """Load multiple face detection algorithms"""
        # 1. MediaPipe Face Detection (primary)
        try:
            import mediapipe as mp
            self.mp_face_detection = mp.solutions.face_detection
            self.mp_face_detector = self.mp_face_detection.FaceDetection(
                model_selection=1,
                min_detection_confidence=0.5  # Relaxed threshold
            )
            self.detectors['mediapipe'] = True
            logger.info("✅ MediaPipe Face Detector loaded")
        except ImportError:
            logger.warning("⚠️ MediaPipe not available - install with: pip install mediapipe")
            self.detectors['mediapipe'] = False

        # 2. Haar Cascade (fallback)
        try:
            self.face_cascade = cv2.CascadeClassifier(
                cv2.data.haarcascades + 'haarcascade_frontalface_default.xml'
            )
            self.detectors['haar'] = True
            logger.info("✅ Haar cascade loaded as fallback")
        except Exception as e:
            logger.error(f"❌ Haar cascade loading error: {e}")
            self.detectors['haar'] = False

    def detect_faces_mediapipe(self, image):
        """Detect faces using MediaPipe (most accurate)"""
        if not self.detectors.get('mediapipe', False):
            return []

        try:
            # Convert BGR to RGB
            rgb_image = cv2.cvtColor(image, cv2.COLOR_BGR2RGB)
            results = self.mp_face_detector.process(rgb_image)

            faces = []
            if results.detections:
                h, w = image.shape[:2]

                for detection in results.detections:
                    bbox = detection.location_data.relative_bounding_box
                    confidence = detection.score[0]

                    # Convert relative coordinates to absolute
                    x = max(0, int(bbox.xmin * w))
                    y = max(0, int(bbox.ymin * h))
                    width = int(bbox.width * w)
                    height = int(bbox.height * h)

                    # Ensure face is within image bounds
                    x = min(x, w - 1)
                    y = min(y, h - 1)
                    width = min(width, w - x)
                    height = min(height, h - y)

                    if width > 30 and height > 30:  # Minimum size
                        faces.append((x, y, width, height, confidence))

            return faces

        except Exception as e:
            logger.error(f"MediaPipe detection error: {e}")
            return []

    def detect_faces_haar(self, image):
        """Detect faces using Haar cascades (fallback)"""
        if not self.detectors.get('haar', False):
            return []

        try:
            gray = cv2.cvtColor(image, cv2.COLOR_BGR2GRAY)
            faces = self.face_cascade.detectMultiScale(
                gray,
                scaleFactor=1.1,
                minNeighbors=3,  # Relaxed from 5
                minSize=(30, 30),  # Relaxed from (80, 80)
                maxSize=(500, 500)
            )

            # Add estimated confidence
            faces_with_conf = []
            for (x, y, w, h) in faces:
                # Estimate confidence based on face size
                confidence = min(0.9, max(0.5, (w * h) / (100 * 100)))
                faces_with_conf.append((x, y, w, h, confidence))

            return faces_with_conf

        except Exception as e:
            logger.error(f"Haar detection error: {e}")
            return []

    def detect_faces_dnn(self, image):
        """Detect faces using OpenCV DNN (optional third method)"""
        try:
            # This requires pre-trained DNN model files
            # For now, we'll skip this implementation
            # You can add DNN detection here if you have the model files
            return []
        except Exception as e:
            logger.error(f"DNN detection error: {e}")
            return []

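    # NOTE (illustrative sketch, not part of this commit): detect_faces_dnn() above could
    # be filled in with OpenCV's SSD face model, assuming the two model files
    # (deploy.prototxt and res10_300x300_ssd_iter_140000.caffemodel) are available locally:
    #
    #   net = cv2.dnn.readNetFromCaffe("deploy.prototxt", "res10_300x300_ssd_iter_140000.caffemodel")
    #   blob = cv2.dnn.blobFromImage(cv2.resize(image, (300, 300)), 1.0, (300, 300), (104.0, 177.0, 123.0))
    #   net.setInput(blob)
    #   detections = net.forward()  # shape (1, 1, N, 7): [_, _, conf, x1, y1, x2, y2] (normalized)
    #   h, w = image.shape[:2]
    #   faces = []
    #   for i in range(detections.shape[2]):
    #       conf = float(detections[0, 0, i, 2])
    #       if conf >= 0.5:
    #           x1, y1, x2, y2 = (detections[0, 0, i, 3:7] * np.array([w, h, w, h])).astype(int)
    #           faces.append((x1, y1, x2 - x1, y2 - y1, conf))
    #   return faces
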
    def detect_faces(self, image):
        """Main face detection using best available method"""
        all_faces = []

        # Try MediaPipe first (most accurate)
        faces = self.detect_faces_mediapipe(image)
        if faces:
            all_faces.extend([(x, y, w, h, conf, 'mediapipe') for x, y, w, h, conf in faces])

        # If no MediaPipe faces or low confidence, try Haar
        if not all_faces or max([f[4] for f in all_faces]) < 0.7:
            faces = self.detect_faces_haar(image)
            all_faces.extend([(x, y, w, h, conf, 'haar') for x, y, w, h, conf in faces])

        # Filter and remove duplicates
        filtered_faces = self.filter_and_deduplicate_faces(all_faces)

        return filtered_faces

    def filter_and_deduplicate_faces(self, faces):
        """Remove duplicate faces and apply quality filters"""
        if not faces:
            return []

        # Sort by confidence (highest first)
        faces.sort(key=lambda x: x[4], reverse=True)

        filtered = []
        for face in faces:
            x, y, w, h, conf, method = face

            # Apply quality checks
            if not self.is_valid_face_detection(x, y, w, h, conf):
                continue

            # Check for overlap with existing faces
            is_duplicate = False
            for existing in filtered:
                if self.faces_overlap(face, existing):
                    is_duplicate = True
                    break

            if not is_duplicate:
                filtered.append(face)

        return filtered

    def is_valid_face_detection(self, x, y, w, h, confidence):
        """Validate face detection quality"""
        # Minimum confidence threshold (relaxed)
        if confidence < 0.3:
            return False

        # Minimum size check (relaxed)
        if w < 30 or h < 30:
            return False

        # Aspect ratio check (more permissive)
        aspect_ratio = w / h
        if aspect_ratio < 0.4 or aspect_ratio > 2.5:
            return False

        # Coordinates should be positive
        if x < 0 or y < 0:
            return False

        return True

    def faces_overlap(self, face1, face2, threshold=0.5):
        """Check if two face detections overlap significantly"""
        x1, y1, w1, h1 = face1[:4]
        x2, y2, w2, h2 = face2[:4]

        # Calculate intersection area
        xi1 = max(x1, x2)
        yi1 = max(y1, y2)
        xi2 = min(x1 + w1, x2 + w2)
        yi2 = min(y1 + h1, y2 + h2)

        if xi2 <= xi1 or yi2 <= yi1:
            return False

        intersection = (xi2 - xi1) * (yi2 - yi1)

        # Calculate union area
        area1 = w1 * h1
        area2 = w2 * h2
        union = area1 + area2 - intersection

        # Calculate IoU (Intersection over Union)
        iou = intersection / union if union > 0 else 0

        return iou > threshold


class FaceQualityValidator:
    """Validate face quality before analysis"""

    @staticmethod
    def is_face_clear(face_img, blur_threshold=30):
        """Check if face is clear enough (not too blurry)"""
        try:
            gray = cv2.cvtColor(face_img, cv2.COLOR_BGR2GRAY)
            laplacian_var = cv2.Laplacian(gray, cv2.CV_64F).var()
            return laplacian_var > blur_threshold
        except:
            return True  # If check fails, assume it's OK

    @staticmethod
    def has_sufficient_size(face_img, min_size=30):
        """Check if face has sufficient resolution"""
        h, w = face_img.shape[:2]
        return min(h, w) >= min_size

    @staticmethod
    def is_properly_aligned(face_img):
        """Basic check for face alignment (relaxed)"""
        try:
            h, w = face_img.shape[:2]
            # More permissive aspect ratio
            aspect_ratio = w / h
            return 0.3 <= aspect_ratio <= 3.0
        except:
            return True  # If check fails, assume it's OK

    @staticmethod
    def has_good_contrast(face_img, min_std=20):
        """Check if face has sufficient contrast"""
        try:
            gray = cv2.cvtColor(face_img, cv2.COLOR_BGR2GRAY)
            std_dev = np.std(gray)
            return std_dev > min_std
        except:
            return True  # If check fails, assume it's OK

    @staticmethod
    def is_well_lit(face_img, min_brightness=30, max_brightness=220):
        """Check if face is well lit (not too dark or overexposed)"""
        try:
            gray = cv2.cvtColor(face_img, cv2.COLOR_BGR2GRAY)
            mean_brightness = np.mean(gray)
            return min_brightness < mean_brightness < max_brightness
        except:
            return True  # If check fails, assume it's OK

    @staticmethod
    def validate_face(face_img):
        """Complete face validation with relaxed criteria"""
        if face_img is None or face_img.size == 0:
            return False, "Empty face image"

        if not FaceQualityValidator.has_sufficient_size(face_img):
            return False, "Face too small"

        # Skip strict checks for now - they were too restrictive
        # if not FaceQualityValidator.is_face_clear(face_img):
        #     return False, "Face too blurry"

        if not FaceQualityValidator.is_properly_aligned(face_img):
            return False, "Face poorly aligned"

        # Optional additional checks (commented out for relaxed validation)
        # if not FaceQualityValidator.has_good_contrast(face_img):
        #     return False, "Face has poor contrast"

        # if not FaceQualityValidator.is_well_lit(face_img):
        #     return False, "Face is poorly lit"

        return True, "Face valid"

    @staticmethod
    def get_face_quality_score(face_img):
        """Get overall quality score for face (0-100)"""
        if face_img is None or face_img.size == 0:
            return 0

        score = 0

        # Size score (0-25 points)
        h, w = face_img.shape[:2]
        min_dim = min(h, w)
        if min_dim >= 100:
            score += 25
        elif min_dim >= 60:
            score += 20
        elif min_dim >= 30:
            score += 15
        else:
            score += 5

        # Clarity score (0-25 points)
        try:
            gray = cv2.cvtColor(face_img, cv2.COLOR_BGR2GRAY)
            laplacian_var = cv2.Laplacian(gray, cv2.CV_64F).var()
            if laplacian_var > 100:
                score += 25
            elif laplacian_var > 50:
                score += 20
            elif laplacian_var > 20:
                score += 15
            else:
                score += 10
        except:
            score += 15  # Default moderate score

        # Alignment score (0-25 points)
        try:
            aspect_ratio = w / h
            if 0.8 <= aspect_ratio <= 1.2:
                score += 25  # Perfect square-ish
            elif 0.6 <= aspect_ratio <= 1.6:
                score += 20  # Good
            elif 0.4 <= aspect_ratio <= 2.0:
                score += 15  # Acceptable
            else:
                score += 5  # Poor
        except:
            score += 15  # Default moderate score

        # Contrast score (0-25 points)
        try:
            gray = cv2.cvtColor(face_img, cv2.COLOR_BGR2GRAY)
            std_dev = np.std(gray)
            if std_dev > 60:
                score += 25
            elif std_dev > 40:
                score += 20
            elif std_dev > 20:
                score += 15
            else:
                score += 5
        except:
            score += 15  # Default moderate score

        return min(100, score)

    @staticmethod
    def enhance_face_for_analysis(face_img):
        """Apply basic enhancement to improve face for analysis"""
        try:
            # Convert to LAB color space
            lab = cv2.cvtColor(face_img, cv2.COLOR_BGR2LAB)
            l, a, b = cv2.split(lab)

            # Apply CLAHE to L channel (brightness)
            clahe = cv2.createCLAHE(clipLimit=2.0, tileGridSize=(4, 4))
            l = clahe.apply(l)

            # Merge back
            enhanced = cv2.merge([l, a, b])
            enhanced = cv2.cvtColor(enhanced, cv2.COLOR_LAB2BGR)

            # Apply slight Gaussian blur to reduce noise
            enhanced = cv2.GaussianBlur(enhanced, (3, 3), 0)

            return enhanced

        except Exception as e:
            logger.error(f"Face enhancement error: {e}")
            return face_img


class FaceTracker:
    """Track faces across frames for better stability"""

    def __init__(self, max_distance=50, max_age=30):
        self.tracks = {}
        self.next_id = 1
        self.max_distance = max_distance
        self.max_age = max_age

    def update(self, detections):
        """Update tracks with new detections"""
        # Calculate distances between existing tracks and new detections
        matched_tracks = {}
        unmatched_detections = list(detections)

        for track_id, track in self.tracks.items():
            if track['age'] > self.max_age:
                continue  # Skip old tracks

            best_match = None
            best_distance = float('inf')

            for i, detection in enumerate(unmatched_detections):
                x, y, w, h = detection[:4]
                center_x, center_y = x + w//2, y + h//2

                track_x, track_y = track['center']
                distance = np.sqrt((center_x - track_x)**2 + (center_y - track_y)**2)

                if distance < self.max_distance and distance < best_distance:
                    best_distance = distance
                    best_match = i

            if best_match is not None:
                detection = unmatched_detections[best_match]
                x, y, w, h = detection[:4]

                # Update track
                self.tracks[track_id].update({
                    'center': (x + w//2, y + h//2),
                    'bbox': (x, y, w, h),
                    'age': 0,
                    'confidence': detection[4] if len(detection) > 4 else 0.5
                })

                matched_tracks[track_id] = detection
                unmatched_detections.pop(best_match)

        # Age existing tracks
        for track_id in list(self.tracks.keys()):
            if track_id not in matched_tracks:
                self.tracks[track_id]['age'] += 1
                if self.tracks[track_id]['age'] > self.max_age:
                    del self.tracks[track_id]

        # Create new tracks for unmatched detections
        for detection in unmatched_detections:
            x, y, w, h = detection[:4]
            self.tracks[self.next_id] = {
                'center': (x + w//2, y + h//2),
                'bbox': (x, y, w, h),
                'age': 0,
                'confidence': detection[4] if len(detection) > 4 else 0.5,
                'created_frame': self.next_id
            }
            matched_tracks[self.next_id] = detection
            self.next_id += 1

        return matched_tracks

    def get_stable_faces(self, min_track_length=3):
        """Get faces that have been tracked for a minimum number of frames"""
        stable_tracks = {}
        for track_id, track in self.tracks.items():
            if track['age'] < min_track_length:
                stable_tracks[track_id] = track
        return stable_tracks


class MultiScaleDetector:
    """Detect faces at multiple scales for better accuracy"""

    def __init__(self, base_detector):
        self.base_detector = base_detector
        self.scales = [1.0, 0.8, 1.2]  # Different scales to try

    def detect_faces(self, image):
        """Detect faces at multiple scales"""
        all_detections = []
        h, w = image.shape[:2]

        for scale in self.scales:
            if scale != 1.0:
                # Resize image
                new_w = int(w * scale)
                new_h = int(h * scale)
                resized = cv2.resize(image, (new_w, new_h))
            else:
                resized = image

            # Detect faces
            faces = self.base_detector.detect_faces(resized)

            # Scale coordinates back to original size
            for face in faces:
                x, y, w_f, h_f, conf, method = face
                if scale != 1.0:
                    x = int(x / scale)
                    y = int(y / scale)
                    w_f = int(w_f / scale)
                    h_f = int(h_f / scale)

                all_detections.append((x, y, w_f, h_f, conf, f"{method}_scale_{scale}"))

        # Remove duplicates and return best detections
        return self.base_detector.filter_and_deduplicate_faces(all_detections)


# Factory function to create detector with best available methods
def create_face_detector(use_tracking=False, use_multiscale=False):
    """
    Factory function to create the best available face detector

    Args:
        use_tracking: Enable face tracking across frames
        use_multiscale: Enable multi-scale detection

    Returns:
        Configured face detector
    """
    base_detector = EnhancedFaceDetector()

    if use_multiscale:
        detector = MultiScaleDetector(base_detector)
    else:
        detector = base_detector

    if use_tracking:
        # Note: Tracking would need to be integrated into the main detection loop
        logger.info("Face tracking enabled")

    return detector
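
A minimal usage sketch for the factory above (illustrative, not part of this commit); it assumes a local sample image test.jpg and that either MediaPipe or OpenCV's bundled Haar data is installed:

import cv2
from detectors import create_face_detector

detector = create_face_detector(use_multiscale=True)  # falls back to Haar if MediaPipe is absent
image = cv2.imread("test.jpg")                        # assumed sample image
for (x, y, w, h, conf, method) in detector.detect_faces(image):
    print(f"{method}: ({x}, {y}, {w}, {h}) conf={conf:.2f}")
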
face_detector.py (new file, +344 lines)
@@ -0,0 +1,344 @@
"""
face_detector.py - Core Face Detection and Analysis
Exact same logic as your working code, just modularized
"""

import cv2
import numpy as np
from PIL import Image
import torch
import time
import threading
from queue import Queue
import logging
from typing import Dict, List, Optional

logger = logging.getLogger(__name__)

class AgeGenderDetector:
    """Enhanced Age & Gender Detection System - EXACT SAME LOGIC AS YOUR WORKING CODE"""

    def __init__(self):
        self.face_results = {}
        self.face_encodings = {}
        self.person_counter = 0
        self.analysis_queue = Queue()
        self.running = True

        # Load models
        self.load_models()

        # Start analysis worker
        self.analysis_thread = threading.Thread(target=self.analysis_worker, daemon=True)
        self.analysis_thread.start()

        logger.info("✅ AgeGenderDetector initialized")

    def load_models(self):
        """Load AI models - EXACT SAME AS YOUR WORKING CODE"""
        try:
            # Load DeepFace
            from deepface import DeepFace
            self.deepface = DeepFace
            logger.info("✅ DeepFace loaded")
        except ImportError:
            logger.error("❌ DeepFace not available")
            self.deepface = None

        try:
            # Load HuggingFace age model
            from transformers import AutoImageProcessor, SiglipForImageClassification
            model_name = "prithivMLmods/facial-age-detection"
            self.age_model = SiglipForImageClassification.from_pretrained(model_name)
            self.age_processor = AutoImageProcessor.from_pretrained(model_name)
            logger.info("✅ HuggingFace age model loaded")
        except Exception as e:
            logger.error(f"❌ HuggingFace model error: {e}")
            self.age_model = None
            self.age_processor = None

        # Age labels
        self.id2label = {
            "0": "01-10", "1": "11-20", "2": "21-30", "3": "31-40",
            "4": "41-55", "5": "56-65", "6": "66-80", "7": "80+"
        }

        # Face detector
        self.face_cascade = cv2.CascadeClassifier(cv2.data.haarcascades + 'haarcascade_frontalface_default.xml')

    def analysis_worker(self):
        """Background analysis worker - EXACT SAME AS YOUR WORKING CODE"""
        while self.running:
            try:
                if not self.analysis_queue.empty():
                    task = self.analysis_queue.get(timeout=0.1)
                    if task is None:
                        break

                    person_id = task['id']
                    face_img = task['image']
                    callback = task.get('callback')

                    # Analyze
                    age, age_conf = self.analyze_age(face_img)
                    gender, gender_conf = self.analyze_gender(face_img)

                    # Store results
                    current_time = time.time()
                    if person_id in self.face_results:
                        first_seen = self.face_results[person_id].get('first_seen', current_time)
                    else:
                        first_seen = current_time

                    result = {
                        'age': age,
                        'age_conf': age_conf,
                        'gender': gender,
                        'gender_conf': gender_conf,
                        'timestamp': current_time,
                        'first_seen': first_seen
                    }

                    self.face_results[person_id] = result

                    # Call callback if provided
                    if callback:
                        callback(person_id, result)

                else:
                    time.sleep(0.01)
            except Exception as e:
                logger.error(f"Analysis worker error: {e}")
                time.sleep(0.1)

    def analyze_age(self, face_img):
        """Analyze age using HuggingFace - EXACT SAME AS YOUR WORKING CODE"""
        if self.age_model is None or face_img.size == 0:
            return "Unknown", 0.0

        try:
            # Convert to PIL
            if len(face_img.shape) == 3:
                face_pil = Image.fromarray(cv2.cvtColor(face_img, cv2.COLOR_BGR2RGB))
            else:
                face_pil = Image.fromarray(face_img).convert("RGB")

            # Process
            inputs = self.age_processor(images=face_pil, return_tensors="pt")

            with torch.no_grad():
                outputs = self.age_model(**inputs)
                logits = outputs.logits
                probs = torch.nn.functional.softmax(logits, dim=1).squeeze().tolist()

            # Get prediction
            max_idx = probs.index(max(probs))
            age_range = self.id2label[str(max_idx)]
            confidence = probs[max_idx] * 100

            return age_range, confidence
        except Exception as e:
            logger.error(f"Age analysis error: {e}")
            return "Unknown", 0.0

    def analyze_gender(self, face_img):
        """Analyze gender using DeepFace - EXACT SAME AS YOUR WORKING CODE"""
        if self.deepface is None or face_img.size == 0:
            return "Unknown", 0.0

        try:
            result = self.deepface.analyze(
                face_img,
                actions=['gender'],
                enforce_detection=False,
                silent=True
            )

            if isinstance(result, list):
                analysis = result[0]
            else:
                analysis = result

            gender = analysis.get('dominant_gender', 'Unknown')
            gender_probs = analysis.get('gender', {})
            confidence = max(gender_probs.values()) if gender_probs else 0.0

            # Simplify gender
            if gender in ['Man', 'Male']:
                gender = 'Male'
            elif gender in ['Woman', 'Female']:
                gender = 'Female'

            return gender, confidence
        except Exception as e:
            logger.error(f"Gender analysis error: {e}")
            return "Unknown", 0.0

    def get_face_encoding(self, face_img):
        """Get face encoding for recognition - EXACT SAME AS YOUR WORKING CODE"""
        if self.deepface is None or face_img.size == 0:
            return None

        try:
            # Preprocess
            face_resized = cv2.resize(face_img, (160, 160))

            # Get embedding
            embedding = self.deepface.represent(
                face_resized,
                model_name='Facenet',
                enforce_detection=False,
                detector_backend='opencv'
            )

            if isinstance(embedding, list) and len(embedding) > 0:
                return np.array(embedding[0]['embedding'])
            elif isinstance(embedding, dict):
                return np.array(embedding['embedding'])
            return None
        except Exception as e:
            # Fallback encoding
            try:
                face_resized = cv2.resize(face_img, (64, 64))
                face_gray = cv2.cvtColor(face_resized, cv2.COLOR_BGR2GRAY)
                hist = cv2.calcHist([face_gray], [0], None, [32], [0, 256])
                return hist.flatten()
            except:
                return None

    def find_matching_person(self, face_img, threshold=0.4):
        """Find matching person - EXACT SAME AS YOUR WORKING CODE"""
        current_encoding = self.get_face_encoding(face_img)
        if current_encoding is None:
            return None, 0

        best_match = None
        best_similarity = 0

        for person_id, stored_encoding in self.face_encodings.items():
            try:
                # Cosine similarity
                similarity = np.dot(current_encoding, stored_encoding) / (
                    np.linalg.norm(current_encoding) * np.linalg.norm(stored_encoding)
                )

                if similarity > threshold and similarity > best_similarity:
                    best_similarity = similarity
                    best_match = person_id
            except:
                continue

        return (best_match, best_similarity) if best_match else (None, 0)

    def register_new_person(self, face_img):
        """Register new person - EXACT SAME AS YOUR WORKING CODE"""
        encoding = self.get_face_encoding(face_img)
        if encoding is None:
            return None

        self.person_counter += 1
        person_id = f"person_{self.person_counter}"
        self.face_encodings[person_id] = encoding

        logger.info(f"👤 NEW PERSON: {person_id}")
        return person_id

    def identify_person(self, face_img):
        """Identify person (new or existing) - EXACT SAME AS YOUR WORKING CODE"""
        match_result = self.find_matching_person(face_img)

        if match_result[0]:
            person_id, similarity = match_result
            logger.info(f"👤 RECOGNIZED: {person_id} ({similarity:.3f})")
            return person_id, False
        else:
            person_id = self.register_new_person(face_img)
            return person_id, True

    def detect_faces(self, image):
        """Detect faces in image - EXACT SAME AS YOUR WORKING CODE"""
        gray = cv2.cvtColor(image, cv2.COLOR_BGR2GRAY)
        faces = self.face_cascade.detectMultiScale(gray, 1.1, 4, minSize=(60, 60))
        return faces

    def process_image(self, image, callback=None):
        """Process image and return results - EXACT SAME AS YOUR WORKING CODE"""
        faces = self.detect_faces(image)
        results = []

        for i, (x, y, w, h) in enumerate(faces):
            face_img = image[y:y+h, x:x+w]
            person_id, is_new = self.identify_person(face_img)

            if person_id:
                # Get existing result or create placeholder
                result = self.face_results.get(person_id, {
                    'age': 'Analyzing...',
                    'age_conf': 0,
                    'gender': 'Analyzing...',
                    'gender_conf': 0,
                    'timestamp': time.time(),
                    'first_seen': time.time()
                })

                # Add to analysis queue
                task = {
                    'id': person_id,
                    'image': face_img,
                    'callback': callback
                }
                self.analysis_queue.put(task)

                # Determine status
                current_time = time.time()
                first_seen = result.get('first_seen', current_time)
                time_known = current_time - first_seen

                if time_known < 3:
                    status = "NEW"
                elif time_known < 60:
                    status = "CURRENT"
                else:
                    status = "RETURNING"

                # Convert age to approximate number
                age_display = result['age']
                if result['age'] in self.id2label.values():
                    age_map = {
                        "01-10": "~6 years", "11-20": "~16 years", "21-30": "~25 years",
                        "31-40": "~35 years", "41-55": "~48 years", "56-65": "~60 years",
                        "66-80": "~73 years", "80+": "~85 years"
                    }
                    age_display = age_map.get(result['age'], result['age'])

                results.append({
                    'person_id': person_id,
                    'status': status,
                    'age': age_display,
                    'age_confidence': result['age_conf'],
                    'gender': result['gender'],
                    'gender_confidence': result['gender_conf'],
                    'face_coordinates': [int(x), int(y), int(w), int(h)],
                    'is_new': is_new
                })

        return results

    def cleanup_old_results(self):
        """Cleanup old results - EXACT SAME AS YOUR WORKING CODE"""
        current_time = time.time()
        old_persons = [
            pid for pid, result in self.face_results.items()
            if current_time - result.get('timestamp', 0) > 300  # 5 minutes
        ]

        for person_id in old_persons:
            self.face_results.pop(person_id, None)
            self.face_encodings.pop(person_id, None)
            logger.info(f"🗑️ REMOVED: {person_id}")

    def __del__(self):
        """Cleanup when detector is destroyed"""
        self.running = False
        if hasattr(self, 'analysis_thread'):
            self.analysis_thread.join(timeout=1.0)
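
For reference, a standalone usage sketch of the class above (illustrative, not part of this commit), assuming a local sample frame webcam_frame.jpg:

import cv2, time
from face_detector import AgeGenderDetector

def on_analysis(person_id, result):
    # Fired from the background worker once age/gender analysis finishes
    print(person_id, result["age"], result["gender"])

detector = AgeGenderDetector()
frame = cv2.imread("webcam_frame.jpg")  # assumed sample frame
people = detector.process_image(frame, callback=on_analysis)
print(f"{len(people)} face(s) detected and queued for analysis")
time.sleep(2)  # give the worker thread time to fill in results
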
@@ -39,3 +39,17 @@ x-transformers==2.1.37
torchmetrics==1.5.0
attrdict==2.0.1
activations==0.1.0
fastapi==0.104.1
uvicorn[standard]==0.24.0
websockets==12.0
python-multipart==0.0.6
opencv-python==4.8.1.78
pillow==10.1.0
numpy<2.0
torch>=2.1.0
transformers>=4.35.0
deepface>=0.0.79
tensorflow>=2.15.0
python-jose[cryptography]==3.3.0
passlib[bcrypt]==1.7.4
aiofiles==23.2.1
utils.py (new file, +36 lines)
@@ -0,0 +1,36 @@
"""
utils.py - Utility Functions
Exact same utility functions from your working code
"""

import cv2
import numpy as np
from PIL import Image
import base64
import io
import logging

logger = logging.getLogger(__name__)

def decode_base64_image(base64_string: str) -> np.ndarray:
    """
    Decode base64 image to numpy array - EXACT SAME AS YOUR WORKING CODE
    """
    try:
        # Remove data URL prefix if present
        if ',' in base64_string:
            base64_string = base64_string.split(',')[1]

        # Decode base64
        image_data = base64.b64decode(base64_string)

        # Convert to PIL Image
        pil_image = Image.open(io.BytesIO(image_data))

        # Convert to OpenCV format
        opencv_image = cv2.cvtColor(np.array(pil_image), cv2.COLOR_RGB2BGR)

        return opencv_image
    except Exception as e:
        logger.error(f"Image decode error: {e}")
        return None
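
decode_base64_image is the server-side half of the WebSocket exchange; a client encodes each frame before sending it as a "frame" message to /ws/{session_id}. A possible client-side counterpart (illustrative, not part of this commit):

import base64
import json
import cv2

def encode_frame_message(image) -> str:
    """Encode a BGR frame as the JSON 'frame' message expected by the WebSocket endpoint."""
    ok, buf = cv2.imencode(".jpg", image)
    if not ok:
        raise ValueError("JPEG encoding failed")
    b64 = base64.b64encode(buf.tobytes()).decode("ascii")
    return json.dumps({"type": "frame", "image": f"data:image/jpeg;base64,{b64}"})
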