""" Person Manager - 人员识别与管理模块 功能: - 人脸检测(MediaPipe) - 人脸识别,判断是否为同一个人 - 人员库管理,新人自动添加 - 追踪人员进出记录 """ import cv2 import numpy as np import json import datetime from pathlib import Path from config import DATA_DIR try: import mediapipe as mp HAS_MEDIAPIPE = True except ImportError: HAS_MEDIAPIPE = False print("[PersonManager] MediaPipe not installed, using basic detection") try: import face_recognition HAS_FACE_REC = True except ImportError: HAS_FACE_REC = False print("[PersonManager] face_recognition not installed, using basic matching") class PersonManager: """人员识别与管理器""" def __init__(self): self.persons_db_path = DATA_DIR / "persons.json" self.faces_dir = DATA_DIR / "faces" # 创建目录 self.faces_dir.mkdir(parents=True, exist_ok=True) # 加载人员库 self.persons = self._load_persons_db() # 初始化检测器状态 self.face_detector = None self.mp_face_detection = None self.cv_face_detector = None self.has_mediapipe = HAS_MEDIAPIPE # 从配置读取参数 try: from config import config_mgr self.config['mediapipe_min_confidence'] = config_mgr.get('min_detection_confidence', 0.3) self.config['confirm_frames'] = config_mgr.get('confirm_frames', 3) except: pass # 初始化检测器 self._init_detectors() # 配置 self.config = { 'face_match_threshold': 0.6, # 人脸匹配阈值 'unknown_person_id': 'unknown', # 未知人员ID 'max_persons': 100, # 最大人员数量 # 方案1: 参数调整 'mediapipe_min_confidence': 0.3, # 降低阈值,更容易检测 'mediapipe_model_selection': 1, # 1: 远距离模型 'haar_scale_factor': 1.05, # Haar更细粒度 'haar_min_neighbors': 2, # 降低邻居要求 # 方案2: 连续性判断 'confirm_frames': 3, # 连续几帧确认 'leave_frames': 2, # 连续几帧消失才算离开 } # 方案2: 追踪状态(连续判断) self.tracked_persons = {} # {person_id: {'frames': count, 'confirmed': bool}} self.prev_persons = [] # 前一帧检测到的人 self.confirmation_buffer = {} # 确认缓冲区 # 统计 self.total_detections = 0 self.known_persons_detected = 0 self.new_persons_added = 0 def _load_persons_db(self): """加载人员数据库""" if self.persons_db_path.exists(): try: with open(self.persons_db_path, 'r', encoding='utf-8') as f: return json.load(f) except: return {} return {} def _save_persons_db(self): """保存人员数据库""" with open(self.persons_db_path, 'w', encoding='utf-8') as f: json.dump(self.persons, f, ensure_ascii=False, indent=2) def _init_detectors(self): """初始化检测器""" # MediaPipe 人脸检测(方案1: 参数调整) if self.has_mediapipe: try: mp_face_detection = mp.solutions.face_detection self.face_detector = mp_face_detection.FaceDetection( model_selection=self.config['mediapipe_model_selection'], # 远距离模型 min_detection_confidence=self.config['mediapipe_min_confidence'] # 降低阈值 ) self.mp_face_detection = mp_face_detection print(f"[PersonManager] MediaPipe initialized (model={self.config['mediapipe_model_selection']}, conf={self.config['mediapipe_min_confidence']})") except Exception as e: print(f"[PersonManager] MediaPipe init failed: {e}") self.face_detector = None self.has_mediapipe = False # OpenCV 人脸检测(备用) try: model_path = cv2.data.haarcascades + 'haarcascade_frontalface_default.xml' if Path(model_path).exists(): self.cv_face_detector = cv2.CascadeClassifier(model_path) print("[PersonManager] OpenCV Haar Cascade initialized (backup)") except Exception as e: self.cv_face_detector = None print(f"[PersonManager] OpenCV detector init failed: {e}") # 方案3: YOLO 检测(更准确) self.yolo_detector = None try: from ultralytics import YOLO # 使用轻量级 nano 模型 self.yolo_detector = YOLO('yolov8n.pt') # nano 模型,快速 print("[PersonManager] YOLOv8nano initialized (most accurate)") except ImportError: print("[PersonManager] YOLO not installed. Install with: pip install ultralytics") except Exception as e: print(f"[PersonManager] YOLO init failed: {e}") def detect_faces(self, image): """检测人脸(优先使用 YOLO,其次 MediaPipe,最后 Haar) Args: image: 图片(numpy array 或路径) Returns: list: [{'bbox': [x,y,w,h], 'confidence': float}] """ if isinstance(image, str): image = cv2.imread(image) if image is None: return [] faces = [] # 方案3: YOLO 检测(优先,最准确) if self.yolo_detector is not None: try: results = self.yolo_detector(image, classes=[0], verbose=False) # class 0 = person for r in results: for box in r.boxes: x1, y1, x2, y2 = box.xyxy[0].tolist() conf = box.conf[0].item() # 转换为 [x, y, w, h] 格式 faces.append({ 'bbox': [int(x1), int(y1), int(x2-x1), int(y2-y1)], 'confidence': conf, 'source': 'yolo' }) if faces: print(f"[PersonManager] YOLO detected {len(faces)} persons") return faces # YOLO 检测成功,直接返回 except Exception as e: print(f"[PersonManager] YOLO detection failed: {e}") # 方案1+2: MediaPipe 检测 if self.has_mediapipe and self.face_detector is not None: rgb_image = cv2.cvtColor(image, cv2.COLOR_BGR2RGB) results = self.face_detector.process(rgb_image) if results.detections: for detection in results.detections: bboxC = detection.location_data.relative_bounding_box h, w, _ = image.shape x = int(bboxC.xmin * w) y = int(bboxC.ymin * h) width = int(bboxC.width * w) height = int(bboxC.height * h) faces.append({ 'bbox': [x, y, width, height], 'confidence': detection.score[0], 'source': 'mediapipe' }) if faces: return faces # 备用: OpenCV Haar 检测 if self.cv_face_detector is not None: gray = cv2.cvtColor(image, cv2.COLOR_BGR2GRAY) detections = self.cv_face_detector.detectMultiScale( gray, scaleFactor=self.config['haar_scale_factor'], minNeighbors=self.config['haar_min_neighbors'], minSize=(30, 30) ) for (x, y, w, h) in detections: faces.append({ 'bbox': [x, y, w, h], 'confidence': 0.8, 'source': 'opencv' }) return faces def extract_face_encoding(self, image, face_bbox): """提取人脸特征(用于识别是否为同一个人) 使用 MediaPipe 的人脸关键点作为特征,不依赖 dlib Args: image: 图片 face_bbox: [x, y, w, h] Returns: numpy array: 人脸特征向量 """ if isinstance(image, str): image = cv2.imread(image) if image is None: return None x, y, w, h = face_bbox # 确保坐标有效 h_img, w_img = image.shape[:2] x = max(0, min(x, w_img - 1)) y = max(0, min(y, h_img - 1)) w = max(1, min(w, w_img - x)) h = max(1, min(h, h_img - y)) # 提取人脸区域 face_image = image[y:y+h, x:x+w] # 方法1:使用 face_recognition(如果安装了) if HAS_FACE_REC: try: rgb_face = cv2.cvtColor(face_image, cv2.COLOR_BGR2RGB) encodings = face_recognition.face_encodings(rgb_face) if len(encodings) > 0: return encodings[0] except: pass # 方法2:使用 MediaPipe 人脸关键点(推荐) if self.has_mediapipe: try: mp_face_mesh = mp.solutions.face_mesh face_mesh = mp_face_mesh.FaceMesh(static_image_mode=True, max_num_faces=1) rgb_face = cv2.cvtColor(face_image, cv2.COLOR_BGR2RGB) results = face_mesh.process(rgb_face) if results.multi_face_landmarks: # 提取关键点坐标作为特征 landmarks = results.multi_face_landmarks[0] features = [] for landmark in landmarks.landmark: features.extend([landmark.x, landmark.y, landmark.z]) face_mesh.close() return np.array(features) except: pass # 方法3:使用颜色直方图(最简单,备用) face_resized = cv2.resize(face_image, (64, 64)) hsv = cv2.cvtColor(face_resized, cv2.COLOR_BGR2HSV) hist_h = cv2.calcHist([hsv], [0], None, [16], [0, 180]) hist_s = cv2.calcHist([hsv], [1], None, [16], [0, 256]) hist_v = cv2.calcHist([hsv], [2], None, [16], [0, 256]) feature = np.concatenate([ cv2.normalize(hist_h, hist_h).flatten(), cv2.normalize(hist_s, hist_s).flatten(), cv2.normalize(hist_v, hist_v).flatten() ]) return feature def match_face(self, face_encoding, threshold=None): """匹配人脸,找出对应的已知人员 Args: face_encoding: 人脸特征向量 threshold: 匹配阈值 Returns: dict: {'person_id': str, 'name': str, 'is_new': bool} """ if threshold is None: threshold = self.config['face_match_threshold'] if face_encoding is None: return {'person_id': 'unknown', 'name': 'Unknown', 'is_new': False} best_match = None best_distance = float('inf') for person_id, person_data in self.persons.items(): if 'face_encoding' in person_data: stored_encoding = np.array(person_data['face_encoding']) if HAS_FACE_REC: # face_recognition 距离计算 distance = face_recognition.face_distance([stored_encoding], face_encoding)[0] else: # 简单特征距离 distance = np.linalg.norm(stored_encoding - face_encoding) if distance < best_distance: best_distance = distance best_match = person_data if best_match and best_distance < threshold: self.known_persons_detected += 1 return { 'person_id': best_match.get('person_id'), 'name': best_match.get('name', 'Unknown'), 'is_new': False, 'confidence': 1 - best_distance } # 未匹配到,是新人员 return { 'person_id': 'unknown', 'name': 'Unknown', 'is_new': True, 'confidence': 0 } def add_new_person(self, image, face_bbox, name=None): """添加新人员到库 Args: image: 图片 face_bbox: 人脸位置 name: 人员名称(可选) Returns: dict: 新人员信息 """ if isinstance(image, str): image = cv2.imread(image) # 提取特征 face_encoding = self.extract_face_encoding(image, face_bbox) if face_encoding is None: return None # 生成人员ID person_id = f"person_{len(self.persons) + 1}" if name is None: name = f"Person #{len(self.persons) + 1}" # 保存人脸图片 x, y, w, h = face_bbox face_image = image[y:y+h, x:x+w] face_path = self.faces_dir / f"{person_id}.jpg" cv2.imwrite(str(face_path), face_image) # 记录到数据库 person_data = { 'person_id': person_id, 'name': name, 'face_encoding': face_encoding.tolist() if isinstance(face_encoding, np.ndarray) else face_encoding, 'face_path': str(face_path), 'first_seen': datetime.datetime.now().isoformat(), 'last_seen': datetime.datetime.now().isoformat(), 'visit_count': 1 } self.persons[person_id] = person_data self._save_persons_db() self.new_persons_added += 1 print(f"[PersonManager] New person added: {person_id} ({name})") return person_data def update_person_visit(self, person_id): """更新人员访问记录""" if person_id in self.persons: self.persons[person_id]['last_seen'] = datetime.datetime.now().isoformat() self.persons[person_id]['visit_count'] += 1 self._save_persons_db() def analyze_image(self, image_path, save_new_person=True): """分析图片中的人员(带连续性判断) Args: image_path: 图片路径 save_new_person: 是否保存新人员 Returns: dict: { 'faces': list, # 检测到的人脸 'persons': list, # 识别的人员 'new_count': int, # 新人员数量 'known_count': int, # 已知人员数量 'confirmed_change': bool, # 是否有确认的人员变化 } """ image = cv2.imread(image_path) if image is None: return {'faces': [], 'persons': [], 'error': 'Cannot load image'} self.total_detections += 1 # 检测人脸 faces = self.detect_faces(image) current_count = len(faces) # 方案2: 连续性判断 confirmed_change = False confirmed_persons = [] # 检查人数变化 prev_count = len(self.prev_persons) if current_count != prev_count: # 人数变化,记录到缓冲区 key = f"count_{current_count}" if key not in self.confirmation_buffer: self.confirmation_buffer[key] = {'count': 0, 'persons': []} self.confirmation_buffer[key]['count'] += 1 # 临时识别人员 temp_persons = [] for face in faces: bbox = face['bbox'] encoding = self.extract_face_encoding(image, bbox) match_result = self.match_face(encoding) person_info = { 'person_id': match_result['person_id'] if not match_result['is_new'] else 'unknown', 'name': match_result['name'], 'bbox': bbox, 'is_new': match_result['is_new'], 'confidence': face['confidence'], 'source': face['source'] } temp_persons.append(person_info) self.confirmation_buffer[key]['persons'] = temp_persons # 达到确认帧数 if self.confirmation_buffer[key]['count'] >= self.config['confirm_frames']: confirmed_change = True confirmed_persons = temp_persons print(f"[PersonManager] Confirmed: {prev_count} -> {current_count} persons (after {self.config['confirm_frames']} frames)") # 清空其他缓冲区 self.confirmation_buffer = {} # 更新前一帧状态 self.prev_persons = temp_persons else: # 人数不变,清空变化缓冲区,维持当前状态 if current_count > 0: # 识别当前人员 temp_persons = [] for face in faces: bbox = face['bbox'] encoding = self.extract_face_encoding(image, bbox) match_result = self.match_face(encoding) person_info = { 'person_id': match_result['person_id'] if not match_result['is_new'] else 'unknown', 'name': match_result['name'], 'bbox': bbox, 'is_new': match_result['is_new'], 'confidence': face['confidence'], 'source': face['source'] } temp_persons.append(person_info) confirmed_persons = temp_persons self.prev_persons = temp_persons # 清空变化缓冲区 keys_to_remove = [k for k in self.confirmation_buffer.keys() if not k.endswith(f"_{current_count}")] for k in keys_to_remove: del self.confirmation_buffer[k] # 统计新人和已知人员 new_count = 0 known_count = 0 persons_to_save = [] for person in confirmed_persons: if person['is_new']: new_count += 1 # 只有确认后才保存新人 if confirmed_change and save_new_person and len(self.persons) < self.config['max_persons']: # 找到对应的 face bbox for face in faces: if face['bbox'] == person['bbox']: new_person = self.add_new_person(image, face['bbox']) if new_person: person['person_id'] = new_person['person_id'] person['name'] = new_person['name'] persons_to_save.append(person) break else: known_count += 1 self.update_person_visit(person['person_id']) persons_to_save.append(person) return { 'faces': faces, 'persons': persons_to_save, 'new_count': new_count, 'known_count': known_count, 'total_count': len(persons_to_save), 'confirmed_change': confirmed_change, 'current_count': current_count, 'prev_count': prev_count, 'detection_source': faces[0]['source'] if faces else 'none' } def get_persons_list(self): """获取人员列表""" return [ { 'person_id': p['person_id'], 'name': p['name'], 'visit_count': p['visit_count'], 'first_seen': p['first_seen'], 'last_seen': p['last_seen'] } for p in self.persons.values() ] def get_stats(self): """获取统计信息""" return { 'total_persons': len(self.persons), 'total_detections': self.total_detections, 'known_persons_detected': self.known_persons_detected, 'new_persons_added': self.new_persons_added, 'recognition_rate': self.known_persons_detected / max(self.total_detections, 1) } def reset(self): """重置统计""" self.total_detections = 0 self.known_persons_detected = 0 self.new_persons_added = 0 # 全局实例 person_manager = PersonManager() if __name__ == "__main__": # 测试 import sys if len(sys.argv) >= 2: test_image = sys.argv[1] print(f"[Test] Analyzing: {test_image}") result = person_manager.analyze_image(test_image) print(f"[Test] Faces detected: {len(result['faces'])}") print(f"[Test] Persons: {result['total_count']}") print(f"[Test] New: {result['new_count']}, Known: {result['known_count']}") for person in result['persons']: status = "NEW" if person['is_new'] else "KNOWN" print(f" - [{status}] {person['name']} (confidence: {person['confidence']:.2f})") else: print("Usage: python person_manager.py ")