momentry_core/scripts/analyze_video_faces.py

#!/usr/bin/env python3
"""
分析 sftpgo demo 用戶視頻中的人臉
"""

import cv2
import numpy as np
import os
import sys
import json
import time
from datetime import datetime
import psycopg2
from psycopg2.extras import RealDictCursor

# 導入人臉識別處理器
sys.path.append(os.path.dirname(os.path.abspath(__file__)))
try:
    from face_recognition_processor import FaceRecognitionProcessor
except ImportError as e:
    print(f"❌ 無法導入人臉識別處理器: {e}")
    sys.exit(1)


class VideoFaceAnalyzer:
    def __init__(self):
        """初始化分析器"""
        self.processor = None
        self.db_conn = None
        self.output_dir = "/tmp/face_analysis_results"

        # 創建輸出目錄
        os.makedirs(self.output_dir, exist_ok=True)

    def connect_database(self):
        """連接數據庫"""
        try:
            self.db_conn = psycopg2.connect(
                host="localhost",
                port=5432,
                database="momentry",
                user="accusys",
                password="accusys",
            )
            print("✅ 數據庫連接成功")
            return True
        except Exception as e:
            print(f"❌ 數據庫連接失敗: {e}")
            return False

    def load_face_processor(self, use_mps=True):
        """加載人臉識別處理器"""
        try:
            print("加載人臉識別處理器...")
            self.processor = FaceRecognitionProcessor()
            self.processor.load_models(use_mps=use_mps)
            print("✅ 人臉識別處理器加載成功")
            return True
        except Exception as e:
            print(f"❌ 人臉識別處理器加載失敗: {e}")
            return False

    def extract_video_frames(self, video_path, interval_seconds=10, max_frames=100):
        """從視頻中提取幀"""
        print(f"從視頻提取幀: {video_path}")

        if not os.path.exists(video_path):
            print(f"❌ 視頻文件不存在: {video_path}")
            return []

        cap = cv2.VideoCapture(video_path)
        if not cap.isOpened():
            print(f"❌ 無法打開視頻文件: {video_path}")
            return []

        # 獲取視頻信息
        fps = cap.get(cv2.CAP_PROP_FPS)
        total_frames = int(cap.get(cv2.CAP_PROP_FRAME_COUNT))
        duration = total_frames / fps if fps > 0 else 0

        print(f"  視頻信息: {duration:.1f}秒, {total_frames}幀, {fps:.1f}FPS")

        frames = []
        frame_interval = int(fps * interval_seconds) if fps > 0 else 30

        for frame_idx in range(0, total_frames, frame_interval):
            if len(frames) >= max_frames:
                break

            cap.set(cv2.CAP_PROP_POS_FRAMES, frame_idx)
            ret, frame = cap.read()

            if ret:
                timestamp = frame_idx / fps if fps > 0 else 0
                frames.append(
                    {"frame_idx": frame_idx, "timestamp": timestamp, "image": frame}
                )

        cap.release()
        print(f"✅ 提取了 {len(frames)} 個幀 (間隔: {interval_seconds}秒)")
        return frames

    def detect_faces_in_frames(self, frames, video_uuid, video_name):
        """在幀中檢測人臉"""
        if not frames or not self.processor:
            return []

        print(f"在 {len(frames)} 個幀中檢測人臉...")

        all_detections = []

        for i, frame_data in enumerate(frames):
            frame_idx = frame_data["frame_idx"]
            timestamp = frame_data["timestamp"]
            image = frame_data["image"]

            print(f"  處理幀 {i + 1}/{len(frames)} (時間: {timestamp:.1f}秒)")

            # 檢測人臉
            detections = self.processor.detect_faces(image)

            if detections:
                print(f"    ✅ 檢測到 {len(detections)} 個人臉")

                for detection in detections:
                    detection_info = {
                        "video_uuid": video_uuid,
                        "video_name": video_name,
                        "frame_idx": frame_idx,
                        "timestamp": timestamp,
                        "x": detection["x"],
                        "y": detection["y"],
                        "width": detection["width"],
                        "height": detection["height"],
                        "confidence": float(detection["confidence"]),
                        "embedding": detection.get("embedding"),
                        "attributes": detection.get("attributes"),
                        "detected_at": datetime.now().isoformat(),
                    }
                    all_detections.append(detection_info)

                    # 在圖像上繪製邊界框
                    x = detection["x"]
                    y = detection["y"]
                    width = detection["width"]
                    height = detection["height"]
                    x1, y1 = int(x), int(y)
                    x2, y2 = int(x + width), int(y + height)

                    cv2.rectangle(image, (x1, y1), (x2, y2), (0, 255, 0), 2)
                    cv2.putText(
                        image,
                        f"Face: {detection['confidence']:.2f}",
                        (x1, y1 - 10),
                        cv2.FONT_HERSHEY_SIMPLEX,
                        0.5,
                        (0, 255, 0),
                        2,
                    )

                # 保存帶有邊界框的幀
                output_path = os.path.join(
                    self.output_dir, f"{video_uuid}_frame_{frame_idx:06d}.jpg"
                )
                cv2.imwrite(output_path, image)

        return all_detections

    def save_detections_to_db(self, detections):
        """將檢測結果保存到數據庫"""
        if not detections or not self.db_conn:
            return 0

        print(f"將 {len(detections)} 個檢測結果保存到數據庫...")

        cursor = self.db_conn.cursor()
        saved_count = 0

        for detection in detections:
            try:
                # 插入人臉檢測記錄
                cursor.execute(
                    """
                    INSERT INTO face_detections (
                        video_uuid, frame_number, timestamp_secs,
                        x, y, width, height, confidence,
                        embedding, attributes, created_at
                    ) VALUES (%s, %s, %s, %s, %s, %s, %s, %s, %s, %s, %s)
                    RETURNING id
                """,
                    (
                        detection["video_uuid"],
                        detection["frame_idx"],
                        detection["timestamp"],
                        detection["x"],
                        detection["y"],
                        detection["width"],
                        detection["height"],
                        detection["confidence"],
                        json.dumps(detection["embedding"])
                        if detection["embedding"]
                        else None,
                        json.dumps(detection["attributes"])
                        if detection["attributes"]
                        else None,
                        detection["detected_at"],
                    ),
                )

                saved_count += 1

            except Exception as e:
                print(f"❌ 保存檢測結果失敗: {e}")
                continue

        self.db_conn.commit()
        cursor.close()

        print(f"✅ 成功保存 {saved_count} 個檢測結果到數據庫")
        return saved_count

    def analyze_video(self, video_path, video_uuid, video_name):
        """分析單個視頻"""
        print(f"\n{'=' * 60}")
        print(f"分析視頻: {video_name}")
        print(f"UUID: {video_uuid}")
        print(f"路徑: {video_path}")
        print(f"{'=' * 60}")

        start_time = time.time()

        # 提取幀
        frames = self.extract_video_frames(
            video_path, interval_seconds=30, max_frames=50
        )

        if not frames:
            print("❌ 無法從視頻提取幀")
            return False

        # 檢測人臉
        detections = self.detect_faces_in_frames(frames, video_uuid, video_name)

        if not detections:
            print("⚠️  未在視頻中檢測到人臉")
            # 仍然保存結果（空結果）
            result = {
                "video_uuid": video_uuid,
                "video_name": video_name,
                "total_frames": len(frames),
                "faces_detected": 0,
                "detections": [],
                "analysis_time": time.time() - start_time,
            }
        else:
            # 保存到數據庫
            saved_count = self.save_detections_to_db(detections)

            # 生成結果摘要
            result = {
                "video_uuid": video_uuid,
                "video_name": video_name,
                "total_frames": len(frames),
                "faces_detected": len(detections),
                "saved_to_db": saved_count,
                "unique_faces": len(
                    set((d["x"], d["y"], d["width"], d["height"]) for d in detections)
                ),
                "detections": detections[:10],  # 只保存前10個檢測結果
                "analysis_time": time.time() - start_time,
            }

        # 保存結果到 JSON 文件
        result_file = os.path.join(self.output_dir, f"{video_uuid}_analysis.json")
        with open(result_file, "w", encoding="utf-8") as f:
            json.dump(result, f, indent=2, ensure_ascii=False)

        print(f"\n分析完成:")
        print(f"  - 處理幀數: {len(frames)}")
        print(f"  - 檢測到人臉: {len(detections)}")
        print(f"  - 分析時間: {result['analysis_time']:.1f}秒")
        print(f"  - 結果文件: {result_file}")

        return True

    def generate_report(self, video_results):
        """生成分析報告"""
        report_file = os.path.join(self.output_dir, "face_analysis_report.md")

        with open(report_file, "w", encoding="utf-8") as f:
            f.write("# 人臉分析報告\n\n")
            f.write(f"生成時間: {datetime.now().strftime('%Y-%m-%d %H:%M:%S')}\n\n")

            f.write("## 視頻分析摘要\n\n")
            f.write("| 視頻名稱 | UUID | 處理幀數 | 檢測到人臉 | 分析時間 |\n")
            f.write("|----------|------|----------|------------|----------|\n")

            total_frames = 0
            total_faces = 0
            total_time = 0

            for result in video_results:
                f.write(f"| {result['video_name']} | {result['video_uuid']} | ")
                f.write(f"{result['total_frames']} | {result['faces_detected']} | ")
                f.write(f"{result['analysis_time']:.1f}秒 |\n")

                total_frames += result["total_frames"]
                total_faces += result["faces_detected"]
                total_time += result["analysis_time"]

            f.write(
                f"| **總計** | - | **{total_frames}** | **{total_faces}** | **{total_time:.1f}秒** |\n\n"
            )

            f.write("## 詳細結果\n\n")

            for result in video_results:
                f.write(f"### {result['video_name']}\n\n")
                f.write(f"- **UUID**: {result['video_uuid']}\n")
                f.write(f"- **處理幀數**: {result['total_frames']}\n")
                f.write(f"- **檢測到人臉**: {result['faces_detected']}\n")

                if "unique_faces" in result:
                    f.write(f"- **獨特人臉**: {result['unique_faces']}\n")

                f.write(f"- **分析時間**: {result['analysis_time']:.1f}秒\n")
                f.write(f"- **結果文件**: `{result['video_uuid']}_analysis.json`\n\n")

                if result["faces_detected"] > 0:
                    f.write("#### 檢測示例\n\n")
                    f.write("| 時間戳 | 位置 | 置信度 | 屬性 |\n")
                    f.write("|--------|------|--------|------|\n")

                    for i, detection in enumerate(
                        result.get("detections", [])[:5]
                    ):  # 只顯示前5個
                        timestamp = detection.get("timestamp", 0)
                        x = detection.get("x", 0)
                        y = detection.get("y", 0)
                        width = detection.get("width", 0)
                        height = detection.get("height", 0)
                        confidence = detection.get("confidence", 0)
                        attributes = detection.get("attributes", {})

                        f.write(f"| {timestamp:.1f}秒 | ({x},{y},{width},{height}) | ")
                        f.write(f"{confidence:.3f} | ")

                        if attributes:
                            attrs = []
                            if attributes.get("age"):
                                attrs.append(f"年齡: {attributes['age']}")
                            if attributes.get("gender"):
                                attrs.append(f"性別: {attributes['gender']}")
                            f.write(", ".join(attrs))
                        else:
                            f.write("-")

                        f.write(" |\n")

                f.write("\n---\n\n")

            f.write("## 輸出文件\n\n")
            f.write("以下文件已生成:\n\n")

            for filename in os.listdir(self.output_dir):
                filepath = os.path.join(self.output_dir, filename)
                if os.path.isfile(filepath):
                    size = os.path.getsize(filepath)
                    f.write(f"- `{filename}` ({size:,} bytes)\n")

        print(f"\n📊 分析報告已生成: {report_file}")
        return report_file

    def cleanup(self):
        """清理資源"""
        if self.db_conn:
            self.db_conn.close()
            print("✅ 數據庫連接已關閉")


def main():
    """主函數"""
    print("=" * 60)
    print("sftpgo demo 用戶視頻人臉分析")
    print("=" * 60)

    # 視頻文件路徑
    demo_dir = "/Users/accusys/momentry/var/sftpgo/data/demo"

    videos = [
        {
            "path": os.path.join(
                demo_dir,
                "ExaSAN PCIe series - Director Ou Yu-Zhi Shares His Experience.mp4",
            ),
            "uuid": "9760d0820f0cf9a7",
            "name": "ExaSAN PCIe series - Director Ou Yu-Zhi Shares His Experience.mp4",
        },
        {
            "path": os.path.join(demo_dir, "Old_Time_Movie_Show_-_Charade_1963.HD.mov"),
            "uuid": "384b0ff44aaaa1f1",
            "name": "Old_Time_Movie_Show_-_Charade_1963.HD.mov",
        },
    ]

    # 初始化分析器
    analyzer = VideoFaceAnalyzer()

    try:
        # 連接數據庫
        if not analyzer.connect_database():
            print("⚠️  將在無數據庫連接模式下運行")

        # 加載人臉識別處理器
        if not analyzer.load_face_processor(use_mps=True):
            print("❌ 無法加載人臉識別處理器")
            return False

        # 分析每個視頻
        video_results = []

        for video_info in videos:
            if os.path.exists(video_info["path"]):
                success = analyzer.analyze_video(
                    video_info["path"], video_info["uuid"], video_info["name"]
                )

                if success:
                    # 讀取結果文件
                    result_file = os.path.join(
                        analyzer.output_dir, f"{video_info['uuid']}_analysis.json"
                    )

                    if os.path.exists(result_file):
                        with open(result_file, "r", encoding="utf-8") as f:
                            result = json.load(f)
                            video_results.append(result)
            else:
                print(f"❌ 視頻文件不存在: {video_info['path']}")

        # 生成報告
        if video_results:
            report_file = analyzer.generate_report(video_results)

            print(f"\n{'=' * 60}")
            print("分析完成!")
            print(f"{'=' * 60}")

            print(f"\n📁 輸出目錄: {analyzer.output_dir}")
            print(f"📊 分析報告: {report_file}")

            # 顯示摘要
            total_frames = sum(r["total_frames"] for r in video_results)
            total_faces = sum(r["faces_detected"] for r in video_results)
            total_time = sum(r["analysis_time"] for r in video_results)

            print(f"\n📈 分析摘要:")
            print(f"  - 總處理視頻: {len(video_results)}")
            print(f"  - 總處理幀數: {total_frames}")
            print(f"  - 總檢測人臉: {total_faces}")
            print(f"  - 總分析時間: {total_time:.1f}秒")

            # 列出生成的文件
            print(f"\n📄 生成的文件:")
            for filename in sorted(os.listdir(analyzer.output_dir)):
                filepath = os.path.join(analyzer.output_dir, filename)
                if os.path.isfile(filepath):
                    size = os.path.getsize(filepath)
                    print(f"  - {filename} ({size:,} bytes)")

        return True

    except Exception as e:
        print(f"❌ 分析過程中發生錯誤: {e}")
        import traceback

        traceback.print_exc()
        return False

    finally:
        analyzer.cleanup()


if __name__ == "__main__":
    success = main()
    sys.exit(0 if success else 1)