diff --git a/.env.development b/.env.development
index c8cf21c..861e3f8 100644
--- a/.env.development
+++ b/.env.development
@@ -41,8 +41,8 @@ MOMENTRY_PYTHON_PATH=/Users/accusys/momentry_core/venv/bin/python
 MOMENTRY_SCRIPTS_DIR=/Users/accusys/momentry_core/scripts
 
 # Logging
-RUST_LOG=debug
-MOMENTRY_LOG_LEVEL=debug
+RUST_LOG=info
+MOMENTRY_LOG_LEVEL=info
 
 # Media
 MOMENTRY_MEDIA_BASE_URL=https://wp.momentry.ddns.net
@@ -77,5 +77,27 @@ MOMENTRY_LLM_SUMMARY_URL=http://127.0.0.1:8082/v1/chat/completions
 MOMENTRY_LLM_SUMMARY_MODEL=google_gemma-4-26B-A4B-it-Q5_K_M.gguf
 MOMENTRY_LLM_SUMMARY_ENABLED=true
 
+# LLM Chat (A4B on port 8082)
+MOMENTRY_LLM_CHAT_URL=http://127.0.0.1:8082/v1/chat/completions
+MOMENTRY_LLM_CHAT_MODEL=google_gemma-4-26B-A4B-it-Q5_K_M.gguf
+
+# LLM Vision (E4B on port 8083)
+MOMENTRY_LLM_VISION_URL=http://127.0.0.1:8083/v1/chat/completions
+MOMENTRY_LLM_VISION_MODEL=gemma-4-E4B-it-Q4_K_M.gguf
+
 # Embedding (ANE CoreML server)
 MOMENTRY_EMBED_URL=http://localhost:11436
+
+# === Binary & Data Paths (for start_momentry.sh) ===
+MOMENTRY_LOG_DIR=/Users/accusys/momentry/logs
+MOMENTRY_PG_BIN_DIR=/Users/accusys/pgsql/18.3/bin
+MOMENTRY_PG_DATA_DIR=/Users/accusys/pgsql/data
+MOMENTRY_QDRANT_BIN=/Users/accusys/.cargo/bin/qdrant
+MOMENTRY_QDRANT_STORAGE_DIR=/Users/accusys/momentry/qdrant_storage
+MOMENTRY_LLAMACPP_BIN=/Users/accusys/llama/bin/llama-server
+MOMENTRY_LLM_A4B_MODEL_PATH=/Users/accusys/models/google_gemma-4-26B-A4B-it-Q5_K_M.gguf
+MOMENTRY_LLM_A4B_MMPROJ_PATH=/Users/accusys/models/gemma-4-26B-A4B-it.mmproj-f16.gguf
+MOMENTRY_LLM_E4B_MODEL_PATH=/Users/accusys/models/gemma-4-E4B-it-Q4_K_M.gguf
+MOMENTRY_LLM_E4B_MMPROJ_PATH=/Users/accusys/models/mmproj-gemma-4-E4B-it-BF16.gguf
+MOMENTRY_OLLAMA_BIN=/Users/accusys/bin/ollama
+MOMENTRY_PLAYGROUND_BIN=target/debug/momentry_playground
diff --git a/.env.example b/.env.example
index 1cfbbdb..24d2e75 100644
--- a/.env.example
+++ b/.env.example
@@ -32,6 +32,16 @@ MOMENTRY_LLM_SUMMARY_URL=http://127.0.0.1:8082/v1/chat/completions
 MOMENTRY_LLM_SUMMARY_MODEL=google_gemma-4-26B-A4B-it-Q5_K_M.gguf
 MOMENTRY_LLM_SUMMARY_TIMEOUT=120
 
+# LLM Chat (A4B)
+MOMENTRY_LLM_CHAT_URL=http://127.0.0.1:8082/v1/chat/completions
+MOMENTRY_LLM_CHAT_MODEL=google_gemma-4-26B-A4B-it-Q5_K_M.gguf
+MOMENTRY_LLM_CHAT_TIMEOUT=120
+
+# LLM Vision (E4B)
+MOMENTRY_LLM_VISION_URL=http://127.0.0.1:8083/v1/chat/completions
+MOMENTRY_LLM_VISION_MODEL=gemma-4-E4B-it-Q4_K_M.gguf
+MOMENTRY_LLM_VISION_TIMEOUT=120
+
 # === Paths ===
 MOMENTRY_OUTPUT_DIR=/Users/accusys/momentry/output_dev
 MOMENTRY_BACKUP_DIR=/Users/accusys/momentry/backup
diff --git a/.gitignore b/.gitignore
index b5a894d..7753297 100644
--- a/.gitignore
+++ b/.gitignore
@@ -15,6 +15,35 @@ __pycache__/
 node_modules/
 *.log
 /tmp/
-*.log
+*.diff
+*.bundle
+*.probe.json
+*.cut.json
+.qdrant-initialized
+dump.rdb
+fix55.js
+checksums.sha256
 
 scripts/swift_processors/.build/
+.opencode/
+.vscode/
+backups/
+logs/
+output/
+models/
+data/
+storage/
+thumbnails/
+services/
+model_checkpoints/
+release/delivery/
+release/system/
+release/phase*/
+release/dev_*.sql
+release/migrate_*.sql
+release/files/
+package-lock.json
+package.json
+portal/dist/
+portal/src-tauri/icons/
+momentry_runtime/logs/
diff --git a/AGENTS.md b/AGENTS.md
index ebdf62a..dde43ed 100644
--- a/AGENTS.md
+++ b/AGENTS.md
@@ -14,6 +14,7 @@ Rust-based digital asset management system with video analysis and RAG capabilit
 - **🔴 DELETE / REMOVE / DROP / CLEAR 任何資料前必須先問使用者「要刪嗎？」獲得明確同意後才能執行**
 - **🔴 Qdrant collection 刪除、DB truncate、檔案刪除、資料清空 — 一律要先問**
 - **🔴 不確定是否該刪 → 先問，不要自己決定**
+- **🔴 改變議題前必須先存檔紀錄**：使用 `todowrite` 工具或建立紀錄文件（如 `docs_v1.0/M4_workspace/YYYY-MM-DD_topic_handoff.md`），確保上下文不丟失
 
 ### 開發範圍界定
 | 範圍 | 狀態 | 說明 |
diff --git a/Cargo.toml b/Cargo.toml
index c5fb540..b712fa6 100644
--- a/Cargo.toml
+++ b/Cargo.toml
@@ -134,6 +134,14 @@ path = "src/bin/integrated_player.rs"
 name = "release"
 path = "src/bin/release.rs"
 
+[[bin]]
+name = "vectorize_missing"
+path = "src/bin/vectorize_missing.rs"
+
+[[bin]]
+name = "sync_qdrant_from_pg"
+path = "src/bin/sync_qdrant_from_pg.rs"
+
 [[bin]]
 name = "service"
 path = "src/bin/service.rs"
diff --git a/config/README.md b/config/README.md
index 4306b33..f55b39f 100644
--- a/config/README.md
+++ b/config/README.md
@@ -1,105 +1,178 @@
-# Momentry Core 配置管理
+# Momentry Core Config Management
 
-## 目錄結構
+## Directory Structure
 
 ```
 momentry_core_0.1/
-├── .env.example          # 配置模板（已納入版本控制）
-├── .env                  # 本地配置（已從版本控制排除）
-├── .env.local           # 本地覆蓋配置（已從版本控制排除）
+├── .env.example          # Template (version controlled)
+├── .env                  # Local config (gitignored)
+├── .env.development      # Playground dev overrides (gitignored)
+├── .env.local            # Local overrides (gitignored)
 ├── config/
-│   └── README.md        # 本文件
-└── src/core/config.rs   # 配置代碼
+│   ├── README.md         # This file
+│   └── port_registry.tsv # Central port registry
+└── src/core/config.rs    # Config code with lazy_static env reading
 ```
 
-## 配置加載順序
+## Load Order
 
-1. `.env` - 默認本地配置
-2. `.env.local` - 本地覆蓋（最高優先級）
+For `momentry_playground` (development):
+1. `.env` — shared defaults
+2. `.env.development` — dev-specific overrides (loaded by playground binary)
 
-## 環境變數列表
+For `momentry` (production):
+1. `.env` — production config
 
-### 數據庫配置
+In Rust: `config.rs` reads env vars with lazy_static, falling back to hardcoded defaults.
 
-| 變數 | 說明 | 默認值 |
-|------|------|--------|
-| `DATABASE_URL` | PostgreSQL 連接字串 | `postgres://accusys@localhost:5432/momentry` |
+## Environment Variables
 
-### Redis 配置
+### Server
 
-| 變數 | 說明 | 默認值 |
-|------|------|--------|
-| `REDIS_URL` | Redis 連接字串 | `redis://:accusys@localhost:6379` |
-| `REDIS_PASSWORD` | Redis 密碼 | `accusys` |
+| Variable | Description | Default |
+|----------|-------------|---------|
+| `MOMENTRY_SERVER_PORT` | Server port (3002=prod, 3003=dev) | `3002` |
+| `MOMENTRY_REDIS_PREFIX` | Redis key prefix | `momentry:` (prod), `momentry_dev:` (dev) |
 
-### 存儲路徑
+### Database
 
-| 變數 | 說明 | 默認值 |
-|------|------|--------|
-| `MOMENTRY_OUTPUT_DIR` | 輸出目錄 | `/Users/accusys/momentry/output` |
-| `MOMENTRY_BACKUP_DIR` | 備份目錄 | `/Users/accusys/momentry/backup/momentry` |
-| `MOMENTRY_SCRIPTS_DIR` | 腳本目錄 | `/Users/accusys/momentry_core_0.1/scripts` |
-| `MOMENTRY_PYTHON_PATH` | Python 路徑 | `/opt/homebrew/bin/python3.11` |
+| Variable | Description | Default |
+|----------|-------------|---------|
+| `DATABASE_URL` | PostgreSQL connection string | `postgres://accusys@localhost:5432/momentry` |
+| `DATABASE_SCHEMA` | Schema for dev isolation | `dev` |
+| `MONGODB_URL` | MongoDB connection string | `mongodb://localhost:27017` |
+| `MONGODB_DATABASE` | MongoDB database name | `momentry` (prod), `momentry_dev` (dev) |
+| `MONGODB_CACHE_ENABLED` | MongoDB cache toggle | `true` |
+| `MONGODB_CACHE_TTL_VIDEOS` | Cache TTL for videos | `300` |
+| `MONGODB_CACHE_TTL_SEARCH` | Cache TTL for search | `300` |
+| `MONGODB_CACHE_TTL_HYBRID_SEARCH` | Cache TTL for hybrid search | `600` |
+| `MONGODB_CACHE_TTL_VIDEO_META` | Cache TTL for video metadata | `3600` |
 
-### 處理器超時（秒）
+### Redis
 
-| 變數 | 說明 | 默認值 |
-|------|------|--------|
-| `MOMENTRY_ASR_TIMEOUT` | ASR 處理超時 | `3600` |
-| `MOMENTRY_CUT_TIMEOUT` | CUT 處理超時 | `3600` |
-| `MOMENTRY_DEFAULT_TIMEOUT` | 默認超時 | `7200` |
+| Variable | Description | Default |
+|----------|-------------|---------|
+| `REDIS_URL` | Redis connection string | `redis://:accusys@localhost:6379` |
+| `REDIS_PASSWORD` | Redis password | `accusys` |
+| `REDIS_CACHE_TTL_HEALTH` | Health check cache TTL | `30` |
+| `REDIS_CACHE_TTL_VIDEO_META` | Video metadata cache TTL | `3600` |
 
-### 日誌
+### Qdrant
 
-| 變數 | 說明 | 默認值 |
-|------|------|--------|
-| `RUST_LOG` | 日誌級別 | `info` |
-| `MOMENTRY_LOG_LEVEL` | 日誌級別（備選） | `info` |
+| Variable | Description | Default |
+|----------|-------------|---------|
+| `QDRANT_URL` | Qdrant server URL | `http://localhost:6333` |
+| `QDRANT_API_KEY` | Qdrant API key | `Test3200Test3200Test3200` |
+| `QDRANT_COLLECTION` | Collection name | `momentry_rule1` (prod), `momentry_dev_rule1_v2` (dev) |
 
-## 使用方式
+### LLM
 
-### 1. 首次設置
+| Variable | Description | Default |
+|----------|-------------|---------|
+| `MOMENTRY_LLM_CHAT_URL` | Chat/function-calling endpoint | `http://127.0.0.1:8082/v1/chat/completions` |
+| `MOMENTRY_LLM_CHAT_MODEL` | Chat model name | `google_gemma-4-26B-A4B-it-Q5_K_M.gguf` |
+| `MOMENTRY_LLM_VISION_URL` | Vision LLM endpoint (E4B) | falls back to CHAT_URL |
+| `MOMENTRY_LLM_VISION_MODEL` | Vision model name (E4B) | falls back to CHAT_MODEL |
+| `MOMENTRY_LLM_SUMMARY_URL` | Summary LLM endpoint (5W1H) | falls back to CHAT_URL |
+| `MOMENTRY_LLM_SUMMARY_MODEL` | Summary model name | falls back to CHAT_MODEL |
+| `MOMENTRY_LLM_SUMMARY_ENABLED` | Toggle 5W1H summary generation | `true` |
+| `MOMENTRY_LLM_SUMMARY_TIMEOUT` | 5W1H timeout in seconds | `120` |
+| `MOMENTRY_LLM_CHAT_TIMEOUT` | Chat LLM timeout in seconds | `120` |
+| `MOMENTRY_LLM_VISION_TIMEOUT` | Vision LLM timeout in seconds | `120` |
+
+### Embedding
+
+| Variable | Description | Default |
+|----------|-------------|---------|
+| `MOMENTRY_EMBED_URL` | Embedding server URL | `http://localhost:11436` |
+
+### TMDb Integration
+
+| Variable | Description | Default |
+|----------|-------------|---------|
+| `TMDB_API_KEY` | TMDb API key (required for probe) | (none) |
+| `MOMENTRY_TMDB_PROBE_ENABLED` | Enable TMDb probe during register | `false` |
+
+### Paths
+
+| Variable | Description | Default |
+|----------|-------------|---------|
+| `MOMENTRY_OUTPUT_DIR` | Output directory for processing | `/Users/accusys/momentry/output` |
+| `MOMENTRY_BACKUP_DIR` | Backup directory | `/Users/accusys/momentry/backup/momentry` |
+| `MOMENTRY_SCRIPTS_DIR` | Python scripts directory | `/Users/accusys/momentry_core_0.1/scripts` |
+| `MOMENTRY_PYTHON_PATH` | Python interpreter path | `/opt/homebrew/bin/python3.11` |
+| `MOMENTRY_MEDIA_BASE_URL` | Base URL for media serving | (none) |
+
+### Processor Timeouts
+
+| Variable | Description | Default |
+|----------|-------------|---------|
+| `MOMENTRY_ASR_TIMEOUT` | ASR timeout in seconds | `3600` |
+| `MOMENTRY_CUT_TIMEOUT` | CUT timeout in seconds | `3600` |
+| `MOMENTRY_DEFAULT_TIMEOUT` | Default timeout in seconds | `7200` |
+
+### Logging
+
+| Variable | Description | Default |
+|----------|-------------|---------|
+| `RUST_LOG` | Rust log level (tracing) | `info` |
+| `MOMENTRY_LOG_LEVEL` | Fallback log level | `info` |
+
+### Worker
+
+| Variable | Description | Default |
+|----------|-------------|---------|
+| `MOMENTRY_WORKER_ENABLED` | Enable background worker | `true` |
+| `MOMENTRY_MAX_CONCURRENT` | Max concurrent jobs | `6` |
+| `MOMENTRY_POLL_INTERVAL` | Poll interval in seconds | `10` |
+| `MOMENTRY_WORKER_BATCH_SIZE` | Batch size | `5` |
+
+### Synonym Expansion
+
+| Variable | Description | Default |
+|----------|-------------|---------|
+| `MOMENTRY_SYNONYM_FILES` | Comma-separated paths to synonym JSON files | (none) |
+| `MOMENTRY_SYNONYM_FILE` | Single synonym file (deprecated) | (none) |
+
+### Encryption
+
+| Variable | Description | Default |
+|----------|-------------|---------|
+| `AUDIT_ENCRYPTION_KEY` | 32-byte hex encryption key (64 hex chars) | (none) |
+
+## Port Registry
+
+See `config/port_registry.tsv` for the authoritative list of all ports and their owners.
+
+| Port | Service | Owner | Config Key |
+|------|---------|-------|------------|
+| 5432 | PostgreSQL | postgres | `DATABASE_URL` |
+| 6379 | Redis | redis-server | `REDIS_URL` |
+| 6333 | Qdrant | qdrant | `QDRANT_URL` |
+| 8082 | LLM Chat (A4B) | llama-server | `MOMENTRY_LLM_CHAT_URL` |
+| 8083 | LLM Vision (E4B) | llama-server | `MOMENTRY_LLM_VISION_URL` |
+| 11434 | Ollama | ollama | `MOMENTRY_OLLAMA_URL` |
+| 11436 | Embedding | embeddinggemma_server.py | `MOMENTRY_EMBED_URL` |
+| 27017 | MongoDB | mongod | `MONGODB_URL` |
+| 3002 | Production API | momentry | `MOMENTRY_SERVER_PORT` |
+| 3003 | Playground API | momentry_playground | `MOMENTRY_SERVER_PORT` |
+
+## Quick Start
 
 ```bash
-# 複製模板
+# 1. Copy template
 cp .env.example .env
 
-# 編輯配置
-nano .env
+# 2. Edit .env for production or use .env.development for playground
+# 3. Start all services
+./scripts/start_momentry.sh
 ```
 
-### 2. 本地覆蓋
+## Version Control
 
-創建 `.env.local` 設置僅本地適用的配置：
-
-```bash
-# .env.local 示例
-DATABASE_URL=postgres://local:password@localhost:5432/momentry_dev
-MOMENTRY_LOG_LEVEL=debug
-```
-
-### 3. 運行應用
-
-```bash
-# 加載配置並運行
-source .env && cargo run
-
-# 或使用 direnv
-direnv allow
-```
-
-## 版本控制策略
-
-| 文件 | 版本控制 | 說明 |
-|------|---------|------|
-| `.env.example` | ✅ 追蹤 | 模板，包含所有選項 |
-| `.env` | ❌ 忽略 | 本地敏感配置 |
-| `.env.local` | ❌ 忽略 | 本地覆蓋配置 |
-
-## 部署檢查清單
-
-- [ ] 複製 `.env.example` 到 `.env`
-- [ ] 設置數據庫連接
-- [ ] 設置 Redis 密碼
-- [ ] 配置目錄路徑
-- [ ] 確認日誌級別
+| File | Tracked | Purpose |
+|------|---------|---------|
+| `.env.example` | ✅ Yes | Template with all options documented |
+| `.env` | ❌ No | Local sensitive config |
+| `.env.development` | ❌ No | Dev-specific overrides |
+| `.env.local` | ❌ No | Local overrides (highest priority) |
diff --git a/config/port_registry.tsv b/config/port_registry.tsv
index dc1b202..cba1061 100644
--- a/config/port_registry.tsv
+++ b/config/port_registry.tsv
@@ -16,7 +16,9 @@
 6379	redis		redis-server		REDIS_URL			redis://...:6379	start_momentry.sh
 6333	qdrant		qdrant			QDRANT_URL			http://...:6333		start_momentry.sh
 8081	wordpress	Caddy			-				-			Caddyfile
-8082	llm		llama-server		MOMENTRY_LLM_CHAT_URL		http://...:8082		start_momentry.sh
+8082	llm-chat	llama-server		MOMENTRY_LLM_CHAT_URL		http://...:8082		start_momentry.sh
+8083	llm-vision	llama-server		MOMENTRY_LLM_VISION_URL		http://...:8083		start_momentry.sh
 9000	php-fpm		php-fpm			-				9000			brew services
 11434	ollama		ollama			MOMENTRY_OLLAMA_URL		http://...:11434	start_momentry.sh
 11436	embedding	embeddinggemma		MOMENTRY_EMBED_URL		http://...:11436	start_momentry.sh
+27017	mongodb		mongod			MONGODB_URL			mongodb://...:27017	start_momentry.sh
diff --git a/deliverable_v1.1.0/AGENTS.md b/deliverable_v1.1.0/AGENTS.md
new file mode 100644
index 0000000..179b760
--- /dev/null
+++ b/deliverable_v1.1.0/AGENTS.md
@@ -0,0 +1,761 @@
+# AGENTS.md - Momentry Core
+
+Rust-based digital asset management system with video analysis and RAG capabilities.
+
+---
+
+## ⚠️ CRITICAL: 開發隔離原則
+
+### 絕對禁止事項
+- **絕對不可修改 `/Users/accusys/wordpress/` 目錄下的任何檔案**
+- **絕對不可修改 n8n 工作流或設定**
+- **絕對不可修改 WordPress 或 n8n 的資料庫 table**
+- **除非是 release 作業，絕對不可動 port 3002 (production)**
+- **🔴 DELETE / REMOVE / DROP / CLEAR 任何資料前必須先問使用者「要刪嗎？」獲得明確同意後才能執行**
+- **🔴 Qdrant collection 刪除、DB truncate、檔案刪除、資料清空 — 一律要先問**
+- **🔴 不確定是否該刪 → 先問，不要自己決定**
+
+### 開發範圍界定
+| 範圍 | 狀態 | 說明 |
+|------|------|------|
+| `momentry_core_0.1/` | ✅ **可開發** | Momentry Core 主要開發目錄 |
+| `momentry_core_0.1/portal/` | ✅ **可開發** | Tauri Portal 前端 |
+| `momentry_core_0.1/src/` | ✅ **可開發** | Rust 後端程式碼 |
+| `/Users/accusys/wordpress/` | ❌ **禁止修改** | WordPress/Marcom 團隊負責 |
+| n8n 工作流 | ❌ **禁止修改** | 自動化流程，與 dev 無關 |
+| WordPress/n8n 資料庫 table | ❌ **禁止修改** | Marcom 團隊管理，與 dev 無關 |
+
+### 開發環境
+| 服務 | Port | 用途 | 命令 |
+|------|------|------|------|
+| Playground | 3003 | **唯一開發環境** | `cargo run --bin momentry_playground -- server` |
+| Production | 3002 | ❌ 禁止修改 | `cargo run -- server` (僅 release 時) |
+| Portal (Tauri) | 1420 | 前端開發 | `npm run tauri dev` |
+
+## ⚠️ 交叉污染防制 (Cross-Contamination Prevention)
+
+**每個執行前必須評估是否會汙染其他獨立作業。**
+
+### Scope Isolation Matrix
+
+| 執行內容 | 允許的 Scope | 禁止影響 | 檢查事項 |
+|----------|-------------|----------|----------|
+| M4 delivery binary | `target/release/momentry` | Playground (3003), Production (3002) | 確認舊 process 未被誤殺 |
+| Playground server | `localhost:3003`, `dev.*` schema | Production (3002), `public.*` schema | `DATABASE_SCHEMA=dev` |
+| Production deploy | `localhost:3002`, `public.*` schema | Playground (3003), `dev.*` schema | 先停 production，不影響 playground |
+| Git commit | 只包含意圖修改的檔案 | 無關的 untracked files | `git status` 確認 stage 內容正確 |
+| CI / packaged tests | 測試環境 | 正式資料 | 測試用 DB 不能連到 production |
+| Doc changes | 指定文件 | 其他文件、程式碼 | `git diff --stat` 檢查 scope |
+| SQL migration | 目標 schema | 其他 schema、無關 table | `WHERE` clause 要精準 |
+| `sed` / `grep` / mass edit | 目標檔案集 | 非目標檔案 | 先用 `grep -c` 確認只有目標檔案匹配 |
+
+### Recent Violations / Near-Misses
+
+| 事件 | 問題 | 防止方式 |
+|------|------|----------|
+| `sed` API doc 編號 | `sed -i '' 's/.../.../g'` 改到所有行 | 先 `grep -c` 確認匹配，`git diff` 再提交 |
+| 亂加 `/api/v1/register` route | 不必要的 API 別名，汙染路由表 | 角色切換：路由設計不該由實作方決定 |
+| `API_WORKSPACE/` vs `GUIDES/` vs `REFERENCE/` vs `DESIGN/` vs `OPERATIONS/` vs `INTEGRATIONS/` | 文件放到錯誤分類 | API 文件改在 API_WORKSPACE/modules/ 編輯，`make deploy` 生成到 GUIDES/ |
+| Build release binary in plan mode | 浪費時間，無意義 | 嚴格遵守 plan/build mode 規定 |
+
+### ⛔ 嚴格測試隔離規則 (Strict Test Isolation)
+- **所有測試 (Test) 必須在 Dev (3003) 進行**。
+- **絕對禁止 (ABSOLUTELY FORBIDDEN)** 在任何測試指令、Demo 流程或 API 檢查中使用 `localhost:3002`。
+- 即使是「測試 Unregister」或「檢查版本」，若未明確標示為 "Production Deployment"，一律視為違規。
+- **預設行為**: 所有 curl, CLI, 或程式碼測試指令，預設 URL 必須為 `http://localhost:3003`。
+
+### 違反後果
+- 修改 WordPress/n8n 可能影響 marcom 團隊工作與生產環境
+- 修改 WordPress/n8n 資料庫 table 可能破壞自動化流程與資料完整性
+- 修改 port 3002 可能中斷正在使用的服務 (這是非常嚴重的錯誤)
+- 所有 dev 測試必須在 playground (3003) 進行
+
+---
+
+## AI Coding Principles (Karpathy-Inspired)
+
+Behavioral guidelines to reduce common LLM coding mistakes.
+Source: [andrej-karpathy-skills](https://github.com/forrestchang/andrej-karpathy-skills) (94K stars)
+
+**Tradeoff:** These guidelines bias toward caution over speed. For trivial tasks, use judgment.
+
+### 1. Think Before Coding
+
+**Don't assume. Don't hide confusion. Surface tradeoffs.**
+
+- State your assumptions explicitly. If uncertain, ask.
+- If multiple interpretations exist, present them - don't pick silently.
+- If a simpler approach exists, say so. Push back when warranted.
+- If something is unclear, stop. Name what's confusing. Ask.
+
+### 2. Simplicity First
+
+**Minimum code that solves the problem. Nothing speculative.**
+
+- No features beyond what was asked.
+- No abstractions for single-use code.
+- No "flexibility" or "configurability" that wasn't requested.
+- No error handling for impossible scenarios.
+- If you write 200 lines and it could be 50, rewrite it.
+
+Ask yourself: "Would a senior engineer say this is overcomplicated?" If yes, simplify.
+
+### 3. Surgical Changes
+
+**Touch only what you must. Clean up only your own mess.**
+
+When editing existing code:
+- Don't "improve" adjacent code, comments, or formatting.
+- Don't refactor things that aren't broken.
+- Match existing style, even if you'd do it differently.
+- If you notice unrelated dead code, mention it - don't delete it.
+
+When your changes create orphans:
+- Remove imports/variables/functions that YOUR changes made unused.
+- Don't remove pre-existing dead code unless asked.
+
+The test: Every changed line should trace directly to the user's request.
+
+### 4. Goal-Driven Execution
+
+**Define success criteria. Loop until verified.**
+
+Transform tasks into verifiable goals:
+- "Add validation" -> "Write tests for invalid inputs, then make them pass"
+- "Fix the bug" -> "Write a test that reproduces it, then make it pass"
+- "Refactor X" -> "Ensure tests pass before and after"
+
+For multi-step tasks, state a brief plan:
+```
+1. [Step] -> verify: [check]
+2. [Step] -> verify: [check]
+3. [Step] -> verify: [check]
+```
+
+Strong success criteria let you loop independently. Weak criteria ("make it work") require constant clarification.
+
+---
+
+These guidelines are working if: fewer unnecessary changes in diffs, fewer rewrites due to overcomplication, and clarifying questions come before implementation rather than after mistakes.
+
+---
+
+## Terminology (V4.0)
+
+| Term | Scope | Description | Example |
+|------|-------|-------------|---------|
+| **file_uuid** | Video file | Video file identifier (renamed from `video_uuid`) | `384b0ff44aaaa1f1` |
+| **identity_uuid** | Global identity | Global person identity (cross-file) | `a9a90105-6d6b-46ff-92da-0c3c1a57dff4` |
+| **face_id** | Single detection | Single face detection (frame-level) | `face_100` |
+| **trace_id** | Face tracking | Face tracking ID (Face Tracker output) | `2` |
+| **chunk_id** | Sentence chunk | Sentence chunk (from pre_chunks via rules) | `chunk_1` |
+| **speaker_id** | Speaker segment | Speaker ID (from ASRX) | `SPEAKER_0` |
+| **person_id** | ❌ **Deprecated** | Video-local person ID (removed in V4.0) | - |
+
+### Architecture (V4.0)
+
+```
+Face → Identity (Two-layer, direct binding)
+  ↓
+  person_identities table: REMOVED
+  file_identities table: ADDED (N:N relationship)
+```
+
+### Key Changes (V3.x → V4.0)
+
+| Change | V3.x | V4.0 |
+|--------|------|------|
+| **video_uuid** | Used everywhere | **file_uuid** |
+| **person_identities** | Required (303 records) | **Removed** |
+| **person_id APIs** | 28 endpoints | **Removed** (except register/bind) |
+| **Face binding** | Person → Identity | **Face → Identity** (direct) |
+| **Chunk binding** | Manual | **Auto** (time alignment) |
+
+---
+
+## Build & Run Commands
+
+```bash
+# Build project (use debug builds for development/testing)
+cargo build
+cargo build --bin momentry
+cargo build --bin momentry_playground
+
+# Build all binaries
+cargo build --bins
+
+# Run CLI
+cargo run -- --help
+cargo run -- register /path/to/video.mp4
+cargo run -- server --host 0.0.0.0 --port 3002
+
+# Run playground (development binary)
+cargo run --bin momentry_playground -- server
+cargo run --bin momentry_playground -- --help
+```
+
+### ⚠️ CRITICAL: `cargo build --release` PROHIBITION
+- **NEVER run `cargo build --release` unless the user explicitly says "release the binary" or "正式 release"**
+- `cargo build --release` is SLOW and only needed when producing a production binary for deployment
+- For all development, testing, debugging, and linting: use `cargo build` or `cargo check`
+- If uncertain, ALWAYS ask the user first
+
+## Binaries
+
+| Binary | Purpose | Port | Redis Prefix | Environment |
+|--------|---------|------|--------------|-------------|
+| `momentry` | Production | 3002 | `momentry:` | `.env` |
+| `momentry_playground` | Development | 3003 | `momentry_dev:` | `.env.development` |
+| `momentry_player` | Video player | - | - | - |
+
+## Testing
+
+```bash
+# Run all tests
+cargo test
+
+# Run single test by name
+cargo test test_name
+
+# Run with output
+cargo test -- --nocapture
+
+# Doc tests
+cargo test --doc
+```
+
+## Linting & Formatting
+
+```bash
+# Format code (edition=2021, max_width=100, tab_spaces=4)
+cargo fmt
+cargo fmt -- --check
+
+# Lint
+cargo clippy
+cargo clippy --all-features
+
+# Check for errors
+cargo check
+cargo check --all-features
+```
+
+## Code Style
+
+### General
+- Use Rust 2021 edition
+- Use tracing for logging (not println!)
+- Keep lines under 100 characters
+
+### Imports (order: std → external → local)
+```rust
+use std::path::Path;
+use anyhow::{Context, Result};
+use async_trait::async_trait;
+use serde::{Deserialize, Serialize};
+
+use crate::core::chunk::Chunk;
+```
+
+### Error Handling
+- Use `anyhow::Result<T>` for application code
+- Use `thiserror` for library code
+- Use `.context()` for error context
+- Use `anyhow::bail!()` for early returns
+
+```rust
+fn example() -> Result<SomeType> {
+    let output = Command::new("ffprobe")
+        .args([...])
+        .output()
+        .context("Failed to run ffprobe")?;
+
+    if !output.status.success() {
+        anyhow::bail!("Command failed");
+    }
+    Ok(result)
+}
+```
+
+### Naming
+- Types/Enums: PascalCase (`VideoRecord`, `ChunkType`)
+- Functions/Variables: snake_case (`get_video_by_uuid`)
+- Traits: PascalCase, named for the capability they provide (`Database`, `ChunkStore`)
+- Files: snake_case (`postgres_db.rs`)
+
+### Types
+- Use `serde::{Deserialize, Serialize}` for serializable types
+- Use `#[serde(rename_all = "snake_case")]` for enum variants
+- Use explicit numeric types (i64, u32, f64)
+
+```rust
+#[derive(Debug, Clone, Serialize, Deserialize)]
+pub struct VideoRecord {
+    pub id: i64,
+    pub uuid: String,
+    pub duration: f64,
+    pub width: u32,
+}
+
+#[derive(Debug, Clone, Copy, Serialize, Deserialize, PartialEq)]
+#[serde(rename_all = "snake_case")]
+pub enum ChunkType {
+    TimeBased,
+    Sentence,
+    Cut,
+}
+```
+
+### Async Programming
+- Use `tokio` runtime with full features
+- Use `#[async_trait]` for async trait methods
+
+```rust
+#[async_trait]
+pub trait Database: Send + Sync {
+    async fn init() -> Result<Self>
+    where Self: Sized;
+}
+```
+
+## Code Structure
+
+```
+src/
+├── main.rs           # CLI entry point
+├── lib.rs            # Library exports
+├── core/
+│   ├── api_key/     # API key management (anomaly, blacklist, encryption, etc.)
+│   ├── chunk/        # Chunking logic
+│   ├── config.rs     # Centralized configuration (env vars)
+│   ├── db/          # Database (PostgreSQL, MongoDB, Redis, Qdrant)
+│   ├── embedding/   # Vector embeddings
+│   ├── overlay/     # Video overlay
+│   ├── probe/       # ffprobe integration
+│   ├── processor/   # ASR, OCR, YOLO, Face, Pose, CUT, ASRX
+│   │   └── executor.rs  # Unified Python script executor
+│   ├── storage/     # File management
+│   └── thumbnail/   # Thumbnail extraction
+├── api/              # HTTP API (axum)
+├── player/           # Video player
+├── ui/               # TUI components
+└── watcher/          # File system watcher
+```
+
+## Key Dependencies
+
+- **Error handling**: `anyhow`, `thiserror`
+- **Async**: `tokio` (full features), `async-trait`
+- **CLI**: `clap` (derive)
+- **Serialization**: `serde`, `serde_json`, `chrono`
+- **Database**: `sqlx`, `mongodb`, `redis` (1.0), `qdrant-client`
+- **HTTP**: `axum`, `tower`
+- **Logging**: `tracing`, `tracing-subscriber`
+- **Config**: `once_cell` (lazy static config)
+
+## Environment Variables
+
+### Server
+- `MOMENTRY_SERVER_PORT` - API server port (default: `3002` for production, `3003` for playground)
+- `MOMENTRY_REDIS_PREFIX` - Redis key prefix (default: `momentry:` for production, `momentry_dev:` for playground)
+- `MOMENTRY_API_KEY` - API key for Player online mode testing
+
+### Testing API Key
+```bash
+export MOMENTRY_API_KEY="muser_68600856036340bcafc01930eb4bd839_1774418104_97221b69"
+
+# Test Player online mode
+cargo run --features player --bin momentry_player -- -o
+```
+
+### Database
+- `DATABASE_URL` - PostgreSQL (default: `postgres://accusys@localhost:5432/momentry`)
+
+### Redis
+- `REDIS_URL` - Redis URL (default: `redis://:accusys@localhost:6379`)
+- `REDIS_PASSWORD` - Redis password (default: `accusys`)
+
+### Paths
+- `MOMENTRY_OUTPUT_DIR` - Output directory (default: `/Users/accusys/momentry/output`)
+- `MOMENTRY_BACKUP_DIR` - Backup directory
+- `MOMENTRY_PYTHON_PATH` - Python path (default: `/opt/homebrew/bin/python3.11`)
+- `MOMENTRY_SCRIPTS_DIR` - Scripts directory
+
+### Processor Timeouts
+- `MOMENTRY_ASR_TIMEOUT` - ASR timeout in seconds (default: 3600)
+- `MOMENTRY_CUT_TIMEOUT` - CUT timeout in seconds (default: 3600)
+- `MOMENTRY_DEFAULT_TIMEOUT` - Default timeout (default: 7200)
+
+### TMDb Integration (Face Clustering)
+- `TMDB_API_KEY` - TMDb API key for movie metadata lookup (required for `MOMENTRY_TMDB_PROBE_ENABLED=true`)
+- `MOMENTRY_TMDB_PROBE_ENABLED` - Enable TMDb probe during registration (default: `false`)
+  - Register phase: searches TMDb by filename, creates identities with tmdb_id/tmdb_profile
+  - Post-process phase: matches detected faces against TMDb identities via cosine similarity
+
+### Synonym Expansion
+- `MOMENTRY_SYNONYM_FILES` - Comma-separated paths to synonym JSON files (e.g., `data/english_synonyms.json,data/llm_synonyms.json`)
+- `MOMENTRY_SYNONYM_FILE` - Single synonym JSON file path (deprecated, use above)
+
+### Logging
+- `RUST_LOG` or `MOMENTRY_LOG_LEVEL` - Log level (default: `info`)
+
+## Notes
+
+- Unit tests exist (86 library tests)
+- Video processing uses external tools (ffprobe, Python scripts)
+- Multi-database architecture (PostgreSQL, MongoDB, Redis, Qdrant)
+- Monitor directory is a separate system (not Rust)
+- PythonExecutor provides unified script execution with timeout support
+- `redis` crate 1.0.x for improved performance
+- FaceNet CoreML model (`models/facenet512.mlpackage`) replaces InsightFace for embedding extraction (MIT license, ANE-accelerated)
+
+### LLM Synonym Generation
+
+Generate synonym database using llama.cpp (Gemma4):
+
+```bash
+# Generate full database (162 entries, ~5 minutes)
+python3 scripts/generate_synonyms_llamacpp.py
+
+# Quick test
+python3 scripts/generate_synonyms_llamacpp.py --test
+
+# Resume from existing file
+python3 scripts/generate_synonyms_llamacpp.py --resume
+
+# Output: data/llm_synonyms.json (27 Chinese + 135 English words)
+```
+
+## Task Management
+
+### 使用 todowrite 追蹤任務
+```bash
+# 創建任務清單
+/todo 建立配置模組 [in_progress]
+/todo 添加單元測試 [pending]
+
+# 更新狀態
+/todo 完成標記 [completed]
+```
+
+### 任務批次建議
+- 一次處理 1-2 個功能
+- 每個功能完成後驗證 (clippy + test)
+- 驗證通過後再繼續下一個
+
+## Code Review Checklist
+
+完成任務後檢查：
+- [ ] `cargo clippy --lib` 通過
+- [ ] `cargo test --lib` 通過
+- [ ] `cargo fmt -- --check` 通過
+- [ ] 文檔已更新 (如需要)
+- [ ] 新功能有單元測試
+
+## Commit Guidelines
+
+```bash
+# feat: 新功能
+git commit -m "feat: add monitor_jobs table"
+
+# fix: 錯誤修復
+git commit -m "fix: resolve SQL injection in store_vector"
+
+# refactor: 重構
+git commit -m "refactor: use parameterized queries"
+
+# docs: 文檔更新
+git commit -m "docs: update AGENTS.md with new modules"
+```
+
+## Pre-commit Hook
+
+專案已配置 `.git/hooks/pre-commit`，提交前自動檢查：
+
+```bash
+# 檢查內容
+1. cargo fmt --check    # Rust 格式化檢查
+2. cargo clippy --lib   # Rust Lint 檢查
+3. cargo test --lib     # Rust 單元測試
+4. ruff check           # Python Lint 檢查
+5. ruff format --check  # Python 格式化檢查
+6. markdownlint         # Markdown 格式檢查
+7. shellcheck           # Shell 腳本檢查
+
+# 跳過檢查（不建議）
+git commit --no-verify
+
+# 跳過特定檢查
+git commit --skip-checks
+```
+
+**注意**: Hook 僅檢查已暫存的 Rust/Python/Markdown/Shell 文件。
+
+### Python 環境設置
+```bash
+# 安裝 ruff
+pip install ruff==0.11.2
+
+# 格式化 Python 文件
+ruff format scripts/
+
+# Lint Python 文件
+ruff check scripts/
+```
+
+### Markdown 環境設置
+```bash
+# 安裝 markdownlint-cli (使用系統 Node.js)
+npm install -g markdownlint-cli
+
+# 檢查 Markdown 文件
+markdownlint docs/
+
+# 配置檔案
+.markdownlint.json
+```
+
+### Shell 環境設置
+```bash
+# 安裝 shellcheck
+brew install shellcheck
+
+# 檢查 Shell 腳本
+shellcheck scripts/*.sh monitor/**/*.sh
+```
+
+**注意**: Hook 只檢查 error 等級的 shellcheck 問題，style 警告會顯示但不阻擋提交。
+
+## Release Workflow
+
+### Release 前準備
+每次 release production binary 前，必須：
+
+1. **建立 Release Tag**
+   ```bash
+   git tag -a v0.X.X -m "Release v0.X.X - YYYY-MM-DD"
+   git push origin v0.X.X
+   ```
+
+2. **備份獨立 Source Code**
+   ```bash
+   # 建立 release 獨立目錄
+   RELEASE_DIR="/Users/accusys/momentry_core_releases/v0.X.X"
+   mkdir -p "$RELEASE_DIR"
+   
+   # 複製完整原始碼（排除不必要的檔案）
+   rsync -av --exclude='.git' --exclude='target' --exclude='node_modules' \
+         /Users/accusys/momentry_core_0.1/ "$RELEASE_DIR/"
+   
+   # 記錄 release 資訊
+   echo "Release: v0.X.X" > "$RELEASE_DIR/RELEASE_INFO.txt"
+   echo "Date: $(date)" >> "$RELEASE_DIR/RELEASE_INFO.txt"
+   echo "Git Commit: $(git rev-parse HEAD)" >> "$RELEASE_DIR/RELEASE_INFO.txt"
+   echo "Binary: $(ls -la target/release/momentry)" >> "$RELEASE_DIR/RELEASE_INFO.txt"
+   ```
+
+3. **備份 Binary**
+   ```bash
+   cp target/release/momentry "$RELEASE_DIR/momentry_v0.X.X"
+   cp target/release/momentry_playground "$RELEASE_DIR/momentry_playground_v0.X.X" 2>/dev/null
+   ```
+
+4. **記錄資料庫 Schema**
+   ```bash
+   pg_dump -U accusys -d momentry --schema-only > "$RELEASE_DIR/schema_v0.X.X.sql"
+   ```
+
+### 重要性
+- 避免 release binary 與 current source code 不一致
+- 方便追蹤特定 release 的程式碼狀態
+- 必要時可快速復原或比對差異
+- 確保資料庫 schema 與程式碼版本對應
+
+## Reference Documents
+
+| 文件 | 用途 |
+|------|------|
+| `docs/OPENCODE_GUIDE.md` | OpenCode 使用規範 |
+| `docs/ARCHITECTURE_EVALUATION.md` | 架構優化待評估項目 (含 GraphRAG) |
+| `docs/PENDING_ISSUES.md` | 待解決問題追蹤 |
+| `docs/MOMENTRY_CORE_MONITORING.md` | 監控系統規範 |
+| `docs/MOMENTRY_CORE_REDIS_KEYS.md` | Redis Key 設計規範 |
+| `docs/PYTHON.md` | Python 腳本規範 |
+| `docs/FILE_CHANGE_MANAGEMENT.md` | 文件修改管理規範 |
+| `docs/YOLO_RESUME_INTEGRATION.md` | YOLO Resume 功能整合記錄 |
+| `docs/DOCUMENT_EMBEDDING_STRATEGY.md` | Parent-Child 嵌入策略 |
+| `docs/PROCESSING_PIPELINE.md` | 處理流程文檔 |
+| `docs/N8N_DEMO_WORKFLOW.md` | n8n 工作流文檔 |
+| `docs/FRESH_MAC_INSTALLATION.md` | 全新 Mac 安裝指南 |
+| `docs/SERVICES.md` | 服務總覽與管理 |
+| `docs/SFTPGO_DEMO_USER.md` | SFTPGo 用戶指南 |
+
+## Document Change Workflow
+
+修改文件前請參考 `docs/FILE_CHANGE_MANAGEMENT.md`，確保：
+
+1. **修改前**：完整閱讀文件、執行預檢清單
+2. **修改中**：提供變更計畫、取得確認
+3. **修改後**：展示 diff、更新版本歷史
+4. **驗證**：執行 lint/test、提交前審查
+
+### AI 工具修改規範
+
+AI 工具修改文件時：
+- 必須先完整閱讀文件（不可只讀取部分章節）
+- 修改前先提出變更計畫供確認
+- 修改後展示 diff 內容
+- 更新版本歷史表
+
+## PHP Development
+
+WordPress 作為 Momentry Portal，負責 n8n 自動化與 sftpgo 檔案服務的頁面整合。
+
+### 編輯器設定
+
+| 編輯器 | LSP 方案 | 安裝方式 |
+|--------|----------|----------|
+| VS Code | Intelephense | Extension Marketplace (推薦) |
+| Cursor | Intelephense | Extension Marketplace (推薦) |
+| CLI | phpactor | `~/bin/phpactor` |
+
+### Intelephense (VS Code/Cursor)
+
+1. 安裝 Extension: 搜尋 "Intelephense"
+2. 設定:
+```json
+{
+  "intelephense.stubs": ["wordpress"]
+}
+```
+
+### phpactor (CLI)
+
+```bash
+# 安裝方式
+brew install composer
+curl -sSL https://github.com/phpactor/phpactor/releases/latest/download/phpactor.phar -o ~/bin/phpactor
+chmod +x ~/bin/phpactor
+
+# 安裝 WordPress Stubs
+cd /Users/accusys/wordpress/web
+composer require --dev php-stubs/wordpress-stubs
+
+# 建立 WordPress 索引
+cd /Users/accusys/wordpress/web
+~/bin/phpactor index:build --reset
+
+# 常用指令
+~/bin/phpactor class:search "WP_User"      # 搜尋類別
+~/bin/phpactor index:query WP_User          # 查看類別資訊
+~/bin/phpactor navigate /path/to/file.php  # 導航到定義
+```
+
+### WordPress 程式碼位置
+| 類型 | 路徑 |
+|------|------|
+| 主題 | `/Users/accusys/wordpress/web/wp-content/themes/` |
+| 插件 | `/Users/accusys/wordpress/web/wp-content/plugins/` |
+
+### 與 marcom 團隊協作
+| 角色 | 負責 |
+|------|------|
+| marcom 團隊 | Figma 設計 / Elementor 建構 |
+| OpenCode | 程式碼實作 / 重構 |
+
+### 開發時程
+```
+Phase 1: marcom 建構 (現在)    → Elementor 頁面建構
+Phase 2: 交付審視 (TBD)      → 功能確認 / 重構評估
+Phase 3: OpenCode 重構        → 純程式碼實作，交付無 Elementor 依賴版本
+```
+
+## M4 通知規範
+
+### 固定通知方式
+
+通知 M4 的唯一管道：**`M4_workspace/` 下建立回覆文件 + `git commit`**。不需口頭、即時訊息、郵件。
+
+### 命名規則
+
+```
+docs_v1.0/M4_workspace/YYYY-MM-DD_<topic>_response.md   (回覆 M4 問題)
+docs_v1.0/M4_workspace/YYYY-MM-DD_<topic>.md             (主動通報)
+docs_v1.0/M4_workspace/YYYY-MM-DD_<topic>_test_report.md (測試報告)
+```
+
+### 觸發時機
+
+| 情境 | 動作 |
+|------|------|
+| M4 提交問題報告到 `M4_workspace/` | 修復後，回覆 `*_response.md` |
+| 完成 M4 要求的任務 | 回覆 `*_response.md` |
+| 重大變更（模型替換、架構變更） | 主動通知 `*.md` |
+| 新測試包產出 | `*_test_report.md` |
+
+### 交付檢查
+
+1. 文件寫入 `docs_v1.0/M4_workspace/`
+2. `git add` 包含該文件
+3. `git commit` 含相關變更
+4. M4 透過 git log 查看
+
+詳細規範見 `docs_v1.0/M4_workspace/M4_NOTIFICATION_PROTOCOL.md`。
+
+## UUID Naming Rule
+
+**Never use bare `uuid` in API route paths, query params, JSON keys, or code variable names. Always qualify:**
+
+| Context | Must use | Never |
+|---------|----------|-------|
+| Video/file resource | `file_uuid` | `uuid` |
+| Identity resource | `identity_uuid` | `uuid` |
+| Query parameter | `file_uuid=`, `identity_uuid=` | `uuid=` |
+| Route path | `:file_uuid`, `:identity_uuid` | `:uuid` |
+| JSON key | `"file_uuid"`, `"identity_uuid"` | `"uuid"` |
+
+This applies to docs, code, API responses, and curl examples. Exceptions: internal database primary key names (e.g. `identities.uuid` column).
+
+## Document Compliance Checklist
+
+Before creating any file in `docs_v1.0/` (API_WORKSPACE, GUIDES, REFERENCE, DESIGN, OPERATIONS, INTEGRATIONS), verify all items below.
+**IMPORTANT**: API functional documents are generated from `API_WORKSPACE/modules/`. Edit modules there, then run `make deploy` in `API_WORKSPACE/` to update `GUIDES/`. Never edit generated files in `GUIDES/` directly. See `DESIGN/Modular_Doc_System_V1.0.md` for the full system design.
+
+### P0 — Mandatory (7 items)
+
+| # | Check | Rule |
+|---|-------|------|
+| 1 | YAML frontmatter | `title`, `version`, `date`, `author`, `status` present |
+| 2 | Version history | Table at bottom of file tracking changes |
+| 3 | Top info table | scope, status, applicable to, etc. |
+| 4 | PascalCase filename | e.g. `DetectorRegistry.md`, not `detector_registry.md` |
+| 5 | `_` separator | Within filenames use `_`, never spaces or other chars |
+| 6 | English content | Entire file in English |
+| 7 | Correct directory | File must reside in appropriate directory: `API_WORKSPACE/modules/` (API endpoint modules), `GUIDES/` (user docs, generated), `REFERENCE/` (data models), `DESIGN/` (architecture), `OPERATIONS/` (infra/release), `INTEGRATIONS/` (n8n/tests) |
+
+### P0b — UUID Naming
+
+| # | Check | Rule |
+|---|-------|------|
+| 8 | `file_uuid` not bare `uuid` | All file references use `file_uuid` (see UUID Naming Rule above) |
+| 9 | `identity_uuid` not bare `uuid` | All identity references use `identity_uuid` |
+
+### P1 — Suggested (3 items)
+
+| # | Check | Note |
+|---|-------|------|
+| 1 | Cross-references | Link to related docs in API_WORKSPACE/, GUIDES/, REFERENCE/, DESIGN/, OPERATIONS/ |
+| 2 | Glossary terms | Define non-obvious terms inline or link glossary |
+| 3 | Diagrams | Include Mermaid/ASCII diagram for complex topics |
+
+### Exception
+
+`M4_workspace/` files are exempt from this checklist (free-format reply documents).
+
+---
+
+## Delivery Procedure
+
+完整交付程序（M4_workspace → M5 → Release → Deploy → Public）見：
+
+`docs_v1.0/OPERATIONS/DELIVERY_PROCEDURE.md`
diff --git a/deliverable_v1.1.0/SYSTEM_AUDIT_2026-05-17.md b/deliverable_v1.1.0/SYSTEM_AUDIT_2026-05-17.md
new file mode 100644
index 0000000..eca8e02
--- /dev/null
+++ b/deliverable_v1.1.0/SYSTEM_AUDIT_2026-05-17.md
@@ -0,0 +1,71 @@
+# System Audit — 2026-05-17
+
+## Current State
+
+### Embedding Storage (三重冗余，無主)
+
+| 資料類型 | PG pgvector | Qdrant | JSON 檔案 |
+|---------|------------|--------|-----------|
+| Sentence 向量 | `chunk.embedding` ✅ | `dev_v1` / `rule1_v2` / `sentence_*` ✅ | ❌ 無 |
+| Story 向量 | `chunk.embedding` ✅ | `dev_v1` / `dev_stories` ✅ | `.story_llm.json` ✅ |
+| Face 向量 | ❌ 已清除（依使用者指示） | `dev_faces` ✅ (97K) | `.face.json` ✅ |
+| Voice 向量 | ❌ 無 | `dev_voice` ✅ (4K) | ❌ 無 |
+
+### Pipeline 問題
+
+| 問題 | 影響 |
+|------|------|
+| `processor_results.duration_secs` 全為 0 | 無法查各步驟耗時 |
+| `processor_results.started_at/completed_at` 全 NULL | 時間線遺失 |
+| Redis timing 在 job 完成後被清掉 | 唯一 timing 來源消失 |
+| `get_chunk_by_chunk_id_and_uuid` 原本是 stub（已修） | Smart search 找不到 PG chunk |
+| `server.rs::search()` 未 mount 但仍編譯 | Dead code，混淆 Qdrant 用途 |
+| Face embedding 只寫 Qdrant 不寫 PG | 已刪除則全失 |
+
+### Qdrant Collections 現況
+
+| Collection | Points | 來源 | UUID |
+|-----------|--------|------|------|
+| `dev_v1` | 9,936 | PG rebuild | ✅ bd80fec... |
+| `dev_faces` | 97,000 | face.json rebuild | ✅ bd80fec... |
+| `dev_stories` | 560 | Snapshot | ✅ bd80fec... |
+| `dev_voice` | 4,188 | Snapshot | ✅ bd80fec... |
+| `dev_rule1_v2` | 3,417 | Snapshot | ✅ bd80fec... |
+| `sentence_story` | 4,188 | Snapshot | ✅ bd80fec... |
+| `sentence_summary` | 4,188 | Snapshot | ✅ bd80fec... |
+
+## Safeguards & Fixes
+
+### P0 — 必須修
+
+| # | Fix | 做法 |
+|---|-----|------|
+| 1 | **Pipeline timing 寫入 DB** | `update_processor_result()` 加入 `started_at`、`completed_at`、`duration_secs` |
+| 2 | **Qdrant 不當主要儲存** | Embedding 以 PG `chunk.embedding` 為 source of truth，Qdrant 唯讀 cache |
+| 3 | **Smart search 只走 PG pgvector** | `search_parent_chunks_semantic` 已正確，無需 Qdrant |
+| 4 | **移除 `server.rs::search()` dead code** | 或 mount 到正式 route 並確認可用 |
+
+### P1 — 建議修
+
+| # | Fix | 做法 |
+|---|-----|------|
+| 5 | **刪除 Qdrant 前先 snapshot** | 自動 snapshot script |
+| 6 | **清理多餘 Qdrant collections** | `dev_voice` / `dev_stories` / `dev_rule1_v2` / `sentence_*` 無 server reader，可移除 |
+| 7 | **Face embedding 寫入 PG 或移除 dead code** | 目前 face Qdrant write 無人讀取，可移除 `sync_face_embeddings` |
+| 8 | **UUID 一致性檢查** | 同一 content 不應產生不同 UUID |
+
+### P2 — 可選
+
+| # | Fix | 做法 |
+|---|-----|------|
+| 9 | `chunk_selector.rs` （player binary）hardcode `momentry_rule1` | 改讀 env var 或 PG |
+| 10 | AGENTS.md 已加入 delete 安全規則 | ✅ Done |
+
+## Data Recovery Path
+
+| 資料來源 | 可恢復到 | 方法 |
+|---------|---------|------|
+| `chunk.embedding` (PG) | Qdrant `dev_v1` | SQL → Qdrant upsert |
+| `face.json` (磁碟) | Qdrant `dev_faces` | Python script |
+| `story_llm.json` (磁碟) | Qdrant `dev_stories` | Python script |
+| Qdrant snapshots (phase1) | Qdrant collections | Snapshot upload API |
diff --git a/deliverable_v1.1.0/html_docs/doc/01_auth.html b/deliverable_v1.1.0/html_docs/doc/01_auth.html
new file mode 100644
index 0000000..11a47c9
--- /dev/null
+++ b/deliverable_v1.1.0/html_docs/doc/01_auth.html
@@ -0,0 +1,388 @@
+<!DOCTYPE html>
+<html lang="en">
+<head>
+<meta charset="UTF-8">
+<title>01 Auth - Momentry API Docs</title>
+<style>
+* { margin: 0; padding: 0; box-sizing: border-box; }
+body { font-family: -apple-system, BlinkMacSystemFont, 'Segoe UI', Roboto, sans-serif; background: #f5f5f5; color: #333; padding: 40px; }
+.container { max-width: 960px; margin: 0 auto; background: white; border-radius: 12px; box-shadow: 0 2px 12px rgba(0,0,0,0.08); padding: 40px; }
+h1 { font-size: 24px; margin: 24px 0 12px; }
+h2 { font-size: 20px; margin: 20px 0 10px; color: #222; }
+h3 { font-size: 16px; margin: 16px 0 8px; color: #444; }
+p { line-height: 1.6; margin: 8px 0; }
+table { border-collapse: collapse; width: 100%; margin: 12px 0; font-size: 14px; }
+th, td { border: 1px solid #ddd; padding: 8px 12px; text-align: left; }
+th { background: #f0f0f0; font-weight: 600; }
+code { background: #f0f0f0; padding: 2px 6px; border-radius: 3px; font-size: 13px; }
+pre { background: #f8f8f8; border: 1px solid #ddd; border-radius: 6px; padding: 12px; overflow-x: auto; margin: 12px 0; }
+pre code { background: none; padding: 0; }
+a { color: #0066cc; }
+.back { display: inline-block; margin-bottom: 20px; color: #666; }
+.back:hover { color: #333; }
+</style>
+</head>
+<body>
+<div class="container">
+<a class="back" href="index.html">&larr; Back to index</a>
+<!-- module: auth -->
+<!-- description: Authentication — login, logout, JWT, session cookie, API key -->
+<!-- depends: -->
+
+<h2>Base URL</h2>
+<table class="table">
+<thead>
+<tr>
+<th>Environment</th>
+<th>URL</th>
+<th>Purpose</th>
+</tr>
+</thead>
+<tbody>
+<tr>
+<td>Production</td>
+<td><code>http://localhost:3002</code></td>
+<td>Production deployment</td>
+</tr>
+<tr>
+<td>External (M5)</td>
+<td><code>https://m5api.momentry.ddns.net</code></td>
+<td>Remote access</td>
+</tr>
+</tbody>
+</table>
+<h2>Variables</h2>
+<p>All examples in this documentation use these environment variables:</p>
+<div class="codehilite"><pre><span></span><code><span class="nv">API</span><span class="o">=</span><span class="s2">&quot;http://localhost:3002&quot;</span>
+<span class="nv">KEY</span><span class="o">=</span><span class="s2">&quot;your-api-key-here&quot;</span>
+</code></pre></div>
+
+<h2>Authentication</h2>
+<p>All endpoints under <code>/api/v1/*</code> require authentication unless listed below.
+The following endpoints are public (no auth needed):</p>
+<ul>
+<li><code>GET /health</code></li>
+<li><code>POST /api/v1/auth/login</code></li>
+<li><code>POST /api/v1/auth/logout</code></li>
+</ul>
+<h3>Three Authentication Modes</h3>
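+<p>The system supports three authentication methods, checked in <strong>priority order</strong> by the middleware (the API key can be sent either as a header or as a query parameter, so the list below has four entries):</p>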
+<div class="codehilite"><pre><span></span><code>Middleware priority:
+  1. Session Cookie (Portal/browser)
+  2. JWT Bearer (API clients, CLI)
+  3. API Key Header (legacy compatibility)
+  4. API Key Query Param (?api_key=)
+</code></pre></div>
+
+<table class="table">
+<thead>
+<tr>
+<th>Mode</th>
+<th>Transport</th>
+<th>Expiry</th>
+<th>Scope</th>
+<th>Best for</th>
+</tr>
+</thead>
+<tbody>
+<tr>
+<td><strong>Session Cookie</strong></td>
+<td><code>Cookie: session_id=&lt;session_id&gt;</code></td>
+<td>24h</td>
+<td>per-browser session</td>
+<td>Portal (browser)</td>
+</tr>
+<tr>
+<td><strong>JWT</strong></td>
+<td><code>Authorization: Bearer &lt;token&gt;</code></td>
+<td>1h</td>
+<td>per-login token</td>
+<td>API clients, CLI, scripts</td>
+</tr>
+<tr>
+<td><strong>API Key</strong></td>
+<td><code>X-API-Key: &lt;key&gt;</code></td>
+<td>90d</td>
+<td>fixed key for automation</td>
+<td>Legacy scripts, WordPress</td>
+</tr>
+</tbody>
+</table>
+<hr />
+<h3>Login</h3>
+<p><strong>Default accounts &amp; API keys:</strong></p>
+<table class="table">
+<thead>
+<tr>
+<th>Username</th>
+<th>Password</th>
+<th>API Key</th>
+<th>Role</th>
+</tr>
+</thead>
+<tbody>
+<tr>
+<td><code>admin</code></td>
+<td><code>admin</code></td>
+<td>—</td>
+<td>admin</td>
+</tr>
+<tr>
+<td><code>demo</code></td>
+<td><code>demo</code></td>
+<td><code>muser_demo_key_32chars_abcdef1234567890</code></td>
+<td>user</td>
+</tr>
+</tbody>
+</table>
+<p>The demo API key is set via <code>MOMENTRY_DEMO_API_KEY</code> env var and can be used in place of JWT for marcom integrations:</p>
+<div class="codehilite"><pre><span></span><code><span class="c1"># Using API key instead of JWT</span>
+curl<span class="w"> </span>-s<span class="w"> </span><span class="s2">&quot;</span><span class="nv">$API</span><span class="s2">/api/v1/files/scan&quot;</span><span class="w"> </span>-H<span class="w"> </span><span class="s2">&quot;X-API-Key: muser_demo_key_32chars_abcdef1234567890&quot;</span>
+</code></pre></div>
+
+<div class="codehilite"><pre><span></span><code><span class="c1"># Login as admin</span>
+curl<span class="w"> </span>-s<span class="w"> </span>-X<span class="w"> </span>POST<span class="w"> </span><span class="s2">&quot;</span><span class="nv">$API</span><span class="s2">/api/v1/auth/login&quot;</span><span class="w"> </span><span class="se">\</span>
+<span class="w">  </span>-H<span class="w"> </span><span class="s2">&quot;Content-Type: application/json&quot;</span><span class="w"> </span><span class="se">\</span>
+<span class="w">  </span>-d<span class="w"> </span><span class="s1">&#39;{&quot;username&quot;: &quot;admin&quot;, &quot;password&quot;: &quot;admin&quot;}&#39;</span>
+
+<span class="c1"># Login as demo user</span>
+curl<span class="w"> </span>-s<span class="w"> </span>-X<span class="w"> </span>POST<span class="w"> </span><span class="s2">&quot;</span><span class="nv">$API</span><span class="s2">/api/v1/auth/login&quot;</span><span class="w"> </span><span class="se">\</span>
+<span class="w">  </span>-H<span class="w"> </span><span class="s2">&quot;Content-Type: application/json&quot;</span><span class="w"> </span><span class="se">\</span>
+<span class="w">  </span>-d<span class="w"> </span><span class="s1">&#39;{&quot;username&quot;: &quot;demo&quot;, &quot;password&quot;: &quot;demo&quot;}&#39;</span>
+</code></pre></div>
+
+<h4>Success Response</h4>
+<div class="codehilite"><pre><span></span><code><span class="p">{</span>
+<span class="w">  </span><span class="nt">&quot;success&quot;</span><span class="p">:</span><span class="w"> </span><span class="kc">true</span><span class="p">,</span>
+<span class="w">  </span><span class="nt">&quot;jwt&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;eyJhbGciOiJIUzI1NiIs...&quot;</span><span class="p">,</span>
+<span class="w">  </span><span class="nt">&quot;api_key&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;muser_...&quot;</span><span class="p">,</span>
+<span class="w">  </span><span class="nt">&quot;user&quot;</span><span class="p">:</span><span class="w"> </span><span class="p">{</span>
+<span class="w">    </span><span class="nt">&quot;username&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;admin&quot;</span><span class="p">,</span>
+<span class="w">    </span><span class="nt">&quot;role&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;admin&quot;</span>
+<span class="w">  </span><span class="p">},</span>
+<span class="w">  </span><span class="nt">&quot;expires_at&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;2026-05-18T13:00:00Z&quot;</span>
+<span class="p">}</span>
+</code></pre></div>
+
+<table class="table">
+<thead>
+<tr>
+<th>Field</th>
+<th>Type</th>
+<th>Description</th>
+</tr>
+</thead>
+<tbody>
+<tr>
+<td><code>jwt</code></td>
+<td>string</td>
+<td>JWT access token. Use as <code>Authorization: Bearer &lt;jwt&gt;</code>. Expires in 1 hour.</td>
+</tr>
+<tr>
+<td><code>api_key</code></td>
+<td>string</td>
+<td>Legacy API key. Use as <code>X-API-Key: &lt;key&gt;</code>. Good for 90 days.</td>
+</tr>
+<tr>
+<td><code>user.username</code></td>
+<td>string</td>
+<td>Username</td>
+</tr>
+<tr>
+<td><code>user.role</code></td>
+<td>string</td>
+<td>Role: <code>admin</code>, <code>user</code>, or <code>readonly</code></td>
+</tr>
+<tr>
+<td><code>expires_at</code></td>
+<td>string</td>
+<td>ISO8601 timestamp of JWT expiration</td>
+</tr>
+</tbody>
+</table>
+<p>The login endpoint also sets a <code>Set-Cookie</code> header for browser-based clients:</p>
+<div class="codehilite"><pre><span></span><code><span class="nt">Set-Cookie</span><span class="o">:</span><span class="w"> </span><span class="nt">session_id</span><span class="o">=&lt;</span><span class="nt">session_id</span><span class="o">&gt;;</span><span class="w"> </span><span class="nt">Path</span><span class="o">=/;</span><span class="w"> </span><span class="nt">HttpOnly</span><span class="o">;</span><span class="w"> </span><span class="nt">SameSite</span><span class="o">=</span><span class="nt">Strict</span><span class="o">;</span><span class="w"> </span><span class="nt">Max-Age</span><span class="o">=</span><span class="nt">86400</span>
+</code></pre></div>
+
+<h4>Error Response (401)</h4>
+<div class="codehilite"><pre><span></span><code><span class="p">{</span>
+<span class="w">  </span><span class="nt">&quot;success&quot;</span><span class="p">:</span><span class="w"> </span><span class="kc">false</span><span class="p">,</span>
+<span class="w">  </span><span class="nt">&quot;message&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;Invalid username or password&quot;</span>
+<span class="p">}</span>
+</code></pre></div>
+
+<hr />
+<h3>Using JWT</h3>
+<p>JWT is preferred for API clients (CLI scripts, WordPress). It is validated by the middleware without a database lookup (stateless).</p>
+<div class="codehilite"><pre><span></span><code><span class="c1"># Login and capture JWT</span>
+<span class="nv">JWT</span><span class="o">=</span><span class="k">$(</span>curl<span class="w"> </span>-s<span class="w"> </span>-X<span class="w"> </span>POST<span class="w"> </span><span class="s2">&quot;</span><span class="nv">$API</span><span class="s2">/api/v1/auth/login&quot;</span><span class="w"> </span><span class="se">\</span>
+<span class="w">  </span>-H<span class="w"> </span><span class="s2">&quot;Content-Type: application/json&quot;</span><span class="w"> </span><span class="se">\</span>
+<span class="w">  </span>-d<span class="w"> </span><span class="s1">&#39;{&quot;username&quot;:&quot;admin&quot;,&quot;password&quot;:&quot;admin&quot;}&#39;</span><span class="w"> </span><span class="p">|</span><span class="w"> </span>python3<span class="w"> </span>-c<span class="w"> </span><span class="s2">&quot;import json,sys;print(json.load(sys.stdin)[&#39;jwt&#39;])&quot;</span><span class="k">)</span>
+
+<span class="c1"># Use JWT for all subsequent requests</span>
+curl<span class="w"> </span>-H<span class="w"> </span><span class="s2">&quot;Authorization: Bearer </span><span class="nv">$JWT</span><span class="s2">&quot;</span><span class="w"> </span><span class="s2">&quot;</span><span class="nv">$API</span><span class="s2">/api/v1/files/scan&quot;</span>
+curl<span class="w"> </span>-H<span class="w"> </span><span class="s2">&quot;Authorization: Bearer </span><span class="nv">$JWT</span><span class="s2">&quot;</span><span class="w"> </span><span class="s2">&quot;</span><span class="nv">$API</span><span class="s2">/api/v1/resource/tmdb&quot;</span>
+</code></pre></div>
+
+<p>JWT is short-lived (1 hour). When it expires, request a new one via login.</p>
+<hr />
+<h3>Using Session Cookie (Browser)</h3>
+<p>Browser-based clients (Portal) get a session cookie automatically after login. The browser sends the cookie with every request—no manual header needed.</p>
+<div class="codehilite"><pre><span></span><code><span class="c1"># Login captures the session cookie from Set-Cookie header</span>
+curl<span class="w"> </span>-v<span class="w"> </span>-X<span class="w"> </span>POST<span class="w"> </span><span class="s2">&quot;</span><span class="nv">$API</span><span class="s2">/api/v1/auth/login&quot;</span><span class="w"> </span><span class="se">\</span>
+<span class="w">  </span>-H<span class="w"> </span><span class="s2">&quot;Content-Type: application/json&quot;</span><span class="w"> </span><span class="se">\</span>
+<span class="w">  </span>-d<span class="w"> </span><span class="s1">&#39;{&quot;username&quot;:&quot;admin&quot;,&quot;password&quot;:&quot;admin&quot;}&#39;</span><span class="w"> </span><span class="m">2</span>&gt;<span class="p">&amp;</span><span class="m">1</span><span class="w"> </span><span class="p">|</span><span class="w"> </span>grep<span class="w"> </span><span class="s2">&quot;Set-Cookie&quot;</span>
+
+<span class="c1"># Browser automatically sends: Cookie: session_id=&lt;session_id&gt;</span>
+<span class="c1"># No manual header needed for subsequent requests</span>
+</code></pre></div>
+
+<p>The session cookie is HttpOnly (not accessible from JavaScript) and SameSite=Strict (protected against CSRF).</p>
+<hr />
+<h3>Using Legacy API Key</h3>
+<div class="codehilite"><pre><span></span><code>curl<span class="w"> </span>-H<span class="w"> </span><span class="s2">&quot;X-API-Key: </span><span class="nv">$KEY</span><span class="s2">&quot;</span><span class="w"> </span><span class="s2">&quot;</span><span class="nv">$API</span><span class="s2">/api/v1/files/scan&quot;</span>
+
+<span class="c1"># Also accepted via Bearer header (non-JWT format) or query parameter:</span>
+curl<span class="w"> </span>-H<span class="w"> </span><span class="s2">&quot;Authorization: Bearer </span><span class="nv">$KEY</span><span class="s2">&quot;</span><span class="w"> </span><span class="s2">&quot;</span><span class="nv">$API</span><span class="s2">/api/v1/files/scan&quot;</span>
+curl<span class="w"> </span><span class="s2">&quot;</span><span class="nv">$API</span><span class="s2">/api/v1/files/scan?api_key=</span><span class="nv">$KEY</span><span class="s2">&quot;</span>
+</code></pre></div>
+
+<p>API keys are validated via SHA256 hash lookup in the database. They are long-lived (90 days) and intended for automation.</p>
+<h3>Obtaining an API Key (CLI)</h3>
+<div class="codehilite"><pre><span></span><code>momentry<span class="w"> </span>api-key<span class="w"> </span>create<span class="w"> </span><span class="s2">&quot;My API Key&quot;</span><span class="w"> </span>--key-type<span class="w"> </span>user
+</code></pre></div>
+
+<hr />
+<h3>Logout</h3>
+<div class="codehilite"><pre><span></span><code><span class="c1"># Logout using the session cookie (browser)</span>
+curl<span class="w"> </span>-X<span class="w"> </span>POST<span class="w"> </span><span class="s2">&quot;</span><span class="nv">$API</span><span class="s2">/api/v1/auth/logout&quot;</span><span class="w"> </span><span class="se">\</span>
+<span class="w">  </span>-H<span class="w"> </span><span class="s2">&quot;Cookie: session_id=&lt;session_id&gt;&quot;</span>
+</code></pre></div>
+
+<h4>What logout does</h4>
+<table class="table">
+<thead>
+<tr>
+<th>Auth mode</th>
+<th>Effect</th>
+</tr>
+</thead>
+<tbody>
+<tr>
+<td><strong>Session Cookie</strong></td>
+<td>Session deleted from database. Same cookie returns 401 on subsequent requests.</td>
+</tr>
+<tr>
+<td><strong>JWT</strong></td>
+<td>JWT remains valid until expiry. (JWT is stateless — logout adds JWT to a blacklist only if API key mode is used.)</td>
+</tr>
+<tr>
+<td><strong>API Key</strong></td>
+<td>API key remains valid. (Legacy keys are shared across sessions — revoking would break other clients.)</td>
+</tr>
+</tbody>
+</table>
+<h4>Example: full session lifecycle</h4>
+<div class="codehilite"><pre><span></span><code><span class="c1"># 1. Login</span>
+<span class="nv">SESSION_ID</span><span class="o">=</span><span class="k">$(</span>curl<span class="w"> </span>-s<span class="w"> </span>-D<span class="w"> </span>-<span class="w"> </span>-X<span class="w"> </span>POST<span class="w"> </span><span class="s2">&quot;</span><span class="nv">$API</span><span class="s2">/api/v1/auth/login&quot;</span><span class="w"> </span><span class="se">\</span>
+<span class="w">  </span>-H<span class="w"> </span><span class="s2">&quot;Content-Type: application/json&quot;</span><span class="w"> </span><span class="se">\</span>
+<span class="w">  </span>-d<span class="w"> </span><span class="s1">&#39;{&quot;username&quot;:&quot;admin&quot;,&quot;password&quot;:&quot;admin&quot;}&#39;</span><span class="w"> </span><span class="p">|</span><span class="w"> </span>grep<span class="w"> </span><span class="s2">&quot;Set-Cookie&quot;</span><span class="w"> </span><span class="p">|</span><span class="w"> </span>sed<span class="w"> </span><span class="s1">&#39;s/.*session_id=\([^;]*\).*/\1/&#39;</span><span class="k">)</span>
+
+<span class="c1"># 2. Use session (works)</span>
+curl<span class="w"> </span>-s<span class="w"> </span>-o<span class="w"> </span>/dev/null<span class="w"> </span>-w<span class="w"> </span><span class="s2">&quot;HTTP %{http_code}\n&quot;</span><span class="w"> </span><span class="s2">&quot;</span><span class="nv">$API</span><span class="s2">/api/v1/resource/tmdb&quot;</span><span class="w"> </span><span class="se">\</span>
+<span class="w">  </span>-H<span class="w"> </span><span class="s2">&quot;Cookie: session_id=</span><span class="nv">$SESSION_ID</span><span class="s2">&quot;</span>
+<span class="c1"># → HTTP 200</span>
+
+<span class="c1"># 3. Logout</span>
+curl<span class="w"> </span>-s<span class="w"> </span>-X<span class="w"> </span>POST<span class="w"> </span><span class="s2">&quot;</span><span class="nv">$API</span><span class="s2">/api/v1/auth/logout&quot;</span><span class="w"> </span><span class="se">\</span>
+<span class="w">  </span>-H<span class="w"> </span><span class="s2">&quot;Cookie: session_id=</span><span class="nv">$SESSION_ID</span><span class="s2">&quot;</span>
+<span class="c1"># → {&quot;success&quot;: true}</span>
+
+<span class="c1"># 4. Use session again (rejected)</span>
+curl<span class="w"> </span>-s<span class="w"> </span>-o<span class="w"> </span>/dev/null<span class="w"> </span>-w<span class="w"> </span><span class="s2">&quot;HTTP %{http_code}\n&quot;</span><span class="w"> </span><span class="s2">&quot;</span><span class="nv">$API</span><span class="s2">/api/v1/resource/tmdb&quot;</span><span class="w"> </span><span class="se">\</span>
+<span class="w">  </span>-H<span class="w"> </span><span class="s2">&quot;Cookie: session_id=</span><span class="nv">$SESSION_ID</span><span class="s2">&quot;</span>
+<span class="c1"># → HTTP 401</span>
+</code></pre></div>
+
+<hr />
+<h3>Authentication Flow Summary</h3>
+<div class="codehilite"><pre><span></span><code>Login Request
+     │
+     ▼
+┌──────────────────┐
+│  1. Check users  │ ← users table (argon2 password verify)
+│     table        │
+└──────┬───────────┘
+       │
+   ┌───┴───┐
+   │ match │
+   └───┬───┘
+       │
+       ▼
+┌──────────────────┐
+│  2. Create JWT   │ ← 1h expiry, signed with JWT_SECRET
+├──────────────────┤
+│  3. Create       │ ← 24h expiry, stored in sessions table
+│     session      │
+├──────────────────┤
+│  4. Set-Cookie   │ ← HttpOnly, SameSite=Strict, Path=/
+├──────────────────┤
+│  5. Return       │ ← JWT + api_key + user info to client
+└──────────────────┘
+</code></pre></div>
+
+<div class="codehilite"><pre><span></span><code>Protected Request
+     │
+     ▼
+┌──────────────────────┐
+│  Middleware checks:  │
+│                      │
+│  1. Cookie session?  │ → DB lookup session → get api_key → verify
+│                      │
+│  2. JWT Bearer?      │ → verify JWT signature → decode claims
+│                      │
+│  3. X-API-Key?       │ → SHA256 hash → DB lookup → verify
+│                      │
+│  4. ?api_key=?       │ → same as #3
+│                      │
+│  5. None → 401       │
+└──────────────────────┘
+</code></pre></div>
+
+<hr />
+<h3>Error Responses</h3>
+<table class="table">
+<thead>
+<tr>
+<th>HTTP</th>
+<th>When</th>
+</tr>
+</thead>
+<tbody>
+<tr>
+<td><code>401</code></td>
+<td>Missing or invalid authentication</td>
+</tr>
+<tr>
+<td><code>401</code></td>
+<td>Session expired or logged out</td>
+</tr>
+<tr>
+<td><code>401</code></td>
+<td>JWT expired</td>
+</tr>
+<tr>
+<td><code>401</code></td>
+<td>API key revoked or inactive</td>
+</tr>
+</tbody>
+</table>
+<hr />
+<h3>Related</h3>
+<ul>
+<li><code>POST /api/v1/resource/tmdb/check</code> — test authentication + TMDb API connectivity</li>
+<li><code>GET /health/detailed</code> — view auth status (integrations section)</li>
+</ul>
+</div>
+</body>
+</html>
\ No newline at end of file
diff --git a/deliverable_v1.1.0/html_docs/doc/02_health.html b/deliverable_v1.1.0/html_docs/doc/02_health.html
new file mode 100644
index 0000000..0ed4b92
--- /dev/null
+++ b/deliverable_v1.1.0/html_docs/doc/02_health.html
@@ -0,0 +1,277 @@
+<!DOCTYPE html>
+<html lang="en">
+<head>
+<meta charset="UTF-8">
+<title>02 Health - Momentry API Docs</title>
+<style>
+* { margin: 0; padding: 0; box-sizing: border-box; }
+body { font-family: -apple-system, BlinkMacSystemFont, 'Segoe UI', Roboto, sans-serif; background: #f5f5f5; color: #333; padding: 40px; }
+.container { max-width: 960px; margin: 0 auto; background: white; border-radius: 12px; box-shadow: 0 2px 12px rgba(0,0,0,0.08); padding: 40px; }
+h1 { font-size: 24px; margin: 24px 0 12px; }
+h2 { font-size: 20px; margin: 20px 0 10px; color: #222; }
+h3 { font-size: 16px; margin: 16px 0 8px; color: #444; }
+p { line-height: 1.6; margin: 8px 0; }
+table { border-collapse: collapse; width: 100%; margin: 12px 0; font-size: 14px; }
+th, td { border: 1px solid #ddd; padding: 8px 12px; text-align: left; }
+th { background: #f0f0f0; font-weight: 600; }
+code { background: #f0f0f0; padding: 2px 6px; border-radius: 3px; font-size: 13px; }
+pre { background: #f8f8f8; border: 1px solid #ddd; border-radius: 6px; padding: 12px; overflow-x: auto; margin: 12px 0; }
+pre code { background: none; padding: 0; }
+a { color: #0066cc; }
+.back { display: inline-block; margin-bottom: 20px; color: #666; }
+.back:hover { color: #333; }
+</style>
+</head>
+<body>
+<div class="container">
+<a class="back" href="index.html">&larr; Back to index</a>
+<!-- module: health -->
+<!-- description: Health check endpoints -->
+<!-- depends: 01_auth -->
+
+<h2>Health Check</h2>
+<h3><code>GET /health</code></h3>
+<p><strong>Auth</strong>: Public<br />
+<strong>Scope</strong>: system-level</p>
+<p>Returns basic server health status — used by load balancers and monitoring.</p>
+<h4>Example</h4>
+<div class="codehilite"><pre><span></span><code>curl<span class="w"> </span><span class="s2">&quot;</span><span class="nv">$API</span><span class="s2">/health&quot;</span><span class="w"> </span><span class="p">|</span><span class="w"> </span>jq<span class="w"> </span><span class="s1">&#39;{status, version}&#39;</span>
+</code></pre></div>
+
+<h4>Response (200)</h4>
+<div class="codehilite"><pre><span></span><code><span class="p">{</span>
+<span class="w">  </span><span class="nt">&quot;status&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;ok&quot;</span><span class="p">,</span>
+<span class="w">  </span><span class="nt">&quot;version&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;1.0.0&quot;</span><span class="p">,</span>
+<span class="w">  </span><span class="nt">&quot;build_git_hash&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;3a6c1865&quot;</span><span class="p">,</span>
+<span class="w">  </span><span class="nt">&quot;build_timestamp&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;2026-05-16T13:38:15Z&quot;</span><span class="p">,</span>
+<span class="w">  </span><span class="nt">&quot;uptime_ms&quot;</span><span class="p">:</span><span class="w"> </span><span class="mi">3015</span>
+<span class="p">}</span>
+</code></pre></div>
+
+<table class="table">
+<thead>
+<tr>
+<th>Field</th>
+<th>Type</th>
+<th>Description</th>
+</tr>
+</thead>
+<tbody>
+<tr>
+<td><code>status</code></td>
+<td>string</td>
+<td><code>ok</code> or <code>degraded</code></td>
+</tr>
+<tr>
+<td><code>version</code></td>
+<td>string</td>
+<td>Semver version</td>
+</tr>
+<tr>
+<td><code>build_git_hash</code></td>
+<td>string</td>
+<td>Git commit hash</td>
+</tr>
+<tr>
+<td><code>build_timestamp</code></td>
+<td>string</td>
+<td>Binary build time</td>
+</tr>
+<tr>
+<td><code>uptime_ms</code></td>
+<td>integer</td>
+<td>Milliseconds since server start</td>
+</tr>
+</tbody>
+</table>
+<hr />
+<h3><code>GET /health/detailed</code></h3>
+<p><strong>Auth</strong>: Required<br />
+<strong>Scope</strong>: system-level</p>
+<p>Returns full system health including each service status, resource utilization, pipeline readiness, schema migration status, identity file sync status, and external integrations.</p>
+<blockquote>
+<p>Requires authentication (JWT, session cookie, or API key). The basic <code>/health</code> endpoint remains public for load balancer checks.</p>
+</blockquote>
+<h4>Example</h4>
+<div class="codehilite"><pre><span></span><code>curl<span class="w"> </span><span class="s2">&quot;</span><span class="nv">$API</span><span class="s2">/health/detailed&quot;</span><span class="w"> </span>-H<span class="w"> </span><span class="s2">&quot;X-API-Key: </span><span class="nv">$KEY</span><span class="s2">&quot;</span><span class="w"> </span><span class="p">|</span><span class="w"> </span>jq<span class="w"> </span><span class="s1">&#39;{status, services, resources: {cpu: .resources.cpu_used_percent, memory: .resources.memory_used_percent}}&#39;</span>
+</code></pre></div>
+
+<h4>Response (200)</h4>
+<div class="codehilite"><pre><span></span><code><span class="p">{</span>
+<span class="w">  </span><span class="nt">&quot;status&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;ok&quot;</span><span class="p">,</span>
+<span class="w">  </span><span class="nt">&quot;version&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;1.0.0&quot;</span><span class="p">,</span>
+<span class="w">  </span><span class="nt">&quot;services&quot;</span><span class="p">:</span><span class="w"> </span><span class="p">{</span>
+<span class="w">    </span><span class="nt">&quot;postgres&quot;</span><span class="p">:</span><span class="w"> </span><span class="p">{</span><span class="nt">&quot;status&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;ok&quot;</span><span class="p">,</span><span class="w"> </span><span class="nt">&quot;latency_ms&quot;</span><span class="p">:</span><span class="w"> </span><span class="mi">3</span><span class="p">},</span>
+<span class="w">    </span><span class="nt">&quot;redis&quot;</span><span class="p">:</span><span class="w"> </span><span class="p">{</span><span class="nt">&quot;status&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;ok&quot;</span><span class="p">,</span><span class="w"> </span><span class="nt">&quot;latency_ms&quot;</span><span class="p">:</span><span class="w"> </span><span class="mi">1</span><span class="p">},</span>
+<span class="w">    </span><span class="nt">&quot;qdrant&quot;</span><span class="p">:</span><span class="w"> </span><span class="p">{</span><span class="nt">&quot;status&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;ok&quot;</span><span class="p">,</span><span class="w"> </span><span class="nt">&quot;latency_ms&quot;</span><span class="p">:</span><span class="w"> </span><span class="mi">5</span><span class="p">}</span>
+<span class="w">  </span><span class="p">},</span>
+<span class="w">  </span><span class="nt">&quot;resources&quot;</span><span class="p">:</span><span class="w"> </span><span class="p">{</span>
+<span class="w">    </span><span class="nt">&quot;cpu_used_percent&quot;</span><span class="p">:</span><span class="w"> </span><span class="mf">12.5</span><span class="p">,</span>
+<span class="w">    </span><span class="nt">&quot;memory_available_mb&quot;</span><span class="p">:</span><span class="w"> </span><span class="mi">32768</span><span class="p">,</span>
+<span class="w">    </span><span class="nt">&quot;memory_used_percent&quot;</span><span class="p">:</span><span class="w"> </span><span class="mf">31.7</span>
+<span class="w">  </span><span class="p">},</span>
+<span class="w">  </span><span class="nt">&quot;pipeline&quot;</span><span class="p">:</span><span class="w"> </span><span class="p">{</span>
+<span class="w">    </span><span class="nt">&quot;scripts_ready&quot;</span><span class="p">:</span><span class="w"> </span><span class="kc">true</span><span class="p">,</span>
+<span class="w">    </span><span class="nt">&quot;scripts_count&quot;</span><span class="p">:</span><span class="w"> </span><span class="mi">345</span><span class="p">,</span>
+<span class="w">    </span><span class="nt">&quot;processors&quot;</span><span class="p">:</span><span class="w"> </span><span class="p">{</span>
+<span class="w">      </span><span class="nt">&quot;asr&quot;</span><span class="p">:</span><span class="w"> </span><span class="kc">true</span><span class="p">,</span>
+<span class="w">      </span><span class="nt">&quot;yolo&quot;</span><span class="p">:</span><span class="w"> </span><span class="kc">true</span><span class="p">,</span>
+<span class="w">      </span><span class="nt">&quot;face&quot;</span><span class="p">:</span><span class="w"> </span><span class="kc">true</span><span class="p">,</span>
+<span class="w">      </span><span class="nt">&quot;pose&quot;</span><span class="p">:</span><span class="w"> </span><span class="kc">true</span><span class="p">,</span>
+<span class="w">      </span><span class="nt">&quot;ocr&quot;</span><span class="p">:</span><span class="w"> </span><span class="kc">true</span><span class="p">,</span>
+<span class="w">      </span><span class="nt">&quot;cut&quot;</span><span class="p">:</span><span class="w"> </span><span class="kc">true</span><span class="p">,</span>
+<span class="w">      </span><span class="nt">&quot;scene&quot;</span><span class="p">:</span><span class="w"> </span><span class="kc">true</span><span class="p">,</span>
+<span class="w">      </span><span class="nt">&quot;asrx&quot;</span><span class="p">:</span><span class="w"> </span><span class="kc">true</span><span class="p">,</span>
+<span class="w">      </span><span class="nt">&quot;visual_chunk&quot;</span><span class="p">:</span><span class="w"> </span><span class="kc">true</span>
+<span class="w">    </span><span class="p">},</span>
+<span class="w">    </span><span class="nt">&quot;models_ready&quot;</span><span class="p">:</span><span class="w"> </span><span class="kc">true</span><span class="p">,</span>
+<span class="w">    </span><span class="nt">&quot;models_count&quot;</span><span class="p">:</span><span class="w"> </span><span class="mi">42</span><span class="p">,</span>
+<span class="w">    </span><span class="nt">&quot;scripts_integrity&quot;</span><span class="p">:</span><span class="w"> </span><span class="p">{</span><span class="nt">&quot;matched&quot;</span><span class="p">:</span><span class="w"> </span><span class="mi">332</span><span class="p">,</span><span class="w"> </span><span class="nt">&quot;total&quot;</span><span class="p">:</span><span class="w"> </span><span class="mi">345</span><span class="p">,</span><span class="w"> </span><span class="nt">&quot;ok&quot;</span><span class="p">:</span><span class="w"> </span><span class="kc">false</span><span class="p">},</span>
+<span class="w">    </span><span class="nt">&quot;ffmpeg&quot;</span><span class="p">:</span><span class="w"> </span><span class="kc">true</span>
+<span class="w">  </span><span class="p">},</span>
+<span class="w">  </span><span class="nt">&quot;schema&quot;</span><span class="p">:</span><span class="w"> </span><span class="p">{</span>
+<span class="w">    </span><span class="nt">&quot;table_exists&quot;</span><span class="p">:</span><span class="w"> </span><span class="kc">true</span><span class="p">,</span>
+<span class="w">    </span><span class="nt">&quot;applied&quot;</span><span class="p">:</span><span class="w"> </span><span class="p">[{</span><span class="nt">&quot;filename&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;migrate_add_users_table.sql&quot;</span><span class="p">}],</span>
+<span class="w">    </span><span class="nt">&quot;required&quot;</span><span class="p">:</span><span class="w"> </span><span class="p">[],</span>
+<span class="w">    </span><span class="nt">&quot;ok&quot;</span><span class="p">:</span><span class="w"> </span><span class="kc">true</span>
+<span class="w">  </span><span class="p">},</span>
+<span class="w">  </span><span class="nt">&quot;identities&quot;</span><span class="p">:</span><span class="w"> </span><span class="p">{</span>
+<span class="w">    </span><span class="nt">&quot;directory_exists&quot;</span><span class="p">:</span><span class="w"> </span><span class="kc">true</span><span class="p">,</span>
+<span class="w">    </span><span class="nt">&quot;files_count&quot;</span><span class="p">:</span><span class="w"> </span><span class="mi">3481</span><span class="p">,</span>
+<span class="w">    </span><span class="nt">&quot;index_ok&quot;</span><span class="p">:</span><span class="w"> </span><span class="kc">true</span><span class="p">,</span>
+<span class="w">    </span><span class="nt">&quot;db_count&quot;</span><span class="p">:</span><span class="w"> </span><span class="mi">3481</span><span class="p">,</span>
+<span class="w">    </span><span class="nt">&quot;synced&quot;</span><span class="p">:</span><span class="w"> </span><span class="kc">true</span>
+<span class="w">  </span><span class="p">},</span>
+<span class="w">  </span><span class="nt">&quot;integrations&quot;</span><span class="p">:</span><span class="w"> </span><span class="p">{</span>
+<span class="w">    </span><span class="nt">&quot;tmdb&quot;</span><span class="p">:</span><span class="w"> </span><span class="p">{</span>
+<span class="w">      </span><span class="nt">&quot;api_key_configured&quot;</span><span class="p">:</span><span class="w"> </span><span class="kc">false</span><span class="p">,</span>
+<span class="w">      </span><span class="nt">&quot;enabled&quot;</span><span class="p">:</span><span class="w"> </span><span class="kc">false</span><span class="p">,</span>
+<span class="w">      </span><span class="nt">&quot;api_reachable&quot;</span><span class="p">:</span><span class="w"> </span><span class="kc">null</span>
+<span class="w">    </span><span class="p">}</span>
+<span class="w">  </span><span class="p">}</span>
+<span class="p">}</span>
+</code></pre></div>
+
+<h4>Response Fields</h4>
+<table class="table">
+<thead>
+<tr>
+<th>Field</th>
+<th>Type</th>
+<th>Description</th>
+</tr>
+</thead>
+<tbody>
+<tr>
+<td><code>status</code></td>
+<td>string</td>
+<td><code>ok</code> if all essential services are healthy</td>
+</tr>
+<tr>
+<td><code>services</code></td>
+<td>object</td>
+<td>Per-service status (postgres, redis, qdrant)</td>
+</tr>
+<tr>
+<td><code>services.*.status</code></td>
+<td>string</td>
+<td><code>ok</code>, <code>error</code>, or <code>degraded</code></td>
+</tr>
+<tr>
+<td><code>services.*.latency_ms</code></td>
+<td>int</td>
+<td>Response time in milliseconds</td>
+</tr>
+<tr>
+<td><code>resources</code></td>
+<td>object</td>
+<td>CPU, memory usage</td>
+</tr>
+<tr>
+<td><code>pipeline.scripts_ready</code></td>
+<td>boolean</td>
+<td>Scripts directory accessible</td>
+</tr>
+<tr>
+<td><code>pipeline.scripts_count</code></td>
+<td>int</td>
+<td>Number of Python processor scripts</td>
+</tr>
+<tr>
+<td><code>pipeline.processors</code></td>
+<td>object</td>
+<td>Per-processor availability</td>
+</tr>
+<tr>
+<td><code>pipeline.models_ready</code></td>
+<td>boolean</td>
+<td>Models directory accessible</td>
+</tr>
+<tr>
+<td><code>pipeline.scripts_integrity</code></td>
+<td>object</td>
+<td>SHA256 checksum verification results</td>
+</tr>
+<tr>
+<td><code>schema.ok</code></td>
+<td>boolean</td>
+<td>All required migrations applied</td>
+</tr>
+<tr>
+<td><code>identities.synced</code></td>
+<td>boolean</td>
+<td>Identity file count matches DB count</td>
+</tr>
+<tr>
+<td><code>integrations.tmdb</code></td>
+<td>object</td>
+<td>TMDb API key config and reachability</td>
+</tr>
+</tbody>
+</table>
+<h4>Health status rules</h4>
+<table class="table">
+<thead>
+<tr>
+<th>Condition</th>
+<th>status</th>
+</tr>
+</thead>
+<tbody>
+<tr>
+<td>All services ok</td>
+<td><code>ok</code></td>
+</tr>
+<tr>
+<td>Any service error</td>
+<td><code>degraded</code></td>
+</tr>
+<tr>
+<td>Postgres or Redis error</td>
+<td><code>degraded</code> (server still responds)</td>
+</tr>
+</tbody>
+</table>
+<hr />
+<h3>Stats Endpoints</h3>
+<table class="table">
+<thead>
+<tr>
+<th>Method</th>
+<th>Endpoint</th>
+<th>Auth</th>
+<th>Description</th>
+</tr>
+</thead>
+<tbody>
+<tr>
+<td>GET</td>
+<td><code>/api/v1/stats/sftpgo</code></td>
+<td>No</td>
+<td>SFTPGo service status</td>
+</tr>
+</tbody>
+</table>
+</div>
+</body>
+</html>
\ No newline at end of file
diff --git a/deliverable_v1.1.0/html_docs/doc/03_register.html b/deliverable_v1.1.0/html_docs/doc/03_register.html
new file mode 100644
index 0000000..8e211ba
--- /dev/null
+++ b/deliverable_v1.1.0/html_docs/doc/03_register.html
@@ -0,0 +1,444 @@
+<!DOCTYPE html>
+<html lang="en">
+<head>
+<meta charset="UTF-8">
+<title>03 Register - Momentry API Docs</title>
+<style>
+* { margin: 0; padding: 0; box-sizing: border-box; }
+body { font-family: -apple-system, BlinkMacSystemFont, 'Segoe UI', Roboto, sans-serif; background: #f5f5f5; color: #333; padding: 40px; }
+.container { max-width: 960px; margin: 0 auto; background: white; border-radius: 12px; box-shadow: 0 2px 12px rgba(0,0,0,0.08); padding: 40px; }
+h1 { font-size: 24px; margin: 24px 0 12px; }
+h2 { font-size: 20px; margin: 20px 0 10px; color: #222; }
+h3 { font-size: 16px; margin: 16px 0 8px; color: #444; }
+p { line-height: 1.6; margin: 8px 0; }
+table { border-collapse: collapse; width: 100%; margin: 12px 0; font-size: 14px; }
+th, td { border: 1px solid #ddd; padding: 8px 12px; text-align: left; }
+th { background: #f0f0f0; font-weight: 600; }
+code { background: #f0f0f0; padding: 2px 6px; border-radius: 3px; font-size: 13px; }
+pre { background: #f8f8f8; border: 1px solid #ddd; border-radius: 6px; padding: 12px; overflow-x: auto; margin: 12px 0; }
+pre code { background: none; padding: 0; }
+a { color: #0066cc; }
+.back { display: inline-block; margin-bottom: 20px; color: #666; }
+.back:hover { color: #333; }
+</style>
+</head>
+<body>
+<div class="container">
+<a class="back" href="index.html">&larr; Back to index</a>
+<!-- module: register -->
+<!-- description: File registration — register, scan -->
+<!-- depends: 01_auth -->
+
+<h2>File Registration</h2>
+<h3><code>POST /api/v1/files/register</code></h3>
+<p><strong>Auth</strong>: Required<br />
+<strong>Scope</strong>: file-level</p>
+<p>Register a video file for processing. Returns the file's metadata and UUID.</p>
+<p><strong>New in v0.1.2</strong>: Registration now <strong>automatically triggers the processing pipeline</strong> — no need to call <code>POST /api/v1/file/:file_uuid/process</code> separately. The system will:</p><ol>
+<li>Register the file and run ffprobe</li>
+<li>Auto-run offline TMDb probe (reads local identity files, no API calls)</li>
+<li>Create a monitor job for the worker</li>
+<li>Worker starts all 10 processors (Cut → ASR → ASRX → YOLO → OCR → Face → Pose → VisualChunk → Story → 5W1H)</li></ol>
+<p>If the file already exists (same content hash), returns the existing record with <code>already_exists: true</code>.</p>
+<h4>Request Parameters</h4>
+<table class="table">
+<thead>
+<tr>
+<th>Field</th>
+<th>Type</th>
+<th>Required</th>
+<th>Default</th>
+<th>Description</th>
+</tr>
+</thead>
+<tbody>
+<tr>
+<td><code>file_path</code></td>
+<td>string</td>
+<td>Yes</td>
+<td>—</td>
+<td>Path to video file on disk</td>
+</tr>
+<tr>
+<td><code>pattern</code></td>
+<td>string</td>
+<td>No</td>
+<td>—</td>
+<td>Regex pattern for batch register (requires <code>file_path</code> to be a directory)</td>
+</tr>
+<tr>
+<td><code>user_id</code></td>
+<td>integer</td>
+<td>No</td>
+<td>—</td>
+<td>User ID to associate with registration</td>
+</tr>
+<tr>
+<td><code>content_hash</code></td>
+<td>string</td>
+<td>No</td>
+<td>—</td>
+<td>Pre-computed SHA-256 hash (skips computation)</td>
+</tr>
+</tbody>
+</table>
+<h4>Example</h4>
+<div class="codehilite"><pre><span></span><code><span class="c1"># Register a single file</span>
+curl<span class="w"> </span>-s<span class="w"> </span>-X<span class="w"> </span>POST<span class="w"> </span><span class="s2">&quot;</span><span class="nv">$API</span><span class="s2">/api/v1/files/register&quot;</span><span class="w"> </span><span class="se">\</span>
+<span class="w">  </span>-H<span class="w"> </span><span class="s2">&quot;Content-Type: application/json&quot;</span><span class="w"> </span><span class="se">\</span>
+<span class="w">  </span>-H<span class="w"> </span><span class="s2">&quot;X-API-Key: </span><span class="nv">$KEY</span><span class="s2">&quot;</span><span class="w"> </span><span class="se">\</span>
+<span class="w">  </span>-d<span class="w"> </span><span class="s1">&#39;{&quot;file_path&quot;: &quot;/path/to/video.mp4&quot;}&#39;</span>
+
+<span class="c1"># Batch register files matching a pattern in a directory</span>
+curl<span class="w"> </span>-s<span class="w"> </span>-X<span class="w"> </span>POST<span class="w"> </span><span class="s2">&quot;</span><span class="nv">$API</span><span class="s2">/api/v1/files/register&quot;</span><span class="w"> </span><span class="se">\</span>
+<span class="w">  </span>-H<span class="w"> </span><span class="s2">&quot;Content-Type: application/json&quot;</span><span class="w"> </span><span class="se">\</span>
+<span class="w">  </span>-H<span class="w"> </span><span class="s2">&quot;X-API-Key: </span><span class="nv">$KEY</span><span class="s2">&quot;</span><span class="w"> </span><span class="se">\</span>
+<span class="w">  </span>-d<span class="w"> </span><span class="s1">&#39;{&quot;file_path&quot;: &quot;/path/to/dir&quot;, &quot;pattern&quot;: &quot;.*\\.mp4$&quot;}&#39;</span>
+</code></pre></div>
+
+<h4>Response (200)</h4>
+<div class="codehilite"><pre><span></span><code><span class="p">{</span>
+<span class="w">  </span><span class="nt">&quot;success&quot;</span><span class="p">:</span><span class="w"> </span><span class="kc">true</span><span class="p">,</span>
+<span class="w">  </span><span class="nt">&quot;file_uuid&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;3a6c1865...&quot;</span><span class="p">,</span>
+<span class="w">  </span><span class="nt">&quot;file_name&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;video.mp4&quot;</span><span class="p">,</span>
+<span class="w">  </span><span class="nt">&quot;file_path&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;/path/to/video.mp4&quot;</span><span class="p">,</span>
+<span class="w">  </span><span class="nt">&quot;file_type&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;video&quot;</span><span class="p">,</span>
+<span class="w">  </span><span class="nt">&quot;duration&quot;</span><span class="p">:</span><span class="w"> </span><span class="mf">120.5</span><span class="p">,</span>
+<span class="w">  </span><span class="nt">&quot;width&quot;</span><span class="p">:</span><span class="w"> </span><span class="mi">1920</span><span class="p">,</span>
+<span class="w">  </span><span class="nt">&quot;height&quot;</span><span class="p">:</span><span class="w"> </span><span class="mi">1080</span><span class="p">,</span>
+<span class="w">  </span><span class="nt">&quot;fps&quot;</span><span class="p">:</span><span class="w"> </span><span class="mf">24.0</span><span class="p">,</span>
+<span class="w">  </span><span class="nt">&quot;total_frames&quot;</span><span class="p">:</span><span class="w"> </span><span class="mi">2892</span><span class="p">,</span>
+<span class="w">  </span><span class="nt">&quot;already_exists&quot;</span><span class="p">:</span><span class="w"> </span><span class="kc">false</span><span class="p">,</span>
+<span class="w">  </span><span class="nt">&quot;message&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;File registered successfully&quot;</span>
+<span class="p">}</span>
+</code></pre></div>
+
+<table class="table">
+<thead>
+<tr>
+<th>Field</th>
+<th>Type</th>
+<th>Description</th>
+</tr>
+</thead>
+<tbody>
+<tr>
+<td><code>success</code></td>
+<td>boolean</td>
+<td>Always true on 200</td>
+</tr>
+<tr>
+<td><code>file_uuid</code></td>
+<td>string</td>
+<td>32-char hex UUID of the registered file</td>
+</tr>
+<tr>
+<td><code>file_name</code></td>
+<td>string</td>
+<td>File name (auto-renamed if name conflict)</td>
+</tr>
+<tr>
+<td><code>file_path</code></td>
+<td>string</td>
+<td>Canonical path on disk</td>
+</tr>
+<tr>
+<td><code>file_type</code></td>
+<td>string</td>
+<td><code>"video"</code>, <code>"audio"</code>, or <code>"unknown"</code></td>
+</tr>
+<tr>
+<td><code>duration</code></td>
+<td>float</td>
+<td>Duration in seconds</td>
+</tr>
+<tr>
+<td><code>width</code></td>
+<td>integer</td>
+<td>Video width in pixels</td>
+</tr>
+<tr>
+<td><code>height</code></td>
+<td>integer</td>
+<td>Video height in pixels</td>
+</tr>
+<tr>
+<td><code>fps</code></td>
+<td>float</td>
+<td>Frames per second</td>
+</tr>
+<tr>
+<td><code>total_frames</code></td>
+<td>integer</td>
+<td>Total frame count</td>
+</tr>
+<tr>
+<td><code>already_exists</code></td>
+<td>boolean</td>
+<td>True if same content was already registered</td>
+</tr>
+<tr>
+<td><code>message</code></td>
+<td>string</td>
+<td>Human-readable status</td>
+</tr>
+</tbody>
+</table>
+<h4>Error Responses</h4>
+<table class="table">
+<thead>
+<tr>
+<th>HTTP</th>
+<th>When</th>
+</tr>
+</thead>
+<tbody>
+<tr>
+<td><code>401</code></td>
+<td>Missing or invalid API key</td>
+</tr>
+<tr>
+<td><code>400</code></td>
+<td>Invalid request body</td>
+</tr>
+<tr>
+<td><code>404</code></td>
+<td>File path does not exist</td>
+</tr>
+</tbody>
+</table>
+<hr />
+<h3><code>GET /api/v1/files/scan</code></h3>
+<p><strong>Auth</strong>: Required<br />
+<strong>Scope</strong>: file-level</p>
+<p>Scan the filesystem directory and list all media files, showing which are registered, processing, or unregistered.</p>
+<h4>Query Parameters</h4>
+<table class="table">
+<thead>
+<tr>
+<th>Field</th>
+<th>Type</th>
+<th>Required</th>
+<th>Default</th>
+<th>Description</th>
+</tr>
+</thead>
+<tbody>
+<tr>
+<td><code>page</code></td>
+<td>integer</td>
+<td>No</td>
+<td>1</td>
+<td>Page number (1-based)</td>
+</tr>
+<tr>
+<td><code>page_size</code></td>
+<td>integer</td>
+<td>No</td>
+<td>all</td>
+<td>Items per page (alias: <code>limit</code>)</td>
+</tr>
+<tr>
+<td><code>limit</code></td>
+<td>integer</td>
+<td>No</td>
+<td>all</td>
+<td>Max items (alias for <code>page_size</code>)</td>
+</tr>
+<tr>
+<td><code>pattern</code></td>
+<td>string</td>
+<td>No</td>
+<td>—</td>
+<td>Regex filter on file name (e.g., <code>.*\.mp4$</code>)</td>
+</tr>
+<tr>
+<td><code>sort_by</code></td>
+<td>string</td>
+<td>No</td>
+<td><code>name</code></td>
+<td>Sort field: <code>name</code>, <code>size</code>, <code>modified</code>, <code>status</code></td>
+</tr>
+<tr>
+<td><code>sort_order</code></td>
+<td>string</td>
+<td>No</td>
+<td><code>asc</code></td>
+<td>Sort direction: <code>asc</code> or <code>desc</code></td>
+</tr>
+</tbody>
+</table>
+<h4>Example</h4>
+<div class="codehilite"><pre><span></span><code><span class="c1"># Full scan</span>
+curl<span class="w"> </span>-s<span class="w"> </span><span class="s2">&quot;</span><span class="nv">$API</span><span class="s2">/api/v1/files/scan&quot;</span><span class="w"> </span>-H<span class="w"> </span><span class="s2">&quot;X-API-Key: </span><span class="nv">$KEY</span><span class="s2">&quot;</span><span class="w"> </span><span class="p">|</span><span class="w"> </span>jq<span class="w"> </span><span class="s1">&#39;{total, registered_count, unregistered_count}&#39;</span>
+
+<span class="c1"># Paginated (page 1, 5 per page)</span>
+curl<span class="w"> </span>-s<span class="w"> </span><span class="s2">&quot;</span><span class="nv">$API</span><span class="s2">/api/v1/files/scan?page=1&amp;page_size=5&quot;</span><span class="w"> </span>-H<span class="w"> </span><span class="s2">&quot;X-API-Key: </span><span class="nv">$KEY</span><span class="s2">&quot;</span><span class="w"> </span><span class="p">|</span><span class="w"> </span>jq<span class="w"> </span><span class="s1">&#39;{page, total_pages, files: [.files[].file_name]}&#39;</span>
+
+<span class="c1"># Regex filter: only mp4 files</span>
+curl<span class="w"> </span>-s<span class="w"> </span><span class="s2">&quot;</span><span class="nv">$API</span><span class="s2">/api/v1/files/scan?pattern=.*\\.mp4</span>$<span class="s2">&quot;</span><span class="w"> </span>-H<span class="w"> </span><span class="s2">&quot;X-API-Key: </span><span class="nv">$KEY</span><span class="s2">&quot;</span><span class="w"> </span><span class="p">|</span><span class="w"> </span>jq<span class="w"> </span><span class="s1">&#39;{filtered_total, files: [.files[].file_name]}&#39;</span>
+
+<span class="c1"># Sort by file size (largest first)</span>
+curl<span class="w"> </span>-s<span class="w"> </span><span class="s2">&quot;</span><span class="nv">$API</span><span class="s2">/api/v1/files/scan?sort_by=size&amp;sort_order=desc&amp;page_size=5&quot;</span><span class="w"> </span>-H<span class="w"> </span><span class="s2">&quot;X-API-Key: </span><span class="nv">$KEY</span><span class="s2">&quot;</span><span class="w"> </span><span class="p">|</span><span class="w"> </span>jq<span class="w"> </span><span class="s1">&#39;[.files[] | {file_name, file_size}]&#39;</span>
+
+<span class="c1"># Sort by modified time (most recent first)</span>
+curl<span class="w"> </span>-s<span class="w"> </span><span class="s2">&quot;</span><span class="nv">$API</span><span class="s2">/api/v1/files/scan?sort_by=modified&amp;sort_order=desc&amp;page_size=5&quot;</span><span class="w"> </span>-H<span class="w"> </span><span class="s2">&quot;X-API-Key: </span><span class="nv">$KEY</span><span class="s2">&quot;</span><span class="w"> </span><span class="p">|</span><span class="w"> </span>jq<span class="w"> </span><span class="s1">&#39;[.files[] | {file_name, modified_time}]&#39;</span>
+
+<span class="c1"># Sort by status</span>
+curl<span class="w"> </span>-s<span class="w"> </span><span class="s2">&quot;</span><span class="nv">$API</span><span class="s2">/api/v1/files/scan?sort_by=status&amp;page_size=5&quot;</span><span class="w"> </span>-H<span class="w"> </span><span class="s2">&quot;X-API-Key: </span><span class="nv">$KEY</span><span class="s2">&quot;</span><span class="w"> </span><span class="p">|</span><span class="w"> </span>jq<span class="w"> </span><span class="s1">&#39;[.files[] | {file_name, status}]&#39;</span>
+</code></pre></div>
+
+<h4>Response (200)</h4>
+<div class="codehilite"><pre><span></span><code><span class="p">{</span>
+<span class="w">  </span><span class="nt">&quot;files&quot;</span><span class="p">:</span><span class="w"> </span><span class="p">[</span>
+<span class="w">    </span><span class="p">{</span>
+<span class="w">      </span><span class="nt">&quot;file_name&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;video.mp4&quot;</span><span class="p">,</span>
+<span class="w">      </span><span class="nt">&quot;file_size&quot;</span><span class="p">:</span><span class="w"> </span><span class="mi">12345678</span><span class="p">,</span>
+<span class="w">      </span><span class="nt">&quot;is_registered&quot;</span><span class="p">:</span><span class="w"> </span><span class="kc">true</span><span class="p">,</span>
+<span class="w">      </span><span class="nt">&quot;file_uuid&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;3a6c1865...&quot;</span><span class="p">,</span>
+<span class="w">      </span><span class="nt">&quot;status&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;completed&quot;</span><span class="p">,</span>
+<span class="w">      </span><span class="nt">&quot;registration_time&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;2026-05-16T12:00:00Z&quot;</span><span class="p">,</span>
+<span class="w">      </span><span class="nt">&quot;job_id&quot;</span><span class="p">:</span><span class="w"> </span><span class="mi">42</span>
+<span class="w">    </span><span class="p">}</span>
+<span class="w">  </span><span class="p">],</span>
+<span class="w">  </span><span class="nt">&quot;total&quot;</span><span class="p">:</span><span class="w"> </span><span class="mi">107</span><span class="p">,</span>
+<span class="w">  </span><span class="nt">&quot;filtered_total&quot;</span><span class="p">:</span><span class="w"> </span><span class="mi">80</span><span class="p">,</span>
+<span class="w">  </span><span class="nt">&quot;page&quot;</span><span class="p">:</span><span class="w"> </span><span class="mi">1</span><span class="p">,</span>
+<span class="w">  </span><span class="nt">&quot;page_size&quot;</span><span class="p">:</span><span class="w"> </span><span class="mi">20</span><span class="p">,</span>
+<span class="w">  </span><span class="nt">&quot;total_pages&quot;</span><span class="p">:</span><span class="w"> </span><span class="mi">4</span><span class="p">,</span>
+<span class="w">  </span><span class="nt">&quot;registered_count&quot;</span><span class="p">:</span><span class="w"> </span><span class="mi">26</span><span class="p">,</span>
+<span class="w">  </span><span class="nt">&quot;unregistered_count&quot;</span><span class="p">:</span><span class="w"> </span><span class="mi">81</span>
+<span class="p">}</span>
+</code></pre></div>
+
+<table class="table">
+<thead>
+<tr>
+<th>Field</th>
+<th>Type</th>
+<th>Description</th>
+</tr>
+</thead>
+<tbody>
+<tr>
+<td><code>files</code></td>
+<td>array</td>
+<td>Array of file info objects (paginated)</td>
+</tr>
+<tr>
+<td><code>files[].file_name</code></td>
+<td>string</td>
+<td>File name</td>
+</tr>
+<tr>
+<td><code>files[].relative_path</code></td>
+<td>string</td>
+<td>Path relative to scan root</td>
+</tr>
+<tr>
+<td><code>files[].file_path</code></td>
+<td>string</td>
+<td>Absolute path on disk</td>
+</tr>
+<tr>
+<td><code>files[].file_size</code></td>
+<td>integer</td>
+<td>File size in bytes</td>
+</tr>
+<tr>
+<td><code>files[].modified_time</code></td>
+<td>string</td>
+<td>Last modified timestamp (ISO 8601)</td>
+</tr>
+<tr>
+<td><code>files[].is_registered</code></td>
+<td>boolean</td>
+<td>Whether file is registered in DB</td>
+</tr>
+<tr>
+<td><code>files[].file_uuid</code></td>
+<td>string</td>
+<td>32-char hex UUID (only if registered)</td>
+</tr>
+<tr>
+<td><code>files[].status</code></td>
+<td>string</td>
+<td><code>"completed"</code>, <code>"processing"</code>, <code>"registered"</code>, <code>"unregistered"</code>, or <code>null</code></td>
+</tr>
+<tr>
+<td><code>files[].registration_time</code></td>
+<td>string</td>
+<td>DB registration timestamp (only if registered)</td>
+</tr>
+<tr>
+<td><code>files[].job_id</code></td>
+<td>integer</td>
+<td>Processing job ID (only if a job exists)</td>
+</tr>
+<tr>
+<td><code>total</code></td>
+<td>integer</td>
+<td>Total files found on disk (unfiltered)</td>
+</tr>
+<tr>
+<td><code>filtered_total</code></td>
+<td>integer</td>
+<td>Files matching regex filter</td>
+</tr>
+<tr>
+<td><code>page</code></td>
+<td>integer</td>
+<td>Current page number</td>
+</tr>
+<tr>
+<td><code>page_size</code></td>
+<td>integer</td>
+<td>Items per page</td>
+</tr>
+<tr>
+<td><code>total_pages</code></td>
+<td>integer</td>
+<td>Total pages</td>
+</tr>
+<tr>
+<td><code>registered_count</code></td>
+<td>integer</td>
+<td>Files registered in DB</td>
+</tr>
+<tr>
+<td><code>unregistered_count</code></td>
+<td>integer</td>
+<td>Files not yet registered</td>
+</tr>
+</tbody>
+</table>
+<h4>Notes</h4>
+<table class="table">
+<thead>
+<tr>
+<th>Feature</th>
+<th>Behavior</th>
+</tr>
+</thead>
+<tbody>
+<tr>
+<td><strong>Regex</strong></td>
+<td>Case-insensitive (<code>(?i)</code> prefix auto-applied). Applied to <code>file_name</code>.</td>
+</tr>
+<tr>
+<td><strong>Sort order</strong></td>
+<td>Default (<code>sort_by=name</code>): registered files first, then alphabetically. <code>sort_by=status</code>: alphabetical by status string.</td>
+</tr>
+<tr>
+<td><strong>Pagination</strong></td>
+<td><code>page_size</code> and <code>limit</code> are aliases. Default: show all results.</td>
+</tr>
+<tr>
+<td><strong>Processing order</strong></td>
+<td><code>pattern</code> regex filter → <code>sort_by</code>/<code>sort_order</code> → <code>page</code>/<code>page_size</code> slice.</td>
+</tr>
+</tbody>
+</table>
+</div>
+</body>
+</html>
\ No newline at end of file
diff --git a/deliverable_v1.1.0/html_docs/doc/04_lookup.html b/deliverable_v1.1.0/html_docs/doc/04_lookup.html
new file mode 100644
index 0000000..1ce9106
--- /dev/null
+++ b/deliverable_v1.1.0/html_docs/doc/04_lookup.html
@@ -0,0 +1,291 @@
+<!DOCTYPE html>
+<html lang="en">
+<head>
+<meta charset="UTF-8">
+<title>04 Lookup - Momentry API Docs</title>
+<style>
+* { margin: 0; padding: 0; box-sizing: border-box; }
+body { font-family: -apple-system, BlinkMacSystemFont, 'Segoe UI', Roboto, sans-serif; background: #f5f5f5; color: #333; padding: 40px; }
+.container { max-width: 960px; margin: 0 auto; background: white; border-radius: 12px; box-shadow: 0 2px 12px rgba(0,0,0,0.08); padding: 40px; }
+h1 { font-size: 24px; margin: 24px 0 12px; }
+h2 { font-size: 20px; margin: 20px 0 10px; color: #222; }
+h3 { font-size: 16px; margin: 16px 0 8px; color: #444; }
+p { line-height: 1.6; margin: 8px 0; }
+table { border-collapse: collapse; width: 100%; margin: 12px 0; font-size: 14px; }
+th, td { border: 1px solid #ddd; padding: 8px 12px; text-align: left; }
+th { background: #f0f0f0; font-weight: 600; }
+code { background: #f0f0f0; padding: 2px 6px; border-radius: 3px; font-size: 13px; }
+pre { background: #f8f8f8; border: 1px solid #ddd; border-radius: 6px; padding: 12px; overflow-x: auto; margin: 12px 0; }
+pre code { background: none; padding: 0; }
+a { color: #0066cc; }
+.back { display: inline-block; margin-bottom: 20px; color: #666; }
+.back:hover { color: #333; }
+</style>
+</head>
+<body>
+<div class="container">
+<a class="back" href="index.html">&larr; Back to index</a>
+<!-- module: lookup -->
+<!-- description: File lookup by name and unregistration -->
+<!-- depends: 01_auth, 03_register -->
+
+<h2>File Lookup</h2>
+<h3><code>GET /api/v1/files/lookup</code></h3>
+<p><strong>Auth</strong>: Required<br />
+<strong>Scope</strong>: file-level</p>
+<p>Search registered files by file name. Performs a case-insensitive LIKE search on the file name column. Returns basic info about matching files.</p>
+<h4>Query Parameters</h4>
+<table class="table">
+<thead>
+<tr>
+<th>Field</th>
+<th>Type</th>
+<th>Required</th>
+<th>Description</th>
+</tr>
+</thead>
+<tbody>
+<tr>
+<td><code>file_name</code></td>
+<td>string</td>
+<td>Yes</td>
+<td>File name to search for (partial matches supported)</td>
+</tr>
+</tbody>
+</table>
+<h4>Example</h4>
+<div class="codehilite"><pre><span></span><code><span class="c1"># Look up a specific file</span>
+curl<span class="w"> </span>-s<span class="w"> </span><span class="s2">&quot;</span><span class="nv">$API</span><span class="s2">/api/v1/files/lookup?file_name=video.mp4&quot;</span><span class="w"> </span><span class="se">\</span>
+<span class="w">  </span>-H<span class="w"> </span><span class="s2">&quot;X-API-Key: </span><span class="nv">$KEY</span><span class="s2">&quot;</span>
+
+<span class="c1"># Partial name search</span>
+curl<span class="w"> </span>-s<span class="w"> </span><span class="s2">&quot;</span><span class="nv">$API</span><span class="s2">/api/v1/files/lookup?file_name=charade&quot;</span><span class="w"> </span><span class="se">\</span>
+<span class="w">  </span>-H<span class="w"> </span><span class="s2">&quot;X-API-Key: </span><span class="nv">$KEY</span><span class="s2">&quot;</span><span class="w"> </span><span class="p">|</span><span class="w"> </span>jq<span class="w"> </span><span class="s1">&#39;.matches[].file_name&#39;</span>
+</code></pre></div>
+
+<h4>Response (200)</h4>
+<div class="codehilite"><pre><span></span><code><span class="p">{</span>
+<span class="w">  </span><span class="nt">&quot;file_name&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;video.mp4&quot;</span><span class="p">,</span>
+<span class="w">  </span><span class="nt">&quot;exists&quot;</span><span class="p">:</span><span class="w"> </span><span class="kc">true</span><span class="p">,</span>
+<span class="w">  </span><span class="nt">&quot;matches&quot;</span><span class="p">:</span><span class="w"> </span><span class="p">[</span>
+<span class="w">    </span><span class="p">{</span>
+<span class="w">      </span><span class="nt">&quot;file_uuid&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;a03485a40b2df2d3...&quot;</span><span class="p">,</span>
+<span class="w">      </span><span class="nt">&quot;file_name&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;video.mp4&quot;</span><span class="p">,</span>
+<span class="w">      </span><span class="nt">&quot;file_type&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;video&quot;</span><span class="p">,</span>
+<span class="w">      </span><span class="nt">&quot;status&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;completed&quot;</span>
+<span class="w">    </span><span class="p">}</span>
+<span class="w">  </span><span class="p">],</span>
+<span class="w">  </span><span class="nt">&quot;next_name&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;video (2).mp4&quot;</span>
+<span class="p">}</span>
+</code></pre></div>
+
+<table class="table">
+<thead>
+<tr>
+<th>Field</th>
+<th>Type</th>
+<th>Description</th>
+</tr>
+</thead>
+<tbody>
+<tr>
+<td><code>file_name</code></td>
+<td>string</td>
+<td>Searched name</td>
+</tr>
+<tr>
+<td><code>exists</code></td>
+<td>boolean</td>
+<td>Whether an exact name match exists</td>
+</tr>
+<tr>
+<td><code>matches</code></td>
+<td>array</td>
+<td>Array of matching registered files</td>
+</tr>
+<tr>
+<td><code>matches[].file_uuid</code></td>
+<td>string</td>
+<td>32-char hex UUID</td>
+</tr>
+<tr>
+<td><code>matches[].file_name</code></td>
+<td>string</td>
+<td>Registered file name</td>
+</tr>
+<tr>
+<td><code>matches[].file_type</code></td>
+<td>string</td>
+<td><code>"video"</code>, <code>"audio"</code>, or <code>null</code></td>
+</tr>
+<tr>
+<td><code>matches[].status</code></td>
+<td>string</td>
+<td>Registration/processing status</td>
+</tr>
+<tr>
+<td><code>next_name</code></td>
+<td>string</td>
+<td>Suggested alternative name that avoids a conflict with existing files</td>
+</tr>
+</tbody>
+</table>
+<hr />
+<h2>Unregister</h2>
+<h3><code>POST /api/v1/unregister</code></h3>
+<p><strong>Auth</strong>: Required<br />
+<strong>Scope</strong>: file-level</p>
+<p>Delete a registered file from the system. Supports single file by UUID, or batch by directory + regex pattern.</p>
+<h4>What gets deleted</h4>
+<table class="table">
+<thead>
+<tr>
+<th>Removed (default)</th>
+<th>Not removed</th>
+</tr>
+</thead>
+<tbody>
+<tr>
+<td>Database records (videos, chunks, embeddings, processor_results, pre_chunks)</td>
+<td>The original source video file on disk</td>
+</tr>
+<tr>
+<td>Processor output JSON files (<code>{uuid}.*.json</code>) — unless <code>delete_output_files: false</code></td>
+<td>Temp/working directories</td>
+</tr>
+<tr>
+<td>In-memory cache entries</td>
+<td></td>
+</tr>
+<tr>
+<td>MongoDB cached lists</td>
+<td></td>
+</tr>
+</tbody>
+</table>
+<blockquote>
+<p>⚠️ Database deletion is <strong>irreversible</strong>. To keep output files, set <code>"delete_output_files": false</code>.</p>
+</blockquote>
+<h4>Request Parameters</h4>
+<p>A mode must be specified: either <code>file_uuid</code> alone, or <code>file_path</code> + <code>pattern</code> together. Fields marked <code>*</code> below are required only for the mode they belong to.</p>
+<table class="table">
+<thead>
+<tr>
+<th>Field</th>
+<th>Type</th>
+<th>Required</th>
+<th>Default</th>
+<th>Description</th>
+</tr>
+</thead>
+<tbody>
+<tr>
+<td><code>file_uuid</code></td>
+<td>string</td>
+<td>*</td>
+<td>—</td>
+<td>Single file UUID to delete</td>
+</tr>
+<tr>
+<td><code>file_path</code></td>
+<td>string</td>
+<td>*</td>
+<td>—</td>
+<td>Directory path (for batch delete)</td>
+</tr>
+<tr>
+<td><code>pattern</code></td>
+<td>string</td>
+<td>*</td>
+<td>—</td>
+<td>Regex pattern (requires <code>file_path</code>)</td>
+</tr>
+<tr>
+<td><code>delete_output_files</code></td>
+<td>boolean</td>
+<td>No</td>
+<td><code>true</code></td>
+<td>If <code>true</code>, also delete processor output JSON files (<code>{uuid}.*.json</code>). Set to <code>false</code> to keep them.</td>
+</tr>
+</tbody>
+</table>
+<h4>Example</h4>
+<div class="codehilite"><pre><span></span><code><span class="c1"># Delete a single file by UUID (default: also deletes output JSON files)</span>
+curl<span class="w"> </span>-s<span class="w"> </span>-X<span class="w"> </span>POST<span class="w"> </span><span class="s2">&quot;</span><span class="nv">$API</span><span class="s2">/api/v1/unregister&quot;</span><span class="w"> </span><span class="se">\</span>
+<span class="w">  </span>-H<span class="w"> </span><span class="s2">&quot;Content-Type: application/json&quot;</span><span class="w"> </span><span class="se">\</span>
+<span class="w">  </span>-H<span class="w"> </span><span class="s2">&quot;X-API-Key: </span><span class="nv">$KEY</span><span class="s2">&quot;</span><span class="w"> </span><span class="se">\</span>
+<span class="w">  </span>-d<span class="w"> </span><span class="s1">&#39;{&quot;file_uuid&quot;: &quot;&#39;</span><span class="s2">&quot;</span><span class="nv">$FILE_UUID</span><span class="s2">&quot;</span><span class="s1">&#39;&quot;}&#39;</span>
+
+<span class="c1"># Keep output JSON files, only delete DB records</span>
+curl<span class="w"> </span>-s<span class="w"> </span>-X<span class="w"> </span>POST<span class="w"> </span><span class="s2">&quot;</span><span class="nv">$API</span><span class="s2">/api/v1/unregister&quot;</span><span class="w"> </span><span class="se">\</span>
+<span class="w">  </span>-H<span class="w"> </span><span class="s2">&quot;Content-Type: application/json&quot;</span><span class="w"> </span><span class="se">\</span>
+<span class="w">  </span>-H<span class="w"> </span><span class="s2">&quot;X-API-Key: </span><span class="nv">$KEY</span><span class="s2">&quot;</span><span class="w"> </span><span class="se">\</span>
+<span class="w">  </span>-d<span class="w"> </span><span class="s1">&#39;{&quot;file_uuid&quot;: &quot;&#39;</span><span class="s2">&quot;</span><span class="nv">$FILE_UUID</span><span class="s2">&quot;</span><span class="s1">&#39;&quot;, &quot;delete_output_files&quot;: false}&#39;</span>
+
+<span class="c1"># Batch delete all mp4 files in a directory</span>
+curl<span class="w"> </span>-s<span class="w"> </span>-X<span class="w"> </span>POST<span class="w"> </span><span class="s2">&quot;</span><span class="nv">$API</span><span class="s2">/api/v1/unregister&quot;</span><span class="w"> </span><span class="se">\</span>
+<span class="w">  </span>-H<span class="w"> </span><span class="s2">&quot;Content-Type: application/json&quot;</span><span class="w"> </span><span class="se">\</span>
+<span class="w">  </span>-H<span class="w"> </span><span class="s2">&quot;X-API-Key: </span><span class="nv">$KEY</span><span class="s2">&quot;</span><span class="w"> </span><span class="se">\</span>
+<span class="w">  </span>-d<span class="w"> </span><span class="s1">&#39;{&quot;file_path&quot;: &quot;/path/to/dir&quot;, &quot;pattern&quot;: &quot;.*\\.mp4$&quot;}&#39;</span>
+</code></pre></div>
+
+<h4>Response (200)</h4>
+<div class="codehilite"><pre><span></span><code><span class="p">{</span>
+<span class="w">  </span><span class="nt">&quot;success&quot;</span><span class="p">:</span><span class="w"> </span><span class="kc">true</span><span class="p">,</span>
+<span class="w">  </span><span class="nt">&quot;file_uuid&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;a03485a40b2df2d3...&quot;</span><span class="p">,</span>
+<span class="w">  </span><span class="nt">&quot;message&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;Video unregistered successfully&quot;</span>
+<span class="p">}</span>
+</code></pre></div>
+
+<table class="table">
+<thead>
+<tr>
+<th>Field</th>
+<th>Type</th>
+<th>Description</th>
+</tr>
+</thead>
+<tbody>
+<tr>
+<td><code>success</code></td>
+<td>boolean</td>
+<td>True if deletion succeeded</td>
+</tr>
+<tr>
+<td><code>file_uuid</code></td>
+<td>string</td>
+<td>UUID of the deleted file (single mode)</td>
+</tr>
+<tr>
+<td><code>message</code></td>
+<td>string</td>
+<td>Human-readable status</td>
+</tr>
+</tbody>
+</table>
+<h4>Error Responses</h4>
+<table class="table">
+<thead>
+<tr>
+<th>HTTP</th>
+<th>When</th>
+</tr>
+</thead>
+<tbody>
+<tr>
+<td><code>400</code></td>
+<td>Neither <code>file_uuid</code> nor <code>file_path</code>+<code>pattern</code> provided</td>
+</tr>
+<tr>
+<td><code>404</code></td>
+<td>File UUID not found</td>
+</tr>
+<tr>
+<td><code>401</code></td>
+<td>Missing or invalid API key</td>
+</tr>
+</tbody>
+</table>
+</div>
+</body>
+</html>
\ No newline at end of file
diff --git a/deliverable_v1.1.0/html_docs/doc/05_process.html b/deliverable_v1.1.0/html_docs/doc/05_process.html
new file mode 100644
index 0000000..69cba53
--- /dev/null
+++ b/deliverable_v1.1.0/html_docs/doc/05_process.html
@@ -0,0 +1,505 @@
+<!DOCTYPE html>
+<html lang="en">
+<head>
+<meta charset="UTF-8">
+<title>05 Process - Momentry API Docs</title>
+<style>
+* { margin: 0; padding: 0; box-sizing: border-box; }
+body { font-family: -apple-system, BlinkMacSystemFont, 'Segoe UI', Roboto, sans-serif; background: #f5f5f5; color: #333; padding: 40px; }
+.container { max-width: 960px; margin: 0 auto; background: white; border-radius: 12px; box-shadow: 0 2px 12px rgba(0,0,0,0.08); padding: 40px; }
+h1 { font-size: 24px; margin: 24px 0 12px; }
+h2 { font-size: 20px; margin: 20px 0 10px; color: #222; }
+h3 { font-size: 16px; margin: 16px 0 8px; color: #444; }
+p { line-height: 1.6; margin: 8px 0; }
+table { border-collapse: collapse; width: 100%; margin: 12px 0; font-size: 14px; }
+th, td { border: 1px solid #ddd; padding: 8px 12px; text-align: left; }
+th { background: #f0f0f0; font-weight: 600; }
+code { background: #f0f0f0; padding: 2px 6px; border-radius: 3px; font-size: 13px; }
+pre { background: #f8f8f8; border: 1px solid #ddd; border-radius: 6px; padding: 12px; overflow-x: auto; margin: 12px 0; }
+pre code { background: none; padding: 0; }
+a { color: #0066cc; }
+.back { display: inline-block; margin-bottom: 20px; color: #666; }
+.back:hover { color: #333; }
+</style>
+</head>
+<body>
+<div class="container">
+<a class="back" href="index.html">&larr; Back to index</a>
+<!-- module: process -->
+<!-- description: Processing pipeline — trigger, probe, progress, jobs -->
+<!-- depends: 01_auth, 03_register -->
+
+<h2>Processing Pipeline</h2>
+<h3><code>POST /api/v1/file/:file_uuid/process</code></h3>
+<p><strong>Auth</strong>: Required<br />
+<strong>Scope</strong>: file-level</p>
+<p>Trigger the processing pipeline for a registered file. Creates a monitor job that the worker picks up and processes sequentially. Returns immediately with the job info—processing runs asynchronously in the background.</p>
+<h4>Request Parameters</h4>
+<table class="table">
+<thead>
+<tr>
+<th>Field</th>
+<th>Type</th>
+<th>Required</th>
+<th>Default</th>
+<th>Description</th>
+</tr>
+</thead>
+<tbody>
+<tr>
+<td><code>processors</code></td>
+<td>string[]</td>
+<td>No</td>
+<td>all</td>
+<td>Specific processors to run: <code>["cut","asr","asrx","yolo","ocr","face","pose","visual_chunk","story","5w1h"]</code></td>
+</tr>
+<tr>
+<td><code>rules</code></td>
+<td>string[]</td>
+<td>No</td>
+<td>all</td>
+<td>Rule names to apply (currently unused)</td>
+</tr>
+</tbody>
+</table>
+<h4>Example</h4>
+<div class="codehilite"><pre><span></span><code><span class="c1"># Run all processors</span>
+curl<span class="w"> </span>-s<span class="w"> </span>-X<span class="w"> </span>POST<span class="w"> </span><span class="s2">&quot;</span><span class="nv">$API</span><span class="s2">/api/v1/file/</span><span class="nv">$FILE_UUID</span><span class="s2">/process&quot;</span><span class="w"> </span><span class="se">\</span>
+<span class="w">  </span>-H<span class="w"> </span><span class="s2">&quot;Content-Type: application/json&quot;</span><span class="w"> </span><span class="se">\</span>
+<span class="w">  </span>-H<span class="w"> </span><span class="s2">&quot;X-API-Key: </span><span class="nv">$KEY</span><span class="s2">&quot;</span><span class="w"> </span>-d<span class="w"> </span><span class="s1">&#39;{}&#39;</span>
+
+<span class="c1"># Run specific processors only</span>
+curl<span class="w"> </span>-s<span class="w"> </span>-X<span class="w"> </span>POST<span class="w"> </span><span class="s2">&quot;</span><span class="nv">$API</span><span class="s2">/api/v1/file/</span><span class="nv">$FILE_UUID</span><span class="s2">/process&quot;</span><span class="w"> </span><span class="se">\</span>
+<span class="w">  </span>-H<span class="w"> </span><span class="s2">&quot;Content-Type: application/json&quot;</span><span class="w"> </span><span class="se">\</span>
+<span class="w">  </span>-H<span class="w"> </span><span class="s2">&quot;X-API-Key: </span><span class="nv">$KEY</span><span class="s2">&quot;</span><span class="w"> </span><span class="se">\</span>
+<span class="w">  </span>-d<span class="w"> </span><span class="s1">&#39;{&quot;processors&quot;: [&quot;asr&quot;, &quot;face&quot;, &quot;yolo&quot;]}&#39;</span>
+</code></pre></div>
+
+<h4>Response (200)</h4>
+<div class="codehilite"><pre><span></span><code><span class="p">{</span>
+<span class="w">  </span><span class="nt">&quot;success&quot;</span><span class="p">:</span><span class="w"> </span><span class="kc">true</span><span class="p">,</span>
+<span class="w">  </span><span class="nt">&quot;job_id&quot;</span><span class="p">:</span><span class="w"> </span><span class="mi">42</span><span class="p">,</span>
+<span class="w">  </span><span class="nt">&quot;file_uuid&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;3a6c1865...&quot;</span><span class="p">,</span>
+<span class="w">  </span><span class="nt">&quot;status&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;processing&quot;</span><span class="p">,</span>
+<span class="w">  </span><span class="nt">&quot;pids&quot;</span><span class="p">:</span><span class="w"> </span><span class="p">[</span><span class="mi">12345</span><span class="p">,</span><span class="w"> </span><span class="mi">12346</span><span class="p">],</span>
+<span class="w">  </span><span class="nt">&quot;message&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;Processing triggered for video.mp4&quot;</span>
+<span class="p">}</span>
+</code></pre></div>
+
+<table class="table">
+<thead>
+<tr>
+<th>Field</th>
+<th>Type</th>
+<th>Description</th>
+</tr>
+</thead>
+<tbody>
+<tr>
+<td><code>success</code></td>
+<td>boolean</td>
+<td>Always true on 200</td>
+</tr>
+<tr>
+<td><code>job_id</code></td>
+<td>integer</td>
+<td>Monitor job ID (for job tracking)</td>
+</tr>
+<tr>
+<td><code>file_uuid</code></td>
+<td>string</td>
+<td>32-char hex UUID of the file</td>
+</tr>
+<tr>
+<td><code>status</code></td>
+<td>string</td>
+<td><code>"processing"</code></td>
+</tr>
+<tr>
+<td><code>pids</code></td>
+<td>integer[]</td>
+<td>Process IDs of started processors</td>
+</tr>
+<tr>
+<td><code>message</code></td>
+<td>string</td>
+<td>Human-readable status</td>
+</tr>
+</tbody>
+</table>
+<h4>Error Responses</h4>
+<table class="table">
+<thead>
+<tr>
+<th>HTTP</th>
+<th>When</th>
+</tr>
+</thead>
+<tbody>
+<tr>
+<td><code>404</code></td>
+<td>File UUID not found</td>
+</tr>
+<tr>
+<td><code>401</code></td>
+<td>Missing or invalid API key</td>
+</tr>
+</tbody>
+</table>
+<hr />
+<h3><code>GET /api/v1/file/:file_uuid/probe</code></h3>
+<p><strong>Auth</strong>: Required<br />
+<strong>Scope</strong>: file-level</p>
+<p>Get ffprobe metadata for a registered file. Returns video/audio stream info, codec details, duration, resolution, and frame rate.</p>
+<h4>Example</h4>
+<div class="codehilite"><pre><span></span><code>curl<span class="w"> </span>-s<span class="w"> </span><span class="s2">&quot;</span><span class="nv">$API</span><span class="s2">/api/v1/file/</span><span class="nv">$FILE_UUID</span><span class="s2">/probe&quot;</span><span class="w"> </span>-H<span class="w"> </span><span class="s2">&quot;X-API-Key: </span><span class="nv">$KEY</span><span class="s2">&quot;</span>
+</code></pre></div>
+
+<h4>Response (200)</h4>
+<div class="codehilite"><pre><span></span><code><span class="p">{</span>
+<span class="w">  </span><span class="nt">&quot;file_uuid&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;3a6c1865...&quot;</span><span class="p">,</span>
+<span class="w">  </span><span class="nt">&quot;file_name&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;video.mp4&quot;</span><span class="p">,</span>
+<span class="w">  </span><span class="nt">&quot;file_size&quot;</span><span class="p">:</span><span class="w"> </span><span class="mi">12345678</span><span class="p">,</span>
+<span class="w">  </span><span class="nt">&quot;duration&quot;</span><span class="p">:</span><span class="w"> </span><span class="mf">120.5</span><span class="p">,</span>
+<span class="w">  </span><span class="nt">&quot;width&quot;</span><span class="p">:</span><span class="w"> </span><span class="mi">1920</span><span class="p">,</span>
+<span class="w">  </span><span class="nt">&quot;height&quot;</span><span class="p">:</span><span class="w"> </span><span class="mi">1080</span><span class="p">,</span>
+<span class="w">  </span><span class="nt">&quot;fps&quot;</span><span class="p">:</span><span class="w"> </span><span class="mf">24.0</span><span class="p">,</span>
+<span class="w">  </span><span class="nt">&quot;total_frames&quot;</span><span class="p">:</span><span class="w"> </span><span class="mi">2892</span><span class="p">,</span>
+<span class="w">  </span><span class="nt">&quot;cached&quot;</span><span class="p">:</span><span class="w"> </span><span class="kc">true</span><span class="p">,</span>
+<span class="w">  </span><span class="nt">&quot;format&quot;</span><span class="p">:</span><span class="w"> </span><span class="p">{</span>
+<span class="w">    </span><span class="nt">&quot;filename&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;/path/to/video.mp4&quot;</span><span class="p">,</span>
+<span class="w">    </span><span class="nt">&quot;format_name&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;mov,mp4,m4a,3gp&quot;</span><span class="p">,</span>
+<span class="w">    </span><span class="nt">&quot;duration&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;120.5&quot;</span><span class="p">,</span>
+<span class="w">    </span><span class="nt">&quot;size&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;12345678&quot;</span><span class="p">,</span>
+<span class="w">    </span><span class="nt">&quot;bit_rate&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;819200&quot;</span>
+<span class="w">  </span><span class="p">},</span>
+<span class="w">  </span><span class="nt">&quot;streams&quot;</span><span class="p">:</span><span class="w"> </span><span class="p">[</span>
+<span class="w">    </span><span class="p">{</span>
+<span class="w">      </span><span class="nt">&quot;index&quot;</span><span class="p">:</span><span class="w"> </span><span class="mi">0</span><span class="p">,</span>
+<span class="w">      </span><span class="nt">&quot;codec_name&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;h264&quot;</span><span class="p">,</span>
+<span class="w">      </span><span class="nt">&quot;codec_type&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;video&quot;</span><span class="p">,</span>
+<span class="w">      </span><span class="nt">&quot;width&quot;</span><span class="p">:</span><span class="w"> </span><span class="mi">1920</span><span class="p">,</span>
+<span class="w">      </span><span class="nt">&quot;height&quot;</span><span class="p">:</span><span class="w"> </span><span class="mi">1080</span><span class="p">,</span>
+<span class="w">      </span><span class="nt">&quot;r_frame_rate&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;24/1&quot;</span><span class="p">,</span>
+<span class="w">      </span><span class="nt">&quot;duration&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;120.5&quot;</span>
+<span class="w">    </span><span class="p">}</span>
+<span class="w">  </span><span class="p">]</span>
+<span class="p">}</span>
+</code></pre></div>
+
+<table class="table">
+<thead>
+<tr>
+<th>Field</th>
+<th>Type</th>
+<th>Description</th>
+</tr>
+</thead>
+<tbody>
+<tr>
+<td><code>file_uuid</code></td>
+<td>string</td>
+<td>32-char hex UUID</td>
+</tr>
+<tr>
+<td><code>file_name</code></td>
+<td>string</td>
+<td>File name</td>
+</tr>
+<tr>
+<td><code>file_size</code></td>
+<td>integer</td>
+<td>File size in bytes (from filesystem)</td>
+</tr>
+<tr>
+<td><code>duration</code></td>
+<td>float</td>
+<td>Duration in seconds</td>
+</tr>
+<tr>
+<td><code>width</code></td>
+<td>integer</td>
+<td>Video width in pixels</td>
+</tr>
+<tr>
+<td><code>height</code></td>
+<td>integer</td>
+<td>Video height in pixels</td>
+</tr>
+<tr>
+<td><code>fps</code></td>
+<td>float</td>
+<td>Frames per second</td>
+</tr>
+<tr>
+<td><code>total_frames</code></td>
+<td>integer</td>
+<td>Estimated total frames</td>
+</tr>
+<tr>
+<td><code>cached</code></td>
+<td>boolean</td>
+<td>True if the result was served from cached probe JSON</td>
+</tr>
+<tr>
+<td><code>format</code></td>
+<td>object</td>
+<td>Container format info (ffprobe format section)</td>
+</tr>
+<tr>
+<td><code>streams</code></td>
+<td>array</td>
+<td>Array of stream info objects</td>
+</tr>
+</tbody>
+</table>
+<hr />
+<h3><code>GET /api/v1/progress/:file_uuid</code></h3>
+<p><strong>Auth</strong>: Required<br />
+<strong>Scope</strong>: file-level</p>
+<p>Get real-time processing progress for a file via Redis pub/sub. Includes per-processor status, current/total frames, ETA, and system resource stats.</p>
+<h4>Pipeline Order</h4>
+<table class="table">
+<thead>
+<tr>
+<th>Order</th>
+<th>Processor</th>
+<th>Dependencies</th>
+<th>Description</th>
+</tr>
+</thead>
+<tbody>
+<tr>
+<td>1</td>
+<td><code>cut</code></td>
+<td>—</td>
+<td>Scene detection</td>
+</tr>
+<tr>
+<td>2</td>
+<td><code>asr</code></td>
+<td>cut</td>
+<td>Speech-to-text (per scene)</td>
+</tr>
+<tr>
+<td>3</td>
+<td><code>asrx</code></td>
+<td>asr</td>
+<td>Speaker diarization</td>
+</tr>
+<tr>
+<td>4</td>
+<td><code>yolo</code></td>
+<td>—</td>
+<td>Object detection</td>
+</tr>
+<tr>
+<td>5</td>
+<td><code>ocr</code></td>
+<td>—</td>
+<td>Text recognition</td>
+</tr>
+<tr>
+<td>6</td>
+<td><code>face</code></td>
+<td>—</td>
+<td>Face detection &amp; embedding</td>
+</tr>
+<tr>
+<td>7</td>
+<td><code>pose</code></td>
+<td>—</td>
+<td>Pose estimation</td>
+</tr>
+<tr>
+<td>8</td>
+<td><code>visual_chunk</code></td>
+<td>yolo</td>
+<td>Visual scene chunks</td>
+</tr>
+<tr>
+<td>9</td>
+<td><code>story</code></td>
+<td>asr, asrx, cut, yolo, face</td>
+<td>Scene summaries (template)</td>
+</tr>
+<tr>
+<td>10</td>
+<td><code>5w1h</code></td>
+<td>story</td>
+<td>5W1H analysis (Gemma4 LLM)</td>
+</tr>
+</tbody>
+</table>
+<p>All processors except <code>story</code> and <code>5w1h</code> run concurrently when their dependencies are met. Story and 5W1H run sequentially after their prerequisites.</p>
+<h4>Example</h4>
+<div class="codehilite"><pre><span></span><code>curl<span class="w"> </span>-s<span class="w"> </span><span class="s2">&quot;</span><span class="nv">$API</span><span class="s2">/api/v1/progress/</span><span class="nv">$FILE_UUID</span><span class="s2">&quot;</span><span class="w"> </span>-H<span class="w"> </span><span class="s2">&quot;X-API-Key: </span><span class="nv">$KEY</span><span class="s2">&quot;</span><span class="w"> </span><span class="p">|</span><span class="w"> </span>jq<span class="w"> </span><span class="s1">&#39;{overall_progress, processors: [.processors[] | {processor_type, status}]}&#39;</span>
+</code></pre></div>
+
+<h4>Response (200)</h4>
+<div class="codehilite"><pre><span></span><code><span class="p">{</span>
+<span class="w">  </span><span class="nt">&quot;file_uuid&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;3a6c1865...&quot;</span><span class="p">,</span>
+<span class="w">  </span><span class="nt">&quot;overall_progress&quot;</span><span class="p">:</span><span class="w"> </span><span class="mi">71</span><span class="p">,</span>
+<span class="w">  </span><span class="nt">&quot;cpu_percent&quot;</span><span class="p">:</span><span class="w"> </span><span class="mf">45.2</span><span class="p">,</span>
+<span class="w">  </span><span class="nt">&quot;gpu_percent&quot;</span><span class="p">:</span><span class="w"> </span><span class="mf">30.1</span><span class="p">,</span>
+<span class="w">  </span><span class="nt">&quot;memory_percent&quot;</span><span class="p">:</span><span class="w"> </span><span class="mf">62.4</span><span class="p">,</span>
+<span class="w">  </span><span class="nt">&quot;processors&quot;</span><span class="p">:</span><span class="w"> </span><span class="p">[</span>
+<span class="w">    </span><span class="p">{</span><span class="nt">&quot;processor_type&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;asr&quot;</span><span class="p">,</span><span class="w"> </span><span class="nt">&quot;status&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;complete&quot;</span><span class="p">,</span><span class="w"> </span><span class="nt">&quot;progress&quot;</span><span class="p">:</span><span class="w"> </span><span class="mi">100</span><span class="p">},</span>
+<span class="w">    </span><span class="p">{</span><span class="nt">&quot;processor_type&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;yolo&quot;</span><span class="p">,</span><span class="w"> </span><span class="nt">&quot;status&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;running&quot;</span><span class="p">,</span><span class="w"> </span><span class="nt">&quot;progress&quot;</span><span class="p">:</span><span class="w"> </span><span class="mi">65</span><span class="p">},</span>
+<span class="w">    </span><span class="p">{</span><span class="nt">&quot;processor_type&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;face&quot;</span><span class="p">,</span><span class="w"> </span><span class="nt">&quot;status&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;pending&quot;</span><span class="p">,</span><span class="w"> </span><span class="nt">&quot;progress&quot;</span><span class="p">:</span><span class="w"> </span><span class="mi">0</span><span class="p">}</span>
+<span class="w">  </span><span class="p">]</span>
+<span class="p">}</span>
+</code></pre></div>
+
+<table class="table">
+<thead>
+<tr>
+<th>Field</th>
+<th>Type</th>
+<th>Description</th>
+</tr>
+</thead>
+<tbody>
+<tr>
+<td><code>file_uuid</code></td>
+<td>string</td>
+<td>32-char hex UUID</td>
+</tr>
+<tr>
+<td><code>overall_progress</code></td>
+<td>integer</td>
+<td>Overall progress percentage (0–100)</td>
+</tr>
+<tr>
+<td><code>processors</code></td>
+<td>array</td>
+<td>Per-processor status list</td>
+</tr>
+<tr>
+<td><code>processors[].processor_type</code></td>
+<td>string</td>
+<td>Processor name (<code>asr</code>, <code>cut</code>, <code>yolo</code>, etc.)</td>
+</tr>
+<tr>
+<td><code>processors[].status</code></td>
+<td>string</td>
+<td><code>"pending"</code>, <code>"running"</code>, <code>"complete"</code>, or <code>"failed"</code></td>
+</tr>
+<tr>
+<td><code>processors[].progress</code></td>
+<td>integer</td>
+<td>Per-processor progress (0–100)</td>
+</tr>
+<tr>
+<td><code>processors[].eta_seconds</code></td>
+<td>integer</td>
+<td>Estimated seconds remaining (running processors only)</td>
+</tr>
+<tr>
+<td><code>processors[].current</code></td>
+<td>integer</td>
+<td>Current frame count</td>
+</tr>
+<tr>
+<td><code>processors[].total</code></td>
+<td>integer</td>
+<td>Total frame count</td>
+</tr>
+<tr>
+<td><code>cpu_percent</code></td>
+<td>float</td>
+<td>Current CPU usage</td>
+</tr>
+<tr>
+<td><code>gpu_percent</code></td>
+<td>float</td>
+<td>Current GPU utilization</td>
+</tr>
+<tr>
+<td><code>memory_percent</code></td>
+<td>float</td>
+<td>Current memory usage</td>
+</tr>
+</tbody>
+</table>
+<hr />
+<h3><code>GET /api/v1/jobs</code></h3>
+<p><strong>Auth</strong>: Required<br />
+<strong>Scope</strong>: system-level</p>
+<p>List all processing jobs (monitor jobs) in the system. Shows job status, which file each job is processing, and current processor info.</p>
+<h4>Example</h4>
+<div class="codehilite"><pre><span></span><code>curl<span class="w"> </span>-s<span class="w"> </span><span class="s2">&quot;</span><span class="nv">$API</span><span class="s2">/api/v1/jobs&quot;</span><span class="w"> </span>-H<span class="w"> </span><span class="s2">&quot;X-API-Key: </span><span class="nv">$KEY</span><span class="s2">&quot;</span><span class="w"> </span><span class="p">|</span><span class="w"> </span>jq<span class="w"> </span><span class="s1">&#39;{count, jobs: [.jobs[] | {uuid, status}]}&#39;</span>
+</code></pre></div>
+
+<h4>Response (200)</h4>
+<div class="codehilite"><pre><span></span><code><span class="p">{</span>
+<span class="w">  </span><span class="nt">&quot;jobs&quot;</span><span class="p">:</span><span class="w"> </span><span class="p">[</span>
+<span class="w">    </span><span class="p">{</span>
+<span class="w">      </span><span class="nt">&quot;id&quot;</span><span class="p">:</span><span class="w"> </span><span class="mi">42</span><span class="p">,</span>
+<span class="w">      </span><span class="nt">&quot;uuid&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;3a6c1865...&quot;</span><span class="p">,</span>
+<span class="w">      </span><span class="nt">&quot;status&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;running&quot;</span><span class="p">,</span>
+<span class="w">      </span><span class="nt">&quot;current_processor&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;yolo&quot;</span><span class="p">,</span>
+<span class="w">      </span><span class="nt">&quot;created_at&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;2026-05-16T12:00:00Z&quot;</span><span class="p">,</span>
+<span class="w">      </span><span class="nt">&quot;started_at&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;2026-05-16T12:01:00Z&quot;</span>
+<span class="w">    </span><span class="p">}</span>
+<span class="w">  </span><span class="p">],</span>
+<span class="w">  </span><span class="nt">&quot;count&quot;</span><span class="p">:</span><span class="w"> </span><span class="mi">15</span><span class="p">,</span>
+<span class="w">  </span><span class="nt">&quot;page&quot;</span><span class="p">:</span><span class="w"> </span><span class="mi">1</span><span class="p">,</span>
+<span class="w">  </span><span class="nt">&quot;page_size&quot;</span><span class="p">:</span><span class="w"> </span><span class="mi">20</span>
+<span class="p">}</span>
+</code></pre></div>
+
+<table class="table">
+<thead>
+<tr>
+<th>Field</th>
+<th>Type</th>
+<th>Description</th>
+</tr>
+</thead>
+<tbody>
+<tr>
+<td><code>jobs</code></td>
+<td>array</td>
+<td>Array of job info objects</td>
+</tr>
+<tr>
+<td><code>jobs[].id</code></td>
+<td>integer</td>
+<td>Job ID</td>
+</tr>
+<tr>
+<td><code>jobs[].uuid</code></td>
+<td>string</td>
+<td>File UUID being processed</td>
+</tr>
+<tr>
+<td><code>jobs[].status</code></td>
+<td>string</td>
+<td><code>"pending"</code>, <code>"running"</code>, <code>"completed"</code>, or <code>"failed"</code></td>
+</tr>
+<tr>
+<td><code>jobs[].current_processor</code></td>
+<td>string</td>
+<td>Currently active processor, or null</td>
+</tr>
+<tr>
+<td><code>count</code></td>
+<td>integer</td>
+<td>Total job count</td>
+</tr>
+<tr>
+<td><code>page</code></td>
+<td>integer</td>
+<td>Current page number</td>
+</tr>
+<tr>
+<td><code>page_size</code></td>
+<td>integer</td>
+<td>Jobs per page</td>
+</tr>
+</tbody>
+</table>
+</div>
+</body>
+</html>
\ No newline at end of file
diff --git a/deliverable_v1.1.0/html_docs/doc/06_search.html b/deliverable_v1.1.0/html_docs/doc/06_search.html
new file mode 100644
index 0000000..8f62e1a
--- /dev/null
+++ b/deliverable_v1.1.0/html_docs/doc/06_search.html
@@ -0,0 +1,280 @@
+<!DOCTYPE html>
+<html lang="en">
+<head>
+<meta charset="UTF-8">
+<title>06 Search - Momentry API Docs</title>
+<style>
+* { margin: 0; padding: 0; box-sizing: border-box; }
+body { font-family: -apple-system, BlinkMacSystemFont, 'Segoe UI', Roboto, sans-serif; background: #f5f5f5; color: #333; padding: 40px; }
+.container { max-width: 960px; margin: 0 auto; background: white; border-radius: 12px; box-shadow: 0 2px 12px rgba(0,0,0,0.08); padding: 40px; }
+h1 { font-size: 24px; margin: 24px 0 12px; }
+h2 { font-size: 20px; margin: 20px 0 10px; color: #222; }
+h3 { font-size: 16px; margin: 16px 0 8px; color: #444; }
+p { line-height: 1.6; margin: 8px 0; }
+table { border-collapse: collapse; width: 100%; margin: 12px 0; font-size: 14px; }
+th, td { border: 1px solid #ddd; padding: 8px 12px; text-align: left; }
+th { background: #f0f0f0; font-weight: 600; }
+code { background: #f0f0f0; padding: 2px 6px; border-radius: 3px; font-size: 13px; }
+pre { background: #f8f8f8; border: 1px solid #ddd; border-radius: 6px; padding: 12px; overflow-x: auto; margin: 12px 0; }
+pre code { background: none; padding: 0; }
+a { color: #0066cc; }
+.back { display: inline-block; margin-bottom: 20px; color: #666; }
+.back:hover { color: #333; }
+</style>
+</head>
+<body>
+<div class="container">
+<a class="back" href="index.html">&larr; Back to index</a>
+<!-- module: search -->
+<!-- description: Vector search, BM25, smart search, universal search, visual search -->
+<!-- depends: 01_auth -->
+
+<h2>Search APIs</h2>
+<h3><code>POST /api/v1/search/smart</code></h3>
+<p><strong>Auth</strong>: Required<br />
+<strong>Scope</strong>: file-level</p>
+<p>Semantic vector search using EmbeddingGemma-300m. Generates a query embedding via EmbeddingGemma (port 11436), then searches pgvector <code>story_parent</code> and <code>llm_parent</code> chunks by cosine similarity.</p>
+<h4>Request Parameters</h4>
+<table class="table">
+<thead>
+<tr>
+<th>Field</th>
+<th>Type</th>
+<th>Required</th>
+<th>Default</th>
+<th>Description</th>
+</tr>
+</thead>
+<tbody>
+<tr>
+<td><code>file_uuid</code></td>
+<td>string</td>
+<td>Yes</td>
+<td>—</td>
+<td>File UUID to search within</td>
+</tr>
+<tr>
+<td><code>query</code></td>
+<td>string</td>
+<td>Yes</td>
+<td>—</td>
+<td>Search text</td>
+</tr>
+<tr>
+<td><code>limit</code></td>
+<td>integer</td>
+<td>No</td>
+<td>5</td>
+<td>Max results to return</td>
+</tr>
+<tr>
+<td><code>page</code></td>
+<td>integer</td>
+<td>No</td>
+<td>1</td>
+<td>Page number</td>
+</tr>
+<tr>
+<td><code>page_size</code></td>
+<td>integer</td>
+<td>No</td>
+<td>5</td>
+<td>Items per page</td>
+</tr>
+</tbody>
+</table>
+<h4>Example</h4>
+<div class="codehilite"><pre><span></span><code>curl<span class="w"> </span>-s<span class="w"> </span>-X<span class="w"> </span>POST<span class="w"> </span><span class="s2">&quot;</span><span class="nv">$API</span><span class="s2">/api/v1/search/smart&quot;</span><span class="w"> </span><span class="se">\</span>
+<span class="w">  </span>-H<span class="w"> </span><span class="s2">&quot;Content-Type: application/json&quot;</span><span class="w"> </span><span class="se">\</span>
+<span class="w">  </span>-H<span class="w"> </span><span class="s2">&quot;Authorization: Bearer </span><span class="nv">$JWT</span><span class="s2">&quot;</span><span class="w"> </span><span class="se">\</span>
+<span class="w">  </span>-d<span class="w"> </span><span class="s1">&#39;{&quot;file_uuid&quot;: &quot;&#39;</span><span class="s2">&quot;</span><span class="nv">$FILE_UUID</span><span class="s2">&quot;</span><span class="s1">&#39;&quot;, &quot;query&quot;: &quot;Audrey Hepburn&quot;}&#39;</span>
+</code></pre></div>
+
+<h4>Response (200)</h4>
+<div class="codehilite"><pre><span></span><code><span class="p">{</span>
+<span class="w">  </span><span class="nt">&quot;query&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;Audrey Hepburn&quot;</span><span class="p">,</span>
+<span class="w">  </span><span class="nt">&quot;results&quot;</span><span class="p">:</span><span class="w"> </span><span class="p">[</span>
+<span class="w">    </span><span class="p">{</span>
+<span class="w">      </span><span class="nt">&quot;parent_id&quot;</span><span class="p">:</span><span class="w"> </span><span class="mi">1087822</span><span class="p">,</span>
+<span class="w">      </span><span class="nt">&quot;scene_order&quot;</span><span class="p">:</span><span class="w"> </span><span class="mi">1087822</span><span class="p">,</span>
+<span class="w">      </span><span class="nt">&quot;start_frame&quot;</span><span class="p">:</span><span class="w"> </span><span class="mi">104438</span><span class="p">,</span>
+<span class="w">      </span><span class="nt">&quot;end_frame&quot;</span><span class="p">:</span><span class="w"> </span><span class="mi">104538</span><span class="p">,</span>
+<span class="w">      </span><span class="nt">&quot;fps&quot;</span><span class="p">:</span><span class="w"> </span><span class="mf">24.0</span><span class="p">,</span>
+<span class="w">      </span><span class="nt">&quot;start_time&quot;</span><span class="p">:</span><span class="w"> </span><span class="mf">4351.6</span><span class="p">,</span>
+<span class="w">      </span><span class="nt">&quot;end_time&quot;</span><span class="p">:</span><span class="w"> </span><span class="mf">4355.76</span><span class="p">,</span>
+<span class="w">      </span><span class="nt">&quot;summary&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;[4352s-4356s, 4s] Cast: Audrey Hepburn. Total: 2 lines, 10 words. Speakers: Audrey Hepburn (2 lines)&quot;</span><span class="p">,</span>
+<span class="w">      </span><span class="nt">&quot;similarity&quot;</span><span class="p">:</span><span class="w"> </span><span class="mf">0.67</span>
+<span class="w">    </span><span class="p">}</span>
+<span class="w">  </span><span class="p">],</span>
+<span class="w">  </span><span class="nt">&quot;page&quot;</span><span class="p">:</span><span class="w"> </span><span class="mi">1</span><span class="p">,</span>
+<span class="w">  </span><span class="nt">&quot;page_size&quot;</span><span class="p">:</span><span class="w"> </span><span class="mi">5</span><span class="p">,</span>
+<span class="w">  </span><span class="nt">&quot;strategy&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;semantic_vector_search&quot;</span>
+<span class="p">}</span>
+</code></pre></div>
+
+<hr />
+<h3><code>POST /api/v1/search/universal</code></h3>
+<p><strong>Auth</strong>: Required<br />
+<strong>Scope</strong>: file-level</p>
+<p>Multi-type BM25 full-text search across chunks, frames, and persons. Uses PostgreSQL <code>tsvector</code>.</p>
+<h4>Request Parameters</h4>
+<table class="table">
+<thead>
+<tr>
+<th>Field</th>
+<th>Type</th>
+<th>Required</th>
+<th>Default</th>
+<th>Description</th>
+</tr>
+</thead>
+<tbody>
+<tr>
+<td><code>query</code></td>
+<td>string</td>
+<td>Yes</td>
+<td>—</td>
+<td>Search text</td>
+</tr>
+<tr>
+<td><code>file_uuid</code></td>
+<td>string</td>
+<td>No</td>
+<td>—</td>
+<td>Restrict to specific file</td>
+</tr>
+<tr>
+<td><code>types</code></td>
+<td>string[]</td>
+<td>No</td>
+<td><code>["chunk","frame","person"]</code></td>
+<td>Search types</td>
+</tr>
+<tr>
+<td><code>limit</code></td>
+<td>integer</td>
+<td>No</td>
+<td>10</td>
+<td>Max results per type</td>
+</tr>
+<tr>
+<td><code>page</code></td>
+<td>integer</td>
+<td>No</td>
+<td>1</td>
+<td>Page number</td>
+</tr>
+<tr>
+<td><code>page_size</code></td>
+<td>integer</td>
+<td>No</td>
+<td>20</td>
+<td>Items per page</td>
+</tr>
+</tbody>
+</table>
+<h4>Example</h4>
+<div class="codehilite"><pre><span></span><code>curl<span class="w"> </span>-s<span class="w"> </span>-X<span class="w"> </span>POST<span class="w"> </span><span class="s2">&quot;</span><span class="nv">$API</span><span class="s2">/api/v1/search/universal&quot;</span><span class="w"> </span><span class="se">\</span>
+<span class="w">  </span>-H<span class="w"> </span><span class="s2">&quot;Content-Type: application/json&quot;</span><span class="w"> </span><span class="se">\</span>
+<span class="w">  </span>-H<span class="w"> </span><span class="s2">&quot;Authorization: Bearer </span><span class="nv">$JWT</span><span class="s2">&quot;</span><span class="w"> </span><span class="se">\</span>
+<span class="w">  </span>-d<span class="w"> </span><span class="s1">&#39;{&quot;file_uuid&quot;: &quot;&#39;</span><span class="s2">&quot;</span><span class="nv">$FILE_UUID</span><span class="s2">&quot;</span><span class="s1">&#39;&quot;, &quot;query&quot;: &quot;Cary Grant&quot;}&#39;</span>
+</code></pre></div>
+
+<h4>Response (200)</h4>
+<div class="codehilite"><pre><span></span><code><span class="p">{</span>
+<span class="w">  </span><span class="nt">&quot;results&quot;</span><span class="p">:</span><span class="w"> </span><span class="p">[</span>
+<span class="w">    </span><span class="p">{</span>
+<span class="w">      </span><span class="nt">&quot;type&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;chunk&quot;</span><span class="p">,</span>
+<span class="w">      </span><span class="nt">&quot;chunk_id&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;bd80fec92b0b6963d177a2c55bf713e2_2&quot;</span><span class="p">,</span>
+<span class="w">      </span><span class="nt">&quot;chunk_type&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;story_child&quot;</span><span class="p">,</span>
+<span class="w">      </span><span class="nt">&quot;start_frame&quot;</span><span class="p">:</span><span class="w"> </span><span class="mi">5103</span><span class="p">,</span>
+<span class="w">      </span><span class="nt">&quot;end_frame&quot;</span><span class="p">:</span><span class="w"> </span><span class="mi">5127</span><span class="p">,</span>
+<span class="w">      </span><span class="nt">&quot;start_time&quot;</span><span class="p">:</span><span class="w"> </span><span class="mf">212.64</span><span class="p">,</span>
+<span class="w">      </span><span class="nt">&quot;end_time&quot;</span><span class="p">:</span><span class="w"> </span><span class="mf">213.64</span><span class="p">,</span>
+<span class="w">      </span><span class="nt">&quot;text&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;[213s-214s] Cary Grant: \&quot;Olá!\&quot;&quot;</span><span class="p">,</span>
+<span class="w">      </span><span class="nt">&quot;score&quot;</span><span class="p">:</span><span class="w"> </span><span class="mf">0.9</span>
+<span class="w">    </span><span class="p">}</span>
+<span class="w">  </span><span class="p">],</span>
+<span class="w">  </span><span class="nt">&quot;total&quot;</span><span class="p">:</span><span class="w"> </span><span class="mi">20</span><span class="p">,</span>
+<span class="w">  </span><span class="nt">&quot;took_ms&quot;</span><span class="p">:</span><span class="w"> </span><span class="mi">18</span>
+<span class="p">}</span>
+</code></pre></div>
+
+<hr />
+<h3><code>POST /api/v1/search/frames</code></h3>
+<p><strong>Auth</strong>: Required<br />
+<strong>Scope</strong>: file-level</p>
+<p>Search face detection frames by identity name or trace ID.</p>
+<hr />
+<h3><code>POST /api/v1/search/identity_text</code></h3>
+<p><strong>Auth</strong>: Required<br />
+<strong>Scope</strong>: file-level</p>
+<p>Search text chunks spoken by a specific identity.</p>
+<hr />
+<h3>Visual Search</h3>
+<table class="table">
+<thead>
+<tr>
+<th>Method</th>
+<th>Endpoint</th>
+<th>Description</th>
+</tr>
+</thead>
+<tbody>
+<tr>
+<td>POST</td>
+<td><code>/api/v1/search/visual</code></td>
+<td>Search visual chunks</td>
+</tr>
+<tr>
+<td>POST</td>
+<td><code>/api/v1/search/visual/class</code></td>
+<td>Search by object class</td>
+</tr>
+<tr>
+<td>POST</td>
+<td><code>/api/v1/search/visual/density</code></td>
+<td>Search by object density</td>
+</tr>
+<tr>
+<td>POST</td>
+<td><code>/api/v1/search/visual/combination</code></td>
+<td>Search by object combination</td>
+</tr>
+<tr>
+<td>POST</td>
+<td><code>/api/v1/search/visual/stats</code></td>
+<td>Visual chunk statistics</td>
+</tr>
+</tbody>
+</table>
+<h4>Embedding Model</h4>
+<table class="table">
+<thead>
+<tr>
+<th>Detail</th>
+<th>Value</th>
+</tr>
+</thead>
+<tbody>
+<tr>
+<td><strong>Model</strong></td>
+<td>EmbeddingGemma-300m</td>
+</tr>
+<tr>
+<td><strong>Endpoint</strong></td>
+<td><code>POST /api/v1/embeddings</code> on port 11436</td>
+</tr>
+<tr>
+<td><strong>Dimension</strong></td>
+<td>768</td>
+</tr>
+<tr>
+<td><strong>Storage</strong></td>
+<td>pgvector (<code>chunk.embedding</code> column)</td>
+</tr>
+</tbody>
+</table>
+</div>
+</body>
+</html>
\ No newline at end of file
diff --git a/deliverable_v1.1.0/html_docs/doc/07_identity.html b/deliverable_v1.1.0/html_docs/doc/07_identity.html
new file mode 100644
index 0000000..cfeaaa4
--- /dev/null
+++ b/deliverable_v1.1.0/html_docs/doc/07_identity.html
@@ -0,0 +1,510 @@
+<!DOCTYPE html>
+<html lang="en">
+<head>
+<meta charset="UTF-8">
+<title>07 Identity - Momentry API Docs</title>
+<style>
+* { margin: 0; padding: 0; box-sizing: border-box; }
+body { font-family: -apple-system, BlinkMacSystemFont, 'Segoe UI', Roboto, sans-serif; background: #f5f5f5; color: #333; padding: 40px; }
+.container { max-width: 960px; margin: 0 auto; background: white; border-radius: 12px; box-shadow: 0 2px 12px rgba(0,0,0,0.08); padding: 40px; }
+h1 { font-size: 24px; margin: 24px 0 12px; }
+h2 { font-size: 20px; margin: 20px 0 10px; color: #222; }
+h3 { font-size: 16px; margin: 16px 0 8px; color: #444; }
+p { line-height: 1.6; margin: 8px 0; }
+table { border-collapse: collapse; width: 100%; margin: 12px 0; font-size: 14px; }
+th, td { border: 1px solid #ddd; padding: 8px 12px; text-align: left; }
+th { background: #f0f0f0; font-weight: 600; }
+code { background: #f0f0f0; padding: 2px 6px; border-radius: 3px; font-size: 13px; }
+pre { background: #f8f8f8; border: 1px solid #ddd; border-radius: 6px; padding: 12px; overflow-x: auto; margin: 12px 0; }
+pre code { background: none; padding: 0; }
+a { color: #0066cc; }
+.back { display: inline-block; margin-bottom: 20px; color: #666; }
+.back:hover { color: #333; }
+</style>
+</head>
+<body>
+<div class="container">
+<a class="back" href="index.html">&larr; Back to index</a>
+<!-- module: identity -->
+<!-- description: Global identities — CRUD, detail, files, faces, bind, unbind, search -->
+<!-- depends: 01_auth -->
+
+<h2>Global Identities</h2>
+<h3><code>GET /api/v1/identities</code></h3>
+<p><strong>Auth</strong>: Required<br />
+<strong>Scope</strong>: identity-level</p>
+<p>List all registered identities with pagination.</p>
+<h4>Example</h4>
+<div class="codehilite"><pre><span></span><code>curl<span class="w"> </span>-s<span class="w"> </span><span class="s2">&quot;</span><span class="nv">$API</span><span class="s2">/api/v1/identities?page=1&amp;page_size=20&quot;</span><span class="w"> </span>-H<span class="w"> </span><span class="s2">&quot;X-API-Key: </span><span class="nv">$KEY</span><span class="s2">&quot;</span><span class="w"> </span><span class="p">|</span><span class="w"> </span>jq<span class="w"> </span><span class="s1">&#39;{count, identities: [.identities[] | {name}]}&#39;</span>
+</code></pre></div>
+
+<hr />
+<h3><code>GET /api/v1/identity/:identity_uuid</code></h3>
+<p><strong>Auth</strong>: Required<br />
+<strong>Scope</strong>: identity-level</p>
+<p>Get detailed information for a specific identity, including metadata and TMDb references.</p>
+<h4>Example</h4>
+<div class="codehilite"><pre><span></span><code>curl<span class="w"> </span>-s<span class="w"> </span><span class="s2">&quot;</span><span class="nv">$API</span><span class="s2">/api/v1/identity/</span><span class="nv">$IDENTITY_UUID</span><span class="s2">&quot;</span><span class="w"> </span>-H<span class="w"> </span><span class="s2">&quot;X-API-Key: </span><span class="nv">$KEY</span><span class="s2">&quot;</span>
+</code></pre></div>
+
+<h4>Response (200)</h4>
+<div class="codehilite"><pre><span></span><code><span class="p">{</span>
+<span class="w">  </span><span class="nt">&quot;success&quot;</span><span class="p">:</span><span class="w"> </span><span class="kc">true</span><span class="p">,</span>
+<span class="w">  </span><span class="nt">&quot;identity_uuid&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;a9a901056d6b46ff92da0c3c1a57dff4&quot;</span><span class="p">,</span>
+<span class="w">  </span><span class="nt">&quot;name&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;Cary Grant&quot;</span><span class="p">,</span>
+<span class="w">  </span><span class="nt">&quot;identity_type&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;people&quot;</span><span class="p">,</span>
+<span class="w">  </span><span class="nt">&quot;source&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;tmdb&quot;</span><span class="p">,</span>
+<span class="w">  </span><span class="nt">&quot;status&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;confirmed&quot;</span><span class="p">,</span>
+<span class="w">  </span><span class="nt">&quot;tmdb_id&quot;</span><span class="p">:</span><span class="w"> </span><span class="mi">112</span><span class="p">,</span>
+<span class="w">  </span><span class="nt">&quot;tmdb_profile&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;{output}/identities/{identity_uuid}/profile.jpg&quot;</span><span class="p">,</span>
+<span class="w">  </span><span class="nt">&quot;metadata&quot;</span><span class="p">:</span><span class="w"> </span><span class="p">{},</span>
+<span class="w">  </span><span class="nt">&quot;reference_data&quot;</span><span class="p">:</span><span class="w"> </span><span class="p">{},</span>
+<span class="w">  </span><span class="nt">&quot;created_at&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;2026-05-16T12:00:00Z&quot;</span><span class="p">,</span>
+<span class="w">  </span><span class="nt">&quot;updated_at&quot;</span><span class="p">:</span><span class="w"> </span><span class="kc">null</span>
+<span class="p">}</span>
+</code></pre></div>
+
+<table class="table">
+<thead>
+<tr>
+<th>Field</th>
+<th>Type</th>
+<th>Description</th>
+</tr>
+</thead>
+<tbody>
+<tr>
+<td><code>identity_uuid</code></td>
+<td>string</td>
+<td>Identity identifier</td>
+</tr>
+<tr>
+<td><code>name</code></td>
+<td>string</td>
+<td>Identity name</td>
+</tr>
+<tr>
+<td><code>identity_type</code></td>
+<td>string</td>
+<td><code>"people"</code> or null</td>
+</tr>
+<tr>
+<td><code>source</code></td>
+<td>string</td>
+<td><code>.json</code>, <code>auto</code>, <code>tmdb</code>, <code>user_defined</code>, or <code>merged</code></td>
+</tr>
+<tr>
+<td><code>status</code></td>
+<td>string</td>
+<td><code>"confirmed"</code>, <code>"pending"</code>, or <code>"inactive"</code></td>
+</tr>
+<tr>
+<td><code>tmdb_id</code></td>
+<td>integer</td>
+<td>TMDb person ID (only if source = tmdb)</td>
+</tr>
+<tr>
+<td><code>tmdb_profile</code></td>
+<td>string</td>
+<td>Local profile image path (<code>{output}/identities/{identity_uuid}/profile.jpg</code>)</td>
+</tr>
+<tr>
+<td><code>metadata</code></td>
+<td>object</td>
+<td>Metadata JSON (tmdb_character, cast_order, etc.)</td>
+</tr>
+<tr>
+<td><code>created_at</code></td>
+<td>string</td>
+<td>Creation timestamp</td>
+</tr>
+</tbody>
+</table>
+<hr />
+<h3><code>DELETE /api/v1/identity/:identity_uuid</code></h3>
+<p><strong>Auth</strong>: Required<br />
+<strong>Scope</strong>: identity-level</p>
+<p>Delete an identity permanently.</p>
+<hr />
+<h3><code>GET /api/v1/identity/:identity_uuid/files</code></h3>
+<p><strong>Auth</strong>: Required<br />
+<strong>Scope</strong>: identity-level</p>
+<p>Get all files where this identity appears. Returns per-file summary including face count, confidence, and appearance time range.</p>
+<h4>Example</h4>
+<div class="codehilite"><pre><span></span><code>curl<span class="w"> </span>-s<span class="w"> </span><span class="s2">&quot;</span><span class="nv">$API</span><span class="s2">/api/v1/identity/</span><span class="nv">$IDENTITY_UUID</span><span class="s2">/files&quot;</span><span class="w"> </span>-H<span class="w"> </span><span class="s2">&quot;X-API-Key: </span><span class="nv">$KEY</span><span class="s2">&quot;</span>
+</code></pre></div>
+
+<hr />
+<h3><code>GET /api/v1/identity/:identity_uuid/faces</code></h3>
+<p><strong>Auth</strong>: Required<br />
+<strong>Scope</strong>: identity-level</p>
+<p>Get all face detection records associated with this identity.</p>
+<h4>Example</h4>
+<div class="codehilite"><pre><span></span><code>curl<span class="w"> </span>-s<span class="w"> </span><span class="s2">&quot;</span><span class="nv">$API</span><span class="s2">/api/v1/identity/</span><span class="nv">$IDENTITY_UUID</span><span class="s2">/faces&quot;</span><span class="w"> </span>-H<span class="w"> </span><span class="s2">&quot;X-API-Key: </span><span class="nv">$KEY</span><span class="s2">&quot;</span>
+</code></pre></div>
+
+<table class="table">
+<thead>
+<tr>
+<th>Field</th>
+<th>Type</th>
+<th>Description</th>
+</tr>
+</thead>
+<tbody>
+<tr>
+<td><code>file_uuid</code></td>
+<td>string</td>
+<td>File where face was detected</td>
+</tr>
+<tr>
+<td><code>frame_number</code></td>
+<td>integer</td>
+<td>Frame number of detection</td>
+</tr>
+<tr>
+<td><code>face_id</code></td>
+<td>string</td>
+<td>Face ID (format: <code>face_{frame_number}</code>)</td>
+</tr>
+<tr>
+<td><code>confidence</code></td>
+<td>float</td>
+<td>Detection confidence</td>
+</tr>
+</tbody>
+</table>
+<hr />
+<h3><code>GET /api/v1/identity/:identity_uuid/chunks</code></h3>
+<p><strong>Auth</strong>: Required<br />
+<strong>Scope</strong>: identity-level</p>
+<p>Get all text chunks (sentences) spoken while this identity's face was on screen. Useful for finding what a person said.</p>
+<h4>Example</h4>
+<div class="codehilite"><pre><span></span><code>curl<span class="w"> </span>-s<span class="w"> </span><span class="s2">&quot;</span><span class="nv">$API</span><span class="s2">/api/v1/identity/</span><span class="nv">$IDENTITY_UUID</span><span class="s2">/chunks&quot;</span><span class="w"> </span>-H<span class="w"> </span><span class="s2">&quot;X-API-Key: </span><span class="nv">$KEY</span><span class="s2">&quot;</span>
+</code></pre></div>
+
+<h4>Response (200)</h4>
+<div class="codehilite"><pre><span></span><code><span class="p">{</span>
+<span class="w">  </span><span class="nt">&quot;success&quot;</span><span class="p">:</span><span class="w"> </span><span class="kc">true</span><span class="p">,</span>
+<span class="w">  </span><span class="nt">&quot;identity_uuid&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;a9a901056d6b46ff92da0c3c1a57dff4&quot;</span><span class="p">,</span>
+<span class="w">  </span><span class="nt">&quot;data&quot;</span><span class="p">:</span><span class="w"> </span><span class="p">[</span>
+<span class="w">    </span><span class="p">{</span>
+<span class="w">      </span><span class="nt">&quot;id&quot;</span><span class="p">:</span><span class="w"> </span><span class="mi">0</span><span class="p">,</span>
+<span class="w">      </span><span class="nt">&quot;file_uuid&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;bd80fec92b0b6963d177a2c55bf713e2&quot;</span><span class="p">,</span>
+<span class="w">      </span><span class="nt">&quot;chunk_id&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;bd80fec92b0b6963d177a2c55bf713e2_2&quot;</span><span class="p">,</span>
+<span class="w">      </span><span class="nt">&quot;chunk_type&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;sentence&quot;</span><span class="p">,</span>
+<span class="w">      </span><span class="nt">&quot;start_frame&quot;</span><span class="p">:</span><span class="w"> </span><span class="mi">5103</span><span class="p">,</span>
+<span class="w">      </span><span class="nt">&quot;end_frame&quot;</span><span class="p">:</span><span class="w"> </span><span class="mi">5127</span><span class="p">,</span>
+<span class="w">      </span><span class="nt">&quot;fps&quot;</span><span class="p">:</span><span class="w"> </span><span class="mf">24.0</span><span class="p">,</span>
+<span class="w">      </span><span class="nt">&quot;start_time&quot;</span><span class="p">:</span><span class="w"> </span><span class="mf">212.64</span><span class="p">,</span>
+<span class="w">      </span><span class="nt">&quot;end_time&quot;</span><span class="p">:</span><span class="w"> </span><span class="mf">213.64</span><span class="p">,</span>
+<span class="w">      </span><span class="nt">&quot;text_content&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;[213s-214s] Cary Grant: \&quot;Olá!\&quot;&quot;</span>
+<span class="w">    </span><span class="p">}</span>
+<span class="w">  </span><span class="p">]</span>
+<span class="p">}</span>
+</code></pre></div>
+
+<table class="table">
+<thead>
+<tr>
+<th>Field</th>
+<th>Type</th>
+<th>Description</th>
+</tr>
+</thead>
+<tbody>
+<tr>
+<td><code>file_uuid</code></td>
+<td>string</td>
+<td>File identifier</td>
+</tr>
+<tr>
+<td><code>chunk_id</code></td>
+<td>string</td>
+<td>Sentence chunk identifier</td>
+</tr>
+<tr>
+<td><code>start_frame</code></td>
+<td>integer</td>
+<td>Frame-accurate start position</td>
+</tr>
+<tr>
+<td><code>end_frame</code></td>
+<td>integer</td>
+<td>Frame-accurate end position</td>
+</tr>
+<tr>
+<td><code>fps</code></td>
+<td>float</td>
+<td>Frames per second</td>
+</tr>
+<tr>
+<td><code>start_time</code></td>
+<td>float</td>
+<td>Start time in seconds</td>
+</tr>
+<tr>
+<td><code>end_time</code></td>
+<td>float</td>
+<td>End time in seconds</td>
+</tr>
+<tr>
+<td><code>text_content</code></td>
+<td>string</td>
+<td>Spoken text content</td>
+</tr>
+</tbody>
+</table>
+<hr />
+<h3><code>POST /api/v1/identity/:identity_uuid/bind</code></h3>
+<p><strong>Auth</strong>: Required
+<strong>Scope</strong>: identity-level</p>
+<p>Bind a face detection to an identity. Associates the face trace with the identity for future search and recognition.</p>
+<h4>Request Parameters</h4>
+<table class="table">
+<thead>
+<tr>
+<th>Field</th>
+<th>Type</th>
+<th>Required</th>
+<th>Description</th>
+</tr>
+</thead>
+<tbody>
+<tr>
+<td><code>file_uuid</code></td>
+<td>string</td>
+<td>Yes</td>
+<td>File where face is detected</td>
+</tr>
+<tr>
+<td><code>face_id</code></td>
+<td>string</td>
+<td>Yes</td>
+<td>Face ID (format: <code>{frame}_{idx}</code>)</td>
+</tr>
+</tbody>
+</table>
+<h4>Example</h4>
+<div class="codehilite"><pre><span></span><code>curl<span class="w"> </span>-s<span class="w"> </span>-X<span class="w"> </span>POST<span class="w"> </span><span class="s2">&quot;</span><span class="nv">$API</span><span class="s2">/api/v1/identity/</span><span class="nv">$IDENTITY_UUID</span><span class="s2">/bind&quot;</span><span class="w"> </span><span class="se">\</span>
+<span class="w">  </span>-H<span class="w"> </span><span class="s2">&quot;X-API-Key: </span><span class="nv">$KEY</span><span class="s2">&quot;</span><span class="w"> </span><span class="se">\</span>
+<span class="w">  </span>-H<span class="w"> </span><span class="s2">&quot;Content-Type: application/json&quot;</span><span class="w"> </span><span class="se">\</span>
+<span class="w">  </span>-d<span class="w"> </span><span class="s1">&#39;{&quot;file_uuid&quot;: &quot;&#39;</span><span class="s2">&quot;</span><span class="nv">$FILE_UUID</span><span class="s2">&quot;</span><span class="s1">&#39;&quot;, &quot;face_id&quot;: &quot;1_5&quot;}&#39;</span>
+</code></pre></div>
+
+<hr />
+<h3><code>POST /api/v1/identity/:identity_uuid/unbind</code></h3>
+<p><strong>Auth</strong>: Required
+<strong>Scope</strong>: identity-level</p>
+<p>Unbind a face detection from an identity. Removes the identity association from the face record.</p>
+<hr />
+<h3><code>GET /api/v1/identities/search</code></h3>
+<p><strong>Auth</strong>: Required
+<strong>Scope</strong>: identity-level</p>
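+<p>Search identities by name using a case-insensitive match (PostgreSQL <code>ILIKE</code>). Pass the search term in the <code>q</code> query parameter. Returns matching identity records.</p>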
+<h4>Example</h4>
+<div class="codehilite"><pre><span></span><code>curl<span class="w"> </span>-s<span class="w"> </span><span class="s2">&quot;</span><span class="nv">$API</span><span class="s2">/api/v1/identities/search?q=Cary&quot;</span><span class="w"> </span>-H<span class="w"> </span><span class="s2">&quot;X-API-Key: </span><span class="nv">$KEY</span><span class="s2">&quot;</span>
+</code></pre></div>
+
+<table class="table">
+<thead>
+<tr>
+<th>Field</th>
+<th>Type</th>
+<th>Description</th>
+</tr>
+</thead>
+<tbody>
+<tr>
+<td><code>name</code></td>
+<td>string</td>
+<td>Identity name</td>
+</tr>
+<tr>
+<td><code>source</code></td>
+<td>string</td>
+<td>Identity source</td>
+</tr>
+<tr>
+<td><code>tmdb_id</code></td>
+<td>integer</td>
+<td>TMDb ID (if source = tmdb)</td>
+</tr>
+<tr>
+<td><code>file_uuid</code></td>
+<td>string</td>
+<td>Associated file</td>
+</tr>
+</tbody>
+</table>
+<hr />
+<hr />
+<h3><code>POST /api/v1/identity/upload</code></h3>
+<p><strong>Auth</strong>: Required
+<strong>Scope</strong>: identity-level</p>
+<p>Upload an identity.json file to create or update an identity. Accepts the same format as the identity.json files stored on disk.</p>
+<p>If an identity with the same <code>name</code> already exists, it will be updated with the new values.</p>
+<h4>Request</h4>
+<p>The request body is an <code>IdentityFile</code> object:</p>
+<table class="table">
+<thead>
+<tr>
+<th>Field</th>
+<th>Type</th>
+<th>Required</th>
+<th>Description</th>
+</tr>
+</thead>
+<tbody>
+<tr>
+<td><code>identity_uuid</code></td>
+<td>string</td>
+<td>Yes</td>
+<td>Identity identifier</td>
+</tr>
+<tr>
+<td><code>name</code></td>
+<td>string</td>
+<td>Yes</td>
+<td>Identity display name</td>
+</tr>
+<tr>
+<td><code>identity_type</code></td>
+<td>string</td>
+<td>No</td>
+<td><code>"people"</code> or null</td>
+</tr>
+<tr>
+<td><code>source</code></td>
+<td>string</td>
+<td>No</td>
+<td><code>".json"</code>, <code>"auto"</code>, <code>"tmdb"</code>, <code>"user_defined"</code>, or <code>"merged"</code></td>
+</tr>
+<tr>
+<td><code>status</code></td>
+<td>string</td>
+<td>No</td>
+<td><code>"confirmed"</code>, <code>"pending"</code>, or <code>"inactive"</code></td>
+</tr>
+<tr>
+<td><code>tmdb_id</code></td>
+<td>integer</td>
+<td>No</td>
+<td>TMDb person ID</td>
+</tr>
+<tr>
+<td><code>tmdb_profile</code></td>
+<td>string</td>
+<td>No</td>
+<td>TMDb profile image URL</td>
+</tr>
+<tr>
+<td><code>metadata</code></td>
+<td>object</td>
+<td>No</td>
+<td>Arbitrary metadata JSON</td>
+</tr>
+<tr>
+<td><code>file_bindings</code></td>
+<td>array</td>
+<td>No</td>
+<td>Array of <code>{ file_uuid, trace_ids, face_count }</code> (informational)</td>
+</tr>
+</tbody>
+</table>
+<h4>Example</h4>
+<div class="codehilite"><pre><span></span><code>curl<span class="w"> </span>-s<span class="w"> </span>-X<span class="w"> </span>POST<span class="w"> </span><span class="s2">&quot;</span><span class="nv">$API</span><span class="s2">/api/v1/identity/upload&quot;</span><span class="w"> </span><span class="se">\</span>
+<span class="w">  </span>-H<span class="w"> </span><span class="s2">&quot;X-API-Key: </span><span class="nv">$KEY</span><span class="s2">&quot;</span><span class="w"> </span><span class="se">\</span>
+<span class="w">  </span>-H<span class="w"> </span><span class="s2">&quot;Content-Type: application/json&quot;</span><span class="w"> </span><span class="se">\</span>
+<span class="w">  </span>-d<span class="w"> </span><span class="s1">&#39;{</span>
+<span class="s1">    &quot;version&quot;: 1,</span>
+<span class="s1">    &quot;identity_uuid&quot;: &quot;a9a901056d6b46ff92da0c3c1a57dff4&quot;,</span>
+<span class="s1">    &quot;name&quot;: &quot;Cary Grant&quot;,</span>
+<span class="s1">    &quot;identity_type&quot;: &quot;people&quot;,</span>
+<span class="s1">    &quot;source&quot;: &quot;.json&quot;,</span>
+<span class="s1">    &quot;status&quot;: &quot;confirmed&quot;,</span>
+<span class="s1">    &quot;metadata&quot;: {},</span>
+<span class="s1">    &quot;file_bindings&quot;: []</span>
+<span class="s1">  }&#39;</span>
+</code></pre></div>
+
+<h4>Response (200)</h4>
+<div class="codehilite"><pre><span></span><code><span class="p">{</span>
+<span class="w">  </span><span class="nt">&quot;success&quot;</span><span class="p">:</span><span class="w"> </span><span class="kc">true</span><span class="p">,</span>
+<span class="w">  </span><span class="nt">&quot;identity_uuid&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;a9a901056d6b46ff92da0c3c1a57dff4&quot;</span><span class="p">,</span>
+<span class="w">  </span><span class="nt">&quot;name&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;Cary Grant&quot;</span><span class="p">,</span>
+<span class="w">  </span><span class="nt">&quot;message&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;Identity uploaded successfully&quot;</span>
+<span class="p">}</span>
+</code></pre></div>
+
+<hr />
+<hr />
+<h3><code>POST /api/v1/identity/:identity_uuid/profile-image</code></h3>
+<p><strong>Auth</strong>: Required
+<strong>Scope</strong>: identity-level</p>
+<p>Upload a profile image (JPEG or PNG) for an identity. The image is saved to <code>{output}/identities/{uuid}/profile.{ext}</code>.</p>
+<p>Uses <code>multipart/form-data</code> with field name <code>image</code>.</p>
+<h4>Example</h4>
+<div class="codehilite"><pre><span></span><code>curl<span class="w"> </span>-s<span class="w"> </span>-X<span class="w"> </span>POST<span class="w"> </span><span class="s2">&quot;</span><span class="nv">$API</span><span class="s2">/api/v1/identity/</span><span class="nv">$IDENTITY_UUID</span><span class="s2">/profile-image&quot;</span><span class="w"> </span><span class="se">\</span>
+<span class="w">  </span>-H<span class="w"> </span><span class="s2">&quot;X-API-Key: </span><span class="nv">$KEY</span><span class="s2">&quot;</span><span class="w"> </span><span class="se">\</span>
+<span class="w">  </span>-F<span class="w"> </span><span class="s2">&quot;image=@/path/to/photo.jpg&quot;</span>
+</code></pre></div>
+
+<h4>Response (200)</h4>
+<div class="codehilite"><pre><span></span><code><span class="p">{</span>
+<span class="w">  </span><span class="nt">&quot;success&quot;</span><span class="p">:</span><span class="w"> </span><span class="kc">true</span><span class="p">,</span>
+<span class="w">  </span><span class="nt">&quot;identity_uuid&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;a9a901056d6b46ff92da0c3c1a57dff4&quot;</span><span class="p">,</span>
+<span class="w">  </span><span class="nt">&quot;path&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;/path/to/output/identities/.../profile.jpg&quot;</span><span class="p">,</span>
+<span class="w">  </span><span class="nt">&quot;message&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;Profile image saved: profile.jpg&quot;</span>
+<span class="p">}</span>
+</code></pre></div>
+
+<h4>Error Responses</h4>
+<table class="table">
+<thead>
+<tr>
+<th>HTTP</th>
+<th>When</th>
+</tr>
+</thead>
+<tbody>
+<tr>
+<td><code>400</code></td>
+<td>Missing image field or unsupported format</td>
+</tr>
+<tr>
+<td><code>404</code></td>
+<td>Identity not found</td>
+</tr>
+<tr>
+<td><code>415</code></td>
+<td>Unsupported image type (use JPEG or PNG)</td>
+</tr>
+</tbody>
+</table>
+<hr />
+<h3><code>GET /api/v1/identity/:identity_uuid/profile-image</code></h3>
+<p><strong>Auth</strong>: Required
+<strong>Scope</strong>: identity-level</p>
+<p>Retrieve the profile image for an identity. Returns the raw image data with the appropriate <code>Content-Type</code> header.</p>
+<div class="codehilite"><pre><span></span><code>curl<span class="w"> </span>-s<span class="w"> </span><span class="s2">&quot;</span><span class="nv">$API</span><span class="s2">/api/v1/identity/</span><span class="nv">$IDENTITY_UUID</span><span class="s2">/profile-image&quot;</span><span class="w"> </span><span class="se">\</span>
+<span class="w">  </span>-H<span class="w"> </span><span class="s2">&quot;X-API-Key: </span><span class="nv">$KEY</span><span class="s2">&quot;</span><span class="w"> </span>-o<span class="w"> </span>profile.jpg
+</code></pre></div>
+
+<table class="table">
+<thead>
+<tr>
+<th>Response Header</th>
+<th>Value</th>
+</tr>
+</thead>
+<tbody>
+<tr>
+<td><code>content-type</code></td>
+<td><code>image/jpeg</code> or <code>image/png</code></td>
+</tr>
+</tbody>
+</table>
+</div>
+</body>
+</html>
\ No newline at end of file
diff --git a/deliverable_v1.1.0/html_docs/doc/08_identity_agent.html b/deliverable_v1.1.0/html_docs/doc/08_identity_agent.html
new file mode 100644
index 0000000..64a8bed
--- /dev/null
+++ b/deliverable_v1.1.0/html_docs/doc/08_identity_agent.html
@@ -0,0 +1,97 @@
+<!DOCTYPE html>
+<html lang="en">
+<head>
+<meta charset="UTF-8">
+<title>08 Identity Agent - Momentry API Docs</title>
+<style>
+* { margin: 0; padding: 0; box-sizing: border-box; }
+body { font-family: -apple-system, BlinkMacSystemFont, 'Segoe UI', Roboto, sans-serif; background: #f5f5f5; color: #333; padding: 40px; }
+.container { max-width: 960px; margin: 0 auto; background: white; border-radius: 12px; box-shadow: 0 2px 12px rgba(0,0,0,0.08); padding: 40px; }
+h1 { font-size: 24px; margin: 24px 0 12px; }
+h2 { font-size: 20px; margin: 20px 0 10px; color: #222; }
+h3 { font-size: 16px; margin: 16px 0 8px; color: #444; }
+p { line-height: 1.6; margin: 8px 0; }
+table { border-collapse: collapse; width: 100%; margin: 12px 0; font-size: 14px; }
+th, td { border: 1px solid #ddd; padding: 8px 12px; text-align: left; }
+th { background: #f0f0f0; font-weight: 600; }
+code { background: #f0f0f0; padding: 2px 6px; border-radius: 3px; font-size: 13px; }
+pre { background: #f8f8f8; border: 1px solid #ddd; border-radius: 6px; padding: 12px; overflow-x: auto; margin: 12px 0; }
+pre code { background: none; padding: 0; }
+a { color: #0066cc; }
+.back { display: inline-block; margin-bottom: 20px; color: #666; }
+.back:hover { color: #333; }
+</style>
+</head>
+<body>
+<div class="container">
+<a class="back" href="index.html">&larr; Back to index</a>
+<!-- module: identity_agent -->
+<!-- description: Identity agent — match from photo, match from trace -->
+<!-- depends: 01_auth, 07_identity -->
+
+<h2>Identity Agent</h2>
+<h3><code>POST /api/v1/agents/identity/match-from-photo</code></h3>
+<p><strong>Auth</strong>: Required
+<strong>Scope</strong>: file-level</p>
+<p>Upload a face photo to match against known identities. The server detects the face via InsightFace, extracts a 512-dimensional embedding via CoreML FaceNet, then searches pgvector for the closest identity.</p>
+<h4>Request</h4>
+<p><code>multipart/form-data</code> with field <code>image</code> (JPEG/PNG) and optional <code>file_uuid</code>.</p>
+<h4>Example</h4>
+<div class="codehilite"><pre><span></span><code>curl<span class="w"> </span>-s<span class="w"> </span>-X<span class="w"> </span>POST<span class="w"> </span><span class="s2">&quot;</span><span class="nv">$API</span><span class="s2">/api/v1/agents/identity/match-from-photo&quot;</span><span class="w"> </span><span class="se">\</span>
+<span class="w">  </span>-H<span class="w"> </span><span class="s2">&quot;Authorization: Bearer </span><span class="nv">$JWT</span><span class="s2">&quot;</span><span class="w"> </span><span class="se">\</span>
+<span class="w">  </span>-F<span class="w"> </span><span class="s2">&quot;image=@/path/to/face.jpg&quot;</span><span class="w"> </span><span class="se">\</span>
+<span class="w">  </span>-F<span class="w"> </span><span class="s2">&quot;file_uuid=</span><span class="nv">$FILE_UUID</span><span class="s2">&quot;</span>
+</code></pre></div>
+
+<h4>Response (200)</h4>
+<div class="codehilite"><pre><span></span><code><span class="p">{</span>
+<span class="w">  </span><span class="nt">&quot;success&quot;</span><span class="p">:</span><span class="w"> </span><span class="kc">true</span><span class="p">,</span>
+<span class="w">  </span><span class="nt">&quot;matches&quot;</span><span class="p">:</span><span class="w"> </span><span class="p">[</span>
+<span class="w">    </span><span class="p">{</span>
+<span class="w">      </span><span class="nt">&quot;identity_uuid&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;a9a90105...&quot;</span><span class="p">,</span>
+<span class="w">      </span><span class="nt">&quot;name&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;Cary Grant&quot;</span><span class="p">,</span>
+<span class="w">      </span><span class="nt">&quot;similarity&quot;</span><span class="p">:</span><span class="w"> </span><span class="mf">0.87</span>
+<span class="w">    </span><span class="p">}</span>
+<span class="w">  </span><span class="p">]</span>
+<span class="p">}</span>
+</code></pre></div>
+
+<hr />
+<h3><code>POST /api/v1/agents/identity/match-from-trace</code></h3>
+<p><strong>Auth</strong>: Required
+<strong>Scope</strong>: file-level</p>
+<p>Match a face trace (tracked face across frames) against known identities. Samples 3 angles from the trace, generates embeddings, and searches pgvector.</p>
+<h4>Request Parameters</h4>
+<table class="table">
+<thead>
+<tr>
+<th>Field</th>
+<th>Type</th>
+<th>Required</th>
+<th>Description</th>
+</tr>
+</thead>
+<tbody>
+<tr>
+<td><code>file_uuid</code></td>
+<td>string</td>
+<td>Yes</td>
+<td>File containing the trace</td>
+</tr>
+<tr>
+<td><code>trace_id</code></td>
+<td>integer</td>
+<td>Yes</td>
+<td>Face trace ID to match</td>
+</tr>
+</tbody>
+</table>
+<h4>Example</h4>
+<div class="codehilite"><pre><span></span><code>curl<span class="w"> </span>-s<span class="w"> </span>-X<span class="w"> </span>POST<span class="w"> </span><span class="s2">&quot;</span><span class="nv">$API</span><span class="s2">/api/v1/agents/identity/match-from-trace&quot;</span><span class="w"> </span><span class="se">\</span>
+<span class="w">  </span>-H<span class="w"> </span><span class="s2">&quot;Authorization: Bearer </span><span class="nv">$JWT</span><span class="s2">&quot;</span><span class="w"> </span><span class="se">\</span>
+<span class="w">  </span>-H<span class="w"> </span><span class="s2">&quot;Content-Type: application/json&quot;</span><span class="w"> </span><span class="se">\</span>
+<span class="w">  </span>-d<span class="w"> </span><span class="s1">&#39;{&quot;file_uuid&quot;: &quot;&#39;</span><span class="s2">&quot;</span><span class="nv">$FILE_UUID</span><span class="s2">&quot;</span><span class="s1">&#39;&quot;, &quot;trace_id&quot;: 10}&#39;</span>
+</code></pre></div>
+</div>
+</body>
+</html>
\ No newline at end of file
diff --git a/deliverable_v1.1.0/html_docs/doc/08_media.html b/deliverable_v1.1.0/html_docs/doc/08_media.html
new file mode 100644
index 0000000..fae655d
--- /dev/null
+++ b/deliverable_v1.1.0/html_docs/doc/08_media.html
@@ -0,0 +1,303 @@
+<!DOCTYPE html>
+<html lang="en">
+<head>
+<meta charset="UTF-8">
+<title>08 Media - Momentry API Docs</title>
+<style>
+* { margin: 0; padding: 0; box-sizing: border-box; }
+body { font-family: -apple-system, BlinkMacSystemFont, 'Segoe UI', Roboto, sans-serif; background: #f5f5f5; color: #333; padding: 40px; }
+.container { max-width: 960px; margin: 0 auto; background: white; border-radius: 12px; box-shadow: 0 2px 12px rgba(0,0,0,0.08); padding: 40px; }
+h1 { font-size: 24px; margin: 24px 0 12px; }
+h2 { font-size: 20px; margin: 20px 0 10px; color: #222; }
+h3 { font-size: 16px; margin: 16px 0 8px; color: #444; }
+p { line-height: 1.6; margin: 8px 0; }
+table { border-collapse: collapse; width: 100%; margin: 12px 0; font-size: 14px; }
+th, td { border: 1px solid #ddd; padding: 8px 12px; text-align: left; }
+th { background: #f0f0f0; font-weight: 600; }
+code { background: #f0f0f0; padding: 2px 6px; border-radius: 3px; font-size: 13px; }
+pre { background: #f8f8f8; border: 1px solid #ddd; border-radius: 6px; padding: 12px; overflow-x: auto; margin: 12px 0; }
+pre code { background: none; padding: 0; }
+a { color: #0066cc; }
+.back { display: inline-block; margin-bottom: 20px; color: #666; }
+.back:hover { color: #333; }
+</style>
+</head>
+<body>
+<div class="container">
+<a class="back" href="index.html">&larr; Back to index</a>
+<!-- module: media -->
+<!-- description: Video streaming & frame extraction -->
+<!-- depends: 01_auth -->
+
+<h2>Video Streaming &amp; Frame Extraction</h2>
+<p>All video streaming endpoints support the following common query parameters:</p>
+<table class="table">
+<thead>
+<tr>
+<th>Field</th>
+<th>Type</th>
+<th>Required</th>
+<th>Default</th>
+<th>Description</th>
+</tr>
+</thead>
+<tbody>
+<tr>
+<td><code>mode</code></td>
+<td>string</td>
+<td>No</td>
+<td><code>normal</code></td>
+<td><code>normal</code> or <code>debug</code> (draws detection overlays)</td>
+</tr>
+<tr>
+<td><code>audio</code></td>
+<td>string</td>
+<td>No</td>
+<td><code>on</code></td>
+<td><code>on</code> or <code>off</code></td>
+</tr>
+</tbody>
+</table>
+<hr />
+<h3><code>GET /api/v1/file/:file_uuid/video</code></h3>
+<p>Stream the full video file with range support for seeking.</p>
+<p><strong>Auth</strong>: Required
+<strong>Scope</strong>: file-level</p>
+<h4>Response</h4>
+<ul>
+<li><strong>200</strong>: Video stream (<code>Content-Type</code> based on file extension)</li>
+<li><strong>206</strong>: Partial content (range request)</li>
+<li>Supports <code>Range</code> header for seeking</li>
+</ul>
+<hr />
+<h3><code>GET /api/v1/file/:file_uuid/trace/:trace_id/video</code></h3>
+<p>Stream video with highlights for a specific face trace (follows a single person across frames with bounding box overlay).</p>
+<p><strong>Auth</strong>: Required
+<strong>Scope</strong>: file-level</p>
+<hr />
+<h3><code>GET /api/v1/file/:file_uuid/video/bbox</code></h3>
+<p>Stream video with bounding box overlay for all detected objects/faces.</p>
+<p><strong>Auth</strong>: Required
+<strong>Scope</strong>: file-level</p>
+<p>Uses a built-in 5×7 bitmap font renderer to draw labels directly on video frames via FFmpeg <code>drawtext</code> filter.</p>
+<hr />
+<h3><code>GET /api/v1/file/:file_uuid/thumbnail</code></h3>
+<p>Extract a single frame from a video as JPEG image. Uses FFmpeg <code>select</code> filter.</p>
+<p><strong>Auth</strong>: Required
+<strong>Scope</strong>: file-level</p>
+<h4>Query Parameters</h4>
+<table class="table">
+<thead>
+<tr>
+<th>Field</th>
+<th>Type</th>
+<th>Required</th>
+<th>Default</th>
+<th>Description</th>
+</tr>
+</thead>
+<tbody>
+<tr>
+<td><code>frame</code></td>
+<td>integer</td>
+<td>Yes</td>
+<td>—</td>
+<td>Zero-based frame number to extract</td>
+</tr>
+<tr>
+<td><code>x</code></td>
+<td>integer</td>
+<td>No</td>
+<td>—</td>
+<td>Crop start X (left edge). Requires <code>y</code>, <code>w</code>, <code>h</code>.</td>
+</tr>
+<tr>
+<td><code>y</code></td>
+<td>integer</td>
+<td>No</td>
+<td>—</td>
+<td>Crop start Y (top edge). Requires <code>x</code>, <code>w</code>, <code>h</code>.</td>
+</tr>
+<tr>
+<td><code>w</code></td>
+<td>integer</td>
+<td>No</td>
+<td>—</td>
+<td>Crop width in pixels. Requires <code>x</code>, <code>y</code>, <code>h</code>.</td>
+</tr>
+<tr>
+<td><code>h</code></td>
+<td>integer</td>
+<td>No</td>
+<td>—</td>
+<td>Crop height in pixels. Requires <code>x</code>, <code>y</code>, <code>w</code>.</td>
+</tr>
+</tbody>
+</table>
+<p>All four crop params (<code>x</code>, <code>y</code>, <code>w</code>, <code>h</code>) must be provided together or omitted.</p>
+<h4>Example</h4>
+<div class="codehilite"><pre><span></span><code><span class="c1"># Extract frame 1000 (full frame)</span>
+curl<span class="w"> </span>-s<span class="w"> </span><span class="s2">&quot;</span><span class="nv">$API</span><span class="s2">/api/v1/file/bd80fec92b0b6963d177a2c55bf713e2/thumbnail?frame=1000&quot;</span><span class="w"> </span><span class="se">\</span>
+<span class="w">  </span>-H<span class="w"> </span><span class="s2">&quot;Authorization: Bearer </span><span class="nv">$JWT</span><span class="s2">&quot;</span><span class="w"> </span>-o<span class="w"> </span>frame_1000.jpg
+
+<span class="c1"># Extract and crop face region (x=320, y=240, w=160, h=160)</span>
+curl<span class="w"> </span>-s<span class="w"> </span><span class="s2">&quot;</span><span class="nv">$API</span><span class="s2">/api/v1/file/bd80fec92b0b6963d177a2c55bf713e2/thumbnail?frame=1000&amp;x=320&amp;y=240&amp;w=160&amp;h=160&quot;</span><span class="w"> </span><span class="se">\</span>
+<span class="w">  </span>-H<span class="w"> </span><span class="s2">&quot;Authorization: Bearer </span><span class="nv">$JWT</span><span class="s2">&quot;</span><span class="w"> </span>-o<span class="w"> </span>face_crop.jpg
+</code></pre></div>
+
+<h4>Response</h4>
+<ul>
+<li><strong>200</strong>: <code>image/jpeg</code> binary data</li>
+<li><strong>404</strong>: File not found</li>
+<li><strong>500</strong>: FFmpeg error (e.g., frame number is beyond the last frame of the video)</li>
+</ul>
+<h3><code>GET /api/v1/file/:file_uuid/clip</code></h3>
+<p>Extract a video clip (time range) as MPEG-TS stream. Uses FFmpeg <code>-ss</code> fast seek.</p>
+<p><strong>Auth</strong>: Required
+<strong>Scope</strong>: file-level</p>
+<h4>Query Parameters</h4>
+<table class="table">
+<thead>
+<tr>
+<th>Field</th>
+<th>Type</th>
+<th>Required</th>
+<th>Default</th>
+<th>Description</th>
+</tr>
+</thead>
+<tbody>
+<tr>
+<td><code>start_frame</code></td>
+<td>integer</td>
+<td>No*</td>
+<td>—</td>
+<td>Start frame (zero-based). <strong>Frame-accurate</strong> — use this for precision.</td>
+</tr>
+<tr>
+<td><code>end_frame</code></td>
+<td>integer</td>
+<td>No*</td>
+<td>—</td>
+<td>End frame (zero-based, inclusive). Requires <code>start_frame</code>.</td>
+</tr>
+<tr>
+<td><code>start_time</code></td>
+<td>float</td>
+<td>No*</td>
+<td>—</td>
+<td>Start time in seconds. Approximate (FPS-dependent). Fallback if frames not given.</td>
+</tr>
+<tr>
+<td><code>end_time</code></td>
+<td>float</td>
+<td>No*</td>
+<td>—</td>
+<td>End time in seconds. Approximate (FPS-dependent). Fallback if frames not given.</td>
+</tr>
+<tr>
+<td><code>fps</code></td>
+<td>float</td>
+<td>No</td>
+<td>video FPS</td>
+<td>Override frames-per-second for frame↔time calculation. Defaults to video's detected FPS.</td>
+</tr>
+<tr>
+<td><code>mode</code></td>
+<td>string</td>
+<td>No</td>
+<td><code>normal</code></td>
+<td><code>normal</code> or <code>debug</code> (draws "CLIP" overlay)</td>
+</tr>
+<tr>
+<td><code>audio</code></td>
+<td>string</td>
+<td>No</td>
+<td><code>on</code></td>
+<td><code>on</code> or <code>off</code></td>
+</tr>
+</tbody>
+</table>
+<p>* Either (<code>start_frame</code>+<code>end_frame</code>) OR (<code>start_time</code>+<code>end_time</code>) must be provided.</p>
+<h4>Example</h4>
+<div class="codehilite"><pre><span></span><code><span class="c1"># Clip by frame range (primary)</span>
+curl<span class="w"> </span>-s<span class="w"> </span><span class="s2">&quot;</span><span class="nv">$API</span><span class="s2">/api/v1/file/bd80fec92b0b6963d177a2c55bf713e2/clip?start_frame=0&amp;end_frame=47&quot;</span><span class="w"> </span><span class="se">\</span>
+<span class="w">  </span>-H<span class="w"> </span><span class="s2">&quot;Authorization: Bearer </span><span class="nv">$JWT</span><span class="s2">&quot;</span><span class="w"> </span>-o<span class="w"> </span>clip.ts
+
+<span class="c1"># Clip by time range (fallback)</span>
+curl<span class="w"> </span>-s<span class="w"> </span><span class="s2">&quot;</span><span class="nv">$API</span><span class="s2">/api/v1/file/bd80fec92b0b6963d177a2c55bf713e2/clip?start_time=30&amp;end_time=45&quot;</span><span class="w"> </span><span class="se">\</span>
+<span class="w">  </span>-H<span class="w"> </span><span class="s2">&quot;Authorization: Bearer </span><span class="nv">$JWT</span><span class="s2">&quot;</span><span class="w"> </span>-o<span class="w"> </span>clip.ts
+</code></pre></div>
+
+<h4>Response</h4>
+<ul>
+<li><strong>200</strong>: <code>video/mp2t</code> MPEG-TS stream</li>
+<li><strong>400</strong>: Missing/invalid range parameters</li>
+<li><strong>404</strong>: File not found</li>
+<li><strong>500</strong>: FFmpeg error</li>
+</ul>
+<h4>Technical Notes</h4>
+<table class="table">
+<thead>
+<tr>
+<th>Detail</th>
+<th>Value</th>
+</tr>
+</thead>
+<tbody>
+<tr>
+<td><strong>Backend</strong></td>
+<td>FFmpeg (<code>ffmpeg-full</code>)</td>
+</tr>
+<tr>
+<td><strong>Seek</strong></td>
+<td><code>-ss</code> before <code>-i</code> (fast keyframe seek)</td>
+</tr>
+<tr>
+<td><strong>Format</strong></td>
+<td>MPEG-TS (<code>mpegts</code> muxer, pipe-safe)</td>
+</tr>
+<tr>
+<td><strong>Codec</strong></td>
+<td>H.264 + AAC</td>
+</tr>
+<tr>
+<td><strong>Cache</strong></td>
+<td><code>Cache-Control: public, max-age=86400</code> (24h)</td>
+</tr>
+</tbody>
+</table>
+<hr /><h4>Technical Notes (<code>GET /api/v1/file/:file_uuid/thumbnail</code>)</h4>
+<table class="table">
+<thead>
+<tr>
+<th>Detail</th>
+<th>Value</th>
+</tr>
+</thead>
+<tbody>
+<tr>
+<td><strong>Backend</strong></td>
+<td>FFmpeg (<code>ffmpeg-full</code>)</td>
+</tr>
+<tr>
+<td><strong>Filter</strong></td>
+<td><code>select=eq(n\,FRAME)</code> to select frame, optional <code>crop=W:H:X:Y</code></td>
+</tr>
+<tr>
+<td><strong>Output</strong></td>
+<td>Single JPEG via pipe (<code>image2pipe</code>, <code>mjpeg</code> codec)</td>
+</tr>
+<tr>
+<td><strong>Cache</strong></td>
+<td><code>Cache-Control: public, max-age=86400</code> (24h)</td>
+</tr>
+<tr>
+<td><strong>Frame number</strong></td>
+<td>Zero-based (<code>frame=0</code> = first frame of video)</td>
+</tr>
+</tbody>
+</table>
+</div>
+</body>
+</html>
\ No newline at end of file
diff --git a/deliverable_v1.1.0/html_docs/doc/09_tmdb.html b/deliverable_v1.1.0/html_docs/doc/09_tmdb.html
new file mode 100644
index 0000000..0f48d89
--- /dev/null
+++ b/deliverable_v1.1.0/html_docs/doc/09_tmdb.html
@@ -0,0 +1,123 @@
+<!DOCTYPE html>
+<html lang="en">
+<head>
+<meta charset="UTF-8">
+<title>09 TMDb - Momentry API Docs</title>
+<style>
+* { margin: 0; padding: 0; box-sizing: border-box; }
+body { font-family: -apple-system, BlinkMacSystemFont, 'Segoe UI', Roboto, sans-serif; background: #f5f5f5; color: #333; padding: 40px; }
+.container { max-width: 960px; margin: 0 auto; background: white; border-radius: 12px; box-shadow: 0 2px 12px rgba(0,0,0,0.08); padding: 40px; }
+h1 { font-size: 24px; margin: 24px 0 12px; }
+h2 { font-size: 20px; margin: 20px 0 10px; color: #222; }
+h3 { font-size: 16px; margin: 16px 0 8px; color: #444; }
+p { line-height: 1.6; margin: 8px 0; }
+table { border-collapse: collapse; width: 100%; margin: 12px 0; font-size: 14px; }
+th, td { border: 1px solid #ddd; padding: 8px 12px; text-align: left; }
+th { background: #f0f0f0; font-weight: 600; }
+code { background: #f0f0f0; padding: 2px 6px; border-radius: 3px; font-size: 13px; }
+pre { background: #f8f8f8; border: 1px solid #ddd; border-radius: 6px; padding: 12px; overflow-x: auto; margin: 12px 0; }
+pre code { background: none; padding: 0; }
+a { color: #0066cc; }
+.back { display: inline-block; margin-bottom: 20px; color: #666; }
+.back:hover { color: #333; }
+</style>
+</head>
+<body>
+<div class="container">
+<a class="back" href="index.html">&larr; Back to index</a>
+<!-- module: tmdb -->
+<!-- description: TMDb enrichment endpoints — prefetch, probe, resource, check -->
+<!-- depends: 01_auth, 03_register -->
+
+<h2>TMDb Enrichment</h2>
+<blockquote>
+<p><strong>Offline operation</strong>: TMDb prefetch now checks local identity files first (<code>identities/_index.json</code> + <code>*.tmdb.json</code>).
+If local files exist, no external API call is made. Internet is only needed for initial data seeding.</p>
+</blockquote>
+<h3>Overview</h3>
+<p>TMDb enrichment is an optional identity enrichment step that can be run after Pipeline face detection completes. The workflow is:</p>
+<ol>
+<li><strong>Prefetch</strong> (requires internet unless local identity files already exist): Download movie cast data from TMDb API → cache to <code>{file_uuid}.tmdb.json</code></li>
+<li><strong>Probe</strong>: Read local cache → create identities for <strong>all</strong> cast members (<code>source='tmdb'</code>) + save <code>identity.json</code> + download profile image to <code>{OUTPUT}/identities/{uuid}/profile.jpg</code></li>
+<li><strong>Match</strong>: The worker automatically matches video faces against TMDb identities when <code>MOMENTRY_TMDB_PROBE_ENABLED=true</code></li>
+</ol>
+<h3><code>POST /api/v1/agents/tmdb/prefetch</code></h3>
+<p><strong>Auth</strong>: Required<br />
+<strong>Scope</strong>: file-level</p>
+<p>Fetch TMDb cast data for a registered file and cache it locally. This is the only step that requires internet access, and only when no local identity files are available.</p>
+<h4>Request Parameters</h4>
+<table class="table">
+<thead>
+<tr>
+<th>Field</th>
+<th>Type</th>
+<th>Required</th>
+<th>Description</th>
+</tr>
+</thead>
+<tbody>
+<tr>
+<td><code>file_uuid</code></td>
+<td>string</td>
+<td>Yes</td>
+<td>File UUID to enrich</td>
+</tr>
+</tbody>
+</table>
+<h4>Example</h4>
+<div class="codehilite"><pre><span></span><code>curl<span class="w"> </span>-s<span class="w"> </span>-X<span class="w"> </span>POST<span class="w"> </span><span class="s2">&quot;</span><span class="nv">$API</span><span class="s2">/api/v1/agents/tmdb/prefetch&quot;</span><span class="w"> </span><span class="se">\</span>
+<span class="w">  </span>-H<span class="w"> </span><span class="s2">&quot;Content-Type: application/json&quot;</span><span class="w"> </span><span class="se">\</span>
+<span class="w">  </span>-H<span class="w"> </span><span class="s2">&quot;X-API-Key: </span><span class="nv">$KEY</span><span class="s2">&quot;</span><span class="w"> </span><span class="se">\</span>
+<span class="w">  </span>-d<span class="w"> </span><span class="s1">&#39;{&quot;file_uuid&quot;: &quot;&#39;</span><span class="s2">&quot;</span><span class="nv">$FILE_UUID</span><span class="s2">&quot;</span><span class="s1">&#39;&quot;}&#39;</span>
+</code></pre></div>
+
+<h4>Response (200)</h4>
+<div class="codehilite"><pre><span></span><code><span class="p">{</span><span class="nt">&quot;success&quot;</span><span class="p">:</span><span class="w"> </span><span class="kc">true</span><span class="p">,</span><span class="w"> </span><span class="nt">&quot;file_uuid&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;...&quot;</span><span class="p">,</span><span class="w"> </span><span class="nt">&quot;cache_path&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;/output/...tmdb.json&quot;</span><span class="p">}</span>
+</code></pre></div>
+
+<h3><code>POST /api/v1/file/:file_uuid/tmdb-probe</code></h3>
+<p><strong>Auth</strong>: Required<br />
+<strong>Scope</strong>: file-level</p>
+<p>Read local TMDb cache and create/update identities. Requires prefetch to have been run first.</p>
+<h4>Example</h4>
+<div class="codehilite"><pre><span></span><code>curl<span class="w"> </span>-s<span class="w"> </span>-X<span class="w"> </span>POST<span class="w"> </span><span class="s2">&quot;</span><span class="nv">$API</span><span class="s2">/api/v1/file/</span><span class="nv">$FILE_UUID</span><span class="s2">/tmdb-probe&quot;</span><span class="w"> </span><span class="se">\</span>
+<span class="w">  </span>-H<span class="w"> </span><span class="s2">&quot;X-API-Key: </span><span class="nv">$KEY</span><span class="s2">&quot;</span><span class="w"> </span><span class="p">|</span><span class="w"> </span>jq<span class="w"> </span><span class="s1">&#39;{identities_created, movie_title}&#39;</span>
+</code></pre></div>
+
+<h4>Response (200 — identities created)</h4>
+<div class="codehilite"><pre><span></span><code><span class="p">{</span><span class="nt">&quot;success&quot;</span><span class="p">:</span><span class="w"> </span><span class="kc">true</span><span class="p">,</span><span class="w"> </span><span class="nt">&quot;identities_created&quot;</span><span class="p">:</span><span class="w"> </span><span class="mi">15</span><span class="p">,</span><span class="w"> </span><span class="nt">&quot;movie_title&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;Charade&quot;</span><span class="p">}</span>
+</code></pre></div>
+
+<h4>Response (200 — no cache)</h4>
+<div class="codehilite"><pre><span></span><code><span class="p">{</span><span class="nt">&quot;success&quot;</span><span class="p">:</span><span class="w"> </span><span class="kc">false</span><span class="p">,</span><span class="w"> </span><span class="nt">&quot;message&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;No TMDb cache found. Run tmdb-prefetch first.&quot;</span><span class="p">}</span>
+</code></pre></div>
+
+<h3><code>GET /api/v1/resource/tmdb</code></h3>
+<p><strong>Auth</strong>: Required<br />
+<strong>Scope</strong>: system-level</p>
+<p>View TMDb resource status including configuration, identity counts, and cache file count.</p>
+<h4>Example</h4>
+<div class="codehilite"><pre><span></span><code>curl<span class="w"> </span>-s<span class="w"> </span><span class="s2">&quot;</span><span class="nv">$API</span><span class="s2">/api/v1/resource/tmdb&quot;</span><span class="w"> </span>-H<span class="w"> </span><span class="s2">&quot;X-API-Key: </span><span class="nv">$KEY</span><span class="s2">&quot;</span><span class="w"> </span><span class="se">\</span>
+<span class="w">  </span><span class="p">|</span><span class="w"> </span>jq<span class="w"> </span><span class="s1">&#39;{identities_seeded, cache_files}&#39;</span>
+</code></pre></div>
+
+<h3><code>POST /api/v1/resource/tmdb/check</code></h3>
+<p><strong>Auth</strong>: Required<br />
+<strong>Scope</strong>: system-level</p>
+<p>Ping the TMDb API to verify connectivity and measure latency.</p>
+<h4>Example</h4>
+<div class="codehilite"><pre><span></span><code>curl<span class="w"> </span>-s<span class="w"> </span>-X<span class="w"> </span>POST<span class="w"> </span><span class="s2">&quot;</span><span class="nv">$API</span><span class="s2">/api/v1/resource/tmdb/check&quot;</span><span class="w"> </span><span class="se">\</span>
+<span class="w">  </span>-H<span class="w"> </span><span class="s2">&quot;X-API-Key: </span><span class="nv">$KEY</span><span class="s2">&quot;</span><span class="w"> </span><span class="p">|</span><span class="w"> </span>jq<span class="w"> </span><span class="s1">&#39;{api_reachable, api_latency_ms}&#39;</span>
+</code></pre></div>
+
+<h4>Response</h4>
+<div class="codehilite"><pre><span></span><code><span class="p">{</span>
+<span class="w">  </span><span class="nt">&quot;api_key_configured&quot;</span><span class="p">:</span><span class="w"> </span><span class="kc">true</span><span class="p">,</span>
+<span class="w">  </span><span class="nt">&quot;enabled&quot;</span><span class="p">:</span><span class="w"> </span><span class="kc">false</span><span class="p">,</span>
+<span class="w">  </span><span class="nt">&quot;api_reachable&quot;</span><span class="p">:</span><span class="w"> </span><span class="kc">true</span><span class="p">,</span>
+<span class="w">  </span><span class="nt">&quot;api_latency_ms&quot;</span><span class="p">:</span><span class="w"> </span><span class="mi">120</span>
+<span class="p">}</span>
+</code></pre></div>
+</div>
+</body>
+</html>
\ No newline at end of file
diff --git a/deliverable_v1.1.0/html_docs/doc/10_pipeline.html b/deliverable_v1.1.0/html_docs/doc/10_pipeline.html
new file mode 100644
index 0000000..319e394
--- /dev/null
+++ b/deliverable_v1.1.0/html_docs/doc/10_pipeline.html
@@ -0,0 +1,364 @@
+<!DOCTYPE html>
+<html lang="en">
+<head>
+<meta charset="UTF-8">
+<title>10 Pipeline - Momentry API Docs</title>
+<style>
+* { margin: 0; padding: 0; box-sizing: border-box; }
+body { font-family: -apple-system, BlinkMacSystemFont, 'Segoe UI', Roboto, sans-serif; background: #f5f5f5; color: #333; padding: 40px; }
+.container { max-width: 960px; margin: 0 auto; background: white; border-radius: 12px; box-shadow: 0 2px 12px rgba(0,0,0,0.08); padding: 40px; }
+h1 { font-size: 24px; margin: 24px 0 12px; }
+h2 { font-size: 20px; margin: 20px 0 10px; color: #222; }
+h3 { font-size: 16px; margin: 16px 0 8px; color: #444; }
+p { line-height: 1.6; margin: 8px 0; }
+table { border-collapse: collapse; width: 100%; margin: 12px 0; font-size: 14px; }
+th, td { border: 1px solid #ddd; padding: 8px 12px; text-align: left; }
+th { background: #f0f0f0; font-weight: 600; }
+code { background: #f0f0f0; padding: 2px 6px; border-radius: 3px; font-size: 13px; }
+pre { background: #f8f8f8; border: 1px solid #ddd; border-radius: 6px; padding: 12px; overflow-x: auto; margin: 12px 0; }
+pre code { background: none; padding: 0; }
+a { color: #0066cc; }
+.back { display: inline-block; margin-bottom: 20px; color: #666; }
+.back:hover { color: #333; }
+</style>
+</head>
+<body>
+<div class="container">
+<a class="back" href="index.html">&larr; Back to index</a>
+<!-- module: pipeline -->
+<!-- description: Pipeline processors, ingestion status, stats endpoints -->
+<!-- depends: 01_auth -->
+
+<h2>Pipeline</h2>
+<h3>Dependency Graph</h3>
+<div class="codehilite"><pre><span></span><code><span class="n">flowchart</span><span class="w"> </span><span class="n">TB</span>
+<span class="w">    </span><span class="n">subgraph</span><span class="w"> </span><span class="n">Processors</span><span class="p">[</span><span class="s">&quot;10 Processors&quot;</span><span class="p">]</span>
+<span class="w">        </span><span class="n">Cut</span><span class="p">[</span><span class="n">Cut</span><span class="p">]</span><span class="w"> </span><span class="o">--&gt;</span><span class="w"> </span><span class="n">ASR</span><span class="p">[</span><span class="n">ASR</span><span class="p">]</span>
+<span class="w">        </span><span class="n">ASR</span><span class="w"> </span><span class="o">--&gt;</span><span class="w"> </span><span class="n">ASRX</span><span class="p">[</span><span class="n">ASRX</span><span class="p">]</span>
+<span class="w">        </span><span class="n">ASRX</span><span class="w"> </span><span class="o">--&gt;</span><span class="w"> </span><span class="n">Story</span><span class="p">[</span><span class="n">Story</span><span class="p">]</span>
+<span class="w">        </span><span class="n">Cut</span><span class="w"> </span><span class="o">--&gt;</span><span class="w"> </span><span class="n">Story</span>
+<span class="w">        </span><span class="n">YOLO</span><span class="p">[</span><span class="n">YOLO</span><span class="p">]</span><span class="w"> </span><span class="o">--&gt;</span><span class="w"> </span><span class="n">VisualChunk</span><span class="p">[</span><span class="n">VisualChunk</span><span class="p">]</span>
+<span class="w">        </span><span class="n">VisualChunk</span><span class="w"> </span><span class="o">--&gt;</span><span class="w"> </span><span class="n">Story</span>
+<span class="w">        </span><span class="n">Face</span><span class="p">[</span><span class="n">Face</span><span class="p">]</span><span class="w"> </span><span class="o">--&gt;</span><span class="w"> </span><span class="n">Story</span>
+<span class="w">        </span><span class="n">Story</span><span class="w"> </span><span class="o">--&gt;</span><span class="w"> </span><span class="n">FiveW1H</span><span class="p">[</span><span class="mi">5</span><span class="n">W1H</span><span class="p">]</span>
+<span class="w">        </span><span class="n">OCR</span><span class="p">[</span><span class="n">OCR</span><span class="p">]</span>
+<span class="w">        </span><span class="n">Pose</span><span class="p">[</span><span class="n">Pose</span><span class="p">]</span>
+<span class="w">    </span><span class="n">end</span>
+
+<span class="w">    </span><span class="n">subgraph</span><span class="w"> </span><span class="n">Ingestion</span><span class="p">[</span><span class="s">&quot;入庫 (Post-Processing)&quot;</span><span class="p">]</span>
+<span class="w">        </span><span class="n">ASR</span><span class="w"> </span><span class="o">--&gt;</span><span class="w"> </span><span class="n">Rule1</span><span class="p">[</span><span class="n">Rule</span><span class="w"> </span><span class="mi">1</span><span class="w"> </span><span class="n">Sentence</span><span class="p">]</span>
+<span class="w">        </span><span class="n">ASRX</span><span class="w"> </span><span class="o">--&gt;</span><span class="w"> </span><span class="n">Rule1</span>
+<span class="w">        </span><span class="n">Rule1</span><span class="w"> </span><span class="o">--&gt;</span><span class="w"> </span><span class="n">Vectorize</span><span class="p">[</span><span class="n">Auto</span><span class="o">-</span><span class="n">Vectorize</span><span class="p">]</span>
+<span class="w">        </span><span class="n">Rule1</span><span class="w"> </span><span class="o">--&gt;</span><span class="w"> </span><span class="n">Phase1</span><span class="p">[</span><span class="n">Phase</span><span class="w"> </span><span class="mi">1</span><span class="w"> </span><span class="n">Pack</span><span class="p">]</span>
+
+<span class="w">        </span><span class="n">Cut</span><span class="w"> </span><span class="o">--&gt;</span><span class="w"> </span><span class="n">Rule3</span><span class="p">[</span><span class="n">Rule</span><span class="w"> </span><span class="mi">3</span><span class="w"> </span><span class="n">Scene</span><span class="p">]</span>
+<span class="w">        </span><span class="n">ASR</span><span class="w"> </span><span class="o">--&gt;</span><span class="w"> </span><span class="n">Rule3</span>
+
+<span class="w">        </span><span class="n">Face</span><span class="w"> </span><span class="o">--&gt;</span><span class="w"> </span><span class="n">Trace</span><span class="p">[</span><span class="n">Face</span><span class="w"> </span><span class="n">Trace</span><span class="p">]</span>
+<span class="w">        </span><span class="n">Trace</span><span class="w"> </span><span class="o">--&gt;</span><span class="w"> </span><span class="n">Qdrant</span><span class="p">[</span><span class="n">Qdrant</span><span class="w"> </span><span class="n">Sync</span><span class="p">]</span>
+<span class="w">        </span><span class="n">Trace</span><span class="w"> </span><span class="o">--&gt;</span><span class="w"> </span><span class="n">TraceChunks</span><span class="p">[</span><span class="n">Trace</span><span class="w"> </span><span class="n">Chunks</span><span class="p">]</span>
+<span class="w">        </span><span class="n">Trace</span><span class="w"> </span><span class="o">--&gt;</span><span class="w"> </span><span class="n">TKG</span><span class="p">[</span><span class="n">TKG</span><span class="w"> </span><span class="n">Builder</span><span class="p">]</span>
+
+<span class="w">        </span><span class="n">Face</span><span class="w"> </span><span class="o">--&gt;</span><span class="w"> </span><span class="n">TMDbMatch</span><span class="p">[</span><span class="n">TMDb</span><span class="w"> </span><span class="n">Match</span><span class="p">]</span>
+<span class="w">        </span><span class="n">Face</span><span class="w"> </span><span class="o">--&gt;</span><span class="w"> </span><span class="n">SceneMeta</span><span class="p">[</span><span class="n">Scene</span><span class="w"> </span><span class="n">Metadata</span><span class="p">]</span>
+<span class="w">        </span><span class="n">YOLO</span><span class="w"> </span><span class="o">--&gt;</span><span class="w"> </span><span class="n">SceneMeta</span>
+<span class="w">        </span><span class="n">Face</span><span class="w"> </span><span class="o">--&gt;</span><span class="w"> </span><span class="n">IdentityAgent</span><span class="p">[</span><span class="n">Identity</span><span class="w"> </span><span class="n">Agent</span><span class="p">]</span>
+<span class="w">        </span><span class="n">ASRX</span><span class="w"> </span><span class="o">--&gt;</span><span class="w"> </span><span class="n">IdentityAgent</span>
+
+<span class="w">        </span><span class="n">Cut</span><span class="w"> </span><span class="o">--&gt;</span><span class="w"> </span><span class="n">Agent5W1H</span><span class="p">[</span><span class="mi">5</span><span class="n">W1H</span><span class="w"> </span><span class="n">Agent</span><span class="p">]</span>
+<span class="w">        </span><span class="n">ASR</span><span class="w"> </span><span class="o">--&gt;</span><span class="w"> </span><span class="n">Agent5W1H</span>
+<span class="w">        </span><span class="n">Agent5W1H</span><span class="w"> </span><span class="o">--&gt;</span><span class="w"> </span><span class="n">Phase2</span><span class="p">[</span><span class="n">Phase</span><span class="w"> </span><span class="mi">2</span><span class="w"> </span><span class="n">Pack</span><span class="p">]</span>
+<span class="w">    </span><span class="n">end</span>
+
+<span class="w">    </span><span class="n">style</span><span class="w"> </span><span class="n">Processors</span><span class="w"> </span><span class="n">fill</span><span class="o">:</span><span class="err">#</span><span class="mi">1</span><span class="n">a1a2e</span><span class="p">,</span><span class="n">stroke</span><span class="o">:</span><span class="err">#</span><span class="n">e94560</span>
+<span class="w">    </span><span class="n">style</span><span class="w"> </span><span class="n">Ingestion</span><span class="w"> </span><span class="n">fill</span><span class="o">:</span><span class="err">#</span><span class="mi">16213</span><span class="n">e</span><span class="p">,</span><span class="n">stroke</span><span class="o">:</span><span class="err">#</span><span class="mf">0f</span><span class="mi">3460</span>
+</code></pre></div>
+
+<h3>Pipeline Completion Flow</h3>
+<p>The pipeline is <strong>not complete</strong> until both the 10 processors AND the 入庫 (ingestion) steps have finished. The worker polls every 3 seconds and only marks the job as <code>completed</code> when all ingestion steps verify OK.</p>
+<div class="codehilite"><pre><span></span><code><span class="mf">10</span><span class="w"> </span><span class="n">processors</span><span class="w"> </span><span class="n">done</span>
+<span class="w">     </span><span class="err">↓</span><span class="w">  </span><span class="p">(</span><span class="n">job</span><span class="w"> </span><span class="n">status</span><span class="w"> </span><span class="n">stays</span><span class="w"> </span><span class="s">&quot;running&quot;</span><span class="p">)</span>
+<span class="n">Algorithm</span><span class="w"> </span><span class="mf">1</span><span class="w"> </span><span class="n">Trigger</span><span class="p">:</span><span class="w"> </span><span class="n">Rule</span><span class="w"> </span><span class="mf">1</span><span class="w"> </span><span class="o">+</span><span class="w"> </span><span class="n">Vectorize</span><span class="w"> </span><span class="o">+</span><span class="w"> </span><span class="n">Phase</span><span class="w"> </span><span class="mf">1</span><span class="w"> </span><span class="n">Pack</span>
+<span class="w">     </span><span class="err">↓</span><span class="w">  </span><span class="p">(</span><span class="n">job</span><span class="w"> </span><span class="kr">run</span><span class="n">s</span><span class="w"> </span><span class="n">in</span><span class="w"> </span><span class="n">parallel</span><span class="p">)</span>
+<span class="n">Algorithm</span><span class="w"> </span><span class="mf">2</span><span class="w"> </span><span class="n">Trigger</span><span class="p">:</span><span class="w"> </span><span class="n">Face</span><span class="w"> </span><span class="n">Trace</span><span class="w"> </span><span class="err">→</span><span class="w"> </span><span class="n">TKG</span><span class="p">,</span><span class="w"> </span><span class="n">Scene</span><span class="w"> </span><span class="n">Metadata</span><span class="p">,</span><span class="w"> </span><span class="n">Identity</span><span class="w"> </span><span class="n">Agent</span><span class="p">,</span><span class="w"> </span><span class="mf">5</span><span class="n">W1H</span><span class="w"> </span><span class="n">Agent</span>
+<span class="w">     </span><span class="err">↓</span><span class="w">  </span><span class="p">(</span><span class="n">poll</span><span class="w"> </span><span class="n">checks</span><span class="w"> </span><span class="n">every</span><span class="w"> </span><span class="mf">3</span><span class="n">s</span><span class="p">)</span>
+<span class="n">Ingestion</span><span class="w"> </span><span class="n">verification</span><span class="p">:</span><span class="w"> </span><span class="n">rule1</span><span class="w"> </span><span class="err">✓</span><span class="w"> </span><span class="n">vectorize</span><span class="w"> </span><span class="err">✓</span><span class="w"> </span><span class="n">rule3</span><span class="w"> </span><span class="err">✓</span><span class="w"> </span><span class="n">face_trace</span><span class="w"> </span><span class="err">✓</span><span class="w"> </span><span class="n">tkg</span><span class="w"> </span><span class="err">✓</span><span class="w"> </span><span class="n">scene_meta</span><span class="w"> </span><span class="err">✓</span><span class="w"> </span><span class="mf">5</span><span class="n">w1h</span><span class="w"> </span><span class="err">✓</span>
+<span class="w">     </span><span class="err">↓</span>
+<span class="n">job</span><span class="w"> </span><span class="n">status</span><span class="w"> </span><span class="o">=</span><span class="w"> </span><span class="s">&quot;completed&quot;</span>
+</code></pre></div>
+
+<h3>10 Processor Stages</h3>
+<table class="table">
+<thead>
+<tr>
+<th>#</th>
+<th>Processor</th>
+<th>Depends On</th>
+<th>Description</th>
+</tr>
+</thead>
+<tbody>
+<tr>
+<td>1</td>
+<td><code>Cut</code></td>
+<td>—</td>
+<td>Scene boundary detection (PySceneDetect)</td>
+</tr>
+<tr>
+<td>2</td>
+<td><code>ASR</code></td>
+<td>Cut</td>
+<td>Automatic speech recognition (faster-whisper)</td>
+</tr>
+<tr>
+<td>3</td>
+<td><code>ASRX</code></td>
+<td>ASR</td>
+<td>Speaker diarization + ASR refinement</td>
+</tr>
+<tr>
+<td>4</td>
+<td><code>YOLO</code></td>
+<td>—</td>
+<td>Object detection (YOLOv8)</td>
+</tr>
+<tr>
+<td>5</td>
+<td><code>OCR</code></td>
+<td>—</td>
+<td>Optical character recognition</td>
+</tr>
+<tr>
+<td>6</td>
+<td><code>Face</code></td>
+<td>—</td>
+<td>Face detection + recognition (InsightFace + CoreML)</td>
+</tr>
+<tr>
+<td>7</td>
+<td><code>Pose</code></td>
+<td>—</td>
+<td>Pose estimation</td>
+</tr>
+<tr>
+<td>8</td>
+<td><code>VisualChunk</code></td>
+<td>YOLO</td>
+<td>Visual object chunking</td>
+</tr>
+<tr>
+<td>9</td>
+<td><code>Story</code></td>
+<td>ASRX + Cut + YOLO + Face</td>
+<td>Narrative scene summarization (LLM, with embedding)</td>
+</tr>
+<tr>
+<td>10</td>
+<td><code>5W1H</code></td>
+<td>Story</td>
+<td>Who/What/When/Where/Why/How extraction (LLM, with embedding)</td>
+</tr>
+</tbody>
+</table>
+<h3>入庫 (Post-Processing / Ingestion)</h3>
+<p>These steps run after the 10 processors and are <strong>required for pipeline completion</strong>. The worker checks all of them before marking the job as done.</p>
+<table class="table">
+<thead>
+<tr>
+<th>#</th>
+<th>Step</th>
+<th>Triggers When</th>
+<th>Verification</th>
+</tr>
+</thead>
+<tbody>
+<tr>
+<td>1</td>
+<td><strong>Rule 1 Sentence Chunking</strong></td>
+<td>ASR + ASRX done</td>
+<td><code>chunk</code> table has rows with <code>chunk_type = 'sentence'</code></td>
+</tr>
+<tr>
+<td>2</td>
+<td><strong>Auto-Vectorize</strong></td>
+<td>Rule 1 done</td>
+<td><code>chunk.embedding</code> IS NOT NULL for sentence chunks</td>
+</tr>
+<tr>
+<td>3</td>
+<td><strong>Phase 1 Pack</strong></td>
+<td>Rule 1 done</td>
+<td><code>release_pack.py --phase 1</code> executed</td>
+</tr>
+<tr>
+<td>4</td>
+<td><strong>Rule 3 Scene Chunking</strong></td>
+<td>All 10 processors done + Cut + ASR</td>
+<td><code>chunk</code> table has rows with <code>chunk_type = 'cut'</code></td>
+</tr>
+<tr>
+<td>5</td>
+<td><strong>Face Trace</strong></td>
+<td>All 10 processors done + Face</td>
+<td><code>face_detections.trace_id</code> IS NOT NULL</td>
+</tr>
+<tr>
+<td>6</td>
+<td><strong>Qdrant Face Sync</strong></td>
+<td>Face Trace done</td>
+<td>Qdrant <code>face_embedding</code> collection populated</td>
+</tr>
+<tr>
+<td>7</td>
+<td><strong>Trace Chunks</strong></td>
+<td>Face Trace done</td>
+<td><code>chunk</code> table has rows with <code>chunk_type = 'trace'</code></td>
+</tr>
+<tr>
+<td>8</td>
+<td><strong>TKG Builder</strong></td>
+<td>Face Trace done</td>
+<td><code>tkg_nodes</code> + <code>tkg_edges</code> tables have rows</td>
+</tr>
+<tr>
+<td>9</td>
+<td><strong>TMDb Face Matching</strong></td>
+<td>TMDb enabled + Face done</td>
+<td><code>face_detections.identity_id</code> IS NOT NULL</td>
+</tr>
+<tr>
+<td>10</td>
+<td><strong>Heuristic Scene Metadata</strong></td>
+<td>Face + YOLO done</td>
+<td><code>{file_uuid}.scene_meta.json</code> exists on disk</td>
+</tr>
+<tr>
+<td>11</td>
+<td><strong>Identity Agent</strong></td>
+<td>Face + ASRX done</td>
+<td><code>identities</code> with <code>source = 'identity_agent'</code></td>
+</tr>
+<tr>
+<td>12</td>
+<td><strong>5W1H Agent</strong></td>
+<td>Cut + ASR done</td>
+<td><code>chunk.summary_text</code> IS NOT NULL for cut chunks</td>
+</tr>
+<tr>
+<td>13</td>
+<td><strong>Phase 2 Pack (Release Pack)</strong></td>
+<td>5W1H Agent done</td>
+<td><code>release_pack.py --phase 2</code> executed</td>
+</tr>
+</tbody>
+</table>
+<h3>Ingestion Status</h3>
+<p>Check real-time ingestion status for a file:</p>
+<div class="codehilite"><pre><span></span><code>curl<span class="w"> </span><span class="s2">&quot;</span><span class="nv">$API</span><span class="s2">/api/v1/stats/ingestion-status/{file_uuid}&quot;</span>
+</code></pre></div>
+
+<p>Returns per-step <code>done</code> / <code>pending</code> status with detail counts.</p>
+<h4>Example</h4>
+<div class="codehilite"><pre><span></span><code>curl<span class="w"> </span><span class="s2">&quot;http://localhost:3003/api/v1/stats/ingestion-status/bd80fec9c42afb0307eb28f22c64c76a&quot;</span><span class="w"> </span><span class="p">|</span><span class="w"> </span>jq<span class="w"> </span><span class="s1">&#39;.steps[] | {name, status, detail}&#39;</span>
+</code></pre></div>
+
+<h4>Response</h4>
+<div class="codehilite"><pre><span></span><code><span class="p">{</span>
+<span class="w">  </span><span class="nt">&quot;file_uuid&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;bd80fec9c42afb0307eb28f22c64c76a&quot;</span><span class="p">,</span>
+<span class="w">  </span><span class="nt">&quot;steps&quot;</span><span class="p">:</span><span class="w"> </span><span class="p">[</span>
+<span class="w">    </span><span class="p">{</span><span class="w"> </span><span class="nt">&quot;name&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;rule1_sentence&quot;</span><span class="p">,</span><span class="w"> </span><span class="nt">&quot;status&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;pending&quot;</span><span class="p">,</span><span class="w"> </span><span class="nt">&quot;detail&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;0 sentence chunks&quot;</span><span class="w"> </span><span class="p">},</span>
+<span class="w">    </span><span class="p">{</span><span class="w"> </span><span class="nt">&quot;name&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;auto_vectorize&quot;</span><span class="p">,</span><span class="w">  </span><span class="nt">&quot;status&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;pending&quot;</span><span class="p">,</span><span class="w"> </span><span class="nt">&quot;detail&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;0 embedded&quot;</span><span class="w"> </span><span class="p">},</span>
+<span class="w">    </span><span class="p">{</span><span class="w"> </span><span class="nt">&quot;name&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;rule3_scene&quot;</span><span class="p">,</span><span class="w">     </span><span class="nt">&quot;status&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;pending&quot;</span><span class="p">,</span><span class="w"> </span><span class="nt">&quot;detail&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;0 scene chunks&quot;</span><span class="w"> </span><span class="p">},</span>
+<span class="w">    </span><span class="p">{</span><span class="w"> </span><span class="nt">&quot;name&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;face_trace&quot;</span><span class="p">,</span><span class="w">      </span><span class="nt">&quot;status&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;pending&quot;</span><span class="p">,</span><span class="w"> </span><span class="nt">&quot;detail&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;0 traces&quot;</span><span class="w"> </span><span class="p">},</span>
+<span class="w">    </span><span class="p">{</span><span class="w"> </span><span class="nt">&quot;name&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;trace_chunks&quot;</span><span class="p">,</span><span class="w">    </span><span class="nt">&quot;status&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;pending&quot;</span><span class="p">,</span><span class="w"> </span><span class="nt">&quot;detail&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;0 trace chunks&quot;</span><span class="w"> </span><span class="p">},</span>
+<span class="w">    </span><span class="p">{</span><span class="w"> </span><span class="nt">&quot;name&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;tkg&quot;</span><span class="p">,</span><span class="w">             </span><span class="nt">&quot;status&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;pending&quot;</span><span class="p">,</span><span class="w"> </span><span class="nt">&quot;detail&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;0 nodes, 0 edges&quot;</span><span class="w"> </span><span class="p">},</span>
+<span class="w">    </span><span class="p">{</span><span class="w"> </span><span class="nt">&quot;name&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;identity_match&quot;</span><span class="p">,</span><span class="w">  </span><span class="nt">&quot;status&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;pending&quot;</span><span class="p">,</span><span class="w"> </span><span class="nt">&quot;detail&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;0 identities&quot;</span><span class="w"> </span><span class="p">},</span>
+<span class="w">    </span><span class="p">{</span><span class="w"> </span><span class="nt">&quot;name&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;scene_metadata&quot;</span><span class="p">,</span><span class="w">  </span><span class="nt">&quot;status&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;pending&quot;</span><span class="p">,</span><span class="w"> </span><span class="nt">&quot;detail&quot;</span><span class="p">:</span><span class="w"> </span><span class="kc">null</span><span class="w"> </span><span class="p">},</span>
+<span class="w">    </span><span class="p">{</span><span class="w"> </span><span class="nt">&quot;name&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;5w1h&quot;</span><span class="p">,</span><span class="w">            </span><span class="nt">&quot;status&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;pending&quot;</span><span class="p">,</span><span class="w"> </span><span class="nt">&quot;detail&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;0 scenes with 5W1H&quot;</span><span class="w"> </span><span class="p">}</span>
+<span class="w">  </span><span class="p">]</span>
+<span class="p">}</span>
+</code></pre></div>
+
+<h3>Stats Endpoints</h3>
+<table class="table">
+<thead>
+<tr>
+<th>Method</th>
+<th>Endpoint</th>
+<th>Auth</th>
+<th>Description</th>
+</tr>
+</thead>
+<tbody>
+<tr>
+<td>GET</td>
+<td><code>/api/v1/stats/sftpgo</code></td>
+<td>No</td>
+<td>SFTPGo service status</td>
+</tr>
+<tr>
+<td>GET</td>
+<td><code>/api/v1/stats/ingestion-status/:file_uuid</code></td>
+<td>No</td>
+<td>Per-file ingestion checklist</td>
+</tr>
+</tbody>
+</table>
+<h3>Configuration</h3>
+<h3><code>POST /api/v1/config/cache</code></h3>
+<p><strong>Auth</strong>: Required<br />
+<strong>Scope</strong>: system-level</p>
+<p>Toggle the Redis cache on or off.</p>
+<h4>Request Parameters</h4>
+<table class="table">
+<thead>
+<tr>
+<th>Field</th>
+<th>Type</th>
+<th>Required</th>
+<th>Description</th>
+</tr>
+</thead>
+<tbody>
+<tr>
+<td><code>enabled</code></td>
+<td>boolean</td>
+<td>Yes</td>
+<td><code>true</code> to enable, <code>false</code> to disable</td>
+</tr>
+</tbody>
+</table>
+<h4>Example</h4>
+<div class="codehilite"><pre><span></span><code>curl<span class="w"> </span>-s<span class="w"> </span>-X<span class="w"> </span>POST<span class="w"> </span><span class="s2">&quot;</span><span class="nv">$API</span><span class="s2">/api/v1/config/cache&quot;</span><span class="w"> </span><span class="se">\</span>
+<span class="w">  </span>-H<span class="w"> </span><span class="s2">&quot;Content-Type: application/json&quot;</span><span class="w"> </span><span class="se">\</span>
+<span class="w">  </span>-H<span class="w"> </span><span class="s2">&quot;X-API-Key: </span><span class="nv">$KEY</span><span class="s2">&quot;</span><span class="w"> </span><span class="se">\</span>
+<span class="w">  </span>-d<span class="w"> </span><span class="s1">&#39;{&quot;enabled&quot;: false}&#39;</span>
+</code></pre></div>
+
+<h3>Unmounted Routes</h3>
+<p>The following routes are defined in source code but are <strong>NOT</strong> currently mounted in the router:</p>
+<table class="table">
+<thead>
+<tr>
+<th>Endpoint</th>
+<th>Source file</th>
+</tr>
+</thead>
+<tbody>
+<tr>
+<td><code>/api/v1/search/persons</code></td>
+<td><code>universal_search.rs</code> (not mounted)</td>
+</tr>
+<tr>
+<td><code>/api/v1/who</code></td>
+<td><code>who.rs</code></td>
+</tr>
+<tr>
+<td><code>/api/v1/who/candidates</code></td>
+<td><code>who.rs</code></td>
+</tr>
+</tbody>
+</table>
+</div>
+</body>
+</html>
\ No newline at end of file
diff --git a/deliverable_v1.1.0/html_docs/doc/12_agent.html b/deliverable_v1.1.0/html_docs/doc/12_agent.html
new file mode 100644
index 0000000..79f83ee
--- /dev/null
+++ b/deliverable_v1.1.0/html_docs/doc/12_agent.html
@@ -0,0 +1,207 @@
+<!DOCTYPE html>
+<html lang="en">
+<head>
+<meta charset="UTF-8">
+<title>12 Agent - Momentry API Docs</title>
+<style>
+* { margin: 0; padding: 0; box-sizing: border-box; }
+body { font-family: -apple-system, BlinkMacSystemFont, 'Segoe UI', Roboto, sans-serif; background: #f5f5f5; color: #333; padding: 40px; }
+.container { max-width: 960px; margin: 0 auto; background: white; border-radius: 12px; box-shadow: 0 2px 12px rgba(0,0,0,0.08); padding: 40px; }
+h1 { font-size: 24px; margin: 24px 0 12px; }
+h2 { font-size: 20px; margin: 20px 0 10px; color: #222; }
+h3 { font-size: 16px; margin: 16px 0 8px; color: #444; }
+p { line-height: 1.6; margin: 8px 0; }
+table { border-collapse: collapse; width: 100%; margin: 12px 0; font-size: 14px; }
+th, td { border: 1px solid #ddd; padding: 8px 12px; text-align: left; }
+th { background: #f0f0f0; font-weight: 600; }
+code { background: #f0f0f0; padding: 2px 6px; border-radius: 3px; font-size: 13px; }
+pre { background: #f8f8f8; border: 1px solid #ddd; border-radius: 6px; padding: 12px; overflow-x: auto; margin: 12px 0; }
+pre code { background: none; padding: 0; }
+a { color: #0066cc; }
+.back { display: inline-block; margin-bottom: 20px; color: #666; }
+.back:hover { color: #333; }
+</style>
+</head>
+<body>
+<div class="container">
+<a class="back" href="index.html">&larr; Back to index</a>
+<h1>Agent Endpoints</h1>
+<p>Agent endpoints provide AI-powered capabilities including translation, identity analysis, and 5W1H extraction.</p>
+<h2>POST /api/v1/agents/translate</h2>
+<p>Translate text between languages using Gemma4 (llama.cpp, port 8082).</p>
+<h3>Request</h3>
+<div class="codehilite"><pre><span></span><code><span class="p">{</span>
+<span class="w">  </span><span class="nt">&quot;text&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;Hello, welcome to Momentry Core.&quot;</span><span class="p">,</span>
+<span class="w">  </span><span class="nt">&quot;target_language&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;Traditional Chinese&quot;</span><span class="p">,</span>
+<span class="w">  </span><span class="nt">&quot;source_language&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;English&quot;</span>
+<span class="p">}</span>
+</code></pre></div>
+
+<table class="table">
+<thead>
+<tr>
+<th>Field</th>
+<th>Type</th>
+<th>Required</th>
+<th>Description</th>
+</tr>
+</thead>
+<tbody>
+<tr>
+<td><code>text</code></td>
+<td>string</td>
+<td>✅</td>
+<td>Text to translate</td>
+</tr>
+<tr>
+<td><code>target_language</code></td>
+<td>string</td>
+<td>✅</td>
+<td>Target language name (e.g. "Traditional Chinese", "Japanese")</td>
+</tr>
+<tr>
+<td><code>source_language</code></td>
+<td>string</td>
+<td>❌</td>
+<td>Source language (default: "auto")</td>
+</tr>
+</tbody>
+</table>
+<h3>Response</h3>
+<div class="codehilite"><pre><span></span><code><span class="p">{</span>
+<span class="w">  </span><span class="nt">&quot;success&quot;</span><span class="p">:</span><span class="w"> </span><span class="kc">true</span><span class="p">,</span>
+<span class="w">  </span><span class="nt">&quot;translated_text&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;您好，歡迎使用 Momentry Core。&quot;</span><span class="p">,</span>
+<span class="w">  </span><span class="nt">&quot;source_language_detected&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;English&quot;</span><span class="p">,</span>
+<span class="w">  </span><span class="nt">&quot;model_used&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;google_gemma-4-26B-A4B-it-Q5_K_M.gguf&quot;</span>
+<span class="p">}</span>
+</code></pre></div>
+
+<h3>Supported Language Pairs (tested)</h3>
+<table class="table">
+<thead>
+<tr>
+<th>Source</th>
+<th>Target</th>
+<th>Quality</th>
+</tr>
+</thead>
+<tbody>
+<tr>
+<td>English</td>
+<td>Traditional Chinese</td>
+<td>✅</td>
+</tr>
+<tr>
+<td>English</td>
+<td>Japanese</td>
+<td>✅</td>
+</tr>
+<tr>
+<td>Chinese</td>
+<td>English</td>
+<td>✅</td>
+</tr>
+<tr>
+<td>English</td>
+<td>French</td>
+<td>✅</td>
+</tr>
+<tr>
+<td>Chinese</td>
+<td>Japanese</td>
+<td>✅</td>
+</tr>
+</tbody>
+</table>
+<h3>Model</h3>
+<ul>
+<li><strong>Model</strong>: Gemma4 26B (Q5_K_M)</li>
+<li><strong>Engine</strong>: llama.cpp at <code>localhost:8082</code></li>
+<li><strong>Endpoint</strong>: <code>/v1/chat/completions</code> (OpenAI-compatible)</li>
+<li><strong>Temperature</strong>: 0.1</li>
+<li><strong>Max tokens</strong>: 1024</li>
+</ul>
+<h3>Errors</h3>
+<table class="table">
+<thead>
+<tr>
+<th>Status</th>
+<th>Condition</th>
+</tr>
+</thead>
+<tbody>
+<tr>
+<td>500</td>
+<td>LLM unreachable or response parse failure</td>
+</tr>
+<tr>
+<td>401</td>
+<td>Missing/invalid auth</td>
+</tr>
+</tbody>
+</table>
+<hr />
+<h2>POST /api/v1/agents/5w1h/analyze</h2>
+<p>Extract 5W1H (Who, What, When, Where, Why, How) from a scene. Uses Gemma4 LLM on port 8082.</p>
+<h3>Request</h3>
+<div class="codehilite"><pre><span></span><code><span class="p">{</span>
+<span class="w">  </span><span class="nt">&quot;file_uuid&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;3abeee81d94597629ed8cb943f182e94&quot;</span><span class="p">,</span>
+<span class="w">  </span><span class="nt">&quot;scene_id&quot;</span><span class="p">:</span><span class="w"> </span><span class="mi">42</span>
+<span class="p">}</span>
+</code></pre></div>
+
+<h3>Response</h3>
+<div class="codehilite"><pre><span></span><code><span class="p">{</span>
+<span class="w">  </span><span class="nt">&quot;success&quot;</span><span class="p">:</span><span class="w"> </span><span class="kc">true</span><span class="p">,</span>
+<span class="w">  </span><span class="nt">&quot;5w1h&quot;</span><span class="p">:</span><span class="w"> </span><span class="p">{</span>
+<span class="w">    </span><span class="nt">&quot;who&quot;</span><span class="p">:</span><span class="w"> </span><span class="p">[</span><span class="s2">&quot;Cary Grant&quot;</span><span class="p">],</span>
+<span class="w">    </span><span class="nt">&quot;what&quot;</span><span class="p">:</span><span class="w"> </span><span class="p">[</span><span class="s2">&quot;discussing plans&quot;</span><span class="p">],</span>
+<span class="w">    </span><span class="nt">&quot;when&quot;</span><span class="p">:</span><span class="w"> </span><span class="p">[</span><span class="s2">&quot;1963&quot;</span><span class="p">],</span>
+<span class="w">    </span><span class="nt">&quot;where&quot;</span><span class="p">:</span><span class="w"> </span><span class="p">[</span><span class="s2">&quot;Paris&quot;</span><span class="p">],</span>
+<span class="w">    </span><span class="nt">&quot;why&quot;</span><span class="p">:</span><span class="w"> </span><span class="p">[</span><span class="s2">&quot;vacation&quot;</span><span class="p">],</span>
+<span class="w">    </span><span class="nt">&quot;how&quot;</span><span class="p">:</span><span class="w"> </span><span class="p">[</span><span class="s2">&quot;in person&quot;</span><span class="p">]</span>
+<span class="w">  </span><span class="p">}</span>
+<span class="p">}</span>
+</code></pre></div>
+
+<h2>POST /api/v1/agents/5w1h/batch</h2>
+<p>Batch analyze all scenes in a file for 5W1H extraction. Uses the pipeline's <code>parent_chunk_5w1h.py --mode llm</code>.</p>
+<h3>Request</h3>
+<div class="codehilite"><pre><span></span><code><span class="p">{</span>
+<span class="w">  </span><span class="nt">&quot;file_uuid&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;3abeee81d94597629ed8cb943f182e94&quot;</span>
+<span class="p">}</span>
+</code></pre></div>
+
+<h2>GET /api/v1/agents/5w1h/status</h2>
+<p>Get status of the 5W1H agent pipeline for a file.</p>
+<hr />
+<h2>Embedding Model</h2>
+<table class="table">
+<thead>
+<tr>
+<th>Detail</th>
+<th>Value</th>
+</tr>
+</thead>
+<tbody>
+<tr>
+<td><strong>Model</strong></td>
+<td>EmbeddingGemma-300m</td>
+</tr>
+<tr>
+<td><strong>Endpoint</strong></td>
+<td><code>POST /v1/embeddings</code> on port 11436</td>
+</tr>
+<tr>
+<td><strong>Dimension</strong></td>
+<td>768</td>
+</tr>
+<tr>
+<td><strong>Used by</strong></td>
+<td><code>parent_chunk_5w1h.py --embed</code>, story, 5W1H, search</td>
+</tr>
+</tbody>
+</table>
+</div>
+</body>
+</html>
\ No newline at end of file
diff --git a/deliverable_v1.1.0/html_docs/doc/index.html b/deliverable_v1.1.0/html_docs/doc/index.html
new file mode 100644
index 0000000..62b15f8
--- /dev/null
+++ b/deliverable_v1.1.0/html_docs/doc/index.html
@@ -0,0 +1,29 @@
+<!DOCTYPE html>
+<html lang="zh-TW">
+<head>
+<meta charset="UTF-8">
+<title>Momentry API 文件</title>
+<style>
+* { margin: 0; padding: 0; box-sizing: border-box; }
+body { font-family: -apple-system, BlinkMacSystemFont, 'Segoe UI', Roboto, sans-serif; background: #f5f5f5; color: #333; padding: 40px; }
+.container { max-width: 900px; margin: 0 auto; background: white; border-radius: 12px; box-shadow: 0 2px 12px rgba(0,0,0,0.08); padding: 40px; }
+h1 { font-size: 28px; margin-bottom: 8px; }
+p.subtitle { color: #666; margin-bottom: 24px; }
+table { width: 100%; border-collapse: collapse; }
+tr { border-bottom: 1px solid #eee; }
+tr:last-child { border: none; }
+td { padding: 10px 0; }
+td.cn { width: 140px; font-weight: 600; color: #333; }
+td.en { color: #666; font-size: 14px; }
+a { color: #0066cc; text-decoration: none; display: block; }
+tr:hover td { background: #f8f8f8; border-radius: 4px; }
+</style>
+</head>
+<body>
+<div class="container">
+<h1>Momentry API 文件</h1>
+<p class="subtitle">API 參考手冊 — 登入後可瀏覽各模組文件</p>
+<table><tr onclick="window.location='01_auth.html'" style="cursor:pointer"><td class="cn">安全認證</td><td class="en">Authentication</td></tr><tr onclick="window.location='02_health.html'" style="cursor:pointer"><td class="cn">健康檢查</td><td class="en">Health</td></tr><tr onclick="window.location='03_register.html'" style="cursor:pointer"><td class="cn">檔案註冊</td><td class="en">File Registration</td></tr><tr onclick="window.location='04_lookup.html'" style="cursor:pointer"><td class="cn">檔案屬性查詢</td><td class="en">File Lookup</td></tr><tr onclick="window.location='05_process.html'" style="cursor:pointer"><td class="cn">處理流程</td><td class="en">Processing</td></tr><tr onclick="window.location='06_search.html'" style="cursor:pointer"><td class="cn">搜尋功能</td><td class="en">Search</td></tr><tr onclick="window.location='07_identity.html'" style="cursor:pointer"><td class="cn">身份識別</td><td class="en">Identity</td></tr><tr onclick="window.location='08_identity_agent.html'" style="cursor:pointer"><td class="cn">智能身份綁定</td><td class="en">Smart Identity Binding</td></tr><tr onclick="window.location='08_media.html'" style="cursor:pointer"><td class="cn">串流與截圖</td><td class="en">Streaming &amp; Thumbnails</td></tr><tr onclick="window.location='09_tmdb.html'" style="cursor:pointer"><td class="cn">TMDb 整合</td><td class="en">TMDb Integration</td></tr><tr onclick="window.location='10_pipeline.html'" style="cursor:pointer"><td class="cn">生產線</td><td class="en">Pipeline</td></tr><tr onclick="window.location='12_agent.html'" style="cursor:pointer"><td class="cn">智慧代理</td><td class="en">AI Agents</td></tr></table>
+</div>
+</body>
+</html>
\ No newline at end of file
diff --git a/deliverable_v1.1.0/html_docs/doc/login.html b/deliverable_v1.1.0/html_docs/doc/login.html
new file mode 100644
index 0000000..c199107
--- /dev/null
+++ b/deliverable_v1.1.0/html_docs/doc/login.html
@@ -0,0 +1,46 @@
+<!DOCTYPE html>
+<html lang="en">
+<head>
+<meta charset="UTF-8">
+<title>Login - Momentry Docs</title>
+<style>
+* { margin: 0; padding: 0; box-sizing: border-box; }
+body { font-family: -apple-system, BlinkMacSystemFont, 'Segoe UI', Roboto, sans-serif; background: #f5f5f5; display: flex; justify-content: center; align-items: center; height: 100vh; }
+.card { background: white; border-radius: 12px; box-shadow: 0 2px 12px rgba(0,0,0,0.08); padding: 40px; width: 360px; }
+h1 { font-size: 24px; margin-bottom: 24px; text-align: center; }
+input { width: 100%; padding: 10px 12px; margin-bottom: 12px; border: 1px solid #ddd; border-radius: 6px; font-size: 14px; }
+button { width: 100%; padding: 10px; background: #0066cc; color: white; border: none; border-radius: 6px; font-size: 16px; cursor: pointer; }
+button:hover { background: #0052a3; }
+.error { color: #cc0000; font-size: 13px; margin-bottom: 12px; display: none; }
+</style>
+</head>
+<body>
+<div class="card">
+<h1>Momentry Docs</h1>
+<form id="loginForm">
+<input type="text" id="username" placeholder="Username" value="demo" required>
+<input type="password" id="password" placeholder="Password" value="demo" required>
+<div class="error" id="error">Invalid credentials</div>
+<button type="submit">Login</button>
+</form>
+</div>
+<script>
+document.getElementById('loginForm').onsubmit = async function(e) {
+    e.preventDefault();
+    const resp = await fetch('/api/v1/auth/login', {
+        method: 'POST',
+        headers: {'Content-Type': 'application/json'},
+        body: JSON.stringify({
+            username: document.getElementById('username').value,
+            password: document.getElementById('password').value
+        })
+    });
+    if (resp.ok) {
+        window.location.href = '/doc/index.html';
+    } else {
+        document.getElementById('error').style.display = 'block';
+    }
+};
+</script>
+</body>
+</html>
\ No newline at end of file
diff --git a/deliverable_v1.1.0/html_docs/doc_developer/11_error_codes.html b/deliverable_v1.1.0/html_docs/doc_developer/11_error_codes.html
new file mode 100644
index 0000000..e1bd41c
--- /dev/null
+++ b/deliverable_v1.1.0/html_docs/doc_developer/11_error_codes.html
@@ -0,0 +1,180 @@
+<!DOCTYPE html>
+<html lang="en">
+<head>
+<meta charset="UTF-8">
+<title>11 Error Codes - Momentry API Docs</title>
+<style>
+* { margin: 0; padding: 0; box-sizing: border-box; }
+body { font-family: -apple-system, BlinkMacSystemFont, 'Segoe UI', Roboto, sans-serif; background: #f5f5f5; color: #333; padding: 40px; }
+.container { max-width: 960px; margin: 0 auto; background: white; border-radius: 12px; box-shadow: 0 2px 12px rgba(0,0,0,0.08); padding: 40px; }
+h1 { font-size: 24px; margin: 24px 0 12px; }
+h2 { font-size: 20px; margin: 20px 0 10px; color: #222; }
+h3 { font-size: 16px; margin: 16px 0 8px; color: #444; }
+p { line-height: 1.6; margin: 8px 0; }
+table { border-collapse: collapse; width: 100%; margin: 12px 0; font-size: 14px; }
+th, td { border: 1px solid #ddd; padding: 8px 12px; text-align: left; }
+th { background: #f0f0f0; font-weight: 600; }
+code { background: #f0f0f0; padding: 2px 6px; border-radius: 3px; font-size: 13px; }
+pre { background: #f8f8f8; border: 1px solid #ddd; border-radius: 6px; padding: 12px; overflow-x: auto; margin: 12px 0; }
+pre code { background: none; padding: 0; }
+a { color: #0066cc; }
+.back { display: inline-block; margin-bottom: 20px; color: #666; }
+.back:hover { color: #333; }
+</style>
+</head>
+<body>
+<div class="container">
+<a class="back" href="index.html">&larr; Back to index</a>
+<!-- module: error_codes -->
+<!-- description: Standard API error codes -->
+<!-- depends: -->
+
+<h2>Error Response Format</h2>
+<p>All API errors follow this JSON structure:</p>
+<div class="codehilite"><pre><span></span><code><span class="p">{</span>
+<span class="w">  </span><span class="nt">&quot;success&quot;</span><span class="p">:</span><span class="w"> </span><span class="kc">false</span><span class="p">,</span>
+<span class="w">  </span><span class="nt">&quot;error&quot;</span><span class="p">:</span><span class="w"> </span><span class="p">{</span>
+<span class="w">    </span><span class="nt">&quot;code&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;E001_NOT_FOUND&quot;</span><span class="p">,</span>
+<span class="w">    </span><span class="nt">&quot;message&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;Resource not found&quot;</span><span class="p">,</span>
+<span class="w">    </span><span class="nt">&quot;details&quot;</span><span class="p">:</span><span class="w"> </span><span class="p">{</span><span class="nt">&quot;resource&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;file_uuid&quot;</span><span class="p">,</span><span class="w"> </span><span class="nt">&quot;value&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;abc&quot;</span><span class="p">}</span>
+<span class="w">  </span><span class="p">}</span>
+<span class="p">}</span>
+</code></pre></div>
+
+<h2>Error Code List</h2>
+<h3>Generic Errors (E0xx)</h3>
+<table class="table">
+<thead>
+<tr>
+<th>Code</th>
+<th>HTTP</th>
+<th>Description</th>
+</tr>
+</thead>
+<tbody>
+<tr>
+<td><code>E001_NOT_FOUND</code></td>
+<td>404</td>
+<td>Resource not found (file, identity, chunk)</td>
+</tr>
+<tr>
+<td><code>E002_DUPLICATE</code></td>
+<td>409</td>
+<td>Resource already exists</td>
+</tr>
+<tr>
+<td><code>E003_VALIDATION</code></td>
+<td>400</td>
+<td>Request parameter validation failed</td>
+</tr>
+<tr>
+<td><code>E004_UNAUTHORIZED</code></td>
+<td>401</td>
+<td>Invalid API key or token</td>
+</tr>
+<tr>
+<td><code>E005_INTERNAL</code></td>
+<td>500</td>
+<td>Internal server error</td>
+</tr>
+</tbody>
+</table>
+<h3>Processor Errors (E1xx)</h3>
+<table class="table">
+<thead>
+<tr>
+<th>Code</th>
+<th>HTTP</th>
+<th>Description</th>
+</tr>
+</thead>
+<tbody>
+<tr>
+<td><code>E101_PROCESSOR_FAIL</code></td>
+<td>500</td>
+<td>Python script execution failed</td>
+</tr>
+<tr>
+<td><code>E102_TIMEOUT</code></td>
+<td>504</td>
+<td>Processing timeout</td>
+</tr>
+<tr>
+<td><code>E103_RESUME_FAIL</code></td>
+<td>500</td>
+<td>Resume failed (checkpoint not found)</td>
+</tr>
+<tr>
+<td><code>E104_NO_VIDEO</code></td>
+<td>400</td>
+<td>Video file path not found</td>
+</tr>
+</tbody>
+</table>
+<h3>Identity Errors (E2xx)</h3>
+<table class="table">
+<thead>
+<tr>
+<th>Code</th>
+<th>HTTP</th>
+<th>Description</th>
+</tr>
+</thead>
+<tbody>
+<tr>
+<td><code>E201_FACE_NOT_FOUND</code></td>
+<td>404</td>
+<td>Face detection not found</td>
+</tr>
+<tr>
+<td><code>E202_MERGE_CONFLICT</code></td>
+<td>409</td>
+<td>Identity merge conflict</td>
+</tr>
+<tr>
+<td><code>E203_CANDIDATE_EMPTY</code></td>
+<td>404</td>
+<td>No candidates available for confirmation</td>
+</tr>
+</tbody>
+</table>
+<h3>TMDb Errors (E3xx)</h3>
+<table class="table">
+<thead>
+<tr>
+<th>Code</th>
+<th>HTTP</th>
+<th>Description</th>
+</tr>
+</thead>
+<tbody>
+<tr>
+<td><code>E301_TMDB_NO_KEY</code></td>
+<td>400</td>
+<td><code>TMDB_API_KEY</code> environment variable not set</td>
+</tr>
+<tr>
+<td><code>E302_TMDB_UNREACHABLE</code></td>
+<td>502</td>
+<td>TMDb API unreachable or timed out</td>
+</tr>
+<tr>
+<td><code>E303_TMDB_CACHE_NOT_FOUND</code></td>
+<td>200</td>
+<td>No local TMDb cache; run prefetch first</td>
+</tr>
+<tr>
+<td><code>E304_TMDB_PROBE_FAILED</code></td>
+<td>500</td>
+<td>TMDb probe execution failed</td>
+</tr>
+<tr>
+<td><code>E305_TMDB_MOVIE_NOT_FOUND</code></td>
+<td>404</td>
+<td>No matching TMDb movie found from filename</td>
+</tr>
+</tbody>
+</table>
+</div>
+</body>
+</html>
\ No newline at end of file
diff --git a/deliverable_v1.1.0/html_docs/doc_developer/index.html b/deliverable_v1.1.0/html_docs/doc_developer/index.html
new file mode 100644
index 0000000..6a66aa7
--- /dev/null
+++ b/deliverable_v1.1.0/html_docs/doc_developer/index.html
@@ -0,0 +1,29 @@
+<!DOCTYPE html>
+<html lang="zh-TW">
+<head>
+<meta charset="UTF-8">
+<title>Momentry API 文件</title>
+<style>
+* { margin: 0; padding: 0; box-sizing: border-box; }
+body { font-family: -apple-system, BlinkMacSystemFont, 'Segoe UI', Roboto, sans-serif; background: #f5f5f5; color: #333; padding: 40px; }
+.container { max-width: 900px; margin: 0 auto; background: white; border-radius: 12px; box-shadow: 0 2px 12px rgba(0,0,0,0.08); padding: 40px; }
+h1 { font-size: 28px; margin-bottom: 8px; }
+p.subtitle { color: #666; margin-bottom: 24px; }
+table { width: 100%; border-collapse: collapse; }
+tr { border-bottom: 1px solid #eee; }
+tr:last-child { border: none; }
+td { padding: 10px 0; }
+td.cn { width: 140px; font-weight: 600; color: #333; }
+td.en { color: #666; font-size: 14px; }
+a { color: #0066cc; text-decoration: none; display: block; }
+tr:hover td { background: #f8f8f8; border-radius: 4px; }
+</style>
+</head>
+<body>
+<div class="container">
+<h1>Momentry API 文件</h1>
+<p class="subtitle">API 參考手冊 — 登入後可瀏覽各模組文件</p>
+<table><tr onclick="window.location='11_error_codes.html'" style="cursor:pointer"><td class="cn">錯誤碼</td><td class="en">Error Codes</td></tr></table>
+</div>
+</body>
+</html>
\ No newline at end of file
diff --git a/deliverable_v1.1.0/html_docs/doc_developer/login.html b/deliverable_v1.1.0/html_docs/doc_developer/login.html
new file mode 100644
index 0000000..c199107
--- /dev/null
+++ b/deliverable_v1.1.0/html_docs/doc_developer/login.html
@@ -0,0 +1,46 @@
+<!DOCTYPE html>
+<html lang="en">
+<head>
+<meta charset="UTF-8">
+<title>Login - Momentry Docs</title>
+<style>
+* { margin: 0; padding: 0; box-sizing: border-box; }
+body { font-family: -apple-system, BlinkMacSystemFont, 'Segoe UI', Roboto, sans-serif; background: #f5f5f5; display: flex; justify-content: center; align-items: center; height: 100vh; }
+.card { background: white; border-radius: 12px; box-shadow: 0 2px 12px rgba(0,0,0,0.08); padding: 40px; width: 360px; }
+h1 { font-size: 24px; margin-bottom: 24px; text-align: center; }
+input { width: 100%; padding: 10px 12px; margin-bottom: 12px; border: 1px solid #ddd; border-radius: 6px; font-size: 14px; }
+button { width: 100%; padding: 10px; background: #0066cc; color: white; border: none; border-radius: 6px; font-size: 16px; cursor: pointer; }
+button:hover { background: #0052a3; }
+.error { color: #cc0000; font-size: 13px; margin-bottom: 12px; display: none; }
+</style>
+</head>
+<body>
+<div class="card">
+<h1>Momentry Docs</h1>
+<form id="loginForm">
+<input type="text" id="username" placeholder="Username" value="demo" required>
+<input type="password" id="password" placeholder="Password" value="demo" required>
+<div class="error" id="error">Invalid credentials</div>
+<button type="submit">Login</button>
+</form>
+</div>
+<script>
+document.getElementById('loginForm').onsubmit = async function(e) {
+    e.preventDefault();
+    const resp = await fetch('/api/v1/auth/login', {
+        method: 'POST',
+        headers: {'Content-Type': 'application/json'},
+        body: JSON.stringify({
+            username: document.getElementById('username').value,
+            password: document.getElementById('password').value
+        })
+    });
+    if (resp.ok) {
+        window.location.href = '/doc/index.html';
+    } else {
+        document.getElementById('error').style.display = 'block';
+    }
+};
+</script>
+</body>
+</html>
\ No newline at end of file
diff --git a/deliverable_v1.1.0/modules/01_auth.md b/deliverable_v1.1.0/modules/01_auth.md
new file mode 100644
index 0000000..96b8979
--- /dev/null
+++ b/deliverable_v1.1.0/modules/01_auth.md
@@ -0,0 +1,280 @@
+<!-- module: auth -->
+<!-- description: Authentication — login, logout, JWT, session cookie, API key -->
+<!-- depends: -->
+
+## Base URL
+
+| Environment | URL | Purpose |
+|-------------|-----|---------|
+| Production | `http://localhost:3002` | Production deployment |
+| External (M5) | `https://m5api.momentry.ddns.net` | Remote access |
+
+## Variables
+
+All examples in this documentation use these shell variables:
+
+```bash
+API="http://localhost:3002"
+KEY="your-api-key-here"
+```
+
+## Authentication
+
+All endpoints under `/api/v1/*` require authentication.
+The following endpoints are public (no auth needed):
+
+- `GET /health`
+- `POST /api/v1/auth/login`
+- `POST /api/v1/auth/logout`
+
+### Three Authentication Modes
+
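+The system supports three authentication methods, checked in **priority order** by the middleware (an API key may be sent either as a header or as a query parameter, which is why four checks are listed):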
+
+```
+Middleware priority:
+  1. Session Cookie (Portal/browser)
+  2. JWT Bearer (API clients, CLI)
+  3. API Key Header (legacy compatibility)
+  4. API Key Query Param (?api_key=)
+```
+
+| Mode | Transport | Expiry | Scope | Best for |
+|------|-----------|--------|-------|----------|
+| **Session Cookie** | `Cookie: session_id=<session_id>` | 24h | per-browser session | Portal (browser) |
+| **JWT** | `Authorization: Bearer <token>` | 1h | per-login token | API clients, CLI, scripts |
+| **API Key** | `X-API-Key: <key>` | 90d | fixed key for automation | Legacy scripts, WordPress |
+
+---
+
+### Login
+
+**Default accounts & API keys:**
+
+| Username | Password | API Key | Role |
+|----------|----------|---------|------|
+| `admin` | `admin` | — | admin |
+| `demo` | `demo` | `muser_demo_key_32chars_abcdef1234567890` | user |
+
+The demo API key is set via `MOMENTRY_DEMO_API_KEY` env var and can be used in place of JWT for marcom integrations:
+
+```bash
+# Using API key instead of JWT
+curl -s "$API/api/v1/files/scan" -H "X-API-Key: muser_demo_key_32chars_abcdef1234567890"
+```
+
+```bash
+# Login as admin
+curl -s -X POST "$API/api/v1/auth/login" \
+  -H "Content-Type: application/json" \
+  -d '{"username": "admin", "password": "admin"}'
+
+# Login as demo user
+curl -s -X POST "$API/api/v1/auth/login" \
+  -H "Content-Type: application/json" \
+  -d '{"username": "demo", "password": "demo"}'
+```
+
+#### Success Response
+
+```json
+{
+  "success": true,
+  "jwt": "eyJhbGciOiJIUzI1NiIs...",
+  "api_key": "muser_...",
+  "user": {
+    "username": "admin",
+    "role": "admin"
+  },
+  "expires_at": "2026-05-18T13:00:00Z"
+}
+```
+
+| Field | Type | Description |
+|-------|------|-------------|
+| `jwt` | string | JWT access token. Use as `Authorization: Bearer <jwt>`. Expires in 1 hour. |
+| `api_key` | string | Legacy API key. Use as `X-API-Key: <key>`. Good for 90 days. |
+| `user.username` | string | Username |
+| `user.role` | string | Role: `admin`, `user`, or `readonly` |
+| `expires_at` | string | ISO8601 timestamp of JWT expiration |
+
+The login endpoint also sets a `Set-Cookie` header for browser-based clients:
+
+```
+Set-Cookie: session_id=<session_id>; Path=/; HttpOnly; SameSite=Strict; Max-Age=86400
+```
+
+#### Error Response (401)
+
+```json
+{
+  "success": false,
+  "message": "Invalid username or password"
+}
+```
+
+---
+
+### Using JWT
+
+JWT is preferred for API clients (CLI scripts, WordPress). It is validated by the middleware without a database lookup (stateless).
+
+```bash
+# Login and capture JWT
+JWT=$(curl -s -X POST "$API/api/v1/auth/login" \
+  -H "Content-Type: application/json" \
+  -d '{"username":"admin","password":"admin"}' | python3 -c "import json,sys;print(json.load(sys.stdin)['jwt'])")
+
+# Use JWT for all subsequent requests
+curl -H "Authorization: Bearer $JWT" "$API/api/v1/files/scan"
+curl -H "Authorization: Bearer $JWT" "$API/api/v1/resource/tmdb"
+```
+
+JWT is short-lived (1 hour). When it expires, request a new one via login.
+
+---
+
+### Using Session Cookie (Browser)
+
+Browser-based clients (Portal) get a session cookie automatically after login. The browser sends the cookie with every request—no manual header needed.
+
+```bash
+# Login captures the session cookie from Set-Cookie header
+curl -v -X POST "$API/api/v1/auth/login" \
+  -H "Content-Type: application/json" \
+  -d '{"username":"admin","password":"admin"}' 2>&1 | grep -i "Set-Cookie"
+
+# Browser automatically sends: Cookie: session_id=<session_id>
+# No manual header needed for subsequent requests
+```
+
+The session cookie is HttpOnly (not accessible from JavaScript) and SameSite=Strict (protected against CSRF).
+
+---
+
+### Using Legacy API Key
+
+```bash
+curl -H "X-API-Key: $KEY" "$API/api/v1/files/scan"
+
+# Also accepted via Bearer header (non-JWT format) or query parameter:
+curl -H "Authorization: Bearer $KEY" "$API/api/v1/files/scan"
+curl "$API/api/v1/files/scan?api_key=$KEY"
+```
+
+API keys are validated via SHA256 hash lookup in the database. They are long-lived (90 days) and intended for automation.
+
+### Obtaining an API Key (CLI)
+
+```bash
+momentry api-key create "My API Key" --key-type user
+```
+
+---
+
+### Logout
+
+```bash
+# Logout using the session cookie (browser)
+curl -X POST "$API/api/v1/auth/logout" \
+  -H "Cookie: session_id=<session_id>"
+```
+
+#### What logout does
+
+| Auth mode | Effect |
+|-----------|--------|
+| **Session Cookie** | Session deleted from database. Same cookie returns 401 on subsequent requests. |
+| **JWT** | JWT remains valid until expiry. (JWT is stateless — logout adds JWT to a blacklist only if API key mode is used.) |
+| **API Key** | API key remains valid. (Legacy keys are shared across sessions — revoking would break other clients.) |
+
+#### Example: full session lifecycle
+
+```bash
+# 1. Login
+SESSION_ID=$(curl -s -D - -X POST "$API/api/v1/auth/login" \
+  -H "Content-Type: application/json" \
+  -d '{"username":"admin","password":"admin"}' | grep -i "Set-Cookie" | sed 's/.*session_id=\([^;]*\).*/\1/')
+
+# 2. Use session (works)
+curl -s -o /dev/null -w "HTTP %{http_code}\n" "$API/api/v1/resource/tmdb" \
+  -H "Cookie: session_id=$SESSION_ID"
+# → HTTP 200
+
+# 3. Logout
+curl -s -X POST "$API/api/v1/auth/logout" \
+  -H "Cookie: session_id=$SESSION_ID"
+# → {"success": true}
+
+# 4. Use session again (rejected)
+curl -s -o /dev/null -w "HTTP %{http_code}\n" "$API/api/v1/resource/tmdb" \
+  -H "Cookie: session_id=$SESSION_ID"
+# → HTTP 401
+```
+
+---
+
+### Authentication Flow Summary
+
+```
+Login Request
+     │
+     ▼
+┌──────────────────┐
+│  1. Check users  │ ← users table (argon2 password verify)
+│     table        │
+└──────┬───────────┘
+       │
+   ┌───┴───┐
+   │ match │
+   └───┬───┘
+       │
+       ▼
+┌──────────────────┐
+│  2. Create JWT   │ ← 1h expiry, signed with JWT_SECRET
+├──────────────────┤
+│  3. Create       │ ← 24h expiry, stored in sessions table
+│     session      │
+├──────────────────┤
+│  4. Set-Cookie   │ ← HttpOnly, SameSite=Strict, Path=/
+├──────────────────┤
+│  5. Return       │ ← JWT + api_key + user info to client
+└──────────────────┘
+```
+
+```
+Protected Request
+     │
+     ▼
+┌──────────────────────┐
+│  Middleware checks:  │
+│                      │
+│  1. Cookie session?  │ → DB lookup session → get api_key → verify
+│                      │
+│  2. JWT Bearer?      │ → verify JWT signature → decode claims
+│                      │
+│  3. X-API-Key?       │ → SHA256 hash → DB lookup → verify
+│                      │
+│  4. ?api_key=?       │ → same as #3
+│                      │
+│  5. None → 401       │
+└──────────────────────┘
+```
+
+---
+
+### Error Responses
+
+| HTTP | When |
+|------|------|
+| `401` | Missing or invalid authentication |
+| `401` | Session expired or logged out |
+| `401` | JWT expired |
+| `401` | API key revoked or inactive |
+
+---
+
+### Related
+
+- `POST /api/v1/resource/tmdb/check` — test authentication + TMDb API connectivity
+- `GET /health/detailed` — view auth status (integrations section)
diff --git a/deliverable_v1.1.0/modules/02_health.md b/deliverable_v1.1.0/modules/02_health.md
new file mode 100644
index 0000000..46f7df0
--- /dev/null
+++ b/deliverable_v1.1.0/modules/02_health.md
@@ -0,0 +1,147 @@
+<!-- module: health -->
+<!-- description: Health check endpoints -->
+<!-- depends: 01_auth -->
+
+## Health Check
+
+### `GET /health`
+
+**Auth**: Public
+**Scope**: system-level
+
+Returns basic server health status — used by load balancers and monitoring.
+
+#### Example
+
+```bash
+curl "$API/health" | jq '{status, version}'
+```
+
+#### Response (200)
+
+```json
+{
+  "status": "ok",
+  "version": "1.0.0",
+  "build_git_hash": "3a6c1865",
+  "build_timestamp": "2026-05-16T13:38:15Z",
+  "uptime_ms": 3015
+}
+```
+
+| Field | Type | Description |
+|-------|------|-------------|
+| `status` | string | `ok` or `degraded` |
+| `version` | string | Semver version |
+| `build_git_hash` | string | Git commit hash |
+| `build_timestamp` | string | Binary build time |
+| `uptime_ms` | integer | Milliseconds since server start |
+
+---
+
+### `GET /health/detailed`
+
+**Auth**: Required
+**Scope**: system-level
+
+Returns full system health including each service status, resource utilization, pipeline readiness, schema migration status, identity file sync status, and external integrations.
+
+> Requires authentication (JWT, session cookie, or API key). The basic `/health` endpoint remains public for load balancer checks.
+
+#### Example
+
+```bash
+curl "$API/health/detailed" -H "X-API-Key: $KEY" | jq '{status, services, resources: {cpu: .resources.cpu_used_percent, memory: .resources.memory_used_percent}}'
+```
+
+#### Response (200)
+
+```json
+{
+  "status": "ok",
+  "version": "1.0.0",
+  "services": {
+    "postgres": {"status": "ok", "latency_ms": 3},
+    "redis": {"status": "ok", "latency_ms": 1},
+    "qdrant": {"status": "ok", "latency_ms": 5}
+  },
+  "resources": {
+    "cpu_used_percent": 12.5,
+    "memory_available_mb": 32768,
+    "memory_used_percent": 31.7
+  },
+  "pipeline": {
+    "scripts_ready": true,
+    "scripts_count": 345,
+    "processors": {
+      "asr": true,
+      "yolo": true,
+      "face": true,
+      "pose": true,
+      "ocr": true,
+      "cut": true,
+      "scene": true,
+      "asrx": true,
+      "visual_chunk": true
+    },
+    "models_ready": true,
+    "models_count": 42,
+    "scripts_integrity": {"matched": 332, "total": 345, "ok": false},
+    "ffmpeg": true
+  },
+  "schema": {
+    "table_exists": true,
+    "applied": [{"filename": "migrate_add_users_table.sql"}],
+    "required": [],
+    "ok": true
+  },
+  "identities": {
+    "directory_exists": true,
+    "files_count": 3481,
+    "index_ok": true,
+    "db_count": 3481,
+    "synced": true
+  },
+  "integrations": {
+    "tmdb": {
+      "api_key_configured": false,
+      "enabled": false,
+      "api_reachable": null
+    }
+  }
+}
+```
+
+#### Response Fields
+
+| Field | Type | Description |
+|-------|------|-------------|
+| `status` | string | `ok` if all essential services healthy |
+| `services` | object | Per-service status (postgres, redis, qdrant) |
+| `services.*.status` | string | `ok`, `error`, or `degraded` |
+| `services.*.latency_ms` | int | Response time in milliseconds |
+| `resources` | object | CPU, memory usage |
+| `pipeline.scripts_ready` | boolean | Scripts directory accessible |
+| `pipeline.scripts_count` | int | Number of Python processor scripts |
+| `pipeline.processors` | object | Per-processor availability |
+| `pipeline.models_ready` | boolean | Models directory accessible |
+| `pipeline.scripts_integrity` | object | SHA256 checksum verification results |
+| `schema.ok` | boolean | All required migrations applied |
+| `identities.synced` | boolean | Identity file count matches DB count |
+| `integrations.tmdb` | object | TMDB API key config and reachability |
+
+#### Health status rules
+
+| Condition | status |
+|-----------|--------|
+| All services ok | `ok` |
+| Any service error | `degraded` |
+| Postgres or Redis error | `degraded` (server still responds) |
+
+---
+
+### Stats Endpoints
+
+| Method | Endpoint | Auth | Description |
+|--------|----------|------|-------------|
+| GET | `/api/v1/stats/sftpgo` | No | SFTPGo service status |
diff --git a/deliverable_v1.1.0/modules/03_register.md b/deliverable_v1.1.0/modules/03_register.md
new file mode 100644
index 0000000..9bae26f
--- /dev/null
+++ b/deliverable_v1.1.0/modules/03_register.md
@@ -0,0 +1,184 @@
+<!-- module: register -->
+<!-- description: File registration — register, scan -->
+<!-- depends: 01_auth -->
+
+## File Registration
+
+### `POST /api/v1/files/register`
+
+**Auth**: Required
+**Scope**: file-level
+
+Register a video file for processing. Returns the file's metadata and UUID.
+
+**New in v0.1.2**: Registration now **automatically triggers the processing pipeline** — no need to call `POST /api/v1/file/:file_uuid/process` separately. The system will:
+1. Register the file and run ffprobe
+2. Auto-run offline TMDb probe (reads local identity files, no API calls)
+3. Create a monitor job for the worker
+4. Worker starts all 10 processors (Cut → ASR → ASRX → YOLO → OCR → Face → Pose → VisualChunk → Story → 5W1H)
+
+If the file already exists (same content hash), returns the existing record with `already_exists: true`.
+
+#### Request Parameters
+
+| Field | Type | Required | Default | Description |
+|-------|------|----------|---------|-------------|
+| `file_path` | string | Yes | — | Path to video file on disk |
+| `pattern` | string | No | — | Regex pattern for batch register (requires `file_path` to be a directory) |
+| `user_id` | integer | No | — | User ID to associate with registration |
+| `content_hash` | string | No | — | Pre-computed SHA-256 hash (skips computation) |
+
+#### Example
+
+```bash
+# Register a single file
+curl -s -X POST "$API/api/v1/files/register" \
+  -H "Content-Type: application/json" \
+  -H "X-API-Key: $KEY" \
+  -d '{"file_path": "/path/to/video.mp4"}'
+
+# Batch register files matching a pattern in a directory
+curl -s -X POST "$API/api/v1/files/register" \
+  -H "Content-Type: application/json" \
+  -H "X-API-Key: $KEY" \
+  -d '{"file_path": "/path/to/dir", "pattern": ".*\\.mp4$"}'
+```
+
+#### Response (200)
+
+```json
+{
+  "success": true,
+  "file_uuid": "3a6c1865...",
+  "file_name": "video.mp4",
+  "file_path": "/path/to/video.mp4",
+  "file_type": "video",
+  "duration": 120.5,
+  "width": 1920,
+  "height": 1080,
+  "fps": 24.0,
+  "total_frames": 2892,
+  "already_exists": false,
+  "message": "File registered successfully"
+}
+```
+
+| Field | Type | Description |
+|-------|------|-------------|
+| `success` | boolean | Always true on 200 |
+| `file_uuid` | string | 32-char hex UUID of the registered file |
+| `file_name` | string | File name (auto-renamed if name conflict) |
+| `file_path` | string | Canonical path on disk |
+| `file_type` | string | `"video"`, `"audio"`, or `"unknown"` |
+| `duration` | float | Duration in seconds |
+| `width` | integer | Video width in pixels |
+| `height` | integer | Video height in pixels |
+| `fps` | float | Frames per second |
+| `total_frames` | integer | Total frame count |
+| `already_exists` | boolean | True if same content was already registered |
+| `message` | string | Human-readable status |
+
+#### Error Responses
+
+| HTTP | When |
+|------|------|
+| `401` | Missing or invalid API key |
+| `400` | Invalid request body |
+| `404` | File path does not exist |
+
+---
+
+### `GET /api/v1/files/scan`
+
+**Auth**: Required
+**Scope**: file-level
+
+Scan the filesystem directory and list all media files, showing which are registered, processing, or unregistered.
+
+#### Query Parameters
+
+| Field | Type | Required | Default | Description |
+|-------|------|----------|---------|-------------|
+| `page` | integer | No | 1 | Page number (1-based) |
+| `page_size` | integer | No | all | Items per page (alias: `limit`) |
+| `limit` | integer | No | all | Max items (alias for `page_size`) |
+| `pattern` | string | No | — | Regex filter on file name (e.g., `.*\.mp4$`) |
+| `sort_by` | string | No | `name` | Sort field: `name`, `size`, `modified`, `status` |
+| `sort_order` | string | No | `asc` | Sort direction: `asc` or `desc` |
+
+#### Example
+
+```bash
+# Full scan
+curl -s "$API/api/v1/files/scan" -H "X-API-Key: $KEY" | jq '{total, registered_count, unregistered_count}'
+
+# Paginated (page 1, 5 per page)
+curl -s "$API/api/v1/files/scan?page=1&page_size=5" -H "X-API-Key: $KEY" | jq '{page, total_pages, files: [.files[].file_name]}'
+
+# Regex filter: only mp4 files
+curl -s "$API/api/v1/files/scan?pattern=.*\\.mp4$" -H "X-API-Key: $KEY" | jq '{filtered_total, files: [.files[].file_name]}'
+
+# Sort by file size (largest first)
+curl -s "$API/api/v1/files/scan?sort_by=size&sort_order=desc&page_size=5" -H "X-API-Key: $KEY" | jq '[.files[] | {file_name, file_size}]'
+
+# Sort by modified time (most recent first)
+curl -s "$API/api/v1/files/scan?sort_by=modified&sort_order=desc&page_size=5" -H "X-API-Key: $KEY" | jq '[.files[] | {file_name, modified_time}]'
+
+# Sort by status
+curl -s "$API/api/v1/files/scan?sort_by=status&page_size=5" -H "X-API-Key: $KEY" | jq '[.files[] | {file_name, status}]'
+```
+
+#### Response (200)
+
+```json
+{
+  "files": [
+    {
+      "file_name": "video.mp4",
+      "file_size": 12345678,
+      "is_registered": true,
+      "file_uuid": "3a6c1865...",
+      "status": "completed",
+      "registration_time": "2026-05-16T12:00:00Z",
+      "job_id": 42
+    }
+  ],
+  "total": 107,
+  "filtered_total": 80,
+  "page": 1,
+  "page_size": 20,
+  "total_pages": 4,
+  "registered_count": 26,
+  "unregistered_count": 81
+}
+```
+
+| Field | Type | Description |
+|-------|------|-------------|
+| `files` | array | Array of file info objects (paginated) |
+| `files[].file_name` | string | File name |
+| `files[].relative_path` | string | Path relative to scan root |
+| `files[].file_path` | string | Absolute path on disk |
+| `files[].file_size` | integer | File size in bytes |
+| `files[].modified_time` | string | Last modified timestamp (ISO8601) |
+| `files[].is_registered` | boolean | Whether file is registered in DB |
+| `files[].file_uuid` | string | 32-char hex UUID (only if registered) |
+| `files[].status` | string | `"completed"`, `"processing"`, `"registered"`, `"unregistered"`, or `null` |
+| `files[].registration_time` | string | DB registration timestamp (only if registered) |
+| `files[].job_id` | integer | Processing job ID (only if a job exists) |
+| `total` | integer | Total files found on disk (unfiltered) |
+| `filtered_total` | integer | Files matching regex filter |
+| `page` | integer | Current page number |
+| `page_size` | integer | Items per page |
+| `total_pages` | integer | Total pages |
+| `registered_count` | integer | Files registered in DB |
+| `unregistered_count` | integer | Files not yet registered |
+
+#### Notes
+
+| Feature | Behavior |
+|---------|----------|
+| **Regex** | Case-insensitive (`(?i)` prefix auto-applied). Applied to `file_name`. |
+| **Sort order** | Default (`sort_by=name`): registered files first, then alphabetically. `sort_by=status`: alphabetical by status string. |
+| **Pagination** | `page_size` and `limit` are aliases. Default: show all results. |
+| **Processing order** | `pattern` regex filter → `sort_by`/`sort_order` → `page`/`page_size` slice. |
diff --git a/deliverable_v1.1.0/modules/04_lookup.md b/deliverable_v1.1.0/modules/04_lookup.md
new file mode 100644
index 0000000..019c8af
--- /dev/null
+++ b/deliverable_v1.1.0/modules/04_lookup.md
@@ -0,0 +1,138 @@
+<!-- module: lookup -->
+<!-- description: File lookup by name and unregistration -->
+<!-- depends: 01_auth, 03_register -->
+
+## File Lookup
+
+### `GET /api/v1/files/lookup`
+
+**Auth**: Required
+**Scope**: file-level
+
+Search registered files by file name. Performs a case-insensitive LIKE search on the file name column. Returns basic info about matching files.
+
+#### Query Parameters
+
+| Field | Type | Required | Description |
+|-------|------|----------|-------------|
+| `file_name` | string | Yes | File name to search for (partial matches supported) |
+
+#### Example
+
+```bash
+# Look up a specific file
+curl -s "$API/api/v1/files/lookup?file_name=video.mp4" \
+  -H "X-API-Key: $KEY"
+
+# Partial name search
+curl -s "$API/api/v1/files/lookup?file_name=charade" \
+  -H "X-API-Key: $KEY" | jq '.matches[].file_name'
+```
+
+#### Response (200)
+
+```json
+{
+  "file_name": "video.mp4",
+  "exists": true,
+  "matches": [
+    {
+      "file_uuid": "a03485a40b2df2d3",
+      "file_name": "video.mp4",
+      "file_type": "video",
+      "status": "completed"
+    }
+  ],
+  "next_name": "video (2).mp4"
+}
+```
+
+| Field | Type | Description |
+|-------|------|-------------|
+| `file_name` | string | Searched name |
+| `exists` | boolean | Exact name match exists |
+| `matches` | array | Array of matching registered files |
+| `matches[].file_uuid` | string | 32-char hex UUID |
+| `matches[].file_name` | string | Registered file name |
+| `matches[].file_type` | string | `"video"`, `"audio"`, or `null` |
+| `matches[].status` | string | Registration/processing status |
+| `next_name` | string | Suggested name for avoiding conflicts |
+
+---
+
+## Unregister
+
+### `POST /api/v1/unregister`
+
+**Auth**: Required
+**Scope**: file-level
+
+Delete a registered file from the system. Supports single file by UUID, or batch by directory + regex pattern.
+
+#### What gets deleted
+
+| Removed (default) | Not removed |
+|---------|-------------|
+| Database records (videos, chunks, embeddings, processor_results, pre_chunks) | The original source video file on disk |
+| Processor output JSON files (`{uuid}.*.json`) — unless `delete_output_files: false` | Temp/working directories |
+| In-memory cache entries | |
+| MongoDB cached lists | |
+
+> ⚠️ Database deletion is **irreversible**. To keep output files, set `"delete_output_files": false`.
+
+#### Request Parameters
+
+At least one mode must be specified: either `file_uuid` alone, or `file_path` + `pattern` together.
+
+| Field | Type | Required | Default | Description |
+|-------|------|----------|---------|-------------|
+| `file_uuid` | string | * | — | Single file UUID to delete |
+| `file_path` | string | * | — | Directory path (for batch delete) |
+| `pattern` | string | * | — | Regex pattern (requires `file_path`) |
+| `delete_output_files` | boolean | No | `true` | If `true`, also delete processor output JSON files (`{uuid}.*.json`). Set to `false` to keep them. |
+
+#### Example
+
+```bash
+# Delete a single file by UUID (default: also deletes output JSON files)
+curl -s -X POST "$API/api/v1/unregister" \
+  -H "Content-Type: application/json" \
+  -H "X-API-Key: $KEY" \
+  -d '{"file_uuid": "'"$FILE_UUID"'"}'
+
+# Keep output JSON files, only delete DB records
+curl -s -X POST "$API/api/v1/unregister" \
+  -H "Content-Type: application/json" \
+  -H "X-API-Key: $KEY" \
+  -d '{"file_uuid": "'"$FILE_UUID"'", "delete_output_files": false}'
+
+# Batch delete all mp4 files in a directory
+curl -s -X POST "$API/api/v1/unregister" \
+  -H "Content-Type: application/json" \
+  -H "X-API-Key: $KEY" \
+  -d '{"file_path": "/path/to/dir", "pattern": ".*\\.mp4$"}'
+```
+
+#### Response (200)
+
+```json
+{
+  "success": true,
+  "file_uuid": "a03485a40b2df2d3",
+  "message": "Video unregistered successfully"
+}
+```
+
+| Field | Type | Description |
+|-------|------|-------------|
+| `success` | boolean | True if deletion succeeded |
+| `file_uuid` | string | UUID of the deleted file (single mode) |
+| `message` | string | Human-readable status |
+
+#### Error Responses
+
+| HTTP | When |
+|------|------|
+| `400` | Neither `file_uuid` nor `file_path`+`pattern` provided |
+| `404` | File UUID not found |
+| `401` | Missing or invalid API key |
diff --git a/deliverable_v1.1.0/modules/05_process.md b/deliverable_v1.1.0/modules/05_process.md
new file mode 100644
index 0000000..9f9baf8
--- /dev/null
+++ b/deliverable_v1.1.0/modules/05_process.md
@@ -0,0 +1,236 @@
+<!-- module: process -->
+<!-- description: Processing pipeline — trigger, probe, progress, jobs -->
+<!-- depends: 01_auth, 03_register -->
+
+## Processing Pipeline
+
+### `POST /api/v1/file/:file_uuid/process`
+
+**Auth**: Required
+**Scope**: file-level
+
+Trigger the processing pipeline for a registered file. Creates a monitor job that the worker picks up and processes sequentially. Returns immediately with the job info—processing runs asynchronously in the background.
+
+#### Request Parameters
+
+| Field | Type | Required | Default | Description |
+|-------|------|----------|---------|-------------|
+| `processors` | string[] | No | all | Specific processors to run: `["cut","asr","asrx","yolo","ocr","face","pose","visual_chunk","story","5w1h"]` |
+| `rules` | string[] | No | all | Rule names to apply (currently unused) |
+
+#### Example
+
+```bash
+# Run all processors
+curl -s -X POST "$API/api/v1/file/$FILE_UUID/process" \
+  -H "Content-Type: application/json" \
+  -H "X-API-Key: $KEY" -d '{}'
+
+# Run specific processors only
+curl -s -X POST "$API/api/v1/file/$FILE_UUID/process" \
+  -H "Content-Type: application/json" \
+  -H "X-API-Key: $KEY" \
+  -d '{"processors": ["asr", "face", "yolo"]}'
+```
+
+#### Response (200)
+
+```json
+{
+  "success": true,
+  "job_id": 42,
+  "file_uuid": "3a6c1865...",
+  "status": "processing",
+  "pids": [12345, 12346],
+  "message": "Processing triggered for video.mp4"
+}
+```
+
+| Field | Type | Description |
+|-------|------|-------------|
+| `success` | boolean | Always true on 200 |
+| `job_id` | integer | Monitor job ID (for job tracking) |
+| `file_uuid` | string | 32-char hex UUID of the file |
+| `status` | string | `"processing"` |
+| `pids` | integer[] | Process IDs of started processors |
+| `message` | string | Human-readable status |
+
+#### Error Responses
+
+| HTTP | When |
+|------|------|
+| `404` | File UUID not found |
+| `401` | Missing or invalid API key |
+
+---
+
+### `GET /api/v1/file/:file_uuid/probe`
+
+**Auth**: Required
+**Scope**: file-level
+
+Get ffprobe metadata for a registered file. Returns video/audio stream info, codec details, duration, resolution, and frame rate.
+
+#### Example
+
+```bash
+curl -s "$API/api/v1/file/$FILE_UUID/probe" -H "X-API-Key: $KEY"
+```
+
+#### Response (200)
+
+```json
+{
+  "file_uuid": "3a6c1865...",
+  "file_name": "video.mp4",
+  "file_size": 794863677,
+  "duration": 120.5,
+  "width": 1920,
+  "height": 1080,
+  "fps": 24.0,
+  "total_frames": 2892,
+  "cached": true,
+  "format": {
+    "filename": "/path/to/video.mp4",
+    "format_name": "mov,mp4,m4a,3gp",
+    "duration": "120.5",
+    "size": "12345678",
+    "bit_rate": "819200"
+  },
+  "streams": [
+    {
+      "index": 0,
+      "codec_name": "h264",
+      "codec_type": "video",
+      "width": 1920,
+      "height": 1080,
+      "r_frame_rate": "24/1",
+      "duration": "120.5"
+    }
+  ]
+}
+```
+
+| Field | Type | Description |
+|-------|------|-------------|
+| `file_uuid` | string | 32-char hex UUID |
+| `file_name` | string | File name |
+| `file_size` | integer | File size in bytes (from filesystem) |
+| `duration` | float | Duration in seconds |
+| `width` | integer | Video width in pixels |
+| `height` | integer | Video height in pixels |
+| `fps` | float | Frames per second |
+| `total_frames` | integer | Estimated total frames |
+| `cached` | boolean | True if result was from cached probe JSON |
+| `format` | object | Container format info (ffprobe format section) |
+| `streams` | array | Array of stream info objects |
+
+---
+
+### `GET /api/v1/progress/:file_uuid`
+
+**Auth**: Required
+**Scope**: file-level
+
+Get real-time processing progress for a file via Redis pub/sub. Includes per-processor status, current/total frames, ETA, and system resource stats.
+
+#### Pipeline Order
+
+| Order | Processor | Dependencies | Description |
+|-------|-----------|-------------|-------------|
+| 1 | `cut` | — | Scene detection |
+| 2 | `asr` | cut | Speech-to-text (per scene) |
+| 3 | `asrx` | asr | Speaker diarization |
+| 4 | `yolo` | — | Object detection |
+| 5 | `ocr` | — | Text recognition |
+| 6 | `face` | — | Face detection & embedding |
+| 7 | `pose` | — | Pose estimation |
+| 8 | `visual_chunk` | yolo | Visual scene chunks |
+| 9 | `story` | asr, asrx, cut, yolo, face | Scene summaries (template) |
+| 10 | `5w1h` | story | 5W1H analysis (Gemma4 LLM) |
+
+All processors except `story` and `5w1h` run concurrently when their dependencies are met. Story and 5W1H run sequentially after their prerequisites.
+
+#### Example
+
+```bash
+curl -s "$API/api/v1/progress/$FILE_UUID" -H "X-API-Key: $KEY" | jq '{overall_progress, processors: [.processors[] | {processor_type, status}]}'
+```
+
+#### Response (200)
+
+```json
+{
+  "file_uuid": "3a6c1865...",
+  "overall_progress": 71,
+  "cpu_percent": 45.2,
+  "gpu_percent": 30.1,
+  "memory_percent": 62.4,
+  "processors": [
+    {"processor_type": "asr", "status": "complete", "progress": 100},
+    {"processor_type": "yolo", "status": "running", "progress": 65},
+    {"processor_type": "face", "status": "pending", "progress": 0}
+  ]
+}
+```
+
+| Field | Type | Description |
+|-------|------|-------------|
+| `file_uuid` | string | 32-char hex UUID |
+| `overall_progress` | integer | Overall progress percentage (0–100) |
+| `processors` | array | Per-processor status list |
+| `processors[].processor_type` | string | Processor name (`asr`, `cut`, `yolo`, etc.) |
+| `processors[].status` | string | `"pending"`, `"running"`, `"complete"`, or `"failed"` |
+| `processors[].progress` | integer | Per-processor progress (0–100) |
+| `processors[].eta_seconds` | integer | Estimated seconds remaining (running processors) |
+| `processors[].current` | integer | Current frame count |
+| `processors[].total` | integer | Total frame count |
+| `cpu_percent` | float | Current CPU usage |
+| `gpu_percent` | float | Current GPU utilization |
+| `memory_percent` | float | Current memory usage |
+
+---
+
+### `GET /api/v1/jobs`
+
+**Auth**: Required
+**Scope**: system-level
+
+List all processing jobs (monitor jobs) in the system. Shows job status, which file each job is processing, and current processor info.
+
+#### Example
+
+```bash
+curl -s "$API/api/v1/jobs" -H "X-API-Key: $KEY" | jq '{count, jobs: [.jobs[] | {uuid, status}]}'
+```
+
+#### Response (200)
+
+```json
+{
+  "jobs": [
+    {
+      "id": 42,
+      "uuid": "3a6c1865...",
+      "status": "running",
+      "current_processor": "yolo",
+      "created_at": "2026-05-16T12:00:00Z",
+      "started_at": "2026-05-16T12:01:00Z"
+    }
+  ],
+  "count": 15,
+  "page": 1,
+  "page_size": 20
+}
+```
+
+| Field | Type | Description |
+|-------|------|-------------|
+| `jobs` | array | Array of job info objects |
+| `jobs[].id` | integer | Job ID |
+| `jobs[].uuid` | string | File UUID being processed |
+| `jobs[].status` | string | `"pending"`, `"running"`, `"completed"`, `"failed"` |
+| `jobs[].current_processor` | string | Currently active processor, or null |
+| `count` | integer | Total job count |
+| `page` | integer | Current page number |
+| `page_size` | integer | Jobs per page |
diff --git a/deliverable_v1.1.0/modules/06_search.md b/deliverable_v1.1.0/modules/06_search.md
new file mode 100644
index 0000000..e5b13c3
--- /dev/null
+++ b/deliverable_v1.1.0/modules/06_search.md
@@ -0,0 +1,145 @@
+<!-- module: search -->
+<!-- description: Vector search, BM25, smart search, universal search, visual search -->
+<!-- depends: 01_auth -->
+
+## Search APIs
+
+### `POST /api/v1/search/smart`
+
+**Auth**: Required
+**Scope**: file-level
+
+Semantic vector search using EmbeddingGemma-300m. Generates a query embedding via EmbeddingGemma (port 11436), then searches pgvector `story_parent` and `llm_parent` chunks by cosine similarity.
+
+#### Request Parameters
+
+| Field | Type | Required | Default | Description |
+|-------|------|----------|---------|-------------|
+| `file_uuid` | string | Yes | — | File UUID to search within |
+| `query` | string | Yes | — | Search text |
+| `limit` | integer | No | 5 | Max results to return |
+| `page` | integer | No | 1 | Page number |
+| `page_size` | integer | No | 5 | Items per page |
+
+#### Example
+
+```bash
+curl -s -X POST "$API/api/v1/search/smart" \
+  -H "Content-Type: application/json" \
+  -H "Authorization: Bearer $JWT" \
+  -d '{"file_uuid": "'"$FILE_UUID"'", "query": "Audrey Hepburn"}'
+```
+
+#### Response (200)
+
+```json
+{
+  "query": "Audrey Hepburn",
+  "results": [
+    {
+      "parent_id": 1087822,
+      "scene_order": 1087822,
+      "start_frame": 104438,
+      "end_frame": 104538,
+      "fps": 24.0,
+      "start_time": 4351.6,
+      "end_time": 4355.76,
+      "summary": "[4352s-4356s, 4s] Cast: Audrey Hepburn. Total: 2 lines, 10 words. Speakers: Audrey Hepburn (2 lines)",
+      "similarity": 0.67
+    }
+  ],
+  "page": 1,
+  "page_size": 5,
+  "strategy": "semantic_vector_search"
+}
+```
+
+---
+
+### `POST /api/v1/search/universal`
+
+**Auth**: Required
+**Scope**: file-level
+
+Multi-type BM25 full-text search across chunks, frames, and persons. Uses PostgreSQL `tsvector`.
+
+#### Request Parameters
+
+| Field | Type | Required | Default | Description |
+|-------|------|----------|---------|-------------|
+| `query` | string | Yes | — | Search text |
+| `file_uuid` | string | No | — | Restrict to specific file |
+| `types` | string[] | No | `["chunk","frame","person"]` | Search types |
+| `limit` | integer | No | 10 | Max results per type |
+| `page` | integer | No | 1 | Page number |
+| `page_size` | integer | No | 20 | Items per page |
+
+#### Example
+
+```bash
+curl -s -X POST "$API/api/v1/search/universal" \
+  -H "Content-Type: application/json" \
+  -H "Authorization: Bearer $JWT" \
+  -d '{"file_uuid": "'"$FILE_UUID"'", "query": "Cary Grant"}'
+```
+
+#### Response (200)
+
+```json
+{
+  "results": [
+    {
+      "type": "chunk",
+      "chunk_id": "bd80fec92b0b6963d177a2c55bf713e2_2",
+      "chunk_type": "story_child",
+      "start_frame": 5103,
+      "end_frame": 5127,
+      "start_time": 212.64,
+      "end_time": 213.64,
+      "text": "[213s-214s] Cary Grant: \"Olá!\"",
+      "score": 0.9
+    }
+  ],
+  "total": 20,
+  "took_ms": 18
+}
+```
+
+---
+
+### `POST /api/v1/search/frames`
+
+**Auth**: Required
+**Scope**: file-level
+
+Search face detection frames by identity name or trace ID.
+
+---
+
+### `POST /api/v1/search/identity_text`
+
+**Auth**: Required
+**Scope**: file-level
+
+Search text chunks spoken by a specific identity.
+
+---
+
+### Visual Search
+
+| Method | Endpoint | Description |
+|--------|----------|-------------|
+| POST | `/api/v1/search/visual` | Search visual chunks |
+| POST | `/api/v1/search/visual/class` | Search by object class |
+| POST | `/api/v1/search/visual/density` | Search by object density |
+| POST | `/api/v1/search/visual/combination` | Search by object combination |
+| POST | `/api/v1/search/visual/stats` | Visual chunk statistics |
+
+#### Embedding Model
+
+| Detail | Value |
+|--------|-------|
+| **Model** | EmbeddingGemma-300m |
+| **Endpoint** | `POST /v1/embeddings` on port 11436 |
+| **Dimension** | 768 |
+| **Storage** | pgvector (`chunk.embedding` column) |
diff --git a/deliverable_v1.1.0/modules/08_identity_agent.md b/deliverable_v1.1.0/modules/08_identity_agent.md
new file mode 100644
index 0000000..f9c86e0
--- /dev/null
+++ b/deliverable_v1.1.0/modules/08_identity_agent.md
@@ -0,0 +1,65 @@
+<!-- module: identity_agent -->
+<!-- description: Identity agent — match from photo, match from trace -->
+<!-- depends: 01_auth, 07_identity -->
+
+## Identity Agent
+
+### `POST /api/v1/agents/identity/match-from-photo`
+
+**Auth**: Required
+**Scope**: file-level
+
+Upload a face photo to match against known identities. Detects face via InsightFace, extracts 512D embedding via CoreML FaceNet, then searches pgvector for the closest identity.
+
+#### Request
+
+`multipart/form-data` with field `image` (JPEG/PNG) and optional `file_uuid`.
+
+#### Example
+
+```bash
+curl -s -X POST "$API/api/v1/agents/identity/match-from-photo" \
+  -H "Authorization: Bearer $JWT" \
+  -F "image=@/path/to/face.jpg" \
+  -F "file_uuid=$FILE_UUID"
+```
+
+#### Response (200)
+
+```json
+{
+  "success": true,
+  "matches": [
+    {
+      "identity_uuid": "a9a90105...",
+      "name": "Cary Grant",
+      "similarity": 0.87
+    }
+  ]
+}
+```
+
+---
+
+### `POST /api/v1/agents/identity/match-from-trace`
+
+**Auth**: Required
+**Scope**: file-level
+
+Match a face trace (tracked face across frames) against known identities. Samples 3 angles from the trace, generates embeddings, and searches pgvector.
+
+#### Request Parameters
+
+| Field | Type | Required | Description |
+|-------|------|----------|-------------|
+| `file_uuid` | string | Yes | File containing the trace |
+| `trace_id` | integer | Yes | Face trace ID to match |
+
+#### Example
+
+```bash
+curl -s -X POST "$API/api/v1/agents/identity/match-from-trace" \
+  -H "Authorization: Bearer $JWT" \
+  -H "Content-Type: application/json" \
+  -d '{"file_uuid": "'"$FILE_UUID"'", "trace_id": 10}'
+```
diff --git a/deliverable_v1.1.0/modules/09_tmdb.md b/deliverable_v1.1.0/modules/09_tmdb.md
new file mode 100644
index 0000000..7ea3f27
--- /dev/null
+++ b/deliverable_v1.1.0/modules/09_tmdb.md
@@ -0,0 +1,109 @@
+<!-- module: tmdb -->
+<!-- description: TMDb enrichment endpoints — prefetch, probe, resource, check -->
+<!-- depends: 01_auth, 03_register -->
+
+## TMDb Enrichment
+
+> **Offline operation**: TMDb prefetch now checks local identity files first (`identities/_index.json` + `*.tmdb.json`).
+> If local files exist, no external API call is made. Internet is only needed for initial data seeding.
+
+### Overview
+
+TMDb enrichment is an optional identity enrichment step that can be run after Pipeline face detection completes. The workflow is:
+
+1. **Prefetch** (requires internet unless local identity files already exist): Download movie cast data from TMDb API → cache to `{file_uuid}.tmdb.json`
+2. **Probe**: Read local cache → create identities for **all** cast members (`source='tmdb'`) + save `identity.json` + download profile image to `{OUTPUT}/identities/{uuid}/profile.jpg`
+3. **Match**: The worker automatically matches video faces against TMDb identities when `MOMENTRY_TMDB_PROBE_ENABLED=true`
+
+### `POST /api/v1/agents/tmdb/prefetch`
+
+**Auth**: Required
+**Scope**: file-level
+
+Fetch TMDb cast data for a registered file and cache it locally. This is the only step requiring internet access.
+
+#### Request Parameters
+
+| Field | Type | Required | Description |
+|-------|------|----------|-------------|
+| `file_uuid` | string | Yes | File UUID to enrich |
+
+#### Example
+
+```bash
+curl -s -X POST "$API/api/v1/agents/tmdb/prefetch" \
+  -H "Content-Type: application/json" \
+  -H "X-API-Key: $KEY" \
+  -d '{"file_uuid": "'"$FILE_UUID"'"}'
+```
+
+#### Response (200)
+
+```json
+{"success": true, "file_uuid": "...", "cache_path": "/output/...tmdb.json"}
+```
+
+### `POST /api/v1/file/:file_uuid/tmdb-probe`
+
+**Auth**: Required
+**Scope**: file-level
+
+Read local TMDb cache and create/update identities. Requires prefetch to have been run first.
+
+#### Example
+
+```bash
+curl -s -X POST "$API/api/v1/file/$FILE_UUID/tmdb-probe" \
+  -H "X-API-Key: $KEY" | jq '{identities_created, movie_title}'
+```
+
+#### Response (200 — identities created)
+
+```json
+{"success": true, "identities_created": 15, "movie_title": "Charade"}
+```
+
+#### Response (200 — no cache)
+
+```json
+{"success": false, "message": "No TMDb cache found. Run tmdb-prefetch first."}
+```
+
+### `GET /api/v1/resource/tmdb`
+
+**Auth**: Required
+**Scope**: system-level
+
+View TMDb resource status including configuration, identity counts, and cache file count.
+
+#### Example
+
+```bash
+curl -s "$API/api/v1/resource/tmdb" -H "X-API-Key: $KEY" \
+  | jq '{identities_seeded, cache_files}'
+```
+
+### `POST /api/v1/resource/tmdb/check`
+
+**Auth**: Required
+**Scope**: system-level
+
+Ping the TMDb API to verify connectivity and measure latency.
+
+#### Example
+
+```bash
+curl -s -X POST "$API/api/v1/resource/tmdb/check" \
+  -H "X-API-Key: $KEY" | jq '{api_reachable, api_latency_ms}'
+```
+
+#### Response
+
+```json
+{
+  "api_key_configured": true,
+  "enabled": false,
+  "api_reachable": true,
+  "api_latency_ms": 120
+}
+```
diff --git a/deliverable_v1.1.0/modules/10_pipeline.md b/deliverable_v1.1.0/modules/10_pipeline.md
new file mode 100644
index 0000000..05c1f4a
--- /dev/null
+++ b/deliverable_v1.1.0/modules/10_pipeline.md
@@ -0,0 +1,178 @@
+<!-- module: pipeline -->
+<!-- description: Pipeline processors, ingestion status, stats endpoints -->
+<!-- depends: 01_auth -->
+
+## Pipeline
+
+### Dependency Graph
+
+```mermaid
+flowchart TB
+    subgraph Processors["10 Processors"]
+        Cut[Cut] --> ASR[ASR]
+        ASR --> ASRX[ASRX]
+        ASRX --> Story[Story]
+        Cut --> Story
+        YOLO[YOLO] --> VisualChunk[VisualChunk]
+        VisualChunk --> Story
+        Face[Face] --> Story
+        Story --> FiveW1H[5W1H]
+        OCR[OCR]
+        Pose[Pose]
+    end
+
+    subgraph Ingestion["入庫 (Post-Processing)"]
+        ASR --> Rule1[Rule 1 Sentence]
+        ASRX --> Rule1
+        Rule1 --> Vectorize[Auto-Vectorize]
+        Rule1 --> Phase1[Phase 1 Pack]
+
+        Cut --> Rule3[Rule 3 Scene]
+        ASR --> Rule3
+
+        Face --> Trace[Face Trace]
+        Trace --> Qdrant[Qdrant Sync]
+        Trace --> TraceChunks[Trace Chunks]
+        Trace --> TKG[TKG Builder]
+
+        Face --> TMDbMatch[TMDb Match]
+        Face --> SceneMeta[Scene Metadata]
+        YOLO --> SceneMeta
+        Face --> IdentityAgent[Identity Agent]
+        ASRX --> IdentityAgent
+
+        Cut --> Agent5W1H[5W1H Agent]
+        ASR --> Agent5W1H
+        Agent5W1H --> Phase2[Phase 2 Pack]
+    end
+
+    style Processors fill:#1a1a2e,stroke:#e94560
+    style Ingestion fill:#16213e,stroke:#0f3460
+```
+
+### Pipeline Completion Flow
+
+The pipeline is **not complete** until both the 10 processors AND the 入庫 (ingestion) steps have finished. The worker polls every 3 seconds and only marks the job as `completed` when all ingestion steps verify OK.
+
+```
+10 processors done
+     ↓  (job status stays "running")
+Algorithm 1 Trigger: Rule 1 + Vectorize + Phase 1 Pack
+     ↓  (job runs in parallel)
+Algorithm 2 Trigger: Face Trace → TKG, Scene Metadata, Identity Agent, 5W1H Agent
+     ↓  (poll checks every 3s)
+Ingestion verification: rule1 ✓ vectorize ✓ rule3 ✓ face_trace ✓ tkg ✓ scene_meta ✓ 5w1h ✓
+     ↓
+job status = "completed"
+```
+
+### 10 Processor Stages
+
+| # | Processor | Depends On | Description |
+|---|-----------|------------|-------------|
+| 1 | `Cut` | — | Scene boundary detection (PySceneDetect) |
+| 2 | `ASR` | Cut | Automatic speech recognition (faster-whisper) |
+| 3 | `ASRX` | ASR | Speaker diarization + ASR refinement |
+| 4 | `YOLO` | — | Object detection (YOLOv8) |
+| 5 | `OCR` | — | Optical character recognition |
+| 6 | `Face` | — | Face detection + recognition (InsightFace + CoreML) |
+| 7 | `Pose` | — | Pose estimation |
+| 8 | `VisualChunk` | YOLO | Visual object chunking |
+| 9 | `Story` | ASRX + Cut + YOLO + Face | Narrative scene summarization (LLM, with embedding) |
+| 10 | `5W1H` | Story | Who/What/When/Where/Why/How extraction (LLM, with embedding) |
+
+### 入庫 (Post-Processing / Ingestion)
+
+These steps run after the 10 processors and are **required for pipeline completion**. The worker checks all of them before marking the job as done.
+
+| # | Step | Triggers When | Verification |
+|---|------|--------------|-------------|
+| 1 | **Rule 1 Sentence Chunking** | ASR + ASRX done | `chunk` table has rows with `chunk_type = 'sentence'` |
+| 2 | **Auto-Vectorize** | Rule 1 done | `chunk.embedding` IS NOT NULL for sentence chunks |
+| 3 | **Phase 1 Pack** | Rule 1 done | `release_pack.py --phase 1` executed |
+| 4 | **Rule 3 Scene Chunking** | All 10 processors done + Cut + ASR | `chunk` table has rows with `chunk_type = 'cut'` |
+| 5 | **Face Trace** | All 10 processors done + Face | `face_detections.trace_id` IS NOT NULL |
+| 6 | **Qdrant Face Sync** | Face Trace done | Qdrant face_embedding collection populated |
+| 7 | **Trace Chunks** | Face Trace done | `chunk` table has rows with `chunk_type = 'trace'` |
+| 8 | **TKG Builder** | Face Trace done | `tkg_nodes` + `tkg_edges` tables have rows |
+| 9 | **TMDb Face Matching** | TMDb enabled + Face done | `face_detections.identity_id` IS NOT NULL |
+| 10 | **Heuristic Scene Metadata** | Face + YOLO done | `{file_uuid}.scene_meta.json` exists on disk |
+| 11 | **Identity Agent** | Face + ASRX done | `identities` with `source = 'identity_agent'` |
+| 12 | **5W1H Agent** | Cut + ASR done | `chunk.summary_text` IS NOT NULL for cut chunks |
+| 13 | **Phase 2 Pack** | 5W1H Agent done | `release_pack.py --phase 2` executed |
+
+### Ingestion Status
+
+Check real-time ingestion status for a file:
+
+```bash
+curl "$API/api/v1/stats/ingestion-status/$FILE_UUID"
+```
+
+Returns per-step `done` / `pending` status with detail counts.
+
+#### Example
+
+```bash
+curl -s "$API/api/v1/stats/ingestion-status/$FILE_UUID" | jq '.steps[] | {name, status, detail}'
+```
+
+#### Response
+
+```json
+{
+  "file_uuid": "bd80fec9c42afb0307eb28f22c64c76a",
+  "steps": [
+    { "name": "rule1_sentence", "status": "pending", "detail": "0 sentence chunks" },
+    { "name": "auto_vectorize",  "status": "pending", "detail": "0 embedded" },
+    { "name": "rule3_scene",     "status": "pending", "detail": "0 scene chunks" },
+    { "name": "face_trace",      "status": "pending", "detail": "0 traces" },
+    { "name": "trace_chunks",    "status": "pending", "detail": "0 trace chunks" },
+    { "name": "tkg",             "status": "pending", "detail": "0 nodes, 0 edges" },
+    { "name": "identity_match",  "status": "pending", "detail": "0 identities" },
+    { "name": "scene_metadata",  "status": "pending", "detail": null },
+    { "name": "5w1h",            "status": "pending", "detail": "0 scenes with 5W1H" }
+  ]
+}
+```
+
+### Stats Endpoints
+
+| Method | Endpoint | Auth | Description |
+|--------|----------|------|-------------|
+| GET | `/api/v1/stats/sftpgo` | No | SFTPGo service status |
+| GET | `/api/v1/stats/ingestion-status/:file_uuid` | No | Per-file ingestion checklist |
+
+### Configuration
+
+### `POST /api/v1/config/cache`
+
+**Auth**: Required
+**Scope**: system-level
+
+Toggle the Redis cache on or off.
+
+#### Request Parameters
+
+| Field | Type | Required | Description |
+|-------|------|----------|-------------|
+| `enabled` | boolean | Yes | `true` to enable, `false` to disable |
+
+#### Example
+
+```bash
+curl -s -X POST "$API/api/v1/config/cache" \
+  -H "Content-Type: application/json" \
+  -H "X-API-Key: $KEY" \
+  -d '{"enabled": false}'
+```
+
+### Unmounted Routes
+
+The following routes are defined in source code but are **NOT** currently mounted in the router:
+
+| Endpoint | Source file |
+|----------|-------------|
+| `/api/v1/search/persons` | `universal_search.rs` (not mounted) |
+| `/api/v1/who` | `who.rs` |
+| `/api/v1/who/candidates` | `who.rs` |
diff --git a/deliverable_v1.1.0/modules/11_error_codes.md b/deliverable_v1.1.0/modules/11_error_codes.md
new file mode 100644
index 0000000..15f2dad
--- /dev/null
+++ b/deliverable_v1.1.0/modules/11_error_codes.md
@@ -0,0 +1,57 @@
+<!-- module: error_codes -->
+<!-- description: Standard API error codes -->
+<!-- depends: -->
+
+## Error Response Format
+
+All API errors follow this JSON structure:
+
+```json
+{
+  "success": false,
+  "error": {
+    "code": "E001_NOT_FOUND",
+    "message": "Resource not found",
+    "details": {"resource": "file_uuid", "value": "abc"}
+  }
+}
+```
+
+## Error Code List
+
+### Generic Errors (E0xx)
+
+| Code | HTTP | Description |
+|------|------|-------------|
+| `E001_NOT_FOUND` | 404 | Resource not found (file, identity, chunk) |
+| `E002_DUPLICATE` | 409 | Resource already exists |
+| `E003_VALIDATION` | 400 | Request parameter validation failed |
+| `E004_UNAUTHORIZED` | 401 | Invalid API key or token |
+| `E005_INTERNAL` | 500 | Internal server error |
+
+### Processor Errors (E1xx)
+
+| Code | HTTP | Description |
+|------|------|-------------|
+| `E101_PROCESSOR_FAIL` | 500 | Python script execution failed |
+| `E102_TIMEOUT` | 504 | Processing timeout |
+| `E103_RESUME_FAIL` | 500 | Resume failed (checkpoint not found) |
+| `E104_NO_VIDEO` | 400 | Video file path not found |
+
+### Identity Errors (E2xx)
+
+| Code | HTTP | Description |
+|------|------|-------------|
+| `E201_FACE_NOT_FOUND` | 404 | Face detection not found |
+| `E202_MERGE_CONFLICT` | 409 | Identity merge conflict |
+| `E203_CANDIDATE_EMPTY` | 404 | No candidates available for confirmation |
+
+### TMDb Errors (E3xx)
+
+| Code | HTTP | Description |
+|------|------|-------------|
+| `E301_TMDB_NO_KEY` | 400 | `TMDB_API_KEY` environment variable not set |
+| `E302_TMDB_UNREACHABLE` | 502 | TMDb API unreachable or timed out |
+| `E303_TMDB_CACHE_NOT_FOUND` | 200 | No local TMDb cache; run prefetch first |
+| `E304_TMDB_PROBE_FAILED` | 500 | TMDb probe execution failed |
+| `E305_TMDB_MOVIE_NOT_FOUND` | 404 | No matching TMDb movie found from filename |
diff --git a/deliverable_v1.1.0/modules/12_agent.md b/deliverable_v1.1.0/modules/12_agent.md
new file mode 100644
index 0000000..e17fbc3
--- /dev/null
+++ b/deliverable_v1.1.0/modules/12_agent.md
@@ -0,0 +1,118 @@
+# Agent Endpoints
+
+Agent endpoints provide AI-powered capabilities including translation, identity analysis, and 5W1H extraction.
+
+## POST /api/v1/agents/translate
+
+Translate text between languages using Gemma4 (llama.cpp, port 8082).
+
+### Request
+
+```json
+{
+  "text": "Hello, welcome to Momentry Core.",
+  "target_language": "Traditional Chinese",
+  "source_language": "English"
+}
+```
+
+| Field | Type | Required | Description |
+|-------|------|----------|-------------|
+| `text` | string | ✅ | Text to translate |
+| `target_language` | string | ✅ | Target language name (e.g. "Traditional Chinese", "Japanese") |
+| `source_language` | string | ❌ | Source language (default: "auto") |
+
+### Response
+
+```json
+{
+  "success": true,
+  "translated_text": "您好，歡迎使用 Momentry Core。",
+  "source_language_detected": "English",
+  "model_used": "google_gemma-4-26B-A4B-it-Q5_K_M.gguf"
+}
+```
+
+### Supported Language Pairs (tested)
+
+| Source | Target | Quality |
+|--------|--------|---------|
+| English | Traditional Chinese | ✅ |
+| English | Japanese | ✅ |
+| Chinese | English | ✅ |
+| English | French | ✅ |
+| Chinese | Japanese | ✅ |
+
+### Model
+
+- **Model**: Gemma4 26B (Q5_K_M)
+- **Engine**: llama.cpp at `localhost:8082`
+- **Endpoint**: `/v1/chat/completions` (OpenAI-compatible)
+- **Temperature**: 0.1
+- **Max tokens**: 1024
+
+### Errors
+
+| Status | Condition |
+|--------|-----------|
+| 500 | LLM unreachable or response parse failure |
+| 401 | Missing/invalid auth |
+
+---
+
+## POST /api/v1/agents/5w1h/analyze
+
+Extract 5W1H (Who, What, When, Where, Why, How) from a scene. Uses Gemma4 LLM on port 8082.
+
+### Request
+
+```json
+{
+  "file_uuid": "3abeee81d94597629ed8cb943f182e94",
+  "scene_id": 42
+}
+```
+
+### Response
+
+```json
+{
+  "success": true,
+  "5w1h": {
+    "who": ["Cary Grant"],
+    "what": ["discussing plans"],
+    "when": ["1963"],
+    "where": ["Paris"],
+    "why": ["vacation"],
+    "how": ["in person"]
+  }
+}
+```
+
+## POST /api/v1/agents/5w1h/batch
+
+Batch analyze all scenes in a file for 5W1H extraction. Uses the pipeline's `parent_chunk_5w1h.py --mode llm`.
+
+### Request
+
+```json
+{
+  "file_uuid": "3abeee81d94597629ed8cb943f182e94"
+}
+```
+
+## GET /api/v1/agents/5w1h/status
+
+Get status of the 5W1H agent pipeline for a file.
+
+---
+
+## Embedding Model
+
+| Detail | Value |
+|--------|-------|
+| **Model** | EmbeddingGemma-300m |
+| **Endpoint** | `POST /v1/embeddings` on port 11436 |
+| **Dimension** | 768 |
+| **Used by** | `parent_chunk_5w1h.py --embed`, story, 5W1H, search |
+
diff --git a/deliverable_v1.1.0/modules/_template.md b/deliverable_v1.1.0/modules/_template.md
new file mode 100644
index 0000000..3a14aff
--- /dev/null
+++ b/deliverable_v1.1.0/modules/_template.md
@@ -0,0 +1,63 @@
+# {Module Name} — API Workspace Module
+
+> Use this template when adding or editing API endpoint documentation modules.
+
+## Module Metadata
+
+Every module MUST start with:
+
+```markdown
+<!-- module: <short_name> -->
+<!-- description: One-line description of what this module covers -->
+<!-- depends: <comma-separated list of dependency module names> -->
+```
+
+## Endpoint Template
+
+Each endpoint MUST use this structure:
+
+### `METHOD /path/to/endpoint`
+
+**Auth**: Required / Optional / Public
+
+**Scope**: file-level / identity-level / system-level
+
+#### Request Parameters
+
+| Field | Type | Required | Default | Description |
+|-------|------|----------|---------|-------------|
+| `param1` | string | Yes | — | Description |
+
+#### Example
+
+```bash
+# brief description of what this example demonstrates
+curl -s -X METHOD "$API/path" \
+  -H "X-API-Key: $KEY" \
+  -H "Content-Type: application/json" \
+  -d '{"param1": "value"}'
+```
+
+#### Response (200)
+
+```json
+{ "success": true }
+```
+
+| Field | Type | Description |
+|-------|------|-------------|
+| `success` | boolean | Always true on 200 |
+
+#### Error Codes
+
+| Code | HTTP | When |
+|------|------|------|
+| E0xx | 4xx | Description |
+
+## Rules
+
+1. Each module file covers ONE topic group (e.g., `09_tmdb.md` = all TMDb endpoints)
+2. Use `$API` and `$KEY` in all curl examples
+3. Use `$FILE_UUID`, `$IDENTITY_UUID` variables for UUID examples
+4. Module filename = `NN_topic.md` (NN = execution order, 01-99)
+5. `depends` metadata = which modules must be assembled before this one
diff --git a/deliverable_v1.1.0/scripts/build_docs.py b/deliverable_v1.1.0/scripts/build_docs.py
new file mode 100644
index 0000000..ad3a3a6
--- /dev/null
+++ b/deliverable_v1.1.0/scripts/build_docs.py
@@ -0,0 +1,225 @@
+#!/opt/homebrew/bin/python3.11
+"""Build HTML documentation from module source files."""
+import os, markdown, re, glob, shutil
+
+MODULES_DIR = os.path.join(os.path.dirname(__file__), "..", "docs_v1.0", "API_WORKSPACE", "modules")  # Markdown module sources (input). NOTE(review): this copy lives in deliverable_v1.1.0/scripts — confirm ../docs_v1.0 exists there
+DOC_DIR = os.path.join(os.path.dirname(__file__), "..", "docs_v1.0", "doc")  # user-facing HTML (output, wiped by main())
+DOC_DEV_DIR = os.path.join(os.path.dirname(__file__), "..", "docs_v1.0", "doc_developer")  # developer-only HTML (output, wiped by main())
+
+# Stems of the modules published to DOC_DIR; main() writes every other module (except _template) to DOC_DEV_DIR.
+USER_MODULES = {
+    "01_auth", "02_health", "03_register", "04_lookup", "05_process",
+    "06_search", "07_identity", "08_identity_agent", "08_media",
+    "09_tmdb", "10_pipeline", "12_agent",
+}
+
+
+def md_to_html(md_text: str) -> str:
+    """Convert Markdown to HTML."""
+    html = markdown.markdown(md_text, extensions=['fenced_code', 'tables', 'codehilite'])
+    # Wrap tables
+    html = re.sub(r'<table>', '<table class="table">', html)
+    return html
+
+def build_index(files, dev=False):
+    """Build index.html."""
+    links = []
+    for fname in sorted(files):
+        name = os.path.splitext(fname)[0]
+        label = MODULE_LABELS.get(name, name.replace("_", " ").title())
+        if "｜" in label:
+            cn, en = label.split("｜", 1)
+        else:
+            cn, en = label, ""
+        html_name = fname.replace(".md", ".html")
+        links.append(f'<tr onclick="window.location=\'{html_name}\'" style="cursor:pointer"><td class="cn">{cn}</td><td class="en">{en}</td></tr>')
+    
+    title = "Momentry API 開發者文件" if dev else "Momentry API 文件"
+    subtitle = "開發者專用" if dev else "API 參考手冊 — 登入後可瀏覽各模組文件"
+    
+    return f"""<!DOCTYPE html>
+<html lang="zh-TW">
+<head>
+<meta charset="UTF-8">
+<title>{title}</title>
+<style>
+* {{ margin: 0; padding: 0; box-sizing: border-box; }}
+body {{ font-family: -apple-system, BlinkMacSystemFont, 'Segoe UI', Roboto, sans-serif; background: #f5f5f5; color: #333; padding: 40px; }}
+.container {{ max-width: 900px; margin: 0 auto; background: white; border-radius: 12px; box-shadow: 0 2px 12px rgba(0,0,0,0.08); padding: 40px; }}
+h1 {{ font-size: 28px; margin-bottom: 8px; }}
+p.subtitle {{ color: #666; margin-bottom: 24px; }}
+table {{ width: 100%; border-collapse: collapse; }}
+tr {{ border-bottom: 1px solid #eee; }}
+tr:last-child {{ border: none; }}
+td {{ padding: 10px 0; }}
+td.cn {{ width: 140px; font-weight: 600; color: #333; }}
+td.en {{ color: #666; font-size: 14px; }}
+a {{ color: #0066cc; text-decoration: none; display: block; }}
+a:hover td {{ background: #f8f8f8; border-radius: 4px; }}
+</style>
+</head>
+<body>
+<div class="container">
+<h1>{title}</h1>
+<p class="subtitle">{subtitle}</p>
+<table>{"".join(links)}</table>
+</div>
+</body>
+</html>"""
+
+MODULE_LABELS = {  # module stem -> "Chinese｜English" label; build_index() splits on "｜" to fill the two index columns
+    "01_auth": "安全認證｜Authentication",
+    "02_health": "健康檢查｜Health",
+    "03_register": "檔案註冊｜File Registration",
+    "04_lookup": "檔案屬性查詢｜File Lookup",
+    "05_process": "處理流程｜Processing",
+    "06_search": "搜尋功能｜Search",
+    "07_identity": "身份識別｜Identity",
+    "08_identity_agent": "智能身份綁定｜Smart Identity Binding",
+    "08_media": "串流與截圖｜Streaming & Thumbnails",
+    "09_tmdb": "TMDb 整合｜TMDb Integration",
+    "10_pipeline": "生產線｜Pipeline",
+    "11_error_codes": "錯誤碼｜Error Codes",
+    "12_agent": "智慧代理｜AI Agents",
+}
+
+def build_html(md_text: str, title: str) -> str:
+    """Wrap MD content in HTML page."""
+    content = md_to_html(md_text)
+    return f"""<!DOCTYPE html>
+<html lang="en">
+<head>
+<meta charset="UTF-8">
+<title>{title} - Momentry API Docs</title>
+<style>
+* {{ margin: 0; padding: 0; box-sizing: border-box; }}
+body {{ font-family: -apple-system, BlinkMacSystemFont, 'Segoe UI', Roboto, sans-serif; background: #f5f5f5; color: #333; padding: 40px; }}
+.container {{ max-width: 960px; margin: 0 auto; background: white; border-radius: 12px; box-shadow: 0 2px 12px rgba(0,0,0,0.08); padding: 40px; }}
+h1 {{ font-size: 24px; margin: 24px 0 12px; }}
+h2 {{ font-size: 20px; margin: 20px 0 10px; color: #222; }}
+h3 {{ font-size: 16px; margin: 16px 0 8px; color: #444; }}
+p {{ line-height: 1.6; margin: 8px 0; }}
+table {{ border-collapse: collapse; width: 100%; margin: 12px 0; font-size: 14px; }}
+th, td {{ border: 1px solid #ddd; padding: 8px 12px; text-align: left; }}
+th {{ background: #f0f0f0; font-weight: 600; }}
+code {{ background: #f0f0f0; padding: 2px 6px; border-radius: 3px; font-size: 13px; }}
+pre {{ background: #f8f8f8; border: 1px solid #ddd; border-radius: 6px; padding: 12px; overflow-x: auto; margin: 12px 0; }}
+pre code {{ background: none; padding: 0; }}
+a {{ color: #0066cc; }}
+.back {{ display: inline-block; margin-bottom: 20px; color: #666; }}
+.back:hover {{ color: #333; }}
+</style>
+</head>
+<body>
+<div class="container">
+<a class="back" href="index.html">&larr; Back to index</a>
+{content}
+</div>
+</body>
+</html>"""
+
+def login_page() -> str:  # Static login page: POSTs username/password as JSON to /api/v1/auth/login and redirects to /doc/index.html on success. NOTE(review): the form ships pre-filled with demo/demo and the redirect is the same for the doc_developer copy — confirm both are intended
+    return """<!DOCTYPE html>
+<html lang="en">
+<head>
+<meta charset="UTF-8">
+<title>Login - Momentry Docs</title>
+<style>
+* { margin: 0; padding: 0; box-sizing: border-box; }
+body { font-family: -apple-system, BlinkMacSystemFont, 'Segoe UI', Roboto, sans-serif; background: #f5f5f5; display: flex; justify-content: center; align-items: center; height: 100vh; }
+.card { background: white; border-radius: 12px; box-shadow: 0 2px 12px rgba(0,0,0,0.08); padding: 40px; width: 360px; }
+h1 { font-size: 24px; margin-bottom: 24px; text-align: center; }
+input { width: 100%; padding: 10px 12px; margin-bottom: 12px; border: 1px solid #ddd; border-radius: 6px; font-size: 14px; }
+button { width: 100%; padding: 10px; background: #0066cc; color: white; border: none; border-radius: 6px; font-size: 16px; cursor: pointer; }
+button:hover { background: #0052a3; }
+.error { color: #cc0000; font-size: 13px; margin-bottom: 12px; display: none; }
+</style>
+</head>
+<body>
+<div class="card">
+<h1>Momentry Docs</h1>
+<form id="loginForm">
+<input type="text" id="username" placeholder="Username" value="demo" required>
+<input type="password" id="password" placeholder="Password" value="demo" required>
+<div class="error" id="error">Invalid credentials</div>
+<button type="submit">Login</button>
+</form>
+</div>
+<script>
+document.getElementById('loginForm').onsubmit = async function(e) {
+    e.preventDefault();
+    const resp = await fetch('/api/v1/auth/login', {
+        method: 'POST',
+        headers: {'Content-Type': 'application/json'},
+        body: JSON.stringify({
+            username: document.getElementById('username').value,
+            password: document.getElementById('password').value
+        })
+    });
+    if (resp.ok) {
+        window.location.href = '/doc/index.html';
+    } else {
+        document.getElementById('error').style.display = 'block';
+    }
+};
+</script>
+</body>
+</html>"""
+
+def main():
+    # Clean and recreate doc dirs
+    for d in [DOC_DIR, DOC_DEV_DIR]:
+        if os.path.exists(d):
+            shutil.rmtree(d)
+        os.makedirs(d)
+    
+    md_files = sorted(glob.glob(os.path.join(MODULES_DIR, "*.md")))
+    if not md_files:
+        print(f"No MD files found in {MODULES_DIR}")
+        return
+    
+    user_html = []
+    dev_html = []
+    for md_path in md_files:
+        with open(md_path) as f:
+            md_text = f.read()
+        fname = os.path.basename(md_path)
+        stem = os.path.splitext(fname)[0]
+        
+        # Skip template
+        if stem == "_template":
+            continue
+            
+        # Skip error codes (developer-only)
+        if stem == "11_error_codes":
+            dev_only = True
+        else:
+            dev_only = stem not in USER_MODULES
+        
+        title = stem.replace("_", " ").title()
+        html = build_html(md_text, title)
+        
+        if dev_only:
+            out_path = os.path.join(DOC_DEV_DIR, fname.replace(".md", ".html"))
+            with open(out_path, "w") as f:
+                f.write(html)
+            dev_html.append(fname)
+            print(f"  [dev] {fname}")
+        else:
+            out_path = os.path.join(DOC_DIR, fname.replace(".md", ".html"))
+            with open(out_path, "w") as f:
+                f.write(html)
+            user_html.append(fname)
+            print(f"  [doc] {fname}")
+    
+    # Build indexes + login page
+    for d, files, label in [(DOC_DIR, user_html, "User"), (DOC_DEV_DIR, dev_html, "Dev")]:
+        index = build_index(files)
+        with open(os.path.join(d, "index.html"), "w") as f:
+            f.write(index)
+        with open(os.path.join(d, "login.html"), "w") as f:
+            f.write(login_page())
+        print(f"  {label}: {len(files)} pages -> {d}")
+
+if __name__ == "__main__":
+    main()
diff --git a/deliverable_v1.1.0/scripts/sync_dev_to_public.sh b/deliverable_v1.1.0/scripts/sync_dev_to_public.sh
new file mode 100755
index 0000000..16ebb14
--- /dev/null
+++ b/deliverable_v1.1.0/scripts/sync_dev_to_public.sh
@@ -0,0 +1,148 @@
+#!/bin/bash
+# sync_dev_to_public.sh — compare the dev/public schemas and sync pipeline data
+# Usage: ./sync_dev_to_public.sh [check|sync] <file_uuid>
+# Env: MOMENTRY_DB_SCHEMA (source schema, default dev), DATABASE_URL, PSQL (psql binary)
+PSQL="${PSQL:-/opt/homebrew/opt/libpq/bin/psql}"
+
+set -euo pipefail
+
+SCHEMA="${MOMENTRY_DB_SCHEMA:-dev}"
+DB_URL="${DATABASE_URL:-postgres://accusys@localhost:5432/momentry}"
+MODE="${1:-check}"
+FILE_UUID="${2:-}"
+
+TABLES=("videos" "chunk" "face_detections" "processor_results" "monitor_jobs"
+        "identities" "identity_bindings" "tkg_nodes" "tkg_edges")
+
+TARGET="public"
+# FILE_UUID is spliced into SQL text below, so accept only hex digits and dashes.
+if [[ ! "$FILE_UUID" =~ ^[0-9A-Fa-f-]+$ || ! "$MODE" =~ ^(check|sync)$ ]]; then
+    echo "Usage: $0 [check|sync] <file_uuid>"
+    echo ""
+    echo "Examples:"
+    echo "  $0 check bd80fec92b0b6963d177a2c55bf713e2"
+    echo "  $0 sync  bd80fec92b0b6963d177a2c55bf713e2"
+    exit 1
+fi
+
+echo "=== Schema Sync: $SCHEMA → $TARGET ==="
+echo "File UUID: $FILE_UUID"
+echo "Mode: $MODE"
+echo ""
+
+# check_table TABLE COL — compare row counts for FILE_UUID in $SCHEMA and $TARGET.
+# Prints one status line; returns 0 when the counts match, 1 on mismatch or query error.
+check_table() {
+    local table=$1 col=$2 dev_count pub_count
+
+    # A failing psql is mapped to the sentinel "ERROR" so `set -e` does not abort the script.
+    dev_count=$($PSQL -At "$DB_URL" -c "SELECT COUNT(*) FROM ${SCHEMA}.${table} WHERE ${col} = '${FILE_UUID}';" 2>/dev/null || echo "ERROR")
+    pub_count=$($PSQL -At "$DB_URL" -c "SELECT COUNT(*) FROM ${TARGET}.${table} WHERE ${col} = '${FILE_UUID}';" 2>/dev/null || echo "ERROR")
+
+    if [ "$dev_count" = "ERROR" ] || [ "$pub_count" = "ERROR" ]; then
+        echo "  ⚠️  $table — query error (table may not exist in $TARGET)"
+        return 1
+    fi
+
+    if [ "$dev_count" -eq "$pub_count" ]; then
+        echo "  ✅ $table — $dev_count rows (match)"
+        return 0
+    fi
+    echo "  ❌ $table — dev=$dev_count  pub=$pub_count (MISMATCH)"
+    return 1
+}
+
+# sync_table TABLE COL — replace the $TARGET rows for FILE_UUID with the $SCHEMA rows.
+# Always returns 0; the outcome is reported on stdout so the caller can continue.
+sync_table() {
+    local table=$1 col=$2 dev_count pub_count cols
+
+    # A failed count is reported as such instead of being mistaken for "0 rows".
+    dev_count=$($PSQL -At "$DB_URL" -c "SELECT COUNT(*) FROM ${SCHEMA}.${table} WHERE ${col} = '${FILE_UUID}';" 2>/dev/null || echo "ERROR")
+    pub_count=$($PSQL -At "$DB_URL" -c "SELECT COUNT(*) FROM ${TARGET}.${table} WHERE ${col} = '${FILE_UUID}';" 2>/dev/null || echo "ERROR")
+    if [ "$dev_count" = "ERROR" ] || [ "$pub_count" = "ERROR" ]; then
+        echo "  ❌ $table — count query failed, skipping"
+        return 0
+    fi
+
+    if [ "$dev_count" = "0" ]; then
+        echo "  ⏭️  $table — dev has 0 rows, skipping"
+        return 0
+    fi
+
+    if [ "$dev_count" -eq "$pub_count" ]; then
+        echo "  ✅ $table — already synced ($dev_count rows)"
+        return 0
+    fi
+
+    echo "  🔄 Syncing $table: dev=$dev_count → pub=$pub_count ..."
+
+    # Column list shared by INSERT and SELECT (id is excluded because it is a SERIAL column).
+    cols=$($PSQL -At "$DB_URL" -c "
+        SELECT string_agg(column_name, ', ' ORDER BY ordinal_position)
+        FROM information_schema.columns
+        WHERE table_schema='${SCHEMA}' AND table_name='${table}'
+          AND column_name != 'id'
+          AND is_updatable='YES';
+    " 2>/dev/null || true)
+    # DELETE and INSERT share one transaction, so a failed INSERT rolls the DELETE back.
+    $PSQL "$DB_URL" -q -v ON_ERROR_STOP=1 --single-transaction -c "
+        DELETE FROM ${TARGET}.${table} WHERE ${col} = '${FILE_UUID}';
+        INSERT INTO ${TARGET}.${table} (${cols}) SELECT ${cols} FROM ${SCHEMA}.${table} WHERE ${col} = '${FILE_UUID}';
+    " 2>/dev/null && echo "  ✅ $table synced" || echo "  ❌ $table sync FAILED"
+}
+
+echo "=== Checking Tables ==="
+echo ""
+# MISMATCH counts the tables whose check failed, i.e. the row counts differ
+# or one of the count queries could not be run.
+MISMATCH=0
+for table in "${TABLES[@]}"; do
+    # Select the column that is compared against FILE_UUID for this table.
+    # NOTE(review): identities / identity_bindings are filtered on `uuid`; confirm
+    # that column holds the file UUID and not the identity's own UUID.
+    case "$table" in
+        monitor_jobs | identities | identity_bindings)
+            col="uuid"
+            ;;
+        *)
+            col="file_uuid"
+            ;;
+    esac
+
+    check_table "$table" "$col" || MISMATCH=$((MISMATCH + 1))
+done
+
+echo ""
+# Nothing left to do when every table already matches.
+if [ "$MISMATCH" -eq 0 ]; then
+    echo "✅ All tables in sync"
+    exit 0
+fi
+
+# Any mode other than "sync" only reports the mismatches and stops here.
+if [ "$MODE" != "sync" ]; then
+    echo "⚠️  $MISMATCH table(s) have mismatches. Run '$0 sync $FILE_UUID' to fix."
+    exit 1
+fi
+
+echo "=== Syncing Tables ==="
+echo ""
+# FAILED counts the tables that still differ after their sync attempt.
+FAILED=0
+for table in "${TABLES[@]}"; do
+    case "$table" in
+        monitor_jobs | identities | identity_bindings) col="uuid" ;;
+        *) col="file_uuid" ;;
+    esac
+    sync_table "$table" "$col"
+    # sync_table reports on stdout only, so re-run the count comparison to verify.
+    check_table "$table" "$col" >/dev/null || FAILED=$((FAILED + 1))
+done
+
+echo ""
+if [ "$FAILED" -ne 0 ]; then
+    echo "❌ Sync finished with $FAILED table(s) still mismatched"
+    exit 1
+fi
+echo "✅ Sync complete"
diff --git a/deliverable_v1.1.0/scripts/update_qdrant_uuid.py b/deliverable_v1.1.0/scripts/update_qdrant_uuid.py
new file mode 100644
index 0000000..0e72de7
--- /dev/null
+++ b/deliverable_v1.1.0/scripts/update_qdrant_uuid.py
@@ -0,0 +1,174 @@
+#!/usr/bin/env python3
+"""Bulk-update the file_uuid stored in Qdrant collections (old → new)."""
+
+import json
+import subprocess
+import sys
+
+QDRANT_URL = "http://localhost:6333"
+
+# UUID mapping: old → new (each old UUID maps to a list of replacement UUIDs)
+UUID_MAP = {
+    "aeed71342a899fe4b4c57b7d41bcb692": [
+        "bd80fec92b0b6963d177a2c55bf713e2",
+    ],
+}
+
+# Collections to process; ones that do not exist are skipped by main()
+COLLECTIONS = [
+    "momentry_dev_v1",
+    "momentry_dev_stories",
+    "momentry_dev_voice",
+    "momentry_dev_rule1_v2",
+    "momentry_dev_faces",
+    "sentence_story",
+    "sentence_summary",
+]
+
+
+def qdrant_get(path: str) -> dict:
+    """GET `path` from Qdrant via curl and return the decoded JSON body ({} if blank)."""
+    cmd = ["curl", "-s", "-X", "GET", f"{QDRANT_URL}{path}"]
+    raw = subprocess.run(cmd, capture_output=True, text=True).stdout
+    # Blank output (for example when curl could not connect) becomes an empty dict.
+    return json.loads(raw) if raw.strip() else {}
+
+
+def qdrant_post(path: str, body: dict) -> dict:
+    """POST `body` as JSON to Qdrant via curl and return the decoded reply ({} if blank)."""
+    # The payload is piped through stdin (`-d @-`) rather than a fixed /tmp file,
+    # which concurrent runs or a pre-planted symlink could clobber.
+    res = subprocess.run(
+        ["curl", "-s", "-X", "POST", f"{QDRANT_URL}{path}",
+         "-H", "Content-Type: application/json", "-d", "@-"],
+        input=json.dumps(body), capture_output=True, text=True
+    )
+    return json.loads(res.stdout) if res.stdout.strip() else {}
+
+
+def qdrant_put(path: str, body: dict) -> dict:
+    """PUT `body` as JSON to Qdrant via curl and return the decoded reply ({} if blank)."""
+    # The payload is piped through stdin (`-d @-`) rather than a fixed /tmp file,
+    # which concurrent runs or a pre-planted symlink could clobber.
+    res = subprocess.run(
+        ["curl", "-s", "-X", "PUT", f"{QDRANT_URL}{path}",
+         "-H", "Content-Type: application/json", "-d", "@-"],
+        input=json.dumps(body), capture_output=True, text=True
+    )
+    return json.loads(res.stdout) if res.stdout.strip() else {}
+
+
+def scroll_all(collection: str, filter_old: dict) -> list:
+    """Scroll all matching points from a collection.
+
+    Pages through the scroll endpoint 1000 points at a time and returns the
+    accumulated list; each point is requested with its payload and vector.
+    """
+    points = []
+    body = {"limit": 1000, "with_payload": True, "with_vector": True, "filter": filter_old}
+    while True:
+        result = qdrant_post(f"/collections/{collection}/points/scroll", body)
+        page = result.get("result") or {}
+        if result and not page:
+            # A reply without a result is an error; don't mistake it for "no points".
+            print(f"    Scroll error in {collection}: {result}")
+        points.extend(page.get("points", []))
+        next_offset = page.get("next_page_offset")
+        # Test against None, not truthiness, so a falsy offset such as 0 is still followed.
+        if next_offset is None:
+            break
+        body["offset"] = next_offset
+    return points
+
+
+def update_points(collection: str, points: list, old_uuid: str, new_uuid: str):
+    """Replace old_uuid with new_uuid in the payloads of `points` and upsert them.
+
+    The `uuid` and `file_uuid` payload keys are both checked. Each changed point
+    is written back with its id, vector and payload, 500 points per request.
+
+    Returns the number of points written: 0 when nothing had to change, or the
+    start index of the failing batch when Qdrant answers with a non-"ok" status.
+    """
+    if not points:
+        return 0
+
+    batch_size = 500
+    rewritten = []
+    # Keep only the points whose payload actually references old_uuid.
+    for point in points:
+        payload = point.get("payload", {})
+        stale_keys = [k for k in ("uuid", "file_uuid") if payload.get(k) == old_uuid]
+        if not stale_keys:
+            continue
+        for key in stale_keys:
+            payload[key] = new_uuid
+        rewritten.append({
+            "id": point["id"],
+            "vector": point["vector"],
+            "payload": payload,
+        })
+
+    # An empty list skips the loop entirely, so the function returns 0.
+    for start in range(0, len(rewritten), batch_size):
+        result = qdrant_put(
+            f"/collections/{collection}/points?wait=true",
+            {"points": rewritten[start:start + batch_size]}
+        )
+        if result.get("status") != "ok":
+            print(f"    Error at {start}: {result}")
+            return start
+    return len(rewritten)
+
+
+def _uuid_filter(uuid: str) -> dict:
+    """Build the Qdrant filter matching points whose `uuid` or `file_uuid` payload equals `uuid`."""
+    return {
+        "must": [
+            {"should": [
+                {"key": "uuid", "match": {"value": uuid}},
+                {"key": "file_uuid", "match": {"value": uuid}},
+            ]}
+        ]
+    }
+
+
+def main():
+    """Apply UUID_MAP to every collection in COLLECTIONS that exists, then verify.
+
+    Verification prints, per collection, how many points carry each old or new UUID.
+    """
+    existing = []
+    for collection in COLLECTIONS:
+        # A reply without "result" is treated as "collection not available"; skip it.
+        if "result" not in qdrant_get(f"/collections/{collection}"):
+            continue
+        existing.append(collection)
+
+        for old_uuid, new_uuids in UUID_MAP.items():
+            for new_uuid in new_uuids:
+                points = scroll_all(collection, _uuid_filter(old_uuid))
+                if not points:
+                    continue
+                print(f"{collection}: {len(points)} points with UUID {old_uuid[:8]}...")
+                updated = update_points(collection, points, old_uuid, new_uuid)
+                print(f"  → {updated} points updated to {new_uuid[:8]}...")
+
+    # Verify
+    print("\n=== Verification ===")
+    for collection in existing:
+        for old_uuid, new_uuids in UUID_MAP.items():
+            # Check every mapped target; this also tolerates an empty target list.
+            for what, uuid in [("old", old_uuid)] + [("new", u) for u in new_uuids]:
+                result = qdrant_post(
+                    f"/collections/{collection}/points/count",
+                    {"filter": _uuid_filter(uuid)}
+                )
+                cnt = (result.get("result") or {}).get("count", 0)
+                if cnt > 0:
+                    print(f"  {collection}: {cnt} points with {what} UUID")
+    print("✅ Done")
+
+
+if __name__ == "__main__":
+    main()
diff --git a/docs/3002_3003_SEPARATION_STATUS.md b/docs/3002_3003_SEPARATION_STATUS.md
new file mode 100644
index 0000000..ad5a08c
--- /dev/null
+++ b/docs/3002_3003_SEPARATION_STATUS.md
@@ -0,0 +1,70 @@
+# 3002/3003 Schema Separation Status
+
+Date: 2026-05-17
+Status: ✅ Pipeline tables created in `public`; schema incompatibilities remain
+
+## Summary
+
+| Schema | Has pipeline tables | Has auth tables | Used by |
+|--------|-------------------|-----------------|---------|
+| `public` | ✅ (newly created) | ✅ (original) | 3002 (production) — currently using `dev` as workaround |
+| `dev` | ✅ (full, working) | ✅ (synced) | 3003 (playground) |
+
+## What Was Done
+
+### Pipeline tables created in `public` schema (11 tables)
+- `videos`, `chunk`, `chunk_vectors`, `cuts`, `frames`
+- `monitor_jobs`, `processor_results`, `processor_versions`
+- `parent_chunks`, `tkg_edges`, `tkg_nodes`
+
+All include proper sequences, indexes, and constraints matching the `dev` schema.
+
+## Remaining Blockers
+
+### Schema incompatibilities between `dev` and `public`
+
+| Table | dev cols | public cols | Status |
+|-------|---------|------------|--------|
+| identities | 17 | 16 | ⚠️ Different columns (e.g. `name` vs `real_name`/`actor_name`) |
+| face_detections | 16 | 17 | ⚠️ Column count mismatch |
+| identity_bindings | 7 | 8 | ⚠️ Column count mismatch |
+| person_identities | 16 | 15 | ⚠️ Column count mismatch |
+| pre_chunks | 19 | 10 | ⚠️ Significantly different |
+| api_keys | 19 | 19 | ✅ Match |
+| resources | 9 | 9 | ✅ Match |
+| users | 8 | 8 | ✅ Match |
+
+### Identities table key differences
+- `public.identities` uses `real_name` + `actor_name` (old schema)
+- `dev.identities` uses `name` (new unified schema)
+- `dev.identities` has `tmdb_poster`, `file_uuid`, `face_embedding`, `voice_embedding`, `identity_embedding`
+- `public.identities` only has `face_embedding`, `voice_embedding` (no `identity_embedding`)
+
+## Options
+
+### Option A: Full data migration (recommended for later)
+1. Dump data from old public tables
+2. Drop old public tables
+3. Recreate from dev schema DDL
+4. Migrate data with column mapping
+5. Switch 3002 to `DATABASE_SCHEMA=public`
+
+### Option B: Keep current workaround (simplest for now)
+- 3002 continues with `DATABASE_SCHEMA=dev`
+- 3003 uses `DATABASE_SCHEMA=dev`
+- Both share the same schema, but have separate Redis key prefixes + ports
+
+### Option C: Rename dev → public (requires downtime)
+1. Stop all services
+2. Rename `dev` to a temporary name (e.g. `dev_new`)
+3. Rename `public` to `public_old`
+4. Rename the temporary schema (`dev_new`) to `public`
+5. Update references
+
+## Current Status
+
+✅ Pipeline tables exist in both schemas
+✅ auth tables (users, sessions, jwt_blacklist) exist in both
+✅ Redis key prefixes separate (`momentry:` vs `momentry_dev:`)
+⚠️ 3002 still uses `DATABASE_SCHEMA=dev` workaround
+⛔ Shared tables need migration before 3002 can use `public` schema
diff --git a/docs_v1.0/API_WORKSPACE/.gitignore b/docs_v1.0/API_WORKSPACE/.gitignore
new file mode 100644
index 0000000..6bf8a98
--- /dev/null
+++ b/docs_v1.0/API_WORKSPACE/.gitignore
@@ -0,0 +1,2 @@
+_build/
+.DS_Store
diff --git a/docs_v1.0/API_WORKSPACE/README.md b/docs_v1.0/API_WORKSPACE/README.md
new file mode 100644
index 0000000..39a98c2
--- /dev/null
+++ b/docs_v1.0/API_WORKSPACE/README.md
@@ -0,0 +1,60 @@
+# API Workspace
+
+## Purpose
+
+This directory is the **single source of truth** for all API documentation modules.
+Generated outputs go to `../GUIDES/` as assembled deliverable documents.
+
+## Workflow
+
+```bash
+# 1. Edit a module
+vim modules/09_tmdb.md
+
+# 2. Preview the generated output
+make _build/API_ENDPOINTS.md
+
+# 3. Check diff against current GUIDES/ content
+make check
+
+# 4. Deploy to GUIDES/
+make deploy
+
+# 5. Regenerate all
+make all
+```
+
+## Directory Structure
+
+```
+API_WORKSPACE/
+├── modules/         ← 11 module files (01_auth ... 11_error_codes)
+├── configs/         ← 7 assembly recipes (.toml)
+├── narratives/      ← narrative intros for specific output files
+├── _build/          ← generated output (gitignored)
+├── Makefile         ← build targets
+├── assemble_docs.sh ← assembly engine
+└── README.md
+```
+
+## Available `make` Targets
+
+| Target | Output |
+|--------|--------|
+| `make reference` | `_build/API_REFERENCE.md` |
+| `make endpoints` | `_build/API_ENDPOINTS.md` |
+| `make quickref` | `_build/API_QUICK_REFERENCE.md` |
+| `make errors` | `_build/API_ERROR_CODES.md` |
+| `make index` | `_build/API_INDEX.md` |
+| `make marcom` | `_build/API_TRAINING_MARCOM.md` |
+| `make tmdb` | `_build/TMDb_User_Guide.md` |
+| `make all` | All of the above |
+| `make deploy` | Copy `_build/*` → `../GUIDES/` |
+| `make check` | `diff` against existing `../GUIDES/` files |
+
+## Adding a New Endpoint
+
+1. Add the endpoint to the appropriate module (e.g., `modules/XX_files.md`)
+2. Follow the template in `modules/_template.md`
+3. `make all && make check`
+4. `make deploy`
diff --git a/docs_v1.0/API_WORKSPACE/modules/06_search.md b/docs_v1.0/API_WORKSPACE/modules/06_search.md
index 0fad9df..3d2d83a 100644
--- a/docs_v1.0/API_WORKSPACE/modules/06_search.md
+++ b/docs_v1.0/API_WORKSPACE/modules/06_search.md
@@ -7,7 +7,7 @@
 ### `POST /api/v1/search/smart`
 
 **Auth**: Required
-**Scope**: file-level
+**Scope**: global / file-level
 
 Semantic vector search using EmbeddingGemma-300m. Generates a query embedding via EmbeddingGemma (port 11436), then searches pgvector `story_parent` and `llm_parent` chunks by cosine similarity.
 
@@ -15,13 +15,22 @@ Semantic vector search using EmbeddingGemma-300m. Generates a query embedding vi
 
 | Field | Type | Required | Default | Description |
 |-------|------|----------|---------|-------------|
-| `file_uuid` | string | Yes | — | File UUID to search within |
 | `query` | string | Yes | — | Search text |
+| `file_uuid` | string | No | — | File UUID to search within. If omitted, searches all files (global search) |
 | `limit` | integer | No | 5 | Max results to return |
 | `page` | integer | No | 1 | Page number |
 | `page_size` | integer | No | 5 | Items per page |
 
-#### Example
+#### Example (Global Search)
+
+```bash
+curl -s -X POST "$API/api/v1/search/smart" \
+  -H "Content-Type: application/json" \
+  -H "Authorization: Bearer $JWT" \
+  -d '{"query": "Audrey Hepburn"}'
+```
+
+#### Example (File-specific Search)
 
 ```bash
 curl -s -X POST "$API/api/v1/search/smart" \
@@ -37,6 +46,7 @@ curl -s -X POST "$API/api/v1/search/smart" \
   "query": "Audrey Hepburn",
   "results": [
     {
+      "file_uuid": "a6fb22eebefaef17e62af874997c5944",
       "parent_id": 1087822,
       "scene_order": 1087822,
       "start_frame": 104438,
@@ -54,12 +64,16 @@ curl -s -X POST "$API/api/v1/search/smart" \
 }
 ```
 
+| Field | Type | Description |
+|-------|------|-------------|
+| `results[].file_uuid` | string | File UUID where result was found |
+
 ---
 
 ### `POST /api/v1/search/universal`
 
 **Auth**: Required
-**Scope**: file-level
+**Scope**: global / file-level
 
 Multi-type BM25 full-text search across chunks, frames, and persons. Uses PostgreSQL `tsvector`.
 
@@ -68,13 +82,22 @@ Multi-type BM25 full-text search across chunks, frames, and persons. Uses Postgr
 | Field | Type | Required | Default | Description |
 |-------|------|----------|---------|-------------|
 | `query` | string | Yes | — | Search text |
-| `file_uuid` | string | No | — | Restrict to specific file |
+| `file_uuid` | string | No | — | Restrict to specific file. If omitted, searches all files (global search) |
 | `types` | string[] | No | `["chunk","frame","person"]` | Search types |
 | `limit` | integer | No | 10 | Max results per type |
 | `page` | integer | No | 1 | Page number |
 | `page_size` | integer | No | 20 | Items per page |
 
-#### Example
+#### Example (Global Search)
+
+```bash
+curl -s -X POST "$API/api/v1/search/universal" \
+  -H "Content-Type: application/json" \
+  -H "Authorization: Bearer $JWT" \
+  -d '{"query": "Cary Grant"}'
+```
+
+#### Example (File-specific Search)
 
 ```bash
 curl -s -X POST "$API/api/v1/search/universal" \
@@ -90,6 +113,7 @@ curl -s -X POST "$API/api/v1/search/universal" \
   "results": [
     {
       "type": "chunk",
+      "file_uuid": "bd80fec92b0b6963d177a2c55bf713e2",
       "chunk_id": "bd80fec92b0b6963d177a2c55bf713e2_2",
       "chunk_type": "story_child",
       "start_frame": 5103,
@@ -98,6 +122,25 @@ curl -s -X POST "$API/api/v1/search/universal" \
       "end_time": 213.64,
       "text": "[213s-214s] Cary Grant: \"Olá!\"",
       "score": 0.9
+    },
+    {
+      "type": "frame",
+      "file_uuid": "a6fb22eebefaef17e62af874997c5944",
+      "frame_number": 5105,
+      "timestamp": 212.72,
+      "score": 0.7,
+      "objects": null,
+      "ocr_texts": null,
+      "faces": null
+    },
+    {
+      "type": "person",
+      "file_uuid": "a6fb22eebefaef17e62af874997c5944",
+      "identity_id": 12,
+      "identity_uuid": "a9a901056d6b46ff92da0c3c1a57dff4",
+      "name": "Cary Grant",
+      "appearance_count": 542,
+      "score": 0.95
     }
   ],
   "total": 20,
@@ -105,23 +148,78 @@ curl -s -X POST "$API/api/v1/search/universal" \
 }
 ```
 
+| Field | Type | Description |
+|-------|------|-------------|
+| `results[].type` | string | Result type: `chunk`, `frame`, or `person` |
+| `results[].file_uuid` | string | File UUID where result was found (all types) |
+
 ---
 
 ### `POST /api/v1/search/frames`
 
 **Auth**: Required
-**Scope**: file-level
+**Scope**: global / file-level
 
 Search face detection frames by identity name or trace ID.
 
 ---
 
-### `POST /api/v1/search/identity_text`
+### `GET /api/v1/search/identity_text`
 
 **Auth**: Required
-**Scope**: file-level
+**Scope**: global / file-level
 
-Search text chunks spoken by a specific identity.
+Search text chunks → find associated identities. Returns chunks where face detections overlap with text content.
+
+#### Query Parameters
+
+| Field | Type | Required | Default | Description |
+|-------|------|----------|---------|-------------|
+| `q` | string | Yes | — | Search text (ILIKE match) |
+| `file_uuid` | string | No | — | Restrict to specific file. If omitted, searches all files (global search) |
+| `limit` | integer | No | 50 | Max results |
+| `page` | integer | No | 1 | Page number |
+| `page_size` | integer | No | 50 | Items per page |
+
+#### Example (Global Search)
+
+```bash
+curl -s "$API/api/v1/search/identity_text?q=love" -H "X-API-Key: $KEY"
+```
+
+#### Example (File-specific Search)
+
+```bash
+curl -s "$API/api/v1/search/identity_text?file_uuid=$FILE_UUID&q=love" -H "X-API-Key: $KEY"
+```
+
+#### Response (200)
+
+```json
+{
+  "success": true,
+  "total": 5,
+  "results": [
+    {
+      "file_uuid": "a6fb22eebefaef17e62af874997c5944",
+      "chunk_id": "llm_parent_..._256_270",
+      "start_time": 256.256,
+      "end_time": 270.228,
+      "text_content": "...lack of affection...",
+      "identity_id": 9,
+      "identity_name": "Audrey Hepburn",
+      "identity_source": "tmdb",
+      "trace_id": 94
+    }
+  ]
+}
+```
+
+| Field | Type | Description |
+|-------|------|-------------|
+| `results[].file_uuid` | string | File UUID where chunk was found |
+| `results[].identity_id` | integer | Identity ID if face was detected |
+| `results[].trace_id` | integer | Face trace ID |
 
 ---
 
@@ -145,4 +243,4 @@ Search text chunks spoken by a specific identity.
 | **Storage** | pgvector (`chunk.embedding` column) |
 
 ---
-*Updated: 2026-05-19 12:49:24*
+*Updated: 2026-05-27 — Added global search support for smart, universal, identity_text APIs*
diff --git a/docs_v1.0/API_WORKSPACE/modules/07_identity.md b/docs_v1.0/API_WORKSPACE/modules/07_identity.md
index f662b2f..3178ba9 100644
--- a/docs_v1.0/API_WORKSPACE/modules/07_identity.md
+++ b/docs_v1.0/API_WORKSPACE/modules/07_identity.md
@@ -70,7 +70,16 @@ curl -s "$API/api/v1/identity/$IDENTITY_UUID" -H "X-API-Key: $KEY"
 **Auth**: Required
 **Scope**: identity-level
 
-Delete an identity permanently.
+Delete an identity permanently. All face detections bound to this identity are unbound (`identity_id` set to `NULL`). The identity JSON file is deleted from disk.
+
+#### History & Undo/Redo
+
+Every DELETE records a full snapshot of the identity and its unbound faces. See [`14_identity_history.md`](14_identity_history.md#4-delete-history--undoredo) for:
+
+- Undo via `POST /api/v1/identity/:identity_uuid/undo` — recreates identity and re-binds faces
+- Redo via `POST /api/v1/identity/:identity_uuid/redo` — re-deletes the identity
+
+**Note**: Delete undo/redo reuses the same endpoints as PATCH undo/redo. The endpoint automatically detects whether the identity was deleted (undo) or needs to be re-deleted (redo) based on the history record.
 
 ---
 
@@ -129,124 +138,75 @@ curl -s -X PATCH "$API/api/v1/identity/$IDENTITY_UUID" \
 
 | HTTP | When |
 |------|------|
-| `400` | No fields to update or invalid UUID format |
 | `404` | Identity not found |
+| `500` | Database error |
+
+#### History & Undo/Redo
+
+Every bind records a before/after snapshot. See [`14_identity_history.md`](14_identity_history.md#2-bindunbindtrace-history--undoredo) for:
+
+- `POST /api/v1/identity/:identity_uuid/bind/undo` — Revert a bind
+- `POST /api/v1/identity/:identity_uuid/bind/redo` — Reapply an undone bind
+- `GET /api/v1/identity/:identity_uuid/bind/history` — Query bind operations
 
 ---
 
-### `GET /api/v1/identity/:identity_uuid/files`
+## Metadata (Embedded JSON)
 
-**Auth**: Required
-**Scope**: identity-level
+The `identities.metadata` column is a **JSONB** field that stores arbitrary structured data alongside the identity's core fields (name, status, identity_type). No schema is enforced — any valid JSON object is accepted.
 
-Get all files where this identity appears. Returns per-file summary including face count, confidence, and appearance time range.
+### Merge Behavior
 
-#### Example
+| Operation | Strategy | Example |
+|-----------|----------|---------|
+| **PATCH** | Shallow top-level merge: `COALESCE(metadata,'{}'::jsonb) \|\| $1::jsonb` | Sending `{"tmdb_rating": 8.5}` only adds/overwrites `tmdb_rating`; all other existing keys are preserved. |
+| **mergeinto** | Recursive deep merge — nested sub-keys are merged individually, not replaced wholesale | Target has `{"tmdb": {"biography": "..."}}`, source has `{"tmdb": {"birthday": "1904-01-18"}}` → result is `{"tmdb": {"biography": "...", "birthday": "1904-01-18"}}`. |
+| **Upload (`POST`)** | Direct overwrite — the entire `metadata` field is replaced with the request value. | |
 
-```bash
-curl -s "$API/api/v1/identity/$IDENTITY_UUID/files" -H "X-API-Key: $KEY"
-```
+### Validation
 
----
+| Scenario | Result |
+|----------|--------|
+| PATCH with non-object metadata (`string`, `array`, `number`, `null`) | `400 Bad Request: "metadata must be a JSON object"` |
+| mergeinto with non-object metadata | Accepted (mergeinto validates at application level) |
+| Upload with non-object metadata | Accepted (upload replaces directly) |
 
-### `GET /api/v1/identity/:identity_uuid/faces`
+### Conventional Keys
 
-**Auth**: Required
-**Scope**: identity-level
+| Key | Type | Writer | Purpose |
+|-----|------|--------|---------|
+| `aliases` | `[{locale, name}]` | PATCH, mergeinto | Multilingual display names (see [Alias System](#alias-system-bcp-47-locale-tags)) |
+| `merged_into` | `{uuid, at}` | mergeinto | Marks an identity as merged (undo mechanism reads this) |
+| `tmdb_*` | various | TMDb probe | Movie metadata (biography, birthday, known_for, etc.). Written only when `MOMENTRY_TMDB_PROBE_ENABLED=true`. |
+| `source` | string | mergeinto | Tagged on aliases/metadata when added by merge (`"merge"` value) |
 
-Get all face detection records associated with this identity.
+Custom keys are fully supported — no registration required.
 
-#### Example
+### Search Coverage
 
-```bash
-curl -s "$API/api/v1/identity/$IDENTITY_UUID/faces" -H "X-API-Key: $KEY"
-```
+The identity search endpoint (`GET /api/v1/identity/search`) matches across three scopes:
 
-| Field | Type | Description |
-|-------|------|-------------|
-| `file_uuid` | string | File where face was detected |
-| `frame_number` | integer | Frame number of detection |
-| `face_id` | string | Face ID (format: `face_{frame_number}`) |
-| `confidence` | float | Detection confidence |
+1. `i.name` — exact and ILIKE against display name
+2. `jsonb_array_elements(i.metadata->'aliases')->>'name'` — locale-tagged alias names
+3. `i.metadata::text ILIKE $1` — raw string search across the entire JSON blob (all keys, all values)
 
----
+This means searching for `"1904-01-18"` or `"biography"` will match identities whose metadata contains those strings anywhere.
 
-### `GET /api/v1/identity/:identity_uuid/chunks`
+### History Snapshots
 
-**Auth**: Required
-**Scope**: identity-level
+Every `identity_history` record captures the **full metadata** in both `before_snapshot` and `after_snapshot` (as part of the complete identity JSONB dump). Undo restores the identity row — including metadata — to the `before_snapshot` state.
 
-Get all text chunks (sentences) spoken while this identity's face was on screen. Useful for finding what a person said.
+For merge operations, the MongoDB merge history records `metadata_fields_added` and `metadata_fields_added_paths` (dot-separated paths like `"tmdb.biography"`). Merge undo removes only those specific paths, preserving subsequent manual edits to other metadata keys.
 
-#### Example
+### Best Practices
 
-```bash
-curl -s "$API/api/v1/identity/$IDENTITY_UUID/chunks" -H "X-API-Key: $KEY"
-```
-
-#### Response (200)
-
-```json
-{
-  "success": true,
-  "identity_uuid": "a9a901056d6b46ff92da0c3c1a57dff4",
-  "data": [
-    {
-      "id": 0,
-      "file_uuid": "bd80fec92b0b6963d177a2c55bf713e2",
-      "chunk_id": "bd80fec92b0b6963d177a2c55bf713e2_2",
-      "chunk_type": "sentence",
-      "start_frame": 5103,
-      "end_frame": 5127,
-      "fps": 24.0,
-      "start_time": 212.64,
-      "end_time": 213.64,
-      "text_content": "[213s-214s] Cary Grant: \"Olá!\""
-    }
-  ]
-}
-```
-
-| Field | Type | Description |
-|-------|------|-------------|
-| `file_uuid` | string | File identifier |
-| `chunk_id` | string | Sentence chunk identifier |
-| `start_frame` | integer | Frame-accurate start position |
-| `end_frame` | integer | Frame-accurate end position |
-| `fps` | float | Frames per second |
-| `start_time` | float | Start time in seconds |
-| `end_time` | float | End time in seconds |
-| `text_content` | string | Spoken text content |
-
----
-
-### `POST /api/v1/identity/:identity_uuid/bind`
-
-**Auth**: Required
-**Scope**: identity-level
-
-Bind a face detection to an identity. Associates the face trace with the identity for future search and recognition.
-
-#### Request Parameters
-
-| Field | Type | Required | Description |
-|-------|------|----------|-------------|
-| `file_uuid` | string | Yes | File where face is detected |
-| `face_id` | string | Yes | Face ID (format: `{frame}_{idx}`) |
-
-#### Side Effects
-
-- 清除該 face detection row 的 `stranger_id`（設為 NULL）
-- 不影響 `identities` 表中原有的 stranger auto-identity 記錄
-
-#### Example
-
-```bash
-curl -s -X POST "$API/api/v1/identity/$IDENTITY_UUID/bind" \
-  -H "X-API-Key: $KEY" \
-  -H "Content-Type: application/json" \
-  -d '{"file_uuid": "'"$FILE_UUID"'", "face_id": "1_5"}'
-```
+| Guideline | Reason |
+|-----------|--------|
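+| Deep nesting is allowed in metadata | `mergeinto` uses `jsonb_deep_merge()` — nested sub-keys are merged recursively, not replaced wholesale. PATCH merges top-level keys only (see [Merge Behavior](#merge-behavior)), so PATCHing a nested object replaces that object as a whole |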
+| Use `aliases` for display names | Frontend has built-in locale fallback logic (see [Alias System](#alias-system-bcp-47-locale-tags)) |
+| Avoid >1MB per identity | Metadata is included in search indexing (`metadata::text ILIKE`); large blobs degrade query performance |
+| Don't rely on metadata ordering | JSONB does not preserve key insertion order — PostgreSQL stores object keys in its own internal order |
+| No LLM/Gemma4 agent writes to metadata | Only API endpoints (PATCH, mergeinto, upload) and TMDb probe modify `identities.metadata` |
 
 ---
 
@@ -295,6 +255,10 @@ curl -s -X POST "$API/api/v1/identity/$IDENTITY_UUID/bind/trace" \
 | `404` | Identity not found |
 | `500` | Database error |
 
+#### History & Undo/Redo
+
+Trace bind operations share the same history/undo/redo system as single-face binds. See [`14_identity_history.md`](14_identity_history.md#2-bindunbindtrace-history--undoredo) for endpoints.
+
 ---
 
 ### `GET /api/v1/identity/:identity_uuid/traces`
@@ -382,6 +346,13 @@ Unbind a face detection from an identity. Removes the identity association from
 - 被 unbind 的 face 不會自動成為 stranger
 - 要重新標記為 stranger 需重新跑 Agent API（`identity/analyze`）
 
+#### History & Undo/Redo
+
+Unbind records a before/after snapshot. See [`14_identity_history.md`](14_identity_history.md#2-bindunbindtrace-history--undoredo) for:
+
+- `POST /api/v1/identity/:identity_uuid/bind/undo` — Revert an unbind
+- `POST /api/v1/identity/:identity_uuid/bind/redo` — Reapply an undone unbind
+
 ---
 
 ### `POST /api/v1/identity/:identity_uuid/mergeinto`
@@ -391,6 +362,13 @@ Unbind a face detection from an identity. Removes the identity association from
 
 Transfer all face bindings from this identity to another identity, then optionally delete or mark the source as merged.
 
+#### Two Merge Cases
+
+| Case | Description | Undo/Redo Support |
+|------|-------------|-------------------|
+| **stranger → identity** | Merge an auto-generated stranger identity into a known identity (TMDb or user-defined) | ✅ 24hr undo/redo |
+| **identity A → identity B** | Merge two known identities (e.g., duplicate entries) | ✅ 24hr undo/redo |
+
 #### Request Parameters
 
 | Field | Type | Required | Default | Description |
@@ -402,8 +380,12 @@ Transfer all face bindings from this identity to another identity, then optional
 
 - 轉移所有 `face_detections.identity_id` 到目標 identity
 - 同時清除所有被轉移 rows 的 `stranger_id`
+- 將 source name 加入 target aliases (with `source: "merge"` tag)
+- 將 source aliases 加入 target aliases (if not already present)
+- 將 source metadata fields 加入 target metadata (if not already present)
 - `keep_history: true`（預設）：source identity 設為 `status='merged'`，保留記錄
 - `keep_history: false`：**刪除** source identity 及其 identity JSON 檔案
+- **記錄 merge history 到 MongoDB**（支援 undo/redo）
 
 #### Example
 
@@ -411,7 +393,7 @@ Transfer all face bindings from this identity to another identity, then optional
 curl -s -X POST "$API/api/v1/identity/$SOURCE_UUID/mergeinto" \
   -H "X-API-Key: $KEY" \
   -H "Content-Type: application/json" \
-  -d '{"into_uuid": "'"$TARGET_UUID"'", "keep_history": false}'
+  -d '{"into_uuid": "'"$TARGET_UUID"'", "keep_history": true}'
 ```
 
 #### Response (200)
@@ -419,11 +401,23 @@ curl -s -X POST "$API/api/v1/identity/$SOURCE_UUID/mergeinto" \
 ```json
 {
   "success": true,
-  "message": "Merged 'stranger_13894' into 'Louis Viret' (52 faces transferred, source deleted)",
-  "data": { "faces_transferred": 52 }
+  "message": "Merged 'stranger_13894' into 'Louis Viret' (52 faces transferred, history kept)",
+  "data": {
+    "merge_id": "550e8400-e29b-41d4-a716-446655440000",
+    "faces_transferred": 52,
+    "aliases_added": 1,
+    "metadata_fields_added": 2
+  }
 }
 ```
 
+| Field | Type | Description |
+|-------|------|-------------|
+| `merge_id` | string | Unique merge operation ID (for undo) |
+| `faces_transferred` | integer | Number of face detections transferred |
+| `aliases_added` | integer | Number of aliases added to target |
+| `metadata_fields_added` | integer | Number of metadata fields added to target |
+
 #### Error Responses
 
 | HTTP | When |
@@ -433,25 +427,189 @@ curl -s -X POST "$API/api/v1/identity/$SOURCE_UUID/mergeinto" \
 
 ---
 
-### `GET /api/v1/identities/search`
+### `POST /api/v1/identity/merge/:merge_id/undo`
 
 **Auth**: Required
 **Scope**: identity-level
 
-Search identities by name (ILIKE search). Returns matching identity records.
+Undo a merge operation within 24 hours. Restores the source identity and reverts face bindings.
+
+#### Undo Behavior
+
+| Action | Description |
+|--------|-------------|
+| Restore source identity | If `keep_history=true`: restore status to `confirmed`<br>If `keep_history=false`: recreate identity from MongoDB snapshot |
+| Restore faces | Transfer faces back to source identity |
+| Remove aliases from target | Remove aliases with `source: "merge"` tag |
+| Remove metadata fields from target | Remove fields that were added from source |
+| **Preserve manual changes** | Keep aliases/metadata manually added after merge |
 
 #### Example
 
 ```bash
-curl -s "$API/api/v1/identities/search?q=Cary" -H "X-API-Key: $KEY"
+curl -s -X POST "$API/api/v1/identity/merge/550e8400-e29b-41d4-a716-446655440000/undo" \
+  -H "X-API-Key: $KEY"
+```
+
+#### Response (200)
+
+```json
+{
+  "success": true,
+  "message": "Undo merge completed: 'stranger_13894' restored, 52 faces reverted",
+  "data": {
+    "source_identity_restored": {
+      "uuid": "a9a90105...",
+      "name": "stranger_13894",
+      "status": "confirmed"
+    },
+    "faces_reverted": 52,
+    "aliases_removed_from_target": 1,
+    "metadata_fields_removed_from_target": 2
+  }
+}
+```
+
+#### Error Responses
+
+| HTTP | When |
+|------|------|
+| `400` | Undo deadline expired (>24hr) or already undone |
+| `404` | Merge record not found |
+| `500` | Database error |
+
+---
+
+### `POST /api/v1/identity/merge/:merge_id/redo`
+
+**Auth**: Required
+**Scope**: identity-level
+
+Redo a previously undone merge operation. See [`14_identity_history.md`](14_identity_history.md#post-apiv1identitymergemerge_idredo) for full details.
+
+---
+
+### `GET /api/v1/identity/merge/history`
+
+**Auth**: Required
+**Scope**: identity-level
+
+Query merge history records from MongoDB.
+
+#### Query Parameters
+
+| Field | Type | Required | Default | Description |
+|-------|------|----------|---------|-------------|
+| `source_uuid` | string | No | — | Filter by source identity UUID |
+| `target_uuid` | string | No | — | Filter by target identity UUID |
+| `merge_id` | string | No | — | Filter by specific merge ID |
+| `undone` | bool | No | — | Filter by undone status |
+| `page` | int | No | 1 | Page number |
+| `page_size` | int | No | 20 | Items per page |
+
+#### Example
+
+```bash
+curl -s "$API/api/v1/identity/merge/history?page=1&page_size=10" \
+  -H "X-API-Key: $KEY"
+```
+
+#### Response (200)
+
+```json
+{
+  "success": true,
+  "total": 5,
+  "page": 1,
+  "page_size": 10,
+  "results": [
+    {
+      "merge_id": "550e8400-e29b-41d4-a716-446655440000",
+      "source_name": "stranger_13894",
+      "target_name": "Louis Viret",
+      "faces_transferred": 52,
+      "merged_at": "2026-05-27T10:00:00Z",
+      "undo_deadline": "2026-05-28T10:00:00Z",
+      "undone": false,
+      "undo_expired": false
+    }
+  ]
+}
 ```
 
 | Field | Type | Description |
 |-------|------|-------------|
-| `name` | string | Identity name |
-| `source` | string | Identity source |
-| `tmdb_id` | integer | TMDb ID (if source = tmdb) |
-| `file_uuid` | string | Associated file |
+| `merge_id` | string | Unique merge operation ID |
+| `source_name` | string | Source identity name |
+| `target_name` | string | Target identity name |
+| `faces_transferred` | integer | Number of faces transferred |
+| `merged_at` | datetime | When merge occurred |
+| `undo_deadline` | datetime | 24hr deadline for undo |
+| `undone` | bool | Whether merge was undone |
+| `undo_expired` | bool | Whether undo deadline passed |
+
+---
+
+### `GET /api/v1/identities/search`
+
+**Auth**: Required
+**Scope**: global / file-level
+
+Search identity name → find associated chunks. Searches identity name and aliases, returns identities with their associated text chunks.
+
+#### Query Parameters
+
+| Field | Type | Required | Default | Description |
+|-------|------|----------|---------|-------------|
+| `q` | string | Yes | — | Search text (ILIKE match on name and aliases) |
+| `file_uuid` | string | No | — | Restrict to specific file. If omitted, searches all files (global search) |
+| `limit` | integer | No | 50 | Max results |
+
+#### Example (Global Search)
+
+```bash
+curl -s "$API/api/v1/identities/search?q=Audrey" -H "X-API-Key: $KEY"
+```
+
+#### Example (File-specific Search)
+
+```bash
+curl -s "$API/api/v1/identities/search?q=Audrey&file_uuid=$FILE_UUID" -H "X-API-Key: $KEY"
+```
+
+#### Response (200)
+
+```json
+{
+  "success": true,
+  "total": 5,
+  "results": [
+    {
+      "identity_id": 9,
+      "name": "Audrey Hepburn",
+      "source": "tmdb",
+      "tmdb_id": 1932,
+      "file_uuid": "a6fb22eebefaef17e62af874997c5944",
+      "trace_id": 41,
+      "chunk_id": "llm_parent_..._204_207",
+      "start_time": 204.162,
+      "text_content": "...confrontation..."
+    }
+  ]
+}
+```
+
+| Field | Type | Description |
+|-------|------|-------------|
+| `results[].identity_id` | integer | Identity ID |
+| `results[].name` | string | Identity name |
+| `results[].source` | string | Identity source (`tmdb`, `user_defined`, etc.) |
+| `results[].tmdb_id` | integer | TMDb person ID (if source = tmdb) |
+| `results[].file_uuid` | string | File where identity appears |
+| `results[].trace_id` | integer | Face trace ID |
+| `results[].chunk_id` | string | Associated chunk ID |
+| `results[].start_time` | float | Chunk start time |
+| `results[].text_content` | string | Chunk text content |
 
 ---
 
@@ -628,4 +786,4 @@ PATCH /api/v1/identity/:identity_uuid
 This **replaces** the entire `aliases` array. To add to existing aliases, include all existing entries in the request.
 
 ---
-*Updated: 2026-05-25
+*Updated: 2026-05-25 — Added `GET /api/v1/file/:file_uuid/faces` with 4 binding states, filters, strangers table split*
diff --git a/docs_v1.0/API_WORKSPACE/modules/14_identity_history.md b/docs_v1.0/API_WORKSPACE/modules/14_identity_history.md
new file mode 100644
index 0000000..d61df17
--- /dev/null
+++ b/docs_v1.0/API_WORKSPACE/modules/14_identity_history.md
@@ -0,0 +1,696 @@
+<!-- module: identity_history -->
+<!-- description: Identity operation history, undo, and redo (PATCH, bind, unbind, bind_trace, mergeinto, delete) -->
+<!-- depends: 01_auth, 07_identity -->
+
+## Identity Operation History
+
+Every mutation on an identity automatically records a before/after snapshot. Use undo/redo to revert or reapply changes, and history to inspect the operation log.
+
+Four independent undo/redo systems exist:
+
+| System | Storage | Operations Covered |
+|--------|---------|-------------------|
+| **PATCH** | PostgreSQL `identity_history` | `update` |
+| **Bind** | PostgreSQL `identity_history` | `bind`, `unbind`, `bind_trace` |
+| **Merge** | MongoDB `identity_merge_history` | mergeinto |
+| **Delete** | PostgreSQL `identity_history` | `delete` |
+
+---
+
+### 1. PATCH History & Undo/Redo
+
+#### Overview
+
+| Property | Value |
+|----------|-------|
+| Storage | PostgreSQL `identity_history` table |
+| Snapshot | Full identity record (all fields) before and after each PATCH |
+| Max records | 256 per identity (oldest auto-deleted when limit exceeded) |
+| Undo steps | Unlimited (no expiry, no step limit) |
+| Redo stack | Cleared on new PATCH (`is_undone=true` + `operation='update'` records are deleted) |
+
+##### Stack Model
+
+```
+PATCH 1 → PATCH 2 → PATCH 3         (undo stack, is_undone=false)
+                           ↓ undo
+PATCH 1 → PATCH 2                   (undo stack)
+           PATCH 3                   (redo stack, is_undone=true)
+                           ↓ redo
+PATCH 1 → PATCH 2 → PATCH 3         (undo stack)
+```
+
+A new PATCH after undo clears only the `operation='update'` redo stack (PATCH 3 is lost). Bind/merge redo stacks are not affected.
+
+---
+
+#### `POST /api/v1/identity/:identity_uuid/undo`
+
+**Auth**: Required
+**Scope**: identity-level
+
+Undo the most recent PATCH operations. Restores the identity's `before_snapshot` and marks the history records as undone.
+
+##### Request (JSON)
+
+| Field | Type | Required | Default | Description |
+|-------|------|----------|---------|-------------|
+| `steps` | integer | No | `1` | Number of undo steps to apply (max records undone in one call) |
+
+##### Behavior
+
+- Queries `is_undone=false` records with `operation='update'`, ordered by `created_at DESC`
+- Restores `name`, `identity_type`, `source`, `status`, `metadata`, `tmdb_id`, `tmdb_profile` from the last record's `before_snapshot`
+- Marks the undone records as `is_undone=true` with `undone_at=NOW()`
+- Syncs `identity.json` to disk
+- Updates `_index.json` if name changed
+
+##### Example
+
+```bash
+curl -s -X POST "$API/api/v1/identity/$IDENTITY_UUID/undo" \
+  -H "X-API-Key: $KEY" \
+  -H "Content-Type: application/json" \
+  -d '{"steps": 1}'
+```
+
+##### Response (200)
+
+```json
+{
+  "success": true,
+  "identity_uuid": "a9a901056d6b46ff92da0c3c1a57dff4",
+  "undone_count": 1,
+  "current_state": {
+    "id": 9,
+    "uuid": "a9a901056d6b46ff92da0c3c1a57dff4",
+    "name": "Cary Grant",
+    "identity_type": "people",
+    "source": "tmdb",
+    "status": "confirmed",
+    "metadata": {},
+    "tmdb_id": 112,
+    "tmdb_profile": null
+  }
+}
+```
+
+| Field | Type | Description |
+|-------|------|-------------|
+| `undone_count` | integer | Number of history records undone |
+| `current_state` | object | Full identity state after undo |
+
+##### Error Responses
+
+| HTTP | When |
+|------|------|
+| `400` | No undo operations available |
+| `404` | Identity not found |
+| `500` | Database error |
+
+---
+
+#### `POST /api/v1/identity/:identity_uuid/redo`
+
+**Auth**: Required
+**Scope**: identity-level
+
+Redo previously undone PATCH operations. Restores the identity's `after_snapshot` and marks the history records as no longer undone.
+
+##### Request (JSON)
+
+| Field | Type | Required | Default | Description |
+|-------|------|----------|---------|-------------|
+| `steps` | integer | No | `1` | Number of redo steps to apply |
+
+##### Behavior
+
+- Queries `is_undone=true` records with `operation='update'`, ordered by `created_at DESC`
+- Restores all identity fields from the last record's `after_snapshot`
+- Marks records as `is_undone=false` with `undone_at=NULL`
+- Syncs `identity.json` to disk
+- Updates `_index.json` if name changed
+
+##### Example
+
+```bash
+curl -s -X POST "$API/api/v1/identity/$IDENTITY_UUID/redo" \
+  -H "X-API-Key: $KEY" \
+  -H "Content-Type: application/json" \
+  -d '{"steps": 1}'
+```
+
+##### Response (200)
+
+```json
+{
+  "success": true,
+  "identity_uuid": "a9a901056d6b46ff92da0c3c1a57dff4",
+  "redone_count": 1,
+  "current_state": {
+    "id": 9,
+    "uuid": "a9a901056d6b46ff92da0c3c1a57dff4",
+    "name": "John Smith",
+    "identity_type": "people",
+    "source": "tmdb",
+    "status": "confirmed",
+    "metadata": { "aliases": [...] },
+    "tmdb_id": 112,
+    "tmdb_profile": null
+  }
+}
+```
+
+| Field | Type | Description |
+|-------|------|-------------|
+| `redone_count` | integer | Number of history records redone |
+| `current_state` | object | Full identity state after redo |
+
+##### Error Responses
+
+| HTTP | When |
+|------|------|
+| `400` | No redo operations available |
+| `404` | Identity not found |
+| `500` | Database error |
+
+---
+
+#### `GET /api/v1/identity/:identity_uuid/history`
+
+**Auth**: Required
+**Scope**: identity-level
+
+Query the PATCH operation history for an identity. Returns paginated records with undo/redo stack counts (filtered to `operation='update'`).
+
+##### Query Parameters
+
+| Field | Type | Required | Default | Description |
+|-------|------|----------|---------|-------------|
+| `page` | integer | No | `1` | Page number (1-indexed) |
+| `limit` | integer | No | `20` | Items per page (max 100) |
+
+##### Response (200)
+
+```json
+{
+  "success": true,
+  "identity_uuid": "a9a901056d6b46ff92da0c3c1a57dff4",
+  "total": 5,
+  "undo_stack_count": 3,
+  "redo_stack_count": 2,
+  "results": [
+    {
+      "history_id": 42,
+      "operation": "update",
+      "is_undone": false,
+      "created_at": "2026-05-27T12:00:00Z",
+      "undone_at": null
+    },
+    {
+      "history_id": 41,
+      "operation": "update",
+      "is_undone": true,
+      "created_at": "2026-05-27T11:30:00Z",
+      "undone_at": "2026-05-27T13:00:00Z"
+    }
+  ]
+}
+```
+
+| Field | Type | Description |
+|-------|------|-------------|
+| `total` | integer | Total PATCH history records for this identity |
+| `undo_stack_count` | integer | Records available for undo (`is_undone=false`) |
+| `redo_stack_count` | integer | Records available for redo (`is_undone=true`) |
+| `results[].history_id` | integer | History record ID |
+| `results[].operation` | string | Operation type (`"update"` for PATCH) |
+| `results[].is_undone` | boolean | Whether the operation has been undone |
+| `results[].created_at` | string | When the PATCH was applied |
+| `results[].undone_at` | string | When the undo occurred (null if not undone) |
+
+##### Example
+
+```bash
+curl -s "$API/api/v1/identity/$IDENTITY_UUID/history?page=1&limit=10" \
+  -H "X-API-Key: $KEY"
+```
+
+##### Error Responses
+
+| HTTP | When |
+|------|------|
+| `404` | Identity not found |
+| `500` | Database error |
+
+---
+
+### 2. Bind/Unbind/Trace History & Undo/Redo
+
+All three operations (`bind`, `unbind`, `bind_trace`) share a single history table and undo/redo stack.
+
+#### Bind Operation Overview
+
+| Property | Value |
+|----------|-------|
+| Storage | PostgreSQL `identity_history` table (same table as PATCH) |
+| Snapshot | `{"file_uuid", "face_id" (or "trace_id"), "identity_id_before/after"}` |
+| Max records | 256 per identity (shared limit across all operation types) |
+| Undo steps | Unlimited (`steps` param) |
+| Redo stack | Cleared on new bind/unbind/bind_trace (`operation IN ('bind','unbind','bind_trace')` + `is_undone=true` records deleted) |
+| Stack isolation | Bind redo stack is **independent** from PATCH redo stack — clearing one does not affect the other |
+
+##### Stack Model
+
+```
+bind face_1 (to id=9)              → unbind face_1          → bind trace 906 (to id=9)
+(undo stack, is_undone=false)         (undo stack)              (undo stack)
+                                                               ↓ undo (first undone: bind_trace)
+                                     bind trace 906 (is_undone=true)
+                                     (redo stack)
+                                                               ↓ redo
+bind face_1 → unbind face_1 → bind trace 906
+(undo stack)
+```
+
+A new bind/unbind/bind_trace after undo clears only the bind redo stack (records with `operation IN ('bind','unbind','bind_trace')` and `is_undone=true`).
+
+##### Snapshot Format
+
+**Before (bind):**
+```json
+{
+  "file_uuid": "aeed71342a899fe4b4c57b7d41bcb692",
+  "face_id": "1_5",
+  "identity_id_before": null
+}
+```
+
+**After (bind):**
+```json
+{
+  "file_uuid": "aeed71342a899fe4b4c57b7d41bcb692",
+  "face_id": "1_5",
+  "identity_id_after": 9
+}
+```
+
+**Before (unbind) — binding existed before:**
+```json
+{
+  "file_uuid": "aeed71342a899fe4b4c57b7d41bcb692",
+  "face_id": "1_5",
+  "identity_id_before": 9
+}
+```
+
+**After (unbind):**
+```json
+{
+  "file_uuid": "aeed71342a899fe4b4c57b7d41bcb692",
+  "face_id": "1_5",
+  "identity_id_after": null
+}
+```
+
+For `bind_trace`, the snapshot uses `trace_id` instead of `face_id`, with `identity_id_before` capturing the first face's identity in that trace.
+
+---
+
+#### `POST /api/v1/identity/:identity_uuid/bind/undo`
+
+**Auth**: Required
+**Scope**: identity-level
+
+Undo the most recent bind/unbind/bind_trace operations. Restores `identity_id_before` from the snapshot and marks records as undone.
+
+##### Request (JSON)
+
+| Field | Type | Required | Default | Description |
+|-------|------|----------|---------|-------------|
+| `steps` | integer | No | `1` | Number of undo steps to apply |
+
+##### Behavior
+
+- Queries `is_undone=false` records with `operation IN ('bind','unbind','bind_trace')`, ordered by `created_at DESC`
+- Restores `identity_id_before` — for bind this is `null` (face was unbound), for unbind this is the original identity (face goes back), for bind_trace this is the trace's previous identity
+- Marks the undone records as `is_undone=true` with `undone_at=NOW()`
+
+##### Example
+
+```bash
+curl -s -X POST "$API/api/v1/identity/$IDENTITY_UUID/bind/undo" \
+  -H "X-API-Key: $KEY" \
+  -H "Content-Type: application/json" \
+  -d '{"steps": 1}'
+```
+
+##### Response (200)
+
+```json
+{
+  "success": true,
+  "identity_uuid": "a9a901056d6b46ff92da0c3c1a57dff4",
+  "operation": "bind",
+  "undone_count": 1,
+  "affected_rows": 53
+}
+```
+
+| Field | Type | Description |
+|-------|------|-------------|
+| `operation` | string | The actual operation undone (`bind`, `unbind`, or `bind_trace`) |
+| `undone_count` | integer | Number of history records undone |
+| `affected_rows` | integer | Number of `face_detections` rows updated |
+
+##### Error Responses
+
+| HTTP | When |
+|------|------|
+| `400` | No bind undo operations available |
+| `404` | Identity not found |
+| `500` | Database error |
+
+---
+
+#### `POST /api/v1/identity/:identity_uuid/bind/redo`
+
+**Auth**: Required
+**Scope**: identity-level
+
+Redo previously undone bind/unbind/bind_trace operations. Restores `identity_id_after` from the snapshot.
+
+##### Request (JSON)
+
+| Field | Type | Required | Default | Description |
+|-------|------|----------|---------|-------------|
+| `steps` | integer | No | `1` | Number of redo steps to apply |
+
+##### Behavior
+
+- Queries `is_undone=true` records with `operation IN ('bind','unbind','bind_trace')`, ordered by `created_at DESC`
+- Restores `identity_id_after` — for bind this is the identity the face was bound to, for unbind this is `null`
+- Marks records as `is_undone=false` with `undone_at=NULL`
+
+##### Example
+
+```bash
+curl -s -X POST "$API/api/v1/identity/$IDENTITY_UUID/bind/redo" \
+  -H "X-API-Key: $KEY" \
+  -H "Content-Type: application/json" \
+  -d '{"steps": 1}'
+```
+
+##### Response (200)
+
+```json
+{
+  "success": true,
+  "identity_uuid": "a9a901056d6b46ff92da0c3c1a57dff4",
+  "operation": "unbind",
+  "redone_count": 1,
+  "affected_rows": 1
+}
+```
+
+| Field | Type | Description |
+|-------|------|-------------|
+| `operation` | string | The actual operation redone (`bind`, `unbind`, or `bind_trace`) |
+| `redone_count` | integer | Number of history records redone |
+| `affected_rows` | integer | Number of `face_detections` rows updated |
+
+##### Error Responses
+
+| HTTP | When |
+|------|------|
+| `400` | No bind redo operations available |
+| `404` | Identity not found |
+| `500` | Database error |
+
+---
+
+#### `GET /api/v1/identity/:identity_uuid/bind/history`
+
+**Auth**: Required
+**Scope**: identity-level
+
+Query the bind/unbind/bind_trace operation history for an identity. Returns paginated records with undo/redo stack counts.
+
+##### Query Parameters
+
+| Field | Type | Required | Default | Description |
+|-------|------|----------|---------|-------------|
+| `page` | integer | No | `1` | Page number (1-indexed) |
+| `limit` | integer | No | `20` | Items per page (max 100) |
+
+##### Response (200)
+
+```json
+{
+  "success": true,
+  "identity_uuid": "a9a901056d6b46ff92da0c3c1a57dff4",
+  "total": 3,
+  "undo_stack_count": 2,
+  "redo_stack_count": 1,
+  "results": [
+    {
+      "history_id": 52,
+      "operation": "bind_trace",
+      "is_undone": false,
+      "created_at": "2026-05-27T14:00:00Z",
+      "undone_at": null
+    },
+    {
+      "history_id": 51,
+      "operation": "unbind",
+      "is_undone": true,
+      "created_at": "2026-05-27T13:00:00Z",
+      "undone_at": "2026-05-27T14:30:00Z"
+    },
+    {
+      "history_id": 50,
+      "operation": "bind",
+      "is_undone": false,
+      "created_at": "2026-05-27T12:00:00Z",
+      "undone_at": null
+    }
+  ]
+}
+```
+
+| Field | Type | Description |
+|-------|------|-------------|
+| `total` | integer | Total bind history records for this identity |
+| `undo_stack_count` | integer | Records available for undo (`is_undone=false`) |
+| `redo_stack_count` | integer | Records available for redo (`is_undone=true`) |
+| `results[].history_id` | integer | History record ID |
+| `results[].operation` | string | Operation type (`bind`, `unbind`, or `bind_trace`) |
+| `results[].is_undone` | boolean | Whether the operation has been undone |
+| `results[].created_at` | string | When the operation was applied |
+| `results[].undone_at` | string | When the undo occurred (null if not undone) |
+
+##### Example
+
+```bash
+curl -s "$API/api/v1/identity/$IDENTITY_UUID/bind/history?page=1&limit=10" \
+  -H "X-API-Key: $KEY"
+```
+
+##### Error Responses
+
+| HTTP | When |
+|------|------|
+| `404` | Identity not found |
+| `500` | Database error |
+
+---
+
+### 3. Merge History & Undo/Redo
+
+Merge operations use MongoDB for richer record-keeping, with a 24-hour undo deadline.
+
+#### Merge Operation Overview
+
+| Property | Value |
+|----------|-------|
+| Storage | MongoDB `identity_merge_history` collection |
+| Snapshot | Full source identity state + target identity state + aliases/metadata diffs |
+| Trigger | Every mergeinto with `keep_history=true` |
+| Undo deadline | 24 hours (renewed on redo) |
+| Redo support | Yes — restores undone merges with new 24hr deadline |
+| Max records | Unlimited |
+
+---
+
+#### `POST /api/v1/identity/merge/:merge_id/undo`
+
+Already documented in [`07_identity.md`](07_identity.md#post-apiv1identitymergemerge_idundo). See that document for full details.
+
+---
+
+#### `POST /api/v1/identity/merge/:merge_id/redo`
+
+**Auth**: Required
+**Scope**: identity-level
+
+Redo a previously undone merge operation within the renewed 24-hour deadline.
+
+##### Request
+
+No body required. The merge ID is taken from the URL path.
+
+##### Behavior
+
+1. Validates the merge record exists and `undone=true` (not already active)
+2. Checks the 24-hour undo deadline (if expired, the redo is rejected)
+3. Re-applies face bindings: moves the faces from `source_identity` to `target_identity` again
+4. Re-adds aliases that were removed by the undo (aliases with `source: "merge"` tag)
+5. Re-adds metadata fields that were removed by the undo
+6. If `keep_history=true`: sets `source_identity.status = 'merged'` again
+7. If `keep_history=false`: recreates source identity from the `undone_snapshot` stored at undo time
+8. Syncs both identity JSON files to disk
+9. Sets `undone=false`, clears `undone_snapshot`, renews `undo_deadline = NOW() + 24h`
+10. Records `redone_by` user for audit
+
+##### Example
+
+```bash
+curl -s -X POST "$API/api/v1/identity/merge/550e8400-e29b-41d4-a716-446655440000/redo" \
+  -H "X-API-Key: $KEY"
+```
+
+##### Response (200)
+
+```json
+{
+  "success": true,
+  "message": "Redo merge completed: merged 'stranger_13894' into 'Louis Viret' (52 faces transferred)",
+  "data": {
+    "merge_id": "550e8400-e29b-41d4-a716-446655440000",
+    "faces_transferred": 52,
+    "aliases_re_added": 1,
+    "metadata_fields_re_added": 2
+  }
+}
+```
+
+| Field | Type | Description |
+|-------|------|-------------|
+| `merge_id` | string | The merge operation ID |
+| `faces_transferred` | integer | Number of faces transferred from source to target |
+| `aliases_re_added` | integer | Number of aliases restored to target |
+| `metadata_fields_re_added` | integer | Number of metadata fields restored to target |
+
+##### Error Responses
+
+| HTTP | When |
+|------|------|
+| `400` | Merge not undone, deadline expired, or cannot redo |
+| `404` | Merge record not found |
+| `500` | Database error |
+
+---
+
+### 4. Delete History & Undo/Redo
+
+#### Delete Operation Overview
+
+| Property | Value |
+|----------|-------|
+| Storage | PostgreSQL `identity_history` table |
+| Snapshot | `{"identity": {...full row...}, "unbound_faces": [{file_uuid, face_id, trace_id}, ...]}` |
+| Max records | 1 active delete record per identity (redo stack cleared on new delete) |
+| Undo support | Yes — recreates identity row, re-binds faces |
+| Redo support | Yes — re-deletes the identity |
+| Identity file | Deleted on delete, recreated on undo |
+
+#### Snapshot Format
+
+```json
+{
+  "identity": {
+    "id": 9,
+    "uuid": "a9a90105-6d6b-46ff-92da-0c3c1a57dff4",
+    "name": "Cary Grant",
+    "identity_type": "people",
+    "source": "tmdb",
+    "status": "confirmed",
+    "metadata": {},
+    "tmdb_id": 112,
+    "tmdb_profile": null
+  },
+  "unbound_faces": [
+    {
+      "file_uuid": "aeed71342a899fe4b4c57b7d41bcb692",
+      "face_id": "1_5",
+      "trace_id": null
+    },
+    {
+      "file_uuid": "aeed71342a899fe4b4c57b7d41bcb692",
+      "face_id": "1_6",
+      "trace_id": 906
+    }
+  ]
+}
+```
+
+#### Stack Model
+
+```
+DELETE identity                          (undo stack, is_undone=false)
+               ↓ undo
+Identity recreated, faces re-bound
+               → delete history marked is_undone=true
+               ↓ redo (re-delete)
+Identity deleted again, faces unbound
+               → delete history marked is_undone=false
+```
+
+A new delete after an undo clears the delete redo stack (no redo possible for the old delete).
+
+#### Undo Behavior (via existing `POST /api/v1/identity/:identity_uuid/undo`)
+
+1. Normal identity lookup fails (row was deleted)
+2. Checks `identity_history` for `operation='delete' AND is_undone=false` matching the UUID in the snapshot
+3. Recreates the identity row (new internal `id`, same UUID)
+4. Re-binds all faces listed in `unbound_faces` to the new identity
+5. Marks the `identity_history` delete record as `is_undone=true` with `undone_at=NOW()`
+6. Syncs `identity.json` to disk
+7. Updates `_index.json`
+
+#### Redo Behavior (via existing `POST /api/v1/identity/:identity_uuid/redo`)
+
+1. Identity lookup succeeds (identity was restored by prior undo)
+2. Checks `identity_history` for `operation='delete' AND is_undone=true` matching the identity_id
+3. Deletes `identity.json` from disk
+4. Unbinds all faces (`identity_id = NULL`)
+5. Deletes the identity row
+6. Marks the delete history record as `is_undone=false`
+7. Returns success
+
+#### Error Responses (delete undo/redo)
+
+| HTTP | Scenario |
+|------|----------|
+| `400` | No delete history available (either no delete or already undone/redone) |
+| `404` | Identity not found (for redo — identity wasn't restored) |
+| `500` | Database error |
+
+---
+
+### Comparison: PATCH vs Bind vs Merge vs Delete Undo/Redo
+
+| Aspect | PATCH Undo/Redo | Bind Undo/Redo | Merge Undo/Redo | Delete Undo/Redo |
+|--------|----------------|----------------|-----------------|------------------|
+| Storage | PostgreSQL `identity_history` | PostgreSQL `identity_history` | MongoDB `identity_merge_history` | PostgreSQL `identity_history` |
+| Operation filter | `operation='update'` | `operation IN ('bind','unbind','bind_trace')` | — | `operation='delete'` |
+| Trigger | Every PATCH | Every bind/unbind/bind_trace | Every mergeinto with `keep_history=true` | Every DELETE |
+| Undo deadline | None (unlimited) | None (unlimited) | 24 hours (renewed on redo) | None (unlimited) |
+| Redo support | Yes | Yes | Yes | Yes |
+| Step undo | Yes (`steps` param) | Yes (`steps` param) | No (full undo/redo only) | No (single record) |
+| Max records | 256 per identity | 256 per identity (shared) | Unlimited | 256 per identity (shared) |
+| User tracking | `user_id` + `user_source` | `user_id` + `user_source` | `performed_by_user` + `undone_by` / `redone_by` | `user_id` + `user_source` |
+
+---
+
+*Updated: 2026-05-28*
diff --git a/docs_v1.0/API_WORKSPACE/narratives/marcom_intro.md b/docs_v1.0/API_WORKSPACE/narratives/marcom_intro.md
new file mode 100644
index 0000000..cf4fc12
--- /dev/null
+++ b/docs_v1.0/API_WORKSPACE/narratives/marcom_intro.md
@@ -0,0 +1,36 @@
+<!-- narrative: marcom_intro -->
+<!-- description: Intro section for Marcom training manual -->
+<!-- depends: -->
+
+## About This Manual
+
+This training manual is designed for the Marcom team to understand and use the Momentry Core API.
+
+### Demo Credentials
+
+**API Key**: `muser_68600856036340bcafc01930eb4bd839_1774418104_97221b69`
+
+**SFTPGo** (for video upload):
+
+| Item | Value |
+|------|-------|
+| SFTP Host | `sftpgo.momentry.ddns.net` |
+| SFTP Port | `2022` |
+| Username | `demo` |
+| Password | `demopassword123` |
+| Web UI | `https://sftpgo.momentry.ddns.net` |
+
+### Quick Examples
+
+**List all videos:**
+```bash
+curl -s -H "X-API-Key: $KEY" "$API/api/v1/files/scan"
+```
+
+**Search:**
+```bash
+curl -s -X POST "$API/api/v1/search" \
+  -H "Content-Type: application/json" \
+  -H "X-API-Key: $KEY" \
+  -d '{"query": "example", "limit": 5}'
+```
diff --git a/docs_v1.0/DESIGN/ASRX_HYBRID_PIPELINE_V1.0.md b/docs_v1.0/DESIGN/ASRX_HYBRID_PIPELINE_V1.0.md
new file mode 100644
index 0000000..c3d2105
--- /dev/null
+++ b/docs_v1.0/DESIGN/ASRX_HYBRID_PIPELINE_V1.0.md
@@ -0,0 +1,588 @@
+# ASRX Hybrid Pipeline v1.0 — 聲紋分離混合架構
+
+| 項目 | 內容 |
+|------|------|
+| **範圍** | ASRX 處理器重構：whisperx → VAD-first hybrid pipeline |
+| **狀態** | Draft |
+| **適用版本** | Momentry Core V4.0+ |
+| **作者** | OpenCode / Warren |
+| **建立日期** | 2026-06-01 |
+
+---
+
+## 1. 問題
+
+### 1.1 現有問題
+
+| 問題 | 說明 | 影響 |
+|------|------|------|
+| **Whisper 合併短句** | `whisper small` 會將兩個人的對話錯認成一個連續段 (A+B → 一句) | ASR segment 內混兩人話語，speaker 無法分離 |
+| **ASRX v2 speaker_id = null** | `asrx_processor_v2.py` 使用 `whisperx.DiarizationPipeline()` 但該 API 未在 whisperx `__init__.py` 暴露 | 所有 segment speaker 均為 null |
+| **文字丟失** | `asrx_processor_custom.py` 的 `SelfASRXFixed.process_with_segments()` 只輸出 `text: ""` | Rule 1 合併時無文字可用 |
+| **錯誤的聲紋後端** | `asrx_processor_v2.py` 依賴 whisperx 內建 diarization，但該功能不穩定 | 準確度 ~85%，需 HF token |
+| **多版本混亂** | 7 個 root-level 變體、14 個 asrx_self 檔案，生產環境使用錯誤版本 | 維護困難，不知哪個是對的 |
+
+### 1.2 痛點場景
+
+**兩個說話人短句來回切換**（訪談、對話）：
+
+```
+Audio: A(2s) → B(1.5s) → A(3s)
+Whisper: ───────[0-7s, "A+B+A 全部混在一起"]───────
+```
+
+Whisper 在句間停頓處不切段，導致 ASR 時間邊界無法反映 speaker 切換。
+
+---
+
+## 2. 架構
+
+### 2.1 核心原則
+
+1. **VAD 先定邊界** — 用 VAD 在句間停頓處切段，取代 whisper 的邊界
+2. **ASR 後做** — 每段各自轉錄，保有獨立文字
+3. **聲紋聚類定 speaker** — ECAPA-TDNN + AgglomerativeClustering
+
+### 2.2 核心 5 步 Pipeline（Step 6–7 的 Qdrant 儲存與分類見 2.3）
+
+```
+Audio
+  │
+  ① whisper (一次, 粗略定位)
+  │   找到說話段 + 初步文字 + 語種
+  │   [0-7s, "今天天氣很好我覺得也不錯對啊", zh]
+  │
+  ② VAD scan (在每段內細切)
+  │   利用句間停頓切開
+  │   段1 [0-2s]    段2 [2-3.5s]    段3 [3.5-7s]
+  │
+  ③ whisper per refined segment (各段轉錄)
+  │   段1 → "今天天氣很好"     (zh, 0.98)
+  │   段2 → "我覺得也不錯"     (zh, 0.97)
+  │   段3 → "對啊"             (zh, 0.96)
+  │
+  ④ ECAPA-TDNN per refined segment (聲紋提取)
+  │   段1 → emb[0] (192-dim)
+  │   段2 → emb[1] (192-dim)
+  │   段3 → emb[2] (192-dim)
+  │
+  ⑤ AgglomerativeClustering (聚類定 speaker)
+  │   emb[0]=SPEAKER_0, emb[1]=SPEAKER_1, emb[2]=SPEAKER_0
+  │
+  輸出:
+    start  end    text         language  speaker_id
+    0.0    2.0    今天天氣很好    zh        SPEAKER_0
+    2.0    3.5    我覺得也不錯    zh        SPEAKER_1
+    3.5    7.0    對啊            zh        SPEAKER_0
+```
+
+### 2.3 流程圖
+
+```
+┌─────────────────────────────────────────────────────────────────────┐
+│                    asrx_processor.py                                │
+│                      (wrapper)                                     │
+│                                                                    │
+│  ① ffprobe → select best track → ffmpeg → 16kHz WAV               │
+│                                                                    │
+│  ② SelfASRXFixed.process(audio_wav, file_uuid)                     │
+│     │                                                              │
+│     ├─ Step 1: whisper.transcribe() → rough segments               │
+│     ├─ Step 2: VAD scan each rough segment                         │
+│     ├─ Step 3: whisper per refined segment → text+language         │
+│     ├─ Step 4: ECAPA-TDNN per segment → 192-dim embedding         │
+│     ├─ Step 5: AgglomerativeClustering → speaker_labels            │
+│     │                                                              │
+│     ├─ Step 6: Store embeddings in Qdrant                          │
+│     │  └─ {file_uuid, speaker_id, text, language, start, end}      │
+│     │                                                              │
+│     └─ Step 7: Classify high-quality embeddings                    │
+│        ├─ quality > threshold → reference profile                  │
+│        ├─ 送入聲音分類模型推論性別/屬性                               │
+│        └─ 寫入 Qdrant (type: speaker_reference)                    │
+│                                                                    │
+│  ③ 輸出 JSON 格式 (不含 embedding)                                 │
+│                                                                    │
+│  Rust: rule1_ingest.rs                                            │
+│     └─ pre_chunks(processor_type='asrx') → chunks                  │
+└─────────────────────────────────────────────────────────────────────┘
+```
+
+---
+
+## 3. 檔案組織
+
+### 3.1 最終檔案結構
+
+```
+scripts/
+├── asrx_processor.py            ← production (cleaned custom.py)
+│
+└── asrx_self/                   ← 核心庫
+    ├── __init__.py              ← package marker
+    ├── vad.py                   ← Silero VAD (新增 scan_within_segment)
+    ├── whisper_local.py         ← 🆕 封裝 whisper 載入+轉錄
+    ├── speaker_encoder.py       ← ECAPA-TDNN 192-dim
+    ├── speaker_cluster_fixed.py ← AgglomerativeClustering
+    └── main_fixed.py            ← 🔧 重寫為 7 步 pipeline
+```
+
+### 3.2 刪除清單
+
+**Root-level 變體**（全部刪除）：
+
+| 檔案 | 原因 |
+|------|------|
+| `asrx_processor.py` | 原始 whisperx 版，diarization 壞的（由清理後的 `asrx_processor_custom.py` 取代並沿用此檔名） |
+| `asrx_processor_v2.py` | 同上，Rust 目前錯誤呼叫此檔 |
+| `asrx_processor_v2_noalign.py` | 跳過對齊但 diarization 仍壞 |
+| `asrx_processor_v2_transcribe.py` | 只轉錄不做 speaker |
+| `asrx_processor_simplified.py` | 變體 |
+| `asrx_processor_contract_v1.py` | 18KB，pyannote，需 HF token |
+
+**asrx_self 內被取代的舊版**：
+
+| 檔案 | 原因 | 取代者 |
+|------|------|--------|
+| `main.py` | 用 SpectralClustering，有 NaN 問題 | `main_fixed.py` |
+| `speaker_cluster.py` | 用 SpectralClustering，不穩定 | `speaker_cluster_fixed.py` |
+
+### 3.3 搬離清單
+
+非生產工具搬至 `tools/asrx/`：
+
+```
+tools/asrx/
+├── integrate_face_asrx_speaker.py
+├── speaker_player_gui.py
+├── speaker_player_gui_face.py
+├── speaker_player_interactive.py
+├── speaker_audio_player.py
+├── test_long_movie.py
+├── test_gui_face_player.py
+└── docs/
+    ├── FINAL_TEST_REPORT.md
+    ├── GUI_FACE_PLAYER_USAGE.md
+    ├── LONG_MOVIE_TEST_SUMMARY.md
+    └── SPEAKER_PLAYER_GUIDE.md
+```
+
+---
+
+---
+
+## 4. Qdrant 聲紋向量儲存
+
+### 4.1 儲存流程
+
+```
+Step 4 輸出: 每個 refined segment 有 {embedding: [192-dim], text, language, start, end}
+Step 5 輸出: 每個 segment 被標上 speaker_id {SPEAKER_0, SPEAKER_1, ...}
+
+Step 6: Qdrant 儲存
+  ┌─ 每個 segment → Qdrant point
+  │   point_id = hash(file_uuid + "_" + segment_index)  ← 可重複查詢
+  │   vector   = embedding (192-dim)
+  │   payload  = {
+  │     "file_uuid":   str,     ← 影片識別碼
+  │     "speaker_id":  str,     ← 聚類後填入
+  │     "text":        str,     ← ASR 轉錄結果
+  │     "language":    str,     ← 語種 (zh/en/...)
+  │     "start_time":  f64,     ← 秒
+  │     "end_time":    f64,     ← 秒
+  │     "type":        "speaker_embedding"  ← 便於區分
+  │   }
+  └─
+```
+
+### 4.2 Qdrant Collection
+
+| 項目 | 內容 |
+|------|------|
+| Collection Name | `momentry_speaker` (或共用現有 collection) |
+| Vector Dimension | 192 (ECAPA-TDNN 輸出) |
+| Distance Metric | Cosine |
+| Point ID | `hash(file_uuid + "_" + segment_index)` |
+
+### 4.3 Rust `upsert_speaker_embedding`
+
+```rust
+impl QdrantDb {
+    pub async fn upsert_speaker_embedding(
+        &self,
+        point_id: u64,
+        vector: &[f32],
+        file_uuid: &str,
+        speaker_id: &str,
+        text: &str,
+        language: &str,
+        start_time: f64,
+        end_time: f64,
+    ) -> Result<()> {
+        // Qdrant PUT /collections/{collection}/points?wait=true
+        // payload: {file_uuid, speaker_id, text, language, start_time, end_time, type: "speaker_embedding"}
+    }
+}
+```
+
+### 4.4 與現有 Face Embedding 的關係
+
+| 類別 | Qdrant Collection | Dim | Payload |
+|------|-------------------|-----|---------|
+| Face | `momentry` (self.collection_name) | 512 (FaceNet) | `file_uuid, trace_id, frame_number` |
+| **Speaker** | `momentry` 或獨立 collection | **192** (ECAPA-TDNN) | `file_uuid, speaker_id, text, language, start_time, end_time` |
+
+---
+
+## 5. 模組詳細設計
+
+### 5.1 `vad.py` — 語音活動檢測
+
+| 項目 | 內容 |
+|------|------|
+| 模型 | Silero VAD (torch.hub, snakers4/silero-vad) |
+| 現有函數 | `load_vad_model()`, `extract_speech_segments()` |
+| **新增函數** | **`scan_within_segment(wav, start_sec, end_sec, model, utils, min_speech_duration_ms=500)`** |
+
+`scan_within_segment` 作用：
+- 在一個時間範圍 `[start_sec, end_sec]` 內執行 VAD 掃描
+- 只回傳該範圍內的語音子片段 `[(s1, e1), (s2, e2), ...]`
+- 利用句間停頓切分，解決 whisper 合併問題
+
+### 5.2 `whisper_local.py` 🆕 — Whisper 封裝
+
+| 項目 | 內容 |
+|------|------|
+| 模型 | `whisper.load_model("base")` (可設定) |
+| 函數 | `load_model()`, `transcribe_segment(wav, sample_rate, start_sec, end_sec, model)` |
+
+```python
+def transcribe_segment(wav, sample_rate, start_sec, end_sec, model) -> dict:
+    """轉錄單一段落，回傳 {text, language, lang_prob, segments}"""
+```
+
+每段獨立轉錄，保留語言與信心度。
+
+### 5.3 `speaker_encoder.py` — 聲紋編碼器
+
+| 項目 | 內容 |
+|------|------|
+| 模型 | SpeechBrain ECAPA-TDNN (`spkrec-ecapa-voxceleb`) |
+| 輸出維度 | 192-dim |
+| EER | 0.80% (VoxCeleb1) |
+| 授權 | MIT (不需要 HuggingFace token) |
+| 函數 | `load_speaker_encoder()`, `extract_speaker_embedding()`, `extract_speaker_embeddings_batch()` |
+
+### 5.4 `speaker_cluster_fixed.py` — 說話人聚類
+
+| 項目 | 內容 |
+|------|------|
+| 演算法 | AgglomerativeClustering (cosine + average linkage) |
+| 取代 | `speaker_cluster.py` (SpectralClustering, NaN 問題) |
+| 函數 | `robust_speaker_clustering(embeddings, n_speakers=None, max_speakers=10)` |
+
+### 5.5 `main_fixed.py` 🔧 — 核心調度器（7 步 Pipeline）
+
+```python
+class SelfASRXFixed:
+    def process(self, audio_path, output_path=None, file_uuid=None):
+        """
+        7 步 speaker diarization pipeline
+        
+        Steps:
+          1. whisper.transcribe(audio) → rough segments + text + language
+          2. VAD scan each rough segment → refined segments
+          3. whisper per refined segment → {text, language, lang_prob}
+          4. ECAPA-TDNN per refined segment → 192-dim embeddings
+          5. AgglomerativeClustering → speaker_labels
+          6. Store all embeddings in Qdrant (if file_uuid provided)
+             payload: {file_uuid, speaker_id, text, language, start_time, end_time, type: "speaker_embedding"}
+          7. High-quality embeddings (quality > threshold) → classify + store reference
+             payload: {type: "speaker_reference", file_uuid, speaker_id, n_segments, avg_quality, ...}
+        
+        Returns:
+            {
+                "segments": [
+                    {
+                        "start": float, "end": float,
+                        "text": str, "language": str,
+                        "lang_prob": float, "speaker": str,
+                        "speaker_id": str, "quality": float
+                    },
+                    ...
+                ],
+                "speaker_stats": {...},
+                "n_speakers": int,
+                "total_duration": float,
+                "references": [
+                    {
+                        "speaker_id": str,
+                        "n_segments": int,
+                        "avg_quality": float,
+                        "gender": str
+                    }
+                ]
+            }
+        """
+    
+    def _store_speaker_embeddings(self, segments, file_uuid):
+        """Step 6: 每個 segment 的 192-dim embedding 存入 Qdrant"""
+    
+    def _classify_high_quality_speakers(self, segments, embeddings, labels, file_uuid):
+        """Step 7: 高品質聲紋分級 + 分類 → Qdrant reference profile"""
+```
+**移除**：
+
+| 舊方法 | 原因 |
+|--------|------|
+| `process_with_segments(audio, asr_segments)` | 外部 ASR 邊界來源不可靠，被 VAD 取代 |
+| `process()` VAD-only fallback | 無文字輸出，被完整 pipeline 取代 |
+
+### 5.6 `speaker_classifier.py` 🆕 — 高品質聲紋分級與分類
+
+#### 目的
+
+聚類後，對每個 cluster 的 embedding 進行品質評估，高於閾值的獨立建檔，並用外部模型做自動分類。
+
+#### 流程
+
+```
+Step ⑤ 聚類後，每個 segment 有 {embedding, speaker_id}
+  │
+  └─ Compute quality score per embedding
+      │
+      ├─ 低於閾值 → 寫入 Qdrant (一般 speaker_embedding)
+      │
+      └─ 高於閾值 (quality > 0.85)
+          ├─ 獨立建 reference profile
+          └─ 送入「支持聲音的模型」做分類
+              ├─ 語者性別 (male/female)
+              ├─ 語種口音 (zh-CN / zh-TW / en-US)
+              └─ 或跨影片 speaker 匹配用
+```
+
+#### Quality Score 計算
+
+```python
+def compute_embedding_quality(embeddings, labels, threshold=0.85):
+    """
+    每個 embedding 到所屬 cluster centroid 的餘弦相似度
+    
+    Args:
+        embeddings: [n_segments, 192]
+        labels: [n_segments] 聚類標籤
+        threshold: 高品質門檻
+    
+    Returns:
+        qualities: [n_segments] 每個 embedding 的品質分數
+        high_quality_mask: [n_segments] bool 陣列
+    """
+    from sklearn.metrics.pairwise import cosine_similarity
+    
+    unique_labels = set(labels)
+    centroids = {}
+    for label in unique_labels:
+        mask = labels == label
+        centroid = np.mean(embeddings[mask], axis=0)
+        centroid = centroid / np.linalg.norm(centroid)
+        centroids[label] = centroid
+    
+    qualities = []
+    for i, (emb, label) in enumerate(zip(embeddings, labels)):
+        sim = cosine_similarity([emb], [centroids[label]])[0][0]
+        qualities.append(sim)
+    
+    return np.array(qualities), np.array(qualities) >= threshold
+```
+
+#### Reference Profile 格式
+
+```json
+{
+    "point_id": "hash('speaker_reference_' + file_uuid + '_' + speaker_id + '_' + cluster_index)",
+    "vector": "[192-dim centroid embedding]",
+    "payload": {
+        "type": "speaker_reference",
+        "file_uuid": "來源影片",
+        "speaker_id": "SPEAKER_0",
+        "n_segments": 25,
+        "avg_quality": 0.92,
+        "total_duration": 45.3,
+        "language": "zh",
+        "gender": "male",
+        "text_samples": ["今天天氣很好", "我覺得也不錯", "..."]
+    }
+}
+```
+
+#### 支援的聲音分類模型（選項）
+
+| 模型 | 用途 | 優點 | 缺點 |
+|------|------|------|------|
+| **SpeechBrain gender classifier** | 性別分類 | 已整合 ECAPA-TDNN | 只分 male/female |
+| **CLAP** (LAION) | 零樣本音頻分類 | 可自訂 label text | 需額外安裝 |
+| **YAMNet** | 聲音事件分類 | Google 出品，521 classes | 不擅長語者屬性 |
+| **Wav2Vec2-BERT** (speechbrain) | 情感/屬性 | 多維度分類 | 模型較大 |
+| **自建 identity classifier** | 跨影片 speaker 匹配 | 與現有 identity 系統對接 | 需累積 reference data |
+
+> **待決定**: 選擇哪個分類模型，由後續 POC 決定。
+
+#### `main_fixed.py` 新增方法
+
+```python
+class SelfASRXFixed:
+    # ... 既有 6 個步驟 ...
+
+    def _classify_high_quality_speakers(self, segments, embeddings, labels, file_uuid):
+        """
+        步驟 7: 高品質聲紋分級與分類
+        
+        1. 計算 quality score
+        2. 高於閾值者建立 reference profile
+        3. 用分類模型推論性別/屬性
+        4. 寫入 Qdrant (type: speaker_reference)
+        """
+        qualities, mask = compute_embedding_quality(embeddings, labels)
+        
+        for i, (seg, emb, label, quality, is_high) in enumerate(
+            zip(segments, embeddings, labels, qualities, mask)
+        ):
+            seg["quality"] = float(quality)
+            if is_high:
+                profile = self._build_reference_profile(
+                    emb, seg, file_uuid
+                )
+                # 分類 (placeholder)
+                # gender = classify_gender(embedding)
+                self._store_speaker_reference(profile)
+```
+
+### 5.7 `asrx_processor.py` — 清理後的 wrapper
+
+清理項目：
+
+| 問題 | 位置 | 修法 |
+|------|------|------|
+| 硬編碼 UUID `dd61fda8...` | line 155 | 移除該 fallback path |
+| `os.chdir(script_dir)` | line 112 | 改區域性 Path 操作 |
+| ASR 文字丟棄 | line 258 | `text` 來自新 pipeline |
+| `_debug` dict | line 222 | 移除 |
+| `max_speakers=10` 寫死 | line 201 | 改 CLI 參數 `--max-speakers` |
+| 載入外部 ASR segments | line 148-174 | 移除（不再需要） |
+
+---
+
+## 6. 輸出格式
+
+### 6.1 ASRX JSON Output (由 `asrx_processor.py` 寫入)
+
+> **注意**: 192-dim embedding 不在此 JSON 中。embedding 在 Python 端直接送入 Qdrant，JSON 只保留中繼資料。
+
+```json
+{
+    "language": "zh",
+    "segments": [
+        {
+            "start_time": 0.0,
+            "end_time": 2.0,
+            "start_frame": 0,
+            "end_frame": 60,
+            "text": "今天天氣很好",
+            "speaker_id": "SPEAKER_0",
+            "language": "zh",
+            "lang_prob": 0.98
+        },
+        {
+            "start_time": 2.0,
+            "end_time": 3.5,
+            "start_frame": 60,
+            "end_frame": 105,
+            "text": "我覺得也不錯",
+            "speaker_id": "SPEAKER_1",
+            "language": "zh",
+            "lang_prob": 0.97
+        }
+    ],
+    "n_speakers": 2,
+    "speaker_stats": {
+        "SPEAKER_0": {"count": 1, "duration": 2.0},
+        "SPEAKER_1": {"count": 1, "duration": 1.5}
+    }
+}
+```
+
+### 6.2 Qdrant Point 格式 (由 Python `_store_speaker_embeddings` 寫入)
+
+> Embedding 不經過 Rust，直接在 Python 端完成 Qdrant HTTP PUT。
+
+| Qdrant 欄位 | 值 | 說明 |
+|-------------|-----|------|
+| `id` | `hash(file_uuid + "_" + segment_index)` | 可重複查詢的 point ID |
+| `vector` | `[f32; 192]` | ECAPA-TDNN 聲紋向量 |
+| `payload.file_uuid` | `str` | 影片識別碼 |
+| `payload.speaker_id` | `str` | 聚類後的 speaker 標籤 |
+| `payload.text` | `str` | 該段的轉錄文字 |
+| `payload.language` | `str` | 語種 (`zh`/`en`) |
+| `payload.start_time` | `f64` | 開始時間(秒) |
+| `payload.end_time` | `f64` | 結束時間(秒) |
+| `payload.type` | `"speaker_embedding"` | 便於與 face_embedding 區分 |
+
+### 6.3 Rust `AsrxResult` 對應
+
+```rust
+pub struct AsrxSegment {
+    pub start_time: f64,       // serde(alias = "start")
+    pub end_time: f64,         // serde(alias = "end")
+    pub start_frame: u64,      // default 0
+    pub end_frame: u64,        // default 0
+    pub text: String,
+    pub speaker_id: Option<String>,
+    pub language: Option<String>,    // 🆕 新增
+    pub lang_prob: Option<f64>,     // 🆕 新增
+}
+```
+
+---
+
+## 7. Rust 端變動
+
+| 檔案 | 變動 |
+|------|------|
+| `src/core/processor/asrx.rs` | `asrx_processor_v2.py` → `asrx_processor.py` |
+| `src/core/processor/asrx.rs` | `AsrxSegment` 新增 `language`, `lang_prob` 欄位 |
+| `src/core/processor/asrx.rs` | 傳遞 `--file-uuid` 給 Python 腳本，讓 Python 端可直接寫入 Qdrant |
+| `src/core/chunk/rule1_ingest.rs` | 若 `pre_chunks` data 含 `language` 則帶入 chunk metadata |
+| `src/core/db/qdrant_db.rs` | 🆕 新增 `upsert_speaker_embedding()` 方法 (可選，若 Python 端直接寫 Qdrant 則不需) |
+
+---
+
+## 8. 遷移計畫
+
+### 實作順序 (依賴關係排序)
+
+| 步驟 | 內容 | 檔案 | 風險 |
+|------|------|------|------|
+| **S1** | `vad.py`: 新增 `scan_within_segment()` | `asrx_self/vad.py` | 低 |
+| **S2** | 🆕 `whisper_local.py`: 封裝 whisper 載入 + 轉錄 | `asrx_self/whisper_local.py` | 低 |
+| **S3** | 🔧 `main_fixed.py`: 重寫為 7 步 pipeline | `asrx_self/main_fixed.py` | 中 |
+| **S4** | 🆕 `speaker_classifier.py`: 性別分類器 | `asrx_self/speaker_classifier.py` | 低 |
+| **S5** | 🔧 `custom.py` cleanup + rename → `asrx_processor.py` | `asrx_processor_custom.py` | 低 |
+| **S6** | 🔧 Rust `asrx.rs`: 改指向 + 傳 `--file-uuid` | `src/core/processor/asrx.rs` | 低 |
+| **S7** | ✅ 驗證：build + playground 測試 | — | 中 |
+| **S8** | 🧹 刪除變體 + 搬離工具 | — | 低 |
+
+### 驗證標準
+
+1. `cargo build` 通過
+2. Playground 3003: 註冊影片 → ASRX processor 完成
+3. 輸出 JSON 中 `speaker_id` 非 `null`
+4. Qdrant collection 有 `speaker_embedding` 點
+5. 性別正確標記 (male/female)
+
+---
+
+## 9. 版本歷史
+
+| 版本 | 日期 | 修改者 | 說明 |
+|------|------|--------|------|
+| V1.0 | 2026-06-01 | OpenCode | 初始版本：7 步 hybrid pipeline + Qdrant 聲紋儲存 + 高品質分類 |
diff --git a/docs_v1.0/DESIGN/Modular_Doc_System_V1.0.md b/docs_v1.0/DESIGN/Modular_Doc_System_V1.0.md
new file mode 100644
index 0000000..2fbe927
--- /dev/null
+++ b/docs_v1.0/DESIGN/Modular_Doc_System_V1.0.md
@@ -0,0 +1,385 @@
+---
+document_type: "design"
+service: "MOMENTRY_CORE"
+title: "模組生成式文件產出系統"
+date: "2026-05-17"
+version: "V1.0"
+status: "active"
+owner: "M5"
+created_by: "OpenCode"
+tags:
+  - "documentation"
+  - "modular"
+  - "generated-docs"
+  - "workspace"
+ai_query_hints:
+  - "查詢模組生成式文件產出系統的設計理念"
+  - "如何使用 API_WORKSPACE"
+  - "如何新增 API endpoint 文檔"
+  - "make deploy 流程"
+  - "自定義交付文件"
+related_documents:
+  - "STANDARDS/USER_DOCS_STANDARD.md"
+  - "STANDARDS/DOCS_STANDARD.md"
+  - "API_WORKSPACE/README.md"
+  - "API_WORKSPACE/modules/_template.md"
+---
+
+# 模組生成式文件產出系統
+
+| 項目 | 內容 |
+|------|------|
+| 建立者 | OpenCode |
+| 建立時間 | 2026-05-17 |
+| 文件版本 | V1.0 |
+| 目標讀者 | developer, documentation maintainer |
+
+---
+
+## 版本歷史
+
+| 版本 | 日期 | 目的 | 操作人 |
+|------|------|------|--------|
+| V1.0 | 2026-05-17 | 建立設計文件 | OpenCode |
+
+---
+
+## 1. 設計理念
+
+### 1.1 痛點
+
+傳統 API 文件維護有常見問題：
+
+| 問題 | 具體表現 |
+|------|----------|
+| **內容重複** | 同一個 endpoint 在快速參考、完整手冊、教育訓練文件中寫三次 |
+| **更新遺漏** | 修改 curl 範例後，忘記同步到另一份文件 |
+| **交付僵化** | 無法按對象產出不同版本的 API 文件 |
+| **版本失靈** | YAML frontmatter 版本號與實際內容脫節 |
+
+### 1.2 核心原則
+
+```
+單一真理源（modules/）→ 組裝引擎（assemble_docs.sh）→ 多種交付產品（GUIDES/）
+
+        編輯       ──→      生成       ──→      部署
+    1 處修改模組      make all      make deploy
+```
+
+| 原則 | 說明 |
+|------|------|
+| **單一真理源** | 每個 endpoint 只在 `modules/` 中定義一次 |
+| **組裝而非撰寫** | 交付文件是 modules 的組合，不是手寫 |
+| **開發與交付分離** | `API_WORKSPACE/` 開發，`GUIDES/` 交付 |
+| **模組為最小可測試單位** | 每個 module 可獨立驗證正確性 |
+| **配置驅動** | `.toml` 配置定義哪些 module 以何種模式組裝成何種輸出 |
+
+### 1.3 檔案類型對照
+
+| 類型 | 角色 | 可編輯 | 位置 |
+|------|------|--------|------|
+| Module (模組) | 不可再拆的內容最小單位 | ✅ 是 | `API_WORKSPACE/modules/` |
+| Config (配方) | 定義組裝規則 | ✅ 是 | `API_WORKSPACE/configs/` |
+| Narrative (敘事) | 非結構化的前言/背景 | ✅ 是 | `API_WORKSPACE/narratives/` |
+| Assembled (產出) | 從模組組裝的交付文件 | ❌ 否（generated） | `API_WORKSPACE/_build/` → `GUIDES/` |
+
+---
+
+## 2. 目錄結構
+
+```
+docs_v1.0/
+├── API_WORKSPACE/                    ← 開發區
+│   ├── modules/                      ← 端點模組（單一真理源）
+│   │   ├── _template.md              ← 模組撰寫規範
+│   │   ├── 01_auth.md                ← 認證、Base URL
+│   │   ├── 02_health.md              ← 健康檢查
+│   │   ├── 03_register.md            ← 註冊、掃描
+│   │   ├── 04_lookup.md              ← 查詢、刪除
+│   │   ├── 05_process.md             ← 處理、進度、任務
+│   │   ├── 06_search.md              ← 搜尋（向量、n8n、視覺）
+│   │   ├── 07_identity.md            ← 身份 CRUD、bind/unbind
+│   │   ├── 08_identity_agent.md      ← Identity Agent
+│   │   ├── 09_tmdb.md                ← TMDb Enrichment
+│   │   ├── 10_pipeline.md            ← Stats、配置、未掛載端點
+│   │   └── 11_error_codes.md         ← 錯誤碼對照表
+│   │
+│   ├── configs/                      ← 組裝配方（每個輸出一份）
+│   │   ├── reference.toml            → API_REFERENCE.md
+│   │   ├── endpoints.toml            → API_ENDPOINTS.md
+│   │   ├── quickref.toml             → API_QUICK_REFERENCE.md
+│   │   ├── errors.toml               → API_ERROR_CODES.md
+│   │   ├── index.toml                → API_INDEX.md
+│   │   ├── marcom.toml               → API_TRAINING_MARCOM.md
+│   │   └── tmdb.toml                   → TMDb_User_Guide.md
+│   │
+│   ├── narratives/                   ← 非端點敘事前言
+│   │   └── marcom_intro.md
+│   │
+│   ├── _build/                       ← 生成暫存區（gitignored）
+│   ├── Makefile                      ← 組裝自動化入口
+│   ├── assemble_docs.sh              ← 組裝引擎
+│   └── README.md                     ← 開發者速查
+│
+├── GUIDES/                           ← 交付區
+│   ├── API_REFERENCE.md              (generated)
+│   ├── API_ENDPOINTS.md              (generated)
+│   ├── API_QUICK_REFERENCE.md        (generated)
+│   ├── API_ERROR_CODES.md            (generated)
+│   ├── API_INDEX.md                  (generated)
+│   ├── API_TRAINING_MARCOM.md        (generated)
+│   ├── TMDb_User_Guide.md            (generated)
+│   ├── Demo_EndToEnd.md              (手寫保留)
+│   ├── Pipeline_API_Demo.md          (手寫保留)
+│   └── ...                           (其他手寫文件)
+│
+├── DESIGN/
+├── REFERENCE/
+├── OPERATIONS/
+├── INTEGRATIONS/
+└── STANDARDS/
+```
+
+---
+
+## 3. 模組規範
+
+### 3.1 檔名規則
+
+- 格式：`NN_<name>.md`（NN = 兩位數排序 01-99）
+- 範例：`03_register.md`, `09_tmdb.md`
+- 依賴序號決定組裝時的 endpoint 順序
+
+### 3.2 Module Metadata 註解
+
+每個 module 開頭必須有 metadata 註解：
+
+```markdown
+<!-- module: auth -->
+<!-- description: Authentication, API Key, Base URL configuration -->
+<!-- depends: -->
+```
+
+| 欄位 | 必填 | 說明 |
+|------|------|------|
+| `module` | Yes | 唯一名稱，不含空格，且不以數字開頭 |
+| `description` | Yes | 一句話說明 |
+| `depends` | No | 依賴的其他 module 名稱（逗號分隔） |
+
+### 3.3 Endpoint 結構
+
+每個 endpoint 必須使用一致結構：
+
+````markdown
+### `METHOD /path/to/endpoint`
+
+**Auth**: Required / Optional / Public
+**Scope**: file-level / identity-level / system-level
+
+#### Request Parameters
+
+| Field | Type | Required | Default | Description |
+|-------|------|----------|---------|-------------|
+
+#### Example
+
+```bash
+curl -s -X METHOD "$API/path" \
+  -H "X-API-Key: $KEY" \
+  -d '{"field": "value"}'
+```
+
+#### Response (200)
+
+```json
+{ ... }
+```
+
+#### Error Codes
+
+| Code | HTTP | When |
+|------|------|------|
+````
+
+
+### 3.4 變數規則
+
+| 變數 | 用途 | 範例值 |
+|------|------|--------|
+| `$API` | Base URL | `http://localhost:3003` |
+| `$KEY` | API Key | `your-api-key-here` |
+| `$FILE_UUID` | File UUID | `3a6c1865...` |
+| `$IDENTITY_UUID` | Identity UUID | `a9a90105...` |
+
+---
+
+## 4. 組裝引擎
+
+### 4.1 `assemble_docs.sh`
+
+Shell 腳本，接收三個參數：
+
+| 參數 | 說明 | 範例 |
+|------|------|------|
+| `--config` | TOML 配方路徑 | `configs/reference.toml` |
+| `--modules` | Module 目錄 | `modules/` |
+| `--build` | 輸出目錄 | `_build/` |
+
+### 4.2 三種組裝模式
+
+| mode | 行為 | 適用 |
+|------|------|------|
+| `full` | 完整包含 module 全部內容（除 metadata） | API_REFERENCE, API_ENDPOINTS |
+| `summary` | 僅擷取 endpoint 表格 + curl 範例 | API_QUICK_REFERENCE |
+| `index` | 生成文件總覽（掃描 modules 目錄自動產生索引） | API_INDEX |
+
+### 4.3 組裝流程
+
+```
+1. 讀取 config.toml → 解析 title, modules, mode, narrative
+2. 生成 YAML frontmatter（含 document_type, date, version）
+3. 生成 title heading + info block
+4. （可選）生成 TOC：從 modules 的 ## headings 產生目錄
+5. （可選）插入 narrative intro
+6. 遍歷 modules：
+   - full mode: 複製整份內容（跳過 <!-- --> 註解）
+   - summary mode: 只提取 | table | + ```bash code block
+   - index mode: 自動掃描 modules 目錄生成清單
+7. 寫入 _build/ 輸出檔案
+```
+
+---
+
+## 5. 配方格式（config.toml）
+
+```toml
+title = "輸出文件標題"
+output = "_build/FILENAME.md"     # 輸出路徑（相對於 API_WORKSPACE）
+mode = "full"                      # full | summary | index
+modules = ["01_auth", "03_register"]  # 要包含的 module 名稱
+narrative = "narratives/xxx.md"   # （可選）包含的敘事前言
+toc = true                         # （可選）是否生成目錄
+
+[frontmatter]
+document_type = "api_reference"    # 用於 YAML frontmatter
+service = "MOMENTRY_CORE"
+version = "V1.0"
+owner = "M5"
+created_by = "OpenCode"
+```
+
+### 內建配方一覽
+
+| 檔案 | 輸出 | Modules | Mode |
+|------|------|---------|------|
+| `reference.toml` | API_REFERENCE.md | 01-11 | full |
+| `endpoints.toml` | API_ENDPOINTS.md | 01-10 | full |
+| `quickref.toml` | API_QUICK_REFERENCE.md | 01-06,09 | summary |
+| `errors.toml` | API_ERROR_CODES.md | 11 | full |
+| `index.toml` | API_INDEX.md | (auto) | index |
+| `marcom.toml` | API_TRAINING_MARCOM.md | 01,03,06 + narrative | full |
+| `tmdb.toml` | TMDb_User_Guide.md | 01,03,09 | full |
+
+---
+
+## 6. 工作流程
+
+### 6.1 日常修改
+
+```bash
+# 1. 編輯模組
+cd API_WORKSPACE
+vim modules/09_tmdb.md
+
+# 2. 重新生成單一文件
+make tmdb
+
+# 3. 預覽結果
+less _build/TMDb_User_Guide.md
+
+# 4. 部署
+make deploy
+```
+
+### 6.2 新增端點
+
+```bash
+# 1. 找到所屬模組
+ls modules/
+# 決定該 endpoint 屬於哪個模組（如 tmdb, identity, search）
+
+# 2. 在對應模組加入 endpoint 文檔
+vim modules/09_tmdb.md
+
+# 3. 重新生成所有文件
+make all
+
+# 4. 確認所有引用此端點的文件都有正確更新
+make check
+
+# 5. 部署
+make deploy
+```
+
+### 6.3 客製化交付
+
+```bash
+# 新增一個客製化配方
+cat > configs/integration_partner.toml << TOML
+title = "Integration Partner API Guide"
+output = "_build/PARTNER_GUIDE.md"
+mode = "full"
+modules = ["01_auth", "06_search", "09_tmdb", "11_error_codes"]
+toc = true
+[frontmatter]
+document_type = "user_manual"
+service = "MOMENTRY_CORE"
+version = "V1.0"
+owner = "M5"
+created_by = "OpenCode"
+TOML
+
+# 在 Makefile 中加入對應 target
+echo "partner:" >> Makefile
+echo '	@$(SCRIPT) --config configs/integration_partner.toml --modules $(MODULES) --build $(BUILD)' >> Makefile
+
+# 生成
+make partner
+
+# 部署
+make deploy
+```
+
+---
+
+## 7. 交付客製化對照表
+
+| 對象 | 需要 modules | make target | 輸出 |
+|------|-------------|-------------|------|
+| API Developer | 01-11 (all) | `make reference` | API_REFERENCE.md |
+| Quick Start User | 01-06,09 | `make quickref` | API_QUICK_REFERENCE.md |
+| Marcom Team | 01,03,06 + narrative | `make marcom` | API_TRAINING_MARCOM.md |
+| TMDb User | 01,03,09 | `make tmdb` | TMDb_User_Guide.md |
+| Integration Partner | 01,06,09,11 | Custom config | PARTNER_GUIDE.md |
+
+---
+
+## 8. GUIDES/ 文件類型說明
+
+| 類型 | 來源 | 說明 |
+|------|------|------|
+| `API_*.md`, `TMDb_User_Guide.md` (7 files) | Generated from API_WORKSPACE | API 功能文件，endpoint 列表 + curl 範例 |
+| `Demo_*.md`, `M5API_*.md` | 手寫 | 敘事性指引，含完整 step-by-step 流程 |
+| `PORTAL_*.md` | 手寫 | Portal 開發計畫與 Demo 指引 |
+| `USER_MANUAL.md` | 手寫 | 系統操作使用手冊 |
+
+> **提醒**：不要直接修改 GUIDES/ 中的 generated files。修改應在 API_WORKSPACE/modules/ 中進行，然後執行 `make deploy`。
+
+---
+
+## 相關文件
+
+- `API_WORKSPACE/README.md` — 開發者快速上手指南
+- `API_WORKSPACE/modules/_template.md` — 模組撰寫範本
+- `STANDARDS/DOCS_STANDARD.md` — 文件創建規範
+- `STANDARDS/USER_DOCS_STANDARD.md` — 使用者文件規範
diff --git a/docs_v1.0/DESIGN/REPRESENTATIVE_FRAME_API_V1.md b/docs_v1.0/DESIGN/REPRESENTATIVE_FRAME_API_V1.md
new file mode 100644
index 0000000..d96cfab
--- /dev/null
+++ b/docs_v1.0/DESIGN/REPRESENTATIVE_FRAME_API_V1.md
@@ -0,0 +1,128 @@
+# Representative Frame API V1.0
+
+Portal 影片代表畫面 API — 沒有指定 frame_number 時自動偵測男女主角找到最佳互動 frame。
+
+---
+
+## 1. Overview
+
+### Purpose
+
+Portal 需要為每個影片顯示一張代表畫面（thumbnail），內容應為該影片最具代表性的 scene — 通常包含男女主角同框且互看的時刻。
+
+### Principle
+
+**沒有指定 frame_number → auto-detect representative frame**
+
+既有端點不需改動，只需在 `frame` 參數為空時自動偵測。
+
+---
+
+## 2. Endpoint
+
+### `GET /api/v1/file/:file_uuid/thumbnail`
+
+**Query Parameters**:
+
+| Param | Type | Required | Description |
+|-------|------|----------|-------------|
+| `frame` | i64 | ❌ | 指定 frame；不傳則 auto-detect |
+| `x` | i32 | ❌ | bbox crop x |
+| `y` | i32 | ❌ | bbox crop y |
+| `w` | i32 | ❌ | bbox crop width |
+| `h` | i32 | ❌ | bbox crop height |
+
+**Response**: Pure JPEG bytes (Content-Type: image/jpeg)
+
+**Examples**:
+```
+GET /api/v1/file/:uuid/thumbnail                     → auto-detect
+GET /api/v1/file/:uuid/thumbnail?frame=38165         → 指定 frame
+GET /api/v1/file/:uuid/thumbnail?frame=38165&x=723&y=205&w=221&h=221  → 指定 crop
+```
+
+---
+
+## 3. Internal Algorithm
+
+### Auto-detect Fallback Chain
+
+```
+Step 1: Auto-detect 主角 (top 2 by face count)
+  └─ face_detections JOIN identities
+
+Step 2: TKG Bridge — mutual_gaze?
+  ├── 有 mutual_gaze edge → first_frame ✅
+  └── 無 → face_detections 第一次同框 frame ✅
+
+Step 3: 只有一個主角?
+  └─ 該主角 face_quality (w×h×confidence) 最高 frame
+
+Step 4: 完全無 identity?
+  └─ 任一 face 的 face_quality 最高 frame
+
+Step 5: 完全無 face?
+  └─ 404 "No faces in this file"
+```
+
+### TKG Bridge Query
+
+```sql
+-- 找兩主角各自的 main trace
+SELECT trace_id FROM face_detections
+WHERE file_uuid = $1 AND identity_id = $2 AND trace_id IS NOT NULL
+GROUP BY trace_id ORDER BY COUNT(*) DESC LIMIT 1;
+
+-- TKG mutual_gaze 查詢
+SELECT (e.properties->>'first_frame')::bigint
+FROM tkg_edges e
+JOIN tkg_nodes a ON a.id = e.source_node_id
+JOIN tkg_nodes b ON b.id = e.target_node_id
+WHERE e.file_uuid = $1
+  AND a.external_id = concat('trace_', $4)
+  AND b.external_id = concat('trace_', $5)
+  AND e.properties->>'mutual_gaze' = 'true'
+LIMIT 1;
+
+-- Fallback: 第一次同框
+SELECT MIN(fd_a.frame_number)::bigint
+FROM face_detections fd_a
+JOIN face_detections fd_b ON fd_a.frame_number = fd_b.frame_number AND fd_b.file_uuid = fd_a.file_uuid
+WHERE fd_a.file_uuid = $1 AND fd_a.identity_id = $2 AND fd_b.identity_id = $3;
+```
+
+---
+
+## 4. Implementation
+
+### Files Changed
+
+| File | Change |
+|------|--------|
+| `src/api/media_api.rs` | `ThumbQuery.frame` → `Option<i64>`; add auto-detect fallback |
+| `src/core/processor/tkg.rs` | Add `query_auto_representative_frame()` + structs (已實作) |
+| `src/core/processor/mod.rs` | Export new function + structs (已實作) |
+
+### Existing Trace-level Endpoints (不變)
+
+```
+GET /api/v1/file/:uuid/trace/:tid/representative-face  → JSON (legacy)
+GET /api/v1/file/:uuid/trace/:tid/thumbnail             → JPEG (auto via select_rep_face)
+```
+
+### No Changes
+
+- ❌ No new DB tables / migrations
+- ❌ No changes to `select_rep_face` / blurdetect
+- ❌ No chunk / cut / pre_chunks dependency
+
+---
+
+## 5. Version History
+
+| Date | Version | Author | Change |
+|------|---------|--------|--------|
+| 2026-05-22 | 1.0 | OpenCode | Initial design |
+| 2026-05-22 | 1.1 | OpenCode | 簡化為單一 endpoint: frame 為 None 時 auto-detect |
+
+*Updated: 2026-05-22*
diff --git a/docs_v1.0/DESIGN/Redis_Progress_Reporting_V1.0.md b/docs_v1.0/DESIGN/Redis_Progress_Reporting_V1.0.md
new file mode 100644
index 0000000..0d35b62
--- /dev/null
+++ b/docs_v1.0/DESIGN/Redis_Progress_Reporting_V1.0.md
@@ -0,0 +1,270 @@
+---
+document_type: "design_doc"
+service: "MOMENTRY_CORE"
+title: "Redis Progress Reporting V1.0"
+version: "V1.0"
+date: "2026-05-17"
+author: "M5"
+status: "draft"
+---
+
+# Redis Progress Reporting V1.0
+
+| 項目 | 內容 |
+|------|------|
+| Service | `MOMENTRY_CORE` |
+| Version | V1.0 |
+| Date | 2026-05-17 |
+| Author | M5 (OpenCode) |
+| Status | Draft |
+
+## 1. Overview
+
+This document defines the standardized progress reporting architecture for Momentry Core processors. It replaces the inconsistent ad-hoc progress patterns found across `scripts/`, `src/worker/`, and `src/api/`.
+
+### 1.1 Problems Addressed
+
+| # | Problem | Detail |
+|---|---------|--------|
+| 1 | Worker Redis key does not match `OPERATIONS/MOMENTRY_CORE_REDIS_KEYS.md` V1.0 spec | Worker writes `worker:job:{uuid}:processor:{name}` instead of spec `job:{uuid}:processor:{name}` |
+| 2 | Progress API reads wrong key | `get_progress()` reads `worker:job:{uuid}:processor:{name}` — inconsistent with the Playground subscriber, which writes `job:{uuid}:processor:{name}` |
+| 3 | Swift processors (Face/OCR/Pose) lack RedisPublisher | Progress lost — only stdout text |
+| 4 | ASRX/Story/Visual chunk have no incremental progress | Start + complete only, no `current/total` updates |
+| 5 | `frames_processed` / `chunks_produced` never updated in real-time | Worker only writes processor hash at start and exit |
+| 6 | No `output_count` / `output_type` fields | Impossible to know how many faces/objects/segments were produced |
+
+### 1.2 Key Design Decisions
+
+| Decision | Rationale |
+|----------|-----------|
+| Progress unit = frames for video processors | All media-level processors work frame by frame |
+| Output count separate from progress | Processors may produce N outputs per frame (multiple faces, objects) |
+| Pub/sub for real-time, Hash for final state | Pub/sub is transient; Hash persists for API queries |
+
+---
+
+## 2. Redis Key Architecture
+
+### 2.1 Key Patterns
+
+All keys use the configured `REDIS_KEY_PREFIX` (default: `momentry:` for production, `momentry_dev:` for playground).
+
+| Pattern | Type | TTL | Purpose | Owner |
+|---------|------|-----|---------|-------|
+| `{prefix}progress:{uuid}` | Pub/Sub | — | Real-time progress messages | Python scripts |
+| `{prefix}job:{uuid}` | Hash | 24h | Per-video job state | Worker |
+| `{prefix}job:{uuid}:processor:{name}` | Hash | 24h | Per-processor final state | Worker |
+| `{prefix}job:{uuid}:processor:{name}:output_count` | String | 24h | Output count by type | Worker |
+
+### 2.2 Processor Hash Fields
+
+```
+{prefix}job:{uuid}:processor:{name}
+├── status          String   running / completed / failed / pending
+├── current         u32      Units processed (frames for video processors)
+├── total           u32      Total units
+├── output_count    u32      Output items produced (faces, objects, segments)
+├── output_type     String   Type name of output: faces / objects / segments / cuts / etc.
+├── pid             i32      OS process ID (0 if not running)
+├── error           String   Error message if failed
+└── updated_at      String   ISO 8601 timestamp
+```
+
+### 2.3 Migrated Keys
+
+The following key patterns from the original implementation are REMOVED:
+
+| Old Key | Reason |
+|---------|--------|
+| `{prefix}worker:job:{uuid}:processor:{name}` | Non-standard prefix — not in `MOMENTRY_CORE_REDIS_KEYS.md` spec |
+| `{prefix}job:{uuid}:processor:{name}:status` (flat) | Redundant — status stored in Hash |
+| `{prefix}job:{uuid}:processor:{name}:progress` (flat) | Replaced by `current` + `total` for percent calculation |
+| `{prefix}job:{uuid}:processor:{name}:current` (flat) | Replaced by Hash fields |
+| `{prefix}job:{uuid}:processor:{name}:total` (flat) | Replaced by Hash fields |
+| `{prefix}job:{uuid}:processor:{name}:started_at` (flat) | Replaced by Hash `updated_at` |
+
+---
+
+## 3. Pub/Sub Message Format
+
+### 3.1 Channel
+
+```
+{prefix}progress:{uuid}
+```
+
+### 3.2 Message JSON
+
+```json
+{
+  "processor": "face",
+  "current": 150,
+  "total": 162696,
+  "output_count": 423,
+  "output_type": "faces",
+  "message": "Processing frame 150",
+  "timestamp": 1700000000
+}
+```
+
+### 3.3 Field Definitions
+
+| Field | Type | Required | Description |
+|-------|------|----------|-------------|
+| `processor` | String | ✅ | Processor name: asr / asrx / yolo / ocr / face / pose / cut / story / visual_chunk |
+| `current` | u32 | ✅ | Units processed (frames for video processors) |
+| `total` | u32 | ✅ | Total units |
+| `output_count` | u32 | ❌ | Output items produced so far |
+| `output_type` | String | ❌ | Type name: faces / objects / segments / cuts / text_regions / persons / speakers / stories / visual_chunks |
+| `message` | String | ❌ | Human-readable progress description |
+| `timestamp` | u64 | ✅ | Unix timestamp in seconds (e.g. `1700000000`) |
+
+---
+
+## 4. Per-Processor Metrics
+
+| Processor | current/total Unit | output_type | When to Publish |
+|-----------|-------------------|-------------|-----------------|
+| ASR | frames | `segments` | Every 100 segments processed |
+| ASRX | frames | `speakers` | Every processing stage |
+| YOLO | frames | `objects` | Every 500 frames |
+| OCR | frames | `text_regions` | Every 5% |
+| Face | frames | `faces` | Every batch (5% of frames) |
+| Pose | frames | `persons` | Every 10% |
+| CUT | frames | `cuts` | Every scene detected |
+| Story | chunks | `stories` | Every chunk processed |
+| Visual chunk | frames | `visual_chunks` | Every chunk processed |
+
+### 4.1 Output Type Enum
+
+```rust
+pub enum OutputType {
+    Segments,       // ASR
+    Speakers,       // ASRX
+    Objects,        // YOLO
+    TextRegions,    // OCR
+    Faces,          // Face
+    Persons,        // Pose
+    Cuts,           // CUT
+    Stories,        // Story
+    VisualChunks,   // Visual chunk
+}
+```
+
+---
+
+## 5. Data Flow
+
+```
+┌──────────────────┐     Pub/Sub                          ┌──────────────────────┐
+│  Python Processor │ ───────── progress:{uuid} ──────────→│  Worker (subscriber) │
+│  (ASR/YOLO/Face)  │     {current, total,                 │                      │
+│                   │      output_count, output_type}       │  ──→ HSET            │
+└──────────────────┘                                       │  job:{uuid}:         │
+                                                           │  processor:{name}    │
+┌──────────────────┐                                       │                      │
+│  Swift Processor  │ ──→ Python wrapper ──→ pub/sub        │  (status, current,   │
+│  (Face/OCR/Pose)  │     (add RedisPublisher)             │   total, output_count,│
+└──────────────────┘                                       │   output_type)       │
+                                                           └──────────┬───────────┘
+                                                                      │ HGETALL
+                                                           ┌──────────▼───────────┐
+                                                           │  Progress API        │
+                                                           │  GET /progress/:uuid │
+                                                           │                     │
+                                                           │  ─→ compute %       │
+                                                           │  ─→ return JSON     │
+                                                           └─────────────────────┘
+```
+
+---
+
+## 6. Implementation Plan
+
+### Phase 1: Python Processor RedisPublisher
+
+| Task | Files | Effort |
+|------|-------|--------|
+| Add `RedisPublisher` to `face_processor.py` | `scripts/face_processor.py` | Medium |
+| Add `RedisPublisher` to `ocr_processor.py` | `scripts/ocr_processor.py` | Medium |
+| Add `RedisPublisher` to `pose_processor.py` | `scripts/pose_processor.py` | Medium |
+| Add incremental `.progress()` to `asrx_processor_custom.py` | `scripts/asrx_processor_custom.py` | Low |
+| Standardize pub/sub message to include `output_count`, `output_type` | All processor scripts | Low |
+
+### Phase 2: Worker
+
+| Task | Files | Effort |
+|------|-------|--------|
+| Fix Redis key from `worker:job:` to `job:` | `src/worker/processor.rs`, `src/core/db/redis_client.rs` | Low |
+| Subscribe to `progress:{uuid}` channel in `run_processor()` | `src/worker/processor.rs` | Medium |
+| HSET Processor Hash on each progress message | `src/worker/processor.rs` | Medium |
+| Set `output_count` and `output_type` from pub/sub message | `src/worker/processor.rs` | Low |
+
+### Phase 3: Progress API
+
+| Task | Files | Effort |
+|------|-------|--------|
+| Read `output_count`, `output_type` from Redis Hash | `src/api/server.rs` | Low |
+| Compute percentage from `current` / `total` | `src/api/server.rs` | Low |
+| Return `output_count`, `output_type` in response JSON | `src/api/server.rs` | Low |
+| Remove `worker:` fallback path | `src/api/server.rs` | Low |
+
+### Phase 4: Cleanup
+
+| Task | Files | Effort |
+|------|-------|--------|
+| Remove old `worker:job:` keys from Redis | Deployment script | Low |
+| Remove `update_processor_progress()` DB path (stale `processing_status` JSONB) | `src/core/db/postgres_db.rs` | Medium |
+
+---
+
+## 7. API Response Changes
+
+### ProgressResponse (new fields)
+
+```json
+{
+  "processors": [
+    {
+      "name": "face",
+      "status": "running",
+      "current": 150,
+      "total": 162696,
+      "progress": 0,
+      "frames_processed": 150,
+      "output_count": 423,
+      "output_type": "faces"
+    }
+  ]
+}
+```
+
+---
+
+## 8. Dependencies
+
+| Component | Version | Role |
+|-----------|---------|------|
+| Redis | ≥ 6.0 | Pub/Sub + Hash storage |
+| `redis_publisher.py` | Existing | Python → Redis pub/sub client |
+| `redis_client.rs` | Existing | Rust Redis client for worker + API |
+
+---
+
+## 9. References
+
+| Doc | Relation |
+|-----|----------|
+| `OPERATIONS/MOMENTRY_CORE_REDIS_KEYS.md` | Parent spec — this doc supersedes sections 4, 7, 8 |
+| `DESIGN/VIDEO_PROCESSING_SPEC.md` §2.3 | Original progress design (ProcessProgress struct) |
+| `src/worker/processor.rs` | Worker progress write implementation |
+| `scripts/redis_publisher.py` | Python pub/sub client |
+| `src/api/server.rs` (get_progress) | Progress API handler |
+
+---
+
+## Version History
+
+| Version | Date | Author | Change |
+|---------|------|--------|--------|
+| V1.0 | 2026-05-17 | M5 (OpenCode) | Initial draft — replaces ad-hoc progress patterns |
diff --git a/docs_v1.0/M4_workspace/2026-05-27_charade_pipeline_checklist.md b/docs_v1.0/M4_workspace/2026-05-27_charade_pipeline_checklist.md
new file mode 100644
index 0000000..6e255bc
--- /dev/null
+++ b/docs_v1.0/M4_workspace/2026-05-27_charade_pipeline_checklist.md
@@ -0,0 +1,242 @@
+---
+title: Charade Full Movie Pipeline Checklist
+version: 1.0
+date: 2026-05-27
+author: M5Max48
+status: in_progress
+---
+
+# Charade Full Movie Pipeline Checklist
+
+**File UUID**: `c3c635e3641da80dde10cc555ffcdda5`
+**File Name**: Charade (1963) Cary Grant & Audrey Hepburn | Comedy Mystery Romance Thriller | Full Movie.mp4
+**Duration**: 6785 seconds (113 minutes)
+**Total Frames**: 169,625
+
+---
+
+## P0: Processor Outputs
+
+### Purpose
+原始處理器輸出檔案，存放在 `/Users/accusys/momentry/output_dev/`。這些是後續 ingestion 的資料來源。
+
+### Processor Details
+
+| Processor | Expected Output | Size Estimate | Purpose | Status |
+|-----------|-----------------|---------------|---------|--------|
+| CUT | `c3c635e3641da80dde10cc555ffcdda5.cut.json` | ~170KB | Scene boundary detection，切割點用於 Rule 3 chunking | ✅ Done |
+| YOLO | `c3c635e3641da80dde10cc555ffcdda5.yolo.json` | ~50-80MB | Object detection，每幀的物件類別與位置 | 🔄 Running |
+| Face | `c3c635e3641da80dde10cc555ffcdda5.face.json` | ~1.5GB | Face detection + 512-dim embedding (FaceNet CoreML) | 🔄 44% |
+| Face Traced | `c3c635e3641da80dde10cc555ffcdda5.face_traced.json` | ~1.2GB | Face tracking，同一人物的連續出現 → trace_id | ⏳ Pending (after Face) |
+| OCR | `c3c635e3641da80dde10cc555ffcdda5.ocr.json` | ~50KB | Text recognition from frames | ❌ Skipped |
+| Pose | `c3c635e3641da80dde10cc555ffcdda5.pose.json` | ~20MB | Body pose estimation | 🔄 Running |
+| ASRX | `c3c635e3641da80dde10cc555ffcdda5.asrx.json` | ~8MB | Speaker diarization，語者分段 | ✅ Done (reuse from public) |
+| Visual Chunk | `c3c635e3641da80dde10cc555ffcdda5.visual_chunk.json` | ~60KB | Visual scene chunk metadata | ✅ Done |
+| Scene | `c3c635e3641da80dde10cc555ffcdda5.scene.json` | ~300B | Scene list from CUT | ✅ Done |
+| Scene Meta | `c3c635e3641da80dde10cc555ffcdda5.scene_meta.json` | ~50KB | Heuristic scene metadata (人物 + 物件統計) | ⏳ Pending |
+| Story LLM | `c3c635e3641da80dde10cc555ffcdda5.story_llm.json` | ~800KB | LLM-generated story summaries per chunk | ✅ Done |
+| Story Story | `c3c635e3641da80dde10cc555ffcdda5.story_story.json` | ~800KB | Story parent-child relationships | ✅ Done |
+| TMDb | `c3c635e3641da80dde10cc555ffcdda5.tmdb.json` | ~5KB | TMDb cast list with face embeddings | ⏳ Pending |
+| 5W1H | `c3c635e3641da80dde10cc555ffcdda5.5w1h.json` | ~500KB | 5W1H agent output (who/when/where/what/why/how) | ✅ Done |
+
+### Key Dependencies
+- Face Traced 需要 Face 完成後才能執行 (face_traced.json = face.json + tracking)
+- Scene Meta 需要 Face + YOLO 完成
+- TMDb 需要 Face Traced 完成後執行 matching
+
+---
+
+## P1: Database Records
+
+### Purpose
+將 processor outputs 存入 PostgreSQL，供 API query 使用。
+
+### Table Details
+
+| Table | Expected Records | Purpose | Verification Query | Status |
+|-------|------------------|---------|-------------------|--------|
+| `dev.videos` | 1 row | Video metadata (duration, fps, status) | `SELECT file_uuid, status FROM dev.videos WHERE file_uuid = 'c3c635e3641da80dde10cc555ffcdda5'` | ✅ Registered |
+| `dev.monitor_jobs` | 1 row | Processing job state machine | `SELECT uuid, status, completed_processors FROM dev.monitor_jobs WHERE uuid = 'c3c635e3641da80dde10cc555ffcdda5'` | 🔄 Running |
+| `dev.pre_chunks` | ~7,000 rows | Raw processor outputs (ASR sentences, YOLO objects, etc.) | `SELECT COUNT(*) FROM dev.pre_chunks WHERE file_uuid = 'c3c635e3641da80dde10cc555ffcdda5'` | ⏳ Pending |
+| `dev.face_detections` | ~70,000 rows | Face detection records (每幀每張臉) | `SELECT COUNT(*) FROM dev.face_detections WHERE file_uuid = 'c3c635e3641da80dde10cc555ffcdda5'` | ⏳ Pending |
+| `dev.face_detections.embedding` | ~70,000 non-NULL | 512-dim FaceNet embedding (用於 identity matching) | `SELECT COUNT(embedding) FROM dev.face_detections WHERE file_uuid = 'c3c635e3641da80dde10cc555ffcdda5'` | ⏳ Pending |
+| `dev.face_detections.trace_id` | ~70,000 non-NULL | Face tracking ID (同一人物跨幀連續出現) | `SELECT COUNT(trace_id) FROM dev.face_detections WHERE file_uuid = 'c3c635e3641da80dde10cc555ffcdda5'` | ⏳ Pending |
+| `dev.face_detections.identity_id` | ~50,000 non-NULL | TMDb identity binding (Audrey, Cary, etc.) | `SELECT COUNT(identity_id) FROM dev.face_detections WHERE file_uuid = 'c3c635e3641da80dde10cc555ffcdda5'` | ⏳ Pending |
+
+### Key Points
+- `embedding` 必須非 NULL 才能進行 TMDb matching (之前 store_traced_faces.py bug 修復)
+- `trace_id` 由 `store_traced_faces.py` 從 face_traced.json 計算
+- `identity_id` 由 `match_faces_to_tmdb.py` 計算 (cosine similarity > 0.5)
+
+---
+
+## P2: Chunk Ingestion
+
+### Purpose
+將 raw processor outputs 轉換為 searchable chunks，用於 RAG query。
+
+### Chunk Types
+
+| Chunk Type | Expected Count | Purpose | Source | Verification Query | Status |
+|------------|----------------|---------|--------|-------------------|--------|
+| sentence (Rule 1) | ~1,700 | Sentence-level chunks for text search | ASR output → sentence split | `SELECT COUNT(*) FROM dev.chunk WHERE file_uuid = 'c3c635e3641da80dde10cc555ffcdda5' AND chunk_type = 'sentence'` | ⏳ Pending |
+| llm_parent | ~800 | LLM-generated summary parent chunks | Story LLM output | `SELECT COUNT(*) FROM dev.chunk WHERE file_uuid = 'c3c635e3641da80dde10cc555ffcdda5' AND chunk_type = 'llm_parent'` | ⏳ Pending |
+| story_parent | ~800 | Story parent chunks (narrative segments) | Story processor | `SELECT COUNT(*) FROM dev.chunk WHERE file_uuid = 'c3c635e3641da80dde10cc555ffcdda5' AND chunk_type = 'story_parent'` | ⏳ Pending |
+| story_child | ~1,700 | Story child chunks (linked to sentence) | Story processor | `SELECT COUNT(*) FROM dev.chunk WHERE file_uuid = 'c3c635e3641da80dde10cc555ffcdda5' AND chunk_type = 'story_child'` | ⏳ Pending |
+| cut (Rule 3) | ~500 | Scene-level chunks for scene search | CUT output → scene boundaries | `SELECT COUNT(*) FROM dev.chunk WHERE file_uuid = 'c3c635e3641da80dde10cc555ffcdda5' AND chunk_type = 'cut'` | ⏳ Pending |
+| trace | ~3,600 | Face trace chunks (identity-centric) | Face Traced output | `SELECT COUNT(*) FROM dev.chunk WHERE file_uuid = 'c3c635e3641da80dde10cc555ffcdda5' AND chunk_type = 'trace'` | ⏳ Pending |
+
+### Ingestion Pipeline
+1. **Rule 1**: ASR → sentence split → chunk + embedding → Qdrant
+2. **Rule 3**: CUT + ASR → scene chunks → chunk + embedding → Qdrant
+3. **Trace**: Face Traced → trace chunks → TKG nodes → Qdrant
+
+### Key Points
+- `start_frame` / `end_frame` 必須正確計算 (之前 bug: frame=0)
+- Chunks 必須有 `embedding` 才能 search
+
+---
+
+## P3: Vector Embeddings
+
+### Purpose
+將 chunks 的 text 轉換為 768-dim embeddings，存入 PostgreSQL + Qdrant，用於 semantic search。
+
+### Embedding Targets
+
+| Target | Expected Count | Model | Purpose | Verification | Status |
+|--------|----------------|-------|---------|--------------|--------|
+| PostgreSQL `dev.chunk.embedding` | ~5,000 | EmbeddingGemma (768-dim) | Text semantic search | `SELECT COUNT(embedding) FROM dev.chunk WHERE file_uuid = 'c3c635e3641da80dde10cc555ffcdda5'` | ⏳ Pending |
+| Qdrant `momentry_dev_rule1_v2` | ~5,000 points | EmbeddingGemma (768-dim) | Fast vector similarity search | `curl -H "api-key: Test3200Test3200Test3200" "http://localhost:6333/collections/momentry_dev_rule1_v2"` | ⏳ Pending |
+| Qdrant `_face` collection | ~70,000 points | FaceNet-512 (512-dim) | Face identity search | Face embeddings sync via `sync_face_embeddings()` | ⏳ Pending |
+
+### Embedding Pipeline
+1. **Text chunks**: `embeddinggemma_server.py` (port 11436) → 768-dim embedding
+2. **Face embeddings**: FaceNet CoreML (from face.json) → 512-dim embedding (已在 P0 產生)
+3. **Sync to Qdrant**: `sync_face_embeddings()` function in Rust
+
+### Key Points
+- Text embeddings 使用 EmbeddingGemma (768-dim，由 local embedding server `embeddinggemma_server.py` 提供)
+- Face embeddings 使用 FaceNet-512 (CoreML ANE accelerated)
+- Qdrant 提供 fast similarity search (cosine similarity)
+
+---
+
+## P4: Identity Binding
+
+### Purpose
+將 detected faces 綁定到 TMDb identities (Audrey Hepburn, Cary Grant, etc.)，用於 identity_text search。
+
+### Identity Matching Pipeline
+
+| Step | Expected Result | Method | Verification | Status |
+|------|-----------------|--------|--------------|--------|
+| TMDb seeds loaded | 23 identities | `tmdb_embed_extractor.py` → TMDb profile face embeddings | `SELECT COUNT(*) FROM dev.identities WHERE source = 'tmdb' AND face_embedding IS NOT NULL` | ✅ Done |
+| Face matching | ~50,000 bindings | `match_faces_to_tmdb.py` → cosine similarity > 0.5 | `SELECT COUNT(identity_id) FROM dev.face_detections WHERE file_uuid = 'c3c635e3641da80dde10cc555ffcdda5' AND identity_id IS NOT NULL` | ⏳ Pending |
+| Audrey Hepburn faces | ~16,000 | Highest similarity match | `SELECT COUNT(*) FROM dev.face_detections fd JOIN dev.identities i ON fd.identity_id = i.id WHERE fd.file_uuid = 'c3c635e3641da80dde10cc555ffcdda5' AND i.name = 'Audrey Hepburn'` | ⏳ Pending |
+| Cary Grant faces | ~5,000 | Second highest match | Same query for Cary Grant | ⏳ Pending |
+
+### Matching Algorithm
+```python
+# match_faces_to_tmdb.py
+for trace_id in traces:
+    for face_embedding in trace_faces:
+        for tmdb_identity in tmdb_identities:
+            similarity = cosine_similarity(face_embedding, tmdb_identity.face_embedding)
+            if similarity >= 0.5:
+                match trace_id → tmdb_identity
+```
+
+### Key Points
+- TMDb seeds 需要 `face_embedding` (之前已驗證: 23 identities with embeddings)
+- Face `embedding` 必須非 NULL (之前 store_traced_faces.py bug 修復)
+- Threshold: 0.5 (可調整)
+
+---
+
+## P5: API Endpoints
+
+### Purpose
+驗證 API endpoints 可以正確返回 identity_text search results。
+
+### API Tests
+
+| Endpoint | Purpose | Expected Response | Test Command | Status |
+|----------|---------|-------------------|--------------|--------|
+| `/api/v1/search/identity_text` | Search chunk text → identities | Results with `identity_name`, `trace_id`, `identity_source` | `curl "http://localhost:3003/api/v1/search/identity_text?file_uuid=c3c635e3641da80dde10cc555ffcdda5&q=Regina&limit=5"` | ⏳ Pending |
+| `/api/v1/identities` | List identities with TMDb | Identity list with `tmdb_id`, `face_embedding` | `curl "http://localhost:3003/api/v1/identities?name=Audrey"` | ⏳ Pending |
+| `/api/v1/progress/:file_uuid` | Check processing progress | JSON with `status`, `completed_processors` | `curl "http://localhost:3003/api/v1/progress/c3c635e3641da80dde10cc555ffcdda5"` | ⏳ Pending |
+
+### Expected API Response Example
+```json
+{
+  "success": true,
+  "total": 5,
+  "results": [
+    {
+      "chunk_id": "sentence_123",
+      "start_time": 355.0,
+      "text_content": "Oh, mine's Regina Lampert.",
+      "identity_id": 9,
+      "identity_name": "Audrey Hepburn",
+      "identity_source": "tmdb",
+      "trace_id": 169
+    }
+  ]
+}
+```
+
+### Key Points
+- `identity_text` API 需要 `chunk.start_frame` / `chunk.end_frame` 正確 (之前 bug: frame=0)
+- `identity_id` 必須非 NULL 才能返回 identity_name
+
+---
+
+## P6: Completion Criteria
+
+### Purpose
+驗證 pipeline 完整完成，所有 ingestion steps 成功。
+
+### Final Verification Checklist
+
+| Criteria | Purpose | Check Command | Expected Result | Status |
+|----------|---------|---------------|-----------------|--------|
+| All processor outputs exist | 確認所有 processor JSON 檔案產生 | `ls -la output_dev/c3c635e3641da80dde10cc555ffcdda5.*` | 14+ files with size > 0 | ⏳ Pending |
+| Job status = completed | 確認 worker 完成 job | `SELECT status FROM dev.monitor_jobs WHERE uuid = 'c3c635e3641da80dde10cc555ffcdda5'` | `completed` | ⏳ Pending |
+| Video status = completed | 確認 video state 更新 | `SELECT status FROM dev.videos WHERE file_uuid = 'c3c635e3641da80dde10cc555ffcdda5'` | `completed` | ⏳ Pending |
+| All chunks have embeddings | 確認 text embeddings 完成 | `SELECT COUNT(*) = COUNT(embedding) FROM dev.chunk WHERE file_uuid = 'c3c635e3641da80dde10cc555ffcdda5'` | `true` (all chunks have embedding) | ⏳ Pending |
+| Face traces assigned | 確認 face tracking 完成 | `SELECT COUNT(*) = COUNT(trace_id) FROM dev.face_detections WHERE file_uuid = 'c3c635e3641da80dde10cc555ffcdda5'` | `true` (all faces have trace_id) | ⏳ Pending |
+| TMDb matching done | 確認 identity binding 完成 | `SELECT COUNT(identity_id) > 40000 FROM dev.face_detections WHERE file_uuid = 'c3c635e3641da80dde10cc555ffcdda5'` | `true` (> 40K identity bindings) | ⏳ Pending |
+| Qdrant synced | 確認 vector search ready | Check Qdrant points count | Points increased by ~5,000 | ⏳ Pending |
+
+### Success Thresholds
+- **Face detections**: ~70,000 (169K frames / 3 sample interval)
+- **Identity bindings**: > 40,000 (60% match rate)
+- **Chunks with embeddings**: > 4,000 (all chunk types)
+- **Qdrant points**: > 90,000 (current) → > 95,000 (after Charade)
+
+---
+
+## Verification Script
+
+```bash
+# Run after completion
+./scripts/verify_charade_pipeline.sh c3c635e3641da80dde10cc555ffcdda5
+```
+
+---
+
+## Notes
+
+- OCR processor failed, skipped
+- Face detection using SwiftFace (ANE accelerated)
+- TMDb matching using `scripts/match_faces_to_tmdb.py`
+- Expected total processing time: ~2-3 hours
+
+---
+
+## Version History
+
+| Version | Date | Author | Changes |
+|---------|------|--------|---------|
+| 1.0 | 2026-05-27 | M5Max48 | Initial checklist |
\ No newline at end of file
diff --git a/docs_v1.0/M4_workspace/2026-05-29_identity_sync_and_wp_fixes.md b/docs_v1.0/M4_workspace/2026-05-29_identity_sync_and_wp_fixes.md
new file mode 100644
index 0000000..3d62daf
--- /dev/null
+++ b/docs_v1.0/M4_workspace/2026-05-29_identity_sync_and_wp_fixes.md
@@ -0,0 +1,49 @@
+# Session Summary: Identity Fixes + WP Proxy Fixes + Data Sync
+
+**Date**: 2026-05-29
+**Author**: OpenCode
+**Status**: Completed (marcom team testing)
+
+## What Was Done (Chronological)
+
+### 1. Production Identity Fixes (3002)
+- **James Coburn restored** (id=18738, confirmed)
+- **Chantal Goya restored** (id=18737, confirmed)
+- **Louis Viret name/status fixed**
+- **Sequences fixed**: `identities_id_seq` (48→18734), `face_detections_id_seq` (141383→932413), `identity_history_id_seq`, `identity_bindings_id_seq`, `pre_chunks_id_seq`, `file_identities_id_seq`
+- **COALESCE fix** for `reference_data` NULL crash (`postgres_db.rs:3198`, `storage.rs:196`)
+
+### 2. Bug Fixes
+- **DELETE identity**: Fixed binding order bug + removed `identity_confidence` column reference
+- **PATCH identity**: Nested JSON metadata is now deep-merged via `jsonb_deep_merge`
+- **mergeinto UNDO/REDO**: MongoDB deserialization fix (`Collection<Document>`)
+
+### 3. Library Page Infinite Load Fix
+- **Root cause**: WP scan proxy (snippet 48) didn't forward query params → infinite pagination loop
+- **Fix**: Added `$request->get_query_params()` forwarding in scan proxy
+- **Safety**: Added `maxPages = 10` limit in JS pagination
+
+### 4. Identity Data Sync (Dev → Production)
+- **Full replacement** of `public.identities`, `public.identity_bindings`, `public.identity_history` with dev data
+- James Coburn id: 18738 → 11
+- Bindings: 11,892 → 12,834 (+942)
+- **Verification**: 0 differences between schemas
+
+### 5. Snippet 55 Filter
+- Added `.filter(f => f.is_registered)` to show only registered files on library page
+- Changed `status:'unregistered'` → `status: f.status || 'unregistered'`
+
+## Key Decisions
+- Library page filter: default show registered files only
+- Identity sync: full DELETE + INSERT (not UPDATE) to ensure consistency
+- No user-defined metadata fields (starred/notes/role) preserved — matches dev exactly
+
+## Handoff to Marcom
+- `/people/` page should show correct identity state
+- `/library/` page should show only registered files (4 currently)
+- Login required for `/library/` — redirects to `/login/` if not authenticated
+
+## Files Modified
+- `snippet 48` (/scan WP proxy — query param forwarding)
+- `snippet 55` (library page JS — registered-only filter, maxPages safety)
+- `docs_v1.0/M4_workspace/2026-05-29_identity_sync_prod.md` (sync record)
diff --git a/docs_v1.0/M4_workspace/2026-05-29_identity_sync_prod.md b/docs_v1.0/M4_workspace/2026-05-29_identity_sync_prod.md
new file mode 100644
index 0000000..fc7bdc8
--- /dev/null
+++ b/docs_v1.0/M4_workspace/2026-05-29_identity_sync_prod.md
@@ -0,0 +1,45 @@
+# Identity Data Sync: Dev (3003) → Production (3002)
+
+**Date**: 2026-05-29
+**Author**: OpenCode
+**Status**: Completed
+
+## Summary
+
+Fully synced all identity-related tables from dev schema to public schema on PostgreSQL `momentry` database.
+
+## What Was Done
+
+1. **Identities table** (`public.identities`): Replaced with `dev.identities` (69 records, original ids preserved)
+2. **Identity_bindings** (`public.identity_bindings`): Replaced with `dev.identity_bindings` (12,834 records)
+3. **Identity_history** (`public.identity_history`): Replaced with `dev.identity_history` (10 records)
+4. **Sequences**: Updated `identities_id_seq`, `identity_bindings_id_seq`, `identity_history_id_seq` to match
+
+### Key Changes
+- **James Coburn**: Changed from id=18738 → id=11 (dev's original id)
+- **Chantal Goya**: Changed from id=18737 → id=18736 (dev's id)
+- **Metadata**: Now matches dev schema — TMDB fields only, no user-defined fields (starred, notes, role, aliases, user_confirmed are removed as expected)
+- **Bindings**: Increased from 11,892 → 12,834 (+942 bindings)
+
+### Not Changed
+- `face_detections` — identical in both schemas (135,521 records)
+- `pre_chunks` — large difference (public: 1.3M vs dev: 3.3M) but NOT related to identity
+- All other non-identity tables unchanged
+
+## Verification
+
+```sql
+-- Counts match
+identities:        69 = 69 ✅
+identity_bindings: 12,834 = 12,834 ✅
+identity_history:  10 = 10 ✅
+
+-- No differences
+id/uuid mismatch:         0
+metadata/status/name diffs: 0
+```
+
+## Files Referenced
+
+- `AGENTS.md` — Development isolation rules
+- `/Users/accusys/momentry_core/docs_v1.0/M4_workspace/2026-05-29_wp_api_url_update.md` — Previous session handoff
diff --git a/docs_v1.0/M4_workspace/2026-05-29_mergeinto_null_faceid_fix.md b/docs_v1.0/M4_workspace/2026-05-29_mergeinto_null_faceid_fix.md
new file mode 100644
index 0000000..c606677
--- /dev/null
+++ b/docs_v1.0/M4_workspace/2026-05-29_mergeinto_null_faceid_fix.md
@@ -0,0 +1,27 @@
+# 2026-05-29: Mergeinto NULL face_id Fix
+
+## Problem
+Production server (3002) returned `"error":"error occurred while decoding column 0: unexpected null; try decoding as an 'Option'"` when using mergeinto after clicking undo on a merge.
+
+## Root Cause
+`src/api/identity_binding.rs:428` decodes `face_id` from `face_detections` as `String` (non-Option), but **135,521 records** in the production `face_detections` table have NULL `face_id`. When merging an identity whose face_detections include NULL face_ids, the SQLx row decode fails with the "unexpected null" error shown above.
+
+## Fix
+- Changed `(String, Option<i32>)` → `(Option<String>, Option<i32>)` at line 428
+- Changed `face_id_list` to use `filter_map` instead of `map` to skip NULL face_ids
+- Changed `faces_count` to use `face_id_list.len()` instead of `face_ids.len()` (matching the actual transferred count)
+
+## Files Changed
+- `momentry_core/src/api/identity_binding.rs` — 3 lines changed
+
+## Verification
+- 234 library tests pass
+- `cargo fmt` passes
+- Production binary rebuilt (`target/release/momentry`)
+- Production server restarted on port 3002 (PID 92043)
+
+## Identities with NULL face_id (20 identities, ~135k records)
+Audrey Hepburn (36k), Cary Grant (15k), Bernard Musson, Walter Matthau, Jacques Marin, George Kennedy, Michel Thomass, Antonio Passalia, etc. — all `type=people, status=confirmed`. These identities were likely imported from bulk face detection data without face_id generation.
+
+## Data Note
+The NULL face_ids are a pre-existing data quality issue. The fix prevents crashes but doesn't clean up the NULL data. Faces with NULL face_id won't be tracked in undo history (they stay with the target after undo), but the bulk transfer (`WHERE identity_id = $1`) still works correctly.
diff --git a/docs_v1.0/OPERATIONS/TMDb_Pipeline_Test_2026-05-17.md b/docs_v1.0/OPERATIONS/TMDb_Pipeline_Test_2026-05-17.md
new file mode 100644
index 0000000..2162b21
--- /dev/null
+++ b/docs_v1.0/OPERATIONS/TMDb_Pipeline_Test_2026-05-17.md
@@ -0,0 +1,68 @@
+# TMDb Pipeline Test 2026-05-17
+
+## Purpose
+Verify full TMDb enrichment pipeline: register → process → TMDb prefetch → probe → identity files → downloads.
+
+## Environment
+- **Server**: playground (port 3003)
+- **Schema**: `dev`
+- **TMDB_API_KEY**: `e9cde52197f6f8df4d9db99da93db1fb`
+- **Build**: `momentry_playground` (debug, 0 errors)
+
+## Pre-cleanup
+Unregistered old files + deleted output files:
+```bash
+POST /api/v1/unregister {"file_uuid": "3abeee81..."}
+POST /api/v1/unregister {"file_uuid": "23b1c872..."}
+```
+
+## Step 1: Register
+
+| File | UUID | Result |
+|------|------|--------|
+| Charade main | `bd80fec92b0b6963d177a2c55bf713e2` | ✅ Registered (already_exists due to content_hash match) |
+| Charade YouTube | `a6fb22eebefaef17e62af874997c5944` | ✅ Fresh registration |
+
+Register phase completed: probe → CUT → scene classification.
+
+## Step 2: Trigger Processing
+
+```bash
+POST /api/v1/file/:uuid/process {}
+```
+
+Jobs created:
+- Main: job_id=167, status=PENDING
+- YouTube: job_id=168, status=PENDING
+
+Worker blocked by schema issue: `processor_results` missing `retry_count` column + `jsonb_set(text, text, jsonb)` signature mismatch. Fixed `retry_count` via ALTER TABLE.
+
+## Step 3: TMDb Prefetch (requires pipeline completion first)
+
+```bash
+POST /api/v1/agents/tmdb/prefetch
+```
+
+## Step 4: TMDb Probe
+
+```bash
+POST /api/v1/file/:uuid/tmdb-probe
+```
+
+## Known Issues
+1. `jsonb_set(jsonb, text, jsonb)` → should be `jsonb_set(jsonb, text[], jsonb)` — pre-existing worker bug
+2. `processor_results.retry_count` column missing — fixed via ALTER TABLE
+3. Worker requires running as separate process: `./target/debug/momentry_playground worker`
+
+## Endpoint Changes in This Test
+| Endpoint | Status |
+|----------|--------|
+| `GET /api/v1/stats/ingest` | ❌ Removed (stats moved to files/scan + identities) |
+| `GET /api/v1/files/scan` | ➕ Added `total_chunks`, `searchable_chunks`, `pending_videos` |
+| `GET /api/v1/identities` | ➕ Added `total_identities`, `tmdb_identities`, `auto_identities` |
+| `POST /api/v1/agents/tmdb/prefetch` | ✅ Writes identity files directly |
+| `POST /api/v1/file/:uuid/tmdb-probe` | ✅ Upserts from disk identity files |
+| `GET /api/v1/identity/:uuid/json` | ✅ Download identity JSON |
+| `GET /api/v1/file/:uuid/json/:processor` | ✅ Download processor JSON |
+| `POST /api/v1/agents/identity/match-from-photo` | 🆕 New |
+| `POST /api/v1/agents/identity/match-from-trace` | 🆕 New |
diff --git a/docs_v1.0/REFERENCE/FACE_BINDING_STATES.md b/docs_v1.0/REFERENCE/FACE_BINDING_STATES.md
new file mode 100644
index 0000000..f8bee1e
--- /dev/null
+++ b/docs_v1.0/REFERENCE/FACE_BINDING_STATES.md
@@ -0,0 +1,375 @@
+# Face Binding States — Data Model Reference
+
+**Version**: 1.0.0
+**Date**: 2026-05-25
+**Related**: `GET /api/v1/file/:file_uuid/faces`, `identities`, `strangers`, `face_detections`
+
+---
+
+## Glossary
+
+| Term | Definition |
+|------|------------|
+| **face detection** | A single face bounding box detected in one video frame. Stored in `face_detections` table. |
+| **trace** | A sequence of face detections belonging to the same person across consecutive frames. Assigned by the face tracker. `trace_id` groups multiple face detections. |
+| **identity** | A known person with a name. Sources: TMDb (movie stars), user-defined (manual entry). Stored in `identities` table with `source='tmdb'` or `source='user_defined'`. |
+| **stranger** | An unknown person detected but not matched to any known identity. Created automatically for unmatched traces. Stored in `strangers` table. |
+| **binding** | The association between a face detection and either an identity or a stranger. Represented by `identity_id` or `stranger_id` FK in `face_detections`. |
+| **TMDb** | The Movie Database. Source of celebrity identity seeds with `face_embedding` for matching. |
+| **auto identity** | Legacy term for identities created from `face_clustered.json` analysis. Now migrated to `strangers` table as reference records. |
+| **dangling** | A face detection whose `identity_id` points to a deleted identity (e.g., auto identities removed during migration). |
+| **unbound** | A face detection with no binding at all — `identity_id IS NULL AND stranger_id IS NULL`. |
+| **PK** | Primary Key. A unique identifier for each row in a table. Example: `identities.id`, `strangers.id`, `face_detections.id`. |
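+| **FK** | Foreign Key. A column that references the PK of another table, creating a relationship. Example: `face_detections.identity_id` → `identities.id`, `face_detections.stranger_id` → `strangers.id`. An enforced FK constraint ensures referential integrity — a face cannot point to a non-existent row. Note: only the `stranger_id` constraint currently exists; `identity_id` has no FK constraint yet (see "Current Status"), which is why dangling references are possible. |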
+
+---
+
+## Three Core Tables
+
+### ER Diagram
+
+```
+┌─────────────────────┐       ┌─────────────────────┐
+│     identities      │       │      strangers      │
+│─────────────────────│       │─────────────────────│
+│ id (PK)             │       │ id (PK)             │
+│ uuid                │       │ file_uuid           │
+│ name                │       │ trace_id            │
+│ source              │       │ metadata            │
+│ tmdb_id             │       │ created_at          │
+│ face_embedding      │       │                     │
+│ metadata            │       │ UNIQUE(file_uuid,   │
+│ status              │       │        trace_id)    │
+│ ...                 │       │                     │
+└─────────┬───────────┘       └─────────┬───────────┘
+          │                             │
+          │ FK                          │ FK
+          │ (ON DELETE SET NULL)        │ (ON DELETE SET NULL)
+          │                             │
+          ▼                             ▼
+┌─────────────────────────────────────────────────────┐
+│                  face_detections                    │
+│─────────────────────────────────────────────────────│
+│ id (PK)                                             │
+│ file_uuid           — Video file identifier        │
+│ frame_number        — Frame where face was detected│
+│ timestamp_secs      — Frame number / fps           │
+│ trace_id            — Face tracking ID             │
+│ face_id             — Format: `{frame}_{idx}`      │
+│ identity_id (FK)    — → identities.id             │
+│ stranger_id (FK)    — → strangers.id               │
+│ x, y, width, height — Bounding box                 │
+│ confidence          — Detection confidence (0–1)   │
+│ embedding           — Face embedding vector        │
+│ metadata            — JSON metadata                │
+└─────────────────────────────────────────────────────┘
+```
+
+### Table Summary
+
+| Table | Role | Record Count (public) | Primary Key |
+|-------|------|----------------------|-------------|
+| `identities` | Known persons (TMDb, user-defined) | 70 | `id`, `uuid` |
+| `strangers` | Unknown persons (unmatched traces) | 0–N per file | `id`, `(file_uuid, trace_id)` |
+| `face_detections` | Individual face detections | 70691 per file | `id` |
+
+### Key Columns in `face_detections`
+
+| Column | Type | Purpose |
+|--------|------|---------|
+| `identity_id` | INTEGER FK | Points to `identities.id` if matched to known person |
+| `stranger_id` | INTEGER FK | Points to `strangers.id` if unmatched trace |
+| `trace_id` | INTEGER | Groups faces belonging to same person across frames |
+
+**Design Rule**: `identity_id` and `stranger_id` are mutually exclusive in normal operation. A face should have only one binding.
+
+---
+
+## Four Binding States
+
+### State Definitions
+
+| # | State | `binding` JSON | SQL Condition | Meaning |
+|---|-------|----------------|---------------|---------|
+| 1 | **identity** | `{"identity_id": 9, "identity_uuid": "...", "identity_name": "Audrey Hepburn"}` | `identity_id IN (SELECT id FROM identities)` | Face matched to a known TMDb or user-defined identity |
+| 2 | **stranger** | `{"stranger_id": 845, "metadata": {}}` | `stranger_id IS NOT NULL` | Face belongs to an unmatched trace (unknown person) |
+| 3 | **dangling** | `{"old_identity_id": 18052}` | `identity_id IS NOT NULL AND NOT EXISTS (SELECT 1 FROM identities WHERE id = face_detections.identity_id)` | Face was bound to an identity that has been deleted (orphaned reference) |
+| 4 | **unbound** | `null` | `identity_id IS NULL AND stranger_id IS NULL` | Face has no binding at all |
+
+### State Detection Logic (Rust)
+
+```rust
+let binding = if let (Some(iid), Some(iuuid), Some(iname)) =
+    (identity_id, identity_uuid, identity_name)
+{
+    FaceBinding::Identity { identity_id: iid, identity_uuid: iuuid, identity_name: iname }
+} else if let Some(sid) = stranger_id {
+    FaceBinding::Stranger { stranger_id: sid, metadata: stranger_metadata }
+} else if let Some(iid) = identity_id {
+    FaceBinding::Dangling { old_identity_id: iid }
+} else {
+    FaceBinding::Unbound
+};
+```
+
+---
+
+## Lifecycle Flow
+
+### Processing Pipeline
+
+```
+            Video Registration
+                   │
+                   ▼
+            Face Detection
+         (face_detections created)
+                   │
+                   ▼
+            Face Tracking
+         (trace_id assigned)
+                   │
+                   ▼
+         ┌────────────────┐
+         │ Identity Agent │
+         │  Face Matching │
+         └────────────────┘
+                   │
+         ┌─────────┴─────────┐
+         │                   │
+         ▼                   ▼
+   ┌──────────┐        ┌──────────┐
+   │ MATCHED  │        │ UNMATCHED│
+   │ to TMDb  │        │  trace   │
+   └─────┬────┘        └────┬─────┘
+         │                   │
+         │                   │
+         ▼                   ▼
+   identity_id=X        stranger_id=S
+         │                   │
+         │                   │
+         ▼                   ▼
+    ┌─────────┐         ┌─────────┐
+    │ IDENTITY│         │ STRANGER│
+    │  state  │         │  state  │
+    └─────────┘         └─────────┘
+```
+
+### User Operations
+
+```
+┌──────────┐      bind       ┌──────────┐
+│ STRANGER │────────────────▶│ IDENTITY │
+└──────────┘                 └────┬─────┘
+                                  │
+                                  │ unbind
+                                  │
+              ┌───────────────────┴───────────────────┐
+              │ (if stranger_id                       │ (if no
+              │  preserved)                           │  stranger_id)
+              ▼                                       ▼
+        ┌────────────┐                           ┌─────────┐
+        │  STRANGER  │                           │ UNBOUND │
+        │ (rollback) │                           └─────────┘
+        └────────────┘
+```
+
+### Migration Effect
+
+```
+┌─────────────────────┐
+│ auto identities     │
+│ (source='auto')     │
+│ 943 records         │
+└─────────┬───────────┘
+          │
+          │ DELETE
+          │
+          ▼
+┌─────────────────────┐
+│ face_detections     │
+│ identity_id=18052   │
+│ (points to deleted) │
+└─────────┬───────────┘
+          │
+          │ Cleanup SQL
+          │ SET identity_id=NULL
+          │
+          ▼
+┌─────────────────────┐
+│ DANGLING → UNBOUND  │
+│ 18641 faces cleaned │
+└─────────────────────┘
+```
+
+---
+
+## SQL Query Examples
+
+### Count by State
+
+```sql
+SELECT 
+    COUNT(*) FILTER (WHERE identity_id IN (SELECT id FROM identities)) AS identity,
+    COUNT(*) FILTER (WHERE stranger_id IS NOT NULL) AS stranger,
+    COUNT(*) FILTER (WHERE identity_id IS NOT NULL 
+                     AND NOT EXISTS (SELECT 1 FROM identities WHERE id = face_detections.identity_id)) AS dangling,
+    COUNT(*) FILTER (WHERE identity_id IS NULL AND stranger_id IS NULL) AS unbound
+FROM face_detections 
+WHERE file_uuid = 'aeed71342a899fe4b4c57b7d41bcb692';
+```
+
+### Filter by State
+
+```sql
+-- Identity
+SELECT * FROM face_detections fd
+WHERE fd.identity_id IN (SELECT id FROM identities);
+
+-- Stranger
+SELECT * FROM face_detections WHERE stranger_id IS NOT NULL;
+
+-- Dangling
+SELECT * FROM face_detections fd
+WHERE fd.identity_id IS NOT NULL 
+  AND NOT EXISTS (SELECT 1 FROM identities WHERE id = fd.identity_id);
+
+-- Unbound
+SELECT * FROM face_detections 
+WHERE identity_id IS NULL AND stranger_id IS NULL;
+```
+
+---
+
+## bind/unbind Behavior
+
+### Current Implementation (stranger_id cleared on bind)
+
+| Operation | SQL Effect | Result |
+|-----------|------------|--------|
+| `bind_face_to_identity` | `SET identity_id=X, stranger_id=NULL` | Stranger info lost |
+| `bind_trace_to_identity` | `SET identity_id=X, stranger_id=NULL` | Stranger info lost |
+| `merge_identity` | `SET identity_id=X, stranger_id=NULL` | Stranger info lost |
+| `unbind_face` | `SET identity_id=NULL` | Becomes unbound (cannot rollback) |
+
+**Problem**: After bind → unbind, face becomes unbound instead of returning to stranger.
+
+### Proposed Fix (preserve stranger_id on bind)
+
+| Operation | SQL Effect | Result |
+|-----------|------------|--------|
+| `bind_face_to_identity` | `SET identity_id=X` (keep stranger_id) | Stranger info preserved |
+| `bind_trace_to_identity` | `SET identity_id=X` (keep stranger_id) | Stranger info preserved |
+| `merge_identity` | `SET identity_id=X` (keep stranger_id) | Stranger info preserved |
+| `unbind_face` | `SET identity_id=NULL` | Returns to stranger (if stranger_id exists) |
+
+**Change Required**: Remove `, stranger_id = NULL` from three UPDATE queries in `identity_binding.rs`.
+
+---
+
+## Why Dangling Happens
+
+Dangling occurs when `face_detections.identity_id` points to a deleted row in `identities` table.
+
+### Root Cause
+
+At the time of migration, `face_detections.identity_id` **had no FK constraint** to `identities.id`. As a result:
+
+1. `DELETE FROM identities WHERE source='auto'` succeeded without error
+2. `face_detections.identity_id` values remained unchanged (still pointing to the deleted IDs)
+3. No `ON DELETE SET NULL` action was triggered, because no FK existed
+
+### Prevention
+
+With FK constraint in place:
+```sql
+ALTER TABLE face_detections
+ADD CONSTRAINT fk_face_detections_identity
+FOREIGN KEY (identity_id) REFERENCES identities(id) ON DELETE SET NULL;
+```
+
+Deleting an identity would automatically set `face_detections.identity_id = NULL` (no dangling).
+
+### Current Status
+
+After migration cleanup:
+- Public schema: FK `fk_face_detections_stranger` exists (on `stranger_id`)
+- Public schema: FK `fk_face_detections_identity` **does not exist** (historical reason)
+- Dev schema: Same state as public
+
+---
+
+## API Endpoint
+
+### `GET /api/v1/file/:file_uuid/faces`
+
+**Purpose**: List all face detections in a file with binding state.
+
+**Query Parameters**:
+
+| Param | Type | Default | Description |
+|-------|------|---------|-------------|
+| `page` | int | 1 | Page number |
+| `page_size` | int | 50 | Items per page |
+| `binding` | string | — | Filter: `identity`, `stranger`, `dangling`, `unbound` |
+| `trace_id` | int | — | Filter by trace ID |
+| `min_confidence` | float | — | Minimum confidence (0.0–1.0) |
+| `start_frame` | int | — | Start frame (inclusive) |
+| `end_frame` | int | — | End frame (inclusive) |
+
+**Response Example**:
+
+```json
+{
+  "success": true,
+  "file_uuid": "aeed71342a899fe4b4c57b7d41bcb692",
+  "total": 52244,
+  "page": 1,
+  "page_size": 2,
+  "data": [
+    {
+      "id": 661508,
+      "file_uuid": "aeed71342a899fe4b4c57b7d41bcb692",
+      "frame_number": 21297,
+      "timestamp_secs": 851.88,
+      "face_id": "21297_0",
+      "trace_id": 485,
+      "bbox": { "x": 1072, "y": 390, "width": 56, "height": 56 },
+      "confidence": 0.6114,
+      "binding": {
+        "identity_id": 9,
+        "identity_uuid": "c3545906-c82d-4b66-aa1d-150bc02decce",
+        "identity_name": "Audrey Hepburn"
+      }
+    }
+  ]
+}
+```
+
+---
+
+## Migration Reference
+
+### `migrate_strangers_table.sql` (Summary)
+
+1. `CREATE TABLE strangers`
+2. Insert unmatched traces → strangers
+3. Preserve auto identity metadata → strangers (NULL file_uuid/trace_id)
+4. Update `face_detections.stranger_id` to reference `strangers.id`
+5. Add FK constraint `fk_face_detections_stranger` on `face_detections.stranger_id`
+6. Delete legacy `identity_bindings` for auto identities
+7. Delete `identities` where `source='auto'`
+8. Cleanup dangling `identity_id` (set to NULL)
+
+### Cleanup SQL (Dangling)
+
+```sql
+UPDATE face_detections fd
+SET identity_id = NULL
+WHERE NOT EXISTS (SELECT 1 FROM identities i WHERE i.id = fd.identity_id)
+  AND fd.identity_id IS NOT NULL;
+```
+
+---
+
+*Updated: 2026-05-25*
\ No newline at end of file
diff --git a/docs_v1.0/doc-wasm b/docs_v1.0/doc-wasm
new file mode 120000
index 0000000..f633f2c
--- /dev/null
+++ b/docs_v1.0/doc-wasm
@@ -0,0 +1 @@
+doc_wasm
\ No newline at end of file
diff --git a/docs_v1.0/doc/06_search.html b/docs_v1.0/doc/06_search.html
index fbd9cf7..86f5f8b 100644
--- a/docs_v1.0/doc/06_search.html
+++ b/docs_v1.0/doc/06_search.html
@@ -38,7 +38,7 @@ a { color: #0066cc; }
 <h2>Search APIs</h2>
 <h3><code>POST /api/v1/search/smart</code></h3>
 <p><strong>Auth</strong>: Required
-<strong>Scope</strong>: file-level</p>
+<strong>Scope</strong>: global / file-level</p>
 <p>Semantic vector search using EmbeddingGemma-300m. Generates a query embedding via EmbeddingGemma (port 11436), then searches pgvector <code>story_parent</code> and <code>llm_parent</code> chunks by cosine similarity.</p>
 <h4>Request Parameters</h4>
 <table class="table">
@@ -53,13 +53,6 @@ a { color: #0066cc; }
 </thead>
 <tbody>
 <tr>
-<td><code>file_uuid</code></td>
-<td>string</td>
-<td>Yes</td>
-<td>—</td>
-<td>File UUID to search within</td>
-</tr>
-<tr>
 <td><code>query</code></td>
 <td>string</td>
 <td>Yes</td>
@@ -67,6 +60,13 @@ a { color: #0066cc; }
 <td>Search text</td>
 </tr>
 <tr>
+<td><code>file_uuid</code></td>
+<td>string</td>
+<td>No</td>
+<td>—</td>
+<td>File UUID to search within. If omitted, searches all files (global search)</td>
+</tr>
+<tr>
 <td><code>limit</code></td>
 <td>integer</td>
 <td>No</td>
@@ -89,7 +89,14 @@ a { color: #0066cc; }
 </tr>
 </tbody>
 </table>
-<h4>Example</h4>
+<h4>Example (Global Search)</h4>
+<div class="codehilite"><pre><span></span><code>curl<span class="w"> </span>-s<span class="w"> </span>-X<span class="w"> </span>POST<span class="w"> </span><span class="s2">&quot;</span><span class="nv">$API</span><span class="s2">/api/v1/search/smart&quot;</span><span class="w"> </span><span class="se">\</span>
+<span class="w">  </span>-H<span class="w"> </span><span class="s2">&quot;Content-Type: application/json&quot;</span><span class="w"> </span><span class="se">\</span>
+<span class="w">  </span>-H<span class="w"> </span><span class="s2">&quot;Authorization: Bearer </span><span class="nv">$JWT</span><span class="s2">&quot;</span><span class="w"> </span><span class="se">\</span>
+<span class="w">  </span>-d<span class="w"> </span><span class="s1">&#39;{&quot;query&quot;: &quot;Audrey Hepburn&quot;}&#39;</span>
+</code></pre></div>
+
+<h4>Example (File-specific Search)</h4>
 <div class="codehilite"><pre><span></span><code>curl<span class="w"> </span>-s<span class="w"> </span>-X<span class="w"> </span>POST<span class="w"> </span><span class="s2">&quot;</span><span class="nv">$API</span><span class="s2">/api/v1/search/smart&quot;</span><span class="w"> </span><span class="se">\</span>
 <span class="w">  </span>-H<span class="w"> </span><span class="s2">&quot;Content-Type: application/json&quot;</span><span class="w"> </span><span class="se">\</span>
 <span class="w">  </span>-H<span class="w"> </span><span class="s2">&quot;Authorization: Bearer </span><span class="nv">$JWT</span><span class="s2">&quot;</span><span class="w"> </span><span class="se">\</span>
@@ -101,6 +108,7 @@ a { color: #0066cc; }
 <span class="w">  </span><span class="nt">&quot;query&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;Audrey Hepburn&quot;</span><span class="p">,</span>
 <span class="w">  </span><span class="nt">&quot;results&quot;</span><span class="p">:</span><span class="w"> </span><span class="p">[</span>
 <span class="w">    </span><span class="p">{</span>
+<span class="w">      </span><span class="nt">&quot;file_uuid&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;a6fb22eebefaef17e62af874997c5944&quot;</span><span class="p">,</span>
 <span class="w">      </span><span class="nt">&quot;parent_id&quot;</span><span class="p">:</span><span class="w"> </span><span class="mi">1087822</span><span class="p">,</span>
 <span class="w">      </span><span class="nt">&quot;scene_order&quot;</span><span class="p">:</span><span class="w"> </span><span class="mi">1087822</span><span class="p">,</span>
 <span class="w">      </span><span class="nt">&quot;start_frame&quot;</span><span class="p">:</span><span class="w"> </span><span class="mi">104438</span><span class="p">,</span>
@@ -118,10 +126,26 @@ a { color: #0066cc; }
 <span class="p">}</span>
 </code></pre></div>
 
+<table class="table">
+<thead>
+<tr>
+<th>Field</th>
+<th>Type</th>
+<th>Description</th>
+</tr>
+</thead>
+<tbody>
+<tr>
+<td><code>results[].file_uuid</code></td>
+<td>string</td>
+<td>File UUID where result was found</td>
+</tr>
+</tbody>
+</table>
 <hr />
 <h3><code>POST /api/v1/search/universal</code></h3>
 <p><strong>Auth</strong>: Required
-<strong>Scope</strong>: file-level</p>
+<strong>Scope</strong>: global / file-level</p>
 <p>Multi-type BM25 full-text search across chunks, frames, and persons. Uses PostgreSQL <code>tsvector</code>.</p>
 <h4>Request Parameters</h4>
 <table class="table">
@@ -147,7 +171,7 @@ a { color: #0066cc; }
 <td>string</td>
 <td>No</td>
 <td>—</td>
-<td>Restrict to specific file</td>
+<td>Restrict to specific file. If omitted, searches all files (global search)</td>
 </tr>
 <tr>
 <td><code>types</code></td>
@@ -179,7 +203,14 @@ a { color: #0066cc; }
 </tr>
 </tbody>
 </table>
-<h4>Example</h4>
+<h4>Example (Global Search)</h4>
+<div class="codehilite"><pre><span></span><code>curl<span class="w"> </span>-s<span class="w"> </span>-X<span class="w"> </span>POST<span class="w"> </span><span class="s2">&quot;</span><span class="nv">$API</span><span class="s2">/api/v1/search/universal&quot;</span><span class="w"> </span><span class="se">\</span>
+<span class="w">  </span>-H<span class="w"> </span><span class="s2">&quot;Content-Type: application/json&quot;</span><span class="w"> </span><span class="se">\</span>
+<span class="w">  </span>-H<span class="w"> </span><span class="s2">&quot;Authorization: Bearer </span><span class="nv">$JWT</span><span class="s2">&quot;</span><span class="w"> </span><span class="se">\</span>
+<span class="w">  </span>-d<span class="w"> </span><span class="s1">&#39;{&quot;query&quot;: &quot;Cary Grant&quot;}&#39;</span>
+</code></pre></div>
+
+<h4>Example (File-specific Search)</h4>
 <div class="codehilite"><pre><span></span><code>curl<span class="w"> </span>-s<span class="w"> </span>-X<span class="w"> </span>POST<span class="w"> </span><span class="s2">&quot;</span><span class="nv">$API</span><span class="s2">/api/v1/search/universal&quot;</span><span class="w"> </span><span class="se">\</span>
 <span class="w">  </span>-H<span class="w"> </span><span class="s2">&quot;Content-Type: application/json&quot;</span><span class="w"> </span><span class="se">\</span>
 <span class="w">  </span>-H<span class="w"> </span><span class="s2">&quot;Authorization: Bearer </span><span class="nv">$JWT</span><span class="s2">&quot;</span><span class="w"> </span><span class="se">\</span>
@@ -191,6 +222,7 @@ a { color: #0066cc; }
 <span class="w">  </span><span class="nt">&quot;results&quot;</span><span class="p">:</span><span class="w"> </span><span class="p">[</span>
 <span class="w">    </span><span class="p">{</span>
 <span class="w">      </span><span class="nt">&quot;type&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;chunk&quot;</span><span class="p">,</span>
+<span class="w">      </span><span class="nt">&quot;file_uuid&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;bd80fec92b0b6963d177a2c55bf713e2&quot;</span><span class="p">,</span>
 <span class="w">      </span><span class="nt">&quot;chunk_id&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;bd80fec92b0b6963d177a2c55bf713e2_2&quot;</span><span class="p">,</span>
 <span class="w">      </span><span class="nt">&quot;chunk_type&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;story_child&quot;</span><span class="p">,</span>
 <span class="w">      </span><span class="nt">&quot;start_frame&quot;</span><span class="p">:</span><span class="w"> </span><span class="mi">5103</span><span class="p">,</span>
@@ -199,6 +231,25 @@ a { color: #0066cc; }
 <span class="w">      </span><span class="nt">&quot;end_time&quot;</span><span class="p">:</span><span class="w"> </span><span class="mf">213.64</span><span class="p">,</span>
 <span class="w">      </span><span class="nt">&quot;text&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;[213s-214s] Cary Grant: \&quot;Olá!\&quot;&quot;</span><span class="p">,</span>
 <span class="w">      </span><span class="nt">&quot;score&quot;</span><span class="p">:</span><span class="w"> </span><span class="mf">0.9</span>
+<span class="w">    </span><span class="p">},</span>
+<span class="w">    </span><span class="p">{</span>
+<span class="w">      </span><span class="nt">&quot;type&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;frame&quot;</span><span class="p">,</span>
+<span class="w">      </span><span class="nt">&quot;file_uuid&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;a6fb22eebefaef17e62af874997c5944&quot;</span><span class="p">,</span>
+<span class="w">      </span><span class="nt">&quot;frame_number&quot;</span><span class="p">:</span><span class="w"> </span><span class="mi">5105</span><span class="p">,</span>
+<span class="w">      </span><span class="nt">&quot;timestamp&quot;</span><span class="p">:</span><span class="w"> </span><span class="mf">212.72</span><span class="p">,</span>
+<span class="w">      </span><span class="nt">&quot;score&quot;</span><span class="p">:</span><span class="w"> </span><span class="mf">0.7</span><span class="p">,</span>
+<span class="w">      </span><span class="nt">&quot;objects&quot;</span><span class="p">:</span><span class="w"> </span><span class="kc">null</span><span class="p">,</span>
+<span class="w">      </span><span class="nt">&quot;ocr_texts&quot;</span><span class="p">:</span><span class="w"> </span><span class="kc">null</span><span class="p">,</span>
+<span class="w">      </span><span class="nt">&quot;faces&quot;</span><span class="p">:</span><span class="w"> </span><span class="kc">null</span>
+<span class="w">    </span><span class="p">},</span>
+<span class="w">    </span><span class="p">{</span>
+<span class="w">      </span><span class="nt">&quot;type&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;person&quot;</span><span class="p">,</span>
+<span class="w">      </span><span class="nt">&quot;file_uuid&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;a6fb22eebefaef17e62af874997c5944&quot;</span><span class="p">,</span>
+<span class="w">      </span><span class="nt">&quot;identity_id&quot;</span><span class="p">:</span><span class="w"> </span><span class="mi">12</span><span class="p">,</span>
+<span class="w">      </span><span class="nt">&quot;identity_uuid&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;a9a901056d6b46ff92da0c3c1a57dff4&quot;</span><span class="p">,</span>
+<span class="w">      </span><span class="nt">&quot;name&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;Cary Grant&quot;</span><span class="p">,</span>
+<span class="w">      </span><span class="nt">&quot;appearance_count&quot;</span><span class="p">:</span><span class="w"> </span><span class="mi">542</span><span class="p">,</span>
+<span class="w">      </span><span class="nt">&quot;score&quot;</span><span class="p">:</span><span class="w"> </span><span class="mf">0.95</span>
 <span class="w">    </span><span class="p">}</span>
 <span class="w">  </span><span class="p">],</span>
 <span class="w">  </span><span class="nt">&quot;total&quot;</span><span class="p">:</span><span class="w"> </span><span class="mi">20</span><span class="p">,</span>
@@ -206,16 +257,140 @@ a { color: #0066cc; }
 <span class="p">}</span>
 </code></pre></div>
 
+<table class="table">
+<thead>
+<tr>
+<th>Field</th>
+<th>Type</th>
+<th>Description</th>
+</tr>
+</thead>
+<tbody>
+<tr>
+<td><code>results[].type</code></td>
+<td>string</td>
+<td>Result type: <code>chunk</code>, <code>frame</code>, or <code>person</code></td>
+</tr>
+<tr>
+<td><code>results[].file_uuid</code></td>
+<td>string</td>
+<td>File UUID where result was found (all types)</td>
+</tr>
+</tbody>
+</table>
 <hr />
 <h3><code>POST /api/v1/search/frames</code></h3>
 <p><strong>Auth</strong>: Required
-<strong>Scope</strong>: file-level</p>
+<strong>Scope</strong>: global / file-level</p>
 <p>Search face detection frames by identity name or trace ID.</p>
 <hr />
-<h3><code>POST /api/v1/search/identity_text</code></h3>
+<h3><code>GET /api/v1/search/identity_text</code></h3>
 <p><strong>Auth</strong>: Required
-<strong>Scope</strong>: file-level</p>
-<p>Search text chunks spoken by a specific identity.</p>
+<strong>Scope</strong>: global / file-level</p>
+<p>Searches text chunks by content and finds the identities associated with them. Each result is a matching chunk paired with an identity whose face detections overlap that chunk.</p>
+<h4>Query Parameters</h4>
+<table class="table">
+<thead>
+<tr>
+<th>Field</th>
+<th>Type</th>
+<th>Required</th>
+<th>Default</th>
+<th>Description</th>
+</tr>
+</thead>
+<tbody>
+<tr>
+<td><code>q</code></td>
+<td>string</td>
+<td>Yes</td>
+<td>—</td>
+<td>Search text (ILIKE match)</td>
+</tr>
+<tr>
+<td><code>file_uuid</code></td>
+<td>string</td>
+<td>No</td>
+<td>—</td>
+<td>Restrict to specific file. If omitted, searches all files (global search)</td>
+</tr>
+<tr>
+<td><code>limit</code></td>
+<td>integer</td>
+<td>No</td>
+<td>50</td>
+<td>Max results</td>
+</tr>
+<tr>
+<td><code>page</code></td>
+<td>integer</td>
+<td>No</td>
+<td>1</td>
+<td>Page number</td>
+</tr>
+<tr>
+<td><code>page_size</code></td>
+<td>integer</td>
+<td>No</td>
+<td>50</td>
+<td>Items per page</td>
+</tr>
+</tbody>
+</table>
+<h4>Example (Global Search)</h4>
+<div class="codehilite"><pre><span></span><code>curl<span class="w"> </span>-s<span class="w"> </span><span class="s2">&quot;</span><span class="nv">$API</span><span class="s2">/api/v1/search/identity_text?q=love&quot;</span><span class="w"> </span>-H<span class="w"> </span><span class="s2">&quot;X-API-Key: </span><span class="nv">$KEY</span><span class="s2">&quot;</span>
+</code></pre></div>
+
+<h4>Example (File-specific Search)</h4>
+<div class="codehilite"><pre><span></span><code>curl<span class="w"> </span>-s<span class="w"> </span><span class="s2">&quot;</span><span class="nv">$API</span><span class="s2">/api/v1/search/identity_text?file_uuid=</span><span class="nv">$FILE_UUID</span><span class="s2">&amp;q=love&quot;</span><span class="w"> </span>-H<span class="w"> </span><span class="s2">&quot;X-API-Key: </span><span class="nv">$KEY</span><span class="s2">&quot;</span>
+</code></pre></div>
+
+<h4>Response (200)</h4>
+<div class="codehilite"><pre><span></span><code><span class="p">{</span>
+<span class="w">  </span><span class="nt">&quot;success&quot;</span><span class="p">:</span><span class="w"> </span><span class="kc">true</span><span class="p">,</span>
+<span class="w">  </span><span class="nt">&quot;total&quot;</span><span class="p">:</span><span class="w"> </span><span class="mi">5</span><span class="p">,</span>
+<span class="w">  </span><span class="nt">&quot;results&quot;</span><span class="p">:</span><span class="w"> </span><span class="p">[</span>
+<span class="w">    </span><span class="p">{</span>
+<span class="w">      </span><span class="nt">&quot;file_uuid&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;a6fb22eebefaef17e62af874997c5944&quot;</span><span class="p">,</span>
+<span class="w">      </span><span class="nt">&quot;chunk_id&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;llm_parent_..._256_270&quot;</span><span class="p">,</span>
+<span class="w">      </span><span class="nt">&quot;start_time&quot;</span><span class="p">:</span><span class="w"> </span><span class="mf">256.256</span><span class="p">,</span>
+<span class="w">      </span><span class="nt">&quot;end_time&quot;</span><span class="p">:</span><span class="w"> </span><span class="mf">270.228</span><span class="p">,</span>
+<span class="w">      </span><span class="nt">&quot;text_content&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;...lack of affection...&quot;</span><span class="p">,</span>
+<span class="w">      </span><span class="nt">&quot;identity_id&quot;</span><span class="p">:</span><span class="w"> </span><span class="mi">9</span><span class="p">,</span>
+<span class="w">      </span><span class="nt">&quot;identity_name&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;Audrey Hepburn&quot;</span><span class="p">,</span>
+<span class="w">      </span><span class="nt">&quot;identity_source&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;tmdb&quot;</span><span class="p">,</span>
+<span class="w">      </span><span class="nt">&quot;trace_id&quot;</span><span class="p">:</span><span class="w"> </span><span class="mi">94</span>
+<span class="w">    </span><span class="p">}</span>
+<span class="w">  </span><span class="p">]</span>
+<span class="p">}</span>
+</code></pre></div>
+
+<table class="table">
+<thead>
+<tr>
+<th>Field</th>
+<th>Type</th>
+<th>Description</th>
+</tr>
+</thead>
+<tbody>
+<tr>
+<td><code>results[].file_uuid</code></td>
+<td>string</td>
+<td>File UUID where chunk was found</td>
+</tr>
+<tr>
+<td><code>results[].identity_id</code></td>
+<td>integer</td>
+<td>Identity ID if face was detected</td>
+</tr>
+<tr>
+<td><code>results[].trace_id</code></td>
+<td>integer</td>
+<td>Face trace ID</td>
+</tr>
+</tbody>
+</table>
 <hr />
 <h3>Visual Search</h3>
 <table class="table">
@@ -282,7 +457,7 @@ a { color: #0066cc; }
 </tbody>
 </table>
 <hr />
-<p><em>Updated: 2026-05-19 12:49:24</em></p>
+<p><em>Updated: 2026-05-27 — Added global search support for smart, universal, identity_text APIs</em></p>
 </div>
 </body>
 </html>
\ No newline at end of file
diff --git a/docs_v1.0/doc/07_identity.html b/docs_v1.0/doc/07_identity.html
index 2bedf0f..2180a55 100644
--- a/docs_v1.0/doc/07_identity.html
+++ b/docs_v1.0/doc/07_identity.html
@@ -218,6 +218,13 @@ curl<span class="w"> </span>-s<span class="w"> </span>-X<span class="w"> </span>
 </tr>
 </tbody>
 </table>
+<h4>History &amp; Undo/Redo</h4>
+<p>Every PATCH records a before/after snapshot in the operation history. Up to 256 records are kept per identity; the oldest are deleted automatically. See <a href="14_identity_history.html"><code>14_identity_history</code></a> for:</p>
+<ul>
+<li><code>POST /api/v1/identity/:identity_uuid/undo</code> — Revert PATCH changes</li>
+<li><code>POST /api/v1/identity/:identity_uuid/redo</code> — Reapply undone changes</li>
+<li><code>GET /api/v1/identity/:identity_uuid/history</code> — Query operation log</li>
+</ul>
 <hr />
 <h3><code>GET /api/v1/identity/:identity_uuid/files</code></h3>
 <p><strong>Auth</strong>: Required
@@ -227,13 +234,28 @@ curl<span class="w"> </span>-s<span class="w"> </span>-X<span class="w"> </span>
 <div class="codehilite"><pre><span></span><code>curl<span class="w"> </span>-s<span class="w"> </span><span class="s2">&quot;</span><span class="nv">$API</span><span class="s2">/api/v1/identity/</span><span class="nv">$IDENTITY_UUID</span><span class="s2">/files&quot;</span><span class="w"> </span>-H<span class="w"> </span><span class="s2">&quot;X-API-Key: </span><span class="nv">$KEY</span><span class="s2">&quot;</span>
 </code></pre></div>
 
-<hr />
-<h3><code>GET /api/v1/identity/:identity_uuid/faces</code></h3>
-<p><strong>Auth</strong>: Required
-<strong>Scope</strong>: identity-level</p>
-<p>Get all face detection records associated with this identity.</p>
-<h4>Example</h4>
-<div class="codehilite"><pre><span></span><code>curl<span class="w"> </span>-s<span class="w"> </span><span class="s2">&quot;</span><span class="nv">$API</span><span class="s2">/api/v1/identity/</span><span class="nv">$IDENTITY_UUID</span><span class="s2">/faces&quot;</span><span class="w"> </span>-H<span class="w"> </span><span class="s2">&quot;X-API-Key: </span><span class="nv">$KEY</span><span class="s2">&quot;</span>
+<h4>Response (200)</h4>
+<div class="codehilite"><pre><span></span><code><span class="p">{</span>
+<span class="w">  </span><span class="nt">&quot;success&quot;</span><span class="p">:</span><span class="w"> </span><span class="kc">true</span><span class="p">,</span>
+<span class="w">  </span><span class="nt">&quot;identity_uuid&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;a9a901056d6b46ff92da0c3c1a57dff4&quot;</span><span class="p">,</span>
+<span class="w">  </span><span class="nt">&quot;name&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;Cary Grant&quot;</span><span class="p">,</span>
+<span class="w">  </span><span class="nt">&quot;total&quot;</span><span class="p">:</span><span class="w"> </span><span class="mi">3</span><span class="p">,</span>
+<span class="w">  </span><span class="nt">&quot;page&quot;</span><span class="p">:</span><span class="w"> </span><span class="mi">1</span><span class="p">,</span>
+<span class="w">  </span><span class="nt">&quot;page_size&quot;</span><span class="p">:</span><span class="w"> </span><span class="mi">20</span><span class="p">,</span>
+<span class="w">  </span><span class="nt">&quot;data&quot;</span><span class="p">:</span><span class="w"> </span><span class="p">[</span>
+<span class="w">    </span><span class="p">{</span>
+<span class="w">      </span><span class="nt">&quot;file_uuid&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;aeed71342a899fe4b4c57b7d41bcb692&quot;</span><span class="p">,</span>
+<span class="w">      </span><span class="nt">&quot;file_name&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;charade.mp4&quot;</span><span class="p">,</span>
+<span class="w">      </span><span class="nt">&quot;file_path&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;/path/to/charade.mp4&quot;</span><span class="p">,</span>
+<span class="w">      </span><span class="nt">&quot;status&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;done&quot;</span><span class="p">,</span>
+<span class="w">      </span><span class="nt">&quot;face_count&quot;</span><span class="p">:</span><span class="w"> </span><span class="mi">16335</span><span class="p">,</span>
+<span class="w">      </span><span class="nt">&quot;speaker_count&quot;</span><span class="p">:</span><span class="w"> </span><span class="mi">0</span><span class="p">,</span>
+<span class="w">      </span><span class="nt">&quot;first_appearance&quot;</span><span class="p">:</span><span class="w"> </span><span class="mf">206.76</span><span class="p">,</span>
+<span class="w">      </span><span class="nt">&quot;last_appearance&quot;</span><span class="p">:</span><span class="w"> </span><span class="mf">6756.68</span><span class="p">,</span>
+<span class="w">      </span><span class="nt">&quot;confidence&quot;</span><span class="p">:</span><span class="w"> </span><span class="mf">0.8088</span>
+<span class="w">    </span><span class="p">}</span>
+<span class="w">  </span><span class="p">]</span>
+<span class="p">}</span>
 </code></pre></div>
 
 <table class="table">
@@ -246,28 +268,268 @@ curl<span class="w"> </span>-s<span class="w"> </span>-X<span class="w"> </span>
 </thead>
 <tbody>
 <tr>
-<td><code>file_uuid</code></td>
+<td><code>name</code></td>
+<td>string</td>
+<td>Identity display name</td>
+</tr>
+<tr>
+<td><code>data[].file_uuid</code></td>
+<td>string</td>
+<td>File identifier</td>
+</tr>
+<tr>
+<td><code>data[].file_name</code></td>
+<td>string</td>
+<td>File name</td>
+</tr>
+<tr>
+<td><code>data[].face_count</code></td>
+<td>integer</td>
+<td>Number of face detections in this file</td>
+</tr>
+<tr>
+<td><code>data[].first_appearance</code></td>
+<td>float</td>
+<td>First appearance time in seconds</td>
+</tr>
+<tr>
+<td><code>data[].last_appearance</code></td>
+<td>float</td>
+<td>Last appearance time in seconds</td>
+</tr>
+<tr>
+<td><code>data[].confidence</code></td>
+<td>float</td>
+<td>Average confidence (0.0–1.0)</td>
+</tr>
+</tbody>
+</table>
+<hr />
+<h3><code>GET /api/v1/identity/:identity_uuid/faces</code></h3>
+<p><strong>Auth</strong>: Required
+<strong>Scope</strong>: identity-level</p>
+<p>Get all face detection records associated with this identity.</p>
+<h4>Example</h4>
+<div class="codehilite"><pre><span></span><code>curl<span class="w"> </span>-s<span class="w"> </span><span class="s2">&quot;</span><span class="nv">$API</span><span class="s2">/api/v1/identity/</span><span class="nv">$IDENTITY_UUID</span><span class="s2">/faces&quot;</span><span class="w"> </span>-H<span class="w"> </span><span class="s2">&quot;X-API-Key: </span><span class="nv">$KEY</span><span class="s2">&quot;</span>
+</code></pre></div>
+
+<h4>Response (200)</h4>
+<div class="codehilite"><pre><span></span><code><span class="p">{</span>
+<span class="w">  </span><span class="nt">&quot;success&quot;</span><span class="p">:</span><span class="w"> </span><span class="kc">true</span><span class="p">,</span>
+<span class="w">  </span><span class="nt">&quot;identity_uuid&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;a9a901056d6b46ff92da0c3c1a57dff4&quot;</span><span class="p">,</span>
+<span class="w">  </span><span class="nt">&quot;name&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;Cary Grant&quot;</span><span class="p">,</span>
+<span class="w">  </span><span class="nt">&quot;total&quot;</span><span class="p">:</span><span class="w"> </span><span class="mi">963</span><span class="p">,</span>
+<span class="w">  </span><span class="nt">&quot;page&quot;</span><span class="p">:</span><span class="w"> </span><span class="mi">1</span><span class="p">,</span>
+<span class="w">  </span><span class="nt">&quot;page_size&quot;</span><span class="p">:</span><span class="w"> </span><span class="mi">50</span><span class="p">,</span>
+<span class="w">  </span><span class="nt">&quot;data&quot;</span><span class="p">:</span><span class="w"> </span><span class="p">[</span>
+<span class="w">    </span><span class="p">{</span>
+<span class="w">      </span><span class="nt">&quot;id&quot;</span><span class="p">:</span><span class="w"> </span><span class="mi">3902</span><span class="p">,</span>
+<span class="w">      </span><span class="nt">&quot;file_uuid&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;aeed71342a899fe4b4c57b7d41bcb692&quot;</span><span class="p">,</span>
+<span class="w">      </span><span class="nt">&quot;frame_number&quot;</span><span class="p">:</span><span class="w"> </span><span class="mi">37974</span><span class="p">,</span>
+<span class="w">      </span><span class="nt">&quot;timestamp_secs&quot;</span><span class="p">:</span><span class="w"> </span><span class="mf">1518.96</span><span class="p">,</span>
+<span class="w">      </span><span class="nt">&quot;face_id&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;37974_1&quot;</span><span class="p">,</span>
+<span class="w">      </span><span class="nt">&quot;confidence&quot;</span><span class="p">:</span><span class="w"> </span><span class="mf">0.8197</span><span class="p">,</span>
+<span class="w">      </span><span class="nt">&quot;bbox&quot;</span><span class="p">:</span><span class="w"> </span><span class="p">{</span><span class="w"> </span><span class="nt">&quot;x&quot;</span><span class="p">:</span><span class="w"> </span><span class="mi">1097</span><span class="p">,</span><span class="w"> </span><span class="nt">&quot;y&quot;</span><span class="p">:</span><span class="w"> </span><span class="mi">310</span><span class="p">,</span><span class="w"> </span><span class="nt">&quot;width&quot;</span><span class="p">:</span><span class="w"> </span><span class="mi">177</span><span class="p">,</span><span class="w"> </span><span class="nt">&quot;height&quot;</span><span class="p">:</span><span class="w"> </span><span class="mi">177</span><span class="w"> </span><span class="p">}</span>
+<span class="w">    </span><span class="p">}</span>
+<span class="w">  </span><span class="p">]</span>
+<span class="p">}</span>
+</code></pre></div>
+
+<table class="table">
+<thead>
+<tr>
+<th>Field</th>
+<th>Type</th>
+<th>Description</th>
+</tr>
+</thead>
+<tbody>
+<tr>
+<td><code>name</code></td>
+<td>string</td>
+<td>Identity display name</td>
+</tr>
+<tr>
+<td><code>data[].file_uuid</code></td>
 <td>string</td>
 <td>File where face was detected</td>
 </tr>
 <tr>
-<td><code>frame_number</code></td>
+<td><code>data[].frame_number</code></td>
 <td>integer</td>
 <td>Frame number of detection</td>
 </tr>
 <tr>
-<td><code>face_id</code></td>
+<td><code>data[].face_id</code></td>
 <td>string</td>
-<td>Face ID (format: <code>face_{frame_number}</code>)</td>
+<td>Face ID (format: <code>{frame}_{idx}</code>)</td>
 </tr>
 <tr>
-<td><code>confidence</code></td>
+<td><code>data[].confidence</code></td>
 <td>float</td>
 <td>Detection confidence</td>
 </tr>
 </tbody>
 </table>
 <hr />
+<h3><code>GET /api/v1/file/:file_uuid/faces</code></h3>
+<p><strong>Auth</strong>: Required
+<strong>Scope</strong>: identity-level</p>
+<p>List all face detections in a file with binding status. Each face is in one of four binding states:</p>
+<table class="table">
+<thead>
+<tr>
+<th>State</th>
+<th><code>binding</code> response</th>
+<th>Meaning</th>
+</tr>
+</thead>
+<tbody>
+<tr>
+<td><strong>identity</strong></td>
+<td><code>{"identity_id": 9, "identity_uuid": "...", "identity_name": "Audrey Hepburn"}</code></td>
+<td>Face matched to a known TMDb or user-defined identity</td>
+</tr>
+<tr>
+<td><strong>stranger</strong></td>
+<td><code>{"stranger_id": 845, "metadata": {}}</code></td>
+<td>Face matched to an unknown person (trace not matched to any known identity)</td>
+</tr>
+<tr>
+<td><strong>dangling</strong></td>
+<td><code>{"old_identity_id": 18052}</code></td>
+<td>Face was previously bound to an auto-generated identity that has been deleted (orphaned reference)</td>
+</tr>
+<tr>
+<td><strong>unbound</strong></td>
+<td><code>null</code></td>
+<td>Face has no binding at all (identity_id and stranger_id are both NULL)</td>
+</tr>
+</tbody>
+</table>
+<h4>Query Parameters</h4>
+<table class="table">
+<thead>
+<tr>
+<th>Param</th>
+<th>Type</th>
+<th>Default</th>
+<th>Description</th>
+</tr>
+</thead>
+<tbody>
+<tr>
+<td><code>page</code></td>
+<td>int</td>
+<td>1</td>
+<td>Page number</td>
+</tr>
+<tr>
+<td><code>page_size</code></td>
+<td>int</td>
+<td>50</td>
+<td>Items per page</td>
+</tr>
+<tr>
+<td><code>binding</code></td>
+<td>string</td>
+<td>—</td>
+<td>Filter by state: <code>identity</code>, <code>stranger</code>, <code>dangling</code>, or <code>unbound</code></td>
+</tr>
+<tr>
+<td><code>trace_id</code></td>
+<td>int</td>
+<td>—</td>
+<td>Filter by trace ID</td>
+</tr>
+<tr>
+<td><code>min_confidence</code></td>
+<td>float</td>
+<td>—</td>
+<td>Minimum detection confidence (0.0–1.0)</td>
+</tr>
+<tr>
+<td><code>start_frame</code></td>
+<td>int</td>
+<td>—</td>
+<td>Starting frame number (inclusive)</td>
+</tr>
+<tr>
+<td><code>end_frame</code></td>
+<td>int</td>
+<td>—</td>
+<td>Ending frame number (inclusive)</td>
+</tr>
+</tbody>
+</table>
+<h4>Example</h4>
+<div class="codehilite"><pre><span></span><code>curl<span class="w"> </span>-s<span class="w"> </span><span class="s2">&quot;</span><span class="nv">$API</span><span class="s2">/api/v1/file/aeed71342a899fe4b4c57b7d41bcb692/faces?page=1&amp;page_size=2&amp;binding=identity&quot;</span><span class="w"> </span>-H<span class="w"> </span><span class="s2">&quot;X-API-Key: </span><span class="nv">$KEY</span><span class="s2">&quot;</span>
+</code></pre></div>
+
+<h4>Response (200)</h4>
+<div class="codehilite"><pre><span></span><code><span class="p">{</span>
+<span class="w">  </span><span class="nt">&quot;success&quot;</span><span class="p">:</span><span class="w"> </span><span class="kc">true</span><span class="p">,</span>
+<span class="w">  </span><span class="nt">&quot;file_uuid&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;aeed71342a899fe4b4c57b7d41bcb692&quot;</span><span class="p">,</span>
+<span class="w">  </span><span class="nt">&quot;total&quot;</span><span class="p">:</span><span class="w"> </span><span class="mi">52244</span><span class="p">,</span>
+<span class="w">  </span><span class="nt">&quot;page&quot;</span><span class="p">:</span><span class="w"> </span><span class="mi">1</span><span class="p">,</span>
+<span class="w">  </span><span class="nt">&quot;page_size&quot;</span><span class="p">:</span><span class="w"> </span><span class="mi">2</span><span class="p">,</span>
+<span class="w">  </span><span class="nt">&quot;data&quot;</span><span class="p">:</span><span class="w"> </span><span class="p">[</span>
+<span class="w">    </span><span class="p">{</span>
+<span class="w">      </span><span class="nt">&quot;id&quot;</span><span class="p">:</span><span class="w"> </span><span class="mi">661508</span><span class="p">,</span>
+<span class="w">      </span><span class="nt">&quot;file_uuid&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;aeed71342a899fe4b4c57b7d41bcb692&quot;</span><span class="p">,</span>
+<span class="w">      </span><span class="nt">&quot;frame_number&quot;</span><span class="p">:</span><span class="w"> </span><span class="mi">21297</span><span class="p">,</span>
+<span class="w">      </span><span class="nt">&quot;timestamp_secs&quot;</span><span class="p">:</span><span class="w"> </span><span class="mf">851.88</span><span class="p">,</span>
+<span class="w">      </span><span class="nt">&quot;face_id&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;21297_0&quot;</span><span class="p">,</span>
+<span class="w">      </span><span class="nt">&quot;trace_id&quot;</span><span class="p">:</span><span class="w"> </span><span class="mi">485</span><span class="p">,</span>
+<span class="w">      </span><span class="nt">&quot;bbox&quot;</span><span class="p">:</span><span class="w"> </span><span class="p">{</span><span class="w"> </span><span class="nt">&quot;x&quot;</span><span class="p">:</span><span class="w"> </span><span class="mi">1072</span><span class="p">,</span><span class="w"> </span><span class="nt">&quot;y&quot;</span><span class="p">:</span><span class="w"> </span><span class="mi">390</span><span class="p">,</span><span class="w"> </span><span class="nt">&quot;width&quot;</span><span class="p">:</span><span class="w"> </span><span class="mi">56</span><span class="p">,</span><span class="w"> </span><span class="nt">&quot;height&quot;</span><span class="p">:</span><span class="w"> </span><span class="mi">56</span><span class="w"> </span><span class="p">},</span>
+<span class="w">      </span><span class="nt">&quot;confidence&quot;</span><span class="p">:</span><span class="w"> </span><span class="mf">0.6114</span><span class="p">,</span>
+<span class="w">      </span><span class="nt">&quot;binding&quot;</span><span class="p">:</span><span class="w"> </span><span class="p">{</span>
+<span class="w">        </span><span class="nt">&quot;identity_id&quot;</span><span class="p">:</span><span class="w"> </span><span class="mi">9</span><span class="p">,</span>
+<span class="w">        </span><span class="nt">&quot;identity_uuid&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;c3545906-c82d-4b66-aa1d-150bc02decce&quot;</span><span class="p">,</span>
+<span class="w">        </span><span class="nt">&quot;identity_name&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;Audrey Hepburn&quot;</span>
+<span class="w">      </span><span class="p">}</span>
+<span class="w">    </span><span class="p">}</span>
+<span class="w">  </span><span class="p">]</span>
+<span class="p">}</span>
+</code></pre></div>
+
+<table class="table">
+<thead>
+<tr>
+<th>Field</th>
+<th>Type</th>
+<th>Description</th>
+</tr>
+</thead>
+<tbody>
+<tr>
+<td><code>total</code></td>
+<td>int</td>
+<td>Number of faces matching the filter (not total in file)</td>
+</tr>
+<tr>
+<td><code>data[].trace_id</code></td>
+<td>int</td>
+<td>Face tracking trace ID</td>
+</tr>
+<tr>
+<td><code>data[].timestamp_secs</code></td>
+<td>float</td>
+<td>Timestamp in seconds (<code>frame_number / fps</code>)</td>
+</tr>
+<tr>
+<td><code>data[].bbox</code></td>
+<td>object</td>
+<td>Bounding box <code>{x, y, width, height}</code></td>
+</tr>
+<tr>
+<td><code>data[].binding</code></td>
+<td>object/null</td>
+<td>One of four binding states (see table above)</td>
+</tr>
+</tbody>
+</table>
+<hr />
 <h3><code>GET /api/v1/identity/:identity_uuid/chunks</code></h3>
 <p><strong>Auth</strong>: Required
 <strong>Scope</strong>: identity-level</p>
@@ -280,6 +542,10 @@ curl<span class="w"> </span>-s<span class="w"> </span>-X<span class="w"> </span>
 <div class="codehilite"><pre><span></span><code><span class="p">{</span>
 <span class="w">  </span><span class="nt">&quot;success&quot;</span><span class="p">:</span><span class="w"> </span><span class="kc">true</span><span class="p">,</span>
 <span class="w">  </span><span class="nt">&quot;identity_uuid&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;a9a901056d6b46ff92da0c3c1a57dff4&quot;</span><span class="p">,</span>
+<span class="w">  </span><span class="nt">&quot;name&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;Cary Grant&quot;</span><span class="p">,</span>
+<span class="w">  </span><span class="nt">&quot;total&quot;</span><span class="p">:</span><span class="w"> </span><span class="mi">20</span><span class="p">,</span>
+<span class="w">  </span><span class="nt">&quot;page&quot;</span><span class="p">:</span><span class="w"> </span><span class="mi">1</span><span class="p">,</span>
+<span class="w">  </span><span class="nt">&quot;page_size&quot;</span><span class="p">:</span><span class="w"> </span><span class="mi">20</span><span class="p">,</span>
 <span class="w">  </span><span class="nt">&quot;data&quot;</span><span class="p">:</span><span class="w"> </span><span class="p">[</span>
 <span class="w">    </span><span class="p">{</span>
 <span class="w">      </span><span class="nt">&quot;id&quot;</span><span class="p">:</span><span class="w"> </span><span class="mi">0</span><span class="p">,</span>
@@ -307,42 +573,47 @@ curl<span class="w"> </span>-s<span class="w"> </span>-X<span class="w"> </span>
 </thead>
 <tbody>
 <tr>
-<td><code>file_uuid</code></td>
+<td><code>name</code></td>
+<td>string</td>
+<td>Identity display name</td>
+</tr>
+<tr>
+<td><code>data[].file_uuid</code></td>
 <td>string</td>
 <td>File identifier</td>
 </tr>
 <tr>
-<td><code>chunk_id</code></td>
+<td><code>data[].chunk_id</code></td>
 <td>string</td>
 <td>Sentence chunk identifier</td>
 </tr>
 <tr>
-<td><code>start_frame</code></td>
+<td><code>data[].start_frame</code></td>
 <td>integer</td>
 <td>Frame-accurate start position</td>
 </tr>
 <tr>
-<td><code>end_frame</code></td>
+<td><code>data[].end_frame</code></td>
 <td>integer</td>
 <td>Frame-accurate end position</td>
 </tr>
 <tr>
-<td><code>fps</code></td>
+<td><code>data[].fps</code></td>
 <td>float</td>
 <td>Frames per second</td>
 </tr>
 <tr>
-<td><code>start_time</code></td>
+<td><code>data[].start_time</code></td>
 <td>float</td>
 <td>Start time in seconds</td>
 </tr>
 <tr>
-<td><code>end_time</code></td>
+<td><code>data[].end_time</code></td>
 <td>float</td>
 <td>End time in seconds</td>
 </tr>
 <tr>
-<td><code>text_content</code></td>
+<td><code>data[].text_content</code></td>
 <td>string</td>
 <td>Spoken text content</td>
 </tr>
@@ -378,6 +649,11 @@ curl<span class="w"> </span>-s<span class="w"> </span>-X<span class="w"> </span>
 </tr>
 </tbody>
 </table>
+<h4>Side Effects</h4>
+<ul>
+<li>Clears the <code>stranger_id</code> of the bound face detection row (sets it to NULL)</li>
+<li>Does not affect the existing stranger auto-identity record in the <code>identities</code> table</li>
+</ul>
 <h4>Example</h4>
 <div class="codehilite"><pre><span></span><code>curl<span class="w"> </span>-s<span class="w"> </span>-X<span class="w"> </span>POST<span class="w"> </span><span class="s2">&quot;</span><span class="nv">$API</span><span class="s2">/api/v1/identity/</span><span class="nv">$IDENTITY_UUID</span><span class="s2">/bind&quot;</span><span class="w"> </span><span class="se">\</span>
 <span class="w">  </span>-H<span class="w"> </span><span class="s2">&quot;X-API-Key: </span><span class="nv">$KEY</span><span class="s2">&quot;</span><span class="w"> </span><span class="se">\</span>
@@ -386,17 +662,134 @@ curl<span class="w"> </span>-s<span class="w"> </span>-X<span class="w"> </span>
 </code></pre></div>
 
 <hr />
-<h3><code>POST /api/v1/identity/:identity_uuid/unbind</code></h3>
+<h3><code>POST /api/v1/identity/:identity_uuid/bind/trace</code></h3>
 <p><strong>Auth</strong>: Required
 <strong>Scope</strong>: identity-level</p>
-<p>Unbind a face detection from an identity. Removes the identity association from the face record.</p>
-<hr />
-<h3><code>GET /api/v1/identities/search</code></h3>
-<p><strong>Auth</strong>: Required
-<strong>Scope</strong>: identity-level</p>
-<p>Search identities by name (ILIKE search). Returns matching identity records.</p>
+<p>Bind all face detections of a trace to an identity. Updates all rows in <code>face_detections</code> with the matching <code>file_uuid</code> and <code>trace_id</code>.</p>
+<h4>Request Parameters</h4>
+<table class="table">
+<thead>
+<tr>
+<th>Field</th>
+<th>Type</th>
+<th>Required</th>
+<th>Description</th>
+</tr>
+</thead>
+<tbody>
+<tr>
+<td><code>file_uuid</code></td>
+<td>string</td>
+<td>Yes</td>
+<td>File where trace exists</td>
+</tr>
+<tr>
+<td><code>trace_id</code></td>
+<td>integer</td>
+<td>Yes</td>
+<td>Trace ID (from <code>face_detections.trace_id</code>)</td>
+</tr>
+</tbody>
+</table>
+<h4>Side Effects</h4>
+<ul>
+<li>Clears the <code>stranger_id</code> of every face detection row in the trace (sets it to NULL)</li>
+<li>Does not affect the existing stranger auto-identity record in the <code>identities</code> table</li>
+</ul>
 <h4>Example</h4>
-<div class="codehilite"><pre><span></span><code>curl<span class="w"> </span>-s<span class="w"> </span><span class="s2">&quot;</span><span class="nv">$API</span><span class="s2">/api/v1/identities/search?q=Cary&quot;</span><span class="w"> </span>-H<span class="w"> </span><span class="s2">&quot;X-API-Key: </span><span class="nv">$KEY</span><span class="s2">&quot;</span>
+<div class="codehilite"><pre><span></span><code>curl<span class="w"> </span>-s<span class="w"> </span>-X<span class="w"> </span>POST<span class="w"> </span><span class="s2">&quot;</span><span class="nv">$API</span><span class="s2">/api/v1/identity/</span><span class="nv">$IDENTITY_UUID</span><span class="s2">/bind/trace&quot;</span><span class="w"> </span><span class="se">\</span>
+<span class="w">  </span>-H<span class="w"> </span><span class="s2">&quot;X-API-Key: </span><span class="nv">$KEY</span><span class="s2">&quot;</span><span class="w"> </span><span class="se">\</span>
+<span class="w">  </span>-H<span class="w"> </span><span class="s2">&quot;Content-Type: application/json&quot;</span><span class="w"> </span><span class="se">\</span>
+<span class="w">  </span>-d<span class="w"> </span><span class="s1">&#39;{&quot;file_uuid&quot;: &quot;&#39;</span><span class="s2">&quot;</span><span class="nv">$FILE_UUID</span><span class="s2">&quot;</span><span class="s1">&#39;&quot;, &quot;trace_id&quot;: 919}&#39;</span>
+</code></pre></div>
+
+<h4>Response (200)</h4>
+<div class="codehilite"><pre><span></span><code><span class="p">{</span>
+<span class="w">  </span><span class="nt">&quot;success&quot;</span><span class="p">:</span><span class="w"> </span><span class="kc">true</span><span class="p">,</span>
+<span class="w">  </span><span class="nt">&quot;message&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;Bound trace 919 of aeed71342... to Cary Grant&quot;</span><span class="p">,</span>
+<span class="w">  </span><span class="nt">&quot;data&quot;</span><span class="p">:</span><span class="w"> </span><span class="p">{</span><span class="w"> </span><span class="nt">&quot;rows_affected&quot;</span><span class="p">:</span><span class="w"> </span><span class="mi">53</span><span class="w"> </span><span class="p">}</span>
+<span class="p">}</span>
+</code></pre></div>
+
+<h4>Error Responses</h4>
+<table class="table">
+<thead>
+<tr>
+<th>HTTP</th>
+<th>When</th>
+</tr>
+</thead>
+<tbody>
+<tr>
+<td><code>404</code></td>
+<td>Identity not found</td>
+</tr>
+<tr>
+<td><code>500</code></td>
+<td>Database error</td>
+</tr>
+</tbody>
+</table>
+<hr />
+<h3><code>GET /api/v1/identity/:identity_uuid/traces</code></h3>
+<p><strong>Auth</strong>: Required
+<strong>Scope</strong>: identity-level</p>
+<p>Get paginated face traces (continuous tracking segments) associated with this identity across all files.</p>
+<h4>Query Parameters</h4>
+<table class="table">
+<thead>
+<tr>
+<th>Field</th>
+<th>Type</th>
+<th>Required</th>
+<th>Default</th>
+<th>Description</th>
+</tr>
+</thead>
+<tbody>
+<tr>
+<td><code>page</code></td>
+<td>integer</td>
+<td>No</td>
+<td><code>1</code></td>
+<td>Page number</td>
+</tr>
+<tr>
+<td><code>page_size</code></td>
+<td>integer</td>
+<td>No</td>
+<td><code>20</code></td>
+<td>Items per page</td>
+</tr>
+</tbody>
+</table>
+<h4>Example</h4>
+<div class="codehilite"><pre><span></span><code>curl<span class="w"> </span>-s<span class="w"> </span><span class="s2">&quot;</span><span class="nv">$API</span><span class="s2">/api/v1/identity/</span><span class="nv">$IDENTITY_UUID</span><span class="s2">/traces?page=1&amp;page_size=3&quot;</span><span class="w"> </span><span class="se">\</span>
+<span class="w">  </span>-H<span class="w"> </span><span class="s2">&quot;X-API-Key: </span><span class="nv">$KEY</span><span class="s2">&quot;</span><span class="w"> </span><span class="p">|</span><span class="w"> </span>jq<span class="w"> </span><span class="s1">&#39;{total, total_faces, traces}&#39;</span>
+</code></pre></div>
+
+<h4>Response (200)</h4>
+<div class="codehilite"><pre><span></span><code><span class="p">{</span>
+<span class="w">  </span><span class="nt">&quot;success&quot;</span><span class="p">:</span><span class="w"> </span><span class="kc">true</span><span class="p">,</span>
+<span class="w">  </span><span class="nt">&quot;identity_uuid&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;a9a901056d6b46ff92da0c3c1a57dff4&quot;</span><span class="p">,</span>
+<span class="w">  </span><span class="nt">&quot;name&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;Cary Grant&quot;</span><span class="p">,</span>
+<span class="w">  </span><span class="nt">&quot;total&quot;</span><span class="p">:</span><span class="w"> </span><span class="mi">18</span><span class="p">,</span>
+<span class="w">  </span><span class="nt">&quot;page&quot;</span><span class="p">:</span><span class="w"> </span><span class="mi">1</span><span class="p">,</span>
+<span class="w">  </span><span class="nt">&quot;page_size&quot;</span><span class="p">:</span><span class="w"> </span><span class="mi">3</span><span class="p">,</span>
+<span class="w">  </span><span class="nt">&quot;total_faces&quot;</span><span class="p">:</span><span class="w"> </span><span class="mi">542</span><span class="p">,</span>
+<span class="w">  </span><span class="nt">&quot;traces&quot;</span><span class="p">:</span><span class="w"> </span><span class="p">[</span>
+<span class="w">    </span><span class="p">{</span>
+<span class="w">      </span><span class="nt">&quot;file_uuid&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;aeed71342a899fe4b4c57b7d41bcb692&quot;</span><span class="p">,</span>
+<span class="w">      </span><span class="nt">&quot;trace_id&quot;</span><span class="p">:</span><span class="w"> </span><span class="mi">906</span><span class="p">,</span>
+<span class="w">      </span><span class="nt">&quot;frame_count&quot;</span><span class="p">:</span><span class="w"> </span><span class="mi">52</span><span class="p">,</span>
+<span class="w">      </span><span class="nt">&quot;first_frame&quot;</span><span class="p">:</span><span class="w"> </span><span class="mi">37974</span><span class="p">,</span>
+<span class="w">      </span><span class="nt">&quot;last_frame&quot;</span><span class="p">:</span><span class="w"> </span><span class="mi">38127</span><span class="p">,</span>
+<span class="w">      </span><span class="nt">&quot;first_sec&quot;</span><span class="p">:</span><span class="w"> </span><span class="mf">1519.0</span><span class="p">,</span>
+<span class="w">      </span><span class="nt">&quot;last_sec&quot;</span><span class="p">:</span><span class="w"> </span><span class="mf">1525.1</span><span class="p">,</span>
+<span class="w">      </span><span class="nt">&quot;avg_confidence&quot;</span><span class="p">:</span><span class="w"> </span><span class="mf">0.8254</span>
+<span class="w">    </span><span class="p">}</span>
+<span class="w">  </span><span class="p">]</span>
+<span class="p">}</span>
 </code></pre></div>
 
 <table class="table">
@@ -409,24 +802,578 @@ curl<span class="w"> </span>-s<span class="w"> </span>-X<span class="w"> </span>
 </thead>
 <tbody>
 <tr>
+<td><code>success</code></td>
+<td>bool</td>
+<td>Always <code>true</code></td>
+</tr>
+<tr>
+<td><code>identity_uuid</code></td>
+<td>string</td>
+<td>Identity UUID</td>
+</tr>
+<tr>
 <td><code>name</code></td>
 <td>string</td>
-<td>Identity name</td>
+<td>Identity display name</td>
 </tr>
 <tr>
-<td><code>source</code></td>
-<td>string</td>
-<td>Identity source</td>
-</tr>
-<tr>
-<td><code>tmdb_id</code></td>
+<td><code>total</code></td>
 <td>integer</td>
-<td>TMDb ID (if source = tmdb)</td>
+<td>Total number of traces (across all pages)</td>
+</tr>
+<tr>
+<td><code>total_faces</code></td>
+<td>integer</td>
+<td>Sum of all face detections in returned traces</td>
+</tr>
+<tr>
+<td><code>traces[].file_uuid</code></td>
+<td>string</td>
+<td>File where trace exists</td>
+</tr>
+<tr>
+<td><code>traces[].trace_id</code></td>
+<td>integer</td>
+<td>Trace tracking ID</td>
+</tr>
+<tr>
+<td><code>traces[].frame_count</code></td>
+<td>integer</td>
+<td>Number of frames in this trace</td>
+</tr>
+<tr>
+<td><code>traces[].first_frame</code></td>
+<td>integer</td>
+<td>Start frame number</td>
+</tr>
+<tr>
+<td><code>traces[].last_frame</code></td>
+<td>integer</td>
+<td>End frame number</td>
+</tr>
+<tr>
+<td><code>traces[].first_sec</code></td>
+<td>float</td>
+<td>Start time in seconds</td>
+</tr>
+<tr>
+<td><code>traces[].last_sec</code></td>
+<td>float</td>
+<td>End time in seconds</td>
+</tr>
+<tr>
+<td><code>traces[].avg_confidence</code></td>
+<td>float</td>
+<td>Average detection confidence (0.0–1.0)</td>
+</tr>
+</tbody>
+</table>
+<h4>Error Responses</h4>
+<table class="table">
+<thead>
+<tr>
+<th>HTTP</th>
+<th>When</th>
+</tr>
+</thead>
+<tbody>
+<tr>
+<td><code>404</code></td>
+<td>Identity not found</td>
+</tr>
+<tr>
+<td><code>500</code></td>
+<td>Database error</td>
+</tr>
+</tbody>
+</table>
+<hr />
+<h3><code>POST /api/v1/identity/:identity_uuid/unbind</code></h3>
+<p><strong>Auth</strong>: Required
+<strong>Scope</strong>: identity-level</p>
+<p>Unbind a face detection from an identity. Removes the identity association from the face record.</p>
+<h4>Side Effects</h4>
+<ul>
+<li>只清除 <code>identity_id</code>（設為 NULL），<strong>不會恢復 <code>stranger_id</code></strong></li>
+<li>被 unbind 的 face 不會自動成為 stranger</li>
+<li>要重新標記為 stranger 需重新跑 Agent API（<code>identity/analyze</code>）</li>
+</ul>
+<hr />
+<h3><code>POST /api/v1/identity/:identity_uuid/mergeinto</code></h3>
+<p><strong>Auth</strong>: Required
+<strong>Scope</strong>: identity-level</p>
+<p>Transfer all face bindings from this identity to another identity, then either mark the source identity as merged (the default) or delete it, depending on <code>keep_history</code>.</p>
+<h4>Two Merge Cases</h4>
+<table class="table">
+<thead>
+<tr>
+<th>Case</th>
+<th>Description</th>
+<th>Undo Support</th>
+</tr>
+</thead>
+<tbody>
+<tr>
+<td><strong>stranger → identity</strong></td>
+<td>Merge an auto-generated stranger identity into a known identity (TMDb or user-defined)</td>
+<td>✅ 24hr undo</td>
+</tr>
+<tr>
+<td><strong>identity A → identity B</strong></td>
+<td>Merge two known identities (e.g., duplicate entries)</td>
+<td>✅ 24hr undo</td>
+</tr>
+</tbody>
+</table>
+<h4>Request Parameters</h4>
+<table class="table">
+<thead>
+<tr>
+<th>Field</th>
+<th>Type</th>
+<th>Required</th>
+<th>Default</th>
+<th>Description</th>
+</tr>
+</thead>
+<tbody>
+<tr>
+<td><code>into_uuid</code></td>
+<td>string</td>
+<td>Yes</td>
+<td>—</td>
+<td>Target identity UUID to merge into</td>
+</tr>
+<tr>
+<td><code>keep_history</code></td>
+<td>bool</td>
+<td>No</td>
+<td><code>true</code></td>
+<td>Keep source identity record with <code>status='merged'</code> (<code>true</code>) or delete it (<code>false</code>)</td>
+</tr>
+</tbody>
+</table>
+<h4>Side Effects</h4>
+<ul>
+<li>轉移所有 <code>face_detections.identity_id</code> 到目標 identity</li>
+<li>同時清除所有被轉移 rows 的 <code>stranger_id</code></li>
+<li>將 source name 加入 target aliases (with <code>source: "merge"</code> tag)</li>
+<li>將 source aliases 加入 target aliases (if not already present)</li>
+<li>將 source metadata fields 加入 target metadata (if not already present)</li>
+<li><code>keep_history: true</code>（預設）：source identity 設為 <code>status='merged'</code>，保留記錄</li>
+<li><code>keep_history: false</code>：<strong>刪除</strong> source identity 及其 identity JSON 檔案</li>
+<li><strong>記錄 merge history 到 MongoDB</strong>（支援 undo）</li>
+</ul>
+<h4>Example</h4>
+<div class="codehilite"><pre><span></span><code>curl<span class="w"> </span>-s<span class="w"> </span>-X<span class="w"> </span>POST<span class="w"> </span><span class="s2">&quot;</span><span class="nv">$API</span><span class="s2">/api/v1/identity/</span><span class="nv">$SOURCE_UUID</span><span class="s2">/mergeinto&quot;</span><span class="w"> </span><span class="se">\</span>
+<span class="w">  </span>-H<span class="w"> </span><span class="s2">&quot;X-API-Key: </span><span class="nv">$KEY</span><span class="s2">&quot;</span><span class="w"> </span><span class="se">\</span>
+<span class="w">  </span>-H<span class="w"> </span><span class="s2">&quot;Content-Type: application/json&quot;</span><span class="w"> </span><span class="se">\</span>
+<span class="w">  </span>-d<span class="w"> </span><span class="s1">&#39;{&quot;into_uuid&quot;: &quot;&#39;</span><span class="s2">&quot;</span><span class="nv">$TARGET_UUID</span><span class="s2">&quot;</span><span class="s1">&#39;&quot;, &quot;keep_history&quot;: true}&#39;</span>
+</code></pre></div>
+
+<h4>Response (200)</h4>
+<div class="codehilite"><pre><span></span><code><span class="p">{</span>
+<span class="w">  </span><span class="nt">&quot;success&quot;</span><span class="p">:</span><span class="w"> </span><span class="kc">true</span><span class="p">,</span>
+<span class="w">  </span><span class="nt">&quot;message&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;Merged &#39;stranger_13894&#39; into &#39;Louis Viret&#39; (52 faces transferred, history kept)&quot;</span><span class="p">,</span>
+<span class="w">  </span><span class="nt">&quot;data&quot;</span><span class="p">:</span><span class="w"> </span><span class="p">{</span>
+<span class="w">    </span><span class="nt">&quot;merge_id&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;550e8400-e29b-41d4-a716-446655440000&quot;</span><span class="p">,</span>
+<span class="w">    </span><span class="nt">&quot;faces_transferred&quot;</span><span class="p">:</span><span class="w"> </span><span class="mi">52</span><span class="p">,</span>
+<span class="w">    </span><span class="nt">&quot;aliases_added&quot;</span><span class="p">:</span><span class="w"> </span><span class="mi">1</span><span class="p">,</span>
+<span class="w">    </span><span class="nt">&quot;metadata_fields_added&quot;</span><span class="p">:</span><span class="w"> </span><span class="mi">2</span>
+<span class="w">  </span><span class="p">}</span>
+<span class="p">}</span>
+</code></pre></div>
+
+<table class="table">
+<thead>
+<tr>
+<th>Field</th>
+<th>Type</th>
+<th>Description</th>
+</tr>
+</thead>
+<tbody>
+<tr>
+<td><code>merge_id</code></td>
+<td>string</td>
+<td>Unique merge operation ID (for undo)</td>
+</tr>
+<tr>
+<td><code>faces_transferred</code></td>
+<td>integer</td>
+<td>Number of face detections transferred</td>
+</tr>
+<tr>
+<td><code>aliases_added</code></td>
+<td>integer</td>
+<td>Number of aliases added to target</td>
+</tr>
+<tr>
+<td><code>metadata_fields_added</code></td>
+<td>integer</td>
+<td>Number of metadata fields added to target</td>
+</tr>
+</tbody>
+</table>
+<h4>Error Responses</h4>
+<table class="table">
+<thead>
+<tr>
+<th>HTTP</th>
+<th>When</th>
+</tr>
+</thead>
+<tbody>
+<tr>
+<td><code>404</code></td>
+<td>Source or target identity not found</td>
+</tr>
+<tr>
+<td><code>500</code></td>
+<td>Database error</td>
+</tr>
+</tbody>
+</table>
+<hr />
+<h3><code>POST /api/v1/identity/merge/:merge_id/undo</code></h3>
+<p><strong>Auth</strong>: Required
+<strong>Scope</strong>: identity-level</p>
+<p>Undo a merge operation within 24 hours. Restores the source identity and reverts face bindings.</p>
+<h4>Undo Behavior</h4>
+<table class="table">
+<thead>
+<tr>
+<th>Action</th>
+<th>Description</th>
+</tr>
+</thead>
+<tbody>
+<tr>
+<td>Restore source identity</td>
+<td>If <code>keep_history=true</code>: restore status to <code>confirmed</code><br>If <code>keep_history=false</code>: recreate identity from MongoDB snapshot</td>
+</tr>
+<tr>
+<td>Restore faces</td>
+<td>Transfer faces back to source identity</td>
+</tr>
+<tr>
+<td>Remove aliases from target</td>
+<td>Remove aliases with <code>source: "merge"</code> tag</td>
+</tr>
+<tr>
+<td>Remove metadata fields from target</td>
+<td>Remove fields that were added from source</td>
+</tr>
+<tr>
+<td><strong>Preserve manual changes</strong></td>
+<td>Keep aliases/metadata manually added after merge</td>
+</tr>
+</tbody>
+</table>
+<h4>Example</h4>
+<div class="codehilite"><pre><span></span><code>curl<span class="w"> </span>-s<span class="w"> </span>-X<span class="w"> </span>POST<span class="w"> </span><span class="s2">&quot;</span><span class="nv">$API</span><span class="s2">/api/v1/identity/merge/550e8400-e29b-41d4-a716-446655440000/undo&quot;</span><span class="w"> </span><span class="se">\</span>
+<span class="w">  </span>-H<span class="w"> </span><span class="s2">&quot;X-API-Key: </span><span class="nv">$KEY</span><span class="s2">&quot;</span>
+</code></pre></div>
+
+<h4>Response (200)</h4>
+<div class="codehilite"><pre><span></span><code><span class="p">{</span>
+<span class="w">  </span><span class="nt">&quot;success&quot;</span><span class="p">:</span><span class="w"> </span><span class="kc">true</span><span class="p">,</span>
+<span class="w">  </span><span class="nt">&quot;message&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;Undo merge completed: &#39;stranger_13894&#39; restored, 52 faces reverted&quot;</span><span class="p">,</span>
+<span class="w">  </span><span class="nt">&quot;data&quot;</span><span class="p">:</span><span class="w"> </span><span class="p">{</span>
+<span class="w">    </span><span class="nt">&quot;source_identity_restored&quot;</span><span class="p">:</span><span class="w"> </span><span class="p">{</span>
+<span class="w">      </span><span class="nt">&quot;uuid&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;a9a90105...&quot;</span><span class="p">,</span>
+<span class="w">      </span><span class="nt">&quot;name&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;stranger_13894&quot;</span><span class="p">,</span>
+<span class="w">      </span><span class="nt">&quot;status&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;confirmed&quot;</span>
+<span class="w">    </span><span class="p">},</span>
+<span class="w">    </span><span class="nt">&quot;faces_reverted&quot;</span><span class="p">:</span><span class="w"> </span><span class="mi">52</span><span class="p">,</span>
+<span class="w">    </span><span class="nt">&quot;aliases_removed_from_target&quot;</span><span class="p">:</span><span class="w"> </span><span class="mi">1</span><span class="p">,</span>
+<span class="w">    </span><span class="nt">&quot;metadata_fields_removed_from_target&quot;</span><span class="p">:</span><span class="w"> </span><span class="mi">2</span>
+<span class="w">  </span><span class="p">}</span>
+<span class="p">}</span>
+</code></pre></div>
+
+<h4>Error Responses</h4>
+<table class="table">
+<thead>
+<tr>
+<th>HTTP</th>
+<th>When</th>
+</tr>
+</thead>
+<tbody>
+<tr>
+<td><code>400</code></td>
+<td>Undo deadline expired (&gt;24hr) or already undone</td>
+</tr>
+<tr>
+<td><code>404</code></td>
+<td>Merge record not found</td>
+</tr>
+<tr>
+<td><code>500</code></td>
+<td>Database error</td>
+</tr>
+</tbody>
+</table>
+<hr />
+<h3><code>GET /api/v1/identity/merge/history</code></h3>
+<p><strong>Auth</strong>: Required
+<strong>Scope</strong>: identity-level</p>
+<p>Query merge history records from MongoDB.</p>
+<h4>Query Parameters</h4>
+<table class="table">
+<thead>
+<tr>
+<th>Field</th>
+<th>Type</th>
+<th>Required</th>
+<th>Default</th>
+<th>Description</th>
+</tr>
+</thead>
+<tbody>
+<tr>
+<td><code>source_uuid</code></td>
+<td>string</td>
+<td>No</td>
+<td>—</td>
+<td>Filter by source identity UUID</td>
+</tr>
+<tr>
+<td><code>target_uuid</code></td>
+<td>string</td>
+<td>No</td>
+<td>—</td>
+<td>Filter by target identity UUID</td>
+</tr>
+<tr>
+<td><code>merge_id</code></td>
+<td>string</td>
+<td>No</td>
+<td>—</td>
+<td>Filter by specific merge ID</td>
+</tr>
+<tr>
+<td><code>undone</code></td>
+<td>bool</td>
+<td>No</td>
+<td>—</td>
+<td>Filter by undone status</td>
+</tr>
+<tr>
+<td><code>page</code></td>
+<td>integer</td>
+<td>No</td>
+<td>1</td>
+<td>Page number</td>
+</tr>
+<tr>
+<td><code>page_size</code></td>
+<td>integer</td>
+<td>No</td>
+<td>20</td>
+<td>Items per page</td>
+</tr>
+</tbody>
+</table>
+<h4>Example</h4>
+<div class="codehilite"><pre><span></span><code>curl<span class="w"> </span>-s<span class="w"> </span><span class="s2">&quot;</span><span class="nv">$API</span><span class="s2">/api/v1/identity/merge/history?page=1&amp;page_size=10&quot;</span><span class="w"> </span><span class="se">\</span>
+<span class="w">  </span>-H<span class="w"> </span><span class="s2">&quot;X-API-Key: </span><span class="nv">$KEY</span><span class="s2">&quot;</span>
+</code></pre></div>
+
+<h4>Response (200)</h4>
+<div class="codehilite"><pre><span></span><code><span class="p">{</span>
+<span class="w">  </span><span class="nt">&quot;success&quot;</span><span class="p">:</span><span class="w"> </span><span class="kc">true</span><span class="p">,</span>
+<span class="w">  </span><span class="nt">&quot;total&quot;</span><span class="p">:</span><span class="w"> </span><span class="mi">5</span><span class="p">,</span>
+<span class="w">  </span><span class="nt">&quot;page&quot;</span><span class="p">:</span><span class="w"> </span><span class="mi">1</span><span class="p">,</span>
+<span class="w">  </span><span class="nt">&quot;page_size&quot;</span><span class="p">:</span><span class="w"> </span><span class="mi">10</span><span class="p">,</span>
+<span class="w">  </span><span class="nt">&quot;results&quot;</span><span class="p">:</span><span class="w"> </span><span class="p">[</span>
+<span class="w">    </span><span class="p">{</span>
+<span class="w">      </span><span class="nt">&quot;merge_id&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;550e8400-e29b-41d4-a716-446655440000&quot;</span><span class="p">,</span>
+<span class="w">      </span><span class="nt">&quot;source_name&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;stranger_13894&quot;</span><span class="p">,</span>
+<span class="w">      </span><span class="nt">&quot;target_name&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;Louis Viret&quot;</span><span class="p">,</span>
+<span class="w">      </span><span class="nt">&quot;faces_transferred&quot;</span><span class="p">:</span><span class="w"> </span><span class="mi">52</span><span class="p">,</span>
+<span class="w">      </span><span class="nt">&quot;merged_at&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;2026-05-27T10:00:00Z&quot;</span><span class="p">,</span>
+<span class="w">      </span><span class="nt">&quot;undo_deadline&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;2026-05-28T10:00:00Z&quot;</span><span class="p">,</span>
+<span class="w">      </span><span class="nt">&quot;undone&quot;</span><span class="p">:</span><span class="w"> </span><span class="kc">false</span><span class="p">,</span>
+<span class="w">      </span><span class="nt">&quot;undo_expired&quot;</span><span class="p">:</span><span class="w"> </span><span class="kc">false</span>
+<span class="w">    </span><span class="p">}</span>
+<span class="w">  </span><span class="p">]</span>
+<span class="p">}</span>
+</code></pre></div>
+
+<table class="table">
+<thead>
+<tr>
+<th>Field</th>
+<th>Type</th>
+<th>Description</th>
+</tr>
+</thead>
+<tbody>
+<tr>
+<td><code>merge_id</code></td>
+<td>string</td>
+<td>Unique merge operation ID</td>
+</tr>
+<tr>
+<td><code>source_name</code></td>
+<td>string</td>
+<td>Source identity name</td>
+</tr>
+<tr>
+<td><code>target_name</code></td>
+<td>string</td>
+<td>Target identity name</td>
+</tr>
+<tr>
+<td><code>faces_transferred</code></td>
+<td>integer</td>
+<td>Number of faces transferred</td>
+</tr>
+<tr>
+<td><code>merged_at</code></td>
+<td>datetime</td>
+<td>When merge occurred</td>
+</tr>
+<tr>
+<td><code>undo_deadline</code></td>
+<td>datetime</td>
+<td>24hr deadline for undo</td>
+</tr>
+<tr>
+<td><code>undone</code></td>
+<td>bool</td>
+<td>Whether merge was undone</td>
+</tr>
+<tr>
+<td><code>undo_expired</code></td>
+<td>bool</td>
+<td>Whether undo deadline passed</td>
+</tr>
+</tbody>
+</table>
+<hr />
+<h3><code>GET /api/v1/identities/search</code></h3>
+<p><strong>Auth</strong>: Required
+<strong>Scope</strong>: global / file-level</p>
+<p>Search identities by name and find their associated chunks. Matches the query against identity names and aliases, and returns the matching identities together with their associated text chunks.</p>
+<h4>Query Parameters</h4>
+<table class="table">
+<thead>
+<tr>
+<th>Field</th>
+<th>Type</th>
+<th>Required</th>
+<th>Default</th>
+<th>Description</th>
+</tr>
+</thead>
+<tbody>
+<tr>
+<td><code>q</code></td>
+<td>string</td>
+<td>Yes</td>
+<td>—</td>
+<td>Search text (ILIKE match on name and aliases)</td>
 </tr>
 <tr>
 <td><code>file_uuid</code></td>
 <td>string</td>
-<td>Associated file</td>
+<td>No</td>
+<td>—</td>
+<td>Restrict to specific file. If omitted, searches all files (global search)</td>
+</tr>
+<tr>
+<td><code>limit</code></td>
+<td>integer</td>
+<td>No</td>
+<td>50</td>
+<td>Max results</td>
+</tr>
+</tbody>
+</table>
+<h4>Example (Global Search)</h4>
+<div class="codehilite"><pre><span></span><code>curl<span class="w"> </span>-s<span class="w"> </span><span class="s2">&quot;</span><span class="nv">$API</span><span class="s2">/api/v1/identities/search?q=Audrey&quot;</span><span class="w"> </span>-H<span class="w"> </span><span class="s2">&quot;X-API-Key: </span><span class="nv">$KEY</span><span class="s2">&quot;</span>
+</code></pre></div>
+
+<h4>Example (File-specific Search)</h4>
+<div class="codehilite"><pre><span></span><code>curl<span class="w"> </span>-s<span class="w"> </span><span class="s2">&quot;</span><span class="nv">$API</span><span class="s2">/api/v1/identities/search?q=Audrey&amp;file_uuid=</span><span class="nv">$FILE_UUID</span><span class="s2">&quot;</span><span class="w"> </span>-H<span class="w"> </span><span class="s2">&quot;X-API-Key: </span><span class="nv">$KEY</span><span class="s2">&quot;</span>
+</code></pre></div>
+
+<h4>Response (200)</h4>
+<div class="codehilite"><pre><span></span><code><span class="p">{</span>
+<span class="w">  </span><span class="nt">&quot;success&quot;</span><span class="p">:</span><span class="w"> </span><span class="kc">true</span><span class="p">,</span>
+<span class="w">  </span><span class="nt">&quot;total&quot;</span><span class="p">:</span><span class="w"> </span><span class="mi">5</span><span class="p">,</span>
+<span class="w">  </span><span class="nt">&quot;results&quot;</span><span class="p">:</span><span class="w"> </span><span class="p">[</span>
+<span class="w">    </span><span class="p">{</span>
+<span class="w">      </span><span class="nt">&quot;identity_id&quot;</span><span class="p">:</span><span class="w"> </span><span class="mi">9</span><span class="p">,</span>
+<span class="w">      </span><span class="nt">&quot;name&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;Audrey Hepburn&quot;</span><span class="p">,</span>
+<span class="w">      </span><span class="nt">&quot;source&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;tmdb&quot;</span><span class="p">,</span>
+<span class="w">      </span><span class="nt">&quot;tmdb_id&quot;</span><span class="p">:</span><span class="w"> </span><span class="mi">1932</span><span class="p">,</span>
+<span class="w">      </span><span class="nt">&quot;file_uuid&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;a6fb22eebefaef17e62af874997c5944&quot;</span><span class="p">,</span>
+<span class="w">      </span><span class="nt">&quot;trace_id&quot;</span><span class="p">:</span><span class="w"> </span><span class="mi">41</span><span class="p">,</span>
+<span class="w">      </span><span class="nt">&quot;chunk_id&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;llm_parent_..._204_207&quot;</span><span class="p">,</span>
+<span class="w">      </span><span class="nt">&quot;start_time&quot;</span><span class="p">:</span><span class="w"> </span><span class="mf">204.162</span><span class="p">,</span>
+<span class="w">      </span><span class="nt">&quot;text_content&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;...confrontation...&quot;</span>
+<span class="w">    </span><span class="p">}</span>
+<span class="w">  </span><span class="p">]</span>
+<span class="p">}</span>
+</code></pre></div>
+
+<table class="table">
+<thead>
+<tr>
+<th>Field</th>
+<th>Type</th>
+<th>Description</th>
+</tr>
+</thead>
+<tbody>
+<tr>
+<td><code>results[].identity_id</code></td>
+<td>integer</td>
+<td>Identity ID</td>
+</tr>
+<tr>
+<td><code>results[].name</code></td>
+<td>string</td>
+<td>Identity name</td>
+</tr>
+<tr>
+<td><code>results[].source</code></td>
+<td>string</td>
+<td>Identity source (<code>tmdb</code>, <code>user_defined</code>, etc.)</td>
+</tr>
+<tr>
+<td><code>results[].tmdb_id</code></td>
+<td>integer</td>
+<td>TMDb person ID (if source = tmdb)</td>
+</tr>
+<tr>
+<td><code>results[].file_uuid</code></td>
+<td>string</td>
+<td>File where identity appears</td>
+</tr>
+<tr>
+<td><code>results[].trace_id</code></td>
+<td>integer</td>
+<td>Face trace ID</td>
+</tr>
+<tr>
+<td><code>results[].chunk_id</code></td>
+<td>string</td>
+<td>Associated chunk ID</td>
+</tr>
+<tr>
+<td><code>results[].start_time</code></td>
+<td>float</td>
+<td>Chunk start time</td>
+</tr>
+<tr>
+<td><code>results[].text_content</code></td>
+<td>string</td>
+<td>Chunk text content</td>
 </tr>
 </tbody>
 </table>
@@ -699,7 +1646,7 @@ curl<span class="w"> </span>-s<span class="w"> </span>-X<span class="w"> </span>
 
 <p>This <strong>replaces</strong> the entire <code>aliases</code> array. To add to existing aliases, include all existing entries in the request.</p>
 <hr />
-<p>*Updated: 2026-05-22</p>
+<p><em>Updated: 2026-05-25 — Added <code>GET /api/v1/file/:file_uuid/faces</code> with 4 binding states, filters, strangers table split</em></p>
 </div>
 </body>
 </html>
\ No newline at end of file
diff --git a/docs_v1.0/doc/08_media.html b/docs_v1.0/doc/08_media.html
index fe451e0..99543ef 100644
--- a/docs_v1.0/doc/08_media.html
+++ b/docs_v1.0/doc/08_media.html
@@ -294,6 +294,7 @@ curl<span class="w"> </span>-s<span class="w"> </span><span class="s2">&quot;</s
 <hr />
 <h3><code>GET /api/v1/file/:file_uuid/thumbnail</code></h3>
 <p>Extract a single frame from a video as JPEG image. Uses FFmpeg <code>select</code> filter.</p>
+<p>When <code>frame</code> is omitted, the system automatically selects the best representative frame using the TKG bridge (see algorithm below).</p>
 <p><strong>Auth</strong>: Required
 <strong>Scope</strong>: file-level</p>
 <h4>Query Parameters</h4>
@@ -311,9 +312,9 @@ curl<span class="w"> </span>-s<span class="w"> </span><span class="s2">&quot;</s
 <tr>
 <td><code>frame</code></td>
 <td>integer</td>
-<td>Yes</td>
-<td>—</td>
-<td>Zero-based frame number to extract</td>
+<td>No</td>
+<td>auto-detect</td>
+<td>Zero-based frame number to extract. Omit for auto-detect.</td>
 </tr>
 <tr>
 <td><code>x</code></td>
@@ -346,8 +347,23 @@ curl<span class="w"> </span>-s<span class="w"> </span><span class="s2">&quot;</s
 </tbody>
 </table>
 <p>All four crop params (<code>x</code>, <code>y</code>, <code>w</code>, <code>h</code>) must be provided together or omitted.</p>
-<h4>Example</h4>
-<div class="codehilite"><pre><span></span><code><span class="c1"># Extract frame 1000 (full frame)</span>
+<h4>Auto-detect Algorithm</h4>
+<p>When <code>frame</code> is not provided, the endpoint finds the best frame using this fallback chain:</p>
+<ol>
+<li><strong>Main characters</strong>: find the two identities with the most face detections (TMDb source)</li>
+<li><strong>Mutual gaze</strong>: if their face traces have a TKG <code>CO_OCCURS_WITH</code> edge with <code>mutual_gaze=true</code>, take <code>first_frame</code></li>
+<li><strong>Co-occurrence</strong>: fall back to the first frame where both identities appear together</li>
+<li><strong>Single identity</strong>: if only one main identity exists, take its highest-quality face frame</li>
+<li><strong>Any identity</strong>: fall back to the best-quality face frame across all identities</li>
+<li><strong>Error</strong>: if no face exists, returns <code>404</code></li>
+</ol>
+<p>The selected frame is constrained to the <strong>first half of the video</strong> (<code>total_frames / 2</code>).</p>
+<h4>Examples</h4>
+<div class="codehilite"><pre><span></span><code><span class="c1"># Auto-detect best representative frame</span>
+curl<span class="w"> </span>-s<span class="w"> </span><span class="s2">&quot;</span><span class="nv">$API</span><span class="s2">/api/v1/file/</span><span class="nv">$FILE_UUID</span><span class="s2">/thumbnail&quot;</span><span class="w"> </span><span class="se">\</span>
+<span class="w">  </span>-H<span class="w"> </span><span class="s2">&quot;X-API-Key: </span><span class="nv">$KEY</span><span class="s2">&quot;</span><span class="w"> </span>-o<span class="w"> </span>representative.jpg
+
+<span class="c1"># Extract frame 1000 (full frame)</span>
 curl<span class="w"> </span>-s<span class="w"> </span><span class="s2">&quot;</span><span class="nv">$API</span><span class="s2">/api/v1/file/bd80fec92b0b6963d177a2c55bf713e2/thumbnail?frame=1000&quot;</span><span class="w"> </span><span class="se">\</span>
 <span class="w">  </span>-H<span class="w"> </span><span class="s2">&quot;Authorization: Bearer </span><span class="nv">$JWT</span><span class="s2">&quot;</span><span class="w"> </span>-o<span class="w"> </span>frame_1000.jpg
 
@@ -359,10 +375,185 @@ curl<span class="w"> </span>-s<span class="w"> </span><span class="s2">&quot;</s
 <h4>Response</h4>
 <ul>
 <li><strong>200</strong>: <code>image/jpeg</code> binary data</li>
-<li><strong>404</strong>: File not found</li>
+<li><strong>404</strong>: File not found / No faces in file (auto-detect)</li>
 <li><strong>500</strong>: FFmpeg error (e.g., frame number exceeds video duration)</li>
 </ul>
-<h3><code>GET /api/v1/file/:file_uuid/clip</code></h3>
+<h4>Technical Details</h4>
+<table class="table">
+<thead>
+<tr>
+<th>Detail</th>
+<th>Value</th>
+</tr>
+</thead>
+<tbody>
+<tr>
+<td><strong>Backend</strong></td>
+<td>FFmpeg (<code>ffmpeg-full</code>)</td>
+</tr>
+<tr>
+<td><strong>Filter</strong></td>
+<td><code>select=eq(n\,FRAME)</code> to select frame, optional <code>crop=W:H:X:Y</code></td>
+</tr>
+<tr>
+<td><strong>Output</strong></td>
+<td>Single JPEG via pipe (<code>image2pipe</code>, <code>mjpeg</code> codec)</td>
+</tr>
+<tr>
+<td><strong>Cache</strong></td>
+<td><code>Cache-Control: public, max-age=86400</code> (24h)</td>
+</tr>
+<tr>
+<td><strong>Frame number</strong></td>
+<td>Zero-based (<code>frame=0</code> = first frame of video)</td>
+</tr>
+</tbody>
+</table>
+<hr />
+<h3><code>GET /api/v1/file/:file_uuid/representative-frame</code></h3>
+<p>Return JSON metadata about the best representative frame for the video. Uses the same auto-detect algorithm as <code>GET /api/v1/file/:file_uuid/thumbnail</code> when <code>frame</code> is omitted, but returns metadata instead of an image (no crop support).</p>
+<p><strong>Auth</strong>: Required
+<strong>Scope</strong>: file-level</p>
+<h4>Example</h4>
+<div class="codehilite"><pre><span></span><code>curl<span class="w"> </span>-s<span class="w"> </span><span class="s2">&quot;</span><span class="nv">$API</span><span class="s2">/api/v1/file/</span><span class="nv">$FILE_UUID</span><span class="s2">/representative-frame&quot;</span><span class="w"> </span><span class="se">\</span>
+<span class="w">  </span>-H<span class="w"> </span><span class="s2">&quot;X-API-Key: </span><span class="nv">$KEY</span><span class="s2">&quot;</span><span class="w"> </span><span class="p">|</span><span class="w"> </span>jq<span class="w"> </span><span class="s1">&#39;.&#39;</span>
+</code></pre></div>
+
+<h4>Response (200)</h4>
+<div class="codehilite"><pre><span></span><code><span class="p">{</span>
+<span class="w">  </span><span class="nt">&quot;success&quot;</span><span class="p">:</span><span class="w"> </span><span class="kc">true</span><span class="p">,</span>
+<span class="w">  </span><span class="nt">&quot;file_uuid&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;aeed71342a899fe4b4c57b7d41bcb692&quot;</span><span class="p">,</span>
+<span class="w">  </span><span class="nt">&quot;frame_number&quot;</span><span class="p">:</span><span class="w"> </span><span class="mi">38165</span><span class="p">,</span>
+<span class="w">  </span><span class="nt">&quot;timestamp_secs&quot;</span><span class="p">:</span><span class="w"> </span><span class="mf">1526.6</span><span class="p">,</span>
+<span class="w">  </span><span class="nt">&quot;face_quality&quot;</span><span class="p">:</span><span class="w"> </span><span class="mf">37292.97</span><span class="p">,</span>
+<span class="w">  </span><span class="nt">&quot;main_identities&quot;</span><span class="p">:</span><span class="w"> </span><span class="p">[</span>
+<span class="w">    </span><span class="p">{</span>
+<span class="w">      </span><span class="nt">&quot;identity_uuid&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;c3545906-c82d-4b66-aa1d-150bc02decce&quot;</span><span class="p">,</span>
+<span class="w">      </span><span class="nt">&quot;name&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;Audrey Hepburn&quot;</span><span class="p">,</span>
+<span class="w">      </span><span class="nt">&quot;face_count&quot;</span><span class="p">:</span><span class="w"> </span><span class="mi">16456</span>
+<span class="w">    </span><span class="p">},</span>
+<span class="w">    </span><span class="p">{</span>
+<span class="w">      </span><span class="nt">&quot;identity_uuid&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;2b0ddefe-e2a9-4533-9308-b375594604d5&quot;</span><span class="p">,</span>
+<span class="w">      </span><span class="nt">&quot;name&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;Cary Grant&quot;</span><span class="p">,</span>
+<span class="w">      </span><span class="nt">&quot;face_count&quot;</span><span class="p">:</span><span class="w"> </span><span class="mi">10643</span>
+<span class="w">    </span><span class="p">}</span>
+<span class="w">  </span><span class="p">],</span>
+<span class="w">  </span><span class="nt">&quot;traces&quot;</span><span class="p">:</span><span class="w"> </span><span class="p">[</span>
+<span class="w">    </span><span class="p">{</span>
+<span class="w">      </span><span class="nt">&quot;trace_id&quot;</span><span class="p">:</span><span class="w"> </span><span class="mi">919</span><span class="p">,</span>
+<span class="w">      </span><span class="nt">&quot;identity_uuid&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;2b0ddefe-e2a9-4533-9308-b375594604d5&quot;</span><span class="p">,</span>
+<span class="w">      </span><span class="nt">&quot;name&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;Cary Grant&quot;</span><span class="p">,</span>
+<span class="w">      </span><span class="nt">&quot;x&quot;</span><span class="p">:</span><span class="w"> </span><span class="mi">764</span><span class="p">,</span>
+<span class="w">      </span><span class="nt">&quot;y&quot;</span><span class="p">:</span><span class="w"> </span><span class="mi">237</span><span class="p">,</span>
+<span class="w">      </span><span class="nt">&quot;width&quot;</span><span class="p">:</span><span class="w"> </span><span class="mi">199</span><span class="p">,</span>
+<span class="w">      </span><span class="nt">&quot;height&quot;</span><span class="p">:</span><span class="w"> </span><span class="mi">199</span><span class="p">,</span>
+<span class="w">      </span><span class="nt">&quot;confidence&quot;</span><span class="p">:</span><span class="w"> </span><span class="mf">0.8426</span>
+<span class="w">    </span><span class="p">},</span>
+<span class="w">    </span><span class="p">{</span>
+<span class="w">      </span><span class="nt">&quot;trace_id&quot;</span><span class="p">:</span><span class="w"> </span><span class="mi">920</span><span class="p">,</span>
+<span class="w">      </span><span class="nt">&quot;identity_uuid&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;c3545906-c82d-4b66-aa1d-150bc02decce&quot;</span><span class="p">,</span>
+<span class="w">      </span><span class="nt">&quot;name&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;Audrey Hepburn&quot;</span><span class="p">,</span>
+<span class="w">      </span><span class="nt">&quot;x&quot;</span><span class="p">:</span><span class="w"> </span><span class="mi">1143</span><span class="p">,</span>
+<span class="w">      </span><span class="nt">&quot;y&quot;</span><span class="p">:</span><span class="w"> </span><span class="mi">312</span><span class="p">,</span>
+<span class="w">      </span><span class="nt">&quot;width&quot;</span><span class="p">:</span><span class="w"> </span><span class="mi">215</span><span class="p">,</span>
+<span class="w">      </span><span class="nt">&quot;height&quot;</span><span class="p">:</span><span class="w"> </span><span class="mi">215</span><span class="p">,</span>
+<span class="w">      </span><span class="nt">&quot;confidence&quot;</span><span class="p">:</span><span class="w"> </span><span class="mf">0.8068</span>
+<span class="w">    </span><span class="p">}</span>
+<span class="w">  </span><span class="p">]</span>
+<span class="p">}</span>
+</code></pre></div>
+
+<h4>Response Fields</h4>
+<table class="table">
+<thead>
+<tr>
+<th>Field</th>
+<th>Type</th>
+<th>Description</th>
+</tr>
+</thead>
+<tbody>
+<tr>
+<td><code>frame_number</code></td>
+<td>integer</td>
+<td>Selected representative frame number; this is the authoritative position from which <code>timestamp_secs</code> is derived</td>
+</tr>
+<tr>
+<td><code>timestamp_secs</code></td>
+<td>float</td>
+<td>Time in seconds (derived from <code>frame_number / fps</code>)</td>
+</tr>
+<tr>
+<td><code>face_quality</code></td>
+<td>float</td>
+<td>Quality score of the best face at this frame, computed as bounding-box area (<code>width × height</code>) × <code>confidence</code></td>
+</tr>
+<tr>
+<td><code>main_identities</code></td>
+<td>array</td>
+<td>Top 2 most frequent TMDb identities in the file</td>
+</tr>
+<tr>
+<td><code>main_identities[].name</code></td>
+<td>string</td>
+<td>Identity display name</td>
+</tr>
+<tr>
+<td><code>main_identities[].face_count</code></td>
+<td>integer</td>
+<td>Total number of face detections for this identity in the file</td>
+</tr>
+<tr>
+<td><code>traces</code></td>
+<td>array</td>
+<td>All face traces present at the selected frame</td>
+</tr>
+<tr>
+<td><code>traces[].trace_id</code></td>
+<td>integer</td>
+<td>Face trace ID</td>
+</tr>
+<tr>
+<td><code>traces[].identity_uuid</code></td>
+<td>string or null</td>
+<td>Matched identity UUID</td>
+</tr>
+<tr>
+<td><code>traces[].name</code></td>
+<td>string or null</td>
+<td>Identity name</td>
+</tr>
+<tr>
+<td><code>traces[].x, y, width, height</code></td>
+<td>integer</td>
+<td>Bounding box coordinates</td>
+</tr>
+<tr>
+<td><code>traces[].confidence</code></td>
+<td>float</td>
+<td>Detection confidence (0.0–1.0)</td>
+</tr>
+</tbody>
+</table>
+<h4>Error Responses</h4>
+<table class="table">
+<thead>
+<tr>
+<th>HTTP</th>
+<th>When</th>
+</tr>
+</thead>
+<tbody>
+<tr>
+<td><code>404</code></td>
+<td>File not found / No faces in file</td>
+</tr>
+<tr>
+<td><code>500</code></td>
+<td>Database error</td>
+</tr>
+</tbody>
+</table><hr /><h3><code>GET /api/v1/file/:file_uuid/clip</code></h3>
 <p>Extract a video clip (time range) as MPEG-TS stream. Uses FFmpeg <code>-ss</code> fast seek.</p>
 <p><strong>Auth</strong>: Required
 <strong>Scope</strong>: file-level</p>
diff --git a/docs_v1.0/doc/12_agent.html b/docs_v1.0/doc/12_agent.html
index 6532a47..166ef43 100644
--- a/docs_v1.0/doc/12_agent.html
+++ b/docs_v1.0/doc/12_agent.html
@@ -209,7 +209,191 @@ a { color: #0066cc; }
 </tbody>
 </table>
 <hr />
-<p><em>Updated: 2026-05-19 12:49:24</em></p>
+<h2>POST /api/v1/agents/search</h2>
+<p>Conversational search assistant. Uses Gemma4 function calling to automatically decide which tools to call based on the user's natural language query. Supports multi-turn conversation.</p>
+<h3>Request</h3>
+<div class="codehilite"><pre><span></span><code><span class="p">{</span>
+<span class="w">  </span><span class="nt">&quot;query&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;Audrey Hepburn 和 Cary Grant 第一次同框在哪個 frame？&quot;</span><span class="p">,</span>
+<span class="w">  </span><span class="nt">&quot;conversation_id&quot;</span><span class="p">:</span><span class="w"> </span><span class="kc">null</span><span class="p">,</span>
+<span class="w">  </span><span class="nt">&quot;file_uuid&quot;</span><span class="p">:</span><span class="w"> </span><span class="kc">null</span>
+<span class="p">}</span>
+</code></pre></div>
+
+<table class="table">
+<thead>
+<tr>
+<th>Field</th>
+<th>Type</th>
+<th>Required</th>
+<th>Description</th>
+</tr>
+</thead>
+<tbody>
+<tr>
+<td><code>query</code></td>
+<td>string</td>
+<td>✅</td>
+<td>自然語言查詢</td>
+</tr>
+<tr>
+<td><code>conversation_id</code></td>
+<td>string</td>
+<td>❌</td>
+<td>延續對話時傳入；新對話不傳</td>
+</tr>
+<tr>
+<td><code>file_uuid</code></td>
+<td>string</td>
+<td>❌</td>
+<td>Portal 有選中檔案時可指定</td>
+</tr>
+</tbody>
+</table>
+<h3>Response</h3>
+<div class="codehilite"><pre><span></span><code><span class="p">{</span>
+<span class="w">  </span><span class="nt">&quot;success&quot;</span><span class="p">:</span><span class="w"> </span><span class="kc">true</span><span class="p">,</span>
+<span class="w">  </span><span class="nt">&quot;conversation_id&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;conv_abc123&quot;</span><span class="p">,</span>
+<span class="w">  </span><span class="nt">&quot;answer&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;在 Charade (1963) 中，Audrey Hepburn 與 Cary Grant 第一次同框在第 38619 幀（約 1544.76 秒）。&quot;</span><span class="p">,</span>
+<span class="w">  </span><span class="nt">&quot;need_input&quot;</span><span class="p">:</span><span class="w"> </span><span class="kc">false</span><span class="p">,</span>
+<span class="w">  </span><span class="nt">&quot;sources&quot;</span><span class="p">:</span><span class="w"> </span><span class="p">[</span>
+<span class="w">    </span><span class="p">{</span>
+<span class="w">      </span><span class="nt">&quot;tool&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;tkg_query&quot;</span><span class="p">,</span>
+<span class="w">      </span><span class="nt">&quot;result&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;{\&quot;first_cooccurrence\&quot;:{\&quot;frame\&quot;:38619,\&quot;timestamp_secs\&quot;:1544.76}}&quot;</span>
+<span class="w">    </span><span class="p">}</span>
+<span class="w">  </span><span class="p">]</span>
+<span class="p">}</span>
+</code></pre></div>
+
+<table class="table">
+<thead>
+<tr>
+<th>Field</th>
+<th>Type</th>
+<th>Description</th>
+</tr>
+</thead>
+<tbody>
+<tr>
+<td><code>conversation_id</code></td>
+<td>string</td>
+<td>後續對話需要傳入此 ID</td>
+</tr>
+<tr>
+<td><code>answer</code></td>
+<td>string</td>
+<td>Agent 的自然語言回答（或反問）</td>
+</tr>
+<tr>
+<td><code>need_input</code></td>
+<td>boolean</td>
+<td><code>true</code> 表示 agent 需要更多資訊才能回答</td>
+</tr>
+<tr>
+<td><code>suggestions</code></td>
+<td>string[]</td>
+<td>建議用戶提供的線索（當 <code>need_input=true</code>）</td>
+</tr>
+<tr>
+<td><code>sources</code></td>
+<td>array</td>
+<td>引用的工具執行結果</td>
+</tr>
+</tbody>
+</table>
+<h3>Conversation Flow</h3>
+<div class="codehilite"><pre><span></span><code>Round 1: POST /agents/search { query: &quot;我想看男女主角同框&quot; }
+         → need_input: true, suggestions: [&quot;片名&quot;, &quot;演員&quot;, &quot;年代&quot;]
+         → answer: &quot;請問是哪部電影？請提供更多線索&quot;
+
+Round 2: POST /agents/search { query: &quot;奧黛麗赫本&quot;, conversation_id: &quot;...&quot; }
+         → need_input: false
+         → answer: &quot;找到 Charade (1963)，Audrey Hepburn 和 Cary Grant...&quot;
+</code></pre></div>
+
+<h3>Available Tools</h3>
+<p>Agent 內部使用 Gemma4 function calling 自動調用以下工具：</p>
+<table class="table">
+<thead>
+<tr>
+<th>Tool</th>
+<th>Description</th>
+</tr>
+</thead>
+<tbody>
+<tr>
+<td><code>find_file</code></td>
+<td>透過片名/演員/年份關鍵字搜尋影片，回傳 file_uuid + has_data 狀態</td>
+</tr>
+<tr>
+<td><code>list_files</code></td>
+<td>列出近期註冊的影片</td>
+</tr>
+<tr>
+<td><code>tkg_query</code></td>
+<td>查詢人物互動資料（7 種子類型：top_identities、first_cooccurrence、identity_details、mutual_gaze、interaction_network、identity_traces、file_info）</td>
+</tr>
+<tr>
+<td><code>smart_search</code></td>
+<td>文字內容 ILIKE 搜尋 chunk（可指定 file_uuid 限制範圍）</td>
+</tr>
+<tr>
+<td><code>get_identity_detail</code></td>
+<td>查詢單一身份的詳細資料（角色、TMDb 資訊）</td>
+</tr>
+<tr>
+<td><code>get_file_info</code></td>
+<td>查詢影片基本資訊（片長、解析度）</td>
+</tr>
+<tr>
+<td><code>get_representative_frame</code></td>
+<td>查詢影片最具代表性的 frame 資訊</td>
+</tr>
+</tbody>
+</table>
+<h3>Design Principles</h3>
+<ul>
+<li><strong>用戶不需要知道 file_uuid</strong> — Agent 會自動用 <code>find_file</code> 搜尋或反問</li>
+<li><strong>不推薦無資料的影片</strong> — <code>has_data=false</code> 的影片不會被推薦給用戶</li>
+<li><strong>多輪對話</strong> — 透過 <code>conversation_id</code> 延續上下文，agent 會記得之前的交流</li>
+<li><strong>並行工具呼叫</strong> — Gemma4 可以一次呼叫多個工具再綜合回答</li>
+</ul>
+<h3>Model</h3>
+<table class="table">
+<thead>
+<tr>
+<th>Detail</th>
+<th>Value</th>
+</tr>
+</thead>
+<tbody>
+<tr>
+<td><strong>LLM</strong></td>
+<td>Gemma4 26B (Q5_K_M)</td>
+</tr>
+<tr>
+<td><strong>Engine</strong></td>
+<td>llama.cpp at <code>localhost:8082</code></td>
+</tr>
+<tr>
+<td><strong>Endpoint</strong></td>
+<td><code>/v1/chat/completions</code> (OpenAI-compatible)</td>
+</tr>
+<tr>
+<td><strong>Temperature</strong></td>
+<td>0.1</td>
+</tr>
+<tr>
+<td><strong>Max rounds</strong></td>
+<td>5 (tool call iterations)</td>
+</tr>
+<tr>
+<td><strong>Conversation TTL</strong></td>
+<td>30 minutes</td>
+</tr>
+</tbody>
+</table>
+<hr />
+<p><em>Updated: 2026-05-22</em></p>
 </div>
 </body>
 </html>
\ No newline at end of file
diff --git a/docs_v1.0/doc_developer/14_identity_history.html b/docs_v1.0/doc_developer/14_identity_history.html
new file mode 100644
index 0000000..568e9a9
--- /dev/null
+++ b/docs_v1.0/doc_developer/14_identity_history.html
@@ -0,0 +1,470 @@
+<!DOCTYPE html>
+<html lang="en">
+<head>
+<meta charset="UTF-8">
+<title>14 Identity History - Momentry API Docs</title>
+<style>
+* { margin: 0; padding: 0; box-sizing: border-box; }
+body { font-family: -apple-system, BlinkMacSystemFont, 'Segoe UI', Roboto, sans-serif; background: #f5f5f5; color: #333; padding: 40px; }
+.container { max-width: 960px; margin: 0 auto; background: white; border-radius: 12px; box-shadow: 0 2px 12px rgba(0,0,0,0.08); padding: 40px; }
+h1 { font-size: 24px; margin: 24px 0 12px; }
+h2 { font-size: 20px; margin: 20px 0 10px; color: #222; }
+h3 { font-size: 16px; margin: 16px 0 8px; color: #444; }
+p { line-height: 1.6; margin: 8px 0; }
+table { border-collapse: collapse; width: 100%; margin: 12px 0; font-size: 14px; }
+th, td { border: 1px solid #ddd; padding: 8px 12px; text-align: left; }
+th { background: #f0f0f0; font-weight: 600; }
+code { background: #f0f0f0; padding: 2px 6px; border-radius: 3px; font-size: 13px; }
+pre { background: #f8f8f8; border: 1px solid #ddd; border-radius: 6px; padding: 12px; overflow-x: auto; margin: 12px 0; }
+pre code { background: none; padding: 0; }
+a { color: #0066cc; }
+.back { display: inline-block; margin-bottom: 20px; color: #666; }
+.back:hover { color: #333; }
+.topbar { display: flex; justify-content: space-between; align-items: center; margin-bottom: 20px; }
+.logout-btn { font-size: 13px; color: #999; text-decoration: none; }
+.logout-btn:hover { color: #cc0000; }
+</style>
+</head>
+<body>
+<div class="container">
+<div class="topbar">
+<a class="back" href="index.html">&larr; Back to index</a>
+<a class="logout-btn" href="#" onclick="fetch('/api/v1/auth/logout',{method:'POST'}).then(()=>window.location.reload());return false">Logout</a>
+</div>
+<!-- module: identity_history -->
+<!-- description: Identity PATCH operation history, undo, and redo -->
+<!-- depends: 01_auth, 07_identity -->
+
+<h2>Identity Operation History</h2>
+<p>Every <code>PATCH /api/v1/identity/:identity_uuid</code> automatically records a before/after snapshot in the <code>identity_history</code> table. Use undo/redo to revert or reapply changes, and history to inspect the operation log.</p>
+<h3>History System Overview</h3>
+<table class="table">
+<thead>
+<tr>
+<th>Property</th>
+<th>Value</th>
+</tr>
+</thead>
+<tbody>
+<tr>
+<td>Storage</td>
+<td>PostgreSQL <code>identity_history</code> table</td>
+</tr>
+<tr>
+<td>Snapshot</td>
+<td>Full identity record (all fields) before and after each PATCH</td>
+</tr>
+<tr>
+<td>Max records</td>
+<td>256 per identity (oldest auto-deleted when limit exceeded)</td>
+</tr>
+<tr>
+<td>Undo steps</td>
+<td>No expiry and no per-call step limit; bounded only by the retained history (at most 256 records per identity)</td>
+</tr>
+<tr>
+<td>Redo stack</td>
+<td>Cleared on new PATCH (<code>is_undone=true</code> records are deleted)</td>
+</tr>
+</tbody>
+</table>
+<h4>Stack Model</h4>
+<div class="codehilite"><pre><span></span><code>PATCH 1 → PATCH 2 → PATCH 3         (undo stack, is_undone=false)
+                           ↓ undo
+PATCH 1 → PATCH 2                   (undo stack)
+           PATCH 3                   (redo stack, is_undone=true)
+                           ↓ redo
+PATCH 1 → PATCH 2 → PATCH 3         (undo stack)
+</code></pre></div>
+
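+<p>If a new PATCH is applied while PATCH 3 is still on the redo stack (that is, after the undo but before the redo), the redo stack is cleared and PATCH 3 can no longer be redone.</p>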
+<hr />
+<h3><code>POST /api/v1/identity/:identity_uuid/undo</code></h3>
+<p><strong>Auth</strong>: Required
+<strong>Scope</strong>: identity-level</p>
+<p>Undo the most recent PATCH operations. Restores the identity's <code>before_snapshot</code> and marks the history records as undone.</p>
+<h4>Request (JSON)</h4>
+<table class="table">
+<thead>
+<tr>
+<th>Field</th>
+<th>Type</th>
+<th>Required</th>
+<th>Default</th>
+<th>Description</th>
+</tr>
+</thead>
+<tbody>
+<tr>
+<td><code>steps</code></td>
+<td>integer</td>
+<td>No</td>
+<td><code>1</code></td>
+<td>Number of most recent PATCH operations to undo in this call (an upper bound; fewer are undone if the undo stack is shorter)</td>
+</tr>
+</tbody>
+</table>
+<h4>Behavior</h4>
+<ul>
+<li>Queries <code>is_undone=false</code> records, ordered by <code>created_at DESC</code></li>
+<li>Restores <code>name</code>, <code>identity_type</code>, <code>source</code>, <code>status</code>, <code>metadata</code>, <code>tmdb_id</code>, <code>tmdb_profile</code> from the <code>before_snapshot</code> of the oldest record being undone (the last one in the selected, newest-first set)</li>
+<li>Marks the undone records as <code>is_undone=true</code> with <code>undone_at=NOW()</code></li>
+<li>Syncs <code>identity.json</code> to disk</li>
+<li>Updates <code>_index.json</code> if name changed</li>
+</ul>
+<h4>Example</h4>
+<div class="codehilite"><pre><span></span><code>curl<span class="w"> </span>-s<span class="w"> </span>-X<span class="w"> </span>POST<span class="w"> </span><span class="s2">&quot;</span><span class="nv">$API</span><span class="s2">/api/v1/identity/</span><span class="nv">$IDENTITY_UUID</span><span class="s2">/undo&quot;</span><span class="w"> </span><span class="se">\</span>
+<span class="w">  </span>-H<span class="w"> </span><span class="s2">&quot;X-API-Key: </span><span class="nv">$KEY</span><span class="s2">&quot;</span><span class="w"> </span><span class="se">\</span>
+<span class="w">  </span>-H<span class="w"> </span><span class="s2">&quot;Content-Type: application/json&quot;</span><span class="w"> </span><span class="se">\</span>
+<span class="w">  </span>-d<span class="w"> </span><span class="s1">&#39;{&quot;steps&quot;: 1}&#39;</span>
+</code></pre></div>
+
+<h4>Response (200)</h4>
+<div class="codehilite"><pre><span></span><code><span class="p">{</span>
+<span class="w">  </span><span class="nt">&quot;success&quot;</span><span class="p">:</span><span class="w"> </span><span class="kc">true</span><span class="p">,</span>
+<span class="w">  </span><span class="nt">&quot;identity_uuid&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;a9a901056d6b46ff92da0c3c1a57dff4&quot;</span><span class="p">,</span>
+<span class="w">  </span><span class="nt">&quot;undone_count&quot;</span><span class="p">:</span><span class="w"> </span><span class="mi">1</span><span class="p">,</span>
+<span class="w">  </span><span class="nt">&quot;current_state&quot;</span><span class="p">:</span><span class="w"> </span><span class="p">{</span>
+<span class="w">    </span><span class="nt">&quot;id&quot;</span><span class="p">:</span><span class="w"> </span><span class="mi">9</span><span class="p">,</span>
+<span class="w">    </span><span class="nt">&quot;uuid&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;a9a901056d6b46ff92da0c3c1a57dff4&quot;</span><span class="p">,</span>
+<span class="w">    </span><span class="nt">&quot;name&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;Cary Grant&quot;</span><span class="p">,</span>
+<span class="w">    </span><span class="nt">&quot;identity_type&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;people&quot;</span><span class="p">,</span>
+<span class="w">    </span><span class="nt">&quot;source&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;tmdb&quot;</span><span class="p">,</span>
+<span class="w">    </span><span class="nt">&quot;status&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;confirmed&quot;</span><span class="p">,</span>
+<span class="w">    </span><span class="nt">&quot;metadata&quot;</span><span class="p">:</span><span class="w"> </span><span class="p">{},</span>
+<span class="w">    </span><span class="nt">&quot;tmdb_id&quot;</span><span class="p">:</span><span class="w"> </span><span class="mi">112</span><span class="p">,</span>
+<span class="w">    </span><span class="nt">&quot;tmdb_profile&quot;</span><span class="p">:</span><span class="w"> </span><span class="kc">null</span>
+<span class="w">  </span><span class="p">}</span>
+<span class="p">}</span>
+</code></pre></div>
+
+<table class="table">
+<thead>
+<tr>
+<th>Field</th>
+<th>Type</th>
+<th>Description</th>
+</tr>
+</thead>
+<tbody>
+<tr>
+<td><code>undone_count</code></td>
+<td>integer</td>
+<td>Number of history records undone</td>
+</tr>
+<tr>
+<td><code>current_state</code></td>
+<td>object</td>
+<td>Full identity state after undo</td>
+</tr>
+</tbody>
+</table>
+<h4>Error Responses</h4>
+<table class="table">
+<thead>
+<tr>
+<th>HTTP</th>
+<th>When</th>
+</tr>
+</thead>
+<tbody>
+<tr>
+<td><code>400</code></td>
+<td>No undo operations available</td>
+</tr>
+<tr>
+<td><code>404</code></td>
+<td>Identity not found</td>
+</tr>
+<tr>
+<td><code>500</code></td>
+<td>Database error</td>
+</tr>
+</tbody>
+</table>
+<hr />
+<h3><code>POST /api/v1/identity/:identity_uuid/redo</code></h3>
+<p><strong>Auth</strong>: Required
+<strong>Scope</strong>: identity-level</p>
+<p>Redo previously undone PATCH operations. Restores the identity's <code>after_snapshot</code> and marks the history records as no longer undone.</p>
+<h4>Request (JSON)</h4>
+<table class="table">
+<thead>
+<tr>
+<th>Field</th>
+<th>Type</th>
+<th>Required</th>
+<th>Default</th>
+<th>Description</th>
+</tr>
+</thead>
+<tbody>
+<tr>
+<td><code>steps</code></td>
+<td>integer</td>
+<td>No</td>
+<td><code>1</code></td>
+<td>Number of redo steps to apply</td>
+</tr>
+</tbody>
+</table>
+<h4>Behavior</h4>
+<ul>
+<li>Queries <code>is_undone=true</code> records, ordered by <code>created_at DESC</code></li>
+<li>Restores all identity fields from the last record's <code>after_snapshot</code></li>
+<li>Marks records as <code>is_undone=false</code> with <code>undone_at=NULL</code></li>
+<li>Syncs <code>identity.json</code> to disk</li>
+<li>Updates <code>_index.json</code> if name changed</li>
+</ul>
+<h4>Example</h4>
+<div class="codehilite"><pre><span></span><code>curl<span class="w"> </span>-s<span class="w"> </span>-X<span class="w"> </span>POST<span class="w"> </span><span class="s2">&quot;</span><span class="nv">$API</span><span class="s2">/api/v1/identity/</span><span class="nv">$IDENTITY_UUID</span><span class="s2">/redo&quot;</span><span class="w"> </span><span class="se">\</span>
+<span class="w">  </span>-H<span class="w"> </span><span class="s2">&quot;X-API-Key: </span><span class="nv">$KEY</span><span class="s2">&quot;</span><span class="w"> </span><span class="se">\</span>
+<span class="w">  </span>-H<span class="w"> </span><span class="s2">&quot;Content-Type: application/json&quot;</span><span class="w"> </span><span class="se">\</span>
+<span class="w">  </span>-d<span class="w"> </span><span class="s1">&#39;{&quot;steps&quot;: 1}&#39;</span>
+</code></pre></div>
+
+<h4>Response (200)</h4>
+<div class="codehilite"><pre><span></span><code><span class="p">{</span>
+<span class="w">  </span><span class="nt">&quot;success&quot;</span><span class="p">:</span><span class="w"> </span><span class="kc">true</span><span class="p">,</span>
+<span class="w">  </span><span class="nt">&quot;identity_uuid&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;a9a901056d6b46ff92da0c3c1a57dff4&quot;</span><span class="p">,</span>
+<span class="w">  </span><span class="nt">&quot;redone_count&quot;</span><span class="p">:</span><span class="w"> </span><span class="mi">1</span><span class="p">,</span>
+<span class="w">  </span><span class="nt">&quot;current_state&quot;</span><span class="p">:</span><span class="w"> </span><span class="p">{</span>
+<span class="w">    </span><span class="nt">&quot;id&quot;</span><span class="p">:</span><span class="w"> </span><span class="mi">9</span><span class="p">,</span>
+<span class="w">    </span><span class="nt">&quot;uuid&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;a9a901056d6b46ff92da0c3c1a57dff4&quot;</span><span class="p">,</span>
+<span class="w">    </span><span class="nt">&quot;name&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;John Smith&quot;</span><span class="p">,</span>
+<span class="w">    </span><span class="nt">&quot;identity_type&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;people&quot;</span><span class="p">,</span>
+<span class="w">    </span><span class="nt">&quot;source&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;tmdb&quot;</span><span class="p">,</span>
+<span class="w">    </span><span class="nt">&quot;status&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;confirmed&quot;</span><span class="p">,</span>
+<span class="w">    </span><span class="nt">&quot;metadata&quot;</span><span class="p">:</span><span class="w"> </span><span class="p">{</span><span class="w"> </span><span class="nt">&quot;aliases&quot;</span><span class="p">:</span><span class="w"> </span><span class="p">[</span><span class="err">...</span><span class="p">]</span><span class="w"> </span><span class="p">},</span>
+<span class="w">    </span><span class="nt">&quot;tmdb_id&quot;</span><span class="p">:</span><span class="w"> </span><span class="mi">112</span><span class="p">,</span>
+<span class="w">    </span><span class="nt">&quot;tmdb_profile&quot;</span><span class="p">:</span><span class="w"> </span><span class="kc">null</span>
+<span class="w">  </span><span class="p">}</span>
+<span class="p">}</span>
+</code></pre></div>
+
+<table class="table">
+<thead>
+<tr>
+<th>Field</th>
+<th>Type</th>
+<th>Description</th>
+</tr>
+</thead>
+<tbody>
+<tr>
+<td><code>redone_count</code></td>
+<td>integer</td>
+<td>Number of history records redone</td>
+</tr>
+<tr>
+<td><code>current_state</code></td>
+<td>object</td>
+<td>Full identity state after redo</td>
+</tr>
+</tbody>
+</table>
+<h4>Error Responses</h4>
+<table class="table">
+<thead>
+<tr>
+<th>HTTP</th>
+<th>When</th>
+</tr>
+</thead>
+<tbody>
+<tr>
+<td><code>400</code></td>
+<td>No redo operations available</td>
+</tr>
+<tr>
+<td><code>404</code></td>
+<td>Identity not found</td>
+</tr>
+<tr>
+<td><code>500</code></td>
+<td>Database error</td>
+</tr>
+</tbody>
+</table>
+<hr />
+<h3><code>GET /api/v1/identity/:identity_uuid/history</code></h3>
+<p><strong>Auth</strong>: Required
+<strong>Scope</strong>: identity-level</p>
+<p>Query the operation history for an identity. Returns paginated records with undo/redo stack counts.</p>
+<h4>Query Parameters</h4>
+<table class="table">
+<thead>
+<tr>
+<th>Field</th>
+<th>Type</th>
+<th>Required</th>
+<th>Default</th>
+<th>Description</th>
+</tr>
+</thead>
+<tbody>
+<tr>
+<td><code>page</code></td>
+<td>integer</td>
+<td>No</td>
+<td><code>1</code></td>
+<td>Page number (1-indexed)</td>
+</tr>
+<tr>
+<td><code>limit</code></td>
+<td>integer</td>
+<td>No</td>
+<td><code>20</code></td>
+<td>Items per page (max 100)</td>
+</tr>
+</tbody>
+</table>
+<h4>Response (200)</h4>
+<div class="codehilite"><pre><span></span><code><span class="p">{</span>
+<span class="w">  </span><span class="nt">&quot;success&quot;</span><span class="p">:</span><span class="w"> </span><span class="kc">true</span><span class="p">,</span>
+<span class="w">  </span><span class="nt">&quot;identity_uuid&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;a9a901056d6b46ff92da0c3c1a57dff4&quot;</span><span class="p">,</span>
+<span class="w">  </span><span class="nt">&quot;total&quot;</span><span class="p">:</span><span class="w"> </span><span class="mi">5</span><span class="p">,</span>
+<span class="w">  </span><span class="nt">&quot;undo_stack_count&quot;</span><span class="p">:</span><span class="w"> </span><span class="mi">3</span><span class="p">,</span>
+<span class="w">  </span><span class="nt">&quot;redo_stack_count&quot;</span><span class="p">:</span><span class="w"> </span><span class="mi">2</span><span class="p">,</span>
+<span class="w">  </span><span class="nt">&quot;results&quot;</span><span class="p">:</span><span class="w"> </span><span class="p">[</span>
+<span class="w">    </span><span class="p">{</span>
+<span class="w">      </span><span class="nt">&quot;history_id&quot;</span><span class="p">:</span><span class="w"> </span><span class="mi">42</span><span class="p">,</span>
+<span class="w">      </span><span class="nt">&quot;operation&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;update&quot;</span><span class="p">,</span>
+<span class="w">      </span><span class="nt">&quot;is_undone&quot;</span><span class="p">:</span><span class="w"> </span><span class="kc">false</span><span class="p">,</span>
+<span class="w">      </span><span class="nt">&quot;created_at&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;2026-05-27T12:00:00Z&quot;</span><span class="p">,</span>
+<span class="w">      </span><span class="nt">&quot;undone_at&quot;</span><span class="p">:</span><span class="w"> </span><span class="kc">null</span>
+<span class="w">    </span><span class="p">},</span>
+<span class="w">    </span><span class="p">{</span>
+<span class="w">      </span><span class="nt">&quot;history_id&quot;</span><span class="p">:</span><span class="w"> </span><span class="mi">41</span><span class="p">,</span>
+<span class="w">      </span><span class="nt">&quot;operation&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;update&quot;</span><span class="p">,</span>
+<span class="w">      </span><span class="nt">&quot;is_undone&quot;</span><span class="p">:</span><span class="w"> </span><span class="kc">true</span><span class="p">,</span>
+<span class="w">      </span><span class="nt">&quot;created_at&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;2026-05-27T11:30:00Z&quot;</span><span class="p">,</span>
+<span class="w">      </span><span class="nt">&quot;undone_at&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;2026-05-27T13:00:00Z&quot;</span>
+<span class="w">    </span><span class="p">}</span>
+<span class="w">  </span><span class="p">]</span>
+<span class="p">}</span>
+</code></pre></div>
+
+<table class="table">
+<thead>
+<tr>
+<th>Field</th>
+<th>Type</th>
+<th>Description</th>
+</tr>
+</thead>
+<tbody>
+<tr>
+<td><code>total</code></td>
+<td>integer</td>
+<td>Total history records for this identity</td>
+</tr>
+<tr>
+<td><code>undo_stack_count</code></td>
+<td>integer</td>
+<td>Records available for undo (<code>is_undone=false</code>)</td>
+</tr>
+<tr>
+<td><code>redo_stack_count</code></td>
+<td>integer</td>
+<td>Records available for redo (<code>is_undone=true</code>)</td>
+</tr>
+<tr>
+<td><code>results[].history_id</code></td>
+<td>integer</td>
+<td>History record ID</td>
+</tr>
+<tr>
+<td><code>results[].operation</code></td>
+<td>string</td>
+<td>Operation type (<code>"update"</code> for PATCH)</td>
+</tr>
+<tr>
+<td><code>results[].is_undone</code></td>
+<td>boolean</td>
+<td>Whether the operation has been undone</td>
+</tr>
+<tr>
+<td><code>results[].created_at</code></td>
+<td>string</td>
+<td>When the PATCH was applied</td>
+</tr>
+<tr>
+<td><code>results[].undone_at</code></td>
+<td>string or null</td>
+<td>When the undo occurred (null if not undone)</td>
+</tr>
+</tbody>
+</table>
+<h4>Example</h4>
+<div class="codehilite"><pre><span></span><code>curl<span class="w"> </span>-s<span class="w"> </span><span class="s2">&quot;</span><span class="nv">$API</span><span class="s2">/api/v1/identity/</span><span class="nv">$IDENTITY_UUID</span><span class="s2">/history?page=1&amp;limit=10&quot;</span><span class="w"> </span><span class="se">\</span>
+<span class="w">  </span>-H<span class="w"> </span><span class="s2">&quot;X-API-Key: </span><span class="nv">$KEY</span><span class="s2">&quot;</span>
+</code></pre></div>
+
+<h4>Error Responses</h4>
+<table class="table">
+<thead>
+<tr>
+<th>HTTP</th>
+<th>When</th>
+</tr>
+</thead>
+<tbody>
+<tr>
+<td><code>404</code></td>
+<td>Identity not found</td>
+</tr>
+<tr>
+<td><code>500</code></td>
+<td>Database error</td>
+</tr>
+</tbody>
+</table>
+<hr />
+<h3>Comparison: PATCH Undo vs Merge Undo</h3>
+<table class="table">
+<thead>
+<tr>
+<th>Aspect</th>
+<th>PATCH Undo/Redo</th>
+<th>Merge Undo</th>
+</tr>
+</thead>
+<tbody>
+<tr>
+<td>Storage</td>
+<td>PostgreSQL <code>identity_history</code></td>
+<td>MongoDB <code>identity_merge_history</code></td>
+</tr>
+<tr>
+<td>Trigger</td>
+<td>Every PATCH</td>
+<td>Every mergeinto with <code>keep_history=true</code></td>
+</tr>
+<tr>
+<td>Undo deadline</td>
+<td>None (unlimited)</td>
+<td>24 hours</td>
+</tr>
+<tr>
+<td>Redo support</td>
+<td>Yes</td>
+<td>No</td>
+</tr>
+<tr>
+<td>Step undo</td>
+<td>Yes (<code>steps</code> param)</td>
+<td>No (full undo only)</td>
+</tr>
+<tr>
+<td>Max records</td>
+<td>256 per identity</td>
+<td>Unlimited</td>
+</tr>
+</tbody>
+</table>
+<hr />
+<p><em>Updated: 2026-05-28</em></p>
+</div>
+</body>
+</html>
\ No newline at end of file
diff --git a/docs_v1.0/doc_developer/index.html b/docs_v1.0/doc_developer/index.html
index 033e6da..d87cd1a 100644
--- a/docs_v1.0/doc_developer/index.html
+++ b/docs_v1.0/doc_developer/index.html
@@ -29,7 +29,7 @@ a:hover td { background: #f8f8f8; border-radius: 4px; }
 <a class="logout-btn" href="#" onclick="fetch('/api/v1/auth/logout',{method:'POST'}).then(()=>window.location.reload());return false">Logout</a>
 </div>
 <p class="subtitle">API 參考手冊 — 登入後可瀏覽各模組文件</p>
-<table><tr onclick="window.location='11_error_codes.html'" style="cursor:pointer"><td class="cn">錯誤碼</td><td class="en">Error Codes</td></tr></table>
+<table><tr onclick="window.location='11_error_codes.html'" style="cursor:pointer"><td class="cn">錯誤碼</td><td class="en">Error Codes</td></tr><tr onclick="window.location='14_identity_history.html'" style="cursor:pointer"><td class="cn">身分歷史紀錄</td><td class="en">Identity History</td></tr></table>
 </div>
 </body>
 </html>
\ No newline at end of file
diff --git a/docs_v1.0/doc_user/API_ACCESS.html b/docs_v1.0/doc_user/API_ACCESS.html
new file mode 100644
index 0000000..257ca11
--- /dev/null
+++ b/docs_v1.0/doc_user/API_ACCESS.html
@@ -0,0 +1,358 @@
+<!DOCTYPE html>
+<html lang="zh-Hant">
+<head>
+<meta charset="UTF-8">
+<title>API Access - Momentry API Docs</title>
+<style>
+* { margin: 0; padding: 0; box-sizing: border-box; }
+body { font-family: -apple-system, BlinkMacSystemFont, 'Segoe UI', Roboto, sans-serif; background: #f5f5f5; color: #333; padding: 40px; }
+.container { max-width: 960px; margin: 0 auto; background: white; border-radius: 12px; box-shadow: 0 2px 12px rgba(0,0,0,0.08); padding: 40px; }
+h1 { font-size: 24px; margin: 24px 0 12px; }
+h2 { font-size: 20px; margin: 20px 0 10px; color: #222; }
+h3 { font-size: 16px; margin: 16px 0 8px; color: #444; }
+p { line-height: 1.6; margin: 8px 0; }
+table { border-collapse: collapse; width: 100%; margin: 12px 0; font-size: 14px; }
+th, td { border: 1px solid #ddd; padding: 8px 12px; text-align: left; }
+th { background: #f0f0f0; font-weight: 600; }
+code { background: #f0f0f0; padding: 2px 6px; border-radius: 3px; font-size: 13px; }
+pre { background: #f8f8f8; border: 1px solid #ddd; border-radius: 6px; padding: 12px; overflow-x: auto; margin: 12px 0; }
+pre code { background: none; padding: 0; }
+a { color: #0066cc; }
+.back { display: inline-block; margin-bottom: 20px; color: #666; }
+.back:hover { color: #333; }
+</style>
+</head>
+<body>
+<div class="container">
+<a class="back" href="index.html">&larr; Back to index</a>
+<h1>Momentry Core API 存取指南</h1>
+<table class="table">
+<thead>
+<tr>
+<th>項目</th>
+<th>內容</th>
+</tr>
+</thead>
+<tbody>
+<tr>
+<td>版本</td>
+<td>V1.3</td>
+</tr>
+<tr>
+<td>日期</td>
+<td>2026-03-25</td>
+</tr>
+<tr>
+<td>用途</td>
+<td>API 存取方式、端點與整合指南</td>
+</tr>
+</tbody>
+</table>
+<hr />
+<h2>版本歷史</h2>
+<table class="table">
+<thead>
+<tr>
+<th>版本</th>
+<th>日期</th>
+<th>目的</th>
+<th>操作人</th>
+<th>工具/模型</th>
+</tr>
+</thead>
+<tbody>
+<tr>
+<td>V1.3</td>
+<td>2026-03-25</td>
+<td>更新: n8n 搜尋回傳 <code>file_path</code> 取代 <code>media_url</code>，新增 API Key 驗證說明</td>
+<td>OpenCode</td>
+<td>deepseek-reasoner</td>
+</tr>
+<tr>
+<td>V1.2</td>
+<td>2026-03-24</td>
+<td>更新網址與服務列表</td>
+<td>Warren</td>
+<td>OpenCode / MiniMax M2.5</td>
+</tr>
+<tr>
+<td>V1.1</td>
+<td>2026-03-23</td>
+<td>初始版本</td>
+<td>Warren</td>
+<td>OpenCode / MiniMax M2.5</td>
+</tr>
+</tbody>
+</table>
+<hr />
+<h2>基本網址</h2>
+<table class="table">
+<thead>
+<tr>
+<th>環境</th>
+<th>URL</th>
+<th>說明</th>
+</tr>
+</thead>
+<tbody>
+<tr>
+<td><strong>本地開發</strong></td>
+<td><code>http://localhost:3002</code></td>
+<td>直接訪問 API，繞過反向代理</td>
+</tr>
+<tr>
+<td><strong>外部訪問</strong></td>
+<td><code>https://m5api.momentry.ddns.net</code></td>
+<td>通過 Caddy 反向代理訪問，需網路可達</td>
+</tr>
+</tbody>
+</table>
+<h3>何時使用哪個 URL</h3>
+<p><strong>使用 <code>localhost:3002</code>：</strong></p>
+<ul><li>開發/測試環境</li>
+<li>直接在伺服器上操作</li>
+<li>當反向代理有問題時</li></ul>
+<p><strong>使用 <code>m5api.momentry.ddns.net</code>：</strong></p>
+<ul><li>n8n workflow 中呼叫 API</li>
+<li>外部系統整合</li>
+<li>生產環境</li></ul>
+<h2>認證</h2>
+<p>所有 <code>/api/v1/*</code> 端點（除了健康檢查 <code>/health</code> 與 <code>/health/detailed</code>）都需要 API Key 認證。</p>
+<p>請在請求標頭中加入：</p>
+<div class="codehilite"><pre><span></span><code>X-API-Key: YOUR_API_KEY
+</code></pre></div>
+
+<p><strong>目前示範使用的 API Key</strong>: <code>demo_api_key_12345</code></p>
+<blockquote>
+<p><strong>注意</strong>: 正式環境請使用安全的 API Key 管理機制，避免在客戶端暴露 API Key。</p>
+</blockquote>
+<hr />
+<h2>影片搜尋 API</h2>
+<h3>語意搜尋</h3>
+<p><strong>端點：</strong> <code>POST /api/v1/search</code></p>
+<p><strong>請求：</strong></p>
+<div class="codehilite"><pre><span></span><code><span class="p">{</span>
+<span class="w">  </span><span class="nt">&quot;query&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;charade&quot;</span><span class="p">,</span>
+<span class="w">  </span><span class="nt">&quot;limit&quot;</span><span class="p">:</span><span class="w"> </span><span class="mi">5</span><span class="p">,</span>
+<span class="w">  </span><span class="nt">&quot;uuid&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;a1b10138a6bbb0cd&quot;</span>
+<span class="p">}</span>
+</code></pre></div>
+
+<table class="table">
+<thead>
+<tr>
+<th>欄位</th>
+<th>類型</th>
+<th>必填</th>
+<th>說明</th>
+</tr>
+</thead>
+<tbody>
+<tr>
+<td><code>query</code></td>
+<td>字串</td>
+<td>是</td>
+<td>搜尋文字</td>
+</tr>
+<tr>
+<td><code>limit</code></td>
+<td>整數</td>
+<td>否</td>
+<td>最大回傳結果數（預設 10）</td>
+</tr>
+<tr>
+<td><code>uuid</code></td>
+<td>字串</td>
+<td>否</td>
+<td>依影片 UUID 過濾</td>
+</tr>
+</tbody>
+</table>
+<p><strong>回應：</strong></p>
+<div class="codehilite"><pre><span></span><code><span class="p">{</span>
+<span class="w">  </span><span class="nt">&quot;results&quot;</span><span class="p">:</span><span class="w"> </span><span class="p">[</span>
+<span class="w">    </span><span class="p">{</span>
+<span class="w">      </span><span class="nt">&quot;uuid&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;a1b10138a6bbb0cd&quot;</span><span class="p">,</span>
+<span class="w">      </span><span class="nt">&quot;chunk_id&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;sentence_0006&quot;</span><span class="p">,</span>
+<span class="w">      </span><span class="nt">&quot;chunk_type&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;sentence&quot;</span><span class="p">,</span>
+<span class="w">      </span><span class="nt">&quot;start_time&quot;</span><span class="p">:</span><span class="w"> </span><span class="mf">48.8</span><span class="p">,</span>
+<span class="w">      </span><span class="nt">&quot;end_time&quot;</span><span class="p">:</span><span class="w"> </span><span class="mf">55.44</span><span class="p">,</span>
+<span class="w">      </span><span class="nt">&quot;text&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;fun plot twists, Woody Dialog and charming performances...&quot;</span><span class="p">,</span>
+<span class="w">      </span><span class="nt">&quot;score&quot;</span><span class="p">:</span><span class="w"> </span><span class="mf">0.526</span>
+<span class="w">    </span><span class="p">}</span>
+<span class="w">  </span><span class="p">],</span>
+<span class="w">  </span><span class="nt">&quot;query&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;charade&quot;</span>
+<span class="p">}</span>
+</code></pre></div>
+
+<hr />
+<h3>n8n 整合搜尋</h3>
+<p><strong>端點：</strong> <code>POST /api/v1/n8n/search</code></p>
+<p><strong>請求：</strong></p>
+<div class="codehilite"><pre><span></span><code><span class="p">{</span>
+<span class="w">  </span><span class="nt">&quot;query&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;charade&quot;</span><span class="p">,</span>
+<span class="w">  </span><span class="nt">&quot;limit&quot;</span><span class="p">:</span><span class="w"> </span><span class="mi">5</span>
+<span class="p">}</span>
+</code></pre></div>
+
+<p><strong>回應：</strong></p>
+<div class="codehilite"><pre><span></span><code><span class="p">{</span>
+<span class="w">  </span><span class="nt">&quot;query&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;charade&quot;</span><span class="p">,</span>
+<span class="w">  </span><span class="nt">&quot;count&quot;</span><span class="p">:</span><span class="w"> </span><span class="mi">5</span><span class="p">,</span>
+<span class="w">  </span><span class="nt">&quot;hits&quot;</span><span class="p">:</span><span class="w"> </span><span class="p">[</span>
+<span class="w">    </span><span class="p">{</span>
+<span class="w">      </span><span class="nt">&quot;id&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;sentence_0006&quot;</span><span class="p">,</span>
+<span class="w">      </span><span class="nt">&quot;vid&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;a1b10138a6bbb0cd&quot;</span><span class="p">,</span>
+<span class="w">      </span><span class="nt">&quot;start&quot;</span><span class="p">:</span><span class="w"> </span><span class="mf">48.8</span><span class="p">,</span>
+<span class="w">      </span><span class="nt">&quot;end&quot;</span><span class="p">:</span><span class="w"> </span><span class="mf">55.44</span><span class="p">,</span>
+<span class="w">      </span><span class="nt">&quot;title&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;Chunk sentence_0006&quot;</span><span class="p">,</span>
+<span class="w">      </span><span class="nt">&quot;text&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;fun plot twists...&quot;</span><span class="p">,</span>
+<span class="w">      </span><span class="nt">&quot;score&quot;</span><span class="p">:</span><span class="w"> </span><span class="mf">0.526</span><span class="p">,</span>
+<span class="w">      </span><span class="nt">&quot;file_path&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;/Users/accusys/momentry/var/sftpgo/data/demo/Old_Time_Movie_Show_-_Charade_1963.HD.mov&quot;</span>
+<span class="w">    </span><span class="p">}</span>
+<span class="w">  </span><span class="p">]</span>
+<span class="p">}</span>
+</code></pre></div>
+
+<blockquote>
+<p><strong>注意</strong>: API 現在返回 <code>file_path</code>（檔案系統路徑）而非 <code>media_url</code>（網頁 URL）。如需在網頁中播放影片，請將檔案路徑轉換為可訪問的 URL（例如透過 SFTPGo 分享連結）。</p>
+</blockquote>
+<hr />
+<h2>影片管理 API</h2>
+<h3>列出所有影片</h3>
+<p><strong>端點：</strong> <code>GET /api/v1/videos</code></p>
+<h3>查詢影片資訊</h3>
+<p><strong>端點：</strong> <code>GET /api/v1/lookup?uuid={uuid}</code> 或 <code>GET /api/v1/lookup?path={path}</code></p>
+<h3>取得處理進度</h3>
+<p><strong>端點：</strong> <code>GET /api/v1/progress/{uuid}</code></p>
+<hr />
+<h2>區塊資料結構</h2>
+<p>每個搜尋結果包含影片播放的時間資訊：</p>
+<table class="table">
+<thead>
+<tr>
+<th>欄位</th>
+<th>說明</th>
+</tr>
+</thead>
+<tbody>
+<tr>
+<td><code>uuid</code></td>
+<td>影片識別碼</td>
+</tr>
+<tr>
+<td><code>chunk_id</code></td>
+<td>區塊唯一識別碼</td>
+</tr>
+<tr>
+<td><code>chunk_type</code></td>
+<td>類型：<code>sentence</code>、<code>cut</code>、<code>time_based</code></td>
+</tr>
+<tr>
+<td><code>start_time</code></td>
+<td>開始時間（秒）</td>
+</tr>
+<tr>
+<td><code>end_time</code></td>
+<td>結束時間（秒）</td>
+</tr>
+<tr>
+<td><code>text</code></td>
+<td>語音轉文字內容</td>
+</tr>
+<tr>
+<td><code>score</code></td>
+<td>相關性分數（0-1）</td>
+</tr>
+</tbody>
+</table>
+<hr />
+<h2>整合範例</h2>
+<h3>JavaScript/fetch</h3>
+<div class="codehilite"><pre><span></span><code><span class="kd">const</span><span class="w"> </span><span class="nx">response</span><span class="w"> </span><span class="o">=</span><span class="w"> </span><span class="k">await</span><span class="w"> </span><span class="nx">fetch</span><span class="p">(</span><span class="s1">&#39;http://localhost:3002/api/v1/search&#39;</span><span class="p">,</span><span class="w"> </span><span class="p">{</span>
+<span class="w">  </span><span class="nx">method</span><span class="o">:</span><span class="w"> </span><span class="s1">&#39;POST&#39;</span><span class="p">,</span>
+<span class="w">  </span><span class="nx">headers</span><span class="o">:</span><span class="w"> </span><span class="p">{</span><span class="w"> </span>
+<span class="w">    </span><span class="s1">&#39;Content-Type&#39;</span><span class="o">:</span><span class="w"> </span><span class="s1">&#39;application/json&#39;</span><span class="p">,</span>
+<span class="w">    </span><span class="s1">&#39;X-API-Key&#39;</span><span class="o">:</span><span class="w"> </span><span class="s1">&#39;YOUR_API_KEY&#39;</span><span class="w">  </span><span class="c1">// 替換為實際的 API Key</span>
+<span class="w">  </span><span class="p">},</span>
+<span class="w">  </span><span class="nx">body</span><span class="o">:</span><span class="w"> </span><span class="nb">JSON</span><span class="p">.</span><span class="nx">stringify</span><span class="p">({</span><span class="w"> </span><span class="nx">query</span><span class="o">:</span><span class="w"> </span><span class="s1">&#39;charade&#39;</span><span class="p">,</span><span class="w"> </span><span class="nx">limit</span><span class="o">:</span><span class="w"> </span><span class="mf">5</span><span class="w"> </span><span class="p">})</span>
+<span class="p">});</span>
+<span class="kd">const</span><span class="w"> </span><span class="nx">data</span><span class="w"> </span><span class="o">=</span><span class="w"> </span><span class="k">await</span><span class="w"> </span><span class="nx">response</span><span class="p">.</span><span class="nx">json</span><span class="p">();</span>
+<span class="nx">console</span><span class="p">.</span><span class="nx">log</span><span class="p">(</span><span class="nx">data</span><span class="p">.</span><span class="nx">results</span><span class="p">);</span>
+</code></pre></div>
+
+<h3>PHP/cURL</h3>
+<div class="codehilite"><pre><span></span><code><span class="x">$ch = curl_init(&#39;http://localhost:3002/api/v1/search&#39;);</span>
+<span class="x">curl_setopt($ch, CURLOPT_POST, true);</span>
+<span class="x">curl_setopt($ch, CURLOPT_POSTFIELDS, json_encode([</span>
+<span class="x">  &#39;query&#39; =&gt; &#39;charade&#39;,</span>
+<span class="x">  &#39;limit&#39; =&gt; 5</span>
+<span class="x">]));</span>
+<span class="x">curl_setopt($ch, CURLOPT_HTTPHEADER, [</span>
+<span class="x">  &#39;Content-Type: application/json&#39;,</span>
+<span class="x">  &#39;X-API-Key: YOUR_API_KEY&#39;  // 替換為實際的 API Key</span>
+<span class="x">]);</span>
+<span class="x">$response = curl_exec($ch);</span>
+<span class="x">$data = json_decode($response, true);</span>
+</code></pre></div>
+
+<hr />
+<h2>影片嵌入網址</h2>
+<blockquote>
+<p><strong>重要</strong>: API 現在返回 <code>file_path</code>（檔案系統路徑），而非直接可訪問的網址。您需要將檔案路徑轉換為 SFTPGo 分享連結才能嵌入影片。</p>
+</blockquote>
+<p><strong>檔案路徑轉換為網址：</strong></p>
+<ul><li>API 返回的 <code>file_path</code> 範例：<code>/Users/accusys/momentry/var/sftpgo/data/demo/video.mp4</code></li>
+<li>對應的 SFTPGo 分享連結：<code>https://wp.momentry.ddns.net/demo/video.mp4</code></li>
+<li>轉換方式：移除 <code>/Users/accusys/momentry/var/sftpgo/data/</code> 前綴，將剩餘路徑附加到 <code>https://wp.momentry.ddns.net/</code></li></ul>
+<p><strong>手動建立分享連結：</strong></p>
+<ol><li>開啟 SFTPGo Web UI：<code>http://localhost:8080</code></li>
+<li>使用帳號 <code>demo</code> / 密碼 <code>demopassword123</code> 登入</li>
+<li>導航至 <code>Files</code> → 選擇影片檔案</li>
+<li>點擊 <code>Share</code> → <code>Create Link</code></li>
+<li>複製產生的分享連結</li></ol>
+<p>使用搜尋結果中的 <code>start_time</code> 和 <code>end_time</code> 來嵌入影片片段。</p>
+<hr />
+<h2>服務列表</h2>
+<table class="table">
+<thead>
+<tr>
+<th>服務</th>
+<th>網址</th>
+<th>用途</th>
+</tr>
+</thead>
+<tbody>
+<tr>
+<td>Momentry API</td>
+<td><code>http://localhost:3002</code></td>
+<td>核心 API</td>
+</tr>
+<tr>
+<td>SFTPGo</td>
+<td><code>http://localhost:8080</code></td>
+<td>檔案儲存</td>
+</tr>
+<tr>
+<td>Qdrant</td>
+<td><code>http://localhost:6333</code></td>
+<td>向量搜尋</td>
+</tr>
+<tr>
+<td>PostgreSQL</td>
+<td><code>localhost:5432</code></td>
+<td>資料庫</td>
+</tr>
+</tbody>
+</table>
+<hr />
+<h2>示範影片</h2>
+<ul>
+<li><strong>檔案：</strong> <code>Old_Time_Movie_Show_-_Charade_1963.HD.mov</code></li>
+<li><strong>UUID：</strong> <code>a1b10138a6bbb0cd</code></li>
+<li><strong>長度：</strong> 約 6879 秒（約 1.9 小時）</li>
+<li><strong>區塊數：</strong> 3886 個（句子 + 場景 + 時間）</li>
+</ul>
+</div>
+</body>
+</html>
\ No newline at end of file
diff --git a/docs_v1.0/doc_user/API_ENDPOINTS.html b/docs_v1.0/doc_user/API_ENDPOINTS.html
new file mode 100644
index 0000000..5d9c247
--- /dev/null
+++ b/docs_v1.0/doc_user/API_ENDPOINTS.html
@@ -0,0 +1,3537 @@
+<!DOCTYPE html>
+<html lang="en">
+<head>
+<meta charset="UTF-8">
+<title>API Endpoints - Momentry API Docs</title>
+<style>
+* { margin: 0; padding: 0; box-sizing: border-box; }
+body { font-family: -apple-system, BlinkMacSystemFont, 'Segoe UI', Roboto, sans-serif; background: #f5f5f5; color: #333; padding: 40px; }
+.container { max-width: 960px; margin: 0 auto; background: white; border-radius: 12px; box-shadow: 0 2px 12px rgba(0,0,0,0.08); padding: 40px; }
+h1 { font-size: 24px; margin: 24px 0 12px; }
+h2 { font-size: 20px; margin: 20px 0 10px; color: #222; }
+h3 { font-size: 16px; margin: 16px 0 8px; color: #444; }
+p { line-height: 1.6; margin: 8px 0; }
+table { border-collapse: collapse; width: 100%; margin: 12px 0; font-size: 14px; }
+th, td { border: 1px solid #ddd; padding: 8px 12px; text-align: left; }
+th { background: #f0f0f0; font-weight: 600; }
+code { background: #f0f0f0; padding: 2px 6px; border-radius: 3px; font-size: 13px; }
+pre { background: #f8f8f8; border: 1px solid #ddd; border-radius: 6px; padding: 12px; overflow-x: auto; margin: 12px 0; }
+pre code { background: none; padding: 0; }
+a { color: #0066cc; }
+.back { display: inline-block; margin-bottom: 20px; color: #666; }
+.back:hover { color: #333; }
+</style>
+</head>
+<body>
+<div class="container">
+<a class="back" href="index.html">&larr; Back to index</a>
+<hr />
+<pre><code>document_type: "api_reference"
+service: "MOMENTRY_CORE"
+title: "Momentry Core API 端點總覽"
+date: "2026-05-17"
+version: "V1.4"
+status: "active"
+owner: "M5"
+created_by: "OpenCode"</code></pre>
+<hr />
+<h1>Momentry Core API 端點總覽</h1>
+<table class="table">
+<thead>
+<tr>
+<th>項目</th>
+<th>內容</th>
+</tr>
+</thead>
+<tbody>
+<tr>
+<td>目標讀者</td>
+<td>developer</td>
+</tr>
+<tr>
+<td>預備知識</td>
+<td>需有 API Key</td>
+</tr>
+</tbody>
+</table>
+<hr />
+<h2>Base URL</h2>
+<table class="table">
+<thead>
+<tr>
+<th>Environment</th>
+<th>URL</th>
+<th>Purpose</th>
+</tr>
+</thead>
+<tbody>
+<tr>
+<td>Playground (Dev)</td>
+<td><code>http://localhost:3003</code></td>
+<td>Development and testing</td>
+</tr>
+<tr>
+<td>Production</td>
+<td><code>http://localhost:3002</code></td>
+<td>Production deployment</td>
+</tr>
+<tr>
+<td>External (M5)</td>
+<td><code>https://m5api.momentry.ddns.net</code></td>
+<td>Remote access</td>
+</tr>
+</tbody>
+</table>
+<h2>Variables</h2>
+<p>All examples in this documentation use these environment variables:</p>
+<div class="codehilite"><pre><span></span><code><span class="nv">API</span><span class="o">=</span><span class="s2">&quot;http://localhost:3003&quot;</span>
+<span class="nv">KEY</span><span class="o">=</span><span class="s2">&quot;your-api-key-here&quot;</span>
+</code></pre></div>
+
+<h2>Authentication</h2>
+<p>All endpoints under <code>/api/v1/*</code> require authentication, except the login and logout endpoints.
+The following endpoints are public (no auth needed):</p>
+<ul>
+<li><code>GET /health</code></li>
+<li><code>POST /api/v1/auth/login</code></li>
+<li><code>POST /api/v1/auth/logout</code></li>
+</ul>
+<h3>Three Authentication Modes</h3>
+<p>The system supports three authentication methods (the API key can be sent either as a header or as a query parameter), checked in <strong>priority order</strong> by the middleware:</p>
+<div class="codehilite"><pre><span></span><code>Middleware priority:
+  1. Session Cookie (Portal/browser)
+  2. JWT Bearer (API clients: n8n, CLI)
+  3. API Key Header (legacy compatibility)
+  4. API Key Query Param (?api_key=)
+</code></pre></div>
+
+<table class="table">
+<thead>
+<tr>
+<th>Mode</th>
+<th>Transport</th>
+<th>Expiry</th>
+<th>Scope</th>
+<th>Best for</th>
+</tr>
+</thead>
+<tbody>
+<tr>
+<td><strong>Session Cookie</strong></td>
+<td><code>Cookie: session_id=&lt;uuid&gt;</code></td>
+<td>24h</td>
+<td>per-browser session</td>
+<td>Portal (browser)</td>
+</tr>
+<tr>
+<td><strong>JWT</strong></td>
+<td><code>Authorization: Bearer &lt;token&gt;</code></td>
+<td>1h</td>
+<td>per-login token</td>
+<td>API clients (n8n, CLI, scripts)</td>
+</tr>
+<tr>
+<td><strong>API Key</strong></td>
+<td><code>X-API-Key: &lt;key&gt;</code></td>
+<td>90d</td>
+<td>fixed key for automation</td>
+<td>Legacy scripts, WordPress</td>
+</tr>
+</tbody>
+</table>
+<hr />
+<h3>Login</h3>
+<p><strong>Default accounts &amp; API keys:</strong></p>
+<table class="table">
+<thead>
+<tr>
+<th>Username</th>
+<th>Password</th>
+<th>API Key</th>
+<th>Role</th>
+</tr>
+</thead>
+<tbody>
+<tr>
+<td><code>admin</code></td>
+<td><code>admin</code></td>
+<td>—</td>
+<td>admin</td>
+</tr>
+<tr>
+<td><code>demo</code></td>
+<td><code>demo</code></td>
+<td><code>muser_demo_key_32chars_abcdef1234567890</code></td>
+<td>user</td>
+</tr>
+</tbody>
+</table>
+<p>The demo API key is set via <code>MOMENTRY_DEMO_API_KEY</code> env var and can be used in place of JWT for marcom integrations:</p>
+<div class="codehilite"><pre><span></span><code><span class="c1"># Using API key instead of JWT</span>
+curl<span class="w"> </span>-s<span class="w"> </span><span class="s2">&quot;</span><span class="nv">$API</span><span class="s2">/api/v1/files/scan&quot;</span><span class="w"> </span>-H<span class="w"> </span><span class="s2">&quot;X-API-Key: muser_demo_key_32chars_abcdef1234567890&quot;</span>
+</code></pre></div>
+
+<div class="codehilite"><pre><span></span><code><span class="c1"># Login as admin</span>
+curl<span class="w"> </span>-s<span class="w"> </span>-X<span class="w"> </span>POST<span class="w"> </span><span class="s2">&quot;</span><span class="nv">$API</span><span class="s2">/api/v1/auth/login&quot;</span><span class="w"> </span><span class="se">\</span>
+<span class="w">  </span>-H<span class="w"> </span><span class="s2">&quot;Content-Type: application/json&quot;</span><span class="w"> </span><span class="se">\</span>
+<span class="w">  </span>-d<span class="w"> </span><span class="s1">&#39;{&quot;username&quot;: &quot;admin&quot;, &quot;password&quot;: &quot;admin&quot;}&#39;</span>
+
+<span class="c1"># Login as demo user</span>
+curl<span class="w"> </span>-s<span class="w"> </span>-X<span class="w"> </span>POST<span class="w"> </span><span class="s2">&quot;</span><span class="nv">$API</span><span class="s2">/api/v1/auth/login&quot;</span><span class="w"> </span><span class="se">\</span>
+<span class="w">  </span>-H<span class="w"> </span><span class="s2">&quot;Content-Type: application/json&quot;</span><span class="w"> </span><span class="se">\</span>
+<span class="w">  </span>-d<span class="w"> </span><span class="s1">&#39;{&quot;username&quot;: &quot;demo&quot;, &quot;password&quot;: &quot;demo&quot;}&#39;</span>
+</code></pre></div>
+
+<h4>Success Response</h4>
+<div class="codehilite"><pre><span></span><code><span class="p">{</span>
+<span class="w">  </span><span class="nt">&quot;success&quot;</span><span class="p">:</span><span class="w"> </span><span class="kc">true</span><span class="p">,</span>
+<span class="w">  </span><span class="nt">&quot;jwt&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;eyJhbGciOiJIUzI1NiIs...&quot;</span><span class="p">,</span>
+<span class="w">  </span><span class="nt">&quot;api_key&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;muser_...&quot;</span><span class="p">,</span>
+<span class="w">  </span><span class="nt">&quot;user&quot;</span><span class="p">:</span><span class="w"> </span><span class="p">{</span>
+<span class="w">    </span><span class="nt">&quot;username&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;admin&quot;</span><span class="p">,</span>
+<span class="w">    </span><span class="nt">&quot;role&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;admin&quot;</span>
+<span class="w">  </span><span class="p">},</span>
+<span class="w">  </span><span class="nt">&quot;expires_at&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;2026-05-18T13:00:00Z&quot;</span>
+<span class="p">}</span>
+</code></pre></div>
+
+<table class="table">
+<thead>
+<tr>
+<th>Field</th>
+<th>Type</th>
+<th>Description</th>
+</tr>
+</thead>
+<tbody>
+<tr>
+<td><code>jwt</code></td>
+<td>string</td>
+<td>JWT access token. Use as <code>Authorization: Bearer &lt;jwt&gt;</code>. Expires in 1 hour.</td>
+</tr>
+<tr>
+<td><code>api_key</code></td>
+<td>string</td>
+<td>Legacy API key. Use as <code>X-API-Key: &lt;key&gt;</code>. Good for 90 days.</td>
+</tr>
+<tr>
+<td><code>user.username</code></td>
+<td>string</td>
+<td>Username</td>
+</tr>
+<tr>
+<td><code>user.role</code></td>
+<td>string</td>
+<td>Role: <code>admin</code>, <code>user</code>, or <code>readonly</code></td>
+</tr>
+<tr>
+<td><code>expires_at</code></td>
+<td>string</td>
+<td>ISO8601 timestamp of JWT expiration</td>
+</tr>
+</tbody>
+</table>
+<p>The login endpoint also sets a <code>Set-Cookie</code> header for browser-based clients:</p>
+<div class="codehilite"><pre><span></span><code><span class="nt">Set-Cookie</span><span class="o">:</span><span class="w"> </span><span class="nt">session_id</span><span class="o">=&lt;</span><span class="nt">uuid</span><span class="o">&gt;;</span><span class="w"> </span><span class="nt">Path</span><span class="o">=/</span><span class="nt">api</span><span class="o">;</span><span class="w"> </span><span class="nt">HttpOnly</span><span class="o">;</span><span class="w"> </span><span class="nt">SameSite</span><span class="o">=</span><span class="nt">Strict</span><span class="o">;</span><span class="w"> </span><span class="nt">Max-Age</span><span class="o">=</span><span class="nt">86400</span>
+</code></pre></div>
+
+<h4>Error Response (401)</h4>
+<div class="codehilite"><pre><span></span><code><span class="p">{</span>
+<span class="w">  </span><span class="nt">&quot;success&quot;</span><span class="p">:</span><span class="w"> </span><span class="kc">false</span><span class="p">,</span>
+<span class="w">  </span><span class="nt">&quot;message&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;Invalid username or password&quot;</span>
+<span class="p">}</span>
+</code></pre></div>
+
+<hr />
+<h3>Using JWT</h3>
+<p>JWT is preferred for API clients (n8n, CLI scripts, WordPress). It is validated by the middleware without a database lookup (stateless).</p>
+<div class="codehilite"><pre><span></span><code><span class="c1"># Login and capture JWT</span>
+<span class="nv">JWT</span><span class="o">=</span><span class="k">$(</span>curl<span class="w"> </span>-s<span class="w"> </span>-X<span class="w"> </span>POST<span class="w"> </span><span class="s2">&quot;</span><span class="nv">$API</span><span class="s2">/api/v1/auth/login&quot;</span><span class="w"> </span><span class="se">\</span>
+<span class="w">  </span>-H<span class="w"> </span><span class="s2">&quot;Content-Type: application/json&quot;</span><span class="w"> </span><span class="se">\</span>
+<span class="w">  </span>-d<span class="w"> </span><span class="s1">&#39;{&quot;username&quot;:&quot;admin&quot;,&quot;password&quot;:&quot;admin&quot;}&#39;</span><span class="w"> </span><span class="p">|</span><span class="w"> </span>python3<span class="w"> </span>-c<span class="w"> </span><span class="s2">&quot;import json,sys;print(json.load(sys.stdin)[&#39;jwt&#39;])&quot;</span><span class="k">)</span>
+
+<span class="c1"># Use JWT for all subsequent requests</span>
+curl<span class="w"> </span>-H<span class="w"> </span><span class="s2">&quot;Authorization: Bearer </span><span class="nv">$JWT</span><span class="s2">&quot;</span><span class="w"> </span><span class="s2">&quot;</span><span class="nv">$API</span><span class="s2">/api/v1/files/scan&quot;</span>
+curl<span class="w"> </span>-H<span class="w"> </span><span class="s2">&quot;Authorization: Bearer </span><span class="nv">$JWT</span><span class="s2">&quot;</span><span class="w"> </span><span class="s2">&quot;</span><span class="nv">$API</span><span class="s2">/api/v1/resource/tmdb&quot;</span>
+</code></pre></div>
+
+<p>JWT is short-lived (1 hour). When it expires, request a new one via login.</p>
+<hr />
+<h3>Using Session Cookie (Browser)</h3>
+<p>Browser-based clients (Portal) get a session cookie automatically after login. The browser sends the cookie with every request—no manual header needed.</p>
+<div class="codehilite"><pre><span></span><code><span class="c1"># Login captures the session cookie from Set-Cookie header</span>
+curl<span class="w"> </span>-v<span class="w"> </span>-X<span class="w"> </span>POST<span class="w"> </span><span class="s2">&quot;</span><span class="nv">$API</span><span class="s2">/api/v1/auth/login&quot;</span><span class="w"> </span><span class="se">\</span>
+<span class="w">  </span>-H<span class="w"> </span><span class="s2">&quot;Content-Type: application/json&quot;</span><span class="w"> </span><span class="se">\</span>
+<span class="w">  </span>-d<span class="w"> </span><span class="s1">&#39;{&quot;username&quot;:&quot;admin&quot;,&quot;password&quot;:&quot;admin&quot;}&#39;</span><span class="w"> </span><span class="m">2</span>&gt;<span class="p">&amp;</span><span class="m">1</span><span class="w"> </span><span class="p">|</span><span class="w"> </span>grep<span class="w"> </span>-i<span class="w"> </span><span class="s2">&quot;Set-Cookie&quot;</span>
+
+<span class="c1"># Browser automatically sends: Cookie: session_id=&lt;uuid&gt;</span>
+<span class="c1"># No manual header needed for subsequent requests</span>
+</code></pre></div>
+
+<p>The session cookie is HttpOnly (not accessible from JavaScript) and SameSite=Strict (protected against CSRF).</p>
+<hr />
+<h3>Using Legacy API Key</h3>
+<div class="codehilite"><pre><span></span><code>curl<span class="w"> </span>-H<span class="w"> </span><span class="s2">&quot;X-API-Key: </span><span class="nv">$KEY</span><span class="s2">&quot;</span><span class="w"> </span><span class="s2">&quot;</span><span class="nv">$API</span><span class="s2">/api/v1/files/scan&quot;</span>
+
+<span class="c1"># Also accepted via Bearer header (non-JWT format) or query parameter:</span>
+curl<span class="w"> </span>-H<span class="w"> </span><span class="s2">&quot;Authorization: Bearer </span><span class="nv">$KEY</span><span class="s2">&quot;</span><span class="w"> </span><span class="s2">&quot;</span><span class="nv">$API</span><span class="s2">/api/v1/files/scan&quot;</span>
+curl<span class="w"> </span><span class="s2">&quot;</span><span class="nv">$API</span><span class="s2">/api/v1/files/scan?api_key=</span><span class="nv">$KEY</span><span class="s2">&quot;</span>
+</code></pre></div>
+
+<p>API keys are validated via SHA256 hash lookup in the database. They are long-lived (90 days) and intended for automation.</p>
+<h3>Obtaining an API Key (CLI)</h3>
+<div class="codehilite"><pre><span></span><code>momentry<span class="w"> </span>api-key<span class="w"> </span>create<span class="w"> </span><span class="s2">&quot;My API Key&quot;</span><span class="w"> </span>--key-type<span class="w"> </span>user
+</code></pre></div>
+
+<hr />
+<h3>Logout</h3>
+<div class="codehilite"><pre><span></span><code><span class="c1"># Logout using the session cookie (browser)</span>
+curl<span class="w"> </span>-X<span class="w"> </span>POST<span class="w"> </span><span class="s2">&quot;</span><span class="nv">$API</span><span class="s2">/api/v1/auth/logout&quot;</span><span class="w"> </span><span class="se">\</span>
+<span class="w">  </span>-H<span class="w"> </span><span class="s2">&quot;Cookie: session_id=&lt;uuid&gt;&quot;</span>
+</code></pre></div>
+
+<h4>What logout does</h4>
+<table class="table">
+<thead>
+<tr>
+<th>Auth mode</th>
+<th>Effect</th>
+</tr>
+</thead>
+<tbody>
+<tr>
+<td><strong>Session Cookie</strong></td>
+<td>Session deleted from database. Same cookie returns 401 on subsequent requests.</td>
+</tr>
+<tr>
+<td><strong>JWT</strong></td>
+<td>JWT remains valid until expiry. (JWT is stateless — logout adds JWT to a blacklist only if API key mode is used.)</td>
+</tr>
+<tr>
+<td><strong>API Key</strong></td>
+<td>API key remains valid. (Legacy keys are shared across sessions — revoking would break other clients.)</td>
+</tr>
+</tbody>
+</table>
+<h4>Example: full session lifecycle</h4>
+<div class="codehilite"><pre><span></span><code><span class="c1"># 1. Login</span>
+<span class="nv">SESSION_ID</span><span class="o">=</span><span class="k">$(</span>curl<span class="w"> </span>-s<span class="w"> </span>-D<span class="w"> </span>-<span class="w"> </span>-X<span class="w"> </span>POST<span class="w"> </span><span class="s2">&quot;</span><span class="nv">$API</span><span class="s2">/api/v1/auth/login&quot;</span><span class="w"> </span><span class="se">\</span>
+<span class="w">  </span>-H<span class="w"> </span><span class="s2">&quot;Content-Type: application/json&quot;</span><span class="w"> </span><span class="se">\</span>
+<span class="w">  </span>-d<span class="w"> </span><span class="s1">&#39;{&quot;username&quot;:&quot;admin&quot;,&quot;password&quot;:&quot;admin&quot;}&#39;</span><span class="w"> </span><span class="p">|</span><span class="w"> </span>grep<span class="w"> </span>-i<span class="w"> </span><span class="s2">&quot;Set-Cookie&quot;</span><span class="w"> </span><span class="p">|</span><span class="w"> </span>sed<span class="w"> </span><span class="s1">&#39;s/.*session_id=\([^;]*\).*/\1/&#39;</span><span class="k">)</span>
+
+<span class="c1"># 2. Use session (works)</span>
+curl<span class="w"> </span>-s<span class="w"> </span>-o<span class="w"> </span>/dev/null<span class="w"> </span>-w<span class="w"> </span><span class="s2">&quot;HTTP %{http_code}\n&quot;</span><span class="w"> </span><span class="s2">&quot;</span><span class="nv">$API</span><span class="s2">/api/v1/resource/tmdb&quot;</span><span class="w"> </span><span class="se">\</span>
+<span class="w">  </span>-H<span class="w"> </span><span class="s2">&quot;Cookie: session_id=</span><span class="nv">$SESSION_ID</span><span class="s2">&quot;</span>
+<span class="c1"># → HTTP 200</span>
+
+<span class="c1"># 3. Logout</span>
+curl<span class="w"> </span>-s<span class="w"> </span>-X<span class="w"> </span>POST<span class="w"> </span><span class="s2">&quot;</span><span class="nv">$API</span><span class="s2">/api/v1/auth/logout&quot;</span><span class="w"> </span><span class="se">\</span>
+<span class="w">  </span>-H<span class="w"> </span><span class="s2">&quot;Cookie: session_id=</span><span class="nv">$SESSION_ID</span><span class="s2">&quot;</span>
+<span class="c1"># → {&quot;success&quot;: true}</span>
+
+<span class="c1"># 4. Use session again (rejected)</span>
+curl<span class="w"> </span>-s<span class="w"> </span>-o<span class="w"> </span>/dev/null<span class="w"> </span>-w<span class="w"> </span><span class="s2">&quot;HTTP %{http_code}\n&quot;</span><span class="w"> </span><span class="s2">&quot;</span><span class="nv">$API</span><span class="s2">/api/v1/resource/tmdb&quot;</span><span class="w"> </span><span class="se">\</span>
+<span class="w">  </span>-H<span class="w"> </span><span class="s2">&quot;Cookie: session_id=</span><span class="nv">$SESSION_ID</span><span class="s2">&quot;</span>
+<span class="c1"># → HTTP 401</span>
+</code></pre></div>
+
+<hr />
+<h3>Authentication Flow Summary</h3>
+<div class="codehilite"><pre><span></span><code>Login Request
+     │
+     ▼
+┌──────────────────┐
+│  1. Check users  │ ← users table (argon2 password verify)
+│     table        │
+└──────┬───────────┘
+       │
+   ┌───┴───┐
+   │ match │
+   └───┬───┘
+       │
+       ▼
+┌──────────────────┐
+│  2. Create JWT   │ ← 1h expiry, signed with JWT_SECRET
+├──────────────────┤
+│  3. Create       │ ← 24h expiry, stored in sessions table
+│     session      │
+├──────────────────┤
+│  4. Set-Cookie   │ ← HttpOnly, SameSite=Strict, Path=/api
+├──────────────────┤
+│  5. Return       │ ← JWT + api_key + user info to client
+└──────────────────┘
+</code></pre></div>
+
+<div class="codehilite"><pre><span></span><code>Protected Request
+     │
+     ▼
+┌──────────────────────┐
+│  Middleware checks:  │
+│                      │
+│  1. Cookie session?  │ → DB lookup session → get api_key → verify
+│                      │
+│  2. JWT Bearer?      │ → verify JWT signature → decode claims
+│                      │
+│  3. X-API-Key?       │ → SHA256 hash → DB lookup → verify
+│                      │
+│  4. ?api_key=?       │ → same as #3
+│                      │
+│  5. None → 401       │
+└──────────────────────┘
+</code></pre></div>
+
+<hr />
+<h3>Error Responses</h3>
+<table class="table">
+<thead>
+<tr>
+<th>HTTP</th>
+<th>When</th>
+</tr>
+</thead>
+<tbody>
+<tr>
+<td><code>401</code></td>
+<td>Missing or invalid authentication</td>
+</tr>
+<tr>
+<td><code>401</code></td>
+<td>Session expired or logged out</td>
+</tr>
+<tr>
+<td><code>401</code></td>
+<td>JWT expired</td>
+</tr>
+<tr>
+<td><code>401</code></td>
+<td>API key revoked or inactive</td>
+</tr>
+</tbody>
+</table>
+<hr />
+<h3>Related</h3>
+<ul>
+<li><code>POST /api/v1/resource/tmdb/check</code> — test authentication + TMDb API connectivity</li>
+<li><code>GET /health/detailed</code> — view auth status (integrations section)</li>
+</ul>
+<hr />
+<h2>Health Check</h2>
+<h3><code>GET /health</code></h3>
+<p><strong>Auth</strong>: Public<br />
+<strong>Scope</strong>: system-level</p>
+<p>Returns basic server health status — used by load balancers and monitoring.</p>
+<h4>Example</h4>
+<div class="codehilite"><pre><span></span><code>curl<span class="w"> </span><span class="s2">&quot;</span><span class="nv">$API</span><span class="s2">/health&quot;</span><span class="w"> </span><span class="p">|</span><span class="w"> </span>jq<span class="w"> </span><span class="s1">&#39;{status, version}&#39;</span>
+</code></pre></div>
+
+<h4>Response (200)</h4>
+<div class="codehilite"><pre><span></span><code><span class="p">{</span>
+<span class="w">  </span><span class="nt">&quot;status&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;ok&quot;</span><span class="p">,</span>
+<span class="w">  </span><span class="nt">&quot;version&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;1.0.0&quot;</span><span class="p">,</span>
+<span class="w">  </span><span class="nt">&quot;build_git_hash&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;3a6c1865&quot;</span><span class="p">,</span>
+<span class="w">  </span><span class="nt">&quot;build_timestamp&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;2026-05-16T13:38:15Z&quot;</span><span class="p">,</span>
+<span class="w">  </span><span class="nt">&quot;uptime_ms&quot;</span><span class="p">:</span><span class="w"> </span><span class="mi">3015</span>
+<span class="p">}</span>
+</code></pre></div>
+
+<table class="table">
+<thead>
+<tr>
+<th>Field</th>
+<th>Type</th>
+<th>Description</th>
+</tr>
+</thead>
+<tbody>
+<tr>
+<td><code>status</code></td>
+<td>string</td>
+<td><code>ok</code> or <code>degraded</code></td>
+</tr>
+<tr>
+<td><code>version</code></td>
+<td>string</td>
+<td>Semver version</td>
+</tr>
+<tr>
+<td><code>build_git_hash</code></td>
+<td>string</td>
+<td>Git commit hash</td>
+</tr>
+<tr>
+<td><code>build_timestamp</code></td>
+<td>string</td>
+<td>Binary build time</td>
+</tr>
+<tr>
+<td><code>uptime_ms</code></td>
+<td>integer</td>
+<td>Milliseconds since server start</td>
+</tr>
+</tbody>
+</table>
+<hr />
+<h3><code>GET /health/detailed</code></h3>
+<p><strong>Auth</strong>: Required<br />
+<strong>Scope</strong>: system-level</p>
+<p>Returns full system health including each service status, resource utilization, pipeline readiness, schema migration status, identity file sync status, and external integrations.</p>
+<blockquote>
+<p>Requires authentication (JWT, session cookie, or API key). The basic <code>/health</code> endpoint remains public for load balancer checks.</p>
+</blockquote>
+<h4>Example</h4>
+<div class="codehilite"><pre><span></span><code>curl<span class="w"> </span>-H<span class="w"> </span><span class="s2">&quot;Authorization: Bearer </span><span class="nv">$JWT</span><span class="s2">&quot;</span><span class="w"> </span><span class="s2">&quot;</span><span class="nv">$API</span><span class="s2">/health/detailed&quot;</span><span class="w"> </span><span class="p">|</span><span class="w"> </span>jq<span class="w"> </span><span class="s1">&#39;{status, services, resources: {cpu: .resources.cpu_used_percent, memory: .resources.memory_used_percent}}&#39;</span>
+</code></pre></div>
+
+<h4>Response (200)</h4>
+<div class="codehilite"><pre><span></span><code><span class="p">{</span>
+<span class="w">  </span><span class="nt">&quot;status&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;ok&quot;</span><span class="p">,</span>
+<span class="w">  </span><span class="nt">&quot;version&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;1.0.0&quot;</span><span class="p">,</span>
+<span class="w">  </span><span class="nt">&quot;services&quot;</span><span class="p">:</span><span class="w"> </span><span class="p">{</span>
+<span class="w">    </span><span class="nt">&quot;postgres&quot;</span><span class="p">:</span><span class="w"> </span><span class="p">{</span><span class="nt">&quot;status&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;ok&quot;</span><span class="p">,</span><span class="w"> </span><span class="nt">&quot;latency_ms&quot;</span><span class="p">:</span><span class="w"> </span><span class="mi">3</span><span class="p">},</span>
+<span class="w">    </span><span class="nt">&quot;redis&quot;</span><span class="p">:</span><span class="w"> </span><span class="p">{</span><span class="nt">&quot;status&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;ok&quot;</span><span class="p">,</span><span class="w"> </span><span class="nt">&quot;latency_ms&quot;</span><span class="p">:</span><span class="w"> </span><span class="mi">1</span><span class="p">},</span>
+<span class="w">    </span><span class="nt">&quot;qdrant&quot;</span><span class="p">:</span><span class="w"> </span><span class="p">{</span><span class="nt">&quot;status&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;ok&quot;</span><span class="p">,</span><span class="w"> </span><span class="nt">&quot;latency_ms&quot;</span><span class="p">:</span><span class="w"> </span><span class="mi">5</span><span class="p">}</span>
+<span class="w">  </span><span class="p">},</span>
+<span class="w">  </span><span class="nt">&quot;resources&quot;</span><span class="p">:</span><span class="w"> </span><span class="p">{</span>
+<span class="w">    </span><span class="nt">&quot;cpu_used_percent&quot;</span><span class="p">:</span><span class="w"> </span><span class="mf">12.5</span><span class="p">,</span>
+<span class="w">    </span><span class="nt">&quot;memory_available_mb&quot;</span><span class="p">:</span><span class="w"> </span><span class="mi">32768</span><span class="p">,</span>
+<span class="w">    </span><span class="nt">&quot;memory_used_percent&quot;</span><span class="p">:</span><span class="w"> </span><span class="mf">31.7</span>
+<span class="w">  </span><span class="p">},</span>
+<span class="w">  </span><span class="nt">&quot;pipeline&quot;</span><span class="p">:</span><span class="w"> </span><span class="p">{</span>
+<span class="w">    </span><span class="nt">&quot;scripts_ready&quot;</span><span class="p">:</span><span class="w"> </span><span class="kc">true</span><span class="p">,</span>
+<span class="w">    </span><span class="nt">&quot;scripts_count&quot;</span><span class="p">:</span><span class="w"> </span><span class="mi">345</span><span class="p">,</span>
+<span class="w">    </span><span class="nt">&quot;processors&quot;</span><span class="p">:</span><span class="w"> </span><span class="p">{</span>
+<span class="w">      </span><span class="nt">&quot;asr&quot;</span><span class="p">:</span><span class="w"> </span><span class="kc">true</span><span class="p">,</span>
+<span class="w">      </span><span class="nt">&quot;yolo&quot;</span><span class="p">:</span><span class="w"> </span><span class="kc">true</span><span class="p">,</span>
+<span class="w">      </span><span class="nt">&quot;face&quot;</span><span class="p">:</span><span class="w"> </span><span class="kc">true</span><span class="p">,</span>
+<span class="w">      </span><span class="nt">&quot;pose&quot;</span><span class="p">:</span><span class="w"> </span><span class="kc">true</span><span class="p">,</span>
+<span class="w">      </span><span class="nt">&quot;ocr&quot;</span><span class="p">:</span><span class="w"> </span><span class="kc">true</span><span class="p">,</span>
+<span class="w">      </span><span class="nt">&quot;cut&quot;</span><span class="p">:</span><span class="w"> </span><span class="kc">true</span><span class="p">,</span>
+<span class="w">      </span><span class="nt">&quot;scene&quot;</span><span class="p">:</span><span class="w"> </span><span class="kc">true</span><span class="p">,</span>
+<span class="w">      </span><span class="nt">&quot;asrx&quot;</span><span class="p">:</span><span class="w"> </span><span class="kc">true</span><span class="p">,</span>
+<span class="w">      </span><span class="nt">&quot;visual_chunk&quot;</span><span class="p">:</span><span class="w"> </span><span class="kc">true</span>
+<span class="w">    </span><span class="p">},</span>
+<span class="w">    </span><span class="nt">&quot;models_ready&quot;</span><span class="p">:</span><span class="w"> </span><span class="kc">true</span><span class="p">,</span>
+<span class="w">    </span><span class="nt">&quot;models_count&quot;</span><span class="p">:</span><span class="w"> </span><span class="mi">42</span><span class="p">,</span>
+<span class="w">    </span><span class="nt">&quot;scripts_integrity&quot;</span><span class="p">:</span><span class="w"> </span><span class="p">{</span><span class="nt">&quot;matched&quot;</span><span class="p">:</span><span class="w"> </span><span class="mi">332</span><span class="p">,</span><span class="w"> </span><span class="nt">&quot;total&quot;</span><span class="p">:</span><span class="w"> </span><span class="mi">345</span><span class="p">,</span><span class="w"> </span><span class="nt">&quot;ok&quot;</span><span class="p">:</span><span class="w"> </span><span class="kc">false</span><span class="p">},</span>
+<span class="w">    </span><span class="nt">&quot;ffmpeg&quot;</span><span class="p">:</span><span class="w"> </span><span class="kc">true</span>
+<span class="w">  </span><span class="p">},</span>
+<span class="w">  </span><span class="nt">&quot;schema&quot;</span><span class="p">:</span><span class="w"> </span><span class="p">{</span>
+<span class="w">    </span><span class="nt">&quot;table_exists&quot;</span><span class="p">:</span><span class="w"> </span><span class="kc">true</span><span class="p">,</span>
+<span class="w">    </span><span class="nt">&quot;applied&quot;</span><span class="p">:</span><span class="w"> </span><span class="p">[{</span><span class="nt">&quot;filename&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;migrate_add_users_table.sql&quot;</span><span class="p">}],</span>
+<span class="w">    </span><span class="nt">&quot;required&quot;</span><span class="p">:</span><span class="w"> </span><span class="p">[],</span>
+<span class="w">    </span><span class="nt">&quot;ok&quot;</span><span class="p">:</span><span class="w"> </span><span class="kc">true</span>
+<span class="w">  </span><span class="p">},</span>
+<span class="w">  </span><span class="nt">&quot;identities&quot;</span><span class="p">:</span><span class="w"> </span><span class="p">{</span>
+<span class="w">    </span><span class="nt">&quot;directory_exists&quot;</span><span class="p">:</span><span class="w"> </span><span class="kc">true</span><span class="p">,</span>
+<span class="w">    </span><span class="nt">&quot;files_count&quot;</span><span class="p">:</span><span class="w"> </span><span class="mi">3481</span><span class="p">,</span>
+<span class="w">    </span><span class="nt">&quot;index_ok&quot;</span><span class="p">:</span><span class="w"> </span><span class="kc">true</span><span class="p">,</span>
+<span class="w">    </span><span class="nt">&quot;db_count&quot;</span><span class="p">:</span><span class="w"> </span><span class="mi">3481</span><span class="p">,</span>
+<span class="w">    </span><span class="nt">&quot;synced&quot;</span><span class="p">:</span><span class="w"> </span><span class="kc">true</span>
+<span class="w">  </span><span class="p">},</span>
+<span class="w">  </span><span class="nt">&quot;integrations&quot;</span><span class="p">:</span><span class="w"> </span><span class="p">{</span>
+<span class="w">    </span><span class="nt">&quot;tmdb&quot;</span><span class="p">:</span><span class="w"> </span><span class="p">{</span>
+<span class="w">      </span><span class="nt">&quot;api_key_configured&quot;</span><span class="p">:</span><span class="w"> </span><span class="kc">false</span><span class="p">,</span>
+<span class="w">      </span><span class="nt">&quot;enabled&quot;</span><span class="p">:</span><span class="w"> </span><span class="kc">false</span><span class="p">,</span>
+<span class="w">      </span><span class="nt">&quot;api_reachable&quot;</span><span class="p">:</span><span class="w"> </span><span class="kc">null</span>
+<span class="w">    </span><span class="p">}</span>
+<span class="w">  </span><span class="p">}</span>
+<span class="p">}</span>
+</code></pre></div>
+
+<h4>Response Fields</h4>
+<table class="table">
+<thead>
+<tr>
+<th>Field</th>
+<th>Type</th>
+<th>Description</th>
+</tr>
+</thead>
+<tbody>
+<tr>
+<td><code>status</code></td>
+<td>string</td>
+<td><code>ok</code> if all essential services healthy</td>
+</tr>
+<tr>
+<td><code>services</code></td>
+<td>object</td>
+<td>Per-service status (postgres, redis, qdrant)</td>
+</tr>
+<tr>
+<td><code>services.*.status</code></td>
+<td>string</td>
+<td><code>ok</code>, <code>error</code>, or <code>degraded</code></td>
+</tr>
+<tr>
+<td><code>services.*.latency_ms</code></td>
+<td>int</td>
+<td>Response time in milliseconds</td>
+</tr>
+<tr>
+<td><code>resources</code></td>
+<td>object</td>
+<td>CPU, memory usage</td>
+</tr>
+<tr>
+<td><code>pipeline.scripts_ready</code></td>
+<td>boolean</td>
+<td>Scripts directory accessible</td>
+</tr>
+<tr>
+<td><code>pipeline.scripts_count</code></td>
+<td>int</td>
+<td>Number of Python processor scripts</td>
+</tr>
+<tr>
+<td><code>pipeline.processors</code></td>
+<td>object</td>
+<td>Per-processor availability</td>
+</tr>
+<tr>
+<td><code>pipeline.models_ready</code></td>
+<td>boolean</td>
+<td>Models directory accessible</td>
+</tr>
+<tr>
+<td><code>pipeline.scripts_integrity</code></td>
+<td>object</td>
+<td>SHA256 checksum verification results</td>
+</tr>
+<tr>
+<td><code>schema.ok</code></td>
+<td>boolean</td>
+<td>All required migrations applied</td>
+</tr>
+<tr>
+<td><code>identities.synced</code></td>
+<td>boolean</td>
+<td>Identity file count matches DB count</td>
+</tr>
+<tr>
+<td><code>integrations.tmdb</code></td>
+<td>object</td>
+<td>TMDB API key config and reachability</td>
+</tr>
+</tbody>
+</table>
+<h4>Health status rules</h4>
+<table class="table">
+<thead>
+<tr>
+<th>Condition</th>
+<th>status</th>
+</tr>
+</thead>
+<tbody>
+<tr>
+<td>All services ok</td>
+<td><code>ok</code></td>
+</tr>
+<tr>
+<td>Any service error</td>
+<td><code>degraded</code></td>
+</tr>
+<tr>
+<td>Postgres or Redis error</td>
+<td><code>degraded</code> (server still responds)</td>
+</tr>
+</tbody>
+</table>
+<hr />
+<h3>Stats Endpoints</h3>
+<table class="table">
+<thead>
+<tr>
+<th>Method</th>
+<th>Endpoint</th>
+<th>Auth</th>
+<th>Description</th>
+</tr>
+</thead>
+<tbody>
+<tr>
+<td>GET</td>
+<td><code>/api/v1/stats/ingest</code></td>
+<td>No</td>
+<td>Ingest pipeline statistics</td>
+</tr>
+<tr>
+<td>GET</td>
+<td><code>/api/v1/stats/sftpgo</code></td>
+<td>No</td>
+<td>SFTPGo service status</td>
+</tr>
+<tr>
+<td>GET</td>
+<td><code>/api/v1/stats/inference</code></td>
+<td>No</td>
+<td>Inference service (LLM) health</td>
+</tr>
+</tbody>
+</table>
+<div class="codehilite"><pre><span></span><code>curl<span class="w"> </span><span class="s2">&quot;</span><span class="nv">$API</span><span class="s2">/api/v1/stats/ingest&quot;</span>
+</code></pre></div>
+
+<hr />
+<h2>File Registration</h2>
+<h3><code>POST /api/v1/files/register</code></h3>
+<p><strong>Auth</strong>: Required<br />
+<strong>Scope</strong>: file-level</p>
+<p>Register a video file for processing. Returns the file's metadata and UUID.</p>
+<p><strong>New in v0.1.2</strong>: Registration now <strong>automatically triggers the processing pipeline</strong> — no need to call <code>POST /api/v1/file/:uuid/process</code> separately. The system will:</p>
+<ol><li>Register the file and run ffprobe</li>
+<li>Auto-run offline TMDb probe (reads local identity files, no API calls)</li>
+<li>Create a monitor job for the worker</li>
+<li>Worker starts all 10 processors (Cut → ASR → ASRX → YOLO → OCR → Face → Pose → VisualChunk → Story → 5W1H)</li></ol>
+<p>If the file already exists (same content hash), returns the existing record with <code>already_exists: true</code>.</p>
+<h4>Request Parameters</h4>
+<table class="table">
+<thead>
+<tr>
+<th>Field</th>
+<th>Type</th>
+<th>Required</th>
+<th>Default</th>
+<th>Description</th>
+</tr>
+</thead>
+<tbody>
+<tr>
+<td><code>file_path</code></td>
+<td>string</td>
+<td>Yes</td>
+<td>—</td>
+<td>Path to video file on disk</td>
+</tr>
+<tr>
+<td><code>pattern</code></td>
+<td>string</td>
+<td>No</td>
+<td>—</td>
+<td>Regex pattern for batch register (requires <code>file_path</code> to be a directory)</td>
+</tr>
+<tr>
+<td><code>user_id</code></td>
+<td>integer</td>
+<td>No</td>
+<td>—</td>
+<td>User ID to associate with registration</td>
+</tr>
+<tr>
+<td><code>content_hash</code></td>
+<td>string</td>
+<td>No</td>
+<td>—</td>
+<td>Pre-computed SHA-256 hash (skips computation)</td>
+</tr>
+</tbody>
+</table>
+<h4>Example</h4>
+<div class="codehilite"><pre><span></span><code><span class="c1"># Register a single file</span>
+curl<span class="w"> </span>-s<span class="w"> </span>-X<span class="w"> </span>POST<span class="w"> </span><span class="s2">&quot;</span><span class="nv">$API</span><span class="s2">/api/v1/files/register&quot;</span><span class="w"> </span><span class="se">\</span>
+<span class="w">  </span>-H<span class="w"> </span><span class="s2">&quot;Content-Type: application/json&quot;</span><span class="w"> </span><span class="se">\</span>
+<span class="w">  </span>-H<span class="w"> </span><span class="s2">&quot;X-API-Key: </span><span class="nv">$KEY</span><span class="s2">&quot;</span><span class="w"> </span><span class="se">\</span>
+<span class="w">  </span>-d<span class="w"> </span><span class="s1">&#39;{&quot;file_path&quot;: &quot;/path/to/video.mp4&quot;}&#39;</span>
+
+<span class="c1"># Batch register files matching a pattern in a directory</span>
+curl<span class="w"> </span>-s<span class="w"> </span>-X<span class="w"> </span>POST<span class="w"> </span><span class="s2">&quot;</span><span class="nv">$API</span><span class="s2">/api/v1/files/register&quot;</span><span class="w"> </span><span class="se">\</span>
+<span class="w">  </span>-H<span class="w"> </span><span class="s2">&quot;Content-Type: application/json&quot;</span><span class="w"> </span><span class="se">\</span>
+<span class="w">  </span>-H<span class="w"> </span><span class="s2">&quot;X-API-Key: </span><span class="nv">$KEY</span><span class="s2">&quot;</span><span class="w"> </span><span class="se">\</span>
+<span class="w">  </span>-d<span class="w"> </span><span class="s1">&#39;{&quot;file_path&quot;: &quot;/path/to/dir&quot;, &quot;pattern&quot;: &quot;.*\\.mp4$&quot;}&#39;</span>
+</code></pre></div>
+
+<h4>Response (200)</h4>
+<div class="codehilite"><pre><span></span><code><span class="p">{</span>
+<span class="w">  </span><span class="nt">&quot;success&quot;</span><span class="p">:</span><span class="w"> </span><span class="kc">true</span><span class="p">,</span>
+<span class="w">  </span><span class="nt">&quot;file_uuid&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;3a6c1865...&quot;</span><span class="p">,</span>
+<span class="w">  </span><span class="nt">&quot;file_name&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;video.mp4&quot;</span><span class="p">,</span>
+<span class="w">  </span><span class="nt">&quot;file_path&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;/path/to/video.mp4&quot;</span><span class="p">,</span>
+<span class="w">  </span><span class="nt">&quot;file_type&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;video&quot;</span><span class="p">,</span>
+<span class="w">  </span><span class="nt">&quot;duration&quot;</span><span class="p">:</span><span class="w"> </span><span class="mf">120.5</span><span class="p">,</span>
+<span class="w">  </span><span class="nt">&quot;width&quot;</span><span class="p">:</span><span class="w"> </span><span class="mi">1920</span><span class="p">,</span>
+<span class="w">  </span><span class="nt">&quot;height&quot;</span><span class="p">:</span><span class="w"> </span><span class="mi">1080</span><span class="p">,</span>
+<span class="w">  </span><span class="nt">&quot;fps&quot;</span><span class="p">:</span><span class="w"> </span><span class="mf">24.0</span><span class="p">,</span>
+<span class="w">  </span><span class="nt">&quot;total_frames&quot;</span><span class="p">:</span><span class="w"> </span><span class="mi">2892</span><span class="p">,</span>
+<span class="w">  </span><span class="nt">&quot;already_exists&quot;</span><span class="p">:</span><span class="w"> </span><span class="kc">false</span><span class="p">,</span>
+<span class="w">  </span><span class="nt">&quot;message&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;File registered successfully&quot;</span>
+<span class="p">}</span>
+</code></pre></div>
+
+<table class="table">
+<thead>
+<tr>
+<th>Field</th>
+<th>Type</th>
+<th>Description</th>
+</tr>
+</thead>
+<tbody>
+<tr>
+<td><code>success</code></td>
+<td>boolean</td>
+<td>Always true on 200</td>
+</tr>
+<tr>
+<td><code>file_uuid</code></td>
+<td>string</td>
+<td>32-char hex UUID of the registered file</td>
+</tr>
+<tr>
+<td><code>file_name</code></td>
+<td>string</td>
+<td>File name (auto-renamed on a name conflict)</td>
+</tr>
+<tr>
+<td><code>file_path</code></td>
+<td>string</td>
+<td>Canonical path on disk</td>
+</tr>
+<tr>
+<td><code>file_type</code></td>
+<td>string</td>
+<td><code>"video"</code>, <code>"audio"</code>, or <code>"unknown"</code></td>
+</tr>
+<tr>
+<td><code>duration</code></td>
+<td>float</td>
+<td>Duration in seconds</td>
+</tr>
+<tr>
+<td><code>width</code></td>
+<td>integer</td>
+<td>Video width in pixels</td>
+</tr>
+<tr>
+<td><code>height</code></td>
+<td>integer</td>
+<td>Video height in pixels</td>
+</tr>
+<tr>
+<td><code>fps</code></td>
+<td>float</td>
+<td>Frames per second</td>
+</tr>
+<tr>
+<td><code>total_frames</code></td>
+<td>integer</td>
+<td>Total frame count</td>
+</tr>
+<tr>
+<td><code>already_exists</code></td>
+<td>boolean</td>
+<td>True if the same content was already registered</td>
+</tr>
+<tr>
+<td><code>message</code></td>
+<td>string</td>
+<td>Human-readable status</td>
+</tr>
+</tbody>
+</table>
+<h4>Error Responses</h4>
+<table class="table">
+<thead>
+<tr>
+<th>HTTP</th>
+<th>When</th>
+</tr>
+</thead>
+<tbody>
+<tr>
+<td><code>401</code></td>
+<td>Missing or invalid API key</td>
+</tr>
+<tr>
+<td><code>400</code></td>
+<td>Invalid request body</td>
+</tr>
+<tr>
+<td><code>404</code></td>
+<td>File path does not exist</td>
+</tr>
+</tbody>
+</table>
+<hr />
+<h3><code>GET /api/v1/files/scan</code></h3>
+<p><strong>Auth</strong>: Required<br />
+<strong>Scope</strong>: file-level</p>
+<p>Scan the filesystem directory and list all media files, showing which are registered, processing, or unregistered.</p>
+<h4>Query Parameters</h4>
+<table class="table">
+<thead>
+<tr>
+<th>Field</th>
+<th>Type</th>
+<th>Required</th>
+<th>Default</th>
+<th>Description</th>
+</tr>
+</thead>
+<tbody>
+<tr>
+<td><code>page</code></td>
+<td>integer</td>
+<td>No</td>
+<td>1</td>
+<td>Page number (1-based)</td>
+</tr>
+<tr>
+<td><code>page_size</code></td>
+<td>integer</td>
+<td>No</td>
+<td>all</td>
+<td>Items per page (alias: <code>limit</code>)</td>
+</tr>
+<tr>
+<td><code>limit</code></td>
+<td>integer</td>
+<td>No</td>
+<td>all</td>
+<td>Max items (alias for <code>page_size</code>)</td>
+</tr>
+<tr>
+<td><code>pattern</code></td>
+<td>string</td>
+<td>No</td>
+<td>—</td>
+<td>Regex filter on file name (e.g., <code>.*\.mp4$</code>)</td>
+</tr>
+<tr>
+<td><code>sort_by</code></td>
+<td>string</td>
+<td>No</td>
+<td><code>name</code></td>
+<td>Sort field: <code>name</code>, <code>size</code>, <code>modified</code>, <code>status</code></td>
+</tr>
+<tr>
+<td><code>sort_order</code></td>
+<td>string</td>
+<td>No</td>
+<td><code>asc</code></td>
+<td>Sort direction: <code>asc</code> or <code>desc</code></td>
+</tr>
+</tbody>
+</table>
+<h4>Example</h4>
+<div class="codehilite"><pre><span></span><code><span class="c1"># Full scan</span>
+curl<span class="w"> </span>-s<span class="w"> </span><span class="s2">&quot;</span><span class="nv">$API</span><span class="s2">/api/v1/files/scan&quot;</span><span class="w"> </span>-H<span class="w"> </span><span class="s2">&quot;X-API-Key: </span><span class="nv">$KEY</span><span class="s2">&quot;</span><span class="w"> </span><span class="p">|</span><span class="w"> </span>jq<span class="w"> </span><span class="s1">&#39;{total, registered_count, unregistered_count}&#39;</span>
+
+<span class="c1"># Paginated (page 1, 5 per page)</span>
+curl<span class="w"> </span>-s<span class="w"> </span><span class="s2">&quot;</span><span class="nv">$API</span><span class="s2">/api/v1/files/scan?page=1&amp;page_size=5&quot;</span><span class="w"> </span>-H<span class="w"> </span><span class="s2">&quot;X-API-Key: </span><span class="nv">$KEY</span><span class="s2">&quot;</span><span class="w"> </span><span class="p">|</span><span class="w"> </span>jq<span class="w"> </span><span class="s1">&#39;{page, total_pages, files: [.files[].file_name]}&#39;</span>
+
+<span class="c1"># Regex filter: only mp4 files</span>
+curl<span class="w"> </span>-s<span class="w"> </span><span class="s2">&quot;</span><span class="nv">$API</span><span class="s2">/api/v1/files/scan?pattern=.*\\.mp4</span>$<span class="s2">&quot;</span><span class="w"> </span>-H<span class="w"> </span><span class="s2">&quot;X-API-Key: </span><span class="nv">$KEY</span><span class="s2">&quot;</span><span class="w"> </span><span class="p">|</span><span class="w"> </span>jq<span class="w"> </span><span class="s1">&#39;{filtered_total, files: [.files[].file_name]}&#39;</span>
+
+<span class="c1"># Sort by file size (largest first)</span>
+curl<span class="w"> </span>-s<span class="w"> </span><span class="s2">&quot;</span><span class="nv">$API</span><span class="s2">/api/v1/files/scan?sort_by=size&amp;sort_order=desc&amp;page_size=5&quot;</span><span class="w"> </span>-H<span class="w"> </span><span class="s2">&quot;X-API-Key: </span><span class="nv">$KEY</span><span class="s2">&quot;</span><span class="w"> </span><span class="p">|</span><span class="w"> </span>jq<span class="w"> </span><span class="s1">&#39;[.files[] | {file_name, file_size}]&#39;</span>
+
+<span class="c1"># Sort by modified time (most recent first)</span>
+curl<span class="w"> </span>-s<span class="w"> </span><span class="s2">&quot;</span><span class="nv">$API</span><span class="s2">/api/v1/files/scan?sort_by=modified&amp;sort_order=desc&amp;page_size=5&quot;</span><span class="w"> </span>-H<span class="w"> </span><span class="s2">&quot;X-API-Key: </span><span class="nv">$KEY</span><span class="s2">&quot;</span><span class="w"> </span><span class="p">|</span><span class="w"> </span>jq<span class="w"> </span><span class="s1">&#39;[.files[] | {file_name, modified_time}]&#39;</span>
+
+<span class="c1"># Sort by status</span>
+curl<span class="w"> </span>-s<span class="w"> </span><span class="s2">&quot;</span><span class="nv">$API</span><span class="s2">/api/v1/files/scan?sort_by=status&amp;page_size=5&quot;</span><span class="w"> </span>-H<span class="w"> </span><span class="s2">&quot;X-API-Key: </span><span class="nv">$KEY</span><span class="s2">&quot;</span><span class="w"> </span><span class="p">|</span><span class="w"> </span>jq<span class="w"> </span><span class="s1">&#39;[.files[] | {file_name, status}]&#39;</span>
+</code></pre></div>
+
+<h4>Response (200)</h4>
+<div class="codehilite"><pre><span></span><code><span class="p">{</span>
+<span class="w">  </span><span class="nt">&quot;files&quot;</span><span class="p">:</span><span class="w"> </span><span class="p">[</span>
+<span class="w">    </span><span class="p">{</span>
+<span class="w">      </span><span class="nt">&quot;file_name&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;video.mp4&quot;</span><span class="p">,</span>
+<span class="w">      </span><span class="nt">&quot;file_size&quot;</span><span class="p">:</span><span class="w"> </span><span class="mi">12345678</span><span class="p">,</span>
+<span class="w">      </span><span class="nt">&quot;is_registered&quot;</span><span class="p">:</span><span class="w"> </span><span class="kc">true</span><span class="p">,</span>
+<span class="w">      </span><span class="nt">&quot;file_uuid&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;3a6c1865...&quot;</span><span class="p">,</span>
+<span class="w">      </span><span class="nt">&quot;status&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;completed&quot;</span><span class="p">,</span>
+<span class="w">      </span><span class="nt">&quot;registration_time&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;2026-05-16T12:00:00Z&quot;</span><span class="p">,</span>
+<span class="w">      </span><span class="nt">&quot;job_id&quot;</span><span class="p">:</span><span class="w"> </span><span class="mi">42</span>
+<span class="w">    </span><span class="p">}</span>
+<span class="w">  </span><span class="p">],</span>
+<span class="w">  </span><span class="nt">&quot;total&quot;</span><span class="p">:</span><span class="w"> </span><span class="mi">107</span><span class="p">,</span>
+<span class="w">  </span><span class="nt">&quot;filtered_total&quot;</span><span class="p">:</span><span class="w"> </span><span class="mi">80</span><span class="p">,</span>
+<span class="w">  </span><span class="nt">&quot;page&quot;</span><span class="p">:</span><span class="w"> </span><span class="mi">1</span><span class="p">,</span>
+<span class="w">  </span><span class="nt">&quot;page_size&quot;</span><span class="p">:</span><span class="w"> </span><span class="mi">20</span><span class="p">,</span>
+<span class="w">  </span><span class="nt">&quot;total_pages&quot;</span><span class="p">:</span><span class="w"> </span><span class="mi">4</span><span class="p">,</span>
+<span class="w">  </span><span class="nt">&quot;registered_count&quot;</span><span class="p">:</span><span class="w"> </span><span class="mi">26</span><span class="p">,</span>
+<span class="w">  </span><span class="nt">&quot;unregistered_count&quot;</span><span class="p">:</span><span class="w"> </span><span class="mi">81</span>
+<span class="p">}</span>
+</code></pre></div>
+
+<table class="table">
+<thead>
+<tr>
+<th>Field</th>
+<th>Type</th>
+<th>Description</th>
+</tr>
+</thead>
+<tbody>
+<tr>
+<td><code>files</code></td>
+<td>array</td>
+<td>Array of file info objects (paginated)</td>
+</tr>
+<tr>
+<td><code>files[].file_name</code></td>
+<td>string</td>
+<td>File name</td>
+</tr>
+<tr>
+<td><code>files[].relative_path</code></td>
+<td>string</td>
+<td>Path relative to scan root</td>
+</tr>
+<tr>
+<td><code>files[].file_path</code></td>
+<td>string</td>
+<td>Absolute path on disk</td>
+</tr>
+<tr>
+<td><code>files[].file_size</code></td>
+<td>integer</td>
+<td>File size in bytes</td>
+</tr>
+<tr>
+<td><code>files[].modified_time</code></td>
+<td>string</td>
+<td>Last modified timestamp (ISO8601)</td>
+</tr>
+<tr>
+<td><code>files[].is_registered</code></td>
+<td>boolean</td>
+<td>Whether file is registered in DB</td>
+</tr>
+<tr>
+<td><code>files[].file_uuid</code></td>
+<td>string</td>
+<td>32-char hex UUID (only if registered)</td>
+</tr>
+<tr>
+<td><code>files[].status</code></td>
+<td>string</td>
+<td><code>"completed"</code>, <code>"processing"</code>, <code>"registered"</code>, <code>"unregistered"</code>, or <code>null</code></td>
+</tr>
+<tr>
+<td><code>files[].registration_time</code></td>
+<td>string</td>
+<td>DB registration timestamp (only if registered)</td>
+</tr>
+<tr>
+<td><code>files[].job_id</code></td>
+<td>integer</td>
+<td>Processing job ID (only if a job exists)</td>
+</tr>
+<tr>
+<td><code>total</code></td>
+<td>integer</td>
+<td>Total files found on disk (unfiltered)</td>
+</tr>
+<tr>
+<td><code>filtered_total</code></td>
+<td>integer</td>
+<td>Files matching regex filter</td>
+</tr>
+<tr>
+<td><code>page</code></td>
+<td>integer</td>
+<td>Current page number</td>
+</tr>
+<tr>
+<td><code>page_size</code></td>
+<td>integer</td>
+<td>Items per page</td>
+</tr>
+<tr>
+<td><code>total_pages</code></td>
+<td>integer</td>
+<td>Total pages</td>
+</tr>
+<tr>
+<td><code>registered_count</code></td>
+<td>integer</td>
+<td>Files registered in DB</td>
+</tr>
+<tr>
+<td><code>unregistered_count</code></td>
+<td>integer</td>
+<td>Files not yet registered</td>
+</tr>
+</tbody>
+</table>
+<h4>Notes</h4>
+<table class="table">
+<thead>
+<tr>
+<th>Feature</th>
+<th>Behavior</th>
+</tr>
+</thead>
+<tbody>
+<tr>
+<td><strong>Regex</strong></td>
+<td>Case-insensitive (<code>(?i)</code> prefix auto-applied). Applied to <code>file_name</code>.</td>
+</tr>
+<tr>
+<td><strong>Sort order</strong></td>
+<td>Default (<code>sort_by=name</code>): registered files first, then alphabetically. <code>sort_by=status</code>: alphabetical by status string.</td>
+</tr>
+<tr>
+<td><strong>Pagination</strong></td>
+<td><code>page_size</code> and <code>limit</code> are aliases. Default: show all results.</td>
+</tr>
+<tr>
+<td><strong>Processing order</strong></td>
+<td><code>pattern</code> regex filter → <code>sort_by</code>/<code>sort_order</code> → <code>page</code>/<code>page_size</code> slice.</td>
+</tr>
+</tbody>
+</table>
+<hr />
+<h2>File Lookup</h2>
+<h3><code>GET /api/v1/files/lookup</code></h3>
+<p><strong>Auth</strong>: Required<br />
+<strong>Scope</strong>: file-level</p>
+<p>Search registered files by file name. Performs a case-insensitive LIKE search on the file name column. Returns basic info about matching files.</p>
+<h4>Query Parameters</h4>
+<table class="table">
+<thead>
+<tr>
+<th>Field</th>
+<th>Type</th>
+<th>Required</th>
+<th>Description</th>
+</tr>
+</thead>
+<tbody>
+<tr>
+<td><code>file_name</code></td>
+<td>string</td>
+<td>Yes</td>
+<td>File name to search for (partial matches supported)</td>
+</tr>
+</tbody>
+</table>
+<h4>Example</h4>
+<div class="codehilite"><pre><span></span><code><span class="c1"># Look up a specific file</span>
+curl<span class="w"> </span>-s<span class="w"> </span><span class="s2">&quot;</span><span class="nv">$API</span><span class="s2">/api/v1/files/lookup?file_name=video.mp4&quot;</span><span class="w"> </span><span class="se">\</span>
+<span class="w">  </span>-H<span class="w"> </span><span class="s2">&quot;X-API-Key: </span><span class="nv">$KEY</span><span class="s2">&quot;</span>
+
+<span class="c1"># Partial name search</span>
+curl<span class="w"> </span>-s<span class="w"> </span><span class="s2">&quot;</span><span class="nv">$API</span><span class="s2">/api/v1/files/lookup?file_name=charade&quot;</span><span class="w"> </span><span class="se">\</span>
+<span class="w">  </span>-H<span class="w"> </span><span class="s2">&quot;X-API-Key: </span><span class="nv">$KEY</span><span class="s2">&quot;</span><span class="w"> </span><span class="p">|</span><span class="w"> </span>jq<span class="w"> </span><span class="s1">&#39;.matches[].file_name&#39;</span>
+</code></pre></div>
+
+<h4>Response (200)</h4>
+<div class="codehilite"><pre><span></span><code><span class="p">{</span>
+<span class="w">  </span><span class="nt">&quot;file_name&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;video.mp4&quot;</span><span class="p">,</span>
+<span class="w">  </span><span class="nt">&quot;exists&quot;</span><span class="p">:</span><span class="w"> </span><span class="kc">true</span><span class="p">,</span>
+<span class="w">  </span><span class="nt">&quot;matches&quot;</span><span class="p">:</span><span class="w"> </span><span class="p">[</span>
+<span class="w">    </span><span class="p">{</span>
+<span class="w">      </span><span class="nt">&quot;file_uuid&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;a03485a40b2df2d3&quot;</span><span class="p">,</span>
+<span class="w">      </span><span class="nt">&quot;file_name&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;video.mp4&quot;</span><span class="p">,</span>
+<span class="w">      </span><span class="nt">&quot;file_type&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;video&quot;</span><span class="p">,</span>
+<span class="w">      </span><span class="nt">&quot;status&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;completed&quot;</span>
+<span class="w">    </span><span class="p">}</span>
+<span class="w">  </span><span class="p">],</span>
+<span class="w">  </span><span class="nt">&quot;next_name&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;video (2).mp4&quot;</span>
+<span class="p">}</span>
+</code></pre></div>
+
+<table class="table">
+<thead>
+<tr>
+<th>Field</th>
+<th>Type</th>
+<th>Description</th>
+</tr>
+</thead>
+<tbody>
+<tr>
+<td><code>file_name</code></td>
+<td>string</td>
+<td>Searched name</td>
+</tr>
+<tr>
+<td><code>exists</code></td>
+<td>boolean</td>
+<td>True if a file with exactly this name is already registered</td>
+</tr>
+<tr>
+<td><code>matches</code></td>
+<td>array</td>
+<td>Array of matching registered files</td>
+</tr>
+<tr>
+<td><code>matches[].file_uuid</code></td>
+<td>string</td>
+<td>32-char hex UUID</td>
+</tr>
+<tr>
+<td><code>matches[].file_name</code></td>
+<td>string</td>
+<td>Registered file name</td>
+</tr>
+<tr>
+<td><code>matches[].file_type</code></td>
+<td>string</td>
+<td><code>"video"</code>, <code>"audio"</code>, or <code>null</code></td>
+</tr>
+<tr>
+<td><code>matches[].status</code></td>
+<td>string</td>
+<td>Registration/processing status</td>
+</tr>
+<tr>
+<td><code>next_name</code></td>
+<td>string</td>
+<td>Suggested name for avoiding conflicts</td>
+</tr>
+</tbody>
+</table>
+<hr />
+<h2>Unregister</h2>
+<h3><code>POST /api/v1/unregister</code></h3>
+<p><strong>Auth</strong>: Required<br />
+<strong>Scope</strong>: file-level</p>
+<p>Delete registered files from the system. Supports deleting a single file by UUID, or a batch of files by directory + regex pattern.</p>
+<h4>What gets deleted</h4>
+<table class="table">
+<thead>
+<tr>
+<th>Removed (default)</th>
+<th>Not removed</th>
+</tr>
+</thead>
+<tbody>
+<tr>
+<td>Database records (videos, chunks, embeddings, processor_results, pre_chunks)</td>
+<td>The original source video file on disk</td>
+</tr>
+<tr>
+<td>Processor output JSON files (<code>{uuid}.*.json</code>) — unless <code>delete_output_files: false</code></td>
+<td>Temp/working directories</td>
+</tr>
+<tr>
+<td>In-memory cache entries</td>
+<td></td>
+</tr>
+<tr>
+<td>MongoDB cached lists</td>
+<td></td>
+</tr>
+</tbody>
+</table>
+<blockquote>
+<p>⚠️ Database deletion is <strong>irreversible</strong>. To keep output files, set <code>"delete_output_files": false</code>.</p>
+</blockquote>
+<h4>Request Parameters</h4>
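+<p>At least one mode must be specified: either <code>file_uuid</code> alone, or <code>file_path</code> + <code>pattern</code> together. Fields marked <code>*</code> in the Required column are conditionally required, depending on the mode used.</p>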
+<table class="table">
+<thead>
+<tr>
+<th>Field</th>
+<th>Type</th>
+<th>Required</th>
+<th>Default</th>
+<th>Description</th>
+</tr>
+</thead>
+<tbody>
+<tr>
+<td><code>file_uuid</code></td>
+<td>string</td>
+<td>*</td>
+<td>—</td>
+<td>Single file UUID to delete</td>
+</tr>
+<tr>
+<td><code>file_path</code></td>
+<td>string</td>
+<td>*</td>
+<td>—</td>
+<td>Directory path (for batch delete)</td>
+</tr>
+<tr>
+<td><code>pattern</code></td>
+<td>string</td>
+<td>*</td>
+<td>—</td>
+<td>Regex pattern (requires <code>file_path</code>)</td>
+</tr>
+<tr>
+<td><code>delete_output_files</code></td>
+<td>boolean</td>
+<td>No</td>
+<td><code>true</code></td>
+<td>If <code>true</code>, also delete processor output JSON files (<code>{uuid}.*.json</code>). Set to <code>false</code> to keep them.</td>
+</tr>
+</tbody>
+</table>
+<h4>Example</h4>
+<div class="codehilite"><pre><span></span><code><span class="c1"># Delete a single file by UUID (default: also deletes output JSON files)</span>
+curl<span class="w"> </span>-s<span class="w"> </span>-X<span class="w"> </span>POST<span class="w"> </span><span class="s2">&quot;</span><span class="nv">$API</span><span class="s2">/api/v1/unregister&quot;</span><span class="w"> </span><span class="se">\</span>
+<span class="w">  </span>-H<span class="w"> </span><span class="s2">&quot;Content-Type: application/json&quot;</span><span class="w"> </span><span class="se">\</span>
+<span class="w">  </span>-H<span class="w"> </span><span class="s2">&quot;X-API-Key: </span><span class="nv">$KEY</span><span class="s2">&quot;</span><span class="w"> </span><span class="se">\</span>
+<span class="w">  </span>-d<span class="w"> </span><span class="s1">&#39;{&quot;file_uuid&quot;: &quot;&#39;</span><span class="s2">&quot;</span><span class="nv">$FILE_UUID</span><span class="s2">&quot;</span><span class="s1">&#39;&quot;}&#39;</span>
+
+<span class="c1"># Keep output JSON files, only delete DB records</span>
+curl<span class="w"> </span>-s<span class="w"> </span>-X<span class="w"> </span>POST<span class="w"> </span><span class="s2">&quot;</span><span class="nv">$API</span><span class="s2">/api/v1/unregister&quot;</span><span class="w"> </span><span class="se">\</span>
+<span class="w">  </span>-H<span class="w"> </span><span class="s2">&quot;Content-Type: application/json&quot;</span><span class="w"> </span><span class="se">\</span>
+<span class="w">  </span>-H<span class="w"> </span><span class="s2">&quot;X-API-Key: </span><span class="nv">$KEY</span><span class="s2">&quot;</span><span class="w"> </span><span class="se">\</span>
+<span class="w">  </span>-d<span class="w"> </span><span class="s1">&#39;{&quot;file_uuid&quot;: &quot;&#39;</span><span class="s2">&quot;</span><span class="nv">$FILE_UUID</span><span class="s2">&quot;</span><span class="s1">&#39;&quot;, &quot;delete_output_files&quot;: false}&#39;</span>
+
+<span class="c1"># Batch delete all mp4 files in a directory</span>
+curl<span class="w"> </span>-s<span class="w"> </span>-X<span class="w"> </span>POST<span class="w"> </span><span class="s2">&quot;</span><span class="nv">$API</span><span class="s2">/api/v1/unregister&quot;</span><span class="w"> </span><span class="se">\</span>
+<span class="w">  </span>-H<span class="w"> </span><span class="s2">&quot;Content-Type: application/json&quot;</span><span class="w"> </span><span class="se">\</span>
+<span class="w">  </span>-H<span class="w"> </span><span class="s2">&quot;X-API-Key: </span><span class="nv">$KEY</span><span class="s2">&quot;</span><span class="w"> </span><span class="se">\</span>
+<span class="w">  </span>-d<span class="w"> </span><span class="s1">&#39;{&quot;file_path&quot;: &quot;/path/to/dir&quot;, &quot;pattern&quot;: &quot;.*\\.mp4$&quot;}&#39;</span>
+</code></pre></div>
+
+<h4>Response (200)</h4>
+<div class="codehilite"><pre><span></span><code><span class="p">{</span>
+<span class="w">  </span><span class="nt">&quot;success&quot;</span><span class="p">:</span><span class="w"> </span><span class="kc">true</span><span class="p">,</span>
+<span class="w">  </span><span class="nt">&quot;file_uuid&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;a03485a40b2df2d3&quot;</span><span class="p">,</span>
+<span class="w">  </span><span class="nt">&quot;message&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;Video unregistered successfully&quot;</span>
+<span class="p">}</span>
+</code></pre></div>
+
+<table class="table">
+<thead>
+<tr>
+<th>Field</th>
+<th>Type</th>
+<th>Description</th>
+</tr>
+</thead>
+<tbody>
+<tr>
+<td><code>success</code></td>
+<td>boolean</td>
+<td>True if deletion succeeded</td>
+</tr>
+<tr>
+<td><code>file_uuid</code></td>
+<td>string</td>
+<td>UUID of the deleted file (single mode)</td>
+</tr>
+<tr>
+<td><code>message</code></td>
+<td>string</td>
+<td>Human-readable status</td>
+</tr>
+</tbody>
+</table>
+<h4>Error Responses</h4>
+<table class="table">
+<thead>
+<tr>
+<th>HTTP</th>
+<th>When</th>
+</tr>
+</thead>
+<tbody>
+<tr>
+<td><code>400</code></td>
+<td>Neither <code>file_uuid</code> nor <code>file_path</code>+<code>pattern</code> provided</td>
+</tr>
+<tr>
+<td><code>404</code></td>
+<td>File UUID not found</td>
+</tr>
+<tr>
+<td><code>401</code></td>
+<td>Missing or invalid API key</td>
+</tr>
+</tbody>
+</table>
+<hr />
+<h2>Processing Pipeline</h2>
+<h3><code>POST /api/v1/file/:file_uuid/process</code></h3>
+<p><strong>Auth</strong>: Required<br />
+<strong>Scope</strong>: file-level</p>
+<p>Trigger the processing pipeline for a registered file. Creates a monitor job that the worker picks up and processes sequentially. Returns immediately with the job info—processing runs asynchronously in the background.</p>
+<h4>Request Parameters</h4>
+<table class="table">
+<thead>
+<tr>
+<th>Field</th>
+<th>Type</th>
+<th>Required</th>
+<th>Default</th>
+<th>Description</th>
+</tr>
+</thead>
+<tbody>
+<tr>
+<td><code>processors</code></td>
+<td>string[]</td>
+<td>No</td>
+<td>all</td>
+<td>Specific processors to run: <code>["asr","cut","yolo","ocr","face","pose","asrx","visual_chunk"]</code></td>
+</tr>
+<tr>
+<td><code>rules</code></td>
+<td>string[]</td>
+<td>No</td>
+<td>all</td>
+<td>Rule names to apply (currently unused)</td>
+</tr>
+</tbody>
+</table>
+<h4>Example</h4>
+<div class="codehilite"><pre><span></span><code><span class="c1"># Run all processors</span>
+curl<span class="w"> </span>-s<span class="w"> </span>-X<span class="w"> </span>POST<span class="w"> </span><span class="s2">&quot;</span><span class="nv">$API</span><span class="s2">/api/v1/file/</span><span class="nv">$FILE_UUID</span><span class="s2">/process&quot;</span><span class="w"> </span><span class="se">\</span>
+<span class="w">  </span>-H<span class="w"> </span><span class="s2">&quot;Content-Type: application/json&quot;</span><span class="w"> </span><span class="se">\</span>
+<span class="w">  </span>-H<span class="w"> </span><span class="s2">&quot;X-API-Key: </span><span class="nv">$KEY</span><span class="s2">&quot;</span><span class="w"> </span>-d<span class="w"> </span><span class="s1">&#39;{}&#39;</span>
+
+<span class="c1"># Run specific processors only</span>
+curl<span class="w"> </span>-s<span class="w"> </span>-X<span class="w"> </span>POST<span class="w"> </span><span class="s2">&quot;</span><span class="nv">$API</span><span class="s2">/api/v1/file/</span><span class="nv">$FILE_UUID</span><span class="s2">/process&quot;</span><span class="w"> </span><span class="se">\</span>
+<span class="w">  </span>-H<span class="w"> </span><span class="s2">&quot;Content-Type: application/json&quot;</span><span class="w"> </span><span class="se">\</span>
+<span class="w">  </span>-H<span class="w"> </span><span class="s2">&quot;X-API-Key: </span><span class="nv">$KEY</span><span class="s2">&quot;</span><span class="w"> </span><span class="se">\</span>
+<span class="w">  </span>-d<span class="w"> </span><span class="s1">&#39;{&quot;processors&quot;: [&quot;asr&quot;, &quot;face&quot;, &quot;yolo&quot;]}&#39;</span>
+</code></pre></div>
+
+<h4>Response (200)</h4>
+<div class="codehilite"><pre><span></span><code><span class="p">{</span>
+<span class="w">  </span><span class="nt">&quot;success&quot;</span><span class="p">:</span><span class="w"> </span><span class="kc">true</span><span class="p">,</span>
+<span class="w">  </span><span class="nt">&quot;job_id&quot;</span><span class="p">:</span><span class="w"> </span><span class="mi">42</span><span class="p">,</span>
+<span class="w">  </span><span class="nt">&quot;file_uuid&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;3a6c1865...&quot;</span><span class="p">,</span>
+<span class="w">  </span><span class="nt">&quot;status&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;processing&quot;</span><span class="p">,</span>
+<span class="w">  </span><span class="nt">&quot;pids&quot;</span><span class="p">:</span><span class="w"> </span><span class="p">[</span><span class="mi">12345</span><span class="p">,</span><span class="w"> </span><span class="mi">12346</span><span class="p">],</span>
+<span class="w">  </span><span class="nt">&quot;message&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;Processing triggered for video.mp4&quot;</span>
+<span class="p">}</span>
+</code></pre></div>
+
+<table class="table">
+<thead>
+<tr>
+<th>Field</th>
+<th>Type</th>
+<th>Description</th>
+</tr>
+</thead>
+<tbody>
+<tr>
+<td><code>success</code></td>
+<td>boolean</td>
+<td>Always true on 200</td>
+</tr>
+<tr>
+<td><code>job_id</code></td>
+<td>integer</td>
+<td>Monitor job ID (for job tracking)</td>
+</tr>
+<tr>
+<td><code>file_uuid</code></td>
+<td>string</td>
+<td>32-char hex UUID of the file</td>
+</tr>
+<tr>
+<td><code>status</code></td>
+<td>string</td>
+<td><code>"processing"</code></td>
+</tr>
+<tr>
+<td><code>pids</code></td>
+<td>integer[]</td>
+<td>Process IDs of started processors</td>
+</tr>
+<tr>
+<td><code>message</code></td>
+<td>string</td>
+<td>Human-readable status</td>
+</tr>
+</tbody>
+</table>
+<h4>Error Responses</h4>
+<table class="table">
+<thead>
+<tr>
+<th>HTTP</th>
+<th>When</th>
+</tr>
+</thead>
+<tbody>
+<tr>
+<td><code>404</code></td>
+<td>File UUID not found</td>
+</tr>
+<tr>
+<td><code>401</code></td>
+<td>Missing or invalid API key</td>
+</tr>
+</tbody>
+</table>
+<hr />
+<h3><code>GET /api/v1/file/:file_uuid/probe</code></h3>
+<p><strong>Auth</strong>: Required<br />
+<strong>Scope</strong>: file-level</p>
+<p>Get ffprobe metadata for a registered file. Returns video/audio stream info, codec details, duration, resolution, and frame rate.</p>
+<h4>Example</h4>
+<div class="codehilite"><pre><span></span><code>curl<span class="w"> </span>-s<span class="w"> </span><span class="s2">&quot;</span><span class="nv">$API</span><span class="s2">/api/v1/file/</span><span class="nv">$FILE_UUID</span><span class="s2">/probe&quot;</span><span class="w"> </span>-H<span class="w"> </span><span class="s2">&quot;X-API-Key: </span><span class="nv">$KEY</span><span class="s2">&quot;</span>
+</code></pre></div>
+
+<h4>Response (200)</h4>
+<div class="codehilite"><pre><span></span><code><span class="p">{</span>
+<span class="w">  </span><span class="nt">&quot;file_uuid&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;3a6c1865...&quot;</span><span class="p">,</span>
+<span class="w">  </span><span class="nt">&quot;file_name&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;video.mp4&quot;</span><span class="p">,</span>
+<span class="w">  </span><span class="nt">&quot;file_size&quot;</span><span class="p">:</span><span class="w"> </span><span class="mi">12345678</span><span class="p">,</span>
+<span class="w">  </span><span class="nt">&quot;duration&quot;</span><span class="p">:</span><span class="w"> </span><span class="mf">120.5</span><span class="p">,</span>
+<span class="w">  </span><span class="nt">&quot;width&quot;</span><span class="p">:</span><span class="w"> </span><span class="mi">1920</span><span class="p">,</span>
+<span class="w">  </span><span class="nt">&quot;height&quot;</span><span class="p">:</span><span class="w"> </span><span class="mi">1080</span><span class="p">,</span>
+<span class="w">  </span><span class="nt">&quot;fps&quot;</span><span class="p">:</span><span class="w"> </span><span class="mf">24.0</span><span class="p">,</span>
+<span class="w">  </span><span class="nt">&quot;total_frames&quot;</span><span class="p">:</span><span class="w"> </span><span class="mi">2892</span><span class="p">,</span>
+<span class="w">  </span><span class="nt">&quot;cached&quot;</span><span class="p">:</span><span class="w"> </span><span class="kc">true</span><span class="p">,</span>
+<span class="w">  </span><span class="nt">&quot;format&quot;</span><span class="p">:</span><span class="w"> </span><span class="p">{</span>
+<span class="w">    </span><span class="nt">&quot;filename&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;/path/to/video.mp4&quot;</span><span class="p">,</span>
+<span class="w">    </span><span class="nt">&quot;format_name&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;mov,mp4,m4a,3gp&quot;</span><span class="p">,</span>
+<span class="w">    </span><span class="nt">&quot;duration&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;120.5&quot;</span><span class="p">,</span>
+<span class="w">    </span><span class="nt">&quot;size&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;12345678&quot;</span><span class="p">,</span>
+<span class="w">    </span><span class="nt">&quot;bit_rate&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;819200&quot;</span>
+<span class="w">  </span><span class="p">},</span>
+<span class="w">  </span><span class="nt">&quot;streams&quot;</span><span class="p">:</span><span class="w"> </span><span class="p">[</span>
+<span class="w">    </span><span class="p">{</span>
+<span class="w">      </span><span class="nt">&quot;index&quot;</span><span class="p">:</span><span class="w"> </span><span class="mi">0</span><span class="p">,</span>
+<span class="w">      </span><span class="nt">&quot;codec_name&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;h264&quot;</span><span class="p">,</span>
+<span class="w">      </span><span class="nt">&quot;codec_type&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;video&quot;</span><span class="p">,</span>
+<span class="w">      </span><span class="nt">&quot;width&quot;</span><span class="p">:</span><span class="w"> </span><span class="mi">1920</span><span class="p">,</span>
+<span class="w">      </span><span class="nt">&quot;height&quot;</span><span class="p">:</span><span class="w"> </span><span class="mi">1080</span><span class="p">,</span>
+<span class="w">      </span><span class="nt">&quot;r_frame_rate&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;24/1&quot;</span><span class="p">,</span>
+<span class="w">      </span><span class="nt">&quot;duration&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;120.5&quot;</span>
+<span class="w">    </span><span class="p">}</span>
+<span class="w">  </span><span class="p">]</span>
+<span class="p">}</span>
+</code></pre></div>
+
+<table class="table">
+<thead>
+<tr>
+<th>Field</th>
+<th>Type</th>
+<th>Description</th>
+</tr>
+</thead>
+<tbody>
+<tr>
+<td><code>file_uuid</code></td>
+<td>string</td>
+<td>32-char hex UUID</td>
+</tr>
+<tr>
+<td><code>file_name</code></td>
+<td>string</td>
+<td>File name</td>
+</tr>
+<tr>
+<td><code>file_size</code></td>
+<td>integer</td>
+<td>File size in bytes (from filesystem)</td>
+</tr>
+<tr>
+<td><code>duration</code></td>
+<td>float</td>
+<td>Duration in seconds</td>
+</tr>
+<tr>
+<td><code>width</code></td>
+<td>integer</td>
+<td>Video width in pixels</td>
+</tr>
+<tr>
+<td><code>height</code></td>
+<td>integer</td>
+<td>Video height in pixels</td>
+</tr>
+<tr>
+<td><code>fps</code></td>
+<td>float</td>
+<td>Frames per second</td>
+</tr>
+<tr>
+<td><code>total_frames</code></td>
+<td>integer</td>
+<td>Estimated total frames</td>
+</tr>
+<tr>
+<td><code>cached</code></td>
+<td>boolean</td>
+<td>True if result was from cached probe JSON</td>
+</tr>
+<tr>
+<td><code>format</code></td>
+<td>object</td>
+<td>Container format info (ffprobe format section)</td>
+</tr>
+<tr>
+<td><code>streams</code></td>
+<td>array</td>
+<td>Array of stream info objects</td>
+</tr>
+</tbody>
+</table>
+<hr />
+<h3><code>GET /api/v1/progress/:file_uuid</code></h3>
+<p><strong>Auth</strong>: Required<br />
+<strong>Scope</strong>: file-level</p>
+<p>Get real-time processing progress for a file. Queries Redis for per-processor status and the database for file metadata. Also includes system resource stats.</p>
+<h4>Example</h4>
+<div class="codehilite"><pre><span></span><code>curl<span class="w"> </span>-s<span class="w"> </span><span class="s2">&quot;</span><span class="nv">$API</span><span class="s2">/api/v1/progress/</span><span class="nv">$FILE_UUID</span><span class="s2">&quot;</span><span class="w"> </span>-H<span class="w"> </span><span class="s2">&quot;X-API-Key: </span><span class="nv">$KEY</span><span class="s2">&quot;</span><span class="w"> </span><span class="p">|</span><span class="w"> </span>jq<span class="w"> </span><span class="s1">&#39;{overall_progress, processors: [.processors[] | {processor_type, status}]}&#39;</span>
+</code></pre></div>
+
+<h4>Response (200)</h4>
+<div class="codehilite"><pre><span></span><code><span class="p">{</span>
+<span class="w">  </span><span class="nt">&quot;file_uuid&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;3a6c1865...&quot;</span><span class="p">,</span>
+<span class="w">  </span><span class="nt">&quot;overall_progress&quot;</span><span class="p">:</span><span class="w"> </span><span class="mi">71</span><span class="p">,</span>
+<span class="w">  </span><span class="nt">&quot;cpu_percent&quot;</span><span class="p">:</span><span class="w"> </span><span class="mf">45.2</span><span class="p">,</span>
+<span class="w">  </span><span class="nt">&quot;gpu_percent&quot;</span><span class="p">:</span><span class="w"> </span><span class="mf">30.1</span><span class="p">,</span>
+<span class="w">  </span><span class="nt">&quot;memory_percent&quot;</span><span class="p">:</span><span class="w"> </span><span class="mf">62.4</span><span class="p">,</span>
+<span class="w">  </span><span class="nt">&quot;processors&quot;</span><span class="p">:</span><span class="w"> </span><span class="p">[</span>
+<span class="w">    </span><span class="p">{</span><span class="nt">&quot;processor_type&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;asr&quot;</span><span class="p">,</span><span class="w"> </span><span class="nt">&quot;status&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;complete&quot;</span><span class="p">,</span><span class="w"> </span><span class="nt">&quot;progress&quot;</span><span class="p">:</span><span class="w"> </span><span class="mi">100</span><span class="p">},</span>
+<span class="w">    </span><span class="p">{</span><span class="nt">&quot;processor_type&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;yolo&quot;</span><span class="p">,</span><span class="w"> </span><span class="nt">&quot;status&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;running&quot;</span><span class="p">,</span><span class="w"> </span><span class="nt">&quot;progress&quot;</span><span class="p">:</span><span class="w"> </span><span class="mi">65</span><span class="p">},</span>
+<span class="w">    </span><span class="p">{</span><span class="nt">&quot;processor_type&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;face&quot;</span><span class="p">,</span><span class="w"> </span><span class="nt">&quot;status&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;pending&quot;</span><span class="p">,</span><span class="w"> </span><span class="nt">&quot;progress&quot;</span><span class="p">:</span><span class="w"> </span><span class="mi">0</span><span class="p">}</span>
+<span class="w">  </span><span class="p">]</span>
+<span class="p">}</span>
+</code></pre></div>
+
+<table class="table">
+<thead>
+<tr>
+<th>Field</th>
+<th>Type</th>
+<th>Description</th>
+</tr>
+</thead>
+<tbody>
+<tr>
+<td><code>file_uuid</code></td>
+<td>string</td>
+<td>32-char hex UUID</td>
+</tr>
+<tr>
+<td><code>overall_progress</code></td>
+<td>integer</td>
+<td>Overall progress percentage (0–100)</td>
+</tr>
+<tr>
+<td><code>processors</code></td>
+<td>array</td>
+<td>Per-processor status list</td>
+</tr>
+<tr>
+<td><code>processors[].processor_type</code></td>
+<td>string</td>
+<td>Processor name (<code>asr</code>, <code>cut</code>, <code>yolo</code>, etc.)</td>
+</tr>
+<tr>
+<td><code>processors[].status</code></td>
+<td>string</td>
+<td><code>"pending"</code>, <code>"running"</code>, <code>"complete"</code>, or <code>"failed"</code></td>
+</tr>
+<tr>
+<td><code>processors[].progress</code></td>
+<td>integer</td>
+<td>Per-processor progress (0–100)</td>
+</tr>
+<tr>
+<td><code>cpu_percent</code></td>
+<td>float</td>
+<td>Current CPU usage</td>
+</tr>
+<tr>
+<td><code>gpu_percent</code></td>
+<td>float</td>
+<td>Current GPU utilization</td>
+</tr>
+<tr>
+<td><code>memory_percent</code></td>
+<td>float</td>
+<td>Current memory usage</td>
+</tr>
+</tbody>
+</table>
+<hr />
+<h3><code>GET /api/v1/jobs</code></h3>
+<p><strong>Auth</strong>: Required<br />
+<strong>Scope</strong>: system-level</p>
+<p>List all processing jobs (monitor jobs) in the system. Shows job status, which file each job is processing, and current processor info.</p>
+<h4>Example</h4>
+<div class="codehilite"><pre><span></span><code>curl<span class="w"> </span>-s<span class="w"> </span><span class="s2">&quot;</span><span class="nv">$API</span><span class="s2">/api/v1/jobs&quot;</span><span class="w"> </span>-H<span class="w"> </span><span class="s2">&quot;X-API-Key: </span><span class="nv">$KEY</span><span class="s2">&quot;</span><span class="w"> </span><span class="p">|</span><span class="w"> </span>jq<span class="w"> </span><span class="s1">&#39;{count, jobs: [.jobs[] | {uuid, status}]}&#39;</span>
+</code></pre></div>
+
+<h4>Response (200)</h4>
+<div class="codehilite"><pre><span></span><code><span class="p">{</span>
+<span class="w">  </span><span class="nt">&quot;jobs&quot;</span><span class="p">:</span><span class="w"> </span><span class="p">[</span>
+<span class="w">    </span><span class="p">{</span>
+<span class="w">      </span><span class="nt">&quot;id&quot;</span><span class="p">:</span><span class="w"> </span><span class="mi">42</span><span class="p">,</span>
+<span class="w">      </span><span class="nt">&quot;uuid&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;3a6c1865...&quot;</span><span class="p">,</span>
+<span class="w">      </span><span class="nt">&quot;status&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;running&quot;</span><span class="p">,</span>
+<span class="w">      </span><span class="nt">&quot;current_processor&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;yolo&quot;</span><span class="p">,</span>
+<span class="w">      </span><span class="nt">&quot;created_at&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;2026-05-16T12:00:00Z&quot;</span><span class="p">,</span>
+<span class="w">      </span><span class="nt">&quot;started_at&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;2026-05-16T12:01:00Z&quot;</span>
+<span class="w">    </span><span class="p">}</span>
+<span class="w">  </span><span class="p">],</span>
+<span class="w">  </span><span class="nt">&quot;count&quot;</span><span class="p">:</span><span class="w"> </span><span class="mi">15</span><span class="p">,</span>
+<span class="w">  </span><span class="nt">&quot;page&quot;</span><span class="p">:</span><span class="w"> </span><span class="mi">1</span><span class="p">,</span>
+<span class="w">  </span><span class="nt">&quot;page_size&quot;</span><span class="p">:</span><span class="w"> </span><span class="mi">20</span>
+<span class="p">}</span>
+</code></pre></div>
+
+<table class="table">
+<thead>
+<tr>
+<th>Field</th>
+<th>Type</th>
+<th>Description</th>
+</tr>
+</thead>
+<tbody>
+<tr>
+<td><code>jobs</code></td>
+<td>array</td>
+<td>Array of job info objects</td>
+</tr>
+<tr>
+<td><code>jobs[].id</code></td>
+<td>integer</td>
+<td>Job ID</td>
+</tr>
+<tr>
+<td><code>jobs[].uuid</code></td>
+<td>string</td>
+<td>File UUID being processed</td>
+</tr>
+<tr>
+<td><code>jobs[].status</code></td>
+<td>string</td>
+<td><code>"pending"</code>, <code>"running"</code>, <code>"completed"</code>, <code>"failed"</code></td>
+</tr>
+<tr>
+<td><code>jobs[].current_processor</code></td>
+<td>string or null</td>
+<td>Currently active processor, or null</td>
+</tr>
+<tr>
+<td><code>count</code></td>
+<td>integer</td>
+<td>Total job count</td>
+</tr>
+<tr>
+<td><code>page</code></td>
+<td>integer</td>
+<td>Current page number</td>
+</tr>
+<tr>
+<td><code>page_size</code></td>
+<td>integer</td>
+<td>Jobs per page</td>
+</tr>
+</tbody>
+</table>
+<hr />
+<h2>Search APIs</h2>
+<h3>Standard Search</h3>
+<h3><code>POST /api/v1/search</code></h3>
+<p><strong>Auth</strong>: Required<br />
+<strong>Scope</strong>: file-level</p>
+<p>Semantic/vector search across indexed video chunks. Returns matching chunks with scores.</p>
+<h4>Request Parameters</h4>
+<table class="table">
+<thead>
+<tr>
+<th>Field</th>
+<th>Type</th>
+<th>Required</th>
+<th>Default</th>
+<th>Description</th>
+</tr>
+</thead>
+<tbody>
+<tr>
+<td><code>query</code></td>
+<td>string</td>
+<td>Yes</td>
+<td>—</td>
+<td>Search text</td>
+</tr>
+<tr>
+<td><code>file_uuid</code></td>
+<td>string</td>
+<td>No</td>
+<td>—</td>
+<td>Restrict search to a specific file</td>
+</tr>
+<tr>
+<td><code>limit</code></td>
+<td>integer</td>
+<td>No</td>
+<td>10</td>
+<td>Max results</td>
+</tr>
+<tr>
+<td><code>page</code></td>
+<td>integer</td>
+<td>No</td>
+<td>1</td>
+<td>Page number (1-based)</td>
+</tr>
+<tr>
+<td><code>page_size</code></td>
+<td>integer</td>
+<td>No</td>
+<td><code>limit</code></td>
+<td>Items per page; when omitted, the value of <code>limit</code> is used</td>
+</tr>
+<tr>
+<td><code>mode</code></td>
+<td>string</td>
+<td>No</td>
+<td><code>smart</code></td>
+<td>Search mode: <code>"vector"</code> or <code>"smart"</code></td>
+</tr>
+</tbody>
+</table>
+<h4>Example</h4>
+<div class="codehilite"><pre><span></span><code><span class="c1"># Search across all files</span>
+curl<span class="w"> </span>-s<span class="w"> </span>-X<span class="w"> </span>POST<span class="w"> </span><span class="s2">&quot;</span><span class="nv">$API</span><span class="s2">/api/v1/search&quot;</span><span class="w"> </span><span class="se">\</span>
+<span class="w">  </span>-H<span class="w"> </span><span class="s2">&quot;Content-Type: application/json&quot;</span><span class="w"> </span><span class="se">\</span>
+<span class="w">  </span>-H<span class="w"> </span><span class="s2">&quot;X-API-Key: </span><span class="nv">$KEY</span><span class="s2">&quot;</span><span class="w"> </span><span class="se">\</span>
+<span class="w">  </span>-d<span class="w"> </span><span class="s1">&#39;{&quot;query&quot;: &quot;charade&quot;, &quot;limit&quot;: 5}&#39;</span>
+
+<span class="c1"># Search within a specific file</span>
+curl<span class="w"> </span>-s<span class="w"> </span>-X<span class="w"> </span>POST<span class="w"> </span><span class="s2">&quot;</span><span class="nv">$API</span><span class="s2">/api/v1/search&quot;</span><span class="w"> </span><span class="se">\</span>
+<span class="w">  </span>-H<span class="w"> </span><span class="s2">&quot;Content-Type: application/json&quot;</span><span class="w"> </span><span class="se">\</span>
+<span class="w">  </span>-H<span class="w"> </span><span class="s2">&quot;X-API-Key: </span><span class="nv">$KEY</span><span class="s2">&quot;</span><span class="w"> </span><span class="se">\</span>
+<span class="w">  </span>-d<span class="w"> </span><span class="s1">&#39;{&quot;query&quot;: &quot;charade&quot;, &quot;file_uuid&quot;: &quot;&#39;</span><span class="s2">&quot;</span><span class="nv">$FILE_UUID</span><span class="s2">&quot;</span><span class="s1">&#39;&quot;}&#39;</span>
+
+<span class="c1"># Paginated search</span>
+curl<span class="w"> </span>-s<span class="w"> </span>-X<span class="w"> </span>POST<span class="w"> </span><span class="s2">&quot;</span><span class="nv">$API</span><span class="s2">/api/v1/search&quot;</span><span class="w"> </span><span class="se">\</span>
+<span class="w">  </span>-H<span class="w"> </span><span class="s2">&quot;Content-Type: application/json&quot;</span><span class="w"> </span><span class="se">\</span>
+<span class="w">  </span>-H<span class="w"> </span><span class="s2">&quot;X-API-Key: </span><span class="nv">$KEY</span><span class="s2">&quot;</span><span class="w"> </span><span class="se">\</span>
+<span class="w">  </span>-d<span class="w"> </span><span class="s1">&#39;{&quot;query&quot;: &quot;charade&quot;, &quot;page&quot;: 1, &quot;page_size&quot;: 3}&#39;</span>
+</code></pre></div>
+
+<h4>Response (200)</h4>
+<div class="codehilite"><pre><span></span><code><span class="p">{</span>
+<span class="w">  </span><span class="nt">&quot;results&quot;</span><span class="p">:</span><span class="w"> </span><span class="p">[</span>
+<span class="w">    </span><span class="p">{</span>
+<span class="w">      </span><span class="nt">&quot;uuid&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;3a6c1865...&quot;</span><span class="p">,</span>
+<span class="w">      </span><span class="nt">&quot;chunk_id&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;sentence_0012&quot;</span><span class="p">,</span>
+<span class="w">      </span><span class="nt">&quot;chunk_type&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;sentence&quot;</span><span class="p">,</span>
+<span class="w">      </span><span class="nt">&quot;start_time&quot;</span><span class="p">:</span><span class="w"> </span><span class="mf">48.8</span><span class="p">,</span>
+<span class="w">      </span><span class="nt">&quot;end_time&quot;</span><span class="p">:</span><span class="w"> </span><span class="mf">55.4</span><span class="p">,</span>
+<span class="w">      </span><span class="nt">&quot;text&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;charade is a classic film...&quot;</span><span class="p">,</span>
+<span class="w">      </span><span class="nt">&quot;score&quot;</span><span class="p">:</span><span class="w"> </span><span class="mf">0.92</span>
+<span class="w">    </span><span class="p">}</span>
+<span class="w">  </span><span class="p">],</span>
+<span class="w">  </span><span class="nt">&quot;query&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;charade&quot;</span><span class="p">,</span>
+<span class="w">  </span><span class="nt">&quot;total&quot;</span><span class="p">:</span><span class="w"> </span><span class="mi">15</span><span class="p">,</span>
+<span class="w">  </span><span class="nt">&quot;page&quot;</span><span class="p">:</span><span class="w"> </span><span class="mi">1</span><span class="p">,</span>
+<span class="w">  </span><span class="nt">&quot;page_size&quot;</span><span class="p">:</span><span class="w"> </span><span class="mi">3</span>
+<span class="p">}</span>
+</code></pre></div>
+
+<blockquote>
+<p>Results are deduplicated by <code>chunk_id</code> (highest score wins) before pagination.</p>
+</blockquote>
+<table class="table">
+<thead>
+<tr>
+<th>Field</th>
+<th>Type</th>
+<th>Description</th>
+</tr>
+</thead>
+<tbody>
+<tr>
+<td><code>results</code></td>
+<td>array</td>
+<td>Array of matched chunks (deduplicated)</td>
+</tr>
+<tr>
+<td><code>results[].uuid</code></td>
+<td>string</td>
+<td>File UUID</td>
+</tr>
+<tr>
+<td><code>results[].chunk_id</code></td>
+<td>string</td>
+<td>Chunk identifier</td>
+</tr>
+<tr>
+<td><code>results[].chunk_type</code></td>
+<td>string</td>
+<td><code>"sentence"</code>, <code>"cut"</code>, <code>"trace"</code>, <code>"visual"</code></td>
+</tr>
+<tr>
+<td><code>results[].start_time</code></td>
+<td>float</td>
+<td>Start time in seconds</td>
+</tr>
+<tr>
+<td><code>results[].end_time</code></td>
+<td>float</td>
+<td>End time in seconds</td>
+</tr>
+<tr>
+<td><code>results[].text</code></td>
+<td>string</td>
+<td>Chunk text content</td>
+</tr>
+<tr>
+<td><code>results[].score</code></td>
+<td>float</td>
+<td>Similarity score (0.0–1.0)</td>
+</tr>
+<tr>
+<td><code>query</code></td>
+<td>string</td>
+<td>Original search query</td>
+</tr>
+<tr>
+<td><code>total</code></td>
+<td>integer</td>
+<td>Total matching results</td>
+</tr>
+<tr>
+<td><code>page</code></td>
+<td>integer</td>
+<td>Current page number</td>
+</tr>
+<tr>
+<td><code>page_size</code></td>
+<td>integer</td>
+<td>Items per page</td>
+</tr>
+</tbody>
+</table>
+<h4>Error Responses</h4>
+<table class="table">
+<thead>
+<tr>
+<th>HTTP</th>
+<th>When</th>
+</tr>
+</thead>
+<tbody>
+<tr>
+<td><code>401</code></td>
+<td>Missing or invalid API key</td>
+</tr>
+</tbody>
+</table>
+<hr />
+<div class="codehilite"><pre><span></span><code>
+<span class="err">###</span><span class="w"> </span><span class="err">`POST</span><span class="w"> </span><span class="err">/api/v</span><span class="mi">1</span><span class="err">/search/hybrid`</span>
+
+<span class="err">**Au</span><span class="kc">t</span><span class="err">h**</span><span class="p">:</span><span class="w"> </span><span class="err">Required</span>
+<span class="err">**Scope**</span><span class="p">:</span><span class="w"> </span><span class="kc">f</span><span class="err">ile</span><span class="mi">-</span><span class="err">level</span>
+
+<span class="err">Hybrid</span><span class="w"> </span><span class="err">search</span><span class="w"> </span><span class="err">combi</span><span class="kc">n</span><span class="err">i</span><span class="kc">n</span><span class="err">g</span><span class="w"> </span><span class="err">vec</span><span class="kc">t</span><span class="err">or</span><span class="w"> </span><span class="err">similari</span><span class="kc">t</span><span class="err">y</span><span class="w"> </span><span class="err">score</span><span class="w"> </span><span class="err">a</span><span class="kc">n</span><span class="err">d</span><span class="w"> </span><span class="err">BM</span><span class="mi">25</span><span class="w"> </span><span class="kc">te</span><span class="err">x</span><span class="kc">t</span><span class="w"> </span><span class="err">score</span><span class="w"> </span><span class="err">i</span><span class="kc">nt</span><span class="err">o</span><span class="w"> </span><span class="err">a</span><span class="w"> </span><span class="err">combi</span><span class="kc">ne</span><span class="err">d</span><span class="w"> </span><span class="err">score.</span>
+
+<span class="err">####</span><span class="w"> </span><span class="err">Reques</span><span class="kc">t</span><span class="w"> </span><span class="err">Parame</span><span class="kc">ters</span>
+
+<span class="err">|</span><span class="w"> </span><span class="err">Field</span><span class="w"> </span><span class="err">|</span><span class="w"> </span><span class="err">Type</span><span class="w"> </span><span class="err">|</span><span class="w"> </span><span class="err">Required</span><span class="w"> </span><span class="err">|</span><span class="w"> </span><span class="err">De</span><span class="kc">fault</span><span class="w"> </span><span class="err">|</span><span class="w"> </span><span class="err">Descrip</span><span class="kc">t</span><span class="err">io</span><span class="kc">n</span><span class="w"> </span><span class="err">|</span>
+<span class="err">|</span><span class="mi">-------</span><span class="err">|</span><span class="mi">------</span><span class="err">|</span><span class="mi">----------</span><span class="err">|</span><span class="mi">---------</span><span class="err">|</span><span class="mi">-------------</span><span class="err">|</span>
+<span class="err">|</span><span class="w"> </span><span class="err">`query`</span><span class="w"> </span><span class="err">|</span><span class="w"> </span><span class="err">s</span><span class="kc">tr</span><span class="err">i</span><span class="kc">n</span><span class="err">g</span><span class="w"> </span><span class="err">|</span><span class="w"> </span><span class="err">Yes</span><span class="w"> </span><span class="err">|</span><span class="w"> </span><span class="err">—</span><span class="w"> </span><span class="err">|</span><span class="w"> </span><span class="err">Search</span><span class="w"> </span><span class="kc">te</span><span class="err">x</span><span class="kc">t</span><span class="w"> </span><span class="err">|</span>
+<span class="err">|</span><span class="w"> </span><span class="err">`</span><span class="kc">f</span><span class="err">ile_uuid`</span><span class="w"> </span><span class="err">|</span><span class="w"> </span><span class="err">s</span><span class="kc">tr</span><span class="err">i</span><span class="kc">n</span><span class="err">g</span><span class="w"> </span><span class="err">|</span><span class="w"> </span><span class="err">No</span><span class="w"> </span><span class="err">|</span><span class="w"> </span><span class="err">—</span><span class="w"> </span><span class="err">|</span><span class="w"> </span><span class="err">Res</span><span class="kc">tr</span><span class="err">ic</span><span class="kc">t</span><span class="w"> </span><span class="err">search</span><span class="w"> </span><span class="kc">t</span><span class="err">o</span><span class="w"> </span><span class="err">a</span><span class="w"> </span><span class="err">speci</span><span class="kc">f</span><span class="err">ic</span><span class="w"> </span><span class="kc">f</span><span class="err">ile</span><span class="w"> </span><span class="err">|</span>
+<span class="err">|</span><span class="w"> </span><span class="err">`limi</span><span class="kc">t</span><span class="err">`</span><span class="w"> </span><span class="err">|</span><span class="w"> </span><span class="err">i</span><span class="kc">nte</span><span class="err">ger</span><span class="w"> </span><span class="err">|</span><span class="w"> </span><span class="err">No</span><span class="w"> </span><span class="err">|</span><span class="w"> </span><span class="mi">10</span><span class="w"> </span><span class="err">|</span><span class="w"> </span><span class="err">Max</span><span class="w"> </span><span class="err">resul</span><span class="kc">ts</span><span class="w"> </span><span class="err">|</span>
+<span class="err">|</span><span class="w"> </span><span class="err">`page`</span><span class="w"> </span><span class="err">|</span><span class="w"> </span><span class="err">i</span><span class="kc">nte</span><span class="err">ger</span><span class="w"> </span><span class="err">|</span><span class="w"> </span><span class="err">No</span><span class="w"> </span><span class="err">|</span><span class="w"> </span><span class="mi">1</span><span class="w"> </span><span class="err">|</span><span class="w"> </span><span class="err">Page</span><span class="w"> </span><span class="kc">nu</span><span class="err">mber</span><span class="w"> </span><span class="err">(</span><span class="mi">1-</span><span class="err">based)</span><span class="w"> </span><span class="err">|</span>
+<span class="err">|</span><span class="w"> </span><span class="err">`page_size`</span><span class="w"> </span><span class="err">|</span><span class="w"> </span><span class="err">i</span><span class="kc">nte</span><span class="err">ger</span><span class="w"> </span><span class="err">|</span><span class="w"> </span><span class="err">No</span><span class="w"> </span><span class="err">|</span><span class="w"> </span><span class="err">`limi</span><span class="kc">t</span><span class="err">`</span><span class="w"> </span><span class="err">|</span><span class="w"> </span><span class="err">I</span><span class="kc">te</span><span class="err">ms</span><span class="w"> </span><span class="err">per</span><span class="w"> </span><span class="err">page</span><span class="w"> </span><span class="err">|</span>
+<span class="err">|</span><span class="w"> </span><span class="err">`vec</span><span class="kc">t</span><span class="err">or_weigh</span><span class="kc">t</span><span class="err">`</span><span class="w"> </span><span class="err">|</span><span class="w"> </span><span class="kc">fl</span><span class="err">oa</span><span class="kc">t</span><span class="w"> </span><span class="err">|</span><span class="w"> </span><span class="err">No</span><span class="w"> </span><span class="err">|</span><span class="w"> </span><span class="mf">0.5</span><span class="w"> </span><span class="err">|</span><span class="w"> </span><span class="err">Weigh</span><span class="kc">t</span><span class="w"> </span><span class="kc">f</span><span class="err">or</span><span class="w"> </span><span class="err">vec</span><span class="kc">t</span><span class="err">or</span><span class="w"> </span><span class="err">score</span><span class="w"> </span><span class="err">(</span><span class="mf">0.0</span><span class="err">–</span><span class="mf">1.0</span><span class="err">)</span><span class="w"> </span><span class="err">|</span>
+<span class="err">|</span><span class="w"> </span><span class="err">`bm</span><span class="mi">25</span><span class="err">_weigh</span><span class="kc">t</span><span class="err">`</span><span class="w"> </span><span class="err">|</span><span class="w"> </span><span class="kc">fl</span><span class="err">oa</span><span class="kc">t</span><span class="w"> </span><span class="err">|</span><span class="w"> </span><span class="err">No</span><span class="w"> </span><span class="err">|</span><span class="w"> </span><span class="mf">0.5</span><span class="w"> </span><span class="err">|</span><span class="w"> </span><span class="err">Weigh</span><span class="kc">t</span><span class="w"> </span><span class="kc">f</span><span class="err">or</span><span class="w"> </span><span class="err">BM</span><span class="mi">25</span><span class="w"> </span><span class="err">score</span><span class="w"> </span><span class="err">(</span><span class="mf">0.0</span><span class="err">–</span><span class="mf">1.0</span><span class="err">)</span><span class="w"> </span><span class="err">|</span>
+
+<span class="err">####</span><span class="w"> </span><span class="err">Respo</span><span class="kc">nse</span>
+
+<span class="err">```jso</span><span class="kc">n</span>
+<span class="p">{</span>
+<span class="w">  </span><span class="nt">&quot;results&quot;</span><span class="p">:</span><span class="w"> </span><span class="p">[</span>
+<span class="w">    </span><span class="p">{</span>
+<span class="w">      </span><span class="nt">&quot;uuid&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;3a6c1865...&quot;</span><span class="p">,</span>
+<span class="w">      </span><span class="nt">&quot;chunk_id&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;sentence_0012&quot;</span><span class="p">,</span>
+<span class="w">      </span><span class="nt">&quot;chunk_type&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;sentence&quot;</span><span class="p">,</span>
+<span class="w">      </span><span class="nt">&quot;start_time&quot;</span><span class="p">:</span><span class="w"> </span><span class="mf">48.8</span><span class="p">,</span>
+<span class="w">      </span><span class="nt">&quot;end_time&quot;</span><span class="p">:</span><span class="w"> </span><span class="mf">55.4</span><span class="p">,</span>
+<span class="w">      </span><span class="nt">&quot;text&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;charade is a classic film...&quot;</span><span class="p">,</span>
+<span class="w">      </span><span class="nt">&quot;vector_score&quot;</span><span class="p">:</span><span class="w"> </span><span class="mf">0.85</span><span class="p">,</span>
+<span class="w">      </span><span class="nt">&quot;bm25_score&quot;</span><span class="p">:</span><span class="w"> </span><span class="mf">0.72</span><span class="p">,</span>
+<span class="w">      </span><span class="nt">&quot;combined_score&quot;</span><span class="p">:</span><span class="w"> </span><span class="mf">0.79</span>
+<span class="w">    </span><span class="p">}</span>
+<span class="w">  </span><span class="p">],</span>
+<span class="w">  </span><span class="nt">&quot;query&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;charade&quot;</span>
+<span class="p">}</span>
+</code></pre></div>
+
+<table class="table">
+<thead>
+<tr>
+<th>Field</th>
+<th>Type</th>
+<th>Description</th>
+</tr>
+</thead>
+<tbody>
+<tr>
+<td><code>results[].vector_score</code></td>
+<td>float</td>
+<td>Vector similarity score</td>
+</tr>
+<tr>
+<td><code>results[].bm25_score</code></td>
+<td>float</td>
+<td>BM25 text score</td>
+</tr>
+<tr>
+<td><code>results[].combined_score</code></td>
+<td>float</td>
+<td>Weighted combination of both scores</td>
+</tr>
+</tbody>
+</table>
+<hr />
+<h3><code>POST /api/v1/search/bm25</code></h3>
+<p><strong>Auth</strong>: Required
+<strong>Scope</strong>: file-level</p>
+<p>BM25 full-text keyword search. Good for exact term matching. Returns results with BM25 score only.</p>
+<h4>Request Parameters</h4>
+<p>Same as standard search: <code>query</code>, <code>file_uuid</code>, <code>limit</code>.</p>
+<h4>Response</h4>
+<p>Returns the same structure as standard search, with <code>score</code> representing the BM25 relevance score.</p>
+<hr />
+<h3>N8N Search</h3>
+<p>N8N-format search endpoints. Response format is optimized for n8n workflow consumption.</p>
+<table class="table">
+<thead>
+<tr>
+<th>Method</th>
+<th>Endpoint</th>
+<th>Description</th>
+</tr>
+</thead>
+<tbody>
+<tr>
+<td>POST</td>
+<td><code>/api/v1/n8n/search</code></td>
+<td>N8N-format vector search</td>
+</tr>
+<tr>
+<td>POST</td>
+<td><code>/api/v1/n8n/search/bm25</code></td>
+<td>N8N-format BM25 search</td>
+</tr>
+<tr>
+<td>POST</td>
+<td><code>/api/v1/n8n/search/hybrid</code></td>
+<td>N8N-format hybrid search</td>
+</tr>
+<tr>
+<td>POST</td>
+<td><code>/api/v1/n8n/search/smart</code></td>
+<td>N8N-format smart search</td>
+</tr>
+</tbody>
+</table>
+<h4>Request Parameters</h4>
+<table class="table">
+<thead>
+<tr>
+<th>Field</th>
+<th>Type</th>
+<th>Required</th>
+<th>Default</th>
+<th>Description</th>
+</tr>
+</thead>
+<tbody>
+<tr>
+<td><code>query</code></td>
+<td>string</td>
+<td>Yes</td>
+<td>—</td>
+<td>Search text</td>
+</tr>
+<tr>
+<td><code>file_uuid</code></td>
+<td>string</td>
+<td>No</td>
+<td>—</td>
+<td>Restrict to specific file</td>
+</tr>
+<tr>
+<td><code>types</code></td>
+<td>string[]</td>
+<td>No</td>
+<td><code>["chunk"]</code></td>
+<td>Search types: <code>chunk</code>, <code>frame</code>, <code>person</code></td>
+</tr>
+<tr>
+<td><code>filters</code></td>
+<td>object</td>
+<td>No</td>
+<td>—</td>
+<td>Filter criteria (confidence, object class, speaker, etc.)</td>
+</tr>
+<tr>
+<td><code>page</code></td>
+<td>integer</td>
+<td>No</td>
+<td>1</td>
+<td>Page number</td>
+</tr>
+<tr>
+<td><code>page_size</code></td>
+<td>integer</td>
+<td>No</td>
+<td>20</td>
+<td>Items per page</td>
+</tr>
+<tr>
+<td><code>time_range</code></td>
+<td>float[2]</td>
+<td>No</td>
+<td>—</td>
+<td>Time range <code>[start, end]</code> in seconds</td>
+</tr>
+</tbody>
+</table>
+<h4>Example</h4>
+<div class="codehilite"><pre><span></span><code>curl<span class="w"> </span>-s<span class="w"> </span>-X<span class="w"> </span>POST<span class="w"> </span><span class="s2">&quot;</span><span class="nv">$API</span><span class="s2">/api/v1/n8n/search&quot;</span><span class="w"> </span><span class="se">\</span>
+<span class="w">  </span>-H<span class="w"> </span><span class="s2">&quot;Content-Type: application/json&quot;</span><span class="w"> </span><span class="se">\</span>
+<span class="w">  </span>-H<span class="w"> </span><span class="s2">&quot;X-API-Key: </span><span class="nv">$KEY</span><span class="s2">&quot;</span><span class="w"> </span><span class="se">\</span>
+<span class="w">  </span>-d<span class="w"> </span><span class="s1">&#39;{&quot;query&quot;: &quot;charade&quot;, &quot;limit&quot;: 5}&#39;</span>
+</code></pre></div>
+
+<h4>Response (200)</h4>
+<div class="codehilite"><pre><span></span><code><span class="p">{</span>
+<span class="w">  </span><span class="nt">&quot;query&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;charade&quot;</span><span class="p">,</span>
+<span class="w">  </span><span class="nt">&quot;results&quot;</span><span class="p">:</span><span class="w"> </span><span class="p">[</span>
+<span class="w">    </span><span class="p">{</span>
+<span class="w">      </span><span class="nt">&quot;type&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;chunk&quot;</span><span class="p">,</span>
+<span class="w">      </span><span class="nt">&quot;chunk_id&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;sentence_0012&quot;</span><span class="p">,</span>
+<span class="w">      </span><span class="nt">&quot;chunk_type&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;sentence&quot;</span><span class="p">,</span>
+<span class="w">      </span><span class="nt">&quot;file_uuid&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;3a6c1865...&quot;</span><span class="p">,</span>
+<span class="w">      </span><span class="nt">&quot;start_time&quot;</span><span class="p">:</span><span class="w"> </span><span class="mf">48.8</span><span class="p">,</span>
+<span class="w">      </span><span class="nt">&quot;end_time&quot;</span><span class="p">:</span><span class="w"> </span><span class="mf">55.4</span><span class="p">,</span>
+<span class="w">      </span><span class="nt">&quot;text&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;charade is a classic film...&quot;</span><span class="p">,</span>
+<span class="w">      </span><span class="nt">&quot;score&quot;</span><span class="p">:</span><span class="w"> </span><span class="mf">0.92</span>
+<span class="w">    </span><span class="p">}</span>
+<span class="w">  </span><span class="p">],</span>
+<span class="w">  </span><span class="nt">&quot;total&quot;</span><span class="p">:</span><span class="w"> </span><span class="mi">15</span><span class="p">,</span>
+<span class="w">  </span><span class="nt">&quot;page&quot;</span><span class="p">:</span><span class="w"> </span><span class="mi">1</span><span class="p">,</span>
+<span class="w">  </span><span class="nt">&quot;page_size&quot;</span><span class="p">:</span><span class="w"> </span><span class="mi">20</span><span class="p">,</span>
+<span class="w">  </span><span class="nt">&quot;took_ms&quot;</span><span class="p">:</span><span class="w"> </span><span class="mi">42</span>
+<span class="p">}</span>
+</code></pre></div>
+
+<table class="table">
+<thead>
+<tr>
+<th>Field</th>
+<th>Type</th>
+<th>Description</th>
+</tr>
+</thead>
+<tbody>
+<tr>
+<td><code>results</code></td>
+<td>array</td>
+<td>Array of search results</td>
+</tr>
+<tr>
+<td><code>results[].type</code></td>
+<td>string</td>
+<td>Result type: <code>"chunk"</code>, <code>"frame"</code>, or <code>"person"</code></td>
+</tr>
+<tr>
+<td><code>results[].chunk_id</code></td>
+<td>string</td>
+<td>Chunk identifier</td>
+</tr>
+<tr>
+<td><code>results[].chunk_type</code></td>
+<td>string</td>
+<td>Chunk type</td>
+</tr>
+<tr>
+<td><code>results[].file_uuid</code></td>
+<td>string</td>
+<td>File UUID</td>
+</tr>
+<tr>
+<td><code>results[].start_time</code></td>
+<td>float</td>
+<td>Start time in seconds</td>
+</tr>
+<tr>
+<td><code>results[].end_time</code></td>
+<td>float</td>
+<td>End time in seconds</td>
+</tr>
+<tr>
+<td><code>results[].text</code></td>
+<td>string</td>
+<td>Content text</td>
+</tr>
+<tr>
+<td><code>results[].score</code></td>
+<td>float</td>
+<td>Relevance score</td>
+</tr>
+<tr>
+<td><code>total</code></td>
+<td>integer</td>
+<td>Total matching results</td>
+</tr>
+<tr>
+<td><code>page</code></td>
+<td>integer</td>
+<td>Current page</td>
+</tr>
+<tr>
+<td><code>page_size</code></td>
+<td>integer</td>
+<td>Items per page</td>
+</tr>
+<tr>
+<td><code>took_ms</code></td>
+<td>integer</td>
+<td>Query execution time in milliseconds</td>
+</tr>
+</tbody>
+</table>
+<hr />
+<h3>Identity Text Search</h3>
+<p>Two paths for searching identities by text.</p>
+<h4>Path A: <code>GET /api/v1/search/identity_text</code></h4>
+<p>Search chunk text content and return associated identities (if any).</p>
+<p><strong>Auth</strong>: Required
+<strong>Scope</strong>: file-level</p>
+<table class="table">
+<thead>
+<tr>
+<th>Field</th>
+<th>Type</th>
+<th>Required</th>
+<th>Description</th>
+</tr>
+</thead>
+<tbody>
+<tr>
+<td><code>file_uuid</code></td>
+<td>string</td>
+<td>Yes</td>
+<td>File UUID to search within</td>
+</tr>
+<tr>
+<td><code>q</code></td>
+<td>string</td>
+<td>Yes</td>
+<td>Text search query</td>
+</tr>
+<tr>
+<td><code>limit</code></td>
+<td>integer</td>
+<td>No</td>
+<td>Max results (default 50)</td>
+</tr>
+<tr>
+<td><code>page</code></td>
+<td>integer</td>
+<td>No</td>
+<td>Page number (default 1)</td>
+</tr>
+<tr>
+<td><code>page_size</code></td>
+<td>integer</td>
+<td>No</td>
+<td>Items per page (default: <code>limit</code>)</td>
+</tr>
+</tbody>
+</table>
+<div class="codehilite"><pre><span></span><code>curl<span class="w"> </span>-s<span class="w"> </span><span class="s2">&quot;</span><span class="nv">$API</span><span class="s2">/api/v1/search/identity_text?file_uuid=</span><span class="nv">$FILE_UUID</span><span class="s2">&amp;q=charade&amp;page=1&amp;page_size=5&quot;</span><span class="w"> </span><span class="se">\</span>
+<span class="w">  </span>-H<span class="w"> </span><span class="s2">&quot;X-API-Key: </span><span class="nv">$KEY</span><span class="s2">&quot;</span>
+</code></pre></div>
+
+<h5>Response</h5>
+<div class="codehilite"><pre><span></span><code><span class="p">{</span>
+<span class="w">  </span><span class="nt">&quot;success&quot;</span><span class="p">:</span><span class="w"> </span><span class="kc">true</span><span class="p">,</span>
+<span class="w">  </span><span class="nt">&quot;total&quot;</span><span class="p">:</span><span class="w"> </span><span class="mi">0</span><span class="p">,</span>
+<span class="w">  </span><span class="nt">&quot;page&quot;</span><span class="p">:</span><span class="w"> </span><span class="mi">1</span><span class="p">,</span>
+<span class="w">  </span><span class="nt">&quot;page_size&quot;</span><span class="p">:</span><span class="w"> </span><span class="mi">5</span><span class="p">,</span>
+<span class="w">  </span><span class="nt">&quot;limit&quot;</span><span class="p">:</span><span class="w"> </span><span class="mi">50</span><span class="p">,</span>
+<span class="w">  </span><span class="nt">&quot;results&quot;</span><span class="p">:</span><span class="w"> </span><span class="p">[]</span>
+<span class="p">}</span>
+</code></pre></div>
+
+<p>Each result (IdentityTextHit):</p>
+<div class="codehilite"><pre><span></span><code><span class="p">{</span>
+<span class="w">  </span><span class="nt">&quot;file_uuid&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;3a6c1865...&quot;</span><span class="p">,</span>
+<span class="w">  </span><span class="nt">&quot;chunk_id&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;sentence_0012&quot;</span><span class="p">,</span>
+<span class="w">  </span><span class="nt">&quot;start_time&quot;</span><span class="p">:</span><span class="w"> </span><span class="mf">48.8</span><span class="p">,</span>
+<span class="w">  </span><span class="nt">&quot;end_time&quot;</span><span class="p">:</span><span class="w"> </span><span class="mf">55.4</span><span class="p">,</span>
+<span class="w">  </span><span class="nt">&quot;text_content&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;charade is a classic film...&quot;</span><span class="p">,</span>
+<span class="w">  </span><span class="nt">&quot;identity_id&quot;</span><span class="p">:</span><span class="w"> </span><span class="mi">42</span><span class="p">,</span>
+<span class="w">  </span><span class="nt">&quot;identity_name&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;Cary Grant&quot;</span><span class="p">,</span>
+<span class="w">  </span><span class="nt">&quot;identity_source&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;tmdb&quot;</span><span class="p">,</span>
+<span class="w">  </span><span class="nt">&quot;trace_id&quot;</span><span class="p">:</span><span class="w"> </span><span class="mi">10</span>
+<span class="p">}</span>
+</code></pre></div>
+
+<table class="table">
+<thead>
+<tr>
+<th>Field</th>
+<th>Type</th>
+<th>Description</th>
+</tr>
+</thead>
+<tbody>
+<tr>
+<td><code>file_uuid</code></td>
+<td>string</td>
+<td>File UUID</td>
+</tr>
+<tr>
+<td><code>chunk_id</code></td>
+<td>string</td>
+<td>Chunk identifier</td>
+</tr>
+<tr>
+<td><code>start_time</code></td>
+<td>float</td>
+<td>Start time in seconds</td>
+</tr>
+<tr>
+<td><code>end_time</code></td>
+<td>float</td>
+<td>End time in seconds</td>
+</tr>
+<tr>
+<td><code>text_content</code></td>
+<td>string</td>
+<td>Chunk text content</td>
+</tr>
+<tr>
+<td><code>identity_id</code></td>
+<td>integer</td>
+<td>Identity ID (null if no identity matched)</td>
+</tr>
+<tr>
+<td><code>identity_name</code></td>
+<td>string</td>
+<td>Identity name (null if no identity matched)</td>
+</tr>
+<tr>
+<td><code>identity_source</code></td>
+<td>string</td>
+<td>Identity origin. <code>.json</code> = established from <code>identity.json</code> files on disk (the unified format for all sources). <code>tmdb</code> = derived from <code>.json</code> via the TMDb enrichment probe, then matched against faces. <code>auto</code> = result of pipeline face matching (only stranger identities are auto-created). <code>user_defined</code> = created manually. <code>merged</code> = produced by merging identities.</td>
+</tr>
+<tr>
+<td><code>trace_id</code></td>
+<td>integer</td>
+<td>Face trace ID (null if no trace matched)</td>
+</tr>
+</tbody>
+</table>
+<h4>Path B: <code>POST /api/v1/identities/search</code></h4>
+<p>Search identity names and return associated face detection text.</p>
+<p><strong>Auth</strong>: Required
+<strong>Scope</strong>: identity-level</p>
+<table class="table">
+<thead>
+<tr>
+<th>Field</th>
+<th>Type</th>
+<th>Required</th>
+<th>Description</th>
+</tr>
+</thead>
+<tbody>
+<tr>
+<td><code>q</code></td>
+<td>string</td>
+<td>Yes</td>
+<td>Identity name search</td>
+</tr>
+<tr>
+<td><code>file_uuid</code></td>
+<td>string</td>
+<td>No</td>
+<td>Restrict to specific file</td>
+</tr>
+<tr>
+<td><code>limit</code></td>
+<td>integer</td>
+<td>No</td>
+<td>Max results (default 50)</td>
+</tr>
+</tbody>
+</table>
+<div class="codehilite"><pre><span></span><code>curl<span class="w"> </span>-s<span class="w"> </span>-X<span class="w"> </span>POST<span class="w"> </span><span class="s2">&quot;</span><span class="nv">$API</span><span class="s2">/api/v1/identities/search&quot;</span><span class="w"> </span><span class="se">\</span>
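+<span class="w">  </span>-H<span class="w"> </span><span class="s2">&quot;X-API-Key: </span><span class="nv">$KEY</span><span class="s2">&quot;</span><span class="w"> </span>-H<span class="w"> </span><span class="s2">&quot;Content-Type: application/json&quot;</span><span class="w"> </span><span class="se">\</span>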
+<span class="w">  </span>-d<span class="w"> </span><span class="s1">&#39;{&quot;q&quot;: &quot;Cary Grant&quot;}&#39;</span>
+</code></pre></div>
+
+<hr />
+<h3>Visual Chunk Search</h3>
+<p>Search video frames by visual content (object detection results).</p>
+<table class="table">
+<thead>
+<tr>
+<th>Method</th>
+<th>Endpoint</th>
+<th>Description</th>
+</tr>
+</thead>
+<tbody>
+<tr>
+<td>POST</td>
+<td><code>/api/v1/search/visual</code></td>
+<td>Search visual chunks by criteria (object classes, density)</td>
+</tr>
+<tr>
+<td>POST</td>
+<td><code>/api/v1/search/visual/class</code></td>
+<td>Search by specific object class</td>
+</tr>
+<tr>
+<td>POST</td>
+<td><code>/api/v1/search/visual/density</code></td>
+<td>Search by spatial density range</td>
+</tr>
+<tr>
+<td>POST</td>
+<td><code>/api/v1/search/visual/stats</code></td>
+<td>Get visual detection statistics</td>
+</tr>
+<tr>
+<td>POST</td>
+<td><code>/api/v1/search/visual/combination</code></td>
+<td>Search by object class combination</td>
+</tr>
+</tbody>
+</table>
+<h4>Request Parameters (Visual Search)</h4>
+<table class="table">
+<thead>
+<tr>
+<th>Field</th>
+<th>Type</th>
+<th>Required</th>
+<th>Description</th>
+</tr>
+</thead>
+<tbody>
+<tr>
+<td><code>file_uuid</code></td>
+<td>string</td>
+<td>Yes</td>
+<td>File UUID</td>
+</tr>
+<tr>
+<td><code>criteria.required_classes</code></td>
+<td>string[]</td>
+<td>No</td>
+<td>Required object classes (e.g., <code>["person", "car"]</code>)</td>
+</tr>
+<tr>
+<td><code>criteria.min_confidence</code></td>
+<td>float</td>
+<td>No</td>
+<td>Minimum confidence threshold</td>
+</tr>
+<tr>
+<td><code>criteria.min_spatial_density</code></td>
+<td>float</td>
+<td>No</td>
+<td>Minimum spatial density</td>
+</tr>
+<tr>
+<td><code>criteria.max_spatial_density</code></td>
+<td>float</td>
+<td>No</td>
+<td>Maximum spatial density</td>
+</tr>
+</tbody>
+</table>
+<h4>Example</h4>
+<div class="codehilite"><pre><span></span><code>curl<span class="w"> </span>-s<span class="w"> </span>-X<span class="w"> </span>POST<span class="w"> </span><span class="s2">&quot;</span><span class="nv">$API</span><span class="s2">/api/v1/search/visual&quot;</span><span class="w"> </span><span class="se">\</span>
+<span class="w">  </span>-H<span class="w"> </span><span class="s2">&quot;X-API-Key: </span><span class="nv">$KEY</span><span class="s2">&quot;</span><span class="w"> </span><span class="se">\</span>
+<span class="w">  </span>-H<span class="w"> </span><span class="s2">&quot;Content-Type: application/json&quot;</span><span class="w"> </span><span class="se">\</span>
+<span class="w">  </span>-d<span class="w"> </span><span class="s1">&#39;{&quot;file_uuid&quot;: &quot;&#39;</span><span class="s2">&quot;</span><span class="nv">$FILE_UUID</span><span class="s2">&quot;</span><span class="s1">&#39;&quot;, &quot;criteria&quot;: {&quot;required_classes&quot;: [&quot;person&quot;, &quot;car&quot;]}}&#39;</span>
+</code></pre></div>
+
+<h4>Response</h4>
+<div class="codehilite"><pre><span></span><code><span class="p">{</span>
+<span class="w">  </span><span class="nt">&quot;chunks&quot;</span><span class="p">:</span><span class="w"> </span><span class="p">[</span>
+<span class="w">    </span><span class="p">{</span>
+<span class="w">      </span><span class="nt">&quot;file_uuid&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;3a6c1865...&quot;</span><span class="p">,</span>
+<span class="w">      </span><span class="nt">&quot;chunk_id&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;visual_001&quot;</span><span class="p">,</span>
+<span class="w">      </span><span class="nt">&quot;chunk_type&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;visual&quot;</span><span class="p">,</span>
+<span class="w">      </span><span class="nt">&quot;detections&quot;</span><span class="p">:</span><span class="w"> </span><span class="p">[</span>
+<span class="w">        </span><span class="p">{</span><span class="nt">&quot;class&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;person&quot;</span><span class="p">,</span><span class="w"> </span><span class="nt">&quot;confidence&quot;</span><span class="p">:</span><span class="w"> </span><span class="mf">0.95</span><span class="p">,</span><span class="w"> </span><span class="nt">&quot;bbox&quot;</span><span class="p">:</span><span class="w"> </span><span class="p">[</span><span class="mi">100</span><span class="p">,</span><span class="w"> </span><span class="mi">200</span><span class="p">,</span><span class="w"> </span><span class="mi">150</span><span class="p">,</span><span class="w"> </span><span class="mi">350</span><span class="p">]}</span>
+<span class="w">      </span><span class="p">],</span>
+<span class="w">      </span><span class="nt">&quot;start_time&quot;</span><span class="p">:</span><span class="w"> </span><span class="mf">120.5</span><span class="p">,</span>
+<span class="w">      </span><span class="nt">&quot;end_time&quot;</span><span class="p">:</span><span class="w"> </span><span class="mf">125.3</span>
+<span class="w">    </span><span class="p">}</span>
+<span class="w">  </span><span class="p">],</span>
+<span class="w">  </span><span class="nt">&quot;total&quot;</span><span class="p">:</span><span class="w"> </span><span class="mi">42</span>
+<span class="p">}</span>
+</code></pre></div>
+
+<table class="table">
+<thead>
+<tr>
+<th>Field</th>
+<th>Type</th>
+<th>Description</th>
+</tr>
+</thead>
+<tbody>
+<tr>
+<td><code>chunks</code></td>
+<td>array</td>
+<td>Array of matching visual chunks</td>
+</tr>
+<tr>
+<td><code>chunks[].file_uuid</code></td>
+<td>string</td>
+<td>File UUID</td>
+</tr>
+<tr>
+<td><code>chunks[].chunk_id</code></td>
+<td>string</td>
+<td>Chunk identifier</td>
+</tr>
+<tr>
+<td><code>chunks[].detections</code></td>
+<td>array</td>
+<td>Object detections in this chunk</td>
+</tr>
+<tr>
+<td><code>total</code></td>
+<td>integer</td>
+<td>Total matching chunks</td>
+</tr>
+</tbody>
+</table>
+<hr />
+<h2>Global Identities</h2>
+<h3><code>GET /api/v1/identities</code></h3>
+<p><strong>Auth</strong>: Required
+<strong>Scope</strong>: identity-level</p>
+<p>List all registered identities with pagination.</p>
+<h4>Example</h4>
+<div class="codehilite"><pre><span></span><code>curl<span class="w"> </span>-s<span class="w"> </span><span class="s2">&quot;</span><span class="nv">$API</span><span class="s2">/api/v1/identities?page=1&amp;page_size=20&quot;</span><span class="w"> </span>-H<span class="w"> </span><span class="s2">&quot;X-API-Key: </span><span class="nv">$KEY</span><span class="s2">&quot;</span><span class="w"> </span><span class="p">|</span><span class="w"> </span>jq<span class="w"> </span><span class="s1">&#39;{count, identities: [.identities[] | {name}]}&#39;</span>
+</code></pre></div>
+
+<hr />
+<h3><code>GET /api/v1/identity/:identity_uuid</code></h3>
+<p><strong>Auth</strong>: Required
+<strong>Scope</strong>: identity-level</p>
+<p>Get detailed information for a specific identity, including metadata and TMDb references.</p>
+<h4>Example</h4>
+<div class="codehilite"><pre><span></span><code>curl<span class="w"> </span>-s<span class="w"> </span><span class="s2">&quot;</span><span class="nv">$API</span><span class="s2">/api/v1/identity/</span><span class="nv">$IDENTITY_UUID</span><span class="s2">&quot;</span><span class="w"> </span>-H<span class="w"> </span><span class="s2">&quot;X-API-Key: </span><span class="nv">$KEY</span><span class="s2">&quot;</span>
+</code></pre></div>
+
+<h4>Response (200)</h4>
+<div class="codehilite"><pre><span></span><code><span class="p">{</span>
+<span class="w">  </span><span class="nt">&quot;success&quot;</span><span class="p">:</span><span class="w"> </span><span class="kc">true</span><span class="p">,</span>
+<span class="w">  </span><span class="nt">&quot;uuid&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;a9a901056d6b46ff92da0c3c1a57dff4&quot;</span><span class="p">,</span>
+<span class="w">  </span><span class="nt">&quot;name&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;Cary Grant&quot;</span><span class="p">,</span>
+<span class="w">  </span><span class="nt">&quot;identity_type&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;people&quot;</span><span class="p">,</span>
+<span class="w">  </span><span class="nt">&quot;source&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;tmdb&quot;</span><span class="p">,</span>
+<span class="w">  </span><span class="nt">&quot;status&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;confirmed&quot;</span><span class="p">,</span>
+<span class="w">  </span><span class="nt">&quot;tmdb_id&quot;</span><span class="p">:</span><span class="w"> </span><span class="mi">112</span><span class="p">,</span>
+<span class="w">  </span><span class="nt">&quot;tmdb_profile&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;https://image.tmdb.org/t/p/w185/abc.jpg&quot;</span><span class="p">,</span>
+<span class="w">  </span><span class="nt">&quot;metadata&quot;</span><span class="p">:</span><span class="w"> </span><span class="p">{},</span>
+<span class="w">  </span><span class="nt">&quot;reference_data&quot;</span><span class="p">:</span><span class="w"> </span><span class="p">{},</span>
+<span class="w">  </span><span class="nt">&quot;created_at&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;2026-05-16T12:00:00Z&quot;</span><span class="p">,</span>
+<span class="w">  </span><span class="nt">&quot;updated_at&quot;</span><span class="p">:</span><span class="w"> </span><span class="kc">null</span>
+<span class="p">}</span>
+</code></pre></div>
+
+<table class="table">
+<thead>
+<tr>
+<th>Field</th>
+<th>Type</th>
+<th>Description</th>
+</tr>
+</thead>
+<tbody>
+<tr>
+<td><code>uuid</code></td>
+<td>string</td>
+<td>32-char hex identity UUID</td>
+</tr>
+<tr>
+<td><code>name</code></td>
+<td>string</td>
+<td>Identity name</td>
+</tr>
+<tr>
+<td><code>identity_type</code></td>
+<td>string</td>
+<td><code>"people"</code> or null</td>
+</tr>
+<tr>
+<td><code>source</code></td>
+<td>string</td>
+<td><code>.json</code>, <code>auto</code>, <code>tmdb</code>, <code>user_defined</code>, or <code>merged</code></td>
+</tr>
+<tr>
+<td><code>status</code></td>
+<td>string</td>
+<td><code>"confirmed"</code>, <code>"pending"</code>, or <code>"inactive"</code></td>
+</tr>
+<tr>
+<td><code>tmdb_id</code></td>
+<td>integer</td>
+<td>TMDb person ID (only if source = tmdb)</td>
+</tr>
+<tr>
+<td><code>tmdb_profile</code></td>
+<td>string</td>
+<td>TMDb profile image URL</td>
+</tr>
+<tr>
+<td><code>metadata</code></td>
+<td>object</td>
+<td>Metadata JSON (tmdb_character, cast_order, etc.)</td>
+</tr>
+<tr>
+<td><code>created_at</code></td>
+<td>string</td>
+<td>Creation timestamp</td>
+</tr>
+</tbody>
+</table>
+<hr />
+<h3><code>DELETE /api/v1/identity/:identity_uuid</code></h3>
+<p><strong>Auth</strong>: Required
+<strong>Scope</strong>: identity-level</p>
+<p>Delete an identity permanently.</p>
+<hr />
+<h3><code>GET /api/v1/identity/:identity_uuid/files</code></h3>
+<p><strong>Auth</strong>: Required
+<strong>Scope</strong>: identity-level</p>
+<p>Get all files where this identity appears. Returns a per-file summary including face count, confidence, and appearance time range.</p>
+<h4>Example</h4>
+<div class="codehilite"><pre><span></span><code>curl<span class="w"> </span>-s<span class="w"> </span><span class="s2">&quot;</span><span class="nv">$API</span><span class="s2">/api/v1/identity/</span><span class="nv">$IDENTITY_UUID</span><span class="s2">/files&quot;</span><span class="w"> </span>-H<span class="w"> </span><span class="s2">&quot;X-API-Key: </span><span class="nv">$KEY</span><span class="s2">&quot;</span>
+</code></pre></div>
+
+<hr />
+<h3><code>GET /api/v1/identity/:identity_uuid/faces</code></h3>
+<p><strong>Auth</strong>: Required
+<strong>Scope</strong>: identity-level</p>
+<p>Get all face detection records associated with this identity.</p>
+<h4>Example</h4>
+<div class="codehilite"><pre><span></span><code>curl<span class="w"> </span>-s<span class="w"> </span><span class="s2">&quot;</span><span class="nv">$API</span><span class="s2">/api/v1/identity/</span><span class="nv">$IDENTITY_UUID</span><span class="s2">/faces&quot;</span><span class="w"> </span>-H<span class="w"> </span><span class="s2">&quot;X-API-Key: </span><span class="nv">$KEY</span><span class="s2">&quot;</span>
+</code></pre></div>
+
+<table class="table">
+<thead>
+<tr>
+<th>Field</th>
+<th>Type</th>
+<th>Description</th>
+</tr>
+</thead>
+<tbody>
+<tr>
+<td><code>file_uuid</code></td>
+<td>string</td>
+<td>File UUID where face was detected</td>
+</tr>
+<tr>
+<td><code>frame_number</code></td>
+<td>integer</td>
+<td>Frame number of detection</td>
+</tr>
+<tr>
+<td><code>face_id</code></td>
+<td>string</td>
+<td>Face ID (format: <code>face_{frame_number}</code>)</td>
+</tr>
+<tr>
+<td><code>confidence</code></td>
+<td>float</td>
+<td>Detection confidence</td>
+</tr>
+</tbody>
+</table>
+<hr />
+<h3><code>GET /api/v1/identity/:identity_uuid/chunks</code></h3>
+<p><strong>Auth</strong>: Required
+<strong>Scope</strong>: identity-level</p>
+<p>Get all text chunks (sentences) spoken while this identity's face was on screen. Useful for finding what a person likely said, although chunks are matched by on-screen presence rather than by who was speaking.</p>
+<h4>Example</h4>
+<div class="codehilite"><pre><span></span><code>curl<span class="w"> </span>-s<span class="w"> </span><span class="s2">&quot;</span><span class="nv">$API</span><span class="s2">/api/v1/identity/</span><span class="nv">$IDENTITY_UUID</span><span class="s2">/chunks&quot;</span><span class="w"> </span>-H<span class="w"> </span><span class="s2">&quot;X-API-Key: </span><span class="nv">$KEY</span><span class="s2">&quot;</span>
+</code></pre></div>
+
+<table class="table">
+<thead>
+<tr>
+<th>Field</th>
+<th>Type</th>
+<th>Description</th>
+</tr>
+</thead>
+<tbody>
+<tr>
+<td><code>file_uuid</code></td>
+<td>string</td>
+<td>File UUID</td>
+</tr>
+<tr>
+<td><code>chunk_id</code></td>
+<td>string</td>
+<td>Sentence chunk identifier</td>
+</tr>
+<tr>
+<td><code>start_time</code></td>
+<td>float</td>
+<td>Start time in seconds</td>
+</tr>
+<tr>
+<td><code>end_time</code></td>
+<td>float</td>
+<td>End time in seconds</td>
+</tr>
+<tr>
+<td><code>text</code></td>
+<td>string</td>
+<td>Spoken text content</td>
+</tr>
+</tbody>
+</table>
+<hr />
+<h3><code>POST /api/v1/identity/:identity_uuid/bind</code></h3>
+<p><strong>Auth</strong>: Required
+<strong>Scope</strong>: identity-level</p>
+<p>Bind a face detection to an identity. Associates the face trace with the identity for future search and recognition.</p>
+<h4>Request Parameters</h4>
+<table class="table">
+<thead>
+<tr>
+<th>Field</th>
+<th>Type</th>
+<th>Required</th>
+<th>Description</th>
+</tr>
+</thead>
+<tbody>
+<tr>
+<td><code>file_uuid</code></td>
+<td>string</td>
+<td>Yes</td>
+<td>File UUID where face is detected</td>
+</tr>
+<tr>
+<td><code>face_id</code></td>
+<td>string</td>
+<td>Yes</td>
+<td>Face ID (format: <code>{frame}_{idx}</code>)</td>
+</tr>
+</tbody>
+</table>
+<h4>Example</h4>
+<div class="codehilite"><pre><span></span><code>curl<span class="w"> </span>-s<span class="w"> </span>-X<span class="w"> </span>POST<span class="w"> </span><span class="s2">&quot;</span><span class="nv">$API</span><span class="s2">/api/v1/identity/</span><span class="nv">$IDENTITY_UUID</span><span class="s2">/bind&quot;</span><span class="w"> </span><span class="se">\</span>
+<span class="w">  </span>-H<span class="w"> </span><span class="s2">&quot;X-API-Key: </span><span class="nv">$KEY</span><span class="s2">&quot;</span><span class="w"> </span><span class="se">\</span>
+<span class="w">  </span>-H<span class="w"> </span><span class="s2">&quot;Content-Type: application/json&quot;</span><span class="w"> </span><span class="se">\</span>
+<span class="w">  </span>-d<span class="w"> </span><span class="s1">&#39;{&quot;file_uuid&quot;: &quot;&#39;</span><span class="s2">&quot;</span><span class="nv">$FILE_UUID</span><span class="s2">&quot;</span><span class="s1">&#39;&quot;, &quot;face_id&quot;: &quot;1_5&quot;}&#39;</span>
+</code></pre></div>
+
+<hr />
+<h3><code>POST /api/v1/identity/:identity_uuid/unbind</code></h3>
+<p><strong>Auth</strong>: Required
+<strong>Scope</strong>: identity-level</p>
+<p>Unbind a face detection from an identity. Removes the identity association from the face record.</p>
+<hr />
+<h3><code>GET /api/v1/identities/search</code></h3>
+<p><strong>Auth</strong>: Required
+<strong>Scope</strong>: identity-level</p>
+<p>Search identities by name using a case-insensitive match (SQL <code>ILIKE</code>) against the <code>q</code> query parameter. Returns matching identity records.</p>
+<h4>Example</h4>
+<div class="codehilite"><pre><span></span><code>curl<span class="w"> </span>-s<span class="w"> </span><span class="s2">&quot;</span><span class="nv">$API</span><span class="s2">/api/v1/identities/search?q=Cary&quot;</span><span class="w"> </span>-H<span class="w"> </span><span class="s2">&quot;X-API-Key: </span><span class="nv">$KEY</span><span class="s2">&quot;</span>
+</code></pre></div>
+
+<table class="table">
+<thead>
+<tr>
+<th>Field</th>
+<th>Type</th>
+<th>Description</th>
+</tr>
+</thead>
+<tbody>
+<tr>
+<td><code>name</code></td>
+<td>string</td>
+<td>Identity name</td>
+</tr>
+<tr>
+<td><code>source</code></td>
+<td>string</td>
+<td>Identity source</td>
+</tr>
+<tr>
+<td><code>tmdb_id</code></td>
+<td>integer</td>
+<td>TMDb ID (if source = tmdb)</td>
+</tr>
+<tr>
+<td><code>file_uuid</code></td>
+<td>string</td>
+<td>Associated file UUID</td>
+</tr>
+</tbody>
+</table>
+<hr />
+<hr />
+<h3><code>POST /api/v1/identity/upload</code></h3>
+<p><strong>Auth</strong>: Required
+<strong>Scope</strong>: identity-level</p>
+<p>Upload an identity.json file to create or update an identity. Accepts the same format as the identity.json files stored on disk.</p>
+<p>If an identity with the same <code>name</code> already exists, it will be updated with the new values.</p>
+<h4>Request</h4>
+<p>The request body is an <code>IdentityFile</code> object:</p>
+<table class="table">
+<thead>
+<tr>
+<th>Field</th>
+<th>Type</th>
+<th>Required</th>
+<th>Description</th>
+</tr>
+</thead>
+<tbody>
+<tr>
+<td><code>identity_uuid</code></td>
+<td>string</td>
+<td>Yes</td>
+<td>32-char hex UUID (hyphens allowed, will be stripped)</td>
+</tr>
+<tr>
+<td><code>name</code></td>
+<td>string</td>
+<td>Yes</td>
+<td>Identity display name</td>
+</tr>
+<tr>
+<td><code>identity_type</code></td>
+<td>string</td>
+<td>No</td>
+<td><code>"people"</code> or null</td>
+</tr>
+<tr>
+<td><code>source</code></td>
+<td>string</td>
+<td>No</td>
+<td><code>.json</code>, <code>auto</code>, <code>tmdb</code>, <code>user_defined</code>, or <code>merged</code></td>
+</tr>
+<tr>
+<td><code>status</code></td>
+<td>string</td>
+<td>No</td>
+<td><code>"confirmed"</code>, <code>"pending"</code>, or <code>"inactive"</code></td>
+</tr>
+<tr>
+<td><code>tmdb_id</code></td>
+<td>integer</td>
+<td>No</td>
+<td>TMDb person ID</td>
+</tr>
+<tr>
+<td><code>tmdb_profile</code></td>
+<td>string</td>
+<td>No</td>
+<td>TMDb profile image URL</td>
+</tr>
+<tr>
+<td><code>metadata</code></td>
+<td>object</td>
+<td>No</td>
+<td>Arbitrary metadata JSON</td>
+</tr>
+<tr>
+<td><code>file_bindings</code></td>
+<td>array</td>
+<td>No</td>
+<td>Array of <code>{ file_uuid, trace_ids, face_count }</code> (informational)</td>
+</tr>
+</tbody>
+</table>
+<h4>Example</h4>
+<div class="codehilite"><pre><span></span><code>curl<span class="w"> </span>-s<span class="w"> </span>-X<span class="w"> </span>POST<span class="w"> </span><span class="s2">&quot;</span><span class="nv">$API</span><span class="s2">/api/v1/identity/upload&quot;</span><span class="w"> </span><span class="se">\</span>
+<span class="w">  </span>-H<span class="w"> </span><span class="s2">&quot;X-API-Key: </span><span class="nv">$KEY</span><span class="s2">&quot;</span><span class="w"> </span><span class="se">\</span>
+<span class="w">  </span>-H<span class="w"> </span><span class="s2">&quot;Content-Type: application/json&quot;</span><span class="w"> </span><span class="se">\</span>
+<span class="w">  </span>-d<span class="w"> </span><span class="s1">&#39;{</span>
+<span class="s1">    &quot;version&quot;: 1,</span>
+<span class="s1">    &quot;identity_uuid&quot;: &quot;a9a901056d6b46ff92da0c3c1a57dff4&quot;,</span>
+<span class="s1">    &quot;name&quot;: &quot;Cary Grant&quot;,</span>
+<span class="s1">    &quot;identity_type&quot;: &quot;people&quot;,</span>
+<span class="s1">    &quot;source&quot;: &quot;.json&quot;,</span>
+<span class="s1">    &quot;status&quot;: &quot;confirmed&quot;,</span>
+<span class="s1">    &quot;metadata&quot;: {},</span>
+<span class="s1">    &quot;file_bindings&quot;: []</span>
+<span class="s1">  }&#39;</span>
+</code></pre></div>
+
+<h4>Response (200)</h4>
+<div class="codehilite"><pre><span></span><code><span class="p">{</span>
+<span class="w">  </span><span class="nt">&quot;success&quot;</span><span class="p">:</span><span class="w"> </span><span class="kc">true</span><span class="p">,</span>
+<span class="w">  </span><span class="nt">&quot;identity_uuid&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;a9a901056d6b46ff92da0c3c1a57dff4&quot;</span><span class="p">,</span>
+<span class="w">  </span><span class="nt">&quot;name&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;Cary Grant&quot;</span><span class="p">,</span>
+<span class="w">  </span><span class="nt">&quot;message&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;Identity uploaded successfully&quot;</span>
+<span class="p">}</span>
+</code></pre></div>
+
+<hr />
+<hr />
+<h3><code>POST /api/v1/identity/:identity_uuid/profile-image</code></h3>
+<p><strong>Auth</strong>: Required
+<strong>Scope</strong>: identity-level</p>
+<p>Upload a profile image (JPEG or PNG) for an identity. The image is saved to <code>{output}/identities/{uuid}/profile.{ext}</code>.</p>
+<p>Uses <code>multipart/form-data</code> with field name <code>image</code>.</p>
+<h4>Example</h4>
+<div class="codehilite"><pre><span></span><code>curl<span class="w"> </span>-s<span class="w"> </span>-X<span class="w"> </span>POST<span class="w"> </span><span class="s2">&quot;</span><span class="nv">$API</span><span class="s2">/api/v1/identity/</span><span class="nv">$IDENTITY_UUID</span><span class="s2">/profile-image&quot;</span><span class="w"> </span><span class="se">\</span>
+<span class="w">  </span>-H<span class="w"> </span><span class="s2">&quot;X-API-Key: </span><span class="nv">$KEY</span><span class="s2">&quot;</span><span class="w"> </span><span class="se">\</span>
+<span class="w">  </span>-F<span class="w"> </span><span class="s2">&quot;image=@/path/to/photo.jpg&quot;</span>
+</code></pre></div>
+
+<h4>Response (200)</h4>
+<div class="codehilite"><pre><span></span><code><span class="p">{</span>
+<span class="w">  </span><span class="nt">&quot;success&quot;</span><span class="p">:</span><span class="w"> </span><span class="kc">true</span><span class="p">,</span>
+<span class="w">  </span><span class="nt">&quot;identity_uuid&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;a9a901056d6b46ff92da0c3c1a57dff4&quot;</span><span class="p">,</span>
+<span class="w">  </span><span class="nt">&quot;path&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;/path/to/output/identities/.../profile.jpg&quot;</span><span class="p">,</span>
+<span class="w">  </span><span class="nt">&quot;message&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;Profile image saved: profile.jpg&quot;</span>
+<span class="p">}</span>
+</code></pre></div>
+
+<h4>Error Responses</h4>
+<table class="table">
+<thead>
+<tr>
+<th>HTTP</th>
+<th>When</th>
+</tr>
+</thead>
+<tbody>
+<tr>
+<td><code>400</code></td>
+<td>Missing image field or unsupported format</td>
+</tr>
+<tr>
+<td><code>404</code></td>
+<td>Identity not found</td>
+</tr>
+<tr>
+<td><code>415</code></td>
+<td>Unsupported image type (use JPEG or PNG)</td>
+</tr>
+</tbody>
+</table>
+<hr />
+<h3><code>GET /api/v1/identity/:identity_uuid/profile-image</code></h3>
+<p><strong>Auth</strong>: Required
+<strong>Scope</strong>: identity-level</p>
+<p>Retrieve the profile image for an identity. Returns the raw image data with the appropriate <code>Content-Type</code> header.</p>
+<div class="codehilite"><pre><span></span><code>curl<span class="w"> </span>-s<span class="w"> </span><span class="s2">&quot;</span><span class="nv">$API</span><span class="s2">/api/v1/identity/</span><span class="nv">$IDENTITY_UUID</span><span class="s2">/profile-image&quot;</span><span class="w"> </span><span class="se">\</span>
+<span class="w">  </span>-H<span class="w"> </span><span class="s2">&quot;X-API-Key: </span><span class="nv">$KEY</span><span class="s2">&quot;</span><span class="w"> </span>-o<span class="w"> </span>profile.jpg
+</code></pre></div>
+
+<table class="table">
+<thead>
+<tr>
+<th>Response Header</th>
+<th>Value</th>
+</tr>
+</thead>
+<tbody>
+<tr>
+<td><code>content-type</code></td>
+<td><code>image/jpeg</code> or <code>image/png</code></td>
+</tr>
+</tbody>
+</table>
+<hr />
+<h3><code>GET /api/v1/signals/unbound</code></h3>
+<p><strong>Auth</strong>: Required
+<strong>Scope</strong>: identity-level</p>
+<p>List unbound face signals — face detections that have not yet been assigned to any identity.</p>
+<h4>Example</h4>
+<div class="codehilite"><pre><span></span><code>curl<span class="w"> </span>-s<span class="w"> </span><span class="s2">&quot;</span><span class="nv">$API</span><span class="s2">/api/v1/signals/unbound&quot;</span><span class="w"> </span>-H<span class="w"> </span><span class="s2">&quot;X-API-Key: </span><span class="nv">$KEY</span><span class="s2">&quot;</span>
+</code></pre></div>
+
+<hr />
+<h2>Identity Agent</h2>
+<h3><code>POST /api/v1/agents/identity/analyze</code></h3>
+<p><strong>Auth</strong>: Required
+<strong>Scope</strong>: file-level</p>
+<p>Run identity matching on a processed file: matches face detection traces against known identities (TMDb, .json, auto) and creates bindings. Optionally uses an LLM for enhanced analysis.</p>
+<blockquote>
+<p>The file's face processor must have completed before this endpoint is called; it returns an error if face traces are not available.</p>
+</blockquote>
+<h4>Request Parameters</h4>
+<table class="table">
+<thead>
+<tr>
+<th>Field</th>
+<th>Type</th>
+<th>Required</th>
+<th>Default</th>
+<th>Description</th>
+</tr>
+</thead>
+<tbody>
+<tr>
+<td><code>file_uuid</code></td>
+<td>string</td>
+<td>Yes</td>
+<td>—</td>
+<td>File UUID to analyze</td>
+</tr>
+<tr>
+<td><code>use_llm</code></td>
+<td>boolean</td>
+<td>No</td>
+<td><code>false</code></td>
+<td>Enable LLM-assisted identity analysis</td>
+</tr>
+<tr>
+<td><code>model</code></td>
+<td>string</td>
+<td>No</td>
+<td>—</td>
+<td>LLM model name (e.g., <code>"gemma4"</code>)</td>
+</tr>
+<tr>
+<td><code>auto_merge_threshold</code></td>
+<td>float</td>
+<td>No</td>
+<td>—</td>
+<td>Confidence threshold (0.0–1.0) for auto-merging</td>
+</tr>
+</tbody>
+</table>
+<h4>Example</h4>
+<div class="codehilite"><pre><span></span><code><span class="c1"># Basic analysis</span>
+curl<span class="w"> </span>-s<span class="w"> </span>-X<span class="w"> </span>POST<span class="w"> </span><span class="s2">&quot;</span><span class="nv">$API</span><span class="s2">/api/v1/agents/identity/analyze&quot;</span><span class="w"> </span><span class="se">\</span>
+<span class="w">  </span>-H<span class="w"> </span><span class="s2">&quot;Content-Type: application/json&quot;</span><span class="w"> </span><span class="se">\</span>
+<span class="w">  </span>-H<span class="w"> </span><span class="s2">&quot;X-API-Key: </span><span class="nv">$KEY</span><span class="s2">&quot;</span><span class="w"> </span><span class="se">\</span>
+<span class="w">  </span>-d<span class="w"> </span><span class="s1">&#39;{&quot;file_uuid&quot;: &quot;&#39;</span><span class="s2">&quot;</span><span class="nv">$FILE_UUID</span><span class="s2">&quot;</span><span class="s1">&#39;&quot;}&#39;</span>
+
+<span class="c1"># With LLM enhancement</span>
+curl<span class="w"> </span>-s<span class="w"> </span>-X<span class="w"> </span>POST<span class="w"> </span><span class="s2">&quot;</span><span class="nv">$API</span><span class="s2">/api/v1/agents/identity/analyze&quot;</span><span class="w"> </span><span class="se">\</span>
+<span class="w">  </span>-H<span class="w"> </span><span class="s2">&quot;Content-Type: application/json&quot;</span><span class="w"> </span><span class="se">\</span>
+<span class="w">  </span>-H<span class="w"> </span><span class="s2">&quot;X-API-Key: </span><span class="nv">$KEY</span><span class="s2">&quot;</span><span class="w"> </span><span class="se">\</span>
+<span class="w">  </span>-d<span class="w"> </span><span class="s1">&#39;{&quot;file_uuid&quot;: &quot;&#39;</span><span class="s2">&quot;</span><span class="nv">$FILE_UUID</span><span class="s2">&quot;</span><span class="s1">&#39;&quot;, &quot;use_llm&quot;: true, &quot;model&quot;: &quot;gemma4&quot;}&#39;</span>
+</code></pre></div>
+
+<h4>Response (200)</h4>
+<div class="codehilite"><pre><span></span><code><span class="p">{</span>
+<span class="w">  </span><span class="nt">&quot;success&quot;</span><span class="p">:</span><span class="w"> </span><span class="kc">true</span><span class="p">,</span>
+<span class="w">  </span><span class="nt">&quot;file_uuid&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;3a6c1865...&quot;</span><span class="p">,</span>
+<span class="w">  </span><span class="nt">&quot;identities&quot;</span><span class="p">:</span><span class="w"> </span><span class="p">[</span>
+<span class="w">    </span><span class="p">{</span>
+<span class="w">      </span><span class="nt">&quot;identity_id&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;a9a901056d6b46ff92da0c3c1a57dff4&quot;</span><span class="p">,</span>
+<span class="w">      </span><span class="nt">&quot;person_ids&quot;</span><span class="p">:</span><span class="w"> </span><span class="p">[</span><span class="s2">&quot;trace_10&quot;</span><span class="p">,</span><span class="w"> </span><span class="s2">&quot;trace_23&quot;</span><span class="p">],</span>
+<span class="w">      </span><span class="nt">&quot;confidence&quot;</span><span class="p">:</span><span class="w"> </span><span class="mf">0.87</span><span class="p">,</span>
+<span class="w">      </span><span class="nt">&quot;matched&quot;</span><span class="p">:</span><span class="w"> </span><span class="kc">true</span><span class="p">,</span>
+<span class="w">      </span><span class="nt">&quot;name&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;Cary Grant&quot;</span><span class="p">,</span>
+<span class="w">      </span><span class="nt">&quot;source&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;tmdb&quot;</span><span class="p">,</span>
+<span class="w">      </span><span class="nt">&quot;stranger&quot;</span><span class="p">:</span><span class="w"> </span><span class="kc">false</span>
+<span class="w">    </span><span class="p">}</span>
+<span class="w">  </span><span class="p">],</span>
+<span class="w">  </span><span class="nt">&quot;processing_status&quot;</span><span class="p">:</span><span class="w"> </span><span class="p">{</span>
+<span class="w">    </span><span class="nt">&quot;phase&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;COMPLETED&quot;</span><span class="p">,</span>
+<span class="w">    </span><span class="nt">&quot;progress&quot;</span><span class="p">:</span><span class="w"> </span><span class="mi">100</span>
+<span class="w">  </span><span class="p">}</span>
+<span class="p">}</span>
+</code></pre></div>
+
+<table class="table">
+<thead>
+<tr>
+<th>Field</th>
+<th>Type</th>
+<th>Description</th>
+</tr>
+</thead>
+<tbody>
+<tr>
+<td><code>success</code></td>
+<td>boolean</td>
+<td>Always true on 200</td>
+</tr>
+<tr>
+<td><code>file_uuid</code></td>
+<td>string</td>
+<td>Analyzed file UUID</td>
+</tr>
+<tr>
+<td><code>identities</code></td>
+<td>array</td>
+<td>Array of matched identity results</td>
+</tr>
+<tr>
+<td><code>identities[].identity_id</code></td>
+<td>string</td>
+<td>32-char identity UUID</td>
+</tr>
+<tr>
+<td><code>identities[].person_ids</code></td>
+<td>string[]</td>
+<td>Matched trace/person IDs</td>
+</tr>
+<tr>
+<td><code>identities[].confidence</code></td>
+<td>float</td>
+<td>Matching confidence (0.0–1.0)</td>
+</tr>
+<tr>
+<td><code>identities[].matched</code></td>
+<td>boolean</td>
+<td>Whether this identity was matched to a known entity</td>
+</tr>
+<tr>
+<td><code>identities[].name</code></td>
+<td>string</td>
+<td>Identity display name</td>
+</tr>
+<tr>
+<td><code>identities[].source</code></td>
+<td>string</td>
+<td>Identity source (<code>.json</code>, <code>auto</code>, <code>tmdb</code>, etc.)</td>
+</tr>
+<tr>
+<td><code>identities[].stranger</code></td>
+<td>boolean</td>
+<td>Whether this is an unmatched stranger trace</td>
+</tr>
+<tr>
+<td><code>processing_status</code></td>
+<td>object</td>
+<td>Identity agent processing progress</td>
+</tr>
+</tbody>
+</table>
+<h4>Error Responses</h4>
+<table class="table">
+<thead>
+<tr>
+<th>HTTP</th>
+<th>When</th>
+</tr>
+</thead>
+<tbody>
+<tr>
+<td><code>400</code></td>
+<td>File UUID not provided or invalid</td>
+</tr>
+<tr>
+<td><code>404</code></td>
+<td>File not found or face processor not completed</td>
+</tr>
+<tr>
+<td><code>500</code></td>
+<td>Analysis failed (LLM error, DB error)</td>
+</tr>
+</tbody>
+</table>
+<hr />
+<h3><code>POST /api/v1/agents/identity/suggest</code></h3>
+<p><strong>Auth</strong>: Required
+<strong>Scope</strong>: identity-level</p>
+<p>Suggest identity merges based on face embedding similarity analysis. Returns pairs of identities that are similar enough to potentially be the same person.</p>
+<h4>Request Parameters</h4>
+<table class="table">
+<thead>
+<tr>
+<th>Field</th>
+<th>Type</th>
+<th>Required</th>
+<th>Default</th>
+<th>Description</th>
+</tr>
+</thead>
+<tbody>
+<tr>
+<td><code>file_uuid</code></td>
+<td>string</td>
+<td>Yes</td>
+<td>—</td>
+<td>File UUID to analyze for merge suggestions</td>
+</tr>
+<tr>
+<td><code>auto_merge_threshold</code></td>
+<td>float</td>
+<td>No</td>
+<td>—</td>
+<td>Confidence threshold for auto-suggest</td>
+</tr>
+</tbody>
+</table>
+<div class="codehilite"><pre><span></span><code>curl<span class="w"> </span>-s<span class="w"> </span>-X<span class="w"> </span>POST<span class="w"> </span><span class="s2">&quot;</span><span class="nv">$API</span><span class="s2">/api/v1/agents/identity/suggest&quot;</span><span class="w"> </span><span class="se">\</span>
+<span class="w">  </span>-H<span class="w"> </span><span class="s2">&quot;X-API-Key: </span><span class="nv">$KEY</span><span class="s2">&quot;</span><span class="w"> </span><span class="se">\</span>
+<span class="w">  </span>-H<span class="w"> </span><span class="s2">&quot;Content-Type: application/json&quot;</span><span class="w"> </span><span class="se">\</span>
+<span class="w">  </span>-d<span class="w"> </span><span class="s1">&#39;{&quot;file_uuid&quot;: &quot;&#39;</span><span class="s2">&quot;</span><span class="nv">$FILE_UUID</span><span class="s2">&quot;</span><span class="s1">&#39;&quot;}&#39;</span>
+</code></pre></div>
+
+<hr />
+<h3><code>GET /api/v1/agents/identity/status</code></h3>
+<p><strong>Auth</strong>: Required
+<strong>Scope</strong>: system-level</p>
+<p>Get the identity agent's processing status for the file given by the <code>file_uuid</code> query parameter. The response shows the current phase and progress.</p>
+<div class="codehilite"><pre><span></span><code>curl<span class="w"> </span>-s<span class="w"> </span><span class="s2">&quot;</span><span class="nv">$API</span><span class="s2">/api/v1/agents/identity/status?file_uuid=</span><span class="nv">$FILE_UUID</span><span class="s2">&quot;</span><span class="w"> </span><span class="se">\</span>
+<span class="w">  </span>-H<span class="w"> </span><span class="s2">&quot;X-API-Key: </span><span class="nv">$KEY</span><span class="s2">&quot;</span>
+</code></pre></div>
+
+<hr />
+<h3><code>POST /api/v1/agents/suggest/merge</code></h3>
+<p><strong>Auth</strong>: Required
+<strong>Scope</strong>: identity-level</p>
+<p>Execute a suggested identity merge. Combines two identities into one, consolidating their face bindings.</p>
+<h4>Request Parameters</h4>
+<table class="table">
+<thead>
+<tr>
+<th>Field</th>
+<th>Type</th>
+<th>Required</th>
+<th>Description</th>
+</tr>
+</thead>
+<tbody>
+<tr>
+<td><code>source_uuid</code></td>
+<td>string</td>
+<td>Yes</td>
+<td>Identity UUID to merge FROM (will be removed)</td>
+</tr>
+<tr>
+<td><code>target_uuid</code></td>
+<td>string</td>
+<td>Yes</td>
+<td>Identity UUID to merge INTO (will be kept)</td>
+</tr>
+</tbody>
+</table>
+<div class="codehilite"><pre><span></span><code>curl<span class="w"> </span>-s<span class="w"> </span>-X<span class="w"> </span>POST<span class="w"> </span><span class="s2">&quot;</span><span class="nv">$API</span><span class="s2">/api/v1/agents/suggest/merge&quot;</span><span class="w"> </span><span class="se">\</span>
+<span class="w">  </span>-H<span class="w"> </span><span class="s2">&quot;X-API-Key: </span><span class="nv">$KEY</span><span class="s2">&quot;</span><span class="w"> </span><span class="se">\</span>
+<span class="w">  </span>-H<span class="w"> </span><span class="s2">&quot;Content-Type: application/json&quot;</span><span class="w"> </span><span class="se">\</span>
+<span class="w">  </span>-d<span class="w"> </span><span class="s1">&#39;{&quot;source_uuid&quot;: &quot;uuid_to_discard&quot;, &quot;target_uuid&quot;: &quot;uuid_to_keep&quot;}&#39;</span>
+</code></pre></div>
+
+<hr />
+<h3><code>POST /api/v1/agents/suggest/clustering</code></h3>
+<p><strong>Auth</strong>: Required
+<strong>Scope</strong>: identity-level</p>
+<p>Suggest candidate face clusters for a file. Analyzes all face embeddings in the file and groups similar faces into candidate identity clusters.</p>
+<div class="codehilite"><pre><span></span><code>curl<span class="w"> </span>-s<span class="w"> </span>-X<span class="w"> </span>POST<span class="w"> </span><span class="s2">&quot;</span><span class="nv">$API</span><span class="s2">/api/v1/agents/suggest/clustering&quot;</span><span class="w"> </span><span class="se">\</span>
+<span class="w">  </span>-H<span class="w"> </span><span class="s2">&quot;X-API-Key: </span><span class="nv">$KEY</span><span class="s2">&quot;</span><span class="w"> </span><span class="se">\</span>
+<span class="w">  </span>-H<span class="w"> </span><span class="s2">&quot;Content-Type: application/json&quot;</span><span class="w"> </span><span class="se">\</span>
+<span class="w">  </span>-d<span class="w"> </span><span class="s1">&#39;{&quot;file_uuid&quot;: &quot;&#39;</span><span class="s2">&quot;</span><span class="nv">$FILE_UUID</span><span class="s2">&quot;</span><span class="s1">&#39;&quot;}&#39;</span>
+</code></pre></div>
+
+<hr />
+<h2>TMDb Enrichment</h2>
+<blockquote>
+<p>⚠️ <strong>External resource</strong>: TMDb requires internet access, which is an exception to Momentry's local-only principle.
+All core processing (ASR, YOLO, Face, OCR, Pose, embeddings) runs fully offline.
+TMDb enrichment is <strong>optional</strong> and gated behind <code>TMDB_API_KEY</code> + <code>MOMENTRY_TMDB_PROBE_ENABLED</code>.</p>
+</blockquote>
+<h3>Overview</h3>
+<p>TMDb enrichment is an optional identity enrichment step that can be run after Pipeline face detection completes. The workflow is:</p>
+<ol>
+<li><strong>Prefetch</strong> (requires internet): Download movie cast data from TMDb API → cache to <code>{file_uuid}.tmdb.json</code></li>
+<li><strong>Probe</strong>: Read local cache → create identities for <strong>all</strong> cast members (<code>source='tmdb'</code>) + save <code>identity.json</code> + download profile image to <code>{OUTPUT}/identities/{uuid}/profile.jpg</code></li>
+<li><strong>Match</strong>: The worker automatically matches video faces against TMDb identities when <code>MOMENTRY_TMDB_PROBE_ENABLED=true</code></li>
+</ol>
+<h3><code>POST /api/v1/agents/tmdb/prefetch</code></h3>
+<p><strong>Auth</strong>: Required
+<strong>Scope</strong>: file-level</p>
+<p>Fetch TMDb cast data for a registered file and cache it locally. This is the only step requiring internet access.</p>
+<h4>Request Parameters</h4>
+<table class="table">
+<thead>
+<tr>
+<th>Field</th>
+<th>Type</th>
+<th>Required</th>
+<th>Description</th>
+</tr>
+</thead>
+<tbody>
+<tr>
+<td><code>file_uuid</code></td>
+<td>string</td>
+<td>Yes</td>
+<td>File UUID to enrich</td>
+</tr>
+</tbody>
+</table>
+<h4>Example</h4>
+<div class="codehilite"><pre><span></span><code>curl<span class="w"> </span>-s<span class="w"> </span>-X<span class="w"> </span>POST<span class="w"> </span><span class="s2">&quot;</span><span class="nv">$API</span><span class="s2">/api/v1/agents/tmdb/prefetch&quot;</span><span class="w"> </span><span class="se">\</span>
+<span class="w">  </span>-H<span class="w"> </span><span class="s2">&quot;Content-Type: application/json&quot;</span><span class="w"> </span><span class="se">\</span>
+<span class="w">  </span>-H<span class="w"> </span><span class="s2">&quot;X-API-Key: </span><span class="nv">$KEY</span><span class="s2">&quot;</span><span class="w"> </span><span class="se">\</span>
+<span class="w">  </span>-d<span class="w"> </span><span class="s1">&#39;{&quot;file_uuid&quot;: &quot;&#39;</span><span class="s2">&quot;</span><span class="nv">$FILE_UUID</span><span class="s2">&quot;</span><span class="s1">&#39;&quot;}&#39;</span>
+</code></pre></div>
+
+<h4>Response (200)</h4>
+<div class="codehilite"><pre><span></span><code><span class="p">{</span><span class="nt">&quot;success&quot;</span><span class="p">:</span><span class="w"> </span><span class="kc">true</span><span class="p">,</span><span class="w"> </span><span class="nt">&quot;file_uuid&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;...&quot;</span><span class="p">,</span><span class="w"> </span><span class="nt">&quot;cache_path&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;/output/...tmdb.json&quot;</span><span class="p">}</span>
+</code></pre></div>
+
+<h3><code>POST /api/v1/file/:file_uuid/tmdb-probe</code></h3>
+<p><strong>Auth</strong>: Required
+<strong>Scope</strong>: file-level</p>
+<p>Read local TMDb cache and create/update identities. Requires prefetch to have been run first.</p>
+<h4>Example</h4>
+<div class="codehilite"><pre><span></span><code>curl<span class="w"> </span>-s<span class="w"> </span>-X<span class="w"> </span>POST<span class="w"> </span><span class="s2">&quot;</span><span class="nv">$API</span><span class="s2">/api/v1/file/</span><span class="nv">$FILE_UUID</span><span class="s2">/tmdb-probe&quot;</span><span class="w"> </span><span class="se">\</span>
+<span class="w">  </span>-H<span class="w"> </span><span class="s2">&quot;X-API-Key: </span><span class="nv">$KEY</span><span class="s2">&quot;</span><span class="w"> </span><span class="p">|</span><span class="w"> </span>jq<span class="w"> </span><span class="s1">&#39;{identities_created, movie_title}&#39;</span>
+</code></pre></div>
+
+<h4>Response (200 — identities created)</h4>
+<div class="codehilite"><pre><span></span><code><span class="p">{</span><span class="nt">&quot;success&quot;</span><span class="p">:</span><span class="w"> </span><span class="kc">true</span><span class="p">,</span><span class="w"> </span><span class="nt">&quot;identities_created&quot;</span><span class="p">:</span><span class="w"> </span><span class="mi">15</span><span class="p">,</span><span class="w"> </span><span class="nt">&quot;movie_title&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;Charade&quot;</span><span class="p">}</span>
+</code></pre></div>
+
+<h4>Response (200 — no cache)</h4>
+<div class="codehilite"><pre><span></span><code><span class="p">{</span><span class="nt">&quot;success&quot;</span><span class="p">:</span><span class="w"> </span><span class="kc">false</span><span class="p">,</span><span class="w"> </span><span class="nt">&quot;message&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;No TMDb cache found. Run tmdb-prefetch first.&quot;</span><span class="p">}</span>
+</code></pre></div>
+
+<h3><code>GET /api/v1/resource/tmdb</code></h3>
+<p><strong>Auth</strong>: Required
+<strong>Scope</strong>: system-level</p>
+<p>View TMDb resource status including configuration, identity counts, and cache file count.</p>
+<h4>Example</h4>
+<div class="codehilite"><pre><span></span><code>curl<span class="w"> </span>-s<span class="w"> </span><span class="s2">&quot;</span><span class="nv">$API</span><span class="s2">/api/v1/resource/tmdb&quot;</span><span class="w"> </span>-H<span class="w"> </span><span class="s2">&quot;X-API-Key: </span><span class="nv">$KEY</span><span class="s2">&quot;</span><span class="w"> </span><span class="se">\</span>
+<span class="w">  </span><span class="p">|</span><span class="w"> </span>jq<span class="w"> </span><span class="s1">&#39;{identities_seeded, cache_files}&#39;</span>
+</code></pre></div>
+
+<h3><code>POST /api/v1/resource/tmdb/check</code></h3>
+<p><strong>Auth</strong>: Required
+<strong>Scope</strong>: system-level</p>
+<p>Ping the TMDb API to verify connectivity and measure latency.</p>
+<h4>Example</h4>
+<div class="codehilite"><pre><span></span><code>curl<span class="w"> </span>-s<span class="w"> </span>-X<span class="w"> </span>POST<span class="w"> </span><span class="s2">&quot;</span><span class="nv">$API</span><span class="s2">/api/v1/resource/tmdb/check&quot;</span><span class="w"> </span><span class="se">\</span>
+<span class="w">  </span>-H<span class="w"> </span><span class="s2">&quot;X-API-Key: </span><span class="nv">$KEY</span><span class="s2">&quot;</span><span class="w"> </span><span class="p">|</span><span class="w"> </span>jq<span class="w"> </span><span class="s1">&#39;{api_reachable, api_latency_ms}&#39;</span>
+</code></pre></div>
+
+<h4>Response</h4>
+<div class="codehilite"><pre><span></span><code><span class="p">{</span>
+<span class="w">  </span><span class="nt">&quot;api_key_configured&quot;</span><span class="p">:</span><span class="w"> </span><span class="kc">true</span><span class="p">,</span>
+<span class="w">  </span><span class="nt">&quot;enabled&quot;</span><span class="p">:</span><span class="w"> </span><span class="kc">false</span><span class="p">,</span>
+<span class="w">  </span><span class="nt">&quot;api_reachable&quot;</span><span class="p">:</span><span class="w"> </span><span class="kc">true</span><span class="p">,</span>
+<span class="w">  </span><span class="nt">&quot;api_latency_ms&quot;</span><span class="p">:</span><span class="w"> </span><span class="mi">120</span>
+<span class="p">}</span>
+</code></pre></div>
+
+<hr />
+<h2>Stats &amp; Pipeline</h2>
+<h3>Stats Endpoints</h3>
+<table class="table">
+<thead>
+<tr>
+<th>Method</th>
+<th>Endpoint</th>
+<th>Auth</th>
+<th>Description</th>
+</tr>
+</thead>
+<tbody>
+<tr>
+<td>GET</td>
+<td><code>/api/v1/stats/ingest</code></td>
+<td>No</td>
+<td>Ingest statistics</td>
+</tr>
+<tr>
+<td>GET</td>
+<td><code>/api/v1/stats/sftpgo</code></td>
+<td>No</td>
+<td>SFTPGo service status</td>
+</tr>
+<tr>
+<td>GET</td>
+<td><code>/api/v1/stats/inference</code></td>
+<td>No</td>
+<td>Inference service health</td>
+</tr>
+</tbody>
+</table>
+<h3>Configuration</h3>
+<h3><code>POST /api/v1/config/cache</code></h3>
+<p><strong>Auth</strong>: Required
+<strong>Scope</strong>: system-level</p>
+<p>Toggle the Redis cache on or off.</p>
+<h4>Request Parameters</h4>
+<table class="table">
+<thead>
+<tr>
+<th>Field</th>
+<th>Type</th>
+<th>Required</th>
+<th>Description</th>
+</tr>
+</thead>
+<tbody>
+<tr>
+<td><code>enabled</code></td>
+<td>boolean</td>
+<td>Yes</td>
+<td><code>true</code> to enable, <code>false</code> to disable</td>
+</tr>
+</tbody>
+</table>
+<h4>Example</h4>
+<div class="codehilite"><pre><span></span><code>curl<span class="w"> </span>-s<span class="w"> </span>-X<span class="w"> </span>POST<span class="w"> </span><span class="s2">&quot;</span><span class="nv">$API</span><span class="s2">/api/v1/config/cache&quot;</span><span class="w"> </span><span class="se">\</span>
+<span class="w">  </span>-H<span class="w"> </span><span class="s2">&quot;Content-Type: application/json&quot;</span><span class="w"> </span><span class="se">\</span>
+<span class="w">  </span>-H<span class="w"> </span><span class="s2">&quot;X-API-Key: </span><span class="nv">$KEY</span><span class="s2">&quot;</span><span class="w"> </span><span class="se">\</span>
+<span class="w">  </span>-d<span class="w"> </span><span class="s1">&#39;{&quot;enabled&quot;: false}&#39;</span>
+</code></pre></div>
+
+<h3>Unmounted Routes</h3>
+<p>The following routes are defined in source code but are <strong>NOT</strong> currently mounted in the router:</p>
+<table class="table">
+<thead>
+<tr>
+<th>Endpoint</th>
+<th>Source file</th>
+</tr>
+</thead>
+<tbody>
+<tr>
+<td><code>/api/v1/search/universal</code></td>
+<td><code>universal_search.rs</code></td>
+</tr>
+<tr>
+<td><code>/api/v1/search/frames</code></td>
+<td><code>universal_search.rs</code></td>
+</tr>
+<tr>
+<td><code>/api/v1/search/persons</code></td>
+<td><code>universal_search.rs</code></td>
+</tr>
+<tr>
+<td><code>/api/v1/who</code></td>
+<td><code>who.rs</code></td>
+</tr>
+<tr>
+<td><code>/api/v1/who/candidates</code></td>
+<td><code>who.rs</code></td>
+</tr>
+</tbody>
+</table>
+<hr />
+<h1>Agent Endpoints</h1>
+<p>Agent endpoints provide AI-powered capabilities including translation, identity analysis, and 5W1H extraction.</p>
+<h2>POST /api/v1/agents/translate</h2>
+<p>Translate text between languages using Gemma4 (llama.cpp, port 8082).</p>
+<h3>Request</h3>
+<div class="codehilite"><pre><span></span><code><span class="p">{</span>
+<span class="w">  </span><span class="nt">&quot;text&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;Hello, welcome to Momentry Core.&quot;</span><span class="p">,</span>
+<span class="w">  </span><span class="nt">&quot;target_language&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;Traditional Chinese&quot;</span><span class="p">,</span>
+<span class="w">  </span><span class="nt">&quot;source_language&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;English&quot;</span>
+<span class="p">}</span>
+</code></pre></div>
+
+<table class="table">
+<thead>
+<tr>
+<th>Field</th>
+<th>Type</th>
+<th>Required</th>
+<th>Description</th>
+</tr>
+</thead>
+<tbody>
+<tr>
+<td><code>text</code></td>
+<td>string</td>
+<td>✅</td>
+<td>Text to translate</td>
+</tr>
+<tr>
+<td><code>target_language</code></td>
+<td>string</td>
+<td>✅</td>
+<td>Target language name (e.g. "Traditional Chinese", "Japanese")</td>
+</tr>
+<tr>
+<td><code>source_language</code></td>
+<td>string</td>
+<td>❌</td>
+<td>Source language (default: "auto")</td>
+</tr>
+</tbody>
+</table>
+<h3>Response</h3>
+<div class="codehilite"><pre><span></span><code><span class="p">{</span>
+<span class="w">  </span><span class="nt">&quot;success&quot;</span><span class="p">:</span><span class="w"> </span><span class="kc">true</span><span class="p">,</span>
+<span class="w">  </span><span class="nt">&quot;translated_text&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;您好，歡迎使用 Momentry Core。&quot;</span><span class="p">,</span>
+<span class="w">  </span><span class="nt">&quot;source_language_detected&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;English&quot;</span><span class="p">,</span>
+<span class="w">  </span><span class="nt">&quot;model_used&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;google_gemma-4-26B-A4B-it-Q5_K_M.gguf&quot;</span>
+<span class="p">}</span>
+</code></pre></div>
+
+<h3>Supported Language Pairs (tested)</h3>
+<table class="table">
+<thead>
+<tr>
+<th>Source</th>
+<th>Target</th>
+<th>Quality</th>
+</tr>
+</thead>
+<tbody>
+<tr>
+<td>English</td>
+<td>Traditional Chinese</td>
+<td>✅</td>
+</tr>
+<tr>
+<td>English</td>
+<td>Japanese</td>
+<td>✅</td>
+</tr>
+<tr>
+<td>Chinese</td>
+<td>English</td>
+<td>✅</td>
+</tr>
+<tr>
+<td>English</td>
+<td>French</td>
+<td>✅</td>
+</tr>
+<tr>
+<td>Chinese</td>
+<td>Japanese</td>
+<td>✅</td>
+</tr>
+</tbody>
+</table>
+<h3>Model</h3>
+<ul>
+<li><strong>Model</strong>: Gemma4 26B (Q5_K_M)</li>
+<li><strong>Engine</strong>: llama.cpp at <code>localhost:8082</code></li>
+<li><strong>Endpoint</strong>: <code>/v1/chat/completions</code> (OpenAI-compatible)</li>
+<li><strong>Temperature</strong>: 0.1</li>
+<li><strong>Max tokens</strong>: 1024</li>
+</ul>
+<h3>Errors</h3>
+<table class="table">
+<thead>
+<tr>
+<th>Status</th>
+<th>Condition</th>
+</tr>
+</thead>
+<tbody>
+<tr>
+<td>500</td>
+<td>LLM unreachable or response parse failure</td>
+</tr>
+<tr>
+<td>401</td>
+<td>Missing/invalid auth</td>
+</tr>
+</tbody>
+</table>
+<h2>GET /api/v1/agents/identity/status</h2>
+<p>Get status of the identity agent pipeline.</p>
+<h3>Response</h3>
+<div class="codehilite"><pre><span></span><code><span class="p">{</span>
+<span class="w">  </span><span class="nt">&quot;status&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;idle&quot;</span><span class="p">,</span>
+<span class="w">  </span><span class="nt">&quot;last_analysis&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;2026-05-17T12:00:00Z&quot;</span><span class="p">,</span>
+<span class="w">  </span><span class="nt">&quot;identities_processed&quot;</span><span class="p">:</span><span class="w"> </span><span class="mi">27</span>
+<span class="p">}</span>
+</code></pre></div>
+
+<h2>POST /api/v1/agents/suggest/clustering</h2>
+<p>Run face clustering to suggest new identity groupings.</p>
+<h3>Request</h3>
+<div class="codehilite"><pre><span></span><code><span class="p">{</span>
+<span class="w">  </span><span class="nt">&quot;file_uuid&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;3abeee81d94597629ed8cb943f182e94&quot;</span>
+<span class="p">}</span>
+</code></pre></div>
+
+<h2>POST /api/v1/agents/suggest/merge</h2>
+<p>Merge two identities into one.</p>
+<h3>Request</h3>
+<div class="codehilite"><pre><span></span><code><span class="p">{</span>
+<span class="w">  </span><span class="nt">&quot;from_uuid&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;...&quot;</span><span class="p">,</span>
+<span class="w">  </span><span class="nt">&quot;into_uuid&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;...&quot;</span>
+<span class="p">}</span>
+</code></pre></div>
+
+<h2>POST /api/v1/agents/5w1h/analyze</h2>
+<p>Extract 5W1H (Who, What, When, Where, Why, How) from video chunk text.</p>
+<h3>Request</h3>
+<div class="codehilite"><pre><span></span><code><span class="p">{</span>
+<span class="w">  </span><span class="nt">&quot;chunk_id&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;chunk_42&quot;</span><span class="p">,</span>
+<span class="w">  </span><span class="nt">&quot;file_uuid&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;3abeee81d94597629ed8cb943f182e94&quot;</span>
+<span class="p">}</span>
+</code></pre></div>
+
+<h3>Response</h3>
+<div class="codehilite"><pre><span></span><code><span class="p">{</span>
+<span class="w">  </span><span class="nt">&quot;success&quot;</span><span class="p">:</span><span class="w"> </span><span class="kc">true</span><span class="p">,</span>
+<span class="w">  </span><span class="nt">&quot;5w1h&quot;</span><span class="p">:</span><span class="w"> </span><span class="p">{</span>
+<span class="w">    </span><span class="nt">&quot;who&quot;</span><span class="p">:</span><span class="w"> </span><span class="p">[</span><span class="s2">&quot;Cary Grant&quot;</span><span class="p">],</span>
+<span class="w">    </span><span class="nt">&quot;what&quot;</span><span class="p">:</span><span class="w"> </span><span class="p">[</span><span class="s2">&quot;discussing plans&quot;</span><span class="p">],</span>
+<span class="w">    </span><span class="nt">&quot;when&quot;</span><span class="p">:</span><span class="w"> </span><span class="p">[</span><span class="s2">&quot;1963&quot;</span><span class="p">],</span>
+<span class="w">    </span><span class="nt">&quot;where&quot;</span><span class="p">:</span><span class="w"> </span><span class="p">[</span><span class="s2">&quot;Paris&quot;</span><span class="p">],</span>
+<span class="w">    </span><span class="nt">&quot;why&quot;</span><span class="p">:</span><span class="w"> </span><span class="p">[</span><span class="s2">&quot;vacation&quot;</span><span class="p">],</span>
+<span class="w">    </span><span class="nt">&quot;how&quot;</span><span class="p">:</span><span class="w"> </span><span class="p">[</span><span class="s2">&quot;in person&quot;</span><span class="p">]</span>
+<span class="w">  </span><span class="p">}</span>
+<span class="p">}</span>
+</code></pre></div>
+
+<h2>POST /api/v1/agents/5w1h/batch</h2>
+<p>Batch analyze multiple chunks for 5W1H extraction.</p>
+<h3>Request</h3>
+<div class="codehilite"><pre><span></span><code><span class="p">{</span>
+<span class="w">  </span><span class="nt">&quot;file_uuid&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;3abeee81d94597629ed8cb943f182e94&quot;</span><span class="p">,</span>
+<span class="w">  </span><span class="nt">&quot;chunk_ids&quot;</span><span class="p">:</span><span class="w"> </span><span class="p">[</span><span class="s2">&quot;chunk_1&quot;</span><span class="p">,</span><span class="w"> </span><span class="s2">&quot;chunk_2&quot;</span><span class="p">,</span><span class="w"> </span><span class="s2">&quot;chunk_3&quot;</span><span class="p">]</span>
+<span class="p">}</span>
+</code></pre></div>
+
+<h2>GET /api/v1/agents/5w1h/status</h2>
+<p>Get status of the 5W1H agent pipeline.</p>
+<hr />
+</div>
+</body>
+</html>
\ No newline at end of file
diff --git a/docs_v1.0/doc_user/API_ERROR_CODES.html b/docs_v1.0/doc_user/API_ERROR_CODES.html
new file mode 100644
index 0000000..04ccbb3
--- /dev/null
+++ b/docs_v1.0/doc_user/API_ERROR_CODES.html
@@ -0,0 +1,207 @@
+<!DOCTYPE html>
+<html lang="en">
+<head>
+<meta charset="UTF-8">
+<title>API Error Codes - Momentry API Docs</title>
+<style>
+* { margin: 0; padding: 0; box-sizing: border-box; }
+body { font-family: -apple-system, BlinkMacSystemFont, 'Segoe UI', Roboto, sans-serif; background: #f5f5f5; color: #333; padding: 40px; }
+.container { max-width: 960px; margin: 0 auto; background: white; border-radius: 12px; box-shadow: 0 2px 12px rgba(0,0,0,0.08); padding: 40px; }
+h1 { font-size: 24px; margin: 24px 0 12px; }
+h2 { font-size: 20px; margin: 20px 0 10px; color: #222; }
+h3 { font-size: 16px; margin: 16px 0 8px; color: #444; }
+p { line-height: 1.6; margin: 8px 0; }
+table { border-collapse: collapse; width: 100%; margin: 12px 0; font-size: 14px; }
+th, td { border: 1px solid #ddd; padding: 8px 12px; text-align: left; }
+th { background: #f0f0f0; font-weight: 600; }
+code { background: #f0f0f0; padding: 2px 6px; border-radius: 3px; font-size: 13px; }
+pre { background: #f8f8f8; border: 1px solid #ddd; border-radius: 6px; padding: 12px; overflow-x: auto; margin: 12px 0; }
+pre code { background: none; padding: 0; }
+a { color: #0066cc; }
+.back { display: inline-block; margin-bottom: 20px; color: #666; }
+.back:hover { color: #333; }
+</style>
+</head>
+<body>
+<div class="container">
+<a class="back" href="index.html">&larr; Back to index</a>
+<hr />
+<p>document_type: "api_reference"<br />
+service: "MOMENTRY_CORE"<br />
+title: "API Error Codes (API 標準錯誤碼)"<br />
+date: "2026-05-17"<br />
+version: "V1.1"<br />
+status: "active"<br />
+owner: "M5"<br />
+created_by: "OpenCode"</p>
+<hr />
+<h1>API Error Codes (API 標準錯誤碼)</h1>
+<table class="table">
+<thead>
+<tr>
+<th>項目</th>
+<th>內容</th>
+</tr>
+</thead>
+<tbody>
+<tr>
+<td>目標讀者</td>
+<td>developer</td>
+</tr>
+<tr>
+<td>預備知識</td>
+<td>需有 API Key</td>
+</tr>
+</tbody>
+</table>
+<hr />
+<h2>Error Response Format</h2>
+<p>All API errors follow this JSON structure:</p>
+<div class="codehilite"><pre><span></span><code><span class="p">{</span>
+<span class="w">  </span><span class="nt">&quot;success&quot;</span><span class="p">:</span><span class="w"> </span><span class="kc">false</span><span class="p">,</span>
+<span class="w">  </span><span class="nt">&quot;error&quot;</span><span class="p">:</span><span class="w"> </span><span class="p">{</span>
+<span class="w">    </span><span class="nt">&quot;code&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;E001_NOT_FOUND&quot;</span><span class="p">,</span>
+<span class="w">    </span><span class="nt">&quot;message&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;Resource not found&quot;</span><span class="p">,</span>
+<span class="w">    </span><span class="nt">&quot;details&quot;</span><span class="p">:</span><span class="w"> </span><span class="p">{</span><span class="nt">&quot;resource&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;file_uuid&quot;</span><span class="p">,</span><span class="w"> </span><span class="nt">&quot;value&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;abc&quot;</span><span class="p">}</span>
+<span class="w">  </span><span class="p">}</span>
+<span class="p">}</span>
+</code></pre></div>
+
+<h2>Error Code List</h2>
+<h3>Generic Errors (E0xx)</h3>
+<table class="table">
+<thead>
+<tr>
+<th>Code</th>
+<th>HTTP</th>
+<th>Description</th>
+</tr>
+</thead>
+<tbody>
+<tr>
+<td><code>E001_NOT_FOUND</code></td>
+<td>404</td>
+<td>Resource not found (file, identity, chunk)</td>
+</tr>
+<tr>
+<td><code>E002_DUPLICATE</code></td>
+<td>409</td>
+<td>Resource already exists</td>
+</tr>
+<tr>
+<td><code>E003_VALIDATION</code></td>
+<td>400</td>
+<td>Request parameter validation failed</td>
+</tr>
+<tr>
+<td><code>E004_UNAUTHORIZED</code></td>
+<td>401</td>
+<td>Invalid API key or token</td>
+</tr>
+<tr>
+<td><code>E005_INTERNAL</code></td>
+<td>500</td>
+<td>Internal server error</td>
+</tr>
+</tbody>
+</table>
+<h3>Processor Errors (E1xx)</h3>
+<table class="table">
+<thead>
+<tr>
+<th>Code</th>
+<th>HTTP</th>
+<th>Description</th>
+</tr>
+</thead>
+<tbody>
+<tr>
+<td><code>E101_PROCESSOR_FAIL</code></td>
+<td>500</td>
+<td>Python script execution failed</td>
+</tr>
+<tr>
+<td><code>E102_TIMEOUT</code></td>
+<td>504</td>
+<td>Processing timeout</td>
+</tr>
+<tr>
+<td><code>E103_RESUME_FAIL</code></td>
+<td>500</td>
+<td>Resume failed (checkpoint not found)</td>
+</tr>
+<tr>
+<td><code>E104_NO_VIDEO</code></td>
+<td>400</td>
+<td>Video file path not found</td>
+</tr>
+</tbody>
+</table>
+<h3>Identity Errors (E2xx)</h3>
+<table class="table">
+<thead>
+<tr>
+<th>Code</th>
+<th>HTTP</th>
+<th>Description</th>
+</tr>
+</thead>
+<tbody>
+<tr>
+<td><code>E201_FACE_NOT_FOUND</code></td>
+<td>404</td>
+<td>Face detection not found</td>
+</tr>
+<tr>
+<td><code>E202_MERGE_CONFLICT</code></td>
+<td>409</td>
+<td>Identity merge conflict</td>
+</tr>
+<tr>
+<td><code>E203_CANDIDATE_EMPTY</code></td>
+<td>404</td>
+<td>No candidates available for confirmation</td>
+</tr>
+</tbody>
+</table>
+<h3>TMDb Errors (E3xx)</h3>
+<table class="table">
+<thead>
+<tr>
+<th>Code</th>
+<th>HTTP</th>
+<th>Description</th>
+</tr>
+</thead>
+<tbody>
+<tr>
+<td><code>E301_TMDB_NO_KEY</code></td>
+<td>400</td>
+<td><code>TMDB_API_KEY</code> environment variable not set</td>
+</tr>
+<tr>
+<td><code>E302_TMDB_UNREACHABLE</code></td>
+<td>502</td>
+<td>TMDb API unreachable or timed out</td>
+</tr>
+<tr>
+<td><code>E303_TMDB_CACHE_NOT_FOUND</code></td>
+<td>200</td>
+<td>No local TMDb cache; run prefetch first</td>
+</tr>
+<tr>
+<td><code>E304_TMDB_PROBE_FAILED</code></td>
+<td>500</td>
+<td>TMDb probe execution failed</td>
+</tr>
+<tr>
+<td><code>E305_TMDB_MOVIE_NOT_FOUND</code></td>
+<td>404</td>
+<td>No matching TMDb movie found from filename</td>
+</tr>
+</tbody>
+</table>
+<hr />
+</div>
+</body>
+</html>
\ No newline at end of file
diff --git a/docs_v1.0/doc_user/API_INDEX.html b/docs_v1.0/doc_user/API_INDEX.html
new file mode 100644
index 0000000..a345701
--- /dev/null
+++ b/docs_v1.0/doc_user/API_INDEX.html
@@ -0,0 +1,125 @@
+<!DOCTYPE html>
+<html lang="en">
+<head>
+<meta charset="UTF-8">
+<title>API Index - Momentry API Docs</title>
+<style>
+* { margin: 0; padding: 0; box-sizing: border-box; }
+body { font-family: -apple-system, BlinkMacSystemFont, 'Segoe UI', Roboto, sans-serif; background: #f5f5f5; color: #333; padding: 40px; }
+.container { max-width: 960px; margin: 0 auto; background: white; border-radius: 12px; box-shadow: 0 2px 12px rgba(0,0,0,0.08); padding: 40px; }
+h1 { font-size: 24px; margin: 24px 0 12px; }
+h2 { font-size: 20px; margin: 20px 0 10px; color: #222; }
+h3 { font-size: 16px; margin: 16px 0 8px; color: #444; }
+p { line-height: 1.6; margin: 8px 0; }
+table { border-collapse: collapse; width: 100%; margin: 12px 0; font-size: 14px; }
+th, td { border: 1px solid #ddd; padding: 8px 12px; text-align: left; }
+th { background: #f0f0f0; font-weight: 600; }
+code { background: #f0f0f0; padding: 2px 6px; border-radius: 3px; font-size: 13px; }
+pre { background: #f8f8f8; border: 1px solid #ddd; border-radius: 6px; padding: 12px; overflow-x: auto; margin: 12px 0; }
+pre code { background: none; padding: 0; }
+a { color: #0066cc; }
+.back { display: inline-block; margin-bottom: 20px; color: #666; }
+.back:hover { color: #333; }
+</style>
+</head>
+<body>
+<div class="container">
+<a class="back" href="index.html">&larr; Back to index</a>
+<hr />
+<p>document_type: "api_reference"<br />
+service: "MOMENTRY_CORE"<br />
+title: "Momentry Core API 文件總覽"<br />
+date: "2026-05-17"<br />
+version: "V1.0"<br />
+status: "active"<br />
+owner: "M5"<br />
+created_by: "OpenCode"</p>
+<hr />
+<h1>Momentry Core API 文件總覽</h1>
+<table class="table">
+<thead>
+<tr>
+<th>項目</th>
+<th>內容</th>
+</tr>
+</thead>
+<tbody>
+<tr>
+<td>目標讀者</td>
+<td>developer</td>
+</tr>
+<tr>
+<td>預備知識</td>
+<td>需有 API Key</td>
+</tr>
+</tbody>
+</table>
+<hr />
+<h2>📁 文件結構</h2>
+<div class="codehilite"><pre><span></span><code><span class="n">API_WORKSPACE</span><span class="o">/</span>
+<span class="err">└──</span><span class="w"> </span><span class="n">modules</span><span class="o">/</span>
+<span class="err">│</span><span class="w">   </span><span class="err">├──</span><span class="w"> </span><span class="n">_template</span><span class="p">.</span><span class="n">md</span><span class="w">  </span><span class="err">←</span><span class="w"> </span><span class="n">One</span><span class="o">-</span><span class="n">line</span><span class="w"> </span><span class="n">description</span><span class="w"> </span><span class="n">of</span><span class="w"> </span><span class="n">what</span><span class="w"> </span><span class="n">this</span><span class="w"> </span><span class="k">module</span><span class="w"> </span><span class="n">covers</span>
+<span class="err">│</span><span class="w">   </span><span class="err">├──</span><span class="w"> </span><span class="mh">01</span><span class="n">_auth</span><span class="p">.</span><span class="n">md</span><span class="w">  </span><span class="err">←</span><span class="w"> </span><span class="n">Authentication</span><span class="w"> </span><span class="err">—</span><span class="w"> </span><span class="n">login</span><span class="p">,</span><span class="w"> </span><span class="n">logout</span><span class="p">,</span><span class="w"> </span><span class="n">JWT</span><span class="p">,</span><span class="w"> </span><span class="n">session</span><span class="w"> </span><span class="n">cookie</span><span class="p">,</span><span class="w"> </span><span class="n">API</span><span class="w"> </span><span class="n">key</span>
+<span class="err">│</span><span class="w">   </span><span class="err">├──</span><span class="w"> </span><span class="mh">02</span><span class="n">_health</span><span class="p">.</span><span class="n">md</span><span class="w">  </span><span class="err">←</span><span class="w"> </span><span class="n">Health</span><span class="w"> </span><span class="n">check</span><span class="w"> </span><span class="n">endpoints</span>
+<span class="err">│</span><span class="w">   </span><span class="err">├──</span><span class="w"> </span><span class="mh">03</span><span class="n">_register</span><span class="p">.</span><span class="n">md</span><span class="w">  </span><span class="err">←</span><span class="w"> </span><span class="n">File</span><span class="w"> </span><span class="n">registration</span><span class="w"> </span><span class="err">—</span><span class="w"> </span><span class="n">register</span><span class="p">,</span><span class="w"> </span><span class="n">scan</span>
+<span class="err">│</span><span class="w">   </span><span class="err">├──</span><span class="w"> </span><span class="mh">04</span><span class="n">_lookup</span><span class="p">.</span><span class="n">md</span><span class="w">  </span><span class="err">←</span><span class="w"> </span><span class="n">File</span><span class="w"> </span><span class="n">lookup</span><span class="w"> </span><span class="n">by</span><span class="w"> </span><span class="n">name</span><span class="w"> </span><span class="k">and</span><span class="w"> </span><span class="n">unregistration</span>
+<span class="err">│</span><span class="w">   </span><span class="err">├──</span><span class="w"> </span><span class="mh">05</span><span class="n">_process</span><span class="p">.</span><span class="n">md</span><span class="w">  </span><span class="err">←</span><span class="w"> </span><span class="n">Processing</span><span class="w"> </span><span class="n">pipeline</span><span class="w"> </span><span class="err">—</span><span class="w"> </span><span class="n">trigger</span><span class="p">,</span><span class="w"> </span><span class="n">probe</span><span class="p">,</span><span class="w"> </span><span class="n">progress</span><span class="p">,</span><span class="w"> </span><span class="n">jobs</span>
+<span class="err">│</span><span class="w">   </span><span class="err">├──</span><span class="w"> </span><span class="mh">06</span><span class="n">_search</span><span class="p">.</span><span class="n">md</span><span class="w">  </span><span class="err">←</span><span class="w"> </span><span class="n">Vector</span><span class="w"> </span><span class="n">search</span><span class="p">,</span><span class="w"> </span><span class="n">hybrid</span><span class="w"> </span><span class="n">search</span><span class="p">,</span><span class="w"> </span><span class="n">BM25</span><span class="p">,</span><span class="w"> </span><span class="n">n8n</span><span class="p">,</span><span class="w"> </span><span class="n">visual</span><span class="p">,</span><span class="w"> </span><span class="n">identity</span><span class="w"> </span><span class="n">text</span><span class="w"> </span><span class="n">search</span>
+<span class="err">│</span><span class="w">   </span><span class="err">├──</span><span class="w"> </span><span class="mh">07</span><span class="n">_identity</span><span class="p">.</span><span class="n">md</span><span class="w">  </span><span class="err">←</span><span class="w"> </span><span class="n">Global</span><span class="w"> </span><span class="n">identities</span><span class="w"> </span><span class="err">—</span><span class="w"> </span><span class="n">CRUD</span><span class="p">,</span><span class="w"> </span><span class="n">detail</span><span class="p">,</span><span class="w"> </span><span class="n">files</span><span class="p">,</span><span class="w"> </span><span class="n">faces</span><span class="p">,</span><span class="w"> </span><span class="n">bind</span><span class="p">,</span><span class="w"> </span><span class="n">unbind</span><span class="p">,</span><span class="w"> </span><span class="n">search</span>
+<span class="err">│</span><span class="w">   </span><span class="err">├──</span><span class="w"> </span><span class="mh">08</span><span class="n">_identity_agent</span><span class="p">.</span><span class="n">md</span><span class="w">  </span><span class="err">←</span><span class="w"> </span><span class="n">Identity</span><span class="w"> </span><span class="n">agent</span><span class="w"> </span><span class="err">—</span><span class="w"> </span><span class="n">analyze</span><span class="p">,</span><span class="w"> </span><span class="n">suggest</span><span class="p">,</span><span class="w"> </span><span class="n">merge</span><span class="p">,</span><span class="w"> </span><span class="n">clustering</span>
+<span class="err">│</span><span class="w">   </span><span class="err">├──</span><span class="w"> </span><span class="mh">08</span><span class="n">_media</span><span class="p">.</span><span class="n">md</span><span class="w">  </span><span class="err">←</span><span class="w"> </span><span class="n">Video</span><span class="w"> </span><span class="n">streaming</span><span class="w"> </span><span class="o">&amp;</span><span class="w"> </span><span class="n">frame</span><span class="w"> </span><span class="n">extraction</span>
+<span class="err">│</span><span class="w">   </span><span class="err">├──</span><span class="w"> </span><span class="mh">09</span><span class="n">_tmdb</span><span class="p">.</span><span class="n">md</span><span class="w">  </span><span class="err">←</span><span class="w"> </span><span class="n">TMDb</span><span class="w"> </span><span class="n">enrichment</span><span class="w"> </span><span class="n">endpoints</span><span class="w"> </span><span class="err">—</span><span class="w"> </span><span class="n">prefetch</span><span class="p">,</span><span class="w"> </span><span class="n">probe</span><span class="p">,</span><span class="w"> </span><span class="n">resource</span><span class="p">,</span><span class="w"> </span><span class="n">check</span>
+<span class="err">│</span><span class="w">   </span><span class="err">├──</span><span class="w"> </span><span class="mh">10</span><span class="n">_pipeline</span><span class="p">.</span><span class="n">md</span><span class="w">  </span><span class="err">←</span><span class="w"> </span><span class="n">Stats</span><span class="w"> </span><span class="n">endpoints</span><span class="p">,</span><span class="w"> </span><span class="n">inference</span><span class="w"> </span><span class="n">health</span><span class="p">,</span><span class="w"> </span><span class="n">SFTPGo</span><span class="w"> </span><span class="n">status</span>
+<span class="err">│</span><span class="w">   </span><span class="err">├──</span><span class="w"> </span><span class="mh">11</span><span class="n">_error_codes</span><span class="p">.</span><span class="n">md</span><span class="w">  </span><span class="err">←</span><span class="w"> </span><span class="n">Standard</span><span class="w"> </span><span class="n">API</span><span class="w"> </span><span class="n">error</span><span class="w"> </span><span class="n">codes</span>
+<span class="err">│</span><span class="w">   </span><span class="err">├──</span><span class="w"> </span><span class="mh">12</span><span class="n">_agent</span><span class="p">.</span><span class="n">md</span><span class="w">  </span><span class="err">←</span><span class="w"> </span>
+<span class="err">└──</span><span class="w"> </span><span class="p">(</span><span class="n">generated</span><span class="w"> </span><span class="n">files</span><span class="w"> </span><span class="err">→</span><span class="w"> </span><span class="n">GUIDES</span><span class="o">/</span><span class="p">)</span>
+</code></pre></div>
+
+<h2>快速選擇指南</h2>
+<table class="table">
+<thead>
+<tr>
+<th>需求</th>
+<th>閱讀文件</th>
+</tr>
+</thead>
+<tbody>
+<tr>
+<td>查看所有 API 端點（curl 範例版）</td>
+<td><code>GUIDES/API_ENDPOINTS.md</code></td>
+</tr>
+<tr>
+<td>查看快速端點摘要</td>
+<td><code>GUIDES/API_QUICK_REFERENCE.md</code></td>
+</tr>
+<tr>
+<td>執行 TMDb Enrichment</td>
+<td><code>GUIDES/TMDb_User_Guide.md</code></td>
+</tr>
+<tr>
+<td>查看錯誤碼</td>
+<td><code>GUIDES/API_ERROR_CODES.md</code></td>
+</tr>
+</tbody>
+</table>
+<h2>文件模組清單</h2>
+<ul>
+<li><code>_template</code> — One-line description of what this module covers</li>
+<li><code>01_auth</code> — Authentication — login, logout, JWT, session cookie, API key</li>
+<li><code>02_health</code> — Health check endpoints</li>
+<li><code>03_register</code> — File registration — register, scan</li>
+<li><code>04_lookup</code> — File lookup by name and unregistration</li>
+<li><code>05_process</code> — Processing pipeline — trigger, probe, progress, jobs</li>
+<li><code>06_search</code> — Vector search, hybrid search, BM25, n8n, visual, identity text search</li>
+<li><code>07_identity</code> — Global identities — CRUD, detail, files, faces, bind, unbind, search</li>
+<li><code>08_identity_agent</code> — Identity agent — analyze, suggest, merge, clustering</li>
+<li><code>08_media</code> — Video streaming &amp; frame extraction</li>
+<li><code>09_tmdb</code> — TMDb enrichment endpoints — prefetch, probe, resource, check</li>
+<li><code>10_pipeline</code> — Stats endpoints, inference health, SFTPGo status</li>
+<li><code>11_error_codes</code> — Standard API error codes</li>
+<li><code>12_agent</code> — </li>
+</ul>
+<hr />
+</div>
+</body>
+</html>
\ No newline at end of file
diff --git a/docs_v1.0/doc_user/API_QUICK_REFERENCE.html b/docs_v1.0/doc_user/API_QUICK_REFERENCE.html
new file mode 100644
index 0000000..70bd218
--- /dev/null
+++ b/docs_v1.0/doc_user/API_QUICK_REFERENCE.html
@@ -0,0 +1,2105 @@
+<!DOCTYPE html>
+<html lang="en">
+<head>
+<meta charset="UTF-8">
+<title>API Quick Reference - Momentry API Docs</title>
+<style>
+* { margin: 0; padding: 0; box-sizing: border-box; }
+body { font-family: -apple-system, BlinkMacSystemFont, 'Segoe UI', Roboto, sans-serif; background: #f5f5f5; color: #333; padding: 40px; }
+.container { max-width: 960px; margin: 0 auto; background: white; border-radius: 12px; box-shadow: 0 2px 12px rgba(0,0,0,0.08); padding: 40px; }
+h1 { font-size: 24px; margin: 24px 0 12px; }
+h2 { font-size: 20px; margin: 20px 0 10px; color: #222; }
+h3 { font-size: 16px; margin: 16px 0 8px; color: #444; }
+p { line-height: 1.6; margin: 8px 0; }
+table { border-collapse: collapse; width: 100%; margin: 12px 0; font-size: 14px; }
+th, td { border: 1px solid #ddd; padding: 8px 12px; text-align: left; }
+th { background: #f0f0f0; font-weight: 600; }
+code { background: #f0f0f0; padding: 2px 6px; border-radius: 3px; font-size: 13px; }
+pre { background: #f8f8f8; border: 1px solid #ddd; border-radius: 6px; padding: 12px; overflow-x: auto; margin: 12px 0; }
+pre code { background: none; padding: 0; }
+a { color: #0066cc; }
+.back { display: inline-block; margin-bottom: 20px; color: #666; }
+.back:hover { color: #333; }
+</style>
+</head>
+<body>
+<div class="container">
+<a class="back" href="index.html">&larr; Back to index</a>
+<hr />
+<pre><code>document_type: "api_reference"
+service: "MOMENTRY_CORE"
+title: "Momentry Core API 快速查詢表"
+date: "2026-05-17"
+version: "V1.1"
+status: "active"
+owner: "M5"
+created_by: "OpenCode"</code></pre>
+<hr />
+<h1>Momentry Core API 快速查詢表</h1>
+<h2>Base URL</h2>
+<table class="table">
+<thead>
+<tr>
+<th>Environment</th>
+<th>URL</th>
+<th>Purpose</th>
+</tr>
+</thead>
+<tbody>
+<tr>
+<td>Playground (Dev)</td>
+<td><code>http://localhost:3003</code></td>
+<td>Development and testing</td>
+</tr>
+<tr>
+<td>Production</td>
+<td><code>http://localhost:3002</code></td>
+<td>Production deployment</td>
+</tr>
+<tr>
+<td>External (M5)</td>
+<td><code>https://m5api.momentry.ddns.net</code></td>
+<td>Remote access</td>
+</tr>
+</tbody>
+</table>
+<h2>Variables</h2>
+<div class="codehilite"><pre><span></span><code><span class="nv">API</span><span class="o">=</span><span class="s2">&quot;http://localhost:3003&quot;</span>
+<span class="nv">KEY</span><span class="o">=</span><span class="s2">&quot;your-api-key-here&quot;</span>
+</code></pre></div>
+
+<h2>Authentication</h2>
+<table class="table">
+<thead>
+<tr>
+<th>Mode</th>
+<th>Transport</th>
+<th>Expiry</th>
+<th>Scope</th>
+<th>Best for</th>
+</tr>
+</thead>
+<tbody>
+<tr>
+<td><strong>Session Cookie</strong></td>
+<td><code>Cookie: session_id=&lt;uuid&gt;</code></td>
+<td>24h</td>
+<td>per-browser session</td>
+<td>Portal (browser)</td>
+</tr>
+<tr>
+<td><strong>JWT</strong></td>
+<td><code>Authorization: Bearer &lt;token&gt;</code></td>
+<td>1h</td>
+<td>per-login token</td>
+<td>API clients (n8n, CLI, scripts)</td>
+</tr>
+<tr>
+<td><strong>API Key</strong></td>
+<td><code>X-API-Key: &lt;key&gt;</code></td>
+<td>90d</td>
+<td>fixed key for automation</td>
+<td>Legacy scripts, WordPress</td>
+</tr>
+</tbody>
+</table>
+<table class="table">
+<thead>
+<tr>
+<th>Username</th>
+<th>Password</th>
+<th>API Key</th>
+<th>Role</th>
+</tr>
+</thead>
+<tbody>
+<tr>
+<td><code>admin</code></td>
+<td><code>admin</code></td>
+<td>—</td>
+<td>admin</td>
+</tr>
+<tr>
+<td><code>demo</code></td>
+<td><code>demo</code></td>
+<td><code>muser_demo_key_32chars_abcdef1234567890</code></td>
+<td>user</td>
+</tr>
+</tbody>
+</table>
+<div class="codehilite"><pre><span></span><code><span class="c1"># Using API key instead of JWT</span>
+curl<span class="w"> </span>-s<span class="w"> </span><span class="s2">&quot;</span><span class="nv">$API</span><span class="s2">/api/v1/files/scan&quot;</span><span class="w"> </span>-H<span class="w"> </span><span class="s2">&quot;X-API-Key: muser_demo_key_32chars_abcdef1234567890&quot;</span>
+</code></pre></div>
+
+<div class="codehilite"><pre><span></span><code><span class="c1"># Login as admin</span>
+curl<span class="w"> </span>-s<span class="w"> </span>-X<span class="w"> </span>POST<span class="w"> </span><span class="s2">&quot;</span><span class="nv">$API</span><span class="s2">/api/v1/auth/login&quot;</span><span class="w"> </span><span class="se">\</span>
+<span class="w">  </span>-H<span class="w"> </span><span class="s2">&quot;Content-Type: application/json&quot;</span><span class="w"> </span><span class="se">\</span>
+<span class="w">  </span>-d<span class="w"> </span><span class="s1">&#39;{&quot;username&quot;: &quot;admin&quot;, &quot;password&quot;: &quot;admin&quot;}&#39;</span>
+
+<span class="c1"># Login as demo user</span>
+curl<span class="w"> </span>-s<span class="w"> </span>-X<span class="w"> </span>POST<span class="w"> </span><span class="s2">&quot;</span><span class="nv">$API</span><span class="s2">/api/v1/auth/login&quot;</span><span class="w"> </span><span class="se">\</span>
+<span class="w">  </span>-H<span class="w"> </span><span class="s2">&quot;Content-Type: application/json&quot;</span><span class="w"> </span><span class="se">\</span>
+<span class="w">  </span>-d<span class="w"> </span><span class="s1">&#39;{&quot;username&quot;: &quot;demo&quot;, &quot;password&quot;: &quot;demo&quot;}&#39;</span>
+</code></pre></div>
+
+<table class="table">
+<thead>
+<tr>
+<th>Field</th>
+<th>Type</th>
+<th>Description</th>
+</tr>
+</thead>
+<tbody>
+<tr>
+<td><code>jwt</code></td>
+<td>string</td>
+<td>JWT access token. Use as <code>Authorization: Bearer &lt;jwt&gt;</code>. Expires in 1 hour.</td>
+</tr>
+<tr>
+<td><code>api_key</code></td>
+<td>string</td>
+<td>Legacy API key. Use as <code>X-API-Key: &lt;key&gt;</code>. Good for 90 days.</td>
+</tr>
+<tr>
+<td><code>user.username</code></td>
+<td>string</td>
+<td>Username</td>
+</tr>
+<tr>
+<td><code>user.role</code></td>
+<td>string</td>
+<td>Role: <code>admin</code>, <code>user</code>, or <code>readonly</code></td>
+</tr>
+<tr>
+<td><code>expires_at</code></td>
+<td>string</td>
+<td>ISO8601 timestamp of JWT expiration</td>
+</tr>
+</tbody>
+</table>
+<div class="codehilite"><pre><span></span><code><span class="c1"># Login and capture JWT</span>
+<span class="nv">JWT</span><span class="o">=</span><span class="k">$(</span>curl<span class="w"> </span>-s<span class="w"> </span>-X<span class="w"> </span>POST<span class="w"> </span><span class="s2">&quot;</span><span class="nv">$API</span><span class="s2">/api/v1/auth/login&quot;</span><span class="w"> </span><span class="se">\</span>
+<span class="w">  </span>-H<span class="w"> </span><span class="s2">&quot;Content-Type: application/json&quot;</span><span class="w"> </span><span class="se">\</span>
+<span class="w">  </span>-d<span class="w"> </span><span class="s1">&#39;{&quot;username&quot;:&quot;admin&quot;,&quot;password&quot;:&quot;admin&quot;}&#39;</span><span class="w"> </span><span class="p">|</span><span class="w"> </span>python3<span class="w"> </span>-c<span class="w"> </span><span class="s2">&quot;import json,sys;print(json.load(sys.stdin)[&#39;jwt&#39;])&quot;</span><span class="k">)</span>
+
+<span class="c1"># Use JWT for all subsequent requests</span>
+curl<span class="w"> </span>-H<span class="w"> </span><span class="s2">&quot;Authorization: Bearer </span><span class="nv">$JWT</span><span class="s2">&quot;</span><span class="w"> </span><span class="s2">&quot;</span><span class="nv">$API</span><span class="s2">/api/v1/files/scan&quot;</span>
+curl<span class="w"> </span>-H<span class="w"> </span><span class="s2">&quot;Authorization: Bearer </span><span class="nv">$JWT</span><span class="s2">&quot;</span><span class="w"> </span><span class="s2">&quot;</span><span class="nv">$API</span><span class="s2">/api/v1/resource/tmdb&quot;</span>
+</code></pre></div>
+
+<div class="codehilite"><pre><span></span><code><span class="c1"># Log in and capture the session cookie from the Set-Cookie header</span>
+curl<span class="w"> </span>-v<span class="w"> </span>-X<span class="w"> </span>POST<span class="w"> </span><span class="s2">&quot;</span><span class="nv">$API</span><span class="s2">/api/v1/auth/login&quot;</span><span class="w"> </span><span class="se">\</span>
+<span class="w">  </span>-H<span class="w"> </span><span class="s2">&quot;Content-Type: application/json&quot;</span><span class="w"> </span><span class="se">\</span>
+<span class="w">  </span>-d<span class="w"> </span><span class="s1">&#39;{&quot;username&quot;:&quot;admin&quot;,&quot;password&quot;:&quot;admin&quot;}&#39;</span><span class="w"> </span><span class="m">2</span>&gt;<span class="p">&amp;</span><span class="m">1</span><span class="w"> </span><span class="p">|</span><span class="w"> </span>grep<span class="w"> </span><span class="s2">&quot;Set-Cookie&quot;</span>
+
+<span class="c1"># Browser automatically sends: Cookie: session_id=&lt;uuid&gt;</span>
+<span class="c1"># No manual header needed for subsequent requests</span>
+</code></pre></div>
+
+<div class="codehilite"><pre><span></span><code>curl<span class="w"> </span>-H<span class="w"> </span><span class="s2">&quot;X-API-Key: </span><span class="nv">$KEY</span><span class="s2">&quot;</span><span class="w"> </span><span class="s2">&quot;</span><span class="nv">$API</span><span class="s2">/api/v1/files/scan&quot;</span>
+
+<span class="c1"># Also accepted via Bearer header (non-JWT format) or query parameter:</span>
+curl<span class="w"> </span>-H<span class="w"> </span><span class="s2">&quot;Authorization: Bearer </span><span class="nv">$KEY</span><span class="s2">&quot;</span><span class="w"> </span><span class="s2">&quot;</span><span class="nv">$API</span><span class="s2">/api/v1/files/scan&quot;</span>
+curl<span class="w"> </span><span class="s2">&quot;</span><span class="nv">$API</span><span class="s2">/api/v1/files/scan?api_key=</span><span class="nv">$KEY</span><span class="s2">&quot;</span>
+</code></pre></div>
+
+<div class="codehilite"><pre><span></span><code>momentry<span class="w"> </span>api-key<span class="w"> </span>create<span class="w"> </span><span class="s2">&quot;My API Key&quot;</span><span class="w"> </span>--key-type<span class="w"> </span>user
+</code></pre></div>
+
+<div class="codehilite"><pre><span></span><code><span class="c1"># Logout using the session cookie (browser)</span>
+curl<span class="w"> </span>-X<span class="w"> </span>POST<span class="w"> </span><span class="s2">&quot;</span><span class="nv">$API</span><span class="s2">/api/v1/auth/logout&quot;</span><span class="w"> </span><span class="se">\</span>
+<span class="w">  </span>-H<span class="w"> </span><span class="s2">&quot;Cookie: session_id=&lt;uuid&gt;&quot;</span>
+</code></pre></div>
+
+<table class="table">
+<thead>
+<tr>
+<th>Auth mode</th>
+<th>Effect</th>
+</tr>
+</thead>
+<tbody>
+<tr>
+<td><strong>Session Cookie</strong></td>
+<td>Session deleted from database. Same cookie returns 401 on subsequent requests.</td>
+</tr>
+<tr>
+<td><strong>JWT</strong></td>
+<td>JWT remains valid until expiry. (JWT is stateless — logout adds JWT to a blacklist only if API key mode is used.)</td>
+</tr>
+<tr>
+<td><strong>API Key</strong></td>
+<td>API key remains valid. (Legacy keys are shared across sessions — revoking would break other clients.)</td>
+</tr>
+</tbody>
+</table>
+<div class="codehilite"><pre><span></span><code><span class="c1"># 1. Login</span>
+<span class="nv">SESSION_ID</span><span class="o">=</span><span class="k">$(</span>curl<span class="w"> </span>-s<span class="w"> </span>-D<span class="w"> </span>-<span class="w"> </span>-X<span class="w"> </span>POST<span class="w"> </span><span class="s2">&quot;</span><span class="nv">$API</span><span class="s2">/api/v1/auth/login&quot;</span><span class="w"> </span><span class="se">\</span>
+<span class="w">  </span>-H<span class="w"> </span><span class="s2">&quot;Content-Type: application/json&quot;</span><span class="w"> </span><span class="se">\</span>
+<span class="w">  </span>-d<span class="w"> </span><span class="s1">&#39;{&quot;username&quot;:&quot;admin&quot;,&quot;password&quot;:&quot;admin&quot;}&#39;</span><span class="w"> </span><span class="p">|</span><span class="w"> </span>grep<span class="w"> </span><span class="s2">&quot;Set-Cookie&quot;</span><span class="w"> </span><span class="p">|</span><span class="w"> </span>sed<span class="w"> </span><span class="s1">&#39;s/.*session_id=\([^;]*\).*/\1/&#39;</span><span class="k">)</span>
+
+<span class="c1"># 2. Use session (works)</span>
+curl<span class="w"> </span>-s<span class="w"> </span>-o<span class="w"> </span>/dev/null<span class="w"> </span>-w<span class="w"> </span><span class="s2">&quot;HTTP %{http_code}\n&quot;</span><span class="w"> </span><span class="s2">&quot;</span><span class="nv">$API</span><span class="s2">/api/v1/resource/tmdb&quot;</span><span class="w"> </span><span class="se">\</span>
+<span class="w">  </span>-H<span class="w"> </span><span class="s2">&quot;Cookie: session_id=</span><span class="nv">$SESSION_ID</span><span class="s2">&quot;</span>
+<span class="c1"># → HTTP 200</span>
+
+<span class="c1"># 3. Logout</span>
+curl<span class="w"> </span>-s<span class="w"> </span>-X<span class="w"> </span>POST<span class="w"> </span><span class="s2">&quot;</span><span class="nv">$API</span><span class="s2">/api/v1/auth/logout&quot;</span><span class="w"> </span><span class="se">\</span>
+<span class="w">  </span>-H<span class="w"> </span><span class="s2">&quot;Cookie: session_id=</span><span class="nv">$SESSION_ID</span><span class="s2">&quot;</span>
+<span class="c1"># → {&quot;success&quot;: true}</span>
+
+<span class="c1"># 4. Use session again (rejected)</span>
+curl<span class="w"> </span>-s<span class="w"> </span>-o<span class="w"> </span>/dev/null<span class="w"> </span>-w<span class="w"> </span><span class="s2">&quot;HTTP %{http_code}\n&quot;</span><span class="w"> </span><span class="s2">&quot;</span><span class="nv">$API</span><span class="s2">/api/v1/resource/tmdb&quot;</span><span class="w"> </span><span class="se">\</span>
+<span class="w">  </span>-H<span class="w"> </span><span class="s2">&quot;Cookie: session_id=</span><span class="nv">$SESSION_ID</span><span class="s2">&quot;</span>
+<span class="c1"># → HTTP 401</span>
+</code></pre></div>
+
+<h3>Error Responses</h3>
+<table class="table">
+<thead>
+<tr>
+<th>HTTP</th>
+<th>When</th>
+</tr>
+</thead>
+<tbody>
+<tr>
+<td><code>401</code></td>
+<td>Missing or invalid authentication</td>
+</tr>
+<tr>
+<td><code>401</code></td>
+<td>Session expired or logged out</td>
+</tr>
+<tr>
+<td><code>401</code></td>
+<td>JWT expired</td>
+</tr>
+<tr>
+<td><code>401</code></td>
+<td>API key revoked or inactive</td>
+</tr>
+</tbody>
+</table>
+<hr />
+<ul>
+<li><code>POST /api/v1/resource/tmdb/check</code> — test authentication + TMDb API connectivity</li>
+<li><code>GET /health/detailed</code> — view auth status (integrations section)</li>
+</ul>
+<hr />
+<h2>Health Check</h2>
+<div class="codehilite"><pre><span></span><code>curl<span class="w"> </span><span class="s2">&quot;</span><span class="nv">$API</span><span class="s2">/health&quot;</span><span class="w"> </span><span class="p">|</span><span class="w"> </span>jq<span class="w"> </span><span class="s1">&#39;{status, version}&#39;</span>
+</code></pre></div>
+
+<table class="table">
+<thead>
+<tr>
+<th>Field</th>
+<th>Type</th>
+<th>Description</th>
+</tr>
+</thead>
+<tbody>
+<tr>
+<td><code>status</code></td>
+<td>string</td>
+<td><code>ok</code> or <code>degraded</code></td>
+</tr>
+<tr>
+<td><code>version</code></td>
+<td>string</td>
+<td>Semver version</td>
+</tr>
+<tr>
+<td><code>build_git_hash</code></td>
+<td>string</td>
+<td>Git commit hash</td>
+</tr>
+<tr>
+<td><code>build_timestamp</code></td>
+<td>string</td>
+<td>Binary build time</td>
+</tr>
+<tr>
+<td><code>uptime_ms</code></td>
+<td>integer</td>
+<td>Milliseconds since server start</td>
+</tr>
+</tbody>
+</table>
+<div class="codehilite"><pre><span></span><code>curl<span class="w"> </span><span class="s2">&quot;</span><span class="nv">$API</span><span class="s2">/health/detailed&quot;</span><span class="w"> </span><span class="p">|</span><span class="w"> </span>jq<span class="w"> </span><span class="s1">&#39;{status, services, resources: {cpu: .resources.cpu_used_percent, memory: .resources.memory_used_percent}}&#39;</span>
+</code></pre></div>
+
+<table class="table">
+<thead>
+<tr>
+<th>Field</th>
+<th>Type</th>
+<th>Description</th>
+</tr>
+</thead>
+<tbody>
+<tr>
+<td><code>status</code></td>
+<td>string</td>
+<td><code>ok</code> if all essential services healthy</td>
+</tr>
+<tr>
+<td><code>services</code></td>
+<td>object</td>
+<td>Per-service status (postgres, redis, qdrant)</td>
+</tr>
+<tr>
+<td><code>services.*.status</code></td>
+<td>string</td>
+<td><code>ok</code>, <code>error</code>, or <code>degraded</code></td>
+</tr>
+<tr>
+<td><code>services.*.latency_ms</code></td>
+<td>int</td>
+<td>Response time in milliseconds</td>
+</tr>
+<tr>
+<td><code>resources</code></td>
+<td>object</td>
+<td>CPU, memory usage</td>
+</tr>
+<tr>
+<td><code>pipeline.scripts_ready</code></td>
+<td>boolean</td>
+<td>Scripts directory accessible</td>
+</tr>
+<tr>
+<td><code>pipeline.scripts_count</code></td>
+<td>int</td>
+<td>Number of Python processor scripts</td>
+</tr>
+<tr>
+<td><code>pipeline.processors</code></td>
+<td>object</td>
+<td>Per-processor availability</td>
+</tr>
+<tr>
+<td><code>pipeline.models_ready</code></td>
+<td>boolean</td>
+<td>Models directory accessible</td>
+</tr>
+<tr>
+<td><code>pipeline.scripts_integrity</code></td>
+<td>object</td>
+<td>SHA256 checksum verification results</td>
+</tr>
+<tr>
+<td><code>schema.ok</code></td>
+<td>boolean</td>
+<td>All required migrations applied</td>
+</tr>
+<tr>
+<td><code>identities.synced</code></td>
+<td>boolean</td>
+<td>Identity file count matches DB count</td>
+</tr>
+<tr>
+<td><code>integrations.tmdb</code></td>
+<td>object</td>
+<td>TMDb API key config and reachability</td>
+</tr>
+</tbody>
+</table>
+<table class="table">
+<thead>
+<tr>
+<th>Condition</th>
+<th>status</th>
+</tr>
+</thead>
+<tbody>
+<tr>
+<td>All services ok</td>
+<td><code>ok</code></td>
+</tr>
+<tr>
+<td>Any service error</td>
+<td><code>degraded</code></td>
+</tr>
+<tr>
+<td>Postgres or Redis error</td>
+<td><code>degraded</code> (server still responds)</td>
+</tr>
+</tbody>
+</table>
+<table class="table">
+<thead>
+<tr>
+<th>Method</th>
+<th>Endpoint</th>
+<th>Auth</th>
+<th>Description</th>
+</tr>
+</thead>
+<tbody>
+<tr>
+<td>GET</td>
+<td><code>/api/v1/stats/ingest</code></td>
+<td>No</td>
+<td>Ingest pipeline statistics</td>
+</tr>
+<tr>
+<td>GET</td>
+<td><code>/api/v1/stats/sftpgo</code></td>
+<td>No</td>
+<td>SFTPGo service status</td>
+</tr>
+<tr>
+<td>GET</td>
+<td><code>/api/v1/stats/inference</code></td>
+<td>No</td>
+<td>Inference service (LLM) health</td>
+</tr>
+</tbody>
+</table>
+<div class="codehilite"><pre><span></span><code>curl<span class="w"> </span><span class="s2">&quot;</span><span class="nv">$API</span><span class="s2">/api/v1/stats/ingest&quot;</span>
+</code></pre></div>
+
+<hr />
+<h2>File Registration</h2>
+<table class="table">
+<thead>
+<tr>
+<th>Field</th>
+<th>Type</th>
+<th>Required</th>
+<th>Default</th>
+<th>Description</th>
+</tr>
+</thead>
+<tbody>
+<tr>
+<td><code>file_path</code></td>
+<td>string</td>
+<td>Yes</td>
+<td>—</td>
+<td>Path to video file on disk</td>
+</tr>
+<tr>
+<td><code>pattern</code></td>
+<td>string</td>
+<td>No</td>
+<td>—</td>
+<td>Regex pattern for batch register (requires <code>file_path</code> to be a directory)</td>
+</tr>
+<tr>
+<td><code>user_id</code></td>
+<td>integer</td>
+<td>No</td>
+<td>—</td>
+<td>User ID to associate with registration</td>
+</tr>
+<tr>
+<td><code>content_hash</code></td>
+<td>string</td>
+<td>No</td>
+<td>—</td>
+<td>Pre-computed SHA-256 hash (skips computation)</td>
+</tr>
+</tbody>
+</table>
+<div class="codehilite"><pre><span></span><code><span class="c1"># Register a single file</span>
+curl<span class="w"> </span>-s<span class="w"> </span>-X<span class="w"> </span>POST<span class="w"> </span><span class="s2">&quot;</span><span class="nv">$API</span><span class="s2">/api/v1/files/register&quot;</span><span class="w"> </span><span class="se">\</span>
+<span class="w">  </span>-H<span class="w"> </span><span class="s2">&quot;Content-Type: application/json&quot;</span><span class="w"> </span><span class="se">\</span>
+<span class="w">  </span>-H<span class="w"> </span><span class="s2">&quot;X-API-Key: </span><span class="nv">$KEY</span><span class="s2">&quot;</span><span class="w"> </span><span class="se">\</span>
+<span class="w">  </span>-d<span class="w"> </span><span class="s1">&#39;{&quot;file_path&quot;: &quot;/path/to/video.mp4&quot;}&#39;</span>
+
+<span class="c1"># Batch register files matching a pattern in a directory</span>
+curl<span class="w"> </span>-s<span class="w"> </span>-X<span class="w"> </span>POST<span class="w"> </span><span class="s2">&quot;</span><span class="nv">$API</span><span class="s2">/api/v1/files/register&quot;</span><span class="w"> </span><span class="se">\</span>
+<span class="w">  </span>-H<span class="w"> </span><span class="s2">&quot;Content-Type: application/json&quot;</span><span class="w"> </span><span class="se">\</span>
+<span class="w">  </span>-H<span class="w"> </span><span class="s2">&quot;X-API-Key: </span><span class="nv">$KEY</span><span class="s2">&quot;</span><span class="w"> </span><span class="se">\</span>
+<span class="w">  </span>-d<span class="w"> </span><span class="s1">&#39;{&quot;file_path&quot;: &quot;/path/to/dir&quot;, &quot;pattern&quot;: &quot;.*\\.mp4$&quot;}&#39;</span>
+</code></pre></div>
+
+<table class="table">
+<thead>
+<tr>
+<th>Field</th>
+<th>Type</th>
+<th>Description</th>
+</tr>
+</thead>
+<tbody>
+<tr>
+<td><code>success</code></td>
+<td>boolean</td>
+<td>Always true on 200</td>
+</tr>
+<tr>
+<td><code>file_uuid</code></td>
+<td>string</td>
+<td>32-char hex UUID of the registered file</td>
+</tr>
+<tr>
+<td><code>file_name</code></td>
+<td>string</td>
+<td>File name (auto-renamed if name conflict)</td>
+</tr>
+<tr>
+<td><code>file_path</code></td>
+<td>string</td>
+<td>Canonical path on disk</td>
+</tr>
+<tr>
+<td><code>file_type</code></td>
+<td>string</td>
+<td><code>"video"</code>, <code>"audio"</code>, or <code>"unknown"</code></td>
+</tr>
+<tr>
+<td><code>duration</code></td>
+<td>float</td>
+<td>Duration in seconds</td>
+</tr>
+<tr>
+<td><code>width</code></td>
+<td>integer</td>
+<td>Video width in pixels</td>
+</tr>
+<tr>
+<td><code>height</code></td>
+<td>integer</td>
+<td>Video height in pixels</td>
+</tr>
+<tr>
+<td><code>fps</code></td>
+<td>float</td>
+<td>Frames per second</td>
+</tr>
+<tr>
+<td><code>total_frames</code></td>
+<td>integer</td>
+<td>Total frame count</td>
+</tr>
+<tr>
+<td><code>already_exists</code></td>
+<td>boolean</td>
+<td>True if same content was already registered</td>
+</tr>
+<tr>
+<td><code>message</code></td>
+<td>string</td>
+<td>Human-readable status</td>
+</tr>
+</tbody>
+</table>
+<table class="table">
+<thead>
+<tr>
+<th>HTTP</th>
+<th>When</th>
+</tr>
+</thead>
+<tbody>
+<tr>
+<td><code>401</code></td>
+<td>Missing or invalid API key</td>
+</tr>
+<tr>
+<td><code>400</code></td>
+<td>Invalid request body</td>
+</tr>
+<tr>
+<td><code>404</code></td>
+<td>File path does not exist</td>
+</tr>
+</tbody>
+</table>
+<table class="table">
+<thead>
+<tr>
+<th>Field</th>
+<th>Type</th>
+<th>Required</th>
+<th>Default</th>
+<th>Description</th>
+</tr>
+</thead>
+<tbody>
+<tr>
+<td><code>page</code></td>
+<td>integer</td>
+<td>No</td>
+<td>1</td>
+<td>Page number (1-based)</td>
+</tr>
+<tr>
+<td><code>page_size</code></td>
+<td>integer</td>
+<td>No</td>
+<td>all</td>
+<td>Items per page (alias: <code>limit</code>)</td>
+</tr>
+<tr>
+<td><code>limit</code></td>
+<td>integer</td>
+<td>No</td>
+<td>all</td>
+<td>Max items (alias for <code>page_size</code>)</td>
+</tr>
+<tr>
+<td><code>pattern</code></td>
+<td>string</td>
+<td>No</td>
+<td>—</td>
+<td>Regex filter on file name (e.g., <code>.*\.mp4$</code>)</td>
+</tr>
+<tr>
+<td><code>sort_by</code></td>
+<td>string</td>
+<td>No</td>
+<td><code>name</code></td>
+<td>Sort field: <code>name</code>, <code>size</code>, <code>modified</code>, <code>status</code></td>
+</tr>
+<tr>
+<td><code>sort_order</code></td>
+<td>string</td>
+<td>No</td>
+<td><code>asc</code></td>
+<td>Sort direction: <code>asc</code> or <code>desc</code></td>
+</tr>
+</tbody>
+</table>
+<div class="codehilite"><pre><span></span><code><span class="c1"># Full scan</span>
+curl<span class="w"> </span>-s<span class="w"> </span><span class="s2">&quot;</span><span class="nv">$API</span><span class="s2">/api/v1/files/scan&quot;</span><span class="w"> </span>-H<span class="w"> </span><span class="s2">&quot;X-API-Key: </span><span class="nv">$KEY</span><span class="s2">&quot;</span><span class="w"> </span><span class="p">|</span><span class="w"> </span>jq<span class="w"> </span><span class="s1">&#39;{total, registered_count, unregistered_count}&#39;</span>
+
+<span class="c1"># Paginated (page 1, 5 per page)</span>
+curl<span class="w"> </span>-s<span class="w"> </span><span class="s2">&quot;</span><span class="nv">$API</span><span class="s2">/api/v1/files/scan?page=1&amp;page_size=5&quot;</span><span class="w"> </span>-H<span class="w"> </span><span class="s2">&quot;X-API-Key: </span><span class="nv">$KEY</span><span class="s2">&quot;</span><span class="w"> </span><span class="p">|</span><span class="w"> </span>jq<span class="w"> </span><span class="s1">&#39;{page, total_pages, files: [.files[].file_name]}&#39;</span>
+
+<span class="c1"># Regex filter: only mp4 files</span>
+curl<span class="w"> </span>-s<span class="w"> </span><span class="s2">&quot;</span><span class="nv">$API</span><span class="s2">/api/v1/files/scan?pattern=.*\\.mp4</span>$<span class="s2">&quot;</span><span class="w"> </span>-H<span class="w"> </span><span class="s2">&quot;X-API-Key: </span><span class="nv">$KEY</span><span class="s2">&quot;</span><span class="w"> </span><span class="p">|</span><span class="w"> </span>jq<span class="w"> </span><span class="s1">&#39;{filtered_total, files: [.files[].file_name]}&#39;</span>
+
+<span class="c1"># Sort by file size (largest first)</span>
+curl<span class="w"> </span>-s<span class="w"> </span><span class="s2">&quot;</span><span class="nv">$API</span><span class="s2">/api/v1/files/scan?sort_by=size&amp;sort_order=desc&amp;page_size=5&quot;</span><span class="w"> </span>-H<span class="w"> </span><span class="s2">&quot;X-API-Key: </span><span class="nv">$KEY</span><span class="s2">&quot;</span><span class="w"> </span><span class="p">|</span><span class="w"> </span>jq<span class="w"> </span><span class="s1">&#39;[.files[] | {file_name, file_size}]&#39;</span>
+
+<span class="c1"># Sort by modified time (most recent first)</span>
+curl<span class="w"> </span>-s<span class="w"> </span><span class="s2">&quot;</span><span class="nv">$API</span><span class="s2">/api/v1/files/scan?sort_by=modified&amp;sort_order=desc&amp;page_size=5&quot;</span><span class="w"> </span>-H<span class="w"> </span><span class="s2">&quot;X-API-Key: </span><span class="nv">$KEY</span><span class="s2">&quot;</span><span class="w"> </span><span class="p">|</span><span class="w"> </span>jq<span class="w"> </span><span class="s1">&#39;[.files[] | {file_name, modified_time}]&#39;</span>
+
+<span class="c1"># Sort by status</span>
+curl<span class="w"> </span>-s<span class="w"> </span><span class="s2">&quot;</span><span class="nv">$API</span><span class="s2">/api/v1/files/scan?sort_by=status&amp;page_size=5&quot;</span><span class="w"> </span>-H<span class="w"> </span><span class="s2">&quot;X-API-Key: </span><span class="nv">$KEY</span><span class="s2">&quot;</span><span class="w"> </span><span class="p">|</span><span class="w"> </span>jq<span class="w"> </span><span class="s1">&#39;[.files[] | {file_name, status}]&#39;</span>
+</code></pre></div>
+
+<table class="table">
+<thead>
+<tr>
+<th>Field</th>
+<th>Type</th>
+<th>Description</th>
+</tr>
+</thead>
+<tbody>
+<tr>
+<td><code>files</code></td>
+<td>array</td>
+<td>Array of file info objects (paginated)</td>
+</tr>
+<tr>
+<td><code>files[].file_name</code></td>
+<td>string</td>
+<td>File name</td>
+</tr>
+<tr>
+<td><code>files[].relative_path</code></td>
+<td>string</td>
+<td>Path relative to scan root</td>
+</tr>
+<tr>
+<td><code>files[].file_path</code></td>
+<td>string</td>
+<td>Absolute path on disk</td>
+</tr>
+<tr>
+<td><code>files[].file_size</code></td>
+<td>integer</td>
+<td>File size in bytes</td>
+</tr>
+<tr>
+<td><code>files[].modified_time</code></td>
+<td>string</td>
+<td>Last modified timestamp (ISO8601)</td>
+</tr>
+<tr>
+<td><code>files[].is_registered</code></td>
+<td>boolean</td>
+<td>Whether file is registered in DB</td>
+</tr>
+<tr>
+<td><code>files[].file_uuid</code></td>
+<td>string</td>
+<td>32-char hex UUID (only if registered)</td>
+</tr>
+<tr>
+<td><code>files[].status</code></td>
+<td>string</td>
+<td><code>"completed"</code>, <code>"processing"</code>, <code>"registered"</code>, <code>"unregistered"</code>, or <code>null</code></td>
+</tr>
+<tr>
+<td><code>files[].registration_time</code></td>
+<td>string</td>
+<td>DB registration timestamp (only if registered)</td>
+</tr>
+<tr>
+<td><code>files[].job_id</code></td>
+<td>integer</td>
+<td>Processing job ID (only if a job exists)</td>
+</tr>
+<tr>
+<td><code>total</code></td>
+<td>integer</td>
+<td>Total files found on disk (unfiltered)</td>
+</tr>
+<tr>
+<td><code>filtered_total</code></td>
+<td>integer</td>
+<td>Files matching regex filter</td>
+</tr>
+<tr>
+<td><code>page</code></td>
+<td>integer</td>
+<td>Current page number</td>
+</tr>
+<tr>
+<td><code>page_size</code></td>
+<td>integer</td>
+<td>Items per page</td>
+</tr>
+<tr>
+<td><code>total_pages</code></td>
+<td>integer</td>
+<td>Total pages</td>
+</tr>
+<tr>
+<td><code>registered_count</code></td>
+<td>integer</td>
+<td>Files registered in DB</td>
+</tr>
+<tr>
+<td><code>unregistered_count</code></td>
+<td>integer</td>
+<td>Files not yet registered</td>
+</tr>
+</tbody>
+</table>
+<table class="table">
+<thead>
+<tr>
+<th>Feature</th>
+<th>Behavior</th>
+</tr>
+</thead>
+<tbody>
+<tr>
+<td><strong>Regex</strong></td>
+<td>Case-insensitive (<code>(?i)</code> prefix auto-applied). Applied to <code>file_name</code>.</td>
+</tr>
+<tr>
+<td><strong>Sort order</strong></td>
+<td>Default (<code>sort_by=name</code>): registered files first, then alphabetically. <code>sort_by=status</code>: alphabetical by status string.</td>
+</tr>
+<tr>
+<td><strong>Pagination</strong></td>
+<td><code>page_size</code> and <code>limit</code> are aliases. Default: show all results.</td>
+</tr>
+<tr>
+<td><strong>Processing order</strong></td>
+<td><code>pattern</code> regex filter → <code>sort_by</code>/<code>sort_order</code> → <code>page</code>/<code>page_size</code> slice.</td>
+</tr>
+</tbody>
+</table>
+<hr />
+<h2>File Lookup</h2>
+<table class="table">
+<thead>
+<tr>
+<th>Field</th>
+<th>Type</th>
+<th>Required</th>
+<th>Description</th>
+</tr>
+</thead>
+<tbody>
+<tr>
+<td><code>file_name</code></td>
+<td>string</td>
+<td>Yes</td>
+<td>File name to search for (partial matches supported)</td>
+</tr>
+</tbody>
+</table>
+<div class="codehilite"><pre><span></span><code><span class="c1"># Look up a specific file</span>
+curl<span class="w"> </span>-s<span class="w"> </span><span class="s2">&quot;</span><span class="nv">$API</span><span class="s2">/api/v1/files/lookup?file_name=video.mp4&quot;</span><span class="w"> </span><span class="se">\</span>
+<span class="w">  </span>-H<span class="w"> </span><span class="s2">&quot;X-API-Key: </span><span class="nv">$KEY</span><span class="s2">&quot;</span>
+
+<span class="c1"># Partial name search</span>
+curl<span class="w"> </span>-s<span class="w"> </span><span class="s2">&quot;</span><span class="nv">$API</span><span class="s2">/api/v1/files/lookup?file_name=charade&quot;</span><span class="w"> </span><span class="se">\</span>
+<span class="w">  </span>-H<span class="w"> </span><span class="s2">&quot;X-API-Key: </span><span class="nv">$KEY</span><span class="s2">&quot;</span><span class="w"> </span><span class="p">|</span><span class="w"> </span>jq<span class="w"> </span><span class="s1">&#39;.matches[].file_name&#39;</span>
+</code></pre></div>
+
+<table class="table">
+<thead>
+<tr>
+<th>Field</th>
+<th>Type</th>
+<th>Description</th>
+</tr>
+</thead>
+<tbody>
+<tr>
+<td><code>file_name</code></td>
+<td>string</td>
+<td>Searched name</td>
+</tr>
+<tr>
+<td><code>exists</code></td>
+<td>boolean</td>
+<td>Exact name match exists</td>
+</tr>
+<tr>
+<td><code>matches</code></td>
+<td>array</td>
+<td>Array of matching registered files</td>
+</tr>
+<tr>
+<td><code>matches[].file_uuid</code></td>
+<td>string</td>
+<td>32-char hex UUID</td>
+</tr>
+<tr>
+<td><code>matches[].file_name</code></td>
+<td>string</td>
+<td>Registered file name</td>
+</tr>
+<tr>
+<td><code>matches[].file_type</code></td>
+<td>string</td>
+<td><code>"video"</code>, <code>"audio"</code>, or <code>null</code></td>
+</tr>
+<tr>
+<td><code>matches[].status</code></td>
+<td>string</td>
+<td>Registration/processing status</td>
+</tr>
+<tr>
+<td><code>next_name</code></td>
+<td>string</td>
+<td>Suggested name for avoiding conflicts</td>
+</tr>
+</tbody>
+</table>
+<h2>Unregister</h2>
+<table class="table">
+<thead>
+<tr>
+<th>Removed (default)</th>
+<th>Not removed</th>
+</tr>
+</thead>
+<tbody>
+<tr>
+<td>Database records (videos, chunks, embeddings, processor_results, pre_chunks)</td>
+<td>The original source video file on disk</td>
+</tr>
+<tr>
+<td>Processor output JSON files (<code>{uuid}.*.json</code>) — unless <code>delete_output_files: false</code></td>
+<td>Temp/working directories</td>
+</tr>
+<tr>
+<td>In-memory cache entries</td>
+<td></td>
+</tr>
+<tr>
+<td>MongoDB cached lists</td>
+<td></td>
+</tr>
+</tbody>
+</table>
+<table class="table">
+<thead>
+<tr>
+<th>Field</th>
+<th>Type</th>
+<th>Required</th>
+<th>Default</th>
+<th>Description</th>
+</tr>
+</thead>
+<tbody>
+<tr>
+<td><code>file_uuid</code></td>
+<td>string</td>
+<td>*</td>
+<td>—</td>
+<td>Single file UUID to delete</td>
+</tr>
+<tr>
+<td><code>file_path</code></td>
+<td>string</td>
+<td>*</td>
+<td>—</td>
+<td>Directory path (for batch delete)</td>
+</tr>
+<tr>
+<td><code>pattern</code></td>
+<td>string</td>
+<td>*</td>
+<td>—</td>
+<td>Regex pattern (requires <code>file_path</code>)</td>
+</tr>
+<tr>
+<td><code>delete_output_files</code></td>
+<td>boolean</td>
+<td>No</td>
+<td><code>true</code></td>
+<td>If <code>true</code>, also delete processor output JSON files (<code>{uuid}.*.json</code>). Set to <code>false</code> to keep them.</td>
+</tr>
+</tbody>
+</table>
+<div class="codehilite"><pre><span></span><code><span class="c1"># Delete a single file by UUID (default: also deletes output JSON files)</span>
+curl<span class="w"> </span>-s<span class="w"> </span>-X<span class="w"> </span>POST<span class="w"> </span><span class="s2">&quot;</span><span class="nv">$API</span><span class="s2">/api/v1/unregister&quot;</span><span class="w"> </span><span class="se">\</span>
+<span class="w">  </span>-H<span class="w"> </span><span class="s2">&quot;Content-Type: application/json&quot;</span><span class="w"> </span><span class="se">\</span>
+<span class="w">  </span>-H<span class="w"> </span><span class="s2">&quot;X-API-Key: </span><span class="nv">$KEY</span><span class="s2">&quot;</span><span class="w"> </span><span class="se">\</span>
+<span class="w">  </span>-d<span class="w"> </span><span class="s1">&#39;{&quot;file_uuid&quot;: &quot;&#39;</span><span class="s2">&quot;</span><span class="nv">$FILE_UUID</span><span class="s2">&quot;</span><span class="s1">&#39;&quot;}&#39;</span>
+
+<span class="c1"># Keep output JSON files, only delete DB records</span>
+curl<span class="w"> </span>-s<span class="w"> </span>-X<span class="w"> </span>POST<span class="w"> </span><span class="s2">&quot;</span><span class="nv">$API</span><span class="s2">/api/v1/unregister&quot;</span><span class="w"> </span><span class="se">\</span>
+<span class="w">  </span>-H<span class="w"> </span><span class="s2">&quot;Content-Type: application/json&quot;</span><span class="w"> </span><span class="se">\</span>
+<span class="w">  </span>-H<span class="w"> </span><span class="s2">&quot;X-API-Key: </span><span class="nv">$KEY</span><span class="s2">&quot;</span><span class="w"> </span><span class="se">\</span>
+<span class="w">  </span>-d<span class="w"> </span><span class="s1">&#39;{&quot;file_uuid&quot;: &quot;&#39;</span><span class="s2">&quot;</span><span class="nv">$FILE_UUID</span><span class="s2">&quot;</span><span class="s1">&#39;&quot;, &quot;delete_output_files&quot;: false}&#39;</span>
+
+<span class="c1"># Batch delete all mp4 files in a directory</span>
+curl<span class="w"> </span>-s<span class="w"> </span>-X<span class="w"> </span>POST<span class="w"> </span><span class="s2">&quot;</span><span class="nv">$API</span><span class="s2">/api/v1/unregister&quot;</span><span class="w"> </span><span class="se">\</span>
+<span class="w">  </span>-H<span class="w"> </span><span class="s2">&quot;Content-Type: application/json&quot;</span><span class="w"> </span><span class="se">\</span>
+<span class="w">  </span>-H<span class="w"> </span><span class="s2">&quot;X-API-Key: </span><span class="nv">$KEY</span><span class="s2">&quot;</span><span class="w"> </span><span class="se">\</span>
+<span class="w">  </span>-d<span class="w"> </span><span class="s1">&#39;{&quot;file_path&quot;: &quot;/path/to/dir&quot;, &quot;pattern&quot;: &quot;.*\\.mp4$&quot;}&#39;</span>
+</code></pre></div>
+
+<table class="table">
+<thead>
+<tr>
+<th>Field</th>
+<th>Type</th>
+<th>Description</th>
+</tr>
+</thead>
+<tbody>
+<tr>
+<td><code>success</code></td>
+<td>boolean</td>
+<td>True if deletion succeeded</td>
+</tr>
+<tr>
+<td><code>file_uuid</code></td>
+<td>string</td>
+<td>UUID of the deleted file (single mode)</td>
+</tr>
+<tr>
+<td><code>message</code></td>
+<td>string</td>
+<td>Human-readable status</td>
+</tr>
+</tbody>
+</table>
+<table class="table">
+<thead>
+<tr>
+<th>HTTP</th>
+<th>When</th>
+</tr>
+</thead>
+<tbody>
+<tr>
+<td><code>400</code></td>
+<td>Neither <code>file_uuid</code> nor <code>file_path</code>+<code>pattern</code> provided</td>
+</tr>
+<tr>
+<td><code>404</code></td>
+<td>File UUID not found</td>
+</tr>
+<tr>
+<td><code>401</code></td>
+<td>Missing or invalid API key</td>
+</tr>
+</tbody>
+</table>
+<hr />
+<h2>Processing Pipeline</h2>
+<table class="table">
+<thead>
+<tr>
+<th>Field</th>
+<th>Type</th>
+<th>Required</th>
+<th>Default</th>
+<th>Description</th>
+</tr>
+</thead>
+<tbody>
+<tr>
+<td><code>processors</code></td>
+<td>string[]</td>
+<td>No</td>
+<td>all</td>
+<td>Specific processors to run: <code>["asr","cut","yolo","ocr","face","pose","asrx","visual_chunk"]</code></td>
+</tr>
+<tr>
+<td><code>rules</code></td>
+<td>string[]</td>
+<td>No</td>
+<td>all</td>
+<td>Rule names to apply (currently unused)</td>
+</tr>
+</tbody>
+</table>
+<div class="codehilite"><pre><span></span><code><span class="c1"># Run all processors</span>
+curl<span class="w"> </span>-s<span class="w"> </span>-X<span class="w"> </span>POST<span class="w"> </span><span class="s2">&quot;</span><span class="nv">$API</span><span class="s2">/api/v1/file/</span><span class="nv">$FILE_UUID</span><span class="s2">/process&quot;</span><span class="w"> </span><span class="se">\</span>
+<span class="w">  </span>-H<span class="w"> </span><span class="s2">&quot;Content-Type: application/json&quot;</span><span class="w"> </span><span class="se">\</span>
+<span class="w">  </span>-H<span class="w"> </span><span class="s2">&quot;X-API-Key: </span><span class="nv">$KEY</span><span class="s2">&quot;</span><span class="w"> </span>-d<span class="w"> </span><span class="s1">&#39;{}&#39;</span>
+
+<span class="c1"># Run specific processors only</span>
+curl<span class="w"> </span>-s<span class="w"> </span>-X<span class="w"> </span>POST<span class="w"> </span><span class="s2">&quot;</span><span class="nv">$API</span><span class="s2">/api/v1/file/</span><span class="nv">$FILE_UUID</span><span class="s2">/process&quot;</span><span class="w"> </span><span class="se">\</span>
+<span class="w">  </span>-H<span class="w"> </span><span class="s2">&quot;Content-Type: application/json&quot;</span><span class="w"> </span><span class="se">\</span>
+<span class="w">  </span>-H<span class="w"> </span><span class="s2">&quot;X-API-Key: </span><span class="nv">$KEY</span><span class="s2">&quot;</span><span class="w"> </span><span class="se">\</span>
+<span class="w">  </span>-d<span class="w"> </span><span class="s1">&#39;{&quot;processors&quot;: [&quot;asr&quot;, &quot;face&quot;, &quot;yolo&quot;]}&#39;</span>
+</code></pre></div>
+
+<table class="table">
+<thead>
+<tr>
+<th>Field</th>
+<th>Type</th>
+<th>Description</th>
+</tr>
+</thead>
+<tbody>
+<tr>
+<td><code>success</code></td>
+<td>boolean</td>
+<td>Always true on 200</td>
+</tr>
+<tr>
+<td><code>job_id</code></td>
+<td>integer</td>
+<td>Monitor job ID (for job tracking)</td>
+</tr>
+<tr>
+<td><code>file_uuid</code></td>
+<td>string</td>
+<td>32-char hex UUID of the file</td>
+</tr>
+<tr>
+<td><code>status</code></td>
+<td>string</td>
+<td><code>"processing"</code></td>
+</tr>
+<tr>
+<td><code>pids</code></td>
+<td>integer[]</td>
+<td>Process IDs of started processors</td>
+</tr>
+<tr>
+<td><code>message</code></td>
+<td>string</td>
+<td>Human-readable status</td>
+</tr>
+</tbody>
+</table>
+<table class="table">
+<thead>
+<tr>
+<th>HTTP</th>
+<th>When</th>
+</tr>
+</thead>
+<tbody>
+<tr>
+<td><code>404</code></td>
+<td>File UUID not found</td>
+</tr>
+<tr>
+<td><code>401</code></td>
+<td>Missing or invalid API key</td>
+</tr>
+</tbody>
+</table>
+<div class="codehilite"><pre><span></span><code>curl<span class="w"> </span>-s<span class="w"> </span><span class="s2">&quot;</span><span class="nv">$API</span><span class="s2">/api/v1/file/</span><span class="nv">$FILE_UUID</span><span class="s2">/probe&quot;</span><span class="w"> </span>-H<span class="w"> </span><span class="s2">&quot;X-API-Key: </span><span class="nv">$KEY</span><span class="s2">&quot;</span>
+</code></pre></div>
+
+<table class="table">
+<thead>
+<tr>
+<th>Field</th>
+<th>Type</th>
+<th>Description</th>
+</tr>
+</thead>
+<tbody>
+<tr>
+<td><code>file_uuid</code></td>
+<td>string</td>
+<td>32-char hex UUID</td>
+</tr>
+<tr>
+<td><code>file_name</code></td>
+<td>string</td>
+<td>File name</td>
+</tr>
+<tr>
+<td><code>file_size</code></td>
+<td>integer</td>
+<td>File size in bytes (from filesystem)</td>
+</tr>
+<tr>
+<td><code>duration</code></td>
+<td>float</td>
+<td>Duration in seconds</td>
+</tr>
+<tr>
+<td><code>width</code></td>
+<td>integer</td>
+<td>Video width in pixels</td>
+</tr>
+<tr>
+<td><code>height</code></td>
+<td>integer</td>
+<td>Video height in pixels</td>
+</tr>
+<tr>
+<td><code>fps</code></td>
+<td>float</td>
+<td>Frames per second</td>
+</tr>
+<tr>
+<td><code>total_frames</code></td>
+<td>integer</td>
+<td>Estimated total frames</td>
+</tr>
+<tr>
+<td><code>cached</code></td>
+<td>boolean</td>
+<td>True if result was from cached probe JSON</td>
+</tr>
+<tr>
+<td><code>format</code></td>
+<td>object</td>
+<td>Container format info (ffprobe format section)</td>
+</tr>
+<tr>
+<td><code>streams</code></td>
+<td>array</td>
+<td>Array of stream info objects</td>
+</tr>
+</tbody>
+</table>
+<div class="codehilite"><pre><span></span><code>curl<span class="w"> </span>-s<span class="w"> </span><span class="s2">&quot;</span><span class="nv">$API</span><span class="s2">/api/v1/progress/</span><span class="nv">$FILE_UUID</span><span class="s2">&quot;</span><span class="w"> </span>-H<span class="w"> </span><span class="s2">&quot;X-API-Key: </span><span class="nv">$KEY</span><span class="s2">&quot;</span><span class="w"> </span><span class="p">|</span><span class="w"> </span>jq<span class="w"> </span><span class="s1">&#39;{overall_progress, processors: [.processors[] | {processor_type, status}]}&#39;</span>
+</code></pre></div>
+
+<table class="table">
+<thead>
+<tr>
+<th>Field</th>
+<th>Type</th>
+<th>Description</th>
+</tr>
+</thead>
+<tbody>
+<tr>
+<td><code>file_uuid</code></td>
+<td>string</td>
+<td>32-char hex UUID</td>
+</tr>
+<tr>
+<td><code>overall_progress</code></td>
+<td>integer</td>
+<td>Overall progress percentage (0–100)</td>
+</tr>
+<tr>
+<td><code>processors</code></td>
+<td>array</td>
+<td>Per-processor status list</td>
+</tr>
+<tr>
+<td><code>processors[].processor_type</code></td>
+<td>string</td>
+<td>Processor name (<code>asr</code>, <code>cut</code>, <code>yolo</code>, etc.)</td>
+</tr>
+<tr>
+<td><code>processors[].status</code></td>
+<td>string</td>
+<td><code>"pending"</code>, <code>"running"</code>, <code>"complete"</code>, or <code>"failed"</code></td>
+</tr>
+<tr>
+<td><code>processors[].progress</code></td>
+<td>integer</td>
+<td>Per-processor progress (0–100)</td>
+</tr>
+<tr>
+<td><code>cpu_percent</code></td>
+<td>float</td>
+<td>Current CPU usage</td>
+</tr>
+<tr>
+<td><code>gpu_percent</code></td>
+<td>float</td>
+<td>Current GPU utilization</td>
+</tr>
+<tr>
+<td><code>memory_percent</code></td>
+<td>float</td>
+<td>Current memory usage</td>
+</tr>
+</tbody>
+</table>
+<div class="codehilite"><pre><span></span><code>curl<span class="w"> </span>-s<span class="w"> </span><span class="s2">&quot;</span><span class="nv">$API</span><span class="s2">/api/v1/jobs&quot;</span><span class="w"> </span>-H<span class="w"> </span><span class="s2">&quot;X-API-Key: </span><span class="nv">$KEY</span><span class="s2">&quot;</span><span class="w"> </span><span class="p">|</span><span class="w"> </span>jq<span class="w"> </span><span class="s1">&#39;{count, jobs: [.jobs[] | {uuid, status}]}&#39;</span>
+</code></pre></div>
+
+<table class="table">
+<thead>
+<tr>
+<th>Field</th>
+<th>Type</th>
+<th>Description</th>
+</tr>
+</thead>
+<tbody>
+<tr>
+<td><code>jobs</code></td>
+<td>array</td>
+<td>Array of job info objects</td>
+</tr>
+<tr>
+<td><code>jobs[].id</code></td>
+<td>integer</td>
+<td>Job ID</td>
+</tr>
+<tr>
+<td><code>jobs[].uuid</code></td>
+<td>string</td>
+<td>File UUID being processed</td>
+</tr>
+<tr>
+<td><code>jobs[].status</code></td>
+<td>string</td>
+<td><code>"pending"</code>, <code>"running"</code>, <code>"completed"</code>, <code>"failed"</code></td>
+</tr>
+<tr>
+<td><code>jobs[].current_processor</code></td>
+<td>string</td>
+<td>Currently active processor, or null</td>
+</tr>
+<tr>
+<td><code>count</code></td>
+<td>integer</td>
+<td>Total job count</td>
+</tr>
+<tr>
+<td><code>page</code></td>
+<td>integer</td>
+<td>Current page number</td>
+</tr>
+<tr>
+<td><code>page_size</code></td>
+<td>integer</td>
+<td>Jobs per page</td>
+</tr>
+</tbody>
+</table>
+<hr />
+<h2>Search APIs</h2>
+<table class="table">
+<thead>
+<tr>
+<th>Field</th>
+<th>Type</th>
+<th>Required</th>
+<th>Default</th>
+<th>Description</th>
+</tr>
+</thead>
+<tbody>
+<tr>
+<td><code>query</code></td>
+<td>string</td>
+<td>Yes</td>
+<td>—</td>
+<td>Search text</td>
+</tr>
+<tr>
+<td><code>file_uuid</code></td>
+<td>string</td>
+<td>No</td>
+<td>—</td>
+<td>Restrict search to a specific file</td>
+</tr>
+<tr>
+<td><code>limit</code></td>
+<td>integer</td>
+<td>No</td>
+<td>10</td>
+<td>Max results</td>
+</tr>
+<tr>
+<td><code>page</code></td>
+<td>integer</td>
+<td>No</td>
+<td>1</td>
+<td>Page number (1-based)</td>
+</tr>
+<tr>
+<td><code>page_size</code></td>
+<td>integer</td>
+<td>No</td>
+<td><code>limit</code></td>
+<td>Items per page (alias: <code>limit</code>)</td>
+</tr>
+<tr>
+<td><code>mode</code></td>
+<td>string</td>
+<td>No</td>
+<td><code>smart</code></td>
+<td>Search mode: <code>"vector"</code> or <code>"smart"</code></td>
+</tr>
+</tbody>
+</table>
+<div class="codehilite"><pre><span></span><code><span class="c1"># Search across all files</span>
+curl<span class="w"> </span>-s<span class="w"> </span>-X<span class="w"> </span>POST<span class="w"> </span><span class="s2">&quot;</span><span class="nv">$API</span><span class="s2">/api/v1/search&quot;</span><span class="w"> </span><span class="se">\</span>
+<span class="w">  </span>-H<span class="w"> </span><span class="s2">&quot;Content-Type: application/json&quot;</span><span class="w"> </span><span class="se">\</span>
+<span class="w">  </span>-H<span class="w"> </span><span class="s2">&quot;X-API-Key: </span><span class="nv">$KEY</span><span class="s2">&quot;</span><span class="w"> </span><span class="se">\</span>
+<span class="w">  </span>-d<span class="w"> </span><span class="s1">&#39;{&quot;query&quot;: &quot;charade&quot;, &quot;limit&quot;: 5}&#39;</span>
+
+<span class="c1"># Search within a specific file</span>
+curl<span class="w"> </span>-s<span class="w"> </span>-X<span class="w"> </span>POST<span class="w"> </span><span class="s2">&quot;</span><span class="nv">$API</span><span class="s2">/api/v1/search&quot;</span><span class="w"> </span><span class="se">\</span>
+<span class="w">  </span>-H<span class="w"> </span><span class="s2">&quot;Content-Type: application/json&quot;</span><span class="w"> </span><span class="se">\</span>
+<span class="w">  </span>-H<span class="w"> </span><span class="s2">&quot;X-API-Key: </span><span class="nv">$KEY</span><span class="s2">&quot;</span><span class="w"> </span><span class="se">\</span>
+<span class="w">  </span>-d<span class="w"> </span><span class="s1">&#39;{&quot;query&quot;: &quot;charade&quot;, &quot;file_uuid&quot;: &quot;&#39;</span><span class="s2">&quot;</span><span class="nv">$FILE_UUID</span><span class="s2">&quot;</span><span class="s1">&#39;&quot;}&#39;</span>
+
+<span class="c1"># Paginated search</span>
+curl<span class="w"> </span>-s<span class="w"> </span>-X<span class="w"> </span>POST<span class="w"> </span><span class="s2">&quot;</span><span class="nv">$API</span><span class="s2">/api/v1/search&quot;</span><span class="w"> </span><span class="se">\</span>
+<span class="w">  </span>-H<span class="w"> </span><span class="s2">&quot;Content-Type: application/json&quot;</span><span class="w"> </span><span class="se">\</span>
+<span class="w">  </span>-H<span class="w"> </span><span class="s2">&quot;X-API-Key: </span><span class="nv">$KEY</span><span class="s2">&quot;</span><span class="w"> </span><span class="se">\</span>
+<span class="w">  </span>-d<span class="w"> </span><span class="s1">&#39;{&quot;query&quot;: &quot;charade&quot;, &quot;page&quot;: 1, &quot;page_size&quot;: 3}&#39;</span>
+</code></pre></div>
+
+<table class="table">
+<thead>
+<tr>
+<th>Field</th>
+<th>Type</th>
+<th>Description</th>
+</tr>
+</thead>
+<tbody>
+<tr>
+<td><code>results</code></td>
+<td>array</td>
+<td>Array of matched chunks (deduplicated)</td>
+</tr>
+<tr>
+<td><code>results[].uuid</code></td>
+<td>string</td>
+<td>File UUID</td>
+</tr>
+<tr>
+<td><code>results[].chunk_id</code></td>
+<td>string</td>
+<td>Chunk identifier</td>
+</tr>
+<tr>
+<td><code>results[].chunk_type</code></td>
+<td>string</td>
+<td><code>"sentence"</code>, <code>"cut"</code>, <code>"trace"</code>, <code>"visual"</code></td>
+</tr>
+<tr>
+<td><code>results[].start_time</code></td>
+<td>float</td>
+<td>Start time in seconds</td>
+</tr>
+<tr>
+<td><code>results[].end_time</code></td>
+<td>float</td>
+<td>End time in seconds</td>
+</tr>
+<tr>
+<td><code>results[].text</code></td>
+<td>string</td>
+<td>Chunk text content</td>
+</tr>
+<tr>
+<td><code>results[].score</code></td>
+<td>float</td>
+<td>Similarity score (0.0–1.0)</td>
+</tr>
+<tr>
+<td><code>query</code></td>
+<td>string</td>
+<td>Original search query</td>
+</tr>
+<tr>
+<td><code>total</code></td>
+<td>integer</td>
+<td>Total matching results</td>
+</tr>
+<tr>
+<td><code>page</code></td>
+<td>integer</td>
+<td>Current page number</td>
+</tr>
+<tr>
+<td><code>page_size</code></td>
+<td>integer</td>
+<td>Items per page</td>
+</tr>
+</tbody>
+</table>
+<table class="table">
+<thead>
+<tr>
+<th>HTTP</th>
+<th>When</th>
+</tr>
+</thead>
+<tbody>
+<tr>
+<td><code>401</code></td>
+<td>Missing or invalid API key</td>
+</tr>
+</tbody>
+</table>
+<table class="table">
+<thead>
+<tr>
+<th>Field</th>
+<th>Type</th>
+<th>Required</th>
+<th>Default</th>
+<th>Description</th>
+</tr>
+</thead>
+<tbody>
+<tr>
+<td><code>query</code></td>
+<td>string</td>
+<td>Yes</td>
+<td>—</td>
+<td>Search text</td>
+</tr>
+<tr>
+<td><code>file_uuid</code></td>
+<td>string</td>
+<td>No</td>
+<td>—</td>
+<td>Restrict search to a specific file</td>
+</tr>
+<tr>
+<td><code>limit</code></td>
+<td>integer</td>
+<td>No</td>
+<td>10</td>
+<td>Max results</td>
+</tr>
+<tr>
+<td><code>page</code></td>
+<td>integer</td>
+<td>No</td>
+<td>1</td>
+<td>Page number (1-based)</td>
+</tr>
+<tr>
+<td><code>page_size</code></td>
+<td>integer</td>
+<td>No</td>
+<td><code>limit</code></td>
+<td>Items per page</td>
+</tr>
+<tr>
+<td><code>vector_weight</code></td>
+<td>float</td>
+<td>No</td>
+<td>0.5</td>
+<td>Weight for vector score (0.0–1.0)</td>
+</tr>
+<tr>
+<td><code>bm25_weight</code></td>
+<td>float</td>
+<td>No</td>
+<td>0.5</td>
+<td>Weight for BM25 score (0.0–1.0)</td>
+</tr>
+</tbody>
+</table>
+<table class="table">
+<thead>
+<tr>
+<th>Field</th>
+<th>Type</th>
+<th>Description</th>
+</tr>
+</thead>
+<tbody>
+<tr>
+<td><code>results[].vector_score</code></td>
+<td>float</td>
+<td>Vector similarity score</td>
+</tr>
+<tr>
+<td><code>results[].bm25_score</code></td>
+<td>float</td>
+<td>BM25 text score</td>
+</tr>
+<tr>
+<td><code>results[].combined_score</code></td>
+<td>float</td>
+<td>Weighted combination of both scores</td>
+</tr>
+</tbody>
+</table>
+<table class="table">
+<thead>
+<tr>
+<th>Method</th>
+<th>Endpoint</th>
+<th>Description</th>
+</tr>
+</thead>
+<tbody>
+<tr>
+<td>POST</td>
+<td><code>/api/v1/n8n/search</code></td>
+<td>N8N-format vector search</td>
+</tr>
+<tr>
+<td>POST</td>
+<td><code>/api/v1/n8n/search/bm25</code></td>
+<td>N8N-format BM25 search</td>
+</tr>
+<tr>
+<td>POST</td>
+<td><code>/api/v1/n8n/search/hybrid</code></td>
+<td>N8N-format hybrid search</td>
+</tr>
+<tr>
+<td>POST</td>
+<td><code>/api/v1/n8n/search/smart</code></td>
+<td>N8N-format smart search</td>
+</tr>
+</tbody>
+</table>
+<table class="table">
+<thead>
+<tr>
+<th>Field</th>
+<th>Type</th>
+<th>Required</th>
+<th>Default</th>
+<th>Description</th>
+</tr>
+</thead>
+<tbody>
+<tr>
+<td><code>query</code></td>
+<td>string</td>
+<td>Yes</td>
+<td>—</td>
+<td>Search text</td>
+</tr>
+<tr>
+<td><code>file_uuid</code></td>
+<td>string</td>
+<td>No</td>
+<td>—</td>
+<td>Restrict to specific file</td>
+</tr>
+<tr>
+<td><code>types</code></td>
+<td>string[]</td>
+<td>No</td>
+<td><code>["chunk"]</code></td>
+<td>Search types: <code>chunk</code>, <code>frame</code>, <code>person</code></td>
+</tr>
+<tr>
+<td><code>filters</code></td>
+<td>object</td>
+<td>No</td>
+<td>—</td>
+<td>Filter criteria (confidence, object class, speaker, etc.)</td>
+</tr>
+<tr>
+<td><code>page</code></td>
+<td>integer</td>
+<td>No</td>
+<td>1</td>
+<td>Page number</td>
+</tr>
+<tr>
+<td><code>page_size</code></td>
+<td>integer</td>
+<td>No</td>
+<td>20</td>
+<td>Items per page</td>
+</tr>
+<tr>
+<td><code>time_range</code></td>
+<td>float[2]</td>
+<td>No</td>
+<td>—</td>
+<td>Time range <code>[start, end]</code> in seconds</td>
+</tr>
+</tbody>
+</table>
+<div class="codehilite"><pre><span></span><code>curl<span class="w"> </span>-s<span class="w"> </span>-X<span class="w"> </span>POST<span class="w"> </span><span class="s2">&quot;</span><span class="nv">$API</span><span class="s2">/api/v1/n8n/search&quot;</span><span class="w"> </span><span class="se">\</span>
+<span class="w">  </span>-H<span class="w"> </span><span class="s2">&quot;Content-Type: application/json&quot;</span><span class="w"> </span><span class="se">\</span>
+<span class="w">  </span>-H<span class="w"> </span><span class="s2">&quot;X-API-Key: </span><span class="nv">$KEY</span><span class="s2">&quot;</span><span class="w"> </span><span class="se">\</span>
+<span class="w">  </span>-d<span class="w"> </span><span class="s1">&#39;{&quot;query&quot;: &quot;charade&quot;, &quot;limit&quot;: 5}&#39;</span>
+</code></pre></div>
+
+<table class="table">
+<thead>
+<tr>
+<th>Field</th>
+<th>Type</th>
+<th>Description</th>
+</tr>
+</thead>
+<tbody>
+<tr>
+<td><code>results</code></td>
+<td>array</td>
+<td>Array of search results</td>
+</tr>
+<tr>
+<td><code>results[].type</code></td>
+<td>string</td>
+<td>Result type: <code>"chunk"</code>, <code>"frame"</code>, or <code>"person"</code></td>
+</tr>
+<tr>
+<td><code>results[].chunk_id</code></td>
+<td>string</td>
+<td>Chunk identifier</td>
+</tr>
+<tr>
+<td><code>results[].chunk_type</code></td>
+<td>string</td>
+<td>Chunk type</td>
+</tr>
+<tr>
+<td><code>results[].file_uuid</code></td>
+<td>string</td>
+<td>File UUID</td>
+</tr>
+<tr>
+<td><code>results[].start_time</code></td>
+<td>float</td>
+<td>Start time in seconds</td>
+</tr>
+<tr>
+<td><code>results[].end_time</code></td>
+<td>float</td>
+<td>End time in seconds</td>
+</tr>
+<tr>
+<td><code>results[].text</code></td>
+<td>string</td>
+<td>Content text</td>
+</tr>
+<tr>
+<td><code>results[].score</code></td>
+<td>float</td>
+<td>Relevance score</td>
+</tr>
+<tr>
+<td><code>total</code></td>
+<td>integer</td>
+<td>Total matching results</td>
+</tr>
+<tr>
+<td><code>page</code></td>
+<td>integer</td>
+<td>Current page</td>
+</tr>
+<tr>
+<td><code>page_size</code></td>
+<td>integer</td>
+<td>Items per page</td>
+</tr>
+<tr>
+<td><code>took_ms</code></td>
+<td>integer</td>
+<td>Query execution time in milliseconds</td>
+</tr>
+</tbody>
+</table>
+<table class="table">
+<thead>
+<tr>
+<th>Field</th>
+<th>Type</th>
+<th>Required</th>
+<th>Description</th>
+</tr>
+</thead>
+<tbody>
+<tr>
+<td><code>file_uuid</code></td>
+<td>string</td>
+<td>Yes</td>
+<td>File UUID to search within</td>
+</tr>
+<tr>
+<td><code>q</code></td>
+<td>string</td>
+<td>Yes</td>
+<td>Text search query</td>
+</tr>
+<tr>
+<td><code>limit</code></td>
+<td>integer</td>
+<td>No</td>
+<td>Max results (default 50)</td>
+</tr>
+<tr>
+<td><code>page</code></td>
+<td>integer</td>
+<td>No</td>
+<td>Page number (default 1)</td>
+</tr>
+<tr>
+<td><code>page_size</code></td>
+<td>integer</td>
+<td>No</td>
+<td>Items per page (defaults to <code>limit</code>)</td>
+</tr>
+</tbody>
+</table>
+<div class="codehilite"><pre><span></span><code>curl<span class="w"> </span>-s<span class="w"> </span><span class="s2">&quot;</span><span class="nv">$API</span><span class="s2">/api/v1/search/identity_text?file_uuid=</span><span class="nv">$FILE_UUID</span><span class="s2">&amp;q=charade&amp;page=1&amp;page_size=5&quot;</span><span class="w"> </span><span class="se">\</span>
+<span class="w">  </span>-H<span class="w"> </span><span class="s2">&quot;X-API-Key: </span><span class="nv">$KEY</span><span class="s2">&quot;</span>
+</code></pre></div>
+
+<table class="table">
+<thead>
+<tr>
+<th>Field</th>
+<th>Type</th>
+<th>Description</th>
+</tr>
+</thead>
+<tbody>
+<tr>
+<td><code>file_uuid</code></td>
+<td>string</td>
+<td>File UUID</td>
+</tr>
+<tr>
+<td><code>chunk_id</code></td>
+<td>string</td>
+<td>Chunk identifier</td>
+</tr>
+<tr>
+<td><code>start_time</code></td>
+<td>float</td>
+<td>Start time in seconds</td>
+</tr>
+<tr>
+<td><code>end_time</code></td>
+<td>float</td>
+<td>End time in seconds</td>
+</tr>
+<tr>
+<td><code>text_content</code></td>
+<td>string</td>
+<td>Chunk text content</td>
+</tr>
+<tr>
+<td><code>identity_id</code></td>
+<td>integer</td>
+<td>Identity ID (null if no identity matched)</td>
+</tr>
+<tr>
+<td><code>identity_name</code></td>
+<td>string</td>
+<td>Identity name (null if no identity matched)</td>
+</tr>
+<tr>
+<td><code>identity_source</code></td>
+<td>string</td>
+<td>Identity origin. <code>.json</code> = established from identity.json files on disk (unified format for all sources). <code>tmdb</code> = from <code>.json</code> via TMDb enrichment probe, then matched against faces. <code>auto</code> = pipeline face matching result; only stranger identities are auto-created. <code>user_defined</code> = manual. <code>merged</code> = merged identities.</td>
+</tr>
+<tr>
+<td><code>trace_id</code></td>
+<td>integer</td>
+<td>Face trace ID (null if no trace matched)</td>
+</tr>
+</tbody>
+</table>
+<table class="table">
+<thead>
+<tr>
+<th>Field</th>
+<th>Type</th>
+<th>Required</th>
+<th>Description</th>
+</tr>
+</thead>
+<tbody>
+<tr>
+<td><code>q</code></td>
+<td>string</td>
+<td>Yes</td>
+<td>Identity name search</td>
+</tr>
+<tr>
+<td><code>file_uuid</code></td>
+<td>string</td>
+<td>No</td>
+<td>Restrict to specific file</td>
+</tr>
+<tr>
+<td><code>limit</code></td>
+<td>integer</td>
+<td>No</td>
+<td>Max results (default 50)</td>
+</tr>
+</tbody>
+</table>
+<div class="codehilite"><pre><span></span><code>curl<span class="w"> </span>-s<span class="w"> </span>-X<span class="w"> </span>POST<span class="w"> </span><span class="s2">&quot;</span><span class="nv">$API</span><span class="s2">/api/v1/identities/search&quot;</span><span class="w"> </span><span class="se">\</span>
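+<span class="w">  </span>-H<span class="w"> </span><span class="s2">&quot;X-API-Key: </span><span class="nv">$KEY</span><span class="s2">&quot;</span><span class="w"> </span>-H<span class="w"> </span><span class="s2">&quot;Content-Type: application/json&quot;</span><span class="w"> </span><span class="se">\</span>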
+<span class="w">  </span>-d<span class="w"> </span><span class="s1">&#39;{&quot;q&quot;: &quot;Cary Grant&quot;}&#39;</span>
+</code></pre></div>
+
+<table class="table">
+<thead>
+<tr>
+<th>Method</th>
+<th>Endpoint</th>
+<th>Description</th>
+</tr>
+</thead>
+<tbody>
+<tr>
+<td>POST</td>
+<td><code>/api/v1/search/visual</code></td>
+<td>Search visual chunks by criteria (object classes, density)</td>
+</tr>
+<tr>
+<td>POST</td>
+<td><code>/api/v1/search/visual/class</code></td>
+<td>Search by specific object class</td>
+</tr>
+<tr>
+<td>POST</td>
+<td><code>/api/v1/search/visual/density</code></td>
+<td>Search by spatial density range</td>
+</tr>
+<tr>
+<td>POST</td>
+<td><code>/api/v1/search/visual/stats</code></td>
+<td>Get visual detection statistics</td>
+</tr>
+<tr>
+<td>POST</td>
+<td><code>/api/v1/search/visual/combination</code></td>
+<td>Search by object class combination</td>
+</tr>
+</tbody>
+</table>
+<table class="table">
+<thead>
+<tr>
+<th>Field</th>
+<th>Type</th>
+<th>Required</th>
+<th>Description</th>
+</tr>
+</thead>
+<tbody>
+<tr>
+<td><code>file_uuid</code></td>
+<td>string</td>
+<td>Yes</td>
+<td>File UUID</td>
+</tr>
+<tr>
+<td><code>criteria.required_classes</code></td>
+<td>string[]</td>
+<td>No</td>
+<td>Required object classes (e.g., <code>["person", "car"]</code>)</td>
+</tr>
+<tr>
+<td><code>criteria.min_confidence</code></td>
+<td>float</td>
+<td>No</td>
+<td>Minimum confidence threshold</td>
+</tr>
+<tr>
+<td><code>criteria.min_spatial_density</code></td>
+<td>float</td>
+<td>No</td>
+<td>Minimum spatial density</td>
+</tr>
+<tr>
+<td><code>criteria.max_spatial_density</code></td>
+<td>float</td>
+<td>No</td>
+<td>Maximum spatial density</td>
+</tr>
+</tbody>
+</table>
+<div class="codehilite"><pre><span></span><code>curl<span class="w"> </span>-s<span class="w"> </span>-X<span class="w"> </span>POST<span class="w"> </span><span class="s2">&quot;</span><span class="nv">$API</span><span class="s2">/api/v1/search/visual&quot;</span><span class="w"> </span><span class="se">\</span>
+<span class="w">  </span>-H<span class="w"> </span><span class="s2">&quot;X-API-Key: </span><span class="nv">$KEY</span><span class="s2">&quot;</span><span class="w"> </span><span class="se">\</span>
+<span class="w">  </span>-H<span class="w"> </span><span class="s2">&quot;Content-Type: application/json&quot;</span><span class="w"> </span><span class="se">\</span>
+<span class="w">  </span>-d<span class="w"> </span><span class="s1">&#39;{&quot;file_uuid&quot;: &quot;&#39;</span><span class="s2">&quot;</span><span class="nv">$FILE_UUID</span><span class="s2">&quot;</span><span class="s1">&#39;&quot;, &quot;criteria&quot;: {&quot;required_classes&quot;: [&quot;person&quot;, &quot;car&quot;]}}&#39;</span>
+</code></pre></div>
+
+<table class="table">
+<thead>
+<tr>
+<th>Field</th>
+<th>Type</th>
+<th>Description</th>
+</tr>
+</thead>
+<tbody>
+<tr>
+<td><code>chunks</code></td>
+<td>array</td>
+<td>Array of matching visual chunks</td>
+</tr>
+<tr>
+<td><code>chunks[].file_uuid</code></td>
+<td>string</td>
+<td>File UUID</td>
+</tr>
+<tr>
+<td><code>chunks[].chunk_id</code></td>
+<td>string</td>
+<td>Chunk identifier</td>
+</tr>
+<tr>
+<td><code>chunks[].detections</code></td>
+<td>array</td>
+<td>Object detections in this chunk</td>
+</tr>
+<tr>
+<td><code>total</code></td>
+<td>integer</td>
+<td>Total matching chunks</td>
+</tr>
+</tbody>
+</table>
+<hr />
+<h2>TMDb Enrichment</h2>
+<table class="table">
+<thead>
+<tr>
+<th>Field</th>
+<th>Type</th>
+<th>Required</th>
+<th>Description</th>
+</tr>
+</thead>
+<tbody>
+<tr>
+<td><code>file_uuid</code></td>
+<td>string</td>
+<td>Yes</td>
+<td>File UUID to enrich</td>
+</tr>
+</tbody>
+</table>
+<div class="codehilite"><pre><span></span><code>curl<span class="w"> </span>-s<span class="w"> </span>-X<span class="w"> </span>POST<span class="w"> </span><span class="s2">&quot;</span><span class="nv">$API</span><span class="s2">/api/v1/agents/tmdb/prefetch&quot;</span><span class="w"> </span><span class="se">\</span>
+<span class="w">  </span>-H<span class="w"> </span><span class="s2">&quot;Content-Type: application/json&quot;</span><span class="w"> </span><span class="se">\</span>
+<span class="w">  </span>-H<span class="w"> </span><span class="s2">&quot;X-API-Key: </span><span class="nv">$KEY</span><span class="s2">&quot;</span><span class="w"> </span><span class="se">\</span>
+<span class="w">  </span>-d<span class="w"> </span><span class="s1">&#39;{&quot;file_uuid&quot;: &quot;&#39;</span><span class="s2">&quot;</span><span class="nv">$FILE_UUID</span><span class="s2">&quot;</span><span class="s1">&#39;&quot;}&#39;</span>
+</code></pre></div>
+
+<div class="codehilite"><pre><span></span><code>curl<span class="w"> </span>-s<span class="w"> </span>-X<span class="w"> </span>POST<span class="w"> </span><span class="s2">&quot;</span><span class="nv">$API</span><span class="s2">/api/v1/file/</span><span class="nv">$FILE_UUID</span><span class="s2">/tmdb-probe&quot;</span><span class="w"> </span><span class="se">\</span>
+<span class="w">  </span>-H<span class="w"> </span><span class="s2">&quot;X-API-Key: </span><span class="nv">$KEY</span><span class="s2">&quot;</span><span class="w"> </span><span class="p">|</span><span class="w"> </span>jq<span class="w"> </span><span class="s1">&#39;{identities_created, movie_title}&#39;</span>
+</code></pre></div>
+
+<div class="codehilite"><pre><span></span><code>curl<span class="w"> </span>-s<span class="w"> </span><span class="s2">&quot;</span><span class="nv">$API</span><span class="s2">/api/v1/resource/tmdb&quot;</span><span class="w"> </span>-H<span class="w"> </span><span class="s2">&quot;X-API-Key: </span><span class="nv">$KEY</span><span class="s2">&quot;</span><span class="w"> </span><span class="se">\</span>
+<span class="w">  </span><span class="p">|</span><span class="w"> </span>jq<span class="w"> </span><span class="s1">&#39;{identities_seeded, cache_files}&#39;</span>
+</code></pre></div>
+
+<div class="codehilite"><pre><span></span><code>curl<span class="w"> </span>-s<span class="w"> </span>-X<span class="w"> </span>POST<span class="w"> </span><span class="s2">&quot;</span><span class="nv">$API</span><span class="s2">/api/v1/resource/tmdb/check&quot;</span><span class="w"> </span><span class="se">\</span>
+<span class="w">  </span>-H<span class="w"> </span><span class="s2">&quot;X-API-Key: </span><span class="nv">$KEY</span><span class="s2">&quot;</span><span class="w"> </span><span class="p">|</span><span class="w"> </span>jq<span class="w"> </span><span class="s1">&#39;.status&#39;</span>
+</code></pre></div>
+
+<hr />
+<h2>POST /api/v1/agents/translate</h2>
+<table class="table">
+<thead>
+<tr>
+<th>Field</th>
+<th>Type</th>
+<th>Required</th>
+<th>Description</th>
+</tr>
+</thead>
+<tbody>
+<tr>
+<td><code>text</code></td>
+<td>string</td>
+<td>✅</td>
+<td>Text to translate</td>
+</tr>
+<tr>
+<td><code>target_language</code></td>
+<td>string</td>
+<td>✅</td>
+<td>Target language name (e.g. "Traditional Chinese", "Japanese")</td>
+</tr>
+<tr>
+<td><code>source_language</code></td>
+<td>string</td>
+<td>❌</td>
+<td>Source language (default: "auto")</td>
+</tr>
+</tbody>
+</table>
+<h3>Response</h3>
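+<table class="table">
+<thead><tr><th>Source</th><th>Target</th><th>Quality</th></tr></thead>
+<tbody>
+<tr><td>English</td><td>Traditional Chinese</td><td>✅</td></tr>
+<tr><td>English</td><td>Japanese</td><td>✅</td></tr>
+<tr><td>Chinese</td><td>English</td><td>✅</td></tr>
+<tr><td>English</td><td>French</td><td>✅</td></tr>
+<tr><td>Chinese</td><td>Japanese</td><td>✅</td></tr></tbody></table>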
+<h3>Errors</h3>
+<table class="table">
+<thead>
+<tr>
+<th>Status</th>
+<th>Condition</th>
+</tr>
+</thead>
+<tbody>
+<tr>
+<td>500</td>
+<td>LLM unreachable or response parse failure</td>
+</tr>
+<tr>
+<td>401</td>
+<td>Missing/invalid auth</td>
+</tr>
+</tbody>
+</table>
+<h2>GET /api/v1/agents/identity/status</h2>
+<p>Get status of the identity agent pipeline.</p>
+<h3>Response</h3>
+<p>```json</p>
+<h2>POST /api/v1/agents/suggest/clustering</h2>
+<h2>POST /api/v1/agents/suggest/merge</h2>
+<h2>POST /api/v1/agents/5w1h/analyze</h2>
+<h3>Response</h3>
+<p>```json</p>
+<h2>POST /api/v1/agents/5w1h/batch</h2>
+<h2>GET /api/v1/agents/5w1h/status</h2>
+<hr />
+</div>
+</body>
+</html>
\ No newline at end of file
diff --git a/docs_v1.0/doc_user/API_REFERENCE.html b/docs_v1.0/doc_user/API_REFERENCE.html
new file mode 100644
index 0000000..50d2d1d
--- /dev/null
+++ b/docs_v1.0/doc_user/API_REFERENCE.html
@@ -0,0 +1,3684 @@
+<!DOCTYPE html>
+<html lang="en">
+<head>
+<meta charset="UTF-8">
+<title>API Reference - Momentry API Docs</title>
+<style>
+* { margin: 0; padding: 0; box-sizing: border-box; }
+body { font-family: -apple-system, BlinkMacSystemFont, 'Segoe UI', Roboto, sans-serif; background: #f5f5f5; color: #333; padding: 40px; }
+.container { max-width: 960px; margin: 0 auto; background: white; border-radius: 12px; box-shadow: 0 2px 12px rgba(0,0,0,0.08); padding: 40px; }
+h1 { font-size: 24px; margin: 24px 0 12px; }
+h2 { font-size: 20px; margin: 20px 0 10px; color: #222; }
+h3 { font-size: 16px; margin: 16px 0 8px; color: #444; }
+p { line-height: 1.6; margin: 8px 0; }
+table { border-collapse: collapse; width: 100%; margin: 12px 0; font-size: 14px; }
+th, td { border: 1px solid #ddd; padding: 8px 12px; text-align: left; }
+th { background: #f0f0f0; font-weight: 600; }
+code { background: #f0f0f0; padding: 2px 6px; border-radius: 3px; font-size: 13px; }
+pre { background: #f8f8f8; border: 1px solid #ddd; border-radius: 6px; padding: 12px; overflow-x: auto; margin: 12px 0; }
+pre code { background: none; padding: 0; }
+a { color: #0066cc; }
+.back { display: inline-block; margin-bottom: 20px; color: #666; }
+.back:hover { color: #333; }
+</style>
+</head>
+<body>
+<div class="container">
+<a class="back" href="index.html">&larr; Back to index</a>
+<hr />
+<pre><code>document_type: "api_reference"
+service: "MOMENTRY_CORE"
+title: "Momentry Core API Reference"
+date: "2026-05-17"
+version: "V1.1"
+status: "active"
+owner: "M5"
+created_by: "OpenCode"</code></pre>
+<hr />
+<h1>Momentry Core API Reference</h1>
+<table class="table">
+<thead>
+<tr>
+<th>項目</th>
+<th>內容</th>
+</tr>
+</thead>
+<tbody>
+<tr>
+<td>目標讀者</td>
+<td>developer</td>
+</tr>
+<tr>
+<td>預備知識</td>
+<td>需有 API Key</td>
+</tr>
+</tbody>
+</table>
+<hr />
+<h2>Base URL</h2>
+<table class="table">
+<thead>
+<tr>
+<th>Environment</th>
+<th>URL</th>
+<th>Purpose</th>
+</tr>
+</thead>
+<tbody>
+<tr>
+<td>Playground (Dev)</td>
+<td><code>http://localhost:3003</code></td>
+<td>Development and testing</td>
+</tr>
+<tr>
+<td>Production</td>
+<td><code>http://localhost:3002</code></td>
+<td>Production deployment</td>
+</tr>
+<tr>
+<td>External (M5)</td>
+<td><code>https://m5api.momentry.ddns.net</code></td>
+<td>Remote access</td>
+</tr>
+</tbody>
+</table>
+<h2>Variables</h2>
+<p>All examples in this documentation use these environment variables:</p>
+<div class="codehilite"><pre><span></span><code><span class="nv">API</span><span class="o">=</span><span class="s2">&quot;http://localhost:3003&quot;</span>
+<span class="nv">KEY</span><span class="o">=</span><span class="s2">&quot;your-api-key-here&quot;</span>
+</code></pre></div>
+
+<h2>Authentication</h2>
+<p>All endpoints under <code>/api/v1/*</code> require authentication, except the public endpoints listed below.
+The following endpoints are public (no auth needed):</p>
+<ul>
+<li><code>GET /health</code></li>
+<li><code>POST /api/v1/auth/login</code></li>
+<li><code>POST /api/v1/auth/logout</code></li>
+</ul>
+<h3>Three Authentication Modes</h3>
+<p>The system supports three authentication methods. The middleware checks them in <strong>priority order</strong>; the API key may be sent either as a header or as a query parameter, so four checks are listed:</p>
+<div class="codehilite"><pre><span></span><code>Middleware priority:
+  1. Session Cookie (Portal/browser)
+  2. JWT Bearer (API clients: n8n, CLI)
+  3. API Key Header (legacy compatibility)
+  4. API Key Query Param (?api_key=)
+</code></pre></div>
+
+<table class="table">
+<thead>
+<tr>
+<th>Mode</th>
+<th>Transport</th>
+<th>Expiry</th>
+<th>Scope</th>
+<th>Best for</th>
+</tr>
+</thead>
+<tbody>
+<tr>
+<td><strong>Session Cookie</strong></td>
+<td><code>Cookie: session_id=&lt;uuid&gt;</code></td>
+<td>24h</td>
+<td>per-browser session</td>
+<td>Portal (browser)</td>
+</tr>
+<tr>
+<td><strong>JWT</strong></td>
+<td><code>Authorization: Bearer &lt;token&gt;</code></td>
+<td>1h</td>
+<td>per-login token</td>
+<td>API clients (n8n, CLI, scripts)</td>
+</tr>
+<tr>
+<td><strong>API Key</strong></td>
+<td><code>X-API-Key: &lt;key&gt;</code></td>
+<td>90d</td>
+<td>fixed key for automation</td>
+<td>Legacy scripts, WordPress</td>
+</tr>
+</tbody>
+</table>
+<hr />
+<h3>Login</h3>
+<p><strong>Default accounts &amp; API keys:</strong></p>
+<table class="table">
+<thead>
+<tr>
+<th>Username</th>
+<th>Password</th>
+<th>API Key</th>
+<th>Role</th>
+</tr>
+</thead>
+<tbody>
+<tr>
+<td><code>admin</code></td>
+<td><code>admin</code></td>
+<td>—</td>
+<td>admin</td>
+</tr>
+<tr>
+<td><code>demo</code></td>
+<td><code>demo</code></td>
+<td><code>muser_demo_key_32chars_abcdef1234567890</code></td>
+<td>user</td>
+</tr>
+</tbody>
+</table>
+<p>The demo API key is set via <code>MOMENTRY_DEMO_API_KEY</code> env var and can be used in place of JWT for marcom integrations:</p>
+<div class="codehilite"><pre><span></span><code><span class="c1"># Using API key instead of JWT</span>
+curl<span class="w"> </span>-s<span class="w"> </span><span class="s2">&quot;</span><span class="nv">$API</span><span class="s2">/api/v1/files/scan&quot;</span><span class="w"> </span>-H<span class="w"> </span><span class="s2">&quot;X-API-Key: muser_demo_key_32chars_abcdef1234567890&quot;</span>
+</code></pre></div>
+
+<div class="codehilite"><pre><span></span><code><span class="c1"># Login as admin</span>
+curl<span class="w"> </span>-s<span class="w"> </span>-X<span class="w"> </span>POST<span class="w"> </span><span class="s2">&quot;</span><span class="nv">$API</span><span class="s2">/api/v1/auth/login&quot;</span><span class="w"> </span><span class="se">\</span>
+<span class="w">  </span>-H<span class="w"> </span><span class="s2">&quot;Content-Type: application/json&quot;</span><span class="w"> </span><span class="se">\</span>
+<span class="w">  </span>-d<span class="w"> </span><span class="s1">&#39;{&quot;username&quot;: &quot;admin&quot;, &quot;password&quot;: &quot;admin&quot;}&#39;</span>
+
+<span class="c1"># Login as demo user</span>
+curl<span class="w"> </span>-s<span class="w"> </span>-X<span class="w"> </span>POST<span class="w"> </span><span class="s2">&quot;</span><span class="nv">$API</span><span class="s2">/api/v1/auth/login&quot;</span><span class="w"> </span><span class="se">\</span>
+<span class="w">  </span>-H<span class="w"> </span><span class="s2">&quot;Content-Type: application/json&quot;</span><span class="w"> </span><span class="se">\</span>
+<span class="w">  </span>-d<span class="w"> </span><span class="s1">&#39;{&quot;username&quot;: &quot;demo&quot;, &quot;password&quot;: &quot;demo&quot;}&#39;</span>
+</code></pre></div>
+
+<h4>Success Response</h4>
+<div class="codehilite"><pre><span></span><code><span class="p">{</span>
+<span class="w">  </span><span class="nt">&quot;success&quot;</span><span class="p">:</span><span class="w"> </span><span class="kc">true</span><span class="p">,</span>
+<span class="w">  </span><span class="nt">&quot;jwt&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;eyJhbGciOiJIUzI1NiIs...&quot;</span><span class="p">,</span>
+<span class="w">  </span><span class="nt">&quot;api_key&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;muser_...&quot;</span><span class="p">,</span>
+<span class="w">  </span><span class="nt">&quot;user&quot;</span><span class="p">:</span><span class="w"> </span><span class="p">{</span>
+<span class="w">    </span><span class="nt">&quot;username&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;admin&quot;</span><span class="p">,</span>
+<span class="w">    </span><span class="nt">&quot;role&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;admin&quot;</span>
+<span class="w">  </span><span class="p">},</span>
+<span class="w">  </span><span class="nt">&quot;expires_at&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;2026-05-18T13:00:00Z&quot;</span>
+<span class="p">}</span>
+</code></pre></div>
+
+<table class="table">
+<thead>
+<tr>
+<th>Field</th>
+<th>Type</th>
+<th>Description</th>
+</tr>
+</thead>
+<tbody>
+<tr>
+<td><code>jwt</code></td>
+<td>string</td>
+<td>JWT access token. Use as <code>Authorization: Bearer &lt;jwt&gt;</code>. Expires in 1 hour.</td>
+</tr>
+<tr>
+<td><code>api_key</code></td>
+<td>string</td>
+<td>Legacy API key. Use as <code>X-API-Key: &lt;key&gt;</code>. Good for 90 days.</td>
+</tr>
+<tr>
+<td><code>user.username</code></td>
+<td>string</td>
+<td>Username</td>
+</tr>
+<tr>
+<td><code>user.role</code></td>
+<td>string</td>
+<td>Role: <code>admin</code>, <code>user</code>, or <code>readonly</code></td>
+</tr>
+<tr>
+<td><code>expires_at</code></td>
+<td>string</td>
+<td>ISO8601 timestamp of JWT expiration</td>
+</tr>
+</tbody>
+</table>
+<p>The login endpoint also sets a <code>Set-Cookie</code> header for browser-based clients:</p>
+<div class="codehilite"><pre><span></span><code><span class="nt">Set-Cookie</span><span class="o">:</span><span class="w"> </span><span class="nt">session_id</span><span class="o">=&lt;</span><span class="nt">uuid</span><span class="o">&gt;;</span><span class="w"> </span><span class="nt">Path</span><span class="o">=/</span><span class="nt">api</span><span class="o">;</span><span class="w"> </span><span class="nt">HttpOnly</span><span class="o">;</span><span class="w"> </span><span class="nt">SameSite</span><span class="o">=</span><span class="nt">Strict</span><span class="o">;</span><span class="w"> </span><span class="nt">Max-Age</span><span class="o">=</span><span class="nt">86400</span>
+</code></pre></div>
+
+<h4>Error Response (401)</h4>
+<div class="codehilite"><pre><span></span><code><span class="p">{</span>
+<span class="w">  </span><span class="nt">&quot;success&quot;</span><span class="p">:</span><span class="w"> </span><span class="kc">false</span><span class="p">,</span>
+<span class="w">  </span><span class="nt">&quot;message&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;Invalid username or password&quot;</span>
+<span class="p">}</span>
+</code></pre></div>
+
+<hr />
+<h3>Using JWT</h3>
+<p>JWT is preferred for API clients (n8n, CLI scripts, WordPress). It is validated by the middleware without a database lookup (stateless).</p>
+<div class="codehilite"><pre><span></span><code><span class="c1"># Login and capture JWT</span>
+<span class="nv">JWT</span><span class="o">=</span><span class="k">$(</span>curl<span class="w"> </span>-s<span class="w"> </span>-X<span class="w"> </span>POST<span class="w"> </span><span class="s2">&quot;</span><span class="nv">$API</span><span class="s2">/api/v1/auth/login&quot;</span><span class="w"> </span><span class="se">\</span>
+<span class="w">  </span>-H<span class="w"> </span><span class="s2">&quot;Content-Type: application/json&quot;</span><span class="w"> </span><span class="se">\</span>
+<span class="w">  </span>-d<span class="w"> </span><span class="s1">&#39;{&quot;username&quot;:&quot;admin&quot;,&quot;password&quot;:&quot;admin&quot;}&#39;</span><span class="w"> </span><span class="p">|</span><span class="w"> </span>python3<span class="w"> </span>-c<span class="w"> </span><span class="s2">&quot;import json,sys;print(json.load(sys.stdin)[&#39;jwt&#39;])&quot;</span><span class="k">)</span>
+
+<span class="c1"># Use JWT for all subsequent requests</span>
+curl<span class="w"> </span>-H<span class="w"> </span><span class="s2">&quot;Authorization: Bearer </span><span class="nv">$JWT</span><span class="s2">&quot;</span><span class="w"> </span><span class="s2">&quot;</span><span class="nv">$API</span><span class="s2">/api/v1/files/scan&quot;</span>
+curl<span class="w"> </span>-H<span class="w"> </span><span class="s2">&quot;Authorization: Bearer </span><span class="nv">$JWT</span><span class="s2">&quot;</span><span class="w"> </span><span class="s2">&quot;</span><span class="nv">$API</span><span class="s2">/api/v1/resource/tmdb&quot;</span>
+</code></pre></div>
+
+<p>JWT is short-lived (1 hour). When it expires, request a new one via login.</p>
+<hr />
+<h3>Using Session Cookie (Browser)</h3>
+<p>Browser-based clients (Portal) get a session cookie automatically after login. The browser sends the cookie with every request—no manual header needed.</p>
+<div class="codehilite"><pre><span></span><code><span class="c1"># Login captures the session cookie from Set-Cookie header</span>
+curl<span class="w"> </span>-v<span class="w"> </span>-X<span class="w"> </span>POST<span class="w"> </span><span class="s2">&quot;</span><span class="nv">$API</span><span class="s2">/api/v1/auth/login&quot;</span><span class="w"> </span><span class="se">\</span>
+<span class="w">  </span>-H<span class="w"> </span><span class="s2">&quot;Content-Type: application/json&quot;</span><span class="w"> </span><span class="se">\</span>
+<span class="w">  </span>-d<span class="w"> </span><span class="s1">&#39;{&quot;username&quot;:&quot;admin&quot;,&quot;password&quot;:&quot;admin&quot;}&#39;</span><span class="w"> </span><span class="m">2</span>&gt;<span class="p">&amp;</span><span class="m">1</span><span class="w"> </span><span class="p">|</span><span class="w"> </span>grep<span class="w"> </span><span class="s2">&quot;Set-Cookie&quot;</span>
+
+<span class="c1"># Browser automatically sends: Cookie: session_id=&lt;uuid&gt;</span>
+<span class="c1"># No manual header needed for subsequent requests</span>
+</code></pre></div>
+
+<p>The session cookie is HttpOnly (not accessible from JavaScript) and SameSite=Strict (protected against CSRF).</p>
+<hr />
+<h3>Using Legacy API Key</h3>
+<div class="codehilite"><pre><span></span><code>curl<span class="w"> </span>-H<span class="w"> </span><span class="s2">&quot;X-API-Key: </span><span class="nv">$KEY</span><span class="s2">&quot;</span><span class="w"> </span><span class="s2">&quot;</span><span class="nv">$API</span><span class="s2">/api/v1/files/scan&quot;</span>
+
+<span class="c1"># Also accepted via Bearer header (non-JWT format) or query parameter:</span>
+curl<span class="w"> </span>-H<span class="w"> </span><span class="s2">&quot;Authorization: Bearer </span><span class="nv">$KEY</span><span class="s2">&quot;</span><span class="w"> </span><span class="s2">&quot;</span><span class="nv">$API</span><span class="s2">/api/v1/files/scan&quot;</span>
+curl<span class="w"> </span><span class="s2">&quot;</span><span class="nv">$API</span><span class="s2">/api/v1/files/scan?api_key=</span><span class="nv">$KEY</span><span class="s2">&quot;</span>
+</code></pre></div>
+
+<p>API keys are validated via SHA256 hash lookup in the database. They are long-lived (90 days) and intended for automation.</p>
+<h3>Obtaining an API Key (CLI)</h3>
+<div class="codehilite"><pre><span></span><code>momentry<span class="w"> </span>api-key<span class="w"> </span>create<span class="w"> </span><span class="s2">&quot;My API Key&quot;</span><span class="w"> </span>--key-type<span class="w"> </span>user
+</code></pre></div>
+
+<hr />
+<h3>Logout</h3>
+<div class="codehilite"><pre><span></span><code><span class="c1"># Logout using the session cookie (browser)</span>
+curl<span class="w"> </span>-X<span class="w"> </span>POST<span class="w"> </span><span class="s2">&quot;</span><span class="nv">$API</span><span class="s2">/api/v1/auth/logout&quot;</span><span class="w"> </span><span class="se">\</span>
+<span class="w">  </span>-H<span class="w"> </span><span class="s2">&quot;Cookie: session_id=&lt;uuid&gt;&quot;</span>
+</code></pre></div>
+
+<h4>What logout does</h4>
+<table class="table">
+<thead>
+<tr>
+<th>Auth mode</th>
+<th>Effect</th>
+</tr>
+</thead>
+<tbody>
+<tr>
+<td><strong>Session Cookie</strong></td>
+<td>Session deleted from database. Same cookie returns 401 on subsequent requests.</td>
+</tr>
+<tr>
+<td><strong>JWT</strong></td>
+<td>JWT remains valid until expiry. (JWT is stateless — logout adds JWT to a blacklist only if API key mode is used.)</td>
+</tr>
+<tr>
+<td><strong>API Key</strong></td>
+<td>API key remains valid. (Legacy keys are shared across sessions — revoking would break other clients.)</td>
+</tr>
+</tbody>
+</table>
+<h4>Example: full session lifecycle</h4>
+<div class="codehilite"><pre><span></span><code><span class="c1"># 1. Login</span>
+<span class="nv">SESSION_ID</span><span class="o">=</span><span class="k">$(</span>curl<span class="w"> </span>-s<span class="w"> </span>-D<span class="w"> </span>-<span class="w"> </span>-X<span class="w"> </span>POST<span class="w"> </span><span class="s2">&quot;</span><span class="nv">$API</span><span class="s2">/api/v1/auth/login&quot;</span><span class="w"> </span><span class="se">\</span>
+<span class="w">  </span>-H<span class="w"> </span><span class="s2">&quot;Content-Type: application/json&quot;</span><span class="w"> </span><span class="se">\</span>
+<span class="w">  </span>-d<span class="w"> </span><span class="s1">&#39;{&quot;username&quot;:&quot;admin&quot;,&quot;password&quot;:&quot;admin&quot;}&#39;</span><span class="w"> </span><span class="p">|</span><span class="w"> </span>grep<span class="w"> </span><span class="s2">&quot;Set-Cookie&quot;</span><span class="w"> </span><span class="p">|</span><span class="w"> </span>sed<span class="w"> </span><span class="s1">&#39;s/.*session_id=\([^;]*\).*/\1/&#39;</span><span class="k">)</span>
+
+<span class="c1"># 2. Use session (works)</span>
+curl<span class="w"> </span>-s<span class="w"> </span>-o<span class="w"> </span>/dev/null<span class="w"> </span>-w<span class="w"> </span><span class="s2">&quot;HTTP %{http_code}\n&quot;</span><span class="w"> </span><span class="s2">&quot;</span><span class="nv">$API</span><span class="s2">/api/v1/resource/tmdb&quot;</span><span class="w"> </span><span class="se">\</span>
+<span class="w">  </span>-H<span class="w"> </span><span class="s2">&quot;Cookie: session_id=</span><span class="nv">$SESSION_ID</span><span class="s2">&quot;</span>
+<span class="c1"># → HTTP 200</span>
+
+<span class="c1"># 3. Logout</span>
+curl<span class="w"> </span>-s<span class="w"> </span>-X<span class="w"> </span>POST<span class="w"> </span><span class="s2">&quot;</span><span class="nv">$API</span><span class="s2">/api/v1/auth/logout&quot;</span><span class="w"> </span><span class="se">\</span>
+<span class="w">  </span>-H<span class="w"> </span><span class="s2">&quot;Cookie: session_id=</span><span class="nv">$SESSION_ID</span><span class="s2">&quot;</span>
+<span class="c1"># → {&quot;success&quot;: true}</span>
+
+<span class="c1"># 4. Use session again (rejected)</span>
+curl<span class="w"> </span>-s<span class="w"> </span>-o<span class="w"> </span>/dev/null<span class="w"> </span>-w<span class="w"> </span><span class="s2">&quot;HTTP %{http_code}\n&quot;</span><span class="w"> </span><span class="s2">&quot;</span><span class="nv">$API</span><span class="s2">/api/v1/resource/tmdb&quot;</span><span class="w"> </span><span class="se">\</span>
+<span class="w">  </span>-H<span class="w"> </span><span class="s2">&quot;Cookie: session_id=</span><span class="nv">$SESSION_ID</span><span class="s2">&quot;</span>
+<span class="c1"># → HTTP 401</span>
+</code></pre></div>
+
+<hr />
+<h3>Authentication Flow Summary</h3>
+<div class="codehilite"><pre><span></span><code>Login Request
+     │
+     ▼
+┌──────────────────┐
+│  1. Check users  │ ← users table (argon2 password verify)
+│     table        │
+└──────┬───────────┘
+       │
+   ┌───┴───┐
+   │ match │
+   └───┬───┘
+       │
+       ▼
+┌──────────────────┐
+│  2. Create JWT   │ ← 1h expiry, signed with JWT_SECRET
+├──────────────────┤
+│  3. Create       │ ← 24h expiry, stored in sessions table
+│     session      │
+├──────────────────┤
+│  4. Set-Cookie   │ ← HttpOnly, SameSite=Strict, Path=/api
+├──────────────────┤
+│  5. Return       │ ← JWT + api_key + user info to client
+└──────────────────┘
+</code></pre></div>
+
+<div class="codehilite"><pre><span></span><code>Protected Request
+     │
+     ▼
+┌──────────────────────┐
+│  Middleware checks:  │
+│                      │
+│  1. Cookie session?  │ → DB lookup session → get api_key → verify
+│                      │
+│  2. JWT Bearer?      │ → verify JWT signature → decode claims
+│                      │
+│  3. X-API-Key?       │ → SHA256 hash → DB lookup → verify
+│                      │
+│  4. ?api_key=?       │ → same as #3
+│                      │
+│  5. None → 401       │
+└──────────────────────┘
+</code></pre></div>
+
+<hr />
+<h3>Error Responses</h3>
+<table class="table">
+<thead>
+<tr>
+<th>HTTP</th>
+<th>When</th>
+</tr>
+</thead>
+<tbody>
+<tr>
+<td><code>401</code></td>
+<td>Missing or invalid authentication</td>
+</tr>
+<tr>
+<td><code>401</code></td>
+<td>Session expired or logged out</td>
+</tr>
+<tr>
+<td><code>401</code></td>
+<td>JWT expired</td>
+</tr>
+<tr>
+<td><code>401</code></td>
+<td>API key revoked or inactive</td>
+</tr>
+</tbody>
+</table>
+<hr />
+<h3>Related</h3>
+<ul>
+<li><code>POST /api/v1/resource/tmdb/check</code> — test authentication + TMDb API connectivity</li>
+<li><code>GET /health/detailed</code> — view auth status (integrations section)</li>
+</ul>
+<hr />
+<h2>Health Check</h2>
+<h3><code>GET /health</code></h3>
+<p><strong>Auth</strong>: Public<br />
+<strong>Scope</strong>: system-level</p>
+<p>Returns basic server health status — used by load balancers and monitoring.</p>
+<h4>Example</h4>
+<div class="codehilite"><pre><span></span><code>curl<span class="w"> </span><span class="s2">&quot;</span><span class="nv">$API</span><span class="s2">/health&quot;</span><span class="w"> </span><span class="p">|</span><span class="w"> </span>jq<span class="w"> </span><span class="s1">&#39;{status, version}&#39;</span>
+</code></pre></div>
+
+<h4>Response (200)</h4>
+<div class="codehilite"><pre><span></span><code><span class="p">{</span>
+<span class="w">  </span><span class="nt">&quot;status&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;ok&quot;</span><span class="p">,</span>
+<span class="w">  </span><span class="nt">&quot;version&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;1.0.0&quot;</span><span class="p">,</span>
+<span class="w">  </span><span class="nt">&quot;build_git_hash&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;3a6c1865&quot;</span><span class="p">,</span>
+<span class="w">  </span><span class="nt">&quot;build_timestamp&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;2026-05-16T13:38:15Z&quot;</span><span class="p">,</span>
+<span class="w">  </span><span class="nt">&quot;uptime_ms&quot;</span><span class="p">:</span><span class="w"> </span><span class="mi">3015</span>
+<span class="p">}</span>
+</code></pre></div>
+
+<table class="table">
+<thead>
+<tr>
+<th>Field</th>
+<th>Type</th>
+<th>Description</th>
+</tr>
+</thead>
+<tbody>
+<tr>
+<td><code>status</code></td>
+<td>string</td>
+<td><code>ok</code> or <code>degraded</code></td>
+</tr>
+<tr>
+<td><code>version</code></td>
+<td>string</td>
+<td>Semver version</td>
+</tr>
+<tr>
+<td><code>build_git_hash</code></td>
+<td>string</td>
+<td>Git commit hash</td>
+</tr>
+<tr>
+<td><code>build_timestamp</code></td>
+<td>string</td>
+<td>Binary build time</td>
+</tr>
+<tr>
+<td><code>uptime_ms</code></td>
+<td>integer</td>
+<td>Milliseconds since server start</td>
+</tr>
+</tbody>
+</table>
+<hr />
+<h3><code>GET /health/detailed</code></h3>
+<p><strong>Auth</strong>: Required<br />
+<strong>Scope</strong>: system-level</p>
+<p>Returns full system health including each service status, resource utilization, pipeline readiness, schema migration status, identity file sync status, and external integrations.</p>
+<blockquote>
+<p>Requires authentication (JWT, session cookie, or API key). The basic <code>/health</code> endpoint remains public for load balancer checks.</p>
+</blockquote>
+<h4>Example</h4>
+<div class="codehilite"><pre><span></span><code>curl<span class="w"> </span><span class="s2">&quot;</span><span class="nv">$API</span><span class="s2">/health/detailed&quot;</span><span class="w"> </span>-H<span class="w"> </span><span class="s2">&quot;X-API-Key: </span><span class="nv">$KEY</span><span class="s2">&quot;</span><span class="w"> </span><span class="p">|</span><span class="w"> </span>jq<span class="w"> </span><span class="s1">&#39;{status, services, resources: {cpu: .resources.cpu_used_percent, memory: .resources.memory_used_percent}}&#39;</span>
+</code></pre></div>
+
+<h4>Response (200)</h4>
+<div class="codehilite"><pre><span></span><code><span class="p">{</span>
+<span class="w">  </span><span class="nt">&quot;status&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;ok&quot;</span><span class="p">,</span>
+<span class="w">  </span><span class="nt">&quot;version&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;1.0.0&quot;</span><span class="p">,</span>
+<span class="w">  </span><span class="nt">&quot;services&quot;</span><span class="p">:</span><span class="w"> </span><span class="p">{</span>
+<span class="w">    </span><span class="nt">&quot;postgres&quot;</span><span class="p">:</span><span class="w"> </span><span class="p">{</span><span class="nt">&quot;status&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;ok&quot;</span><span class="p">,</span><span class="w"> </span><span class="nt">&quot;latency_ms&quot;</span><span class="p">:</span><span class="w"> </span><span class="mi">3</span><span class="p">},</span>
+<span class="w">    </span><span class="nt">&quot;redis&quot;</span><span class="p">:</span><span class="w"> </span><span class="p">{</span><span class="nt">&quot;status&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;ok&quot;</span><span class="p">,</span><span class="w"> </span><span class="nt">&quot;latency_ms&quot;</span><span class="p">:</span><span class="w"> </span><span class="mi">1</span><span class="p">},</span>
+<span class="w">    </span><span class="nt">&quot;qdrant&quot;</span><span class="p">:</span><span class="w"> </span><span class="p">{</span><span class="nt">&quot;status&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;ok&quot;</span><span class="p">,</span><span class="w"> </span><span class="nt">&quot;latency_ms&quot;</span><span class="p">:</span><span class="w"> </span><span class="mi">5</span><span class="p">}</span>
+<span class="w">  </span><span class="p">},</span>
+<span class="w">  </span><span class="nt">&quot;resources&quot;</span><span class="p">:</span><span class="w"> </span><span class="p">{</span>
+<span class="w">    </span><span class="nt">&quot;cpu_used_percent&quot;</span><span class="p">:</span><span class="w"> </span><span class="mf">12.5</span><span class="p">,</span>
+<span class="w">    </span><span class="nt">&quot;memory_available_mb&quot;</span><span class="p">:</span><span class="w"> </span><span class="mi">32768</span><span class="p">,</span>
+<span class="w">    </span><span class="nt">&quot;memory_used_percent&quot;</span><span class="p">:</span><span class="w"> </span><span class="mf">31.7</span>
+<span class="w">  </span><span class="p">},</span>
+<span class="w">  </span><span class="nt">&quot;pipeline&quot;</span><span class="p">:</span><span class="w"> </span><span class="p">{</span>
+<span class="w">    </span><span class="nt">&quot;scripts_ready&quot;</span><span class="p">:</span><span class="w"> </span><span class="kc">true</span><span class="p">,</span>
+<span class="w">    </span><span class="nt">&quot;scripts_count&quot;</span><span class="p">:</span><span class="w"> </span><span class="mi">345</span><span class="p">,</span>
+<span class="w">    </span><span class="nt">&quot;processors&quot;</span><span class="p">:</span><span class="w"> </span><span class="p">{</span>
+<span class="w">      </span><span class="nt">&quot;asr&quot;</span><span class="p">:</span><span class="w"> </span><span class="kc">true</span><span class="p">,</span>
+<span class="w">      </span><span class="nt">&quot;yolo&quot;</span><span class="p">:</span><span class="w"> </span><span class="kc">true</span><span class="p">,</span>
+<span class="w">      </span><span class="nt">&quot;face&quot;</span><span class="p">:</span><span class="w"> </span><span class="kc">true</span><span class="p">,</span>
+<span class="w">      </span><span class="nt">&quot;pose&quot;</span><span class="p">:</span><span class="w"> </span><span class="kc">true</span><span class="p">,</span>
+<span class="w">      </span><span class="nt">&quot;ocr&quot;</span><span class="p">:</span><span class="w"> </span><span class="kc">true</span><span class="p">,</span>
+<span class="w">      </span><span class="nt">&quot;cut&quot;</span><span class="p">:</span><span class="w"> </span><span class="kc">true</span><span class="p">,</span>
+<span class="w">      </span><span class="nt">&quot;scene&quot;</span><span class="p">:</span><span class="w"> </span><span class="kc">true</span><span class="p">,</span>
+<span class="w">      </span><span class="nt">&quot;asrx&quot;</span><span class="p">:</span><span class="w"> </span><span class="kc">true</span><span class="p">,</span>
+<span class="w">      </span><span class="nt">&quot;visual_chunk&quot;</span><span class="p">:</span><span class="w"> </span><span class="kc">true</span>
+<span class="w">    </span><span class="p">},</span>
+<span class="w">    </span><span class="nt">&quot;models_ready&quot;</span><span class="p">:</span><span class="w"> </span><span class="kc">true</span><span class="p">,</span>
+<span class="w">    </span><span class="nt">&quot;models_count&quot;</span><span class="p">:</span><span class="w"> </span><span class="mi">42</span><span class="p">,</span>
+<span class="w">    </span><span class="nt">&quot;scripts_integrity&quot;</span><span class="p">:</span><span class="w"> </span><span class="p">{</span><span class="nt">&quot;matched&quot;</span><span class="p">:</span><span class="w"> </span><span class="mi">332</span><span class="p">,</span><span class="w"> </span><span class="nt">&quot;total&quot;</span><span class="p">:</span><span class="w"> </span><span class="mi">345</span><span class="p">,</span><span class="w"> </span><span class="nt">&quot;ok&quot;</span><span class="p">:</span><span class="w"> </span><span class="kc">false</span><span class="p">},</span>
+<span class="w">    </span><span class="nt">&quot;ffmpeg&quot;</span><span class="p">:</span><span class="w"> </span><span class="kc">true</span>
+<span class="w">  </span><span class="p">},</span>
+<span class="w">  </span><span class="nt">&quot;schema&quot;</span><span class="p">:</span><span class="w"> </span><span class="p">{</span>
+<span class="w">    </span><span class="nt">&quot;table_exists&quot;</span><span class="p">:</span><span class="w"> </span><span class="kc">true</span><span class="p">,</span>
+<span class="w">    </span><span class="nt">&quot;applied&quot;</span><span class="p">:</span><span class="w"> </span><span class="p">[{</span><span class="nt">&quot;filename&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;migrate_add_users_table.sql&quot;</span><span class="p">}],</span>
+<span class="w">    </span><span class="nt">&quot;required&quot;</span><span class="p">:</span><span class="w"> </span><span class="p">[],</span>
+<span class="w">    </span><span class="nt">&quot;ok&quot;</span><span class="p">:</span><span class="w"> </span><span class="kc">true</span>
+<span class="w">  </span><span class="p">},</span>
+<span class="w">  </span><span class="nt">&quot;identities&quot;</span><span class="p">:</span><span class="w"> </span><span class="p">{</span>
+<span class="w">    </span><span class="nt">&quot;directory_exists&quot;</span><span class="p">:</span><span class="w"> </span><span class="kc">true</span><span class="p">,</span>
+<span class="w">    </span><span class="nt">&quot;files_count&quot;</span><span class="p">:</span><span class="w"> </span><span class="mi">3481</span><span class="p">,</span>
+<span class="w">    </span><span class="nt">&quot;index_ok&quot;</span><span class="p">:</span><span class="w"> </span><span class="kc">true</span><span class="p">,</span>
+<span class="w">    </span><span class="nt">&quot;db_count&quot;</span><span class="p">:</span><span class="w"> </span><span class="mi">3481</span><span class="p">,</span>
+<span class="w">    </span><span class="nt">&quot;synced&quot;</span><span class="p">:</span><span class="w"> </span><span class="kc">true</span>
+<span class="w">  </span><span class="p">},</span>
+<span class="w">  </span><span class="nt">&quot;integrations&quot;</span><span class="p">:</span><span class="w"> </span><span class="p">{</span>
+<span class="w">    </span><span class="nt">&quot;tmdb&quot;</span><span class="p">:</span><span class="w"> </span><span class="p">{</span>
+<span class="w">      </span><span class="nt">&quot;api_key_configured&quot;</span><span class="p">:</span><span class="w"> </span><span class="kc">false</span><span class="p">,</span>
+<span class="w">      </span><span class="nt">&quot;enabled&quot;</span><span class="p">:</span><span class="w"> </span><span class="kc">false</span><span class="p">,</span>
+<span class="w">      </span><span class="nt">&quot;api_reachable&quot;</span><span class="p">:</span><span class="w"> </span><span class="kc">null</span>
+<span class="w">    </span><span class="p">}</span>
+<span class="w">  </span><span class="p">}</span>
+<span class="p">}</span>
+</code></pre></div>
+
+<h4>Response Fields</h4>
+<table class="table">
+<thead>
+<tr>
+<th>Field</th>
+<th>Type</th>
+<th>Description</th>
+</tr>
+</thead>
+<tbody>
+<tr>
+<td><code>status</code></td>
+<td>string</td>
+<td><code>ok</code> if all essential services are healthy; otherwise <code>degraded</code></td>
+</tr>
+<tr>
+<td><code>services</code></td>
+<td>object</td>
+<td>Per-service status (postgres, redis, qdrant)</td>
+</tr>
+<tr>
+<td><code>services.*.status</code></td>
+<td>string</td>
+<td><code>ok</code>, <code>error</code>, or <code>degraded</code></td>
+</tr>
+<tr>
+<td><code>services.*.latency_ms</code></td>
+<td>int</td>
+<td>Response time in milliseconds</td>
+</tr>
+<tr>
+<td><code>resources</code></td>
+<td>object</td>
+<td>CPU, memory usage</td>
+</tr>
+<tr>
+<td><code>pipeline.scripts_ready</code></td>
+<td>boolean</td>
+<td>Scripts directory accessible</td>
+</tr>
+<tr>
+<td><code>pipeline.scripts_count</code></td>
+<td>int</td>
+<td>Number of Python processor scripts</td>
+</tr>
+<tr>
+<td><code>pipeline.processors</code></td>
+<td>object</td>
+<td>Per-processor availability</td>
+</tr>
+<tr>
+<td><code>pipeline.models_ready</code></td>
+<td>boolean</td>
+<td>Models directory accessible</td>
+</tr>
+<tr>
+<td><code>pipeline.scripts_integrity</code></td>
+<td>object</td>
+<td>SHA256 checksum verification results</td>
+</tr>
+<tr>
+<td><code>schema.ok</code></td>
+<td>boolean</td>
+<td>All required migrations applied</td>
+</tr>
+<tr>
+<td><code>identities.synced</code></td>
+<td>boolean</td>
+<td>Identity file count matches DB count</td>
+</tr>
+<tr>
+<td><code>integrations.tmdb</code></td>
+<td>object</td>
+<td>TMDb API key configuration and reachability</td>
+</tr>
+</tbody>
+</table>
+<h4>Health status rules</h4>
+<table class="table">
+<thead>
+<tr>
+<th>Condition</th>
+<th>status</th>
+</tr>
+</thead>
+<tbody>
+<tr>
+<td>All services ok</td>
+<td><code>ok</code></td>
+</tr>
+<tr>
+<td>Any service error</td>
+<td><code>degraded</code></td>
+</tr>
+<tr>
+<td>Postgres or Redis error</td>
+<td><code>degraded</code> (server still responds)</td>
+</tr>
+</tbody>
+</table>
+<hr />
+<h3>Stats Endpoints</h3>
+<table class="table">
+<thead>
+<tr>
+<th>Method</th>
+<th>Endpoint</th>
+<th>Auth</th>
+<th>Description</th>
+</tr>
+</thead>
+<tbody>
+<tr>
+<td>GET</td>
+<td><code>/api/v1/stats/ingest</code></td>
+<td>No</td>
+<td>Ingest pipeline statistics</td>
+</tr>
+<tr>
+<td>GET</td>
+<td><code>/api/v1/stats/sftpgo</code></td>
+<td>No</td>
+<td>SFTPGo service status</td>
+</tr>
+<tr>
+<td>GET</td>
+<td><code>/api/v1/stats/inference</code></td>
+<td>No</td>
+<td>Inference service (LLM) health</td>
+</tr>
+</tbody>
+</table>
+<div class="codehilite"><pre><span></span><code>curl<span class="w"> </span><span class="s2">&quot;</span><span class="nv">$API</span><span class="s2">/api/v1/stats/ingest&quot;</span>
+</code></pre></div>
+
+<hr />
+<h2>File Registration</h2>
+<h3><code>POST /api/v1/files/register</code></h3>
+<p><strong>Auth</strong>: Required<br />
+<strong>Scope</strong>: file-level</p>
+<p>Register a video file for processing. Returns the file's metadata and UUID.</p>
+<p><strong>New in v0.1.2</strong>: Registration now <strong>automatically triggers the processing pipeline</strong> — no need to call <code>POST /api/v1/file/:uuid/process</code> separately. The system will:</p>
+<ol>
+<li>Register the file and run ffprobe</li>
+<li>Auto-run the offline TMDb probe (reads local identity files, no API calls)</li>
+<li>Create a monitor job for the worker</li>
+<li>Have the worker start all 10 processors (Cut → ASR → ASRX → YOLO → OCR → Face → Pose → VisualChunk → Story → 5W1H)</li>
+</ol>
+<p>If the file already exists (same content hash), returns the existing record with <code>already_exists: true</code>.</p>
+<h4>Request Parameters</h4>
+<table class="table">
+<thead>
+<tr>
+<th>Field</th>
+<th>Type</th>
+<th>Required</th>
+<th>Default</th>
+<th>Description</th>
+</tr>
+</thead>
+<tbody>
+<tr>
+<td><code>file_path</code></td>
+<td>string</td>
+<td>Yes</td>
+<td>—</td>
+<td>Path to a video file on disk (or to a directory when <code>pattern</code> is set)</td>
+</tr>
+<tr>
+<td><code>pattern</code></td>
+<td>string</td>
+<td>No</td>
+<td>—</td>
+<td>Regex pattern for batch register (requires <code>file_path</code> to be a directory)</td>
+</tr>
+<tr>
+<td><code>user_id</code></td>
+<td>integer</td>
+<td>No</td>
+<td>—</td>
+<td>User ID to associate with registration</td>
+</tr>
+<tr>
+<td><code>content_hash</code></td>
+<td>string</td>
+<td>No</td>
+<td>—</td>
+<td>Pre-computed SHA-256 hash (skips computation)</td>
+</tr>
+</tbody>
+</table>
+<h4>Example</h4>
+<div class="codehilite"><pre><span></span><code><span class="c1"># Register a single file</span>
+curl<span class="w"> </span>-s<span class="w"> </span>-X<span class="w"> </span>POST<span class="w"> </span><span class="s2">&quot;</span><span class="nv">$API</span><span class="s2">/api/v1/files/register&quot;</span><span class="w"> </span><span class="se">\</span>
+<span class="w">  </span>-H<span class="w"> </span><span class="s2">&quot;Content-Type: application/json&quot;</span><span class="w"> </span><span class="se">\</span>
+<span class="w">  </span>-H<span class="w"> </span><span class="s2">&quot;X-API-Key: </span><span class="nv">$KEY</span><span class="s2">&quot;</span><span class="w"> </span><span class="se">\</span>
+<span class="w">  </span>-d<span class="w"> </span><span class="s1">&#39;{&quot;file_path&quot;: &quot;/path/to/video.mp4&quot;}&#39;</span>
+
+<span class="c1"># Batch register files matching a pattern in a directory</span>
+curl<span class="w"> </span>-s<span class="w"> </span>-X<span class="w"> </span>POST<span class="w"> </span><span class="s2">&quot;</span><span class="nv">$API</span><span class="s2">/api/v1/files/register&quot;</span><span class="w"> </span><span class="se">\</span>
+<span class="w">  </span>-H<span class="w"> </span><span class="s2">&quot;Content-Type: application/json&quot;</span><span class="w"> </span><span class="se">\</span>
+<span class="w">  </span>-H<span class="w"> </span><span class="s2">&quot;X-API-Key: </span><span class="nv">$KEY</span><span class="s2">&quot;</span><span class="w"> </span><span class="se">\</span>
+<span class="w">  </span>-d<span class="w"> </span><span class="s1">&#39;{&quot;file_path&quot;: &quot;/path/to/dir&quot;, &quot;pattern&quot;: &quot;.*\\.mp4$&quot;}&#39;</span>
+</code></pre></div>
+
+<h4>Response (200)</h4>
+<div class="codehilite"><pre><span></span><code><span class="p">{</span>
+<span class="w">  </span><span class="nt">&quot;success&quot;</span><span class="p">:</span><span class="w"> </span><span class="kc">true</span><span class="p">,</span>
+<span class="w">  </span><span class="nt">&quot;file_uuid&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;3a6c1865...&quot;</span><span class="p">,</span>
+<span class="w">  </span><span class="nt">&quot;file_name&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;video.mp4&quot;</span><span class="p">,</span>
+<span class="w">  </span><span class="nt">&quot;file_path&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;/path/to/video.mp4&quot;</span><span class="p">,</span>
+<span class="w">  </span><span class="nt">&quot;file_type&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;video&quot;</span><span class="p">,</span>
+<span class="w">  </span><span class="nt">&quot;duration&quot;</span><span class="p">:</span><span class="w"> </span><span class="mf">120.5</span><span class="p">,</span>
+<span class="w">  </span><span class="nt">&quot;width&quot;</span><span class="p">:</span><span class="w"> </span><span class="mi">1920</span><span class="p">,</span>
+<span class="w">  </span><span class="nt">&quot;height&quot;</span><span class="p">:</span><span class="w"> </span><span class="mi">1080</span><span class="p">,</span>
+<span class="w">  </span><span class="nt">&quot;fps&quot;</span><span class="p">:</span><span class="w"> </span><span class="mf">24.0</span><span class="p">,</span>
+<span class="w">  </span><span class="nt">&quot;total_frames&quot;</span><span class="p">:</span><span class="w"> </span><span class="mi">2892</span><span class="p">,</span>
+<span class="w">  </span><span class="nt">&quot;already_exists&quot;</span><span class="p">:</span><span class="w"> </span><span class="kc">false</span><span class="p">,</span>
+<span class="w">  </span><span class="nt">&quot;message&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;File registered successfully&quot;</span>
+<span class="p">}</span>
+</code></pre></div>
+
+<table class="table">
+<thead>
+<tr>
+<th>Field</th>
+<th>Type</th>
+<th>Description</th>
+</tr>
+</thead>
+<tbody>
+<tr>
+<td><code>success</code></td>
+<td>boolean</td>
+<td>Always true on 200</td>
+</tr>
+<tr>
+<td><code>file_uuid</code></td>
+<td>string</td>
+<td>32-char hex UUID of the registered file</td>
+</tr>
+<tr>
+<td><code>file_name</code></td>
+<td>string</td>
+<td>File name (auto-renamed if name conflict)</td>
+</tr>
+<tr>
+<td><code>file_path</code></td>
+<td>string</td>
+<td>Canonical path on disk</td>
+</tr>
+<tr>
+<td><code>file_type</code></td>
+<td>string</td>
+<td><code>"video"</code>, <code>"audio"</code>, or <code>"unknown"</code></td>
+</tr>
+<tr>
+<td><code>duration</code></td>
+<td>float</td>
+<td>Duration in seconds</td>
+</tr>
+<tr>
+<td><code>width</code></td>
+<td>integer</td>
+<td>Video width in pixels</td>
+</tr>
+<tr>
+<td><code>height</code></td>
+<td>integer</td>
+<td>Video height in pixels</td>
+</tr>
+<tr>
+<td><code>fps</code></td>
+<td>float</td>
+<td>Frames per second</td>
+</tr>
+<tr>
+<td><code>total_frames</code></td>
+<td>integer</td>
+<td>Total frame count</td>
+</tr>
+<tr>
+<td><code>already_exists</code></td>
+<td>boolean</td>
+<td>True if same content was already registered</td>
+</tr>
+<tr>
+<td><code>message</code></td>
+<td>string</td>
+<td>Human-readable status</td>
+</tr>
+</tbody>
+</table>
+<h4>Error Responses</h4>
+<table class="table">
+<thead>
+<tr>
+<th>HTTP</th>
+<th>When</th>
+</tr>
+</thead>
+<tbody>
+<tr>
+<td><code>401</code></td>
+<td>Missing or invalid API key</td>
+</tr>
+<tr>
+<td><code>400</code></td>
+<td>Invalid request body</td>
+</tr>
+<tr>
+<td><code>404</code></td>
+<td>File path does not exist</td>
+</tr>
+</tbody>
+</table>
+<hr />
+<h3><code>GET /api/v1/files/scan</code></h3>
+<p><strong>Auth</strong>: Required<br />
+<strong>Scope</strong>: file-level</p>
+<p>Scan the filesystem directory and list all media files, showing which are registered, processing, or unregistered.</p>
+<h4>Query Parameters</h4>
+<table class="table">
+<thead>
+<tr>
+<th>Field</th>
+<th>Type</th>
+<th>Required</th>
+<th>Default</th>
+<th>Description</th>
+</tr>
+</thead>
+<tbody>
+<tr>
+<td><code>page</code></td>
+<td>integer</td>
+<td>No</td>
+<td>1</td>
+<td>Page number (1-based)</td>
+</tr>
+<tr>
+<td><code>page_size</code></td>
+<td>integer</td>
+<td>No</td>
+<td>all</td>
+<td>Items per page (alias: <code>limit</code>)</td>
+</tr>
+<tr>
+<td><code>limit</code></td>
+<td>integer</td>
+<td>No</td>
+<td>all</td>
+<td>Max items (alias for <code>page_size</code>)</td>
+</tr>
+<tr>
+<td><code>pattern</code></td>
+<td>string</td>
+<td>No</td>
+<td>—</td>
+<td>Regex filter on file name (e.g., <code>.*\.mp4$</code>; escape the backslash as <code>\\</code> inside a double-quoted shell string)</td>
+</tr>
+<tr>
+<td><code>sort_by</code></td>
+<td>string</td>
+<td>No</td>
+<td><code>name</code></td>
+<td>Sort field: <code>name</code>, <code>size</code>, <code>modified</code>, <code>status</code></td>
+</tr>
+<tr>
+<td><code>sort_order</code></td>
+<td>string</td>
+<td>No</td>
+<td><code>asc</code></td>
+<td>Sort direction: <code>asc</code> or <code>desc</code></td>
+</tr>
+</tbody>
+</table>
+<h4>Example</h4>
+<div class="codehilite"><pre><span></span><code><span class="c1"># Full scan</span>
+curl<span class="w"> </span>-s<span class="w"> </span><span class="s2">&quot;</span><span class="nv">$API</span><span class="s2">/api/v1/files/scan&quot;</span><span class="w"> </span>-H<span class="w"> </span><span class="s2">&quot;X-API-Key: </span><span class="nv">$KEY</span><span class="s2">&quot;</span><span class="w"> </span><span class="p">|</span><span class="w"> </span>jq<span class="w"> </span><span class="s1">&#39;{total, registered_count, unregistered_count}&#39;</span>
+
+<span class="c1"># Paginated (page 1, 5 per page)</span>
+curl<span class="w"> </span>-s<span class="w"> </span><span class="s2">&quot;</span><span class="nv">$API</span><span class="s2">/api/v1/files/scan?page=1&amp;page_size=5&quot;</span><span class="w"> </span>-H<span class="w"> </span><span class="s2">&quot;X-API-Key: </span><span class="nv">$KEY</span><span class="s2">&quot;</span><span class="w"> </span><span class="p">|</span><span class="w"> </span>jq<span class="w"> </span><span class="s1">&#39;{page, total_pages, files: [.files[].file_name]}&#39;</span>
+
+<span class="c1"># Regex filter: only mp4 files</span>
+curl<span class="w"> </span>-s<span class="w"> </span><span class="s2">&quot;</span><span class="nv">$API</span><span class="s2">/api/v1/files/scan?pattern=.*\\.mp4</span>$<span class="s2">&quot;</span><span class="w"> </span>-H<span class="w"> </span><span class="s2">&quot;X-API-Key: </span><span class="nv">$KEY</span><span class="s2">&quot;</span><span class="w"> </span><span class="p">|</span><span class="w"> </span>jq<span class="w"> </span><span class="s1">&#39;{filtered_total, files: [.files[].file_name]}&#39;</span>
+
+<span class="c1"># Sort by file size (largest first)</span>
+curl<span class="w"> </span>-s<span class="w"> </span><span class="s2">&quot;</span><span class="nv">$API</span><span class="s2">/api/v1/files/scan?sort_by=size&amp;sort_order=desc&amp;page_size=5&quot;</span><span class="w"> </span>-H<span class="w"> </span><span class="s2">&quot;X-API-Key: </span><span class="nv">$KEY</span><span class="s2">&quot;</span><span class="w"> </span><span class="p">|</span><span class="w"> </span>jq<span class="w"> </span><span class="s1">&#39;[.files[] | {file_name, file_size}]&#39;</span>
+
+<span class="c1"># Sort by modified time (most recent first)</span>
+curl<span class="w"> </span>-s<span class="w"> </span><span class="s2">&quot;</span><span class="nv">$API</span><span class="s2">/api/v1/files/scan?sort_by=modified&amp;sort_order=desc&amp;page_size=5&quot;</span><span class="w"> </span>-H<span class="w"> </span><span class="s2">&quot;X-API-Key: </span><span class="nv">$KEY</span><span class="s2">&quot;</span><span class="w"> </span><span class="p">|</span><span class="w"> </span>jq<span class="w"> </span><span class="s1">&#39;[.files[] | {file_name, modified_time}]&#39;</span>
+
+<span class="c1"># Sort by status</span>
+curl<span class="w"> </span>-s<span class="w"> </span><span class="s2">&quot;</span><span class="nv">$API</span><span class="s2">/api/v1/files/scan?sort_by=status&amp;page_size=5&quot;</span><span class="w"> </span>-H<span class="w"> </span><span class="s2">&quot;X-API-Key: </span><span class="nv">$KEY</span><span class="s2">&quot;</span><span class="w"> </span><span class="p">|</span><span class="w"> </span>jq<span class="w"> </span><span class="s1">&#39;[.files[] | {file_name, status}]&#39;</span>
+</code></pre></div>
+
+<h4>Response (200)</h4>
+<div class="codehilite"><pre><span></span><code><span class="p">{</span>
+<span class="w">  </span><span class="nt">&quot;files&quot;</span><span class="p">:</span><span class="w"> </span><span class="p">[</span>
+<span class="w">    </span><span class="p">{</span>
+<span class="w">      </span><span class="nt">&quot;file_name&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;video.mp4&quot;</span><span class="p">,</span>
+<span class="w">      </span><span class="nt">&quot;file_size&quot;</span><span class="p">:</span><span class="w"> </span><span class="mi">12345678</span><span class="p">,</span>
+<span class="w">      </span><span class="nt">&quot;is_registered&quot;</span><span class="p">:</span><span class="w"> </span><span class="kc">true</span><span class="p">,</span>
+<span class="w">      </span><span class="nt">&quot;file_uuid&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;3a6c1865...&quot;</span><span class="p">,</span>
+<span class="w">      </span><span class="nt">&quot;status&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;completed&quot;</span><span class="p">,</span>
+<span class="w">      </span><span class="nt">&quot;registration_time&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;2026-05-16T12:00:00Z&quot;</span><span class="p">,</span>
+<span class="w">      </span><span class="nt">&quot;job_id&quot;</span><span class="p">:</span><span class="w"> </span><span class="mi">42</span>
+<span class="w">    </span><span class="p">}</span>
+<span class="w">  </span><span class="p">],</span>
+<span class="w">  </span><span class="nt">&quot;total&quot;</span><span class="p">:</span><span class="w"> </span><span class="mi">107</span><span class="p">,</span>
+<span class="w">  </span><span class="nt">&quot;filtered_total&quot;</span><span class="p">:</span><span class="w"> </span><span class="mi">80</span><span class="p">,</span>
+<span class="w">  </span><span class="nt">&quot;page&quot;</span><span class="p">:</span><span class="w"> </span><span class="mi">1</span><span class="p">,</span>
+<span class="w">  </span><span class="nt">&quot;page_size&quot;</span><span class="p">:</span><span class="w"> </span><span class="mi">20</span><span class="p">,</span>
+<span class="w">  </span><span class="nt">&quot;total_pages&quot;</span><span class="p">:</span><span class="w"> </span><span class="mi">4</span><span class="p">,</span>
+<span class="w">  </span><span class="nt">&quot;registered_count&quot;</span><span class="p">:</span><span class="w"> </span><span class="mi">26</span><span class="p">,</span>
+<span class="w">  </span><span class="nt">&quot;unregistered_count&quot;</span><span class="p">:</span><span class="w"> </span><span class="mi">81</span>
+<span class="p">}</span>
+</code></pre></div>
+
+<table class="table">
+<thead>
+<tr>
+<th>Field</th>
+<th>Type</th>
+<th>Description</th>
+</tr>
+</thead>
+<tbody>
+<tr>
+<td><code>files</code></td>
+<td>array</td>
+<td>Array of file info objects (paginated)</td>
+</tr>
+<tr>
+<td><code>files[].file_name</code></td>
+<td>string</td>
+<td>File name</td>
+</tr>
+<tr>
+<td><code>files[].relative_path</code></td>
+<td>string</td>
+<td>Path relative to scan root</td>
+</tr>
+<tr>
+<td><code>files[].file_path</code></td>
+<td>string</td>
+<td>Absolute path on disk</td>
+</tr>
+<tr>
+<td><code>files[].file_size</code></td>
+<td>integer</td>
+<td>File size in bytes</td>
+</tr>
+<tr>
+<td><code>files[].modified_time</code></td>
+<td>string</td>
+<td>Last modified timestamp (ISO8601)</td>
+</tr>
+<tr>
+<td><code>files[].is_registered</code></td>
+<td>boolean</td>
+<td>Whether file is registered in DB</td>
+</tr>
+<tr>
+<td><code>files[].file_uuid</code></td>
+<td>string</td>
+<td>32-char hex UUID (only if registered)</td>
+</tr>
+<tr>
+<td><code>files[].status</code></td>
+<td>string</td>
+<td><code>"completed"</code>, <code>"processing"</code>, <code>"registered"</code>, <code>"unregistered"</code>, or <code>null</code></td>
+</tr>
+<tr>
+<td><code>files[].registration_time</code></td>
+<td>string</td>
+<td>DB registration timestamp (only if registered)</td>
+</tr>
+<tr>
+<td><code>files[].job_id</code></td>
+<td>integer</td>
+<td>Processing job ID (only if a job exists)</td>
+</tr>
+<tr>
+<td><code>total</code></td>
+<td>integer</td>
+<td>Total files found on disk (unfiltered)</td>
+</tr>
+<tr>
+<td><code>filtered_total</code></td>
+<td>integer</td>
+<td>Number of files matching the <code>pattern</code> regex filter</td>
+</tr>
+<tr>
+<td><code>page</code></td>
+<td>integer</td>
+<td>Current page number</td>
+</tr>
+<tr>
+<td><code>page_size</code></td>
+<td>integer</td>
+<td>Items per page</td>
+</tr>
+<tr>
+<td><code>total_pages</code></td>
+<td>integer</td>
+<td>Total number of pages for the filtered results</td>
+</tr>
+<tr>
+<td><code>registered_count</code></td>
+<td>integer</td>
+<td>Files registered in DB</td>
+</tr>
+<tr>
+<td><code>unregistered_count</code></td>
+<td>integer</td>
+<td>Files not yet registered</td>
+</tr>
+</tbody>
+</table>
+<h4>Notes</h4>
+<table class="table">
+<thead>
+<tr>
+<th>Feature</th>
+<th>Behavior</th>
+</tr>
+</thead>
+<tbody>
+<tr>
+<td><strong>Regex</strong></td>
+<td>Case-insensitive (<code>(?i)</code> prefix auto-applied). Applied to <code>file_name</code>.</td>
+</tr>
+<tr>
+<td><strong>Sort order</strong></td>
+<td>Default (<code>sort_by=name</code>): registered files first, then alphabetically. <code>sort_by=status</code>: alphabetical by status string.</td>
+</tr>
+<tr>
+<td><strong>Pagination</strong></td>
+<td><code>page_size</code> and <code>limit</code> are aliases. Default: show all results.</td>
+</tr>
+<tr>
+<td><strong>Processing order</strong></td>
+<td><code>pattern</code> regex filter → <code>sort_by</code>/<code>sort_order</code> → <code>page</code>/<code>page_size</code> slice.</td>
+</tr>
+</tbody>
+</table>
+<hr />
+<h2>File Lookup</h2>
+<h3><code>GET /api/v1/files/lookup</code></h3>
+<p><strong>Auth</strong>: Required
+<strong>Scope</strong>: file-level</p>
+<p>Search registered files by file name. Performs a case-insensitive LIKE search on the file name column. Returns basic info about matching files.</p>
+<h4>Query Parameters</h4>
+<table class="table">
+<thead>
+<tr>
+<th>Field</th>
+<th>Type</th>
+<th>Required</th>
+<th>Description</th>
+</tr>
+</thead>
+<tbody>
+<tr>
+<td><code>file_name</code></td>
+<td>string</td>
+<td>Yes</td>
+<td>File name to search for (partial matches supported)</td>
+</tr>
+</tbody>
+</table>
+<h4>Example</h4>
+<div class="codehilite"><pre><span></span><code><span class="c1"># Look up a specific file</span>
+curl<span class="w"> </span>-s<span class="w"> </span><span class="s2">&quot;</span><span class="nv">$API</span><span class="s2">/api/v1/files/lookup?file_name=video.mp4&quot;</span><span class="w"> </span><span class="se">\</span>
+<span class="w">  </span>-H<span class="w"> </span><span class="s2">&quot;X-API-Key: </span><span class="nv">$KEY</span><span class="s2">&quot;</span>
+
+<span class="c1"># Partial name search</span>
+curl<span class="w"> </span>-s<span class="w"> </span><span class="s2">&quot;</span><span class="nv">$API</span><span class="s2">/api/v1/files/lookup?file_name=charade&quot;</span><span class="w"> </span><span class="se">\</span>
+<span class="w">  </span>-H<span class="w"> </span><span class="s2">&quot;X-API-Key: </span><span class="nv">$KEY</span><span class="s2">&quot;</span><span class="w"> </span><span class="p">|</span><span class="w"> </span>jq<span class="w"> </span><span class="s1">&#39;.matches[].file_name&#39;</span>
+</code></pre></div>
+
+<h4>Response (200)</h4>
+<div class="codehilite"><pre><span></span><code><span class="p">{</span>
+<span class="w">  </span><span class="nt">&quot;file_name&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;video.mp4&quot;</span><span class="p">,</span>
+<span class="w">  </span><span class="nt">&quot;exists&quot;</span><span class="p">:</span><span class="w"> </span><span class="kc">true</span><span class="p">,</span>
+<span class="w">  </span><span class="nt">&quot;matches&quot;</span><span class="p">:</span><span class="w"> </span><span class="p">[</span>
+<span class="w">    </span><span class="p">{</span>
+<span class="w">      </span><span class="nt">&quot;file_uuid&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;a03485a40b2df2d3&quot;</span><span class="p">,</span>
+<span class="w">      </span><span class="nt">&quot;file_name&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;video.mp4&quot;</span><span class="p">,</span>
+<span class="w">      </span><span class="nt">&quot;file_type&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;video&quot;</span><span class="p">,</span>
+<span class="w">      </span><span class="nt">&quot;status&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;completed&quot;</span>
+<span class="w">    </span><span class="p">}</span>
+<span class="w">  </span><span class="p">],</span>
+<span class="w">  </span><span class="nt">&quot;next_name&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;video (2).mp4&quot;</span>
+<span class="p">}</span>
+</code></pre></div>
+
+<table class="table">
+<thead>
+<tr>
+<th>Field</th>
+<th>Type</th>
+<th>Description</th>
+</tr>
+</thead>
+<tbody>
+<tr>
+<td><code>file_name</code></td>
+<td>string</td>
+<td>Searched name</td>
+</tr>
+<tr>
+<td><code>exists</code></td>
+<td>boolean</td>
+<td>Whether a registered file with exactly this name exists</td>
+</tr>
+<tr>
+<td><code>matches</code></td>
+<td>array</td>
+<td>Array of matching registered files</td>
+</tr>
+<tr>
+<td><code>matches[].file_uuid</code></td>
+<td>string</td>
+<td>32-char hex UUID</td>
+</tr>
+<tr>
+<td><code>matches[].file_name</code></td>
+<td>string</td>
+<td>Registered file name</td>
+</tr>
+<tr>
+<td><code>matches[].file_type</code></td>
+<td>string</td>
+<td><code>"video"</code>, <code>"audio"</code>, or <code>null</code></td>
+</tr>
+<tr>
+<td><code>matches[].status</code></td>
+<td>string</td>
+<td>Registration/processing status</td>
+</tr>
+<tr>
+<td><code>next_name</code></td>
+<td>string</td>
+<td>Suggested alternative file name that avoids a naming conflict (e.g. <code>video (2).mp4</code>)</td>
+</tr>
+</tbody>
+</table>
+<hr />
+<h2>Unregister</h2>
+<h3><code>POST /api/v1/unregister</code></h3>
+<p><strong>Auth</strong>: Required
+<strong>Scope</strong>: file-level</p>
+<p>Delete a registered file from the system. Supports single file by UUID, or batch by directory + regex pattern.</p>
+<h4>What gets deleted</h4>
+<table class="table">
+<thead>
+<tr>
+<th>Removed (default)</th>
+<th>Not removed</th>
+</tr>
+</thead>
+<tbody>
+<tr>
+<td>Database records (videos, chunks, embeddings, processor_results, pre_chunks)</td>
+<td>The original source video file on disk</td>
+</tr>
+<tr>
+<td>Processor output JSON files (<code>{uuid}.*.json</code>) — unless <code>delete_output_files: false</code></td>
+<td>Temp/working directories</td>
+</tr>
+<tr>
+<td>In-memory cache entries</td>
+<td></td>
+</tr>
+<tr>
+<td>MongoDB cached lists</td>
+<td></td>
+</tr>
+</tbody>
+</table>
+<blockquote>
+<p>⚠️ Database deletion is <strong>irreversible</strong>. To keep output files, set <code>"delete_output_files": false</code>.</p>
+</blockquote>
+<h4>Request Parameters</h4>
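+<p>At least one mode must be specified: either <code>file_uuid</code> alone (single file), or <code>file_path</code> + <code>pattern</code> together (batch). Fields marked <code>*</code> in the Required column are required only for the mode that uses them.</p>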
+<table class="table">
+<thead>
+<tr>
+<th>Field</th>
+<th>Type</th>
+<th>Required</th>
+<th>Default</th>
+<th>Description</th>
+</tr>
+</thead>
+<tbody>
+<tr>
+<td><code>file_uuid</code></td>
+<td>string</td>
+<td>*</td>
+<td>—</td>
+<td>Single file UUID to delete</td>
+</tr>
+<tr>
+<td><code>file_path</code></td>
+<td>string</td>
+<td>*</td>
+<td>—</td>
+<td>Directory path (for batch delete)</td>
+</tr>
+<tr>
+<td><code>pattern</code></td>
+<td>string</td>
+<td>*</td>
+<td>—</td>
+<td>Regex pattern (requires <code>file_path</code>)</td>
+</tr>
+<tr>
+<td><code>delete_output_files</code></td>
+<td>boolean</td>
+<td>No</td>
+<td><code>true</code></td>
+<td>If <code>true</code>, also delete processor output JSON files (<code>{uuid}.*.json</code>). Set to <code>false</code> to keep them.</td>
+</tr>
+</tbody>
+</table>
+<h4>Example</h4>
+<div class="codehilite"><pre><span></span><code><span class="c1"># Delete a single file by UUID (default: also deletes output JSON files)</span>
+curl<span class="w"> </span>-s<span class="w"> </span>-X<span class="w"> </span>POST<span class="w"> </span><span class="s2">&quot;</span><span class="nv">$API</span><span class="s2">/api/v1/unregister&quot;</span><span class="w"> </span><span class="se">\</span>
+<span class="w">  </span>-H<span class="w"> </span><span class="s2">&quot;Content-Type: application/json&quot;</span><span class="w"> </span><span class="se">\</span>
+<span class="w">  </span>-H<span class="w"> </span><span class="s2">&quot;X-API-Key: </span><span class="nv">$KEY</span><span class="s2">&quot;</span><span class="w"> </span><span class="se">\</span>
+<span class="w">  </span>-d<span class="w"> </span><span class="s1">&#39;{&quot;file_uuid&quot;: &quot;&#39;</span><span class="s2">&quot;</span><span class="nv">$FILE_UUID</span><span class="s2">&quot;</span><span class="s1">&#39;&quot;}&#39;</span>
+
+<span class="c1"># Keep output JSON files, only delete DB records</span>
+curl<span class="w"> </span>-s<span class="w"> </span>-X<span class="w"> </span>POST<span class="w"> </span><span class="s2">&quot;</span><span class="nv">$API</span><span class="s2">/api/v1/unregister&quot;</span><span class="w"> </span><span class="se">\</span>
+<span class="w">  </span>-H<span class="w"> </span><span class="s2">&quot;Content-Type: application/json&quot;</span><span class="w"> </span><span class="se">\</span>
+<span class="w">  </span>-H<span class="w"> </span><span class="s2">&quot;X-API-Key: </span><span class="nv">$KEY</span><span class="s2">&quot;</span><span class="w"> </span><span class="se">\</span>
+<span class="w">  </span>-d<span class="w"> </span><span class="s1">&#39;{&quot;file_uuid&quot;: &quot;&#39;</span><span class="s2">&quot;</span><span class="nv">$FILE_UUID</span><span class="s2">&quot;</span><span class="s1">&#39;&quot;, &quot;delete_output_files&quot;: false}&#39;</span>
+
+<span class="c1"># Batch delete all mp4 files in a directory</span>
+curl<span class="w"> </span>-s<span class="w"> </span>-X<span class="w"> </span>POST<span class="w"> </span><span class="s2">&quot;</span><span class="nv">$API</span><span class="s2">/api/v1/unregister&quot;</span><span class="w"> </span><span class="se">\</span>
+<span class="w">  </span>-H<span class="w"> </span><span class="s2">&quot;Content-Type: application/json&quot;</span><span class="w"> </span><span class="se">\</span>
+<span class="w">  </span>-H<span class="w"> </span><span class="s2">&quot;X-API-Key: </span><span class="nv">$KEY</span><span class="s2">&quot;</span><span class="w"> </span><span class="se">\</span>
+<span class="w">  </span>-d<span class="w"> </span><span class="s1">&#39;{&quot;file_path&quot;: &quot;/path/to/dir&quot;, &quot;pattern&quot;: &quot;.*\\.mp4$&quot;}&#39;</span>
+</code></pre></div>
+
+<h4>Response (200)</h4>
+<div class="codehilite"><pre><span></span><code><span class="p">{</span>
+<span class="w">  </span><span class="nt">&quot;success&quot;</span><span class="p">:</span><span class="w"> </span><span class="kc">true</span><span class="p">,</span>
+<span class="w">  </span><span class="nt">&quot;file_uuid&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;a03485a40b2df2d3&quot;</span><span class="p">,</span>
+<span class="w">  </span><span class="nt">&quot;message&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;Video unregistered successfully&quot;</span>
+<span class="p">}</span>
+</code></pre></div>
+
+<table class="table">
+<thead>
+<tr>
+<th>Field</th>
+<th>Type</th>
+<th>Description</th>
+</tr>
+</thead>
+<tbody>
+<tr>
+<td><code>success</code></td>
+<td>boolean</td>
+<td>True if deletion succeeded</td>
+</tr>
+<tr>
+<td><code>file_uuid</code></td>
+<td>string</td>
+<td>UUID of the deleted file (single mode)</td>
+</tr>
+<tr>
+<td><code>message</code></td>
+<td>string</td>
+<td>Human-readable status</td>
+</tr>
+</tbody>
+</table>
+<h4>Error Responses</h4>
+<table class="table">
+<thead>
+<tr>
+<th>HTTP</th>
+<th>When</th>
+</tr>
+</thead>
+<tbody>
+<tr>
+<td><code>400</code></td>
+<td>Neither <code>file_uuid</code> nor <code>file_path</code>+<code>pattern</code> provided</td>
+</tr>
+<tr>
+<td><code>404</code></td>
+<td>File UUID not found</td>
+</tr>
+<tr>
+<td><code>401</code></td>
+<td>Missing or invalid API key</td>
+</tr>
+</tbody>
+</table>
+<hr />
+<h2>Processing Pipeline</h2>
+<h3><code>POST /api/v1/file/:file_uuid/process</code></h3>
+<p><strong>Auth</strong>: Required
+<strong>Scope</strong>: file-level</p>
+<p>Trigger the processing pipeline for a registered file. Creates a monitor job that the worker picks up and processes sequentially. Returns immediately with the job info—processing runs asynchronously in the background.</p>
+<h4>Request Parameters</h4>
+<table class="table">
+<thead>
+<tr>
+<th>Field</th>
+<th>Type</th>
+<th>Required</th>
+<th>Default</th>
+<th>Description</th>
+</tr>
+</thead>
+<tbody>
+<tr>
+<td><code>processors</code></td>
+<td>string[]</td>
+<td>No</td>
+<td>all</td>
+<td>Specific processors to run: <code>["asr","cut","yolo","ocr","face","pose","asrx","visual_chunk"]</code></td>
+</tr>
+<tr>
+<td><code>rules</code></td>
+<td>string[]</td>
+<td>No</td>
+<td>all</td>
+<td>Rule names to apply (currently unused)</td>
+</tr>
+</tbody>
+</table>
+<h4>Example</h4>
+<div class="codehilite"><pre><span></span><code><span class="c1"># Run all processors</span>
+curl<span class="w"> </span>-s<span class="w"> </span>-X<span class="w"> </span>POST<span class="w"> </span><span class="s2">&quot;</span><span class="nv">$API</span><span class="s2">/api/v1/file/</span><span class="nv">$FILE_UUID</span><span class="s2">/process&quot;</span><span class="w"> </span><span class="se">\</span>
+<span class="w">  </span>-H<span class="w"> </span><span class="s2">&quot;Content-Type: application/json&quot;</span><span class="w"> </span><span class="se">\</span>
+<span class="w">  </span>-H<span class="w"> </span><span class="s2">&quot;X-API-Key: </span><span class="nv">$KEY</span><span class="s2">&quot;</span><span class="w"> </span>-d<span class="w"> </span><span class="s1">&#39;{}&#39;</span>
+
+<span class="c1"># Run specific processors only</span>
+curl<span class="w"> </span>-s<span class="w"> </span>-X<span class="w"> </span>POST<span class="w"> </span><span class="s2">&quot;</span><span class="nv">$API</span><span class="s2">/api/v1/file/</span><span class="nv">$FILE_UUID</span><span class="s2">/process&quot;</span><span class="w"> </span><span class="se">\</span>
+<span class="w">  </span>-H<span class="w"> </span><span class="s2">&quot;Content-Type: application/json&quot;</span><span class="w"> </span><span class="se">\</span>
+<span class="w">  </span>-H<span class="w"> </span><span class="s2">&quot;X-API-Key: </span><span class="nv">$KEY</span><span class="s2">&quot;</span><span class="w"> </span><span class="se">\</span>
+<span class="w">  </span>-d<span class="w"> </span><span class="s1">&#39;{&quot;processors&quot;: [&quot;asr&quot;, &quot;face&quot;, &quot;yolo&quot;]}&#39;</span>
+</code></pre></div>
+
+<h4>Response (200)</h4>
+<div class="codehilite"><pre><span></span><code><span class="p">{</span>
+<span class="w">  </span><span class="nt">&quot;success&quot;</span><span class="p">:</span><span class="w"> </span><span class="kc">true</span><span class="p">,</span>
+<span class="w">  </span><span class="nt">&quot;job_id&quot;</span><span class="p">:</span><span class="w"> </span><span class="mi">42</span><span class="p">,</span>
+<span class="w">  </span><span class="nt">&quot;file_uuid&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;3a6c1865...&quot;</span><span class="p">,</span>
+<span class="w">  </span><span class="nt">&quot;status&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;processing&quot;</span><span class="p">,</span>
+<span class="w">  </span><span class="nt">&quot;pids&quot;</span><span class="p">:</span><span class="w"> </span><span class="p">[</span><span class="mi">12345</span><span class="p">,</span><span class="w"> </span><span class="mi">12346</span><span class="p">],</span>
+<span class="w">  </span><span class="nt">&quot;message&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;Processing triggered for video.mp4&quot;</span>
+<span class="p">}</span>
+</code></pre></div>
+
+<table class="table">
+<thead>
+<tr>
+<th>Field</th>
+<th>Type</th>
+<th>Description</th>
+</tr>
+</thead>
+<tbody>
+<tr>
+<td><code>success</code></td>
+<td>boolean</td>
+<td>Always true on 200</td>
+</tr>
+<tr>
+<td><code>job_id</code></td>
+<td>integer</td>
+<td>Monitor job ID (for job tracking)</td>
+</tr>
+<tr>
+<td><code>file_uuid</code></td>
+<td>string</td>
+<td>32-char hex UUID of the file</td>
+</tr>
+<tr>
+<td><code>status</code></td>
+<td>string</td>
+<td><code>"processing"</code></td>
+</tr>
+<tr>
+<td><code>pids</code></td>
+<td>integer[]</td>
+<td>Process IDs of started processors</td>
+</tr>
+<tr>
+<td><code>message</code></td>
+<td>string</td>
+<td>Human-readable status</td>
+</tr>
+</tbody>
+</table>
+<h4>Error Responses</h4>
+<table class="table">
+<thead>
+<tr>
+<th>HTTP</th>
+<th>When</th>
+</tr>
+</thead>
+<tbody>
+<tr>
+<td><code>404</code></td>
+<td>File UUID not found</td>
+</tr>
+<tr>
+<td><code>401</code></td>
+<td>Missing or invalid API key</td>
+</tr>
+</tbody>
+</table>
+<hr />
+<h3><code>GET /api/v1/file/:file_uuid/probe</code></h3>
+<p><strong>Auth</strong>: Required
+<strong>Scope</strong>: file-level</p>
+<p>Get ffprobe metadata for a registered file. Returns video/audio stream info, codec details, duration, resolution, and frame rate.</p>
+<h4>Example</h4>
+<div class="codehilite"><pre><span></span><code>curl<span class="w"> </span>-s<span class="w"> </span><span class="s2">&quot;</span><span class="nv">$API</span><span class="s2">/api/v1/file/</span><span class="nv">$FILE_UUID</span><span class="s2">/probe&quot;</span><span class="w"> </span>-H<span class="w"> </span><span class="s2">&quot;X-API-Key: </span><span class="nv">$KEY</span><span class="s2">&quot;</span>
+</code></pre></div>
+
+<h4>Response (200)</h4>
+<div class="codehilite"><pre><span></span><code><span class="p">{</span>
+<span class="w">  </span><span class="nt">&quot;file_uuid&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;3a6c1865...&quot;</span><span class="p">,</span>
+<span class="w">  </span><span class="nt">&quot;file_name&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;video.mp4&quot;</span><span class="p">,</span>
+<span class="w">  </span><span class="nt">&quot;file_size&quot;</span><span class="p">:</span><span class="w"> </span><span class="mi">12345678</span><span class="p">,</span>
+<span class="w">  </span><span class="nt">&quot;duration&quot;</span><span class="p">:</span><span class="w"> </span><span class="mf">120.5</span><span class="p">,</span>
+<span class="w">  </span><span class="nt">&quot;width&quot;</span><span class="p">:</span><span class="w"> </span><span class="mi">1920</span><span class="p">,</span>
+<span class="w">  </span><span class="nt">&quot;height&quot;</span><span class="p">:</span><span class="w"> </span><span class="mi">1080</span><span class="p">,</span>
+<span class="w">  </span><span class="nt">&quot;fps&quot;</span><span class="p">:</span><span class="w"> </span><span class="mf">24.0</span><span class="p">,</span>
+<span class="w">  </span><span class="nt">&quot;total_frames&quot;</span><span class="p">:</span><span class="w"> </span><span class="mi">2892</span><span class="p">,</span>
+<span class="w">  </span><span class="nt">&quot;cached&quot;</span><span class="p">:</span><span class="w"> </span><span class="kc">true</span><span class="p">,</span>
+<span class="w">  </span><span class="nt">&quot;format&quot;</span><span class="p">:</span><span class="w"> </span><span class="p">{</span>
+<span class="w">    </span><span class="nt">&quot;filename&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;/path/to/video.mp4&quot;</span><span class="p">,</span>
+<span class="w">    </span><span class="nt">&quot;format_name&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;mov,mp4,m4a,3gp&quot;</span><span class="p">,</span>
+<span class="w">    </span><span class="nt">&quot;duration&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;120.5&quot;</span><span class="p">,</span>
+<span class="w">    </span><span class="nt">&quot;size&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;12345678&quot;</span><span class="p">,</span>
+<span class="w">    </span><span class="nt">&quot;bit_rate&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;819200&quot;</span>
+<span class="w">  </span><span class="p">},</span>
+<span class="w">  </span><span class="nt">&quot;streams&quot;</span><span class="p">:</span><span class="w"> </span><span class="p">[</span>
+<span class="w">    </span><span class="p">{</span>
+<span class="w">      </span><span class="nt">&quot;index&quot;</span><span class="p">:</span><span class="w"> </span><span class="mi">0</span><span class="p">,</span>
+<span class="w">      </span><span class="nt">&quot;codec_name&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;h264&quot;</span><span class="p">,</span>
+<span class="w">      </span><span class="nt">&quot;codec_type&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;video&quot;</span><span class="p">,</span>
+<span class="w">      </span><span class="nt">&quot;width&quot;</span><span class="p">:</span><span class="w"> </span><span class="mi">1920</span><span class="p">,</span>
+<span class="w">      </span><span class="nt">&quot;height&quot;</span><span class="p">:</span><span class="w"> </span><span class="mi">1080</span><span class="p">,</span>
+<span class="w">      </span><span class="nt">&quot;r_frame_rate&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;24/1&quot;</span><span class="p">,</span>
+<span class="w">      </span><span class="nt">&quot;duration&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;120.5&quot;</span>
+<span class="w">    </span><span class="p">}</span>
+<span class="w">  </span><span class="p">]</span>
+<span class="p">}</span>
+</code></pre></div>
+
+<table class="table">
+<thead>
+<tr>
+<th>Field</th>
+<th>Type</th>
+<th>Description</th>
+</tr>
+</thead>
+<tbody>
+<tr>
+<td><code>file_uuid</code></td>
+<td>string</td>
+<td>32-char hex UUID</td>
+</tr>
+<tr>
+<td><code>file_name</code></td>
+<td>string</td>
+<td>File name</td>
+</tr>
+<tr>
+<td><code>file_size</code></td>
+<td>integer</td>
+<td>File size in bytes (from filesystem)</td>
+</tr>
+<tr>
+<td><code>duration</code></td>
+<td>float</td>
+<td>Duration in seconds</td>
+</tr>
+<tr>
+<td><code>width</code></td>
+<td>integer</td>
+<td>Video width in pixels</td>
+</tr>
+<tr>
+<td><code>height</code></td>
+<td>integer</td>
+<td>Video height in pixels</td>
+</tr>
+<tr>
+<td><code>fps</code></td>
+<td>float</td>
+<td>Frames per second</td>
+</tr>
+<tr>
+<td><code>total_frames</code></td>
+<td>integer</td>
+<td>Estimated total frames</td>
+</tr>
+<tr>
+<td><code>cached</code></td>
+<td>boolean</td>
+<td>True if the result was served from cached probe JSON</td>
+</tr>
+<tr>
+<td><code>format</code></td>
+<td>object</td>
+<td>Container format info (ffprobe format section)</td>
+</tr>
+<tr>
+<td><code>streams</code></td>
+<td>array</td>
+<td>Array of stream info objects</td>
+</tr>
+</tbody>
+</table>
+<hr />
+<h3><code>GET /api/v1/progress/:file_uuid</code></h3>
+<p><strong>Auth</strong>: Required
+<strong>Scope</strong>: file-level</p>
+<p>Get real-time processing progress for a file. Queries Redis for per-processor status and the database for file metadata. Also includes system resource stats.</p>
+<h4>Example</h4>
+<div class="codehilite"><pre><span></span><code>curl<span class="w"> </span>-s<span class="w"> </span><span class="s2">&quot;</span><span class="nv">$API</span><span class="s2">/api/v1/progress/</span><span class="nv">$FILE_UUID</span><span class="s2">&quot;</span><span class="w"> </span>-H<span class="w"> </span><span class="s2">&quot;X-API-Key: </span><span class="nv">$KEY</span><span class="s2">&quot;</span><span class="w"> </span><span class="p">|</span><span class="w"> </span>jq<span class="w"> </span><span class="s1">&#39;{overall_progress, processors: [.processors[] | {processor_type, status}]}&#39;</span>
+</code></pre></div>
+
+<h4>Response (200)</h4>
+<div class="codehilite"><pre><span></span><code><span class="p">{</span>
+<span class="w">  </span><span class="nt">&quot;file_uuid&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;3a6c1865...&quot;</span><span class="p">,</span>
+<span class="w">  </span><span class="nt">&quot;overall_progress&quot;</span><span class="p">:</span><span class="w"> </span><span class="mi">71</span><span class="p">,</span>
+<span class="w">  </span><span class="nt">&quot;cpu_percent&quot;</span><span class="p">:</span><span class="w"> </span><span class="mf">45.2</span><span class="p">,</span>
+<span class="w">  </span><span class="nt">&quot;gpu_percent&quot;</span><span class="p">:</span><span class="w"> </span><span class="mf">30.1</span><span class="p">,</span>
+<span class="w">  </span><span class="nt">&quot;memory_percent&quot;</span><span class="p">:</span><span class="w"> </span><span class="mf">62.4</span><span class="p">,</span>
+<span class="w">  </span><span class="nt">&quot;processors&quot;</span><span class="p">:</span><span class="w"> </span><span class="p">[</span>
+<span class="w">    </span><span class="p">{</span><span class="nt">&quot;processor_type&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;asr&quot;</span><span class="p">,</span><span class="w"> </span><span class="nt">&quot;status&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;complete&quot;</span><span class="p">,</span><span class="w"> </span><span class="nt">&quot;progress&quot;</span><span class="p">:</span><span class="w"> </span><span class="mi">100</span><span class="p">},</span>
+<span class="w">    </span><span class="p">{</span><span class="nt">&quot;processor_type&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;yolo&quot;</span><span class="p">,</span><span class="w"> </span><span class="nt">&quot;status&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;running&quot;</span><span class="p">,</span><span class="w"> </span><span class="nt">&quot;progress&quot;</span><span class="p">:</span><span class="w"> </span><span class="mi">65</span><span class="p">},</span>
+<span class="w">    </span><span class="p">{</span><span class="nt">&quot;processor_type&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;face&quot;</span><span class="p">,</span><span class="w"> </span><span class="nt">&quot;status&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;pending&quot;</span><span class="p">,</span><span class="w"> </span><span class="nt">&quot;progress&quot;</span><span class="p">:</span><span class="w"> </span><span class="mi">0</span><span class="p">}</span>
+<span class="w">  </span><span class="p">]</span>
+<span class="p">}</span>
+</code></pre></div>
+
+<table class="table">
+<thead>
+<tr>
+<th>Field</th>
+<th>Type</th>
+<th>Description</th>
+</tr>
+</thead>
+<tbody>
+<tr>
+<td><code>file_uuid</code></td>
+<td>string</td>
+<td>32-char hex UUID</td>
+</tr>
+<tr>
+<td><code>overall_progress</code></td>
+<td>integer</td>
+<td>Overall progress percentage (0–100)</td>
+</tr>
+<tr>
+<td><code>processors</code></td>
+<td>array</td>
+<td>Per-processor status list</td>
+</tr>
+<tr>
+<td><code>processors[].processor_type</code></td>
+<td>string</td>
+<td>Processor name (<code>asr</code>, <code>cut</code>, <code>yolo</code>, etc.)</td>
+</tr>
+<tr>
+<td><code>processors[].status</code></td>
+<td>string</td>
+<td><code>"pending"</code>, <code>"running"</code>, <code>"complete"</code>, or <code>"failed"</code></td>
+</tr>
+<tr>
+<td><code>processors[].progress</code></td>
+<td>integer</td>
+<td>Per-processor progress (0–100)</td>
+</tr>
+<tr>
+<td><code>cpu_percent</code></td>
+<td>float</td>
+<td>Current CPU usage</td>
+</tr>
+<tr>
+<td><code>gpu_percent</code></td>
+<td>float</td>
+<td>Current GPU utilization</td>
+</tr>
+<tr>
+<td><code>memory_percent</code></td>
+<td>float</td>
+<td>Current memory usage</td>
+</tr>
+</tbody>
+</table>
+<hr />
+<h3><code>GET /api/v1/jobs</code></h3>
+<p><strong>Auth</strong>: Required
+<strong>Scope</strong>: system-level</p>
+<p>List all processing jobs (monitor jobs) in the system. Shows job status, which file each job is processing, and current processor info.</p>
+<h4>Example</h4>
+<div class="codehilite"><pre><span></span><code>curl<span class="w"> </span>-s<span class="w"> </span><span class="s2">&quot;</span><span class="nv">$API</span><span class="s2">/api/v1/jobs&quot;</span><span class="w"> </span>-H<span class="w"> </span><span class="s2">&quot;X-API-Key: </span><span class="nv">$KEY</span><span class="s2">&quot;</span><span class="w"> </span><span class="p">|</span><span class="w"> </span>jq<span class="w"> </span><span class="s1">&#39;{count, jobs: [.jobs[] | {uuid, status}]}&#39;</span>
+</code></pre></div>
+
+<h4>Response (200)</h4>
+<div class="codehilite"><pre><span></span><code><span class="p">{</span>
+<span class="w">  </span><span class="nt">&quot;jobs&quot;</span><span class="p">:</span><span class="w"> </span><span class="p">[</span>
+<span class="w">    </span><span class="p">{</span>
+<span class="w">      </span><span class="nt">&quot;id&quot;</span><span class="p">:</span><span class="w"> </span><span class="mi">42</span><span class="p">,</span>
+<span class="w">      </span><span class="nt">&quot;uuid&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;3a6c1865...&quot;</span><span class="p">,</span>
+<span class="w">      </span><span class="nt">&quot;status&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;running&quot;</span><span class="p">,</span>
+<span class="w">      </span><span class="nt">&quot;current_processor&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;yolo&quot;</span><span class="p">,</span>
+<span class="w">      </span><span class="nt">&quot;created_at&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;2026-05-16T12:00:00Z&quot;</span><span class="p">,</span>
+<span class="w">      </span><span class="nt">&quot;started_at&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;2026-05-16T12:01:00Z&quot;</span>
+<span class="w">    </span><span class="p">}</span>
+<span class="w">  </span><span class="p">],</span>
+<span class="w">  </span><span class="nt">&quot;count&quot;</span><span class="p">:</span><span class="w"> </span><span class="mi">15</span><span class="p">,</span>
+<span class="w">  </span><span class="nt">&quot;page&quot;</span><span class="p">:</span><span class="w"> </span><span class="mi">1</span><span class="p">,</span>
+<span class="w">  </span><span class="nt">&quot;page_size&quot;</span><span class="p">:</span><span class="w"> </span><span class="mi">20</span>
+<span class="p">}</span>
+</code></pre></div>
+
+<table class="table">
+<thead>
+<tr>
+<th>Field</th>
+<th>Type</th>
+<th>Description</th>
+</tr>
+</thead>
+<tbody>
+<tr>
+<td><code>jobs</code></td>
+<td>array</td>
+<td>Array of job info objects</td>
+</tr>
+<tr>
+<td><code>jobs[].id</code></td>
+<td>integer</td>
+<td>Job ID</td>
+</tr>
+<tr>
+<td><code>jobs[].uuid</code></td>
+<td>string</td>
+<td>File UUID being processed</td>
+</tr>
+<tr>
+<td><code>jobs[].status</code></td>
+<td>string</td>
+<td><code>"pending"</code>, <code>"running"</code>, <code>"completed"</code>, <code>"failed"</code></td>
+</tr>
+<tr>
+<td><code>jobs[].current_processor</code></td>
+<td>string</td>
+<td>Currently active processor, or null</td>
+</tr>
+<tr>
+<td><code>count</code></td>
+<td>integer</td>
+<td>Total job count</td>
+</tr>
+<tr>
+<td><code>page</code></td>
+<td>integer</td>
+<td>Current page number</td>
+</tr>
+<tr>
+<td><code>page_size</code></td>
+<td>integer</td>
+<td>Jobs per page</td>
+</tr>
+</tbody>
+</table>
+<hr />
+<h2>Search APIs</h2>
+<h3>Standard Search</h3>
+<h3><code>POST /api/v1/search</code></h3>
+<p><strong>Auth</strong>: Required
+<strong>Scope</strong>: file-level</p>
+<p>Semantic/vector search across indexed video chunks. Returns matching chunks with scores.</p>
+<h4>Request Parameters</h4>
+<table class="table">
+<thead>
+<tr>
+<th>Field</th>
+<th>Type</th>
+<th>Required</th>
+<th>Default</th>
+<th>Description</th>
+</tr>
+</thead>
+<tbody>
+<tr>
+<td><code>query</code></td>
+<td>string</td>
+<td>Yes</td>
+<td>—</td>
+<td>Search text</td>
+</tr>
+<tr>
+<td><code>file_uuid</code></td>
+<td>string</td>
+<td>No</td>
+<td>—</td>
+<td>Restrict search to a specific file</td>
+</tr>
+<tr>
+<td><code>limit</code></td>
+<td>integer</td>
+<td>No</td>
+<td>10</td>
+<td>Max results</td>
+</tr>
+<tr>
+<td><code>page</code></td>
+<td>integer</td>
+<td>No</td>
+<td>1</td>
+<td>Page number (1-based)</td>
+</tr>
+<tr>
+<td><code>page_size</code></td>
+<td>integer</td>
+<td>No</td>
+<td><code>limit</code></td>
+<td>Items per page; defaults to the value of <code>limit</code></td>
+</tr>
+<tr>
+<td><code>mode</code></td>
+<td>string</td>
+<td>No</td>
+<td><code>smart</code></td>
+<td>Search mode: <code>"vector"</code> or <code>"smart"</code></td>
+</tr>
+</tbody>
+</table>
+<h4>Example</h4>
+<div class="codehilite"><pre><span></span><code><span class="c1"># Search across all files</span>
+curl<span class="w"> </span>-s<span class="w"> </span>-X<span class="w"> </span>POST<span class="w"> </span><span class="s2">&quot;</span><span class="nv">$API</span><span class="s2">/api/v1/search&quot;</span><span class="w"> </span><span class="se">\</span>
+<span class="w">  </span>-H<span class="w"> </span><span class="s2">&quot;Content-Type: application/json&quot;</span><span class="w"> </span><span class="se">\</span>
+<span class="w">  </span>-H<span class="w"> </span><span class="s2">&quot;X-API-Key: </span><span class="nv">$KEY</span><span class="s2">&quot;</span><span class="w"> </span><span class="se">\</span>
+<span class="w">  </span>-d<span class="w"> </span><span class="s1">&#39;{&quot;query&quot;: &quot;charade&quot;, &quot;limit&quot;: 5}&#39;</span>
+
+<span class="c1"># Search within a specific file</span>
+curl<span class="w"> </span>-s<span class="w"> </span>-X<span class="w"> </span>POST<span class="w"> </span><span class="s2">&quot;</span><span class="nv">$API</span><span class="s2">/api/v1/search&quot;</span><span class="w"> </span><span class="se">\</span>
+<span class="w">  </span>-H<span class="w"> </span><span class="s2">&quot;Content-Type: application/json&quot;</span><span class="w"> </span><span class="se">\</span>
+<span class="w">  </span>-H<span class="w"> </span><span class="s2">&quot;X-API-Key: </span><span class="nv">$KEY</span><span class="s2">&quot;</span><span class="w"> </span><span class="se">\</span>
+<span class="w">  </span>-d<span class="w"> </span><span class="s1">&#39;{&quot;query&quot;: &quot;charade&quot;, &quot;file_uuid&quot;: &quot;&#39;</span><span class="s2">&quot;</span><span class="nv">$FILE_UUID</span><span class="s2">&quot;</span><span class="s1">&#39;&quot;}&#39;</span>
+
+<span class="c1"># Paginated search</span>
+curl<span class="w"> </span>-s<span class="w"> </span>-X<span class="w"> </span>POST<span class="w"> </span><span class="s2">&quot;</span><span class="nv">$API</span><span class="s2">/api/v1/search&quot;</span><span class="w"> </span><span class="se">\</span>
+<span class="w">  </span>-H<span class="w"> </span><span class="s2">&quot;Content-Type: application/json&quot;</span><span class="w"> </span><span class="se">\</span>
+<span class="w">  </span>-H<span class="w"> </span><span class="s2">&quot;X-API-Key: </span><span class="nv">$KEY</span><span class="s2">&quot;</span><span class="w"> </span><span class="se">\</span>
+<span class="w">  </span>-d<span class="w"> </span><span class="s1">&#39;{&quot;query&quot;: &quot;charade&quot;, &quot;page&quot;: 1, &quot;page_size&quot;: 3}&#39;</span>
+</code></pre></div>
+
+<h4>Response (200)</h4>
+<div class="codehilite"><pre><span></span><code><span class="p">{</span>
+<span class="w">  </span><span class="nt">&quot;results&quot;</span><span class="p">:</span><span class="w"> </span><span class="p">[</span>
+<span class="w">    </span><span class="p">{</span>
+<span class="w">      </span><span class="nt">&quot;uuid&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;3a6c1865...&quot;</span><span class="p">,</span>
+<span class="w">      </span><span class="nt">&quot;chunk_id&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;sentence_0012&quot;</span><span class="p">,</span>
+<span class="w">      </span><span class="nt">&quot;chunk_type&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;sentence&quot;</span><span class="p">,</span>
+<span class="w">      </span><span class="nt">&quot;start_time&quot;</span><span class="p">:</span><span class="w"> </span><span class="mf">48.8</span><span class="p">,</span>
+<span class="w">      </span><span class="nt">&quot;end_time&quot;</span><span class="p">:</span><span class="w"> </span><span class="mf">55.4</span><span class="p">,</span>
+<span class="w">      </span><span class="nt">&quot;text&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;charade is a classic film...&quot;</span><span class="p">,</span>
+<span class="w">      </span><span class="nt">&quot;score&quot;</span><span class="p">:</span><span class="w"> </span><span class="mf">0.92</span>
+<span class="w">    </span><span class="p">}</span>
+<span class="w">  </span><span class="p">],</span>
+<span class="w">  </span><span class="nt">&quot;query&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;charade&quot;</span><span class="p">,</span>
+<span class="w">  </span><span class="nt">&quot;total&quot;</span><span class="p">:</span><span class="w"> </span><span class="mi">15</span><span class="p">,</span>
+<span class="w">  </span><span class="nt">&quot;page&quot;</span><span class="p">:</span><span class="w"> </span><span class="mi">1</span><span class="p">,</span>
+<span class="w">  </span><span class="nt">&quot;page_size&quot;</span><span class="p">:</span><span class="w"> </span><span class="mi">3</span>
+<span class="p">}</span>
+</code></pre></div>
+
+<blockquote>
+<p>Results are deduplicated by <code>chunk_id</code> (highest score wins) before pagination.</p>
+</blockquote>
+<table class="table">
+<thead>
+<tr>
+<th>Field</th>
+<th>Type</th>
+<th>Description</th>
+</tr>
+</thead>
+<tbody>
+<tr>
+<td><code>results</code></td>
+<td>array</td>
+<td>Array of matched chunks (deduplicated)</td>
+</tr>
+<tr>
+<td><code>results[].uuid</code></td>
+<td>string</td>
+<td>File UUID</td>
+</tr>
+<tr>
+<td><code>results[].chunk_id</code></td>
+<td>string</td>
+<td>Chunk identifier</td>
+</tr>
+<tr>
+<td><code>results[].chunk_type</code></td>
+<td>string</td>
+<td><code>"sentence"</code>, <code>"cut"</code>, <code>"trace"</code>, <code>"visual"</code></td>
+</tr>
+<tr>
+<td><code>results[].start_time</code></td>
+<td>float</td>
+<td>Start time in seconds</td>
+</tr>
+<tr>
+<td><code>results[].end_time</code></td>
+<td>float</td>
+<td>End time in seconds</td>
+</tr>
+<tr>
+<td><code>results[].text</code></td>
+<td>string</td>
+<td>Chunk text content</td>
+</tr>
+<tr>
+<td><code>results[].score</code></td>
+<td>float</td>
+<td>Similarity score (0.0–1.0)</td>
+</tr>
+<tr>
+<td><code>query</code></td>
+<td>string</td>
+<td>Original search query</td>
+</tr>
+<tr>
+<td><code>total</code></td>
+<td>integer</td>
+<td>Total matching results</td>
+</tr>
+<tr>
+<td><code>page</code></td>
+<td>integer</td>
+<td>Current page number</td>
+</tr>
+<tr>
+<td><code>page_size</code></td>
+<td>integer</td>
+<td>Items per page</td>
+</tr>
+</tbody>
+</table>
+<h4>Error Responses</h4>
+<table class="table">
+<thead>
+<tr>
+<th>HTTP</th>
+<th>When</th>
+</tr>
+</thead>
+<tbody>
+<tr>
+<td><code>401</code></td>
+<td>Missing or invalid API key</td>
+</tr>
+</tbody>
+</table>
+<hr />
+<h3><code>POST /api/v1/search/hybrid</code></h3>
+<p><strong>Auth</strong>: Required
+<strong>Scope</strong>: file-level</p>
+<p>Hybrid search combining vector similarity score and BM25 text score into a combined score.</p>
+<h4>Request Parameters</h4>
+<table class="table">
+<thead>
+<tr>
+<th>Field</th>
+<th>Type</th>
+<th>Required</th>
+<th>Default</th>
+<th>Description</th>
+</tr>
+</thead>
+<tbody>
+<tr>
+<td><code>query</code></td>
+<td>string</td>
+<td>Yes</td>
+<td>—</td>
+<td>Search text</td>
+</tr>
+<tr>
+<td><code>file_uuid</code></td>
+<td>string</td>
+<td>No</td>
+<td>—</td>
+<td>Restrict search to a specific file</td>
+</tr>
+<tr>
+<td><code>limit</code></td>
+<td>integer</td>
+<td>No</td>
+<td>10</td>
+<td>Max results</td>
+</tr>
+<tr>
+<td><code>page</code></td>
+<td>integer</td>
+<td>No</td>
+<td>1</td>
+<td>Page number (1-based)</td>
+</tr>
+<tr>
+<td><code>page_size</code></td>
+<td>integer</td>
+<td>No</td>
+<td><code>limit</code></td>
+<td>Items per page</td>
+</tr>
+<tr>
+<td><code>vector_weight</code></td>
+<td>float</td>
+<td>No</td>
+<td>0.5</td>
+<td>Weight for vector score (0.0–1.0)</td>
+</tr>
+<tr>
+<td><code>bm25_weight</code></td>
+<td>float</td>
+<td>No</td>
+<td>0.5</td>
+<td>Weight for BM25 score (0.0–1.0)</td>
+</tr>
+</tbody>
+</table>
+<h4>Response</h4>
+<div class="codehilite"><pre><span></span><code><span class="p">{</span>
+<span class="w">  </span><span class="nt">&quot;results&quot;</span><span class="p">:</span><span class="w"> </span><span class="p">[</span>
+<span class="w">    </span><span class="p">{</span>
+<span class="w">      </span><span class="nt">&quot;uuid&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;3a6c1865...&quot;</span><span class="p">,</span>
+<span class="w">      </span><span class="nt">&quot;chunk_id&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;sentence_0012&quot;</span><span class="p">,</span>
+<span class="w">      </span><span class="nt">&quot;chunk_type&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;sentence&quot;</span><span class="p">,</span>
+<span class="w">      </span><span class="nt">&quot;start_time&quot;</span><span class="p">:</span><span class="w"> </span><span class="mf">48.8</span><span class="p">,</span>
+<span class="w">      </span><span class="nt">&quot;end_time&quot;</span><span class="p">:</span><span class="w"> </span><span class="mf">55.4</span><span class="p">,</span>
+<span class="w">      </span><span class="nt">&quot;text&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;charade is a classic film...&quot;</span><span class="p">,</span>
+<span class="w">      </span><span class="nt">&quot;vector_score&quot;</span><span class="p">:</span><span class="w"> </span><span class="mf">0.85</span><span class="p">,</span>
+<span class="w">      </span><span class="nt">&quot;bm25_score&quot;</span><span class="p">:</span><span class="w"> </span><span class="mf">0.72</span><span class="p">,</span>
+<span class="w">      </span><span class="nt">&quot;combined_score&quot;</span><span class="p">:</span><span class="w"> </span><span class="mf">0.79</span>
+<span class="w">    </span><span class="p">}</span>
+<span class="w">  </span><span class="p">],</span>
+<span class="w">  </span><span class="nt">&quot;query&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;charade&quot;</span>
+<span class="p">}</span>
+</code></pre></div>
+
+<table class="table">
+<thead>
+<tr>
+<th>Field</th>
+<th>Type</th>
+<th>Description</th>
+</tr>
+</thead>
+<tbody>
+<tr>
+<td><code>results[].vector_score</code></td>
+<td>float</td>
+<td>Vector similarity score</td>
+</tr>
+<tr>
+<td><code>results[].bm25_score</code></td>
+<td>float</td>
+<td>BM25 text score</td>
+</tr>
+<tr>
+<td><code>results[].combined_score</code></td>
+<td>float</td>
+<td>Weighted combination of both scores</td>
+</tr>
+</tbody>
+</table>
+<hr />
+<h3><code>POST /api/v1/search/bm25</code></h3>
+<p><strong>Auth</strong>: Required
+<strong>Scope</strong>: file-level</p>
+<p>BM25 full-text keyword search. Good for exact term matching. Returns results with BM25 score only.</p>
+<h4>Request Parameters</h4>
+<p>Same as standard search: <code>query</code>, <code>file_uuid</code>, <code>limit</code>.</p>
+<h4>Response</h4>
+<p>Returns the same structure as standard search, with <code>score</code> representing the BM25 relevance score.</p>
+<hr />
+<h3>N8N Search</h3>
+<p>N8N-format search endpoints. Response format is optimized for n8n workflow consumption.</p>
+<table class="table">
+<thead>
+<tr>
+<th>Method</th>
+<th>Endpoint</th>
+<th>Description</th>
+</tr>
+</thead>
+<tbody>
+<tr>
+<td>POST</td>
+<td><code>/api/v1/n8n/search</code></td>
+<td>N8N-format vector search</td>
+</tr>
+<tr>
+<td>POST</td>
+<td><code>/api/v1/n8n/search/bm25</code></td>
+<td>N8N-format BM25 search</td>
+</tr>
+<tr>
+<td>POST</td>
+<td><code>/api/v1/n8n/search/hybrid</code></td>
+<td>N8N-format hybrid search</td>
+</tr>
+<tr>
+<td>POST</td>
+<td><code>/api/v1/n8n/search/smart</code></td>
+<td>N8N-format smart search</td>
+</tr>
+</tbody>
+</table>
+<h4>Request Parameters</h4>
+<table class="table">
+<thead>
+<tr>
+<th>Field</th>
+<th>Type</th>
+<th>Required</th>
+<th>Default</th>
+<th>Description</th>
+</tr>
+</thead>
+<tbody>
+<tr>
+<td><code>query</code></td>
+<td>string</td>
+<td>Yes</td>
+<td>—</td>
+<td>Search text</td>
+</tr>
+<tr>
+<td><code>file_uuid</code></td>
+<td>string</td>
+<td>No</td>
+<td>—</td>
+<td>Restrict to specific file</td>
+</tr>
+<tr>
+<td><code>types</code></td>
+<td>string[]</td>
+<td>No</td>
+<td><code>["chunk"]</code></td>
+<td>Search types: <code>chunk</code>, <code>frame</code>, <code>person</code></td>
+</tr>
+<tr>
+<td><code>filters</code></td>
+<td>object</td>
+<td>No</td>
+<td>—</td>
+<td>Filter criteria (confidence, object class, speaker, etc.)</td>
+</tr>
+<tr>
+<td><code>page</code></td>
+<td>integer</td>
+<td>No</td>
+<td>1</td>
+<td>Page number</td>
+</tr>
+<tr>
+<td><code>page_size</code></td>
+<td>integer</td>
+<td>No</td>
+<td>20</td>
+<td>Items per page</td>
+</tr>
+<tr>
+<td><code>time_range</code></td>
+<td>float[2]</td>
+<td>No</td>
+<td>—</td>
+<td>Time range <code>[start, end]</code> in seconds</td>
+</tr>
+</tbody>
+</table>
+<h4>Example</h4>
+<div class="codehilite"><pre><span></span><code>curl<span class="w"> </span>-s<span class="w"> </span>-X<span class="w"> </span>POST<span class="w"> </span><span class="s2">&quot;</span><span class="nv">$API</span><span class="s2">/api/v1/n8n/search&quot;</span><span class="w"> </span><span class="se">\</span>
+<span class="w">  </span>-H<span class="w"> </span><span class="s2">&quot;Content-Type: application/json&quot;</span><span class="w"> </span><span class="se">\</span>
+<span class="w">  </span>-H<span class="w"> </span><span class="s2">&quot;X-API-Key: </span><span class="nv">$KEY</span><span class="s2">&quot;</span><span class="w"> </span><span class="se">\</span>
+<span class="w">  </span>-d<span class="w"> </span><span class="s1">&#39;{&quot;query&quot;: &quot;charade&quot;, &quot;page&quot;: 1, &quot;page_size&quot;: 20}&#39;</span>
+</code></pre></div>
+
+<h4>Response (200)</h4>
+<div class="codehilite"><pre><span></span><code><span class="p">{</span>
+<span class="w">  </span><span class="nt">&quot;query&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;charade&quot;</span><span class="p">,</span>
+<span class="w">  </span><span class="nt">&quot;results&quot;</span><span class="p">:</span><span class="w"> </span><span class="p">[</span>
+<span class="w">    </span><span class="p">{</span>
+<span class="w">      </span><span class="nt">&quot;type&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;chunk&quot;</span><span class="p">,</span>
+<span class="w">      </span><span class="nt">&quot;chunk_id&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;sentence_0012&quot;</span><span class="p">,</span>
+<span class="w">      </span><span class="nt">&quot;chunk_type&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;sentence&quot;</span><span class="p">,</span>
+<span class="w">      </span><span class="nt">&quot;file_uuid&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;3a6c1865...&quot;</span><span class="p">,</span>
+<span class="w">      </span><span class="nt">&quot;start_time&quot;</span><span class="p">:</span><span class="w"> </span><span class="mf">48.8</span><span class="p">,</span>
+<span class="w">      </span><span class="nt">&quot;end_time&quot;</span><span class="p">:</span><span class="w"> </span><span class="mf">55.4</span><span class="p">,</span>
+<span class="w">      </span><span class="nt">&quot;text&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;charade is a classic film...&quot;</span><span class="p">,</span>
+<span class="w">      </span><span class="nt">&quot;score&quot;</span><span class="p">:</span><span class="w"> </span><span class="mf">0.92</span>
+<span class="w">    </span><span class="p">}</span>
+<span class="w">  </span><span class="p">],</span>
+<span class="w">  </span><span class="nt">&quot;total&quot;</span><span class="p">:</span><span class="w"> </span><span class="mi">15</span><span class="p">,</span>
+<span class="w">  </span><span class="nt">&quot;page&quot;</span><span class="p">:</span><span class="w"> </span><span class="mi">1</span><span class="p">,</span>
+<span class="w">  </span><span class="nt">&quot;page_size&quot;</span><span class="p">:</span><span class="w"> </span><span class="mi">20</span><span class="p">,</span>
+<span class="w">  </span><span class="nt">&quot;took_ms&quot;</span><span class="p">:</span><span class="w"> </span><span class="mi">42</span>
+<span class="p">}</span>
+</code></pre></div>
+
+<table class="table">
+<thead>
+<tr>
+<th>Field</th>
+<th>Type</th>
+<th>Description</th>
+</tr>
+</thead>
+<tbody>
+<tr>
+<td><code>results</code></td>
+<td>array</td>
+<td>Array of search results</td>
+</tr>
+<tr>
+<td><code>results[].type</code></td>
+<td>string</td>
+<td>Result type: <code>"chunk"</code>, <code>"frame"</code>, or <code>"person"</code></td>
+</tr>
+<tr>
+<td><code>results[].chunk_id</code></td>
+<td>string</td>
+<td>Chunk identifier</td>
+</tr>
+<tr>
+<td><code>results[].chunk_type</code></td>
+<td>string</td>
+<td>Chunk type</td>
+</tr>
+<tr>
+<td><code>results[].file_uuid</code></td>
+<td>string</td>
+<td>File UUID</td>
+</tr>
+<tr>
+<td><code>results[].start_time</code></td>
+<td>float</td>
+<td>Start time in seconds</td>
+</tr>
+<tr>
+<td><code>results[].end_time</code></td>
+<td>float</td>
+<td>End time in seconds</td>
+</tr>
+<tr>
+<td><code>results[].text</code></td>
+<td>string</td>
+<td>Content text</td>
+</tr>
+<tr>
+<td><code>results[].score</code></td>
+<td>float</td>
+<td>Relevance score</td>
+</tr>
+<tr>
+<td><code>total</code></td>
+<td>integer</td>
+<td>Total matching results</td>
+</tr>
+<tr>
+<td><code>page</code></td>
+<td>integer</td>
+<td>Current page</td>
+</tr>
+<tr>
+<td><code>page_size</code></td>
+<td>integer</td>
+<td>Items per page</td>
+</tr>
+<tr>
+<td><code>took_ms</code></td>
+<td>integer</td>
+<td>Query execution time in milliseconds</td>
+</tr>
+</tbody>
+</table>
+<hr />
+<h3>Identity Text Search</h3>
+<p>Two paths for searching identities by text.</p>
+<h4>Path A: <code>GET /api/v1/search/identity_text</code></h4>
+<p>Search chunk text content and return associated identities (if any).</p>
+<p><strong>Auth</strong>: Required
+<strong>Scope</strong>: file-level</p>
+<table class="table">
+<thead>
+<tr>
+<th>Field</th>
+<th>Type</th>
+<th>Required</th>
+<th>Description</th>
+</tr>
+</thead>
+<tbody>
+<tr>
+<td><code>file_uuid</code></td>
+<td>string</td>
+<td>Yes</td>
+<td>File UUID to search within</td>
+</tr>
+<tr>
+<td><code>q</code></td>
+<td>string</td>
+<td>Yes</td>
+<td>Text search query</td>
+</tr>
+<tr>
+<td><code>limit</code></td>
+<td>integer</td>
+<td>No</td>
+<td>Max results (default 50)</td>
+</tr>
+<tr>
+<td><code>page</code></td>
+<td>integer</td>
+<td>No</td>
+<td>Page number (default 1)</td>
+</tr>
+<tr>
+<td><code>page_size</code></td>
+<td>integer</td>
+<td>No</td>
+<td>Items per page (defaults to <code>limit</code>)</td>
+</tr>
+</tbody>
+</table>
+<div class="codehilite"><pre><span></span><code>curl<span class="w"> </span>-s<span class="w"> </span><span class="s2">&quot;</span><span class="nv">$API</span><span class="s2">/api/v1/search/identity_text?file_uuid=</span><span class="nv">$FILE_UUID</span><span class="s2">&amp;q=charade&amp;page=1&amp;page_size=5&quot;</span><span class="w"> </span><span class="se">\</span>
+<span class="w">  </span>-H<span class="w"> </span><span class="s2">&quot;X-API-Key: </span><span class="nv">$KEY</span><span class="s2">&quot;</span>
+</code></pre></div>
+
+<h5>Response</h5>
+<div class="codehilite"><pre><span></span><code><span class="p">{</span>
+<span class="w">  </span><span class="nt">&quot;success&quot;</span><span class="p">:</span><span class="w"> </span><span class="kc">true</span><span class="p">,</span>
+<span class="w">  </span><span class="nt">&quot;total&quot;</span><span class="p">:</span><span class="w"> </span><span class="mi">0</span><span class="p">,</span>
+<span class="w">  </span><span class="nt">&quot;page&quot;</span><span class="p">:</span><span class="w"> </span><span class="mi">1</span><span class="p">,</span>
+<span class="w">  </span><span class="nt">&quot;page_size&quot;</span><span class="p">:</span><span class="w"> </span><span class="mi">5</span><span class="p">,</span>
+<span class="w">  </span><span class="nt">&quot;limit&quot;</span><span class="p">:</span><span class="w"> </span><span class="mi">50</span><span class="p">,</span>
+<span class="w">  </span><span class="nt">&quot;results&quot;</span><span class="p">:</span><span class="w"> </span><span class="p">[]</span>
+<span class="p">}</span>
+</code></pre></div>
+
+<p>Each result (IdentityTextHit):</p>
+<div class="codehilite"><pre><span></span><code><span class="p">{</span>
+<span class="w">  </span><span class="nt">&quot;file_uuid&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;3a6c1865...&quot;</span><span class="p">,</span>
+<span class="w">  </span><span class="nt">&quot;chunk_id&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;sentence_0012&quot;</span><span class="p">,</span>
+<span class="w">  </span><span class="nt">&quot;start_time&quot;</span><span class="p">:</span><span class="w"> </span><span class="mf">48.8</span><span class="p">,</span>
+<span class="w">  </span><span class="nt">&quot;end_time&quot;</span><span class="p">:</span><span class="w"> </span><span class="mf">55.4</span><span class="p">,</span>
+<span class="w">  </span><span class="nt">&quot;text_content&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;charade is a classic film...&quot;</span><span class="p">,</span>
+<span class="w">  </span><span class="nt">&quot;identity_id&quot;</span><span class="p">:</span><span class="w"> </span><span class="mi">42</span><span class="p">,</span>
+<span class="w">  </span><span class="nt">&quot;identity_name&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;Cary Grant&quot;</span><span class="p">,</span>
+<span class="w">  </span><span class="nt">&quot;identity_source&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;tmdb&quot;</span><span class="p">,</span>
+<span class="w">  </span><span class="nt">&quot;trace_id&quot;</span><span class="p">:</span><span class="w"> </span><span class="mi">10</span>
+<span class="p">}</span>
+</code></pre></div>
+
+<table class="table">
+<thead>
+<tr>
+<th>Field</th>
+<th>Type</th>
+<th>Description</th>
+</tr>
+</thead>
+<tbody>
+<tr>
+<td><code>file_uuid</code></td>
+<td>string</td>
+<td>File UUID</td>
+</tr>
+<tr>
+<td><code>chunk_id</code></td>
+<td>string</td>
+<td>Chunk identifier</td>
+</tr>
+<tr>
+<td><code>start_time</code></td>
+<td>float</td>
+<td>Start time in seconds</td>
+</tr>
+<tr>
+<td><code>end_time</code></td>
+<td>float</td>
+<td>End time in seconds</td>
+</tr>
+<tr>
+<td><code>text_content</code></td>
+<td>string</td>
+<td>Chunk text content</td>
+</tr>
+<tr>
+<td><code>identity_id</code></td>
+<td>integer</td>
+<td>Identity ID (null if no identity matched)</td>
+</tr>
+<tr>
+<td><code>identity_name</code></td>
+<td>string</td>
+<td>Identity name (null if no identity matched)</td>
+</tr>
+<tr>
+<td><code>identity_source</code></td>
+<td>string</td>
+<td>Identity origin. <code>.json</code> = established from identity.json files on disk (the unified format for all sources). <code>tmdb</code> = derived from a <code>.json</code> file via the TMDb enrichment probe, then matched against faces. <code>auto</code> = produced by pipeline face matching (only stranger identities are auto-created). <code>user_defined</code> = created manually. <code>merged</code> = produced by merging identities.</td>
+</tr>
+<tr>
+<td><code>trace_id</code></td>
+<td>integer</td>
+<td>Face trace ID (null if no trace matched)</td>
+</tr>
+</tbody>
+</table>
+<h4>Path B: <code>POST /api/v1/identities/search</code></h4>
+<p>Search identity names and return associated face detection text.</p>
+<p><strong>Auth</strong>: Required
+<strong>Scope</strong>: identity-level</p>
+<table class="table">
+<thead>
+<tr>
+<th>Field</th>
+<th>Type</th>
+<th>Required</th>
+<th>Description</th>
+</tr>
+</thead>
+<tbody>
+<tr>
+<td><code>q</code></td>
+<td>string</td>
+<td>Yes</td>
+<td>Identity name search</td>
+</tr>
+<tr>
+<td><code>file_uuid</code></td>
+<td>string</td>
+<td>No</td>
+<td>Restrict to specific file</td>
+</tr>
+<tr>
+<td><code>limit</code></td>
+<td>integer</td>
+<td>No</td>
+<td>Max results (default 50)</td>
+</tr>
+</tbody>
+</table>
+<div class="codehilite"><pre><span></span><code>curl<span class="w"> </span>-s<span class="w"> </span>-X<span class="w"> </span>POST<span class="w"> </span><span class="s2">&quot;</span><span class="nv">$API</span><span class="s2">/api/v1/identities/search&quot;</span><span class="w"> </span><span class="se">\</span>
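+<span class="w">  </span>-H<span class="w"> </span><span class="s2">&quot;X-API-Key: </span><span class="nv">$KEY</span><span class="s2">&quot;</span><span class="w"> </span>-H<span class="w"> </span><span class="s2">&quot;Content-Type: application/json&quot;</span><span class="w"> </span><span class="se">\</span>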
+<span class="w">  </span>-d<span class="w"> </span><span class="s1">&#39;{&quot;q&quot;: &quot;Cary Grant&quot;}&#39;</span>
+</code></pre></div>
+
+<hr />
+<h3>Visual Chunk Search</h3>
+<p>Search video frames by visual content (object detection results).</p>
+<table class="table">
+<thead>
+<tr>
+<th>Method</th>
+<th>Endpoint</th>
+<th>Description</th>
+</tr>
+</thead>
+<tbody>
+<tr>
+<td>POST</td>
+<td><code>/api/v1/search/visual</code></td>
+<td>Search visual chunks by criteria (object classes, density)</td>
+</tr>
+<tr>
+<td>POST</td>
+<td><code>/api/v1/search/visual/class</code></td>
+<td>Search by specific object class</td>
+</tr>
+<tr>
+<td>POST</td>
+<td><code>/api/v1/search/visual/density</code></td>
+<td>Search by spatial density range</td>
+</tr>
+<tr>
+<td>POST</td>
+<td><code>/api/v1/search/visual/stats</code></td>
+<td>Get visual detection statistics</td>
+</tr>
+<tr>
+<td>POST</td>
+<td><code>/api/v1/search/visual/combination</code></td>
+<td>Search by object class combination</td>
+</tr>
+</tbody>
+</table>
+<h4>Request Parameters (Visual Search)</h4>
+<table class="table">
+<thead>
+<tr>
+<th>Field</th>
+<th>Type</th>
+<th>Required</th>
+<th>Description</th>
+</tr>
+</thead>
+<tbody>
+<tr>
+<td><code>file_uuid</code></td>
+<td>string</td>
+<td>Yes</td>
+<td>File UUID</td>
+</tr>
+<tr>
+<td><code>criteria.required_classes</code></td>
+<td>string[]</td>
+<td>No</td>
+<td>Required object classes (e.g., <code>["person", "car"]</code>)</td>
+</tr>
+<tr>
+<td><code>criteria.min_confidence</code></td>
+<td>float</td>
+<td>No</td>
+<td>Minimum confidence threshold</td>
+</tr>
+<tr>
+<td><code>criteria.min_spatial_density</code></td>
+<td>float</td>
+<td>No</td>
+<td>Minimum spatial density</td>
+</tr>
+<tr>
+<td><code>criteria.max_spatial_density</code></td>
+<td>float</td>
+<td>No</td>
+<td>Maximum spatial density</td>
+</tr>
+</tbody>
+</table>
+<h4>Example</h4>
+<div class="codehilite"><pre><span></span><code>curl<span class="w"> </span>-s<span class="w"> </span>-X<span class="w"> </span>POST<span class="w"> </span><span class="s2">&quot;</span><span class="nv">$API</span><span class="s2">/api/v1/search/visual&quot;</span><span class="w"> </span><span class="se">\</span>
+<span class="w">  </span>-H<span class="w"> </span><span class="s2">&quot;X-API-Key: </span><span class="nv">$KEY</span><span class="s2">&quot;</span><span class="w"> </span><span class="se">\</span>
+<span class="w">  </span>-H<span class="w"> </span><span class="s2">&quot;Content-Type: application/json&quot;</span><span class="w"> </span><span class="se">\</span>
+<span class="w">  </span>-d<span class="w"> </span><span class="s1">&#39;{&quot;file_uuid&quot;: &quot;&#39;</span><span class="s2">&quot;</span><span class="nv">$FILE_UUID</span><span class="s2">&quot;</span><span class="s1">&#39;&quot;, &quot;criteria&quot;: {&quot;required_classes&quot;: [&quot;person&quot;, &quot;car&quot;]}}&#39;</span>
+</code></pre></div>
+
+<h4>Response</h4>
+<div class="codehilite"><pre><span></span><code><span class="p">{</span>
+<span class="w">  </span><span class="nt">&quot;chunks&quot;</span><span class="p">:</span><span class="w"> </span><span class="p">[</span>
+<span class="w">    </span><span class="p">{</span>
+<span class="w">      </span><span class="nt">&quot;file_uuid&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;3a6c1865...&quot;</span><span class="p">,</span>
+<span class="w">      </span><span class="nt">&quot;chunk_id&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;visual_001&quot;</span><span class="p">,</span>
+<span class="w">      </span><span class="nt">&quot;chunk_type&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;visual&quot;</span><span class="p">,</span>
+<span class="w">      </span><span class="nt">&quot;detections&quot;</span><span class="p">:</span><span class="w"> </span><span class="p">[</span>
+<span class="w">        </span><span class="p">{</span><span class="nt">&quot;class&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;person&quot;</span><span class="p">,</span><span class="w"> </span><span class="nt">&quot;confidence&quot;</span><span class="p">:</span><span class="w"> </span><span class="mf">0.95</span><span class="p">,</span><span class="w"> </span><span class="nt">&quot;bbox&quot;</span><span class="p">:</span><span class="w"> </span><span class="p">[</span><span class="mi">100</span><span class="p">,</span><span class="w"> </span><span class="mi">200</span><span class="p">,</span><span class="w"> </span><span class="mi">150</span><span class="p">,</span><span class="w"> </span><span class="mi">350</span><span class="p">]}</span>
+<span class="w">      </span><span class="p">],</span>
+<span class="w">      </span><span class="nt">&quot;start_time&quot;</span><span class="p">:</span><span class="w"> </span><span class="mf">120.5</span><span class="p">,</span>
+<span class="w">      </span><span class="nt">&quot;end_time&quot;</span><span class="p">:</span><span class="w"> </span><span class="mf">125.3</span>
+<span class="w">    </span><span class="p">}</span>
+<span class="w">  </span><span class="p">],</span>
+<span class="w">  </span><span class="nt">&quot;total&quot;</span><span class="p">:</span><span class="w"> </span><span class="mi">42</span>
+<span class="p">}</span>
+</code></pre></div>
+
+<table class="table">
+<thead>
+<tr>
+<th>Field</th>
+<th>Type</th>
+<th>Description</th>
+</tr>
+</thead>
+<tbody>
+<tr>
+<td><code>chunks</code></td>
+<td>array</td>
+<td>Array of matching visual chunks</td>
+</tr>
+<tr>
+<td><code>chunks[].file_uuid</code></td>
+<td>string</td>
+<td>File UUID</td>
+</tr>
+<tr>
+<td><code>chunks[].chunk_id</code></td>
+<td>string</td>
+<td>Chunk identifier</td>
+</tr>
+<tr>
+<td><code>chunks[].detections</code></td>
+<td>array</td>
+<td>Object detections in this chunk</td>
+</tr>
+<tr>
+<td><code>total</code></td>
+<td>integer</td>
+<td>Total matching chunks</td>
+</tr>
+</tbody>
+</table>
+<hr />
+<h2>Global Identities</h2>
+<h3><code>GET /api/v1/identities</code></h3>
+<p><strong>Auth</strong>: Required
+<strong>Scope</strong>: identity-level</p>
+<p>List all registered identities with pagination.</p>
+<h4>Example</h4>
+<div class="codehilite"><pre><span></span><code>curl<span class="w"> </span>-s<span class="w"> </span><span class="s2">&quot;</span><span class="nv">$API</span><span class="s2">/api/v1/identities?page=1&amp;page_size=20&quot;</span><span class="w"> </span>-H<span class="w"> </span><span class="s2">&quot;X-API-Key: </span><span class="nv">$KEY</span><span class="s2">&quot;</span><span class="w"> </span><span class="p">|</span><span class="w"> </span>jq<span class="w"> </span><span class="s1">&#39;{count, identities: [.identities[] | {name}]}&#39;</span>
+</code></pre></div>
+
+<hr />
+<h3><code>GET /api/v1/identity/:identity_uuid</code></h3>
+<p><strong>Auth</strong>: Required
+<strong>Scope</strong>: identity-level</p>
+<p>Get detailed information for a specific identity, including metadata and TMDb references.</p>
+<h4>Example</h4>
+<div class="codehilite"><pre><span></span><code>curl<span class="w"> </span>-s<span class="w"> </span><span class="s2">&quot;</span><span class="nv">$API</span><span class="s2">/api/v1/identity/</span><span class="nv">$IDENTITY_UUID</span><span class="s2">&quot;</span><span class="w"> </span>-H<span class="w"> </span><span class="s2">&quot;X-API-Key: </span><span class="nv">$KEY</span><span class="s2">&quot;</span>
+</code></pre></div>
+
+<h4>Response (200)</h4>
+<div class="codehilite"><pre><span></span><code><span class="p">{</span>
+<span class="w">  </span><span class="nt">&quot;success&quot;</span><span class="p">:</span><span class="w"> </span><span class="kc">true</span><span class="p">,</span>
+<span class="w">  </span><span class="nt">&quot;uuid&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;a9a901056d6b46ff92da0c3c1a57dff4&quot;</span><span class="p">,</span>
+<span class="w">  </span><span class="nt">&quot;name&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;Cary Grant&quot;</span><span class="p">,</span>
+<span class="w">  </span><span class="nt">&quot;identity_type&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;people&quot;</span><span class="p">,</span>
+<span class="w">  </span><span class="nt">&quot;source&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;tmdb&quot;</span><span class="p">,</span>
+<span class="w">  </span><span class="nt">&quot;status&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;confirmed&quot;</span><span class="p">,</span>
+<span class="w">  </span><span class="nt">&quot;tmdb_id&quot;</span><span class="p">:</span><span class="w"> </span><span class="mi">112</span><span class="p">,</span>
+<span class="w">  </span><span class="nt">&quot;tmdb_profile&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;https://image.tmdb.org/t/p/w185/abc.jpg&quot;</span><span class="p">,</span>
+<span class="w">  </span><span class="nt">&quot;metadata&quot;</span><span class="p">:</span><span class="w"> </span><span class="p">{},</span>
+<span class="w">  </span><span class="nt">&quot;reference_data&quot;</span><span class="p">:</span><span class="w"> </span><span class="p">{},</span>
+<span class="w">  </span><span class="nt">&quot;created_at&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;2026-05-16T12:00:00Z&quot;</span><span class="p">,</span>
+<span class="w">  </span><span class="nt">&quot;updated_at&quot;</span><span class="p">:</span><span class="w"> </span><span class="kc">null</span>
+<span class="p">}</span>
+</code></pre></div>
+
+<table class="table">
+<thead>
+<tr>
+<th>Field</th>
+<th>Type</th>
+<th>Description</th>
+</tr>
+</thead>
+<tbody>
+<tr>
+<td><code>uuid</code></td>
+<td>string</td>
+<td>32-char hex identity UUID</td>
+</tr>
+<tr>
+<td><code>name</code></td>
+<td>string</td>
+<td>Identity name</td>
+</tr>
+<tr>
+<td><code>identity_type</code></td>
+<td>string</td>
+<td><code>"people"</code> or null</td>
+</tr>
+<tr>
+<td><code>source</code></td>
+<td>string</td>
+<td><code>.json</code>, <code>auto</code>, <code>tmdb</code>, <code>user_defined</code>, or <code>merged</code></td>
+</tr>
+<tr>
+<td><code>status</code></td>
+<td>string</td>
+<td><code>"confirmed"</code>, <code>"pending"</code>, or <code>"inactive"</code></td>
+</tr>
+<tr>
+<td><code>tmdb_id</code></td>
+<td>integer</td>
+<td>TMDb person ID (only if source = tmdb)</td>
+</tr>
+<tr>
+<td><code>tmdb_profile</code></td>
+<td>string</td>
+<td>TMDb profile image URL</td>
+</tr>
+<tr>
+<td><code>metadata</code></td>
+<td>object</td>
+<td>Metadata JSON (tmdb_character, cast_order, etc.)</td>
+</tr>
+<tr>
+<td><code>created_at</code></td>
+<td>string</td>
+<td>Creation timestamp</td>
+</tr>
+</tbody>
+</table>
+<hr />
+<h3><code>DELETE /api/v1/identity/:identity_uuid</code></h3>
+<p><strong>Auth</strong>: Required
+<strong>Scope</strong>: identity-level</p>
+<p>Delete an identity permanently.</p>
+<hr />
+<h3><code>GET /api/v1/identity/:identity_uuid/files</code></h3>
+<p><strong>Auth</strong>: Required
+<strong>Scope</strong>: identity-level</p>
+<p>Get all files where this identity appears. Returns per-file summary including face count, confidence, and appearance time range.</p>
+<h4>Example</h4>
+<div class="codehilite"><pre><span></span><code>curl<span class="w"> </span>-s<span class="w"> </span><span class="s2">&quot;</span><span class="nv">$API</span><span class="s2">/api/v1/identity/</span><span class="nv">$IDENTITY_UUID</span><span class="s2">/files&quot;</span><span class="w"> </span>-H<span class="w"> </span><span class="s2">&quot;X-API-Key: </span><span class="nv">$KEY</span><span class="s2">&quot;</span>
+</code></pre></div>
+
+<hr />
+<h3><code>GET /api/v1/identity/:identity_uuid/faces</code></h3>
+<p><strong>Auth</strong>: Required
+<strong>Scope</strong>: identity-level</p>
+<p>Get all face detection records associated with this identity.</p>
+<h4>Example</h4>
+<div class="codehilite"><pre><span></span><code>curl<span class="w"> </span>-s<span class="w"> </span><span class="s2">&quot;</span><span class="nv">$API</span><span class="s2">/api/v1/identity/</span><span class="nv">$IDENTITY_UUID</span><span class="s2">/faces&quot;</span><span class="w"> </span>-H<span class="w"> </span><span class="s2">&quot;X-API-Key: </span><span class="nv">$KEY</span><span class="s2">&quot;</span>
+</code></pre></div>
+
+<table class="table">
+<thead>
+<tr>
+<th>Field</th>
+<th>Type</th>
+<th>Description</th>
+</tr>
+</thead>
+<tbody>
+<tr>
+<td><code>file_uuid</code></td>
+<td>string</td>
+<td>File UUID where face was detected</td>
+</tr>
+<tr>
+<td><code>frame_number</code></td>
+<td>integer</td>
+<td>Frame number of detection</td>
+</tr>
+<tr>
+<td><code>face_id</code></td>
+<td>string</td>
+<td>Face ID (format: <code>face_{frame_number}</code>)</td>
+</tr>
+<tr>
+<td><code>confidence</code></td>
+<td>float</td>
+<td>Detection confidence</td>
+</tr>
+</tbody>
+</table>
+<hr />
+<h3><code>GET /api/v1/identity/:identity_uuid/chunks</code></h3>
+<p><strong>Auth</strong>: Required
+<strong>Scope</strong>: identity-level</p>
+<p>Get all text chunks (sentences) spoken while this identity's face was on screen. Useful for finding what a person said.</p>
+<h4>Example</h4>
+<div class="codehilite"><pre><span></span><code>curl<span class="w"> </span>-s<span class="w"> </span><span class="s2">&quot;</span><span class="nv">$API</span><span class="s2">/api/v1/identity/</span><span class="nv">$IDENTITY_UUID</span><span class="s2">/chunks&quot;</span><span class="w"> </span>-H<span class="w"> </span><span class="s2">&quot;X-API-Key: </span><span class="nv">$KEY</span><span class="s2">&quot;</span>
+</code></pre></div>
+
+<table class="table">
+<thead>
+<tr>
+<th>Field</th>
+<th>Type</th>
+<th>Description</th>
+</tr>
+</thead>
+<tbody>
+<tr>
+<td><code>file_uuid</code></td>
+<td>string</td>
+<td>File UUID</td>
+</tr>
+<tr>
+<td><code>chunk_id</code></td>
+<td>string</td>
+<td>Sentence chunk identifier</td>
+</tr>
+<tr>
+<td><code>start_time</code></td>
+<td>float</td>
+<td>Start time in seconds</td>
+</tr>
+<tr>
+<td><code>end_time</code></td>
+<td>float</td>
+<td>End time in seconds</td>
+</tr>
+<tr>
+<td><code>text</code></td>
+<td>string</td>
+<td>Spoken text content</td>
+</tr>
+</tbody>
+</table>
+<hr />
+<h3><code>POST /api/v1/identity/:identity_uuid/bind</code></h3>
+<p><strong>Auth</strong>: Required
+<strong>Scope</strong>: identity-level</p>
+<p>Bind a face detection to an identity. Associates the face trace with the identity for future search and recognition.</p>
+<h4>Request Parameters</h4>
+<table class="table">
+<thead>
+<tr>
+<th>Field</th>
+<th>Type</th>
+<th>Required</th>
+<th>Description</th>
+</tr>
+</thead>
+<tbody>
+<tr>
+<td><code>file_uuid</code></td>
+<td>string</td>
+<td>Yes</td>
+<td>File UUID where face is detected</td>
+</tr>
+<tr>
+<td><code>face_id</code></td>
+<td>string</td>
+<td>Yes</td>
+<td>Face ID (format: <code>{frame}_{idx}</code>)</td>
+</tr>
+</tbody>
+</table>
+<h4>Example</h4>
+<div class="codehilite"><pre><span></span><code>curl<span class="w"> </span>-s<span class="w"> </span>-X<span class="w"> </span>POST<span class="w"> </span><span class="s2">&quot;</span><span class="nv">$API</span><span class="s2">/api/v1/identity/</span><span class="nv">$IDENTITY_UUID</span><span class="s2">/bind&quot;</span><span class="w"> </span><span class="se">\</span>
+<span class="w">  </span>-H<span class="w"> </span><span class="s2">&quot;X-API-Key: </span><span class="nv">$KEY</span><span class="s2">&quot;</span><span class="w"> </span><span class="se">\</span>
+<span class="w">  </span>-H<span class="w"> </span><span class="s2">&quot;Content-Type: application/json&quot;</span><span class="w"> </span><span class="se">\</span>
+<span class="w">  </span>-d<span class="w"> </span><span class="s1">&#39;{&quot;file_uuid&quot;: &quot;&#39;</span><span class="s2">&quot;</span><span class="nv">$FILE_UUID</span><span class="s2">&quot;</span><span class="s1">&#39;&quot;, &quot;face_id&quot;: &quot;1_5&quot;}&#39;</span>
+</code></pre></div>
+
+<hr />
+<h3><code>POST /api/v1/identity/:identity_uuid/unbind</code></h3>
+<p><strong>Auth</strong>: Required
+<strong>Scope</strong>: identity-level</p>
+<p>Unbind a face detection from an identity. Removes the identity association from the face record.</p>
+<hr />
+<h3><code>GET /api/v1/identities/search</code></h3>
+<p><strong>Auth</strong>: Required
+<strong>Scope</strong>: identity-level</p>
+<p>Search identities by name (ILIKE search). Returns matching identity records.</p>
+<h4>Example</h4>
+<div class="codehilite"><pre><span></span><code>curl<span class="w"> </span>-s<span class="w"> </span><span class="s2">&quot;</span><span class="nv">$API</span><span class="s2">/api/v1/identities/search?q=Cary&quot;</span><span class="w"> </span>-H<span class="w"> </span><span class="s2">&quot;X-API-Key: </span><span class="nv">$KEY</span><span class="s2">&quot;</span>
+</code></pre></div>
+
+<table class="table">
+<thead>
+<tr>
+<th>Field</th>
+<th>Type</th>
+<th>Description</th>
+</tr>
+</thead>
+<tbody>
+<tr>
+<td><code>name</code></td>
+<td>string</td>
+<td>Identity name</td>
+</tr>
+<tr>
+<td><code>source</code></td>
+<td>string</td>
+<td>Identity source</td>
+</tr>
+<tr>
+<td><code>tmdb_id</code></td>
+<td>integer</td>
+<td>TMDb person ID (if <code>source</code> is <code>tmdb</code>)</td>
+</tr>
+<tr>
+<td><code>file_uuid</code></td>
+<td>string</td>
+<td>Associated file UUID</td>
+</tr>
+</tbody>
+</table>
+<hr />
+
+<h3><code>POST /api/v1/identity/upload</code></h3>
+<p><strong>Auth</strong>: Required
+<strong>Scope</strong>: identity-level</p>
+<p>Upload an <code>identity.json</code> file to create or update an identity. Accepts the same format as the <code>identity.json</code> files stored on disk.</p>
+<p>If an identity with the same <code>name</code> already exists, it will be updated with the new values.</p>
+<h4>Request</h4>
+<p>The request body is an <code>IdentityFile</code> object:</p>
+<table class="table">
+<thead>
+<tr>
+<th>Field</th>
+<th>Type</th>
+<th>Required</th>
+<th>Description</th>
+</tr>
+</thead>
+<tbody>
+<tr>
+<td><code>identity_uuid</code></td>
+<td>string</td>
+<td>Yes</td>
+<td>32-char hex UUID (hyphens allowed, will be stripped)</td>
+</tr>
+<tr>
+<td><code>name</code></td>
+<td>string</td>
+<td>Yes</td>
+<td>Identity display name</td>
+</tr>
+<tr>
+<td><code>identity_type</code></td>
+<td>string</td>
+<td>No</td>
+<td><code>"people"</code> or null</td>
+</tr>
+<tr>
+<td><code>source</code></td>
+<td>string</td>
+<td>No</td>
+<td><code>.json</code>, <code>auto</code>, <code>tmdb</code>, <code>user_defined</code>, or <code>merged</code></td>
+</tr>
+<tr>
+<td><code>status</code></td>
+<td>string</td>
+<td>No</td>
+<td><code>"confirmed"</code>, <code>"pending"</code>, or <code>"inactive"</code></td>
+</tr>
+<tr>
+<td><code>tmdb_id</code></td>
+<td>integer</td>
+<td>No</td>
+<td>TMDb person ID</td>
+</tr>
+<tr>
+<td><code>tmdb_profile</code></td>
+<td>string</td>
+<td>No</td>
+<td>TMDb profile image URL</td>
+</tr>
+<tr>
+<td><code>metadata</code></td>
+<td>object</td>
+<td>No</td>
+<td>Arbitrary metadata JSON</td>
+</tr>
+<tr>
+<td><code>file_bindings</code></td>
+<td>array</td>
+<td>No</td>
+<td>Array of <code>{ file_uuid, trace_ids, face_count }</code> (informational)</td>
+</tr>
+</tbody>
+</table>
+<h4>Example</h4>
+<div class="codehilite"><pre><span></span><code>curl<span class="w"> </span>-s<span class="w"> </span>-X<span class="w"> </span>POST<span class="w"> </span><span class="s2">&quot;</span><span class="nv">$API</span><span class="s2">/api/v1/identity/upload&quot;</span><span class="w"> </span><span class="se">\</span>
+<span class="w">  </span>-H<span class="w"> </span><span class="s2">&quot;X-API-Key: </span><span class="nv">$KEY</span><span class="s2">&quot;</span><span class="w"> </span><span class="se">\</span>
+<span class="w">  </span>-H<span class="w"> </span><span class="s2">&quot;Content-Type: application/json&quot;</span><span class="w"> </span><span class="se">\</span>
+<span class="w">  </span>-d<span class="w"> </span><span class="s1">&#39;{</span>
+<span class="s1">    &quot;version&quot;: 1,</span>
+<span class="s1">    &quot;identity_uuid&quot;: &quot;a9a901056d6b46ff92da0c3c1a57dff4&quot;,</span>
+<span class="s1">    &quot;name&quot;: &quot;Cary Grant&quot;,</span>
+<span class="s1">    &quot;identity_type&quot;: &quot;people&quot;,</span>
+<span class="s1">    &quot;source&quot;: &quot;.json&quot;,</span>
+<span class="s1">    &quot;status&quot;: &quot;confirmed&quot;,</span>
+<span class="s1">    &quot;metadata&quot;: {},</span>
+<span class="s1">    &quot;file_bindings&quot;: []</span>
+<span class="s1">  }&#39;</span>
+</code></pre></div>
+
+<h4>Response (200)</h4>
+<div class="codehilite"><pre><span></span><code><span class="p">{</span>
+<span class="w">  </span><span class="nt">&quot;success&quot;</span><span class="p">:</span><span class="w"> </span><span class="kc">true</span><span class="p">,</span>
+<span class="w">  </span><span class="nt">&quot;identity_uuid&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;a9a901056d6b46ff92da0c3c1a57dff4&quot;</span><span class="p">,</span>
+<span class="w">  </span><span class="nt">&quot;name&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;Cary Grant&quot;</span><span class="p">,</span>
+<span class="w">  </span><span class="nt">&quot;message&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;Identity uploaded successfully&quot;</span>
+<span class="p">}</span>
+</code></pre></div>
+
+<hr />
+
+<h3><code>POST /api/v1/identity/:identity_uuid/profile-image</code></h3>
+<p><strong>Auth</strong>: Required
+<strong>Scope</strong>: identity-level</p>
+<p>Upload a profile image (JPEG or PNG) for an identity. The image is saved to <code>{output}/identities/{uuid}/profile.{ext}</code>.</p>
+<p>Uses <code>multipart/form-data</code> with field name <code>image</code>.</p>
+<h4>Example</h4>
+<div class="codehilite"><pre><span></span><code>curl<span class="w"> </span>-s<span class="w"> </span>-X<span class="w"> </span>POST<span class="w"> </span><span class="s2">&quot;</span><span class="nv">$API</span><span class="s2">/api/v1/identity/</span><span class="nv">$IDENTITY_UUID</span><span class="s2">/profile-image&quot;</span><span class="w"> </span><span class="se">\</span>
+<span class="w">  </span>-H<span class="w"> </span><span class="s2">&quot;X-API-Key: </span><span class="nv">$KEY</span><span class="s2">&quot;</span><span class="w"> </span><span class="se">\</span>
+<span class="w">  </span>-F<span class="w"> </span><span class="s2">&quot;image=@/path/to/photo.jpg&quot;</span>
+</code></pre></div>
+
+<h4>Response (200)</h4>
+<div class="codehilite"><pre><span></span><code><span class="p">{</span>
+<span class="w">  </span><span class="nt">&quot;success&quot;</span><span class="p">:</span><span class="w"> </span><span class="kc">true</span><span class="p">,</span>
+<span class="w">  </span><span class="nt">&quot;identity_uuid&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;a9a901056d6b46ff92da0c3c1a57dff4&quot;</span><span class="p">,</span>
+<span class="w">  </span><span class="nt">&quot;path&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;/path/to/output/identities/.../profile.jpg&quot;</span><span class="p">,</span>
+<span class="w">  </span><span class="nt">&quot;message&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;Profile image saved: profile.jpg&quot;</span>
+<span class="p">}</span>
+</code></pre></div>
+
+<h4>Error Responses</h4>
+<table class="table">
+<thead>
+<tr>
+<th>HTTP</th>
+<th>When</th>
+</tr>
+</thead>
+<tbody>
+<tr>
+<td><code>400</code></td>
+<td>Missing image field or unsupported format</td>
+</tr>
+<tr>
+<td><code>404</code></td>
+<td>Identity not found</td>
+</tr>
+<tr>
+<td><code>415</code></td>
+<td>Unsupported image type (use JPEG or PNG)</td>
+</tr>
+</tbody>
+</table>
+<hr />
+<h3><code>GET /api/v1/identity/:identity_uuid/profile-image</code></h3>
+<p><strong>Auth</strong>: Required
+<strong>Scope</strong>: identity-level</p>
+<p>Retrieve the profile image for an identity. Returns the raw image data with appropriate Content-Type header.</p>
+<div class="codehilite"><pre><span></span><code>curl<span class="w"> </span>-s<span class="w"> </span><span class="s2">&quot;</span><span class="nv">$API</span><span class="s2">/api/v1/identity/</span><span class="nv">$IDENTITY_UUID</span><span class="s2">/profile-image&quot;</span><span class="w"> </span><span class="se">\</span>
+<span class="w">  </span>-H<span class="w"> </span><span class="s2">&quot;X-API-Key: </span><span class="nv">$KEY</span><span class="s2">&quot;</span><span class="w"> </span>-o<span class="w"> </span>profile.jpg
+</code></pre></div>
+
+<table class="table">
+<thead>
+<tr>
+<th>Response Header</th>
+<th>Value</th>
+</tr>
+</thead>
+<tbody>
+<tr>
+<td><code>content-type</code></td>
+<td><code>image/jpeg</code> or <code>image/png</code></td>
+</tr>
+</tbody>
+</table>
+<hr />
+<h3><code>GET /api/v1/signals/unbound</code></h3>
+<p><strong>Auth</strong>: Required
+<strong>Scope</strong>: identity-level</p>
+<p>List unbound face signals — face detections that have not yet been assigned to any identity.</p>
+<h4>Example</h4>
+<div class="codehilite"><pre><span></span><code>curl<span class="w"> </span>-s<span class="w"> </span><span class="s2">&quot;</span><span class="nv">$API</span><span class="s2">/api/v1/signals/unbound&quot;</span><span class="w"> </span>-H<span class="w"> </span><span class="s2">&quot;X-API-Key: </span><span class="nv">$KEY</span><span class="s2">&quot;</span>
+</code></pre></div>
+
+<hr />
+<h2>Identity Agent</h2>
+<h3><code>POST /api/v1/agents/identity/analyze</code></h3>
+<p><strong>Auth</strong>: Required
+<strong>Scope</strong>: file-level</p>
+<p>Run identity matching on a processed file: matches face detection traces against known identities (TMDb, .json, auto) and creates bindings. Optionally uses LLM for enhanced analysis.</p>
+<blockquote>
+<p>Requires the file's face processor to have completed. Will return an error if face traces are not available.</p>
+</blockquote>
+<h4>Request Parameters</h4>
+<table class="table">
+<thead>
+<tr>
+<th>Field</th>
+<th>Type</th>
+<th>Required</th>
+<th>Default</th>
+<th>Description</th>
+</tr>
+</thead>
+<tbody>
+<tr>
+<td><code>file_uuid</code></td>
+<td>string</td>
+<td>Yes</td>
+<td>—</td>
+<td>File UUID to analyze</td>
+</tr>
+<tr>
+<td><code>use_llm</code></td>
+<td>boolean</td>
+<td>No</td>
+<td><code>false</code></td>
+<td>Enable LLM-assisted identity analysis</td>
+</tr>
+<tr>
+<td><code>model</code></td>
+<td>string</td>
+<td>No</td>
+<td>—</td>
+<td>LLM model name (e.g., <code>"gemma4"</code>)</td>
+</tr>
+<tr>
+<td><code>auto_merge_threshold</code></td>
+<td>float</td>
+<td>No</td>
+<td>—</td>
+<td>Confidence threshold (0.0–1.0) for auto-merging</td>
+</tr>
+</tbody>
+</table>
+<h4>Example</h4>
+<div class="codehilite"><pre><span></span><code><span class="c1"># Basic analysis</span>
+curl<span class="w"> </span>-s<span class="w"> </span>-X<span class="w"> </span>POST<span class="w"> </span><span class="s2">&quot;</span><span class="nv">$API</span><span class="s2">/api/v1/agents/identity/analyze&quot;</span><span class="w"> </span><span class="se">\</span>
+<span class="w">  </span>-H<span class="w"> </span><span class="s2">&quot;Content-Type: application/json&quot;</span><span class="w"> </span><span class="se">\</span>
+<span class="w">  </span>-H<span class="w"> </span><span class="s2">&quot;X-API-Key: </span><span class="nv">$KEY</span><span class="s2">&quot;</span><span class="w"> </span><span class="se">\</span>
+<span class="w">  </span>-d<span class="w"> </span><span class="s1">&#39;{&quot;file_uuid&quot;: &quot;&#39;</span><span class="s2">&quot;</span><span class="nv">$FILE_UUID</span><span class="s2">&quot;</span><span class="s1">&#39;&quot;}&#39;</span>
+
+<span class="c1"># With LLM enhancement</span>
+curl<span class="w"> </span>-s<span class="w"> </span>-X<span class="w"> </span>POST<span class="w"> </span><span class="s2">&quot;</span><span class="nv">$API</span><span class="s2">/api/v1/agents/identity/analyze&quot;</span><span class="w"> </span><span class="se">\</span>
+<span class="w">  </span>-H<span class="w"> </span><span class="s2">&quot;Content-Type: application/json&quot;</span><span class="w"> </span><span class="se">\</span>
+<span class="w">  </span>-H<span class="w"> </span><span class="s2">&quot;X-API-Key: </span><span class="nv">$KEY</span><span class="s2">&quot;</span><span class="w"> </span><span class="se">\</span>
+<span class="w">  </span>-d<span class="w"> </span><span class="s1">&#39;{&quot;file_uuid&quot;: &quot;&#39;</span><span class="s2">&quot;</span><span class="nv">$FILE_UUID</span><span class="s2">&quot;</span><span class="s1">&#39;&quot;, &quot;use_llm&quot;: true, &quot;model&quot;: &quot;gemma4&quot;}&#39;</span>
+</code></pre></div>
+
+<h4>Response (200)</h4>
+<div class="codehilite"><pre><span></span><code><span class="p">{</span>
+<span class="w">  </span><span class="nt">&quot;success&quot;</span><span class="p">:</span><span class="w"> </span><span class="kc">true</span><span class="p">,</span>
+<span class="w">  </span><span class="nt">&quot;file_uuid&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;3a6c1865...&quot;</span><span class="p">,</span>
+<span class="w">  </span><span class="nt">&quot;identities&quot;</span><span class="p">:</span><span class="w"> </span><span class="p">[</span>
+<span class="w">    </span><span class="p">{</span>
+<span class="w">      </span><span class="nt">&quot;identity_id&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;a9a901056d6b46ff92da0c3c1a57dff4&quot;</span><span class="p">,</span>
+<span class="w">      </span><span class="nt">&quot;person_ids&quot;</span><span class="p">:</span><span class="w"> </span><span class="p">[</span><span class="s2">&quot;trace_10&quot;</span><span class="p">,</span><span class="w"> </span><span class="s2">&quot;trace_23&quot;</span><span class="p">],</span>
+<span class="w">      </span><span class="nt">&quot;confidence&quot;</span><span class="p">:</span><span class="w"> </span><span class="mf">0.87</span><span class="p">,</span>
+<span class="w">      </span><span class="nt">&quot;matched&quot;</span><span class="p">:</span><span class="w"> </span><span class="kc">true</span><span class="p">,</span>
+<span class="w">      </span><span class="nt">&quot;name&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;Cary Grant&quot;</span><span class="p">,</span>
+<span class="w">      </span><span class="nt">&quot;source&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;tmdb&quot;</span><span class="p">,</span>
+<span class="w">      </span><span class="nt">&quot;stranger&quot;</span><span class="p">:</span><span class="w"> </span><span class="kc">false</span>
+<span class="w">    </span><span class="p">}</span>
+<span class="w">  </span><span class="p">],</span>
+<span class="w">  </span><span class="nt">&quot;processing_status&quot;</span><span class="p">:</span><span class="w"> </span><span class="p">{</span>
+<span class="w">    </span><span class="nt">&quot;phase&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;COMPLETED&quot;</span><span class="p">,</span>
+<span class="w">    </span><span class="nt">&quot;progress&quot;</span><span class="p">:</span><span class="w"> </span><span class="mi">100</span>
+<span class="w">  </span><span class="p">}</span>
+<span class="p">}</span>
+</code></pre></div>
+
+<table class="table">
+<thead>
+<tr>
+<th>Field</th>
+<th>Type</th>
+<th>Description</th>
+</tr>
+</thead>
+<tbody>
+<tr>
+<td><code>success</code></td>
+<td>boolean</td>
+<td>Always true on 200</td>
+</tr>
+<tr>
+<td><code>file_uuid</code></td>
+<td>string</td>
+<td>Analyzed file UUID</td>
+</tr>
+<tr>
+<td><code>identities</code></td>
+<td>array</td>
+<td>Array of matched identity results</td>
+</tr>
+<tr>
+<td><code>identities[].identity_id</code></td>
+<td>string</td>
+<td>32-char identity UUID</td>
+</tr>
+<tr>
+<td><code>identities[].person_ids</code></td>
+<td>string[]</td>
+<td>Matched trace/person IDs</td>
+</tr>
+<tr>
+<td><code>identities[].confidence</code></td>
+<td>float</td>
+<td>Matching confidence (0.0–1.0)</td>
+</tr>
+<tr>
+<td><code>identities[].matched</code></td>
+<td>boolean</td>
+<td>Whether this identity was matched to a known entity</td>
+</tr>
+<tr>
+<td><code>identities[].name</code></td>
+<td>string</td>
+<td>Identity display name</td>
+</tr>
+<tr>
+<td><code>identities[].source</code></td>
+<td>string</td>
+<td>Identity source (<code>.json</code>, <code>auto</code>, <code>tmdb</code>, etc.)</td>
+</tr>
+<tr>
+<td><code>identities[].stranger</code></td>
+<td>boolean</td>
+<td>Whether this is an unmatched stranger trace</td>
+</tr>
+<tr>
+<td><code>processing_status</code></td>
+<td>object</td>
+<td>Identity agent processing progress</td>
+</tr>
+</tbody>
+</table>
+<h4>Error Responses</h4>
+<table class="table">
+<thead>
+<tr>
+<th>HTTP</th>
+<th>When</th>
+</tr>
+</thead>
+<tbody>
+<tr>
+<td><code>400</code></td>
+<td>File UUID not provided or invalid</td>
+</tr>
+<tr>
+<td><code>404</code></td>
+<td>File not found or face processor not completed</td>
+</tr>
+<tr>
+<td><code>500</code></td>
+<td>Analysis failed (LLM error, DB error)</td>
+</tr>
+</tbody>
+</table>
+<hr />
+<h3><code>POST /api/v1/agents/identity/suggest</code></h3>
+<p><strong>Auth</strong>: Required
+<strong>Scope</strong>: identity-level</p>
+<p>Suggest identity merges based on face embedding similarity analysis. Returns pairs of identities that are similar enough to potentially be the same person.</p>
+<h4>Request Parameters</h4>
+<table class="table">
+<thead>
+<tr>
+<th>Field</th>
+<th>Type</th>
+<th>Required</th>
+<th>Default</th>
+<th>Description</th>
+</tr>
+</thead>
+<tbody>
+<tr>
+<td><code>file_uuid</code></td>
+<td>string</td>
+<td>Yes</td>
+<td>—</td>
+<td>File UUID to analyze for merge suggestions</td>
+</tr>
+<tr>
+<td><code>auto_merge_threshold</code></td>
+<td>float</td>
+<td>No</td>
+<td>—</td>
+<td>Confidence threshold for auto-suggest</td>
+</tr>
+</tbody>
+</table>
+<div class="codehilite"><pre><span></span><code>curl<span class="w"> </span>-s<span class="w"> </span>-X<span class="w"> </span>POST<span class="w"> </span><span class="s2">&quot;</span><span class="nv">$API</span><span class="s2">/api/v1/agents/identity/suggest&quot;</span><span class="w"> </span><span class="se">\</span>
+<span class="w">  </span>-H<span class="w"> </span><span class="s2">&quot;X-API-Key: </span><span class="nv">$KEY</span><span class="s2">&quot;</span><span class="w"> </span><span class="se">\</span>
+<span class="w">  </span>-H<span class="w"> </span><span class="s2">&quot;Content-Type: application/json&quot;</span><span class="w"> </span><span class="se">\</span>
+<span class="w">  </span>-d<span class="w"> </span><span class="s1">&#39;{&quot;file_uuid&quot;: &quot;&#39;</span><span class="s2">&quot;</span><span class="nv">$FILE_UUID</span><span class="s2">&quot;</span><span class="s1">&#39;&quot;}&#39;</span>
+</code></pre></div>
+
+<hr />
+<h3><code>GET /api/v1/agents/identity/status</code></h3>
+<p><strong>Auth</strong>: Required
+<strong>Scope</strong>: system-level</p>
+<p>Get the identity agent processing status for a file. Shows current phase and progress.</p>
+<div class="codehilite"><pre><span></span><code>curl<span class="w"> </span>-s<span class="w"> </span><span class="s2">&quot;</span><span class="nv">$API</span><span class="s2">/api/v1/agents/identity/status?file_uuid=</span><span class="nv">$FILE_UUID</span><span class="s2">&quot;</span><span class="w"> </span><span class="se">\</span>
+<span class="w">  </span>-H<span class="w"> </span><span class="s2">&quot;X-API-Key: </span><span class="nv">$KEY</span><span class="s2">&quot;</span>
+</code></pre></div>
+
+<hr />
+<h3><code>POST /api/v1/agents/suggest/merge</code></h3>
+<p><strong>Auth</strong>: Required
+<strong>Scope</strong>: identity-level</p>
+<p>Execute a suggested identity merge. Combines two identities into one, consolidating their face bindings.</p>
+<h4>Request Parameters</h4>
+<table class="table">
+<thead>
+<tr>
+<th>Field</th>
+<th>Type</th>
+<th>Required</th>
+<th>Description</th>
+</tr>
+</thead>
+<tbody>
+<tr>
+<td><code>source_uuid</code></td>
+<td>string</td>
+<td>Yes</td>
+<td>Identity UUID to merge FROM (will be removed)</td>
+</tr>
+<tr>
+<td><code>target_uuid</code></td>
+<td>string</td>
+<td>Yes</td>
+<td>Identity UUID to merge INTO (will be kept)</td>
+</tr>
+</tbody>
+</table>
+<div class="codehilite"><pre><span></span><code>curl<span class="w"> </span>-s<span class="w"> </span>-X<span class="w"> </span>POST<span class="w"> </span><span class="s2">&quot;</span><span class="nv">$API</span><span class="s2">/api/v1/agents/suggest/merge&quot;</span><span class="w"> </span><span class="se">\</span>
+<span class="w">  </span>-H<span class="w"> </span><span class="s2">&quot;X-API-Key: </span><span class="nv">$KEY</span><span class="s2">&quot;</span><span class="w"> </span><span class="se">\</span>
+<span class="w">  </span>-H<span class="w"> </span><span class="s2">&quot;Content-Type: application/json&quot;</span><span class="w"> </span><span class="se">\</span>
+<span class="w">  </span>-d<span class="w"> </span><span class="s1">&#39;{&quot;source_uuid&quot;: &quot;uuid_to_discard&quot;, &quot;target_uuid&quot;: &quot;uuid_to_keep&quot;}&#39;</span>
+</code></pre></div>
+
+<hr />
+<h3><code>POST /api/v1/agents/suggest/clustering</code></h3>
+<p><strong>Auth</strong>: Required
+<strong>Scope</strong>: identity-level</p>
+<p>Suggest face clusters for a file. Analyzes all face embeddings in the file and groups similar faces into candidate identity clusters.</p>
+<div class="codehilite"><pre><span></span><code>curl<span class="w"> </span>-s<span class="w"> </span>-X<span class="w"> </span>POST<span class="w"> </span><span class="s2">&quot;</span><span class="nv">$API</span><span class="s2">/api/v1/agents/suggest/clustering&quot;</span><span class="w"> </span><span class="se">\</span>
+<span class="w">  </span>-H<span class="w"> </span><span class="s2">&quot;X-API-Key: </span><span class="nv">$KEY</span><span class="s2">&quot;</span><span class="w"> </span><span class="se">\</span>
+<span class="w">  </span>-H<span class="w"> </span><span class="s2">&quot;Content-Type: application/json&quot;</span><span class="w"> </span><span class="se">\</span>
+<span class="w">  </span>-d<span class="w"> </span><span class="s1">&#39;{&quot;file_uuid&quot;: &quot;&#39;</span><span class="s2">&quot;</span><span class="nv">$FILE_UUID</span><span class="s2">&quot;</span><span class="s1">&#39;&quot;}&#39;</span>
+</code></pre></div>
+
+<hr />
+<h2>TMDb Enrichment</h2>
+<blockquote>
+<p>⚠️ <strong>External resource</strong>: TMDb requires internet access, violating Momentry's local-only principle.
+All core processing (ASR, YOLO, Face, OCR, Pose, embeddings) runs fully offline.
+TMDb enrichment is <strong>optional</strong> and gated behind <code>TMDB_API_KEY</code> + <code>MOMENTRY_TMDB_PROBE_ENABLED</code>.</p>
+</blockquote>
+<h3>Overview</h3>
+<p>TMDb enrichment is an optional identity enrichment step that can be run after Pipeline face detection completes. The workflow is:</p>
+<ol>
+<li><strong>Prefetch</strong> (requires internet): Download movie cast data from TMDb API → cache to <code>{file_uuid}.tmdb.json</code></li>
+<li><strong>Probe</strong>: Read local cache → create identities for <strong>all</strong> cast members (<code>source='tmdb'</code>) + save <code>identity.json</code> + download profile image to <code>{OUTPUT}/identities/{uuid}/profile.jpg</code></li>
+<li><strong>Match</strong>: The worker automatically matches video faces against TMDb identities when <code>MOMENTRY_TMDB_PROBE_ENABLED=true</code></li>
+</ol>
+<h3><code>POST /api/v1/agents/tmdb/prefetch</code></h3>
+<p><strong>Auth</strong>: Required
+<strong>Scope</strong>: file-level</p>
+<p>Fetch TMDb cast data for a registered file and cache it locally. This is the only step requiring internet access.</p>
+<h4>Request Parameters</h4>
+<table class="table">
+<thead>
+<tr>
+<th>Field</th>
+<th>Type</th>
+<th>Required</th>
+<th>Description</th>
+</tr>
+</thead>
+<tbody>
+<tr>
+<td><code>file_uuid</code></td>
+<td>string</td>
+<td>Yes</td>
+<td>File UUID to enrich</td>
+</tr>
+</tbody>
+</table>
+<h4>Example</h4>
+<div class="codehilite"><pre><span></span><code>curl<span class="w"> </span>-s<span class="w"> </span>-X<span class="w"> </span>POST<span class="w"> </span><span class="s2">&quot;</span><span class="nv">$API</span><span class="s2">/api/v1/agents/tmdb/prefetch&quot;</span><span class="w"> </span><span class="se">\</span>
+<span class="w">  </span>-H<span class="w"> </span><span class="s2">&quot;Content-Type: application/json&quot;</span><span class="w"> </span><span class="se">\</span>
+<span class="w">  </span>-H<span class="w"> </span><span class="s2">&quot;X-API-Key: </span><span class="nv">$KEY</span><span class="s2">&quot;</span><span class="w"> </span><span class="se">\</span>
+<span class="w">  </span>-d<span class="w"> </span><span class="s1">&#39;{&quot;file_uuid&quot;: &quot;&#39;</span><span class="s2">&quot;</span><span class="nv">$FILE_UUID</span><span class="s2">&quot;</span><span class="s1">&#39;&quot;}&#39;</span>
+</code></pre></div>
+
+<h4>Response (200)</h4>
+<div class="codehilite"><pre><span></span><code><span class="p">{</span><span class="nt">&quot;success&quot;</span><span class="p">:</span><span class="w"> </span><span class="kc">true</span><span class="p">,</span><span class="w"> </span><span class="nt">&quot;file_uuid&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;...&quot;</span><span class="p">,</span><span class="w"> </span><span class="nt">&quot;cache_path&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;/output/...tmdb.json&quot;</span><span class="p">}</span>
+</code></pre></div>
+
+<h3><code>POST /api/v1/file/:file_uuid/tmdb-probe</code></h3>
+<p><strong>Auth</strong>: Required
+<strong>Scope</strong>: file-level</p>
+<p>Read the local TMDb cache and create/update identities. Requires <code>POST /api/v1/agents/tmdb/prefetch</code> to have been run first for the same file.</p>
+<h4>Example</h4>
+<div class="codehilite"><pre><span></span><code>curl<span class="w"> </span>-s<span class="w"> </span>-X<span class="w"> </span>POST<span class="w"> </span><span class="s2">&quot;</span><span class="nv">$API</span><span class="s2">/api/v1/file/</span><span class="nv">$FILE_UUID</span><span class="s2">/tmdb-probe&quot;</span><span class="w"> </span><span class="se">\</span>
+<span class="w">  </span>-H<span class="w"> </span><span class="s2">&quot;X-API-Key: </span><span class="nv">$KEY</span><span class="s2">&quot;</span><span class="w"> </span><span class="p">|</span><span class="w"> </span>jq<span class="w"> </span><span class="s1">&#39;{identities_created, movie_title}&#39;</span>
+</code></pre></div>
+
+<h4>Response (200 — identities created)</h4>
+<div class="codehilite"><pre><span></span><code><span class="p">{</span><span class="nt">&quot;success&quot;</span><span class="p">:</span><span class="w"> </span><span class="kc">true</span><span class="p">,</span><span class="w"> </span><span class="nt">&quot;identities_created&quot;</span><span class="p">:</span><span class="w"> </span><span class="mi">15</span><span class="p">,</span><span class="w"> </span><span class="nt">&quot;movie_title&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;Charade&quot;</span><span class="p">}</span>
+</code></pre></div>
+
+<h4>Response (200 — no cache)</h4>
+<div class="codehilite"><pre><span></span><code><span class="p">{</span><span class="nt">&quot;success&quot;</span><span class="p">:</span><span class="w"> </span><span class="kc">false</span><span class="p">,</span><span class="w"> </span><span class="nt">&quot;message&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;No TMDb cache found. Run tmdb-prefetch first.&quot;</span><span class="p">}</span>
+</code></pre></div>
+
+<h3><code>GET /api/v1/resource/tmdb</code></h3>
+<p><strong>Auth</strong>: Required
+<strong>Scope</strong>: system-level</p>
+<p>View TMDb resource status including configuration, identity counts, and cache file count.</p>
+<h4>Example</h4>
+<div class="codehilite"><pre><span></span><code>curl<span class="w"> </span>-s<span class="w"> </span><span class="s2">&quot;</span><span class="nv">$API</span><span class="s2">/api/v1/resource/tmdb&quot;</span><span class="w"> </span>-H<span class="w"> </span><span class="s2">&quot;X-API-Key: </span><span class="nv">$KEY</span><span class="s2">&quot;</span><span class="w"> </span><span class="se">\</span>
+<span class="w">  </span><span class="p">|</span><span class="w"> </span>jq<span class="w"> </span><span class="s1">&#39;{identities_seeded, cache_files}&#39;</span>
+</code></pre></div>
+
+<h3><code>POST /api/v1/resource/tmdb/check</code></h3>
+<p><strong>Auth</strong>: Required
+<strong>Scope</strong>: system-level</p>
+<p>Ping the TMDb API to verify connectivity and measure latency.</p>
+<h4>Example</h4>
+<div class="codehilite"><pre><span></span><code>curl<span class="w"> </span>-s<span class="w"> </span>-X<span class="w"> </span>POST<span class="w"> </span><span class="s2">&quot;</span><span class="nv">$API</span><span class="s2">/api/v1/resource/tmdb/check&quot;</span><span class="w"> </span><span class="se">\</span>
+<span class="w">  </span>-H<span class="w"> </span><span class="s2">&quot;X-API-Key: </span><span class="nv">$KEY</span><span class="s2">&quot;</span><span class="w"> </span><span class="p">|</span><span class="w"> </span>jq<span class="w"> </span><span class="s1">&#39;.status&#39;</span>
+</code></pre></div>
+
+<h4>Response</h4>
+<div class="codehilite"><pre><span></span><code><span class="p">{</span>
+<span class="w">  </span><span class="nt">&quot;api_key_configured&quot;</span><span class="p">:</span><span class="w"> </span><span class="kc">true</span><span class="p">,</span>
+<span class="w">  </span><span class="nt">&quot;enabled&quot;</span><span class="p">:</span><span class="w"> </span><span class="kc">false</span><span class="p">,</span>
+<span class="w">  </span><span class="nt">&quot;api_reachable&quot;</span><span class="p">:</span><span class="w"> </span><span class="kc">true</span><span class="p">,</span>
+<span class="w">  </span><span class="nt">&quot;api_latency_ms&quot;</span><span class="p">:</span><span class="w"> </span><span class="mi">120</span>
+<span class="p">}</span>
+</code></pre></div>
+
+<hr />
+<h2>Stats &amp; Pipeline</h2>
+<h3>Stats Endpoints</h3>
+<table class="table">
+<thead>
+<tr>
+<th>Method</th>
+<th>Endpoint</th>
+<th>Auth</th>
+<th>Description</th>
+</tr>
+</thead>
+<tbody>
+<tr>
+<td>GET</td>
+<td><code>/api/v1/stats/ingest</code></td>
+<td>No</td>
+<td>Ingest statistics</td>
+</tr>
+<tr>
+<td>GET</td>
+<td><code>/api/v1/stats/sftpgo</code></td>
+<td>No</td>
+<td>SFTPGo service status</td>
+</tr>
+<tr>
+<td>GET</td>
+<td><code>/api/v1/stats/inference</code></td>
+<td>No</td>
+<td>Inference service health</td>
+</tr>
+</tbody>
+</table>
+<h3>Configuration</h3>
+<h3><code>POST /api/v1/config/cache</code></h3>
+<p><strong>Auth</strong>: Required
+<strong>Scope</strong>: system-level</p>
+<p>Toggle the Redis cache on or off.</p>
+<h4>Request Parameters</h4>
+<table class="table">
+<thead>
+<tr>
+<th>Field</th>
+<th>Type</th>
+<th>Required</th>
+<th>Description</th>
+</tr>
+</thead>
+<tbody>
+<tr>
+<td><code>enabled</code></td>
+<td>boolean</td>
+<td>Yes</td>
+<td><code>true</code> to enable, <code>false</code> to disable</td>
+</tr>
+</tbody>
+</table>
+<h4>Example</h4>
+<div class="codehilite"><pre><span></span><code>curl<span class="w"> </span>-s<span class="w"> </span>-X<span class="w"> </span>POST<span class="w"> </span><span class="s2">&quot;</span><span class="nv">$API</span><span class="s2">/api/v1/config/cache&quot;</span><span class="w"> </span><span class="se">\</span>
+<span class="w">  </span>-H<span class="w"> </span><span class="s2">&quot;Content-Type: application/json&quot;</span><span class="w"> </span><span class="se">\</span>
+<span class="w">  </span>-H<span class="w"> </span><span class="s2">&quot;X-API-Key: </span><span class="nv">$KEY</span><span class="s2">&quot;</span><span class="w"> </span><span class="se">\</span>
+<span class="w">  </span>-d<span class="w"> </span><span class="s1">&#39;{&quot;enabled&quot;: false}&#39;</span>
+</code></pre></div>
+
+<h3>Unmounted Routes</h3>
+<p>The following routes are defined in source code but are <strong>NOT</strong> currently mounted in the router:</p>
+<table class="table">
+<thead>
+<tr>
+<th>Endpoint</th>
+<th>Source file</th>
+</tr>
+</thead>
+<tbody>
+<tr>
+<td><code>/api/v1/search/universal</code></td>
+<td><code>universal_search.rs</code></td>
+</tr>
+<tr>
+<td><code>/api/v1/search/frames</code></td>
+<td><code>universal_search.rs</code></td>
+</tr>
+<tr>
+<td><code>/api/v1/search/persons</code></td>
+<td><code>universal_search.rs</code></td>
+</tr>
+<tr>
+<td><code>/api/v1/who</code></td>
+<td><code>who.rs</code></td>
+</tr>
+<tr>
+<td><code>/api/v1/who/candidates</code></td>
+<td><code>who.rs</code></td>
+</tr>
+</tbody>
+</table>
+<hr />
+<h2>Error Response Format</h2>
+<p>All API errors follow this JSON structure:</p>
+<div class="codehilite"><pre><span></span><code><span class="p">{</span>
+<span class="w">  </span><span class="nt">&quot;success&quot;</span><span class="p">:</span><span class="w"> </span><span class="kc">false</span><span class="p">,</span>
+<span class="w">  </span><span class="nt">&quot;error&quot;</span><span class="p">:</span><span class="w"> </span><span class="p">{</span>
+<span class="w">    </span><span class="nt">&quot;code&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;E001_NOT_FOUND&quot;</span><span class="p">,</span>
+<span class="w">    </span><span class="nt">&quot;message&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;Resource not found&quot;</span><span class="p">,</span>
+<span class="w">    </span><span class="nt">&quot;details&quot;</span><span class="p">:</span><span class="w"> </span><span class="p">{</span><span class="nt">&quot;resource&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;file_uuid&quot;</span><span class="p">,</span><span class="w"> </span><span class="nt">&quot;value&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;abc&quot;</span><span class="p">}</span>
+<span class="w">  </span><span class="p">}</span>
+<span class="p">}</span>
+</code></pre></div>
+
+<h2>Error Code List</h2>
+<h3>Generic Errors (E0xx)</h3>
+<table class="table">
+<thead>
+<tr>
+<th>Code</th>
+<th>HTTP</th>
+<th>Description</th>
+</tr>
+</thead>
+<tbody>
+<tr>
+<td><code>E001_NOT_FOUND</code></td>
+<td>404</td>
+<td>Resource not found (file, identity, chunk)</td>
+</tr>
+<tr>
+<td><code>E002_DUPLICATE</code></td>
+<td>409</td>
+<td>Resource already exists</td>
+</tr>
+<tr>
+<td><code>E003_VALIDATION</code></td>
+<td>400</td>
+<td>Request parameter validation failed</td>
+</tr>
+<tr>
+<td><code>E004_UNAUTHORIZED</code></td>
+<td>401</td>
+<td>Invalid API key or token</td>
+</tr>
+<tr>
+<td><code>E005_INTERNAL</code></td>
+<td>500</td>
+<td>Internal server error</td>
+</tr>
+</tbody>
+</table>
+<h3>Processor Errors (E1xx)</h3>
+<table class="table">
+<thead>
+<tr>
+<th>Code</th>
+<th>HTTP</th>
+<th>Description</th>
+</tr>
+</thead>
+<tbody>
+<tr>
+<td><code>E101_PROCESSOR_FAIL</code></td>
+<td>500</td>
+<td>Python script execution failed</td>
+</tr>
+<tr>
+<td><code>E102_TIMEOUT</code></td>
+<td>504</td>
+<td>Processing timeout</td>
+</tr>
+<tr>
+<td><code>E103_RESUME_FAIL</code></td>
+<td>500</td>
+<td>Resume failed (checkpoint not found)</td>
+</tr>
+<tr>
+<td><code>E104_NO_VIDEO</code></td>
+<td>400</td>
+<td>Video file path not found</td>
+</tr>
+</tbody>
+</table>
+<h3>Identity Errors (E2xx)</h3>
+<table class="table">
+<thead>
+<tr>
+<th>Code</th>
+<th>HTTP</th>
+<th>Description</th>
+</tr>
+</thead>
+<tbody>
+<tr>
+<td><code>E201_FACE_NOT_FOUND</code></td>
+<td>404</td>
+<td>Face detection not found</td>
+</tr>
+<tr>
+<td><code>E202_MERGE_CONFLICT</code></td>
+<td>409</td>
+<td>Identity merge conflict</td>
+</tr>
+<tr>
+<td><code>E203_CANDIDATE_EMPTY</code></td>
+<td>404</td>
+<td>No candidates available for confirmation</td>
+</tr>
+</tbody>
+</table>
+<h3>TMDb Errors (E3xx)</h3>
+<table class="table">
+<thead>
+<tr>
+<th>Code</th>
+<th>HTTP</th>
+<th>Description</th>
+</tr>
+</thead>
+<tbody>
+<tr>
+<td><code>E301_TMDB_NO_KEY</code></td>
+<td>400</td>
+<td><code>TMDB_API_KEY</code> environment variable not set</td>
+</tr>
+<tr>
+<td><code>E302_TMDB_UNREACHABLE</code></td>
+<td>502</td>
+<td>TMDb API unreachable or timed out</td>
+</tr>
+<tr>
+<td><code>E303_TMDB_CACHE_NOT_FOUND</code></td>
+<td>200</td>
+<td>No local TMDb cache; run prefetch first</td>
+</tr>
+<tr>
+<td><code>E304_TMDB_PROBE_FAILED</code></td>
+<td>500</td>
+<td>TMDb probe execution failed</td>
+</tr>
+<tr>
+<td><code>E305_TMDB_MOVIE_NOT_FOUND</code></td>
+<td>404</td>
+<td>No matching TMDb movie found from filename</td>
+</tr>
+</tbody>
+</table>
+<hr />
+<h1>Agent Endpoints</h1>
+<p>Agent endpoints provide AI-powered capabilities including translation, identity analysis, and 5W1H extraction.</p>
+<h2>POST /api/v1/agents/translate</h2>
+<p>Translate text between languages using Gemma4 (llama.cpp, port 8082).</p>
+<h3>Request</h3>
+<div class="codehilite"><pre><span></span><code><span class="p">{</span>
+<span class="w">  </span><span class="nt">&quot;text&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;Hello, welcome to Momentry Core.&quot;</span><span class="p">,</span>
+<span class="w">  </span><span class="nt">&quot;target_language&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;Traditional Chinese&quot;</span><span class="p">,</span>
+<span class="w">  </span><span class="nt">&quot;source_language&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;English&quot;</span>
+<span class="p">}</span>
+</code></pre></div>
+
+<table class="table">
+<thead>
+<tr>
+<th>Field</th>
+<th>Type</th>
+<th>Required</th>
+<th>Description</th>
+</tr>
+</thead>
+<tbody>
+<tr>
+<td><code>text</code></td>
+<td>string</td>
+<td>✅</td>
+<td>Text to translate</td>
+</tr>
+<tr>
+<td><code>target_language</code></td>
+<td>string</td>
+<td>✅</td>
+<td>Target language name (e.g. "Traditional Chinese", "Japanese")</td>
+</tr>
+<tr>
+<td><code>source_language</code></td>
+<td>string</td>
+<td>❌</td>
+<td>Source language (default: "auto")</td>
+</tr>
+</tbody>
+</table>
+<h3>Response</h3>
+<div class="codehilite"><pre><span></span><code><span class="p">{</span>
+<span class="w">  </span><span class="nt">&quot;success&quot;</span><span class="p">:</span><span class="w"> </span><span class="kc">true</span><span class="p">,</span>
+<span class="w">  </span><span class="nt">&quot;translated_text&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;您好，歡迎使用 Momentry Core。&quot;</span><span class="p">,</span>
+<span class="w">  </span><span class="nt">&quot;source_language_detected&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;English&quot;</span><span class="p">,</span>
+<span class="w">  </span><span class="nt">&quot;model_used&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;google_gemma-4-26B-A4B-it-Q5_K_M.gguf&quot;</span>
+<span class="p">}</span>
+</code></pre></div>
+
+<h3>Supported Language Pairs (tested)</h3>
+<table class="table">
+<thead>
+<tr>
+<th>Source</th>
+<th>Target</th>
+<th>Quality</th>
+</tr>
+</thead>
+<tbody>
+<tr>
+<td>English</td>
+<td>Traditional Chinese</td>
+<td>✅</td>
+</tr>
+<tr>
+<td>English</td>
+<td>Japanese</td>
+<td>✅</td>
+</tr>
+<tr>
+<td>Chinese</td>
+<td>English</td>
+<td>✅</td>
+</tr>
+<tr>
+<td>English</td>
+<td>French</td>
+<td>✅</td>
+</tr>
+<tr>
+<td>Chinese</td>
+<td>Japanese</td>
+<td>✅</td>
+</tr>
+</tbody>
+</table>
+<h3>Model</h3>
+<ul>
+<li><strong>Model</strong>: Gemma4 26B (Q5_K_M)</li>
+<li><strong>Engine</strong>: llama.cpp at <code>localhost:8082</code></li>
+<li><strong>Endpoint</strong>: <code>/v1/chat/completions</code> (OpenAI-compatible)</li>
+<li><strong>Temperature</strong>: 0.1</li>
+<li><strong>Max tokens</strong>: 1024</li>
+</ul>
+<h3>Errors</h3>
+<table class="table">
+<thead>
+<tr>
+<th>Status</th>
+<th>Condition</th>
+</tr>
+</thead>
+<tbody>
+<tr>
+<td>500</td>
+<td>LLM unreachable or response parse failure</td>
+</tr>
+<tr>
+<td>401</td>
+<td>Missing/invalid auth</td>
+</tr>
+</tbody>
+</table>
+<h2>GET /api/v1/agents/identity/status</h2>
+<p>Get status of the identity agent pipeline.</p>
+<h3>Response</h3>
+<div class="codehilite"><pre><span></span><code><span class="p">{</span>
+<span class="w">  </span><span class="nt">&quot;status&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;idle&quot;</span><span class="p">,</span>
+<span class="w">  </span><span class="nt">&quot;last_analysis&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;2026-05-17T12:00:00Z&quot;</span><span class="p">,</span>
+<span class="w">  </span><span class="nt">&quot;identities_processed&quot;</span><span class="p">:</span><span class="w"> </span><span class="mi">27</span>
+<span class="p">}</span>
+</code></pre></div>
+
+<h2>POST /api/v1/agents/suggest/clustering</h2>
+<p>Run face clustering to suggest new identity groupings.</p>
+<h3>Request</h3>
+<div class="codehilite"><pre><span></span><code><span class="p">{</span>
+<span class="w">  </span><span class="nt">&quot;file_uuid&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;3abeee81d94597629ed8cb943f182e94&quot;</span>
+<span class="p">}</span>
+</code></pre></div>
+
+<h2>POST /api/v1/agents/suggest/merge</h2>
+<p>Merge two identities into one.</p>
+<h3>Request</h3>
+<div class="codehilite"><pre><span></span><code><span class="p">{</span>
+<span class="w">  </span><span class="nt">&quot;from_uuid&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;...&quot;</span><span class="p">,</span>
+<span class="w">  </span><span class="nt">&quot;into_uuid&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;...&quot;</span>
+<span class="p">}</span>
+</code></pre></div>
+
+<h2>POST /api/v1/agents/5w1h/analyze</h2>
+<p>Extract 5W1H (Who, What, When, Where, Why, How) from video chunk text.</p>
+<h3>Request</h3>
+<div class="codehilite"><pre><span></span><code><span class="p">{</span>
+<span class="w">  </span><span class="nt">&quot;chunk_id&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;chunk_42&quot;</span><span class="p">,</span>
+<span class="w">  </span><span class="nt">&quot;file_uuid&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;3abeee81d94597629ed8cb943f182e94&quot;</span>
+<span class="p">}</span>
+</code></pre></div>
+
+<h3>Response</h3>
+<div class="codehilite"><pre><span></span><code><span class="p">{</span>
+<span class="w">  </span><span class="nt">&quot;success&quot;</span><span class="p">:</span><span class="w"> </span><span class="kc">true</span><span class="p">,</span>
+<span class="w">  </span><span class="nt">&quot;5w1h&quot;</span><span class="p">:</span><span class="w"> </span><span class="p">{</span>
+<span class="w">    </span><span class="nt">&quot;who&quot;</span><span class="p">:</span><span class="w"> </span><span class="p">[</span><span class="s2">&quot;Cary Grant&quot;</span><span class="p">],</span>
+<span class="w">    </span><span class="nt">&quot;what&quot;</span><span class="p">:</span><span class="w"> </span><span class="p">[</span><span class="s2">&quot;discussing plans&quot;</span><span class="p">],</span>
+<span class="w">    </span><span class="nt">&quot;when&quot;</span><span class="p">:</span><span class="w"> </span><span class="p">[</span><span class="s2">&quot;1963&quot;</span><span class="p">],</span>
+<span class="w">    </span><span class="nt">&quot;where&quot;</span><span class="p">:</span><span class="w"> </span><span class="p">[</span><span class="s2">&quot;Paris&quot;</span><span class="p">],</span>
+<span class="w">    </span><span class="nt">&quot;why&quot;</span><span class="p">:</span><span class="w"> </span><span class="p">[</span><span class="s2">&quot;vacation&quot;</span><span class="p">],</span>
+<span class="w">    </span><span class="nt">&quot;how&quot;</span><span class="p">:</span><span class="w"> </span><span class="p">[</span><span class="s2">&quot;in person&quot;</span><span class="p">]</span>
+<span class="w">  </span><span class="p">}</span>
+<span class="p">}</span>
+</code></pre></div>
+
+<h2>POST /api/v1/agents/5w1h/batch</h2>
+<p>Batch analyze multiple chunks for 5W1H extraction.</p>
+<h3>Request</h3>
+<div class="codehilite"><pre><span></span><code><span class="p">{</span>
+<span class="w">  </span><span class="nt">&quot;file_uuid&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;3abeee81d94597629ed8cb943f182e94&quot;</span><span class="p">,</span>
+<span class="w">  </span><span class="nt">&quot;chunk_ids&quot;</span><span class="p">:</span><span class="w"> </span><span class="p">[</span><span class="s2">&quot;chunk_1&quot;</span><span class="p">,</span><span class="w"> </span><span class="s2">&quot;chunk_2&quot;</span><span class="p">,</span><span class="w"> </span><span class="s2">&quot;chunk_3&quot;</span><span class="p">]</span>
+<span class="p">}</span>
+</code></pre></div>
+
+<h2>GET /api/v1/agents/5w1h/status</h2>
+<p>Get status of the 5W1H agent pipeline.</p>
+<hr />
+</div>
+</body>
+</html>
\ No newline at end of file
diff --git a/docs_v1.0/doc_user/API_TRAINING_MARCOM.html b/docs_v1.0/doc_user/API_TRAINING_MARCOM.html
new file mode 100644
index 0000000..e0f78d0
--- /dev/null
+++ b/docs_v1.0/doc_user/API_TRAINING_MARCOM.html
@@ -0,0 +1,1603 @@
+<!DOCTYPE html>
+<html lang="en">
+<head>
+<meta charset="UTF-8">
+<title>API Training Marcom - Momentry API Docs</title>
+<style>
+* { margin: 0; padding: 0; box-sizing: border-box; }
+body { font-family: -apple-system, BlinkMacSystemFont, 'Segoe UI', Roboto, sans-serif; background: #f5f5f5; color: #333; padding: 40px; }
+.container { max-width: 960px; margin: 0 auto; background: white; border-radius: 12px; box-shadow: 0 2px 12px rgba(0,0,0,0.08); padding: 40px; }
+h1 { font-size: 24px; margin: 24px 0 12px; }
+h2 { font-size: 20px; margin: 20px 0 10px; color: #222; }
+h3 { font-size: 16px; margin: 16px 0 8px; color: #444; }
+p { line-height: 1.6; margin: 8px 0; }
+table { border-collapse: collapse; width: 100%; margin: 12px 0; font-size: 14px; }
+th, td { border: 1px solid #ddd; padding: 8px 12px; text-align: left; }
+th { background: #f0f0f0; font-weight: 600; }
+code { background: #f0f0f0; padding: 2px 6px; border-radius: 3px; font-size: 13px; }
+pre { background: #f8f8f8; border: 1px solid #ddd; border-radius: 6px; padding: 12px; overflow-x: auto; margin: 12px 0; }
+pre code { background: none; padding: 0; }
+a { color: #0066cc; }
+.back { display: inline-block; margin-bottom: 20px; color: #666; }
+.back:hover { color: #333; }
+</style>
+</head>
+<body>
+<div class="container">
+<a class="back" href="index.html">&larr; Back to index</a>
+<hr />
+<pre><code>document_type: "user_manual"
+service: "MOMENTRY_CORE"
+title: "Momentry Core API 教育訓練手冊"
+date: "2026-05-17"
+version: "V1.5"
+status: "active"
+owner: "M5"
+created_by: "OpenCode"</code></pre>
+<hr />
+<h1>Momentry Core API 教育訓練手冊</h1>
+<table class="table">
+<thead>
+<tr>
+<th>項目</th>
+<th>內容</th>
+</tr>
+</thead>
+<tbody>
+<tr>
+<td>目標讀者</td>
+<td>developer</td>
+</tr>
+<tr>
+<td>預備知識</td>
+<td>需有 API Key</td>
+</tr>
+</tbody>
+</table>
+<hr />
+<!-- narrative: marcom_intro -->
+<!-- description: Intro section for Marcom training manual -->
+<!-- depends: -->
+
+<h2>About This Manual</h2>
+<p>This training manual is designed for the Marcom team to understand and use the Momentry Core API.</p>
+<h3>Demo Credentials</h3>
+<p><strong>API Key</strong>: <code>muser_68600856036340bcafc01930eb4bd839_1774418104_97221b69</code></p>
+<p><strong>SFTPGo</strong> (for video upload):</p>
+<table class="table">
+<thead>
+<tr>
+<th>Item</th>
+<th>Value</th>
+</tr>
+</thead>
+<tbody>
+<tr>
+<td>SFTP Host</td>
+<td><code>sftpgo.momentry.ddns.net</code></td>
+</tr>
+<tr>
+<td>SFTP Port</td>
+<td><code>2022</code></td>
+</tr>
+<tr>
+<td>Username</td>
+<td><code>demo</code></td>
+</tr>
+<tr>
+<td>Password</td>
+<td><code>demopassword123</code></td>
+</tr>
+<tr>
+<td>Web UI</td>
+<td><code>https://sftpgo.momentry.ddns.net</code></td>
+</tr>
+</tbody>
+</table>
+<h3>Quick Examples</h3>
+<p><strong>List all videos:</strong></p>
+<div class="codehilite"><pre><span></span><code>curl<span class="w"> </span>-s<span class="w"> </span>-H<span class="w"> </span><span class="s2">&quot;X-API-Key: </span><span class="nv">$KEY</span><span class="s2">&quot;</span><span class="w"> </span><span class="s2">&quot;</span><span class="nv">$API</span><span class="s2">/api/v1/files/scan&quot;</span>
+</code></pre></div>
+
+<p><strong>Search:</strong></p>
+<div class="codehilite"><pre><span></span><code>curl<span class="w"> </span>-s<span class="w"> </span>-X<span class="w"> </span>POST<span class="w"> </span><span class="s2">&quot;</span><span class="nv">$API</span><span class="s2">/api/v1/search&quot;</span><span class="w"> </span><span class="se">\</span>
+<span class="w">  </span>-H<span class="w"> </span><span class="s2">&quot;Content-Type: application/json&quot;</span><span class="w"> </span><span class="se">\</span>
+<span class="w">  </span>-H<span class="w"> </span><span class="s2">&quot;X-API-Key: </span><span class="nv">$KEY</span><span class="s2">&quot;</span><span class="w"> </span><span class="se">\</span>
+<span class="w">  </span>-d<span class="w"> </span><span class="s1">&#39;{&quot;query&quot;: &quot;example&quot;, &quot;limit&quot;: 5}&#39;</span>
+</code></pre></div>
+
+<hr />
+<h2>Base URL</h2>
+<table class="table">
+<thead>
+<tr>
+<th>Environment</th>
+<th>URL</th>
+<th>Purpose</th>
+</tr>
+</thead>
+<tbody>
+<tr>
+<td>Playground (Dev)</td>
+<td><code>http://localhost:3003</code></td>
+<td>Development and testing</td>
+</tr>
+<tr>
+<td>Production</td>
+<td><code>http://localhost:3002</code></td>
+<td>Production deployment</td>
+</tr>
+<tr>
+<td>External (M5)</td>
+<td><code>https://m5api.momentry.ddns.net</code></td>
+<td>Remote access</td>
+</tr>
+</tbody>
+</table>
+<h2>Variables</h2>
+<p>All examples in this documentation use these environment variables:</p>
+<div class="codehilite"><pre><span></span><code><span class="nv">API</span><span class="o">=</span><span class="s2">&quot;http://localhost:3003&quot;</span>
+<span class="nv">KEY</span><span class="o">=</span><span class="s2">&quot;your-api-key-here&quot;</span>
+</code></pre></div>
+
+<h2>Authentication</h2>
+<p>All endpoints under <code>/api/v1/*</code> require authentication unless they are listed below.
+The following endpoints are public (no auth needed):</p>
+<ul>
+<li><code>GET /health</code></li>
+<li><code>POST /api/v1/auth/login</code></li>
+<li><code>POST /api/v1/auth/logout</code></li>
+</ul>
+<h3>Three Authentication Modes</h3>
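+<p>The system supports three authentication methods, checked in <strong>priority order</strong> by the middleware. An API key may be sent either as a header or as a query parameter, which is why the list below has four steps:</p>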
+<div class="codehilite"><pre><span></span><code>Middleware priority:
+  1. Session Cookie (Portal/browser)
+  2. JWT Bearer (API clients: n8n, CLI)
+  3. API Key Header (legacy compatibility)
+  4. API Key Query Param (?api_key=)
+</code></pre></div>
+
+<table class="table">
+<thead>
+<tr>
+<th>Mode</th>
+<th>Transport</th>
+<th>Expiry</th>
+<th>Scope</th>
+<th>Best for</th>
+</tr>
+</thead>
+<tbody>
+<tr>
+<td><strong>Session Cookie</strong></td>
+<td><code>Cookie: session_id=&lt;uuid&gt;</code></td>
+<td>24h</td>
+<td>per-browser session</td>
+<td>Portal (browser)</td>
+</tr>
+<tr>
+<td><strong>JWT</strong></td>
+<td><code>Authorization: Bearer &lt;token&gt;</code></td>
+<td>1h</td>
+<td>per-login token</td>
+<td>API clients (n8n, CLI, scripts)</td>
+</tr>
+<tr>
+<td><strong>API Key</strong></td>
+<td><code>X-API-Key: &lt;key&gt;</code></td>
+<td>90d</td>
+<td>fixed key for automation</td>
+<td>Legacy scripts, WordPress</td>
+</tr>
+</tbody>
+</table>
+<hr />
+<h3>Login</h3>
+<p><strong>Default accounts &amp; API keys:</strong></p>
+<table class="table">
+<thead>
+<tr>
+<th>Username</th>
+<th>Password</th>
+<th>API Key</th>
+<th>Role</th>
+</tr>
+</thead>
+<tbody>
+<tr>
+<td><code>admin</code></td>
+<td><code>admin</code></td>
+<td>—</td>
+<td>admin</td>
+</tr>
+<tr>
+<td><code>demo</code></td>
+<td><code>demo</code></td>
+<td><code>muser_demo_key_32chars_abcdef1234567890</code></td>
+<td>user</td>
+</tr>
+</tbody>
+</table>
+<p>The demo API key is set via <code>MOMENTRY_DEMO_API_KEY</code> env var and can be used in place of JWT for marcom integrations:</p>
+<div class="codehilite"><pre><span></span><code><span class="c1"># Using API key instead of JWT</span>
+curl<span class="w"> </span>-s<span class="w"> </span><span class="s2">&quot;</span><span class="nv">$API</span><span class="s2">/api/v1/files/scan&quot;</span><span class="w"> </span>-H<span class="w"> </span><span class="s2">&quot;X-API-Key: muser_demo_key_32chars_abcdef1234567890&quot;</span>
+</code></pre></div>
+
+<div class="codehilite"><pre><span></span><code><span class="c1"># Login as admin</span>
+curl<span class="w"> </span>-s<span class="w"> </span>-X<span class="w"> </span>POST<span class="w"> </span><span class="s2">&quot;</span><span class="nv">$API</span><span class="s2">/api/v1/auth/login&quot;</span><span class="w"> </span><span class="se">\</span>
+<span class="w">  </span>-H<span class="w"> </span><span class="s2">&quot;Content-Type: application/json&quot;</span><span class="w"> </span><span class="se">\</span>
+<span class="w">  </span>-d<span class="w"> </span><span class="s1">&#39;{&quot;username&quot;: &quot;admin&quot;, &quot;password&quot;: &quot;admin&quot;}&#39;</span>
+
+<span class="c1"># Login as demo user</span>
+curl<span class="w"> </span>-s<span class="w"> </span>-X<span class="w"> </span>POST<span class="w"> </span><span class="s2">&quot;</span><span class="nv">$API</span><span class="s2">/api/v1/auth/login&quot;</span><span class="w"> </span><span class="se">\</span>
+<span class="w">  </span>-H<span class="w"> </span><span class="s2">&quot;Content-Type: application/json&quot;</span><span class="w"> </span><span class="se">\</span>
+<span class="w">  </span>-d<span class="w"> </span><span class="s1">&#39;{&quot;username&quot;: &quot;demo&quot;, &quot;password&quot;: &quot;demo&quot;}&#39;</span>
+</code></pre></div>
+
+<h4>Success Response</h4>
+<div class="codehilite"><pre><span></span><code><span class="p">{</span>
+<span class="w">  </span><span class="nt">&quot;success&quot;</span><span class="p">:</span><span class="w"> </span><span class="kc">true</span><span class="p">,</span>
+<span class="w">  </span><span class="nt">&quot;jwt&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;eyJhbGciOiJIUzI1NiIs...&quot;</span><span class="p">,</span>
+<span class="w">  </span><span class="nt">&quot;api_key&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;muser_...&quot;</span><span class="p">,</span>
+<span class="w">  </span><span class="nt">&quot;user&quot;</span><span class="p">:</span><span class="w"> </span><span class="p">{</span>
+<span class="w">    </span><span class="nt">&quot;username&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;admin&quot;</span><span class="p">,</span>
+<span class="w">    </span><span class="nt">&quot;role&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;admin&quot;</span>
+<span class="w">  </span><span class="p">},</span>
+<span class="w">  </span><span class="nt">&quot;expires_at&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;2026-05-18T13:00:00Z&quot;</span>
+<span class="p">}</span>
+</code></pre></div>
+
+<table class="table">
+<thead>
+<tr>
+<th>Field</th>
+<th>Type</th>
+<th>Description</th>
+</tr>
+</thead>
+<tbody>
+<tr>
+<td><code>jwt</code></td>
+<td>string</td>
+<td>JWT access token. Use as <code>Authorization: Bearer &lt;jwt&gt;</code>. Expires in 1 hour.</td>
+</tr>
+<tr>
+<td><code>api_key</code></td>
+<td>string</td>
+<td>Legacy API key. Use as <code>X-API-Key: &lt;key&gt;</code>. Good for 90 days.</td>
+</tr>
+<tr>
+<td><code>user.username</code></td>
+<td>string</td>
+<td>Username</td>
+</tr>
+<tr>
+<td><code>user.role</code></td>
+<td>string</td>
+<td>Role: <code>admin</code>, <code>user</code>, or <code>readonly</code></td>
+</tr>
+<tr>
+<td><code>expires_at</code></td>
+<td>string</td>
+<td>ISO8601 timestamp of JWT expiration</td>
+</tr>
+</tbody>
+</table>
+<p>The login endpoint also sets a <code>Set-Cookie</code> header for browser-based clients:</p>
+<div class="codehilite"><pre><span></span><code><span class="nt">Set-Cookie</span><span class="o">:</span><span class="w"> </span><span class="nt">session_id</span><span class="o">=&lt;</span><span class="nt">uuid</span><span class="o">&gt;;</span><span class="w"> </span><span class="nt">Path</span><span class="o">=/</span><span class="nt">api</span><span class="o">;</span><span class="w"> </span><span class="nt">HttpOnly</span><span class="o">;</span><span class="w"> </span><span class="nt">SameSite</span><span class="o">=</span><span class="nt">Strict</span><span class="o">;</span><span class="w"> </span><span class="nt">Max-Age</span><span class="o">=</span><span class="nt">86400</span>
+</code></pre></div>
+
+<h4>Error Response (401)</h4>
+<div class="codehilite"><pre><span></span><code><span class="p">{</span>
+<span class="w">  </span><span class="nt">&quot;success&quot;</span><span class="p">:</span><span class="w"> </span><span class="kc">false</span><span class="p">,</span>
+<span class="w">  </span><span class="nt">&quot;message&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;Invalid username or password&quot;</span>
+<span class="p">}</span>
+</code></pre></div>
+
+<hr />
+<h3>Using JWT</h3>
+<p>JWT is preferred for API clients (n8n, CLI scripts, WordPress). It is validated by the middleware without a database lookup (stateless).</p>
+<div class="codehilite"><pre><span></span><code><span class="c1"># Login and capture JWT</span>
+<span class="nv">JWT</span><span class="o">=</span><span class="k">$(</span>curl<span class="w"> </span>-s<span class="w"> </span>-X<span class="w"> </span>POST<span class="w"> </span><span class="s2">&quot;</span><span class="nv">$API</span><span class="s2">/api/v1/auth/login&quot;</span><span class="w"> </span><span class="se">\</span>
+<span class="w">  </span>-H<span class="w"> </span><span class="s2">&quot;Content-Type: application/json&quot;</span><span class="w"> </span><span class="se">\</span>
+<span class="w">  </span>-d<span class="w"> </span><span class="s1">&#39;{&quot;username&quot;:&quot;admin&quot;,&quot;password&quot;:&quot;admin&quot;}&#39;</span><span class="w"> </span><span class="p">|</span><span class="w"> </span>python3<span class="w"> </span>-c<span class="w"> </span><span class="s2">&quot;import json,sys;print(json.load(sys.stdin)[&#39;jwt&#39;])&quot;</span><span class="k">)</span>
+
+<span class="c1"># Use JWT for all subsequent requests</span>
+curl<span class="w"> </span>-H<span class="w"> </span><span class="s2">&quot;Authorization: Bearer </span><span class="nv">$JWT</span><span class="s2">&quot;</span><span class="w"> </span><span class="s2">&quot;</span><span class="nv">$API</span><span class="s2">/api/v1/files/scan&quot;</span>
+curl<span class="w"> </span>-H<span class="w"> </span><span class="s2">&quot;Authorization: Bearer </span><span class="nv">$JWT</span><span class="s2">&quot;</span><span class="w"> </span><span class="s2">&quot;</span><span class="nv">$API</span><span class="s2">/api/v1/resource/tmdb&quot;</span>
+</code></pre></div>
+
+<p>JWT is short-lived (1 hour). When it expires, request a new one via login.</p>
+<hr />
+<h3>Using Session Cookie (Browser)</h3>
+<p>Browser-based clients (Portal) get a session cookie automatically after login. The browser sends the cookie with every request—no manual header needed.</p>
+<div class="codehilite"><pre><span></span><code><span class="c1"># Log in and print the session cookie returned in the Set-Cookie header</span>
+curl<span class="w"> </span>-v<span class="w"> </span>-X<span class="w"> </span>POST<span class="w"> </span><span class="s2">&quot;</span><span class="nv">$API</span><span class="s2">/api/v1/auth/login&quot;</span><span class="w"> </span><span class="se">\</span>
+<span class="w">  </span>-H<span class="w"> </span><span class="s2">&quot;Content-Type: application/json&quot;</span><span class="w"> </span><span class="se">\</span>
+<span class="w">  </span>-d<span class="w"> </span><span class="s1">&#39;{&quot;username&quot;:&quot;admin&quot;,&quot;password&quot;:&quot;admin&quot;}&#39;</span><span class="w"> </span><span class="m">2</span>&gt;<span class="p">&amp;</span><span class="m">1</span><span class="w"> </span><span class="p">|</span><span class="w"> </span>grep<span class="w"> </span><span class="s2">&quot;Set-Cookie&quot;</span>
+
+<span class="c1"># Browser automatically sends: Cookie: session_id=&lt;uuid&gt;</span>
+<span class="c1"># No manual header needed for subsequent requests</span>
+</code></pre></div>
+
+<p>The session cookie is HttpOnly (not accessible from JavaScript) and SameSite=Strict (protected against CSRF).</p>
+<hr />
+<h3>Using Legacy API Key</h3>
+<div class="codehilite"><pre><span></span><code>curl<span class="w"> </span>-H<span class="w"> </span><span class="s2">&quot;X-API-Key: </span><span class="nv">$KEY</span><span class="s2">&quot;</span><span class="w"> </span><span class="s2">&quot;</span><span class="nv">$API</span><span class="s2">/api/v1/files/scan&quot;</span>
+
+<span class="c1"># Also accepted via Bearer header (non-JWT format) or query parameter:</span>
+curl<span class="w"> </span>-H<span class="w"> </span><span class="s2">&quot;Authorization: Bearer </span><span class="nv">$KEY</span><span class="s2">&quot;</span><span class="w"> </span><span class="s2">&quot;</span><span class="nv">$API</span><span class="s2">/api/v1/files/scan&quot;</span>
+curl<span class="w"> </span><span class="s2">&quot;</span><span class="nv">$API</span><span class="s2">/api/v1/files/scan?api_key=</span><span class="nv">$KEY</span><span class="s2">&quot;</span>
+</code></pre></div>
+
+<p>API keys are validated via SHA256 hash lookup in the database. They are long-lived (90 days) and intended for automation.</p>
+<h3>Obtaining an API Key (CLI)</h3>
+<div class="codehilite"><pre><span></span><code>momentry<span class="w"> </span>api-key<span class="w"> </span>create<span class="w"> </span><span class="s2">&quot;My API Key&quot;</span><span class="w"> </span>--key-type<span class="w"> </span>user
+</code></pre></div>
+
+<hr />
+<h3>Logout</h3>
+<div class="codehilite"><pre><span></span><code><span class="c1"># Logout using the session cookie (browser)</span>
+curl<span class="w"> </span>-X<span class="w"> </span>POST<span class="w"> </span><span class="s2">&quot;</span><span class="nv">$API</span><span class="s2">/api/v1/auth/logout&quot;</span><span class="w"> </span><span class="se">\</span>
+<span class="w">  </span>-H<span class="w"> </span><span class="s2">&quot;Cookie: session_id=&lt;uuid&gt;&quot;</span>
+</code></pre></div>
+
+<h4>What logout does</h4>
+<table class="table">
+<thead>
+<tr>
+<th>Auth mode</th>
+<th>Effect</th>
+</tr>
+</thead>
+<tbody>
+<tr>
+<td><strong>Session Cookie</strong></td>
+<td>Session deleted from database. Same cookie returns 401 on subsequent requests.</td>
+</tr>
+<tr>
+<td><strong>JWT</strong></td>
+<td>JWT remains valid until expiry. (JWT is stateless — logout adds JWT to a blacklist only if API key mode is used.)</td>
+</tr>
+<tr>
+<td><strong>API Key</strong></td>
+<td>API key remains valid. (Legacy keys are shared across sessions — revoking would break other clients.)</td>
+</tr>
+</tbody>
+</table>
+<h4>Example: full session lifecycle</h4>
+<div class="codehilite"><pre><span></span><code><span class="c1"># 1. Login</span>
+<span class="nv">SESSION_ID</span><span class="o">=</span><span class="k">$(</span>curl<span class="w"> </span>-s<span class="w"> </span>-D<span class="w"> </span>-<span class="w"> </span>-X<span class="w"> </span>POST<span class="w"> </span><span class="s2">&quot;</span><span class="nv">$API</span><span class="s2">/api/v1/auth/login&quot;</span><span class="w"> </span><span class="se">\</span>
+<span class="w">  </span>-H<span class="w"> </span><span class="s2">&quot;Content-Type: application/json&quot;</span><span class="w"> </span><span class="se">\</span>
+<span class="w">  </span>-d<span class="w"> </span><span class="s1">&#39;{&quot;username&quot;:&quot;admin&quot;,&quot;password&quot;:&quot;admin&quot;}&#39;</span><span class="w"> </span><span class="p">|</span><span class="w"> </span>grep<span class="w"> </span><span class="s2">&quot;Set-Cookie&quot;</span><span class="w"> </span><span class="p">|</span><span class="w"> </span>sed<span class="w"> </span><span class="s1">&#39;s/.*session_id=\([^;]*\).*/\1/&#39;</span><span class="k">)</span>
+
+<span class="c1"># 2. Use session (works)</span>
+curl<span class="w"> </span>-s<span class="w"> </span>-o<span class="w"> </span>/dev/null<span class="w"> </span>-w<span class="w"> </span><span class="s2">&quot;HTTP %{http_code}\n&quot;</span><span class="w"> </span><span class="s2">&quot;</span><span class="nv">$API</span><span class="s2">/api/v1/resource/tmdb&quot;</span><span class="w"> </span><span class="se">\</span>
+<span class="w">  </span>-H<span class="w"> </span><span class="s2">&quot;Cookie: session_id=</span><span class="nv">$SESSION_ID</span><span class="s2">&quot;</span>
+<span class="c1"># → HTTP 200</span>
+
+<span class="c1"># 3. Logout</span>
+curl<span class="w"> </span>-s<span class="w"> </span>-X<span class="w"> </span>POST<span class="w"> </span><span class="s2">&quot;</span><span class="nv">$API</span><span class="s2">/api/v1/auth/logout&quot;</span><span class="w"> </span><span class="se">\</span>
+<span class="w">  </span>-H<span class="w"> </span><span class="s2">&quot;Cookie: session_id=</span><span class="nv">$SESSION_ID</span><span class="s2">&quot;</span>
+<span class="c1"># → {&quot;success&quot;: true}</span>
+
+<span class="c1"># 4. Use session again (rejected)</span>
+curl<span class="w"> </span>-s<span class="w"> </span>-o<span class="w"> </span>/dev/null<span class="w"> </span>-w<span class="w"> </span><span class="s2">&quot;HTTP %{http_code}\n&quot;</span><span class="w"> </span><span class="s2">&quot;</span><span class="nv">$API</span><span class="s2">/api/v1/resource/tmdb&quot;</span><span class="w"> </span><span class="se">\</span>
+<span class="w">  </span>-H<span class="w"> </span><span class="s2">&quot;Cookie: session_id=</span><span class="nv">$SESSION_ID</span><span class="s2">&quot;</span>
+<span class="c1"># → HTTP 401</span>
+</code></pre></div>
+
+<hr />
+<h3>Authentication Flow Summary</h3>
+<div class="codehilite"><pre><span></span><code>Login Request
+     │
+     ▼
+┌──────────────────┐
+│  1. Check users  │ ← users table (argon2 password verify)
+│     table        │
+└──────┬───────────┘
+       │
+   ┌───┴───┐
+   │ match │
+   └───┬───┘
+       │
+       ▼
+┌──────────────────┐
+│  2. Create JWT   │ ← 1h expiry, signed with JWT_SECRET
+├──────────────────┤
+│  3. Create       │ ← 24h expiry, stored in sessions table
+│     session      │
+├──────────────────┤
+│  4. Set-Cookie   │ ← HttpOnly, SameSite=Strict, Path=/api
+├──────────────────┤
+│  5. Return       │ ← JWT + api_key + user info to client
+└──────────────────┘
+</code></pre></div>
+
+<div class="codehilite"><pre><span></span><code>Protected Request
+     │
+     ▼
+┌──────────────────────┐
+│  Middleware checks:  │
+│                      │
+│  1. Cookie session?  │ → DB lookup session → get api_key → verify
+│                      │
+│  2. JWT Bearer?      │ → verify JWT signature → decode claims
+│                      │
+│  3. X-API-Key?       │ → SHA256 hash → DB lookup → verify
+│                      │
+│  4. ?api_key=?       │ → same as #3
+│                      │
+│  5. None → 401       │
+└──────────────────────┘
+</code></pre></div>
+
+<hr />
+<h3>Error Responses</h3>
+<table class="table">
+<thead>
+<tr>
+<th>HTTP</th>
+<th>When</th>
+</tr>
+</thead>
+<tbody>
+<tr>
+<td><code>401</code></td>
+<td>Missing or invalid authentication</td>
+</tr>
+<tr>
+<td><code>401</code></td>
+<td>Session expired or logged out</td>
+</tr>
+<tr>
+<td><code>401</code></td>
+<td>JWT expired</td>
+</tr>
+<tr>
+<td><code>401</code></td>
+<td>API key revoked or inactive</td>
+</tr>
+</tbody>
+</table>
+<hr />
+<h3>Related</h3>
+<ul>
+<li><code>POST /api/v1/resource/tmdb/check</code> — test authentication + TMDb API connectivity</li>
+<li><code>GET /health/detailed</code> — view auth status (integrations section)</li>
+</ul>
+<hr />
+<h2>File Registration</h2>
+<h3><code>POST /api/v1/files/register</code></h3>
+<p><strong>Auth</strong>: Required<br />
+<strong>Scope</strong>: file-level</p>
+<p>Register a video file for processing. Returns the file's metadata and UUID.</p>
+<p><strong>New in v0.1.2</strong>: Registration now <strong>automatically triggers the processing pipeline</strong> — no need to call <code>POST /api/v1/file/:uuid/process</code> separately. The system will:</p>
+<ol><li>Register the file and run ffprobe</li>
+<li>Auto-run offline TMDb probe (reads local identity files, no API calls)</li>
+<li>Create a monitor job for the worker</li>
+<li>Worker starts all 10 processors (Cut → ASR → ASRX → YOLO → OCR → Face → Pose → VisualChunk → Story → 5W1H)</li></ol>
+<p>If the file already exists (same content hash), returns the existing record with <code>already_exists: true</code>.</p>
+<h4>Request Parameters</h4>
+<table class="table">
+<thead>
+<tr>
+<th>Field</th>
+<th>Type</th>
+<th>Required</th>
+<th>Default</th>
+<th>Description</th>
+</tr>
+</thead>
+<tbody>
+<tr>
+<td><code>file_path</code></td>
+<td>string</td>
+<td>Yes</td>
+<td>—</td>
+<td>Path to video file on disk</td>
+</tr>
+<tr>
+<td><code>pattern</code></td>
+<td>string</td>
+<td>No</td>
+<td>—</td>
+<td>Regex pattern for batch register (requires <code>file_path</code> to be a directory)</td>
+</tr>
+<tr>
+<td><code>user_id</code></td>
+<td>integer</td>
+<td>No</td>
+<td>—</td>
+<td>User ID to associate with registration</td>
+</tr>
+<tr>
+<td><code>content_hash</code></td>
+<td>string</td>
+<td>No</td>
+<td>—</td>
+<td>Pre-computed SHA-256 hash (skips computation)</td>
+</tr>
+</tbody>
+</table>
+<h4>Example</h4>
+<div class="codehilite"><pre><span></span><code><span class="c1"># Register a single file</span>
+curl<span class="w"> </span>-s<span class="w"> </span>-X<span class="w"> </span>POST<span class="w"> </span><span class="s2">&quot;</span><span class="nv">$API</span><span class="s2">/api/v1/files/register&quot;</span><span class="w"> </span><span class="se">\</span>
+<span class="w">  </span>-H<span class="w"> </span><span class="s2">&quot;Content-Type: application/json&quot;</span><span class="w"> </span><span class="se">\</span>
+<span class="w">  </span>-H<span class="w"> </span><span class="s2">&quot;X-API-Key: </span><span class="nv">$KEY</span><span class="s2">&quot;</span><span class="w"> </span><span class="se">\</span>
+<span class="w">  </span>-d<span class="w"> </span><span class="s1">&#39;{&quot;file_path&quot;: &quot;/path/to/video.mp4&quot;}&#39;</span>
+
+<span class="c1"># Batch register files matching a pattern in a directory</span>
+curl<span class="w"> </span>-s<span class="w"> </span>-X<span class="w"> </span>POST<span class="w"> </span><span class="s2">&quot;</span><span class="nv">$API</span><span class="s2">/api/v1/files/register&quot;</span><span class="w"> </span><span class="se">\</span>
+<span class="w">  </span>-H<span class="w"> </span><span class="s2">&quot;Content-Type: application/json&quot;</span><span class="w"> </span><span class="se">\</span>
+<span class="w">  </span>-H<span class="w"> </span><span class="s2">&quot;X-API-Key: </span><span class="nv">$KEY</span><span class="s2">&quot;</span><span class="w"> </span><span class="se">\</span>
+<span class="w">  </span>-d<span class="w"> </span><span class="s1">&#39;{&quot;file_path&quot;: &quot;/path/to/dir&quot;, &quot;pattern&quot;: &quot;.*\\.mp4$&quot;}&#39;</span>
+</code></pre></div>
+
+<h4>Response (200)</h4>
+<div class="codehilite"><pre><span></span><code><span class="p">{</span>
+<span class="w">  </span><span class="nt">&quot;success&quot;</span><span class="p">:</span><span class="w"> </span><span class="kc">true</span><span class="p">,</span>
+<span class="w">  </span><span class="nt">&quot;file_uuid&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;3a6c1865...&quot;</span><span class="p">,</span>
+<span class="w">  </span><span class="nt">&quot;file_name&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;video.mp4&quot;</span><span class="p">,</span>
+<span class="w">  </span><span class="nt">&quot;file_path&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;/path/to/video.mp4&quot;</span><span class="p">,</span>
+<span class="w">  </span><span class="nt">&quot;file_type&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;video&quot;</span><span class="p">,</span>
+<span class="w">  </span><span class="nt">&quot;duration&quot;</span><span class="p">:</span><span class="w"> </span><span class="mf">120.5</span><span class="p">,</span>
+<span class="w">  </span><span class="nt">&quot;width&quot;</span><span class="p">:</span><span class="w"> </span><span class="mi">1920</span><span class="p">,</span>
+<span class="w">  </span><span class="nt">&quot;height&quot;</span><span class="p">:</span><span class="w"> </span><span class="mi">1080</span><span class="p">,</span>
+<span class="w">  </span><span class="nt">&quot;fps&quot;</span><span class="p">:</span><span class="w"> </span><span class="mf">24.0</span><span class="p">,</span>
+<span class="w">  </span><span class="nt">&quot;total_frames&quot;</span><span class="p">:</span><span class="w"> </span><span class="mi">2892</span><span class="p">,</span>
+<span class="w">  </span><span class="nt">&quot;already_exists&quot;</span><span class="p">:</span><span class="w"> </span><span class="kc">false</span><span class="p">,</span>
+<span class="w">  </span><span class="nt">&quot;message&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;File registered successfully&quot;</span>
+<span class="p">}</span>
+</code></pre></div>
+
+<table class="table">
+<thead>
+<tr>
+<th>Field</th>
+<th>Type</th>
+<th>Description</th>
+</tr>
+</thead>
+<tbody>
+<tr>
+<td><code>success</code></td>
+<td>boolean</td>
+<td>Always true on 200</td>
+</tr>
+<tr>
+<td><code>file_uuid</code></td>
+<td>string</td>
+<td>32-char hex UUID of the registered file</td>
+</tr>
+<tr>
+<td><code>file_name</code></td>
+<td>string</td>
+<td>File name (auto-renamed if name conflict)</td>
+</tr>
+<tr>
+<td><code>file_path</code></td>
+<td>string</td>
+<td>Canonical path on disk</td>
+</tr>
+<tr>
+<td><code>file_type</code></td>
+<td>string</td>
+<td><code>"video"</code>, <code>"audio"</code>, or <code>"unknown"</code></td>
+</tr>
+<tr>
+<td><code>duration</code></td>
+<td>float</td>
+<td>Duration in seconds</td>
+</tr>
+<tr>
+<td><code>width</code></td>
+<td>integer</td>
+<td>Video width in pixels</td>
+</tr>
+<tr>
+<td><code>height</code></td>
+<td>integer</td>
+<td>Video height in pixels</td>
+</tr>
+<tr>
+<td><code>fps</code></td>
+<td>float</td>
+<td>Frames per second</td>
+</tr>
+<tr>
+<td><code>total_frames</code></td>
+<td>integer</td>
+<td>Total frame count</td>
+</tr>
+<tr>
+<td><code>already_exists</code></td>
+<td>boolean</td>
+<td>True if same content was already registered</td>
+</tr>
+<tr>
+<td><code>message</code></td>
+<td>string</td>
+<td>Human-readable status</td>
+</tr>
+</tbody>
+</table>
+<h4>Error Responses</h4>
+<table class="table">
+<thead>
+<tr>
+<th>HTTP</th>
+<th>When</th>
+</tr>
+</thead>
+<tbody>
+<tr>
+<td><code>401</code></td>
+<td>Missing or invalid API key</td>
+</tr>
+<tr>
+<td><code>400</code></td>
+<td>Invalid request body</td>
+</tr>
+<tr>
+<td><code>404</code></td>
+<td>File path does not exist</td>
+</tr>
+</tbody>
+</table>
+<hr />
+<h3><code>GET /api/v1/files/scan</code></h3>
+<p><strong>Auth</strong>: Required<br />
+<strong>Scope</strong>: file-level</p>
+<p>Scan the filesystem directory and list all media files, showing which are registered, processing, or unregistered.</p>
+<h4>Query Parameters</h4>
+<table class="table">
+<thead>
+<tr>
+<th>Field</th>
+<th>Type</th>
+<th>Required</th>
+<th>Default</th>
+<th>Description</th>
+</tr>
+</thead>
+<tbody>
+<tr>
+<td><code>page</code></td>
+<td>integer</td>
+<td>No</td>
+<td>1</td>
+<td>Page number (1-based)</td>
+</tr>
+<tr>
+<td><code>page_size</code></td>
+<td>integer</td>
+<td>No</td>
+<td>all</td>
+<td>Items per page (alias: <code>limit</code>)</td>
+</tr>
+<tr>
+<td><code>limit</code></td>
+<td>integer</td>
+<td>No</td>
+<td>all</td>
+<td>Max items (alias for <code>page_size</code>)</td>
+</tr>
+<tr>
+<td><code>pattern</code></td>
+<td>string</td>
+<td>No</td>
+<td>—</td>
+<td>Regex filter on file name (e.g., <code>.*\.mp4$</code>; escape the backslash as <code>\\</code> inside a double-quoted shell string)</td>
+</tr>
+<tr>
+<td><code>sort_by</code></td>
+<td>string</td>
+<td>No</td>
+<td><code>name</code></td>
+<td>Sort field: <code>name</code>, <code>size</code>, <code>modified</code>, <code>status</code></td>
+</tr>
+<tr>
+<td><code>sort_order</code></td>
+<td>string</td>
+<td>No</td>
+<td><code>asc</code></td>
+<td>Sort direction: <code>asc</code> or <code>desc</code></td>
+</tr>
+</tbody>
+</table>
+<h4>Example</h4>
+<div class="codehilite"><pre><span></span><code><span class="c1"># Full scan</span>
+curl<span class="w"> </span>-s<span class="w"> </span><span class="s2">&quot;</span><span class="nv">$API</span><span class="s2">/api/v1/files/scan&quot;</span><span class="w"> </span>-H<span class="w"> </span><span class="s2">&quot;X-API-Key: </span><span class="nv">$KEY</span><span class="s2">&quot;</span><span class="w"> </span><span class="p">|</span><span class="w"> </span>jq<span class="w"> </span><span class="s1">&#39;{total, registered_count, unregistered_count}&#39;</span>
+
+<span class="c1"># Paginated (page 1, 5 per page)</span>
+curl<span class="w"> </span>-s<span class="w"> </span><span class="s2">&quot;</span><span class="nv">$API</span><span class="s2">/api/v1/files/scan?page=1&amp;page_size=5&quot;</span><span class="w"> </span>-H<span class="w"> </span><span class="s2">&quot;X-API-Key: </span><span class="nv">$KEY</span><span class="s2">&quot;</span><span class="w"> </span><span class="p">|</span><span class="w"> </span>jq<span class="w"> </span><span class="s1">&#39;{page, total_pages, files: [.files[].file_name]}&#39;</span>
+
+<span class="c1"># Regex filter: only mp4 files</span>
+curl<span class="w"> </span>-s<span class="w"> </span><span class="s2">&quot;</span><span class="nv">$API</span><span class="s2">/api/v1/files/scan?pattern=.*\\.mp4</span>$<span class="s2">&quot;</span><span class="w"> </span>-H<span class="w"> </span><span class="s2">&quot;X-API-Key: </span><span class="nv">$KEY</span><span class="s2">&quot;</span><span class="w"> </span><span class="p">|</span><span class="w"> </span>jq<span class="w"> </span><span class="s1">&#39;{filtered_total, files: [.files[].file_name]}&#39;</span>
+
+<span class="c1"># Sort by file size (largest first)</span>
+curl<span class="w"> </span>-s<span class="w"> </span><span class="s2">&quot;</span><span class="nv">$API</span><span class="s2">/api/v1/files/scan?sort_by=size&amp;sort_order=desc&amp;page_size=5&quot;</span><span class="w"> </span>-H<span class="w"> </span><span class="s2">&quot;X-API-Key: </span><span class="nv">$KEY</span><span class="s2">&quot;</span><span class="w"> </span><span class="p">|</span><span class="w"> </span>jq<span class="w"> </span><span class="s1">&#39;[.files[] | {file_name, file_size}]&#39;</span>
+
+<span class="c1"># Sort by modified time (most recent first)</span>
+curl<span class="w"> </span>-s<span class="w"> </span><span class="s2">&quot;</span><span class="nv">$API</span><span class="s2">/api/v1/files/scan?sort_by=modified&amp;sort_order=desc&amp;page_size=5&quot;</span><span class="w"> </span>-H<span class="w"> </span><span class="s2">&quot;X-API-Key: </span><span class="nv">$KEY</span><span class="s2">&quot;</span><span class="w"> </span><span class="p">|</span><span class="w"> </span>jq<span class="w"> </span><span class="s1">&#39;[.files[] | {file_name, modified_time}]&#39;</span>
+
+<span class="c1"># Sort by status</span>
+curl<span class="w"> </span>-s<span class="w"> </span><span class="s2">&quot;</span><span class="nv">$API</span><span class="s2">/api/v1/files/scan?sort_by=status&amp;page_size=5&quot;</span><span class="w"> </span>-H<span class="w"> </span><span class="s2">&quot;X-API-Key: </span><span class="nv">$KEY</span><span class="s2">&quot;</span><span class="w"> </span><span class="p">|</span><span class="w"> </span>jq<span class="w"> </span><span class="s1">&#39;[.files[] | {file_name, status}]&#39;</span>
+</code></pre></div>
+
+<h4>Response (200)</h4>
+<div class="codehilite"><pre><span></span><code><span class="p">{</span>
+<span class="w">  </span><span class="nt">&quot;files&quot;</span><span class="p">:</span><span class="w"> </span><span class="p">[</span>
+<span class="w">    </span><span class="p">{</span>
+<span class="w">      </span><span class="nt">&quot;file_name&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;video.mp4&quot;</span><span class="p">,</span>
+<span class="w">      </span><span class="nt">&quot;file_size&quot;</span><span class="p">:</span><span class="w"> </span><span class="mi">12345678</span><span class="p">,</span>
+<span class="w">      </span><span class="nt">&quot;is_registered&quot;</span><span class="p">:</span><span class="w"> </span><span class="kc">true</span><span class="p">,</span>
+<span class="w">      </span><span class="nt">&quot;file_uuid&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;3a6c1865...&quot;</span><span class="p">,</span>
+<span class="w">      </span><span class="nt">&quot;status&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;completed&quot;</span><span class="p">,</span>
+<span class="w">      </span><span class="nt">&quot;registration_time&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;2026-05-16T12:00:00Z&quot;</span><span class="p">,</span>
+<span class="w">      </span><span class="nt">&quot;job_id&quot;</span><span class="p">:</span><span class="w"> </span><span class="mi">42</span>
+<span class="w">    </span><span class="p">}</span>
+<span class="w">  </span><span class="p">],</span>
+<span class="w">  </span><span class="nt">&quot;total&quot;</span><span class="p">:</span><span class="w"> </span><span class="mi">107</span><span class="p">,</span>
+<span class="w">  </span><span class="nt">&quot;filtered_total&quot;</span><span class="p">:</span><span class="w"> </span><span class="mi">80</span><span class="p">,</span>
+<span class="w">  </span><span class="nt">&quot;page&quot;</span><span class="p">:</span><span class="w"> </span><span class="mi">1</span><span class="p">,</span>
+<span class="w">  </span><span class="nt">&quot;page_size&quot;</span><span class="p">:</span><span class="w"> </span><span class="mi">20</span><span class="p">,</span>
+<span class="w">  </span><span class="nt">&quot;total_pages&quot;</span><span class="p">:</span><span class="w"> </span><span class="mi">4</span><span class="p">,</span>
+<span class="w">  </span><span class="nt">&quot;registered_count&quot;</span><span class="p">:</span><span class="w"> </span><span class="mi">26</span><span class="p">,</span>
+<span class="w">  </span><span class="nt">&quot;unregistered_count&quot;</span><span class="p">:</span><span class="w"> </span><span class="mi">81</span>
+<span class="p">}</span>
+</code></pre></div>
+
+<table class="table">
+<thead>
+<tr>
+<th>Field</th>
+<th>Type</th>
+<th>Description</th>
+</tr>
+</thead>
+<tbody>
+<tr>
+<td><code>files</code></td>
+<td>array</td>
+<td>Array of file info objects (paginated)</td>
+</tr>
+<tr>
+<td><code>files[].file_name</code></td>
+<td>string</td>
+<td>File name</td>
+</tr>
+<tr>
+<td><code>files[].relative_path</code></td>
+<td>string</td>
+<td>Path relative to scan root</td>
+</tr>
+<tr>
+<td><code>files[].file_path</code></td>
+<td>string</td>
+<td>Absolute path on disk</td>
+</tr>
+<tr>
+<td><code>files[].file_size</code></td>
+<td>integer</td>
+<td>File size in bytes</td>
+</tr>
+<tr>
+<td><code>files[].modified_time</code></td>
+<td>string</td>
+<td>Last modified timestamp (ISO8601)</td>
+</tr>
+<tr>
+<td><code>files[].is_registered</code></td>
+<td>boolean</td>
+<td>Whether file is registered in DB</td>
+</tr>
+<tr>
+<td><code>files[].file_uuid</code></td>
+<td>string</td>
+<td>32-char hex UUID (only if registered)</td>
+</tr>
+<tr>
+<td><code>files[].status</code></td>
+<td>string</td>
+<td><code>"completed"</code>, <code>"processing"</code>, <code>"registered"</code>, <code>"unregistered"</code>, or <code>null</code></td>
+</tr>
+<tr>
+<td><code>files[].registration_time</code></td>
+<td>string</td>
+<td>DB registration timestamp (only if registered)</td>
+</tr>
+<tr>
+<td><code>files[].job_id</code></td>
+<td>integer</td>
+<td>Processing job ID (only if a job exists)</td>
+</tr>
+<tr>
+<td><code>total</code></td>
+<td>integer</td>
+<td>Total files found on disk (unfiltered)</td>
+</tr>
+<tr>
+<td><code>filtered_total</code></td>
+<td>integer</td>
+<td>Files matching regex filter</td>
+</tr>
+<tr>
+<td><code>page</code></td>
+<td>integer</td>
+<td>Current page number</td>
+</tr>
+<tr>
+<td><code>page_size</code></td>
+<td>integer</td>
+<td>Items per page</td>
+</tr>
+<tr>
+<td><code>total_pages</code></td>
+<td>integer</td>
+<td>Total pages</td>
+</tr>
+<tr>
+<td><code>registered_count</code></td>
+<td>integer</td>
+<td>Files registered in DB</td>
+</tr>
+<tr>
+<td><code>unregistered_count</code></td>
+<td>integer</td>
+<td>Files not yet registered</td>
+</tr>
+</tbody>
+</table>
+<h4>Notes</h4>
+<table class="table">
+<thead>
+<tr>
+<th>Feature</th>
+<th>Behavior</th>
+</tr>
+</thead>
+<tbody>
+<tr>
+<td><strong>Regex</strong></td>
+<td>Case-insensitive (<code>(?i)</code> prefix auto-applied). Applied to <code>file_name</code>.</td>
+</tr>
+<tr>
+<td><strong>Sort order</strong></td>
+<td>Default (<code>sort_by=name</code>): registered files first, then alphabetically. <code>sort_by=status</code>: alphabetical by status string.</td>
+</tr>
+<tr>
+<td><strong>Pagination</strong></td>
+<td><code>page_size</code> and <code>limit</code> are aliases. Default: show all results.</td>
+</tr>
+<tr>
+<td><strong>Processing order</strong></td>
+<td><code>pattern</code> regex filter → <code>sort_by</code>/<code>sort_order</code> → <code>page</code>/<code>page_size</code> slice.</td>
+</tr>
+</tbody>
+</table>
+<hr />
+<h2>Search APIs</h2>
+<h3>Standard Search</h3>
+<h3><code>POST /api/v1/search</code></h3>
+<p><strong>Auth</strong>: Required<br />
+<strong>Scope</strong>: file-level</p>
+<p>Semantic/vector search across indexed video chunks. Returns matching chunks with scores.</p>
+<h4>Request Parameters</h4>
+<table class="table">
+<thead>
+<tr>
+<th>Field</th>
+<th>Type</th>
+<th>Required</th>
+<th>Default</th>
+<th>Description</th>
+</tr>
+</thead>
+<tbody>
+<tr>
+<td><code>query</code></td>
+<td>string</td>
+<td>Yes</td>
+<td>—</td>
+<td>Search text</td>
+</tr>
+<tr>
+<td><code>file_uuid</code></td>
+<td>string</td>
+<td>No</td>
+<td>—</td>
+<td>Restrict search to a specific file</td>
+</tr>
+<tr>
+<td><code>limit</code></td>
+<td>integer</td>
+<td>No</td>
+<td>10</td>
+<td>Max results</td>
+</tr>
+<tr>
+<td><code>page</code></td>
+<td>integer</td>
+<td>No</td>
+<td>1</td>
+<td>Page number (1-based)</td>
+</tr>
+<tr>
+<td><code>page_size</code></td>
+<td>integer</td>
+<td>No</td>
+<td><code>limit</code></td>
+<td>Items per page (alias: <code>limit</code>)</td>
+</tr>
+<tr>
+<td><code>mode</code></td>
+<td>string</td>
+<td>No</td>
+<td><code>smart</code></td>
+<td>Search mode: <code>"vector"</code> or <code>"smart"</code></td>
+</tr>
+</tbody>
+</table>
+<h4>Example</h4>
+<div class="codehilite"><pre><span></span><code><span class="c1"># Search across all files</span>
+curl<span class="w"> </span>-s<span class="w"> </span>-X<span class="w"> </span>POST<span class="w"> </span><span class="s2">&quot;</span><span class="nv">$API</span><span class="s2">/api/v1/search&quot;</span><span class="w"> </span><span class="se">\</span>
+<span class="w">  </span>-H<span class="w"> </span><span class="s2">&quot;Content-Type: application/json&quot;</span><span class="w"> </span><span class="se">\</span>
+<span class="w">  </span>-H<span class="w"> </span><span class="s2">&quot;X-API-Key: </span><span class="nv">$KEY</span><span class="s2">&quot;</span><span class="w"> </span><span class="se">\</span>
+<span class="w">  </span>-d<span class="w"> </span><span class="s1">&#39;{&quot;query&quot;: &quot;charade&quot;, &quot;limit&quot;: 5}&#39;</span>
+
+<span class="c1"># Search within a specific file</span>
+curl<span class="w"> </span>-s<span class="w"> </span>-X<span class="w"> </span>POST<span class="w"> </span><span class="s2">&quot;</span><span class="nv">$API</span><span class="s2">/api/v1/search&quot;</span><span class="w"> </span><span class="se">\</span>
+<span class="w">  </span>-H<span class="w"> </span><span class="s2">&quot;Content-Type: application/json&quot;</span><span class="w"> </span><span class="se">\</span>
+<span class="w">  </span>-H<span class="w"> </span><span class="s2">&quot;X-API-Key: </span><span class="nv">$KEY</span><span class="s2">&quot;</span><span class="w"> </span><span class="se">\</span>
+<span class="w">  </span>-d<span class="w"> </span><span class="s1">&#39;{&quot;query&quot;: &quot;charade&quot;, &quot;file_uuid&quot;: &quot;&#39;</span><span class="s2">&quot;</span><span class="nv">$FILE_UUID</span><span class="s2">&quot;</span><span class="s1">&#39;&quot;}&#39;</span>
+
+<span class="c1"># Paginated search</span>
+curl<span class="w"> </span>-s<span class="w"> </span>-X<span class="w"> </span>POST<span class="w"> </span><span class="s2">&quot;</span><span class="nv">$API</span><span class="s2">/api/v1/search&quot;</span><span class="w"> </span><span class="se">\</span>
+<span class="w">  </span>-H<span class="w"> </span><span class="s2">&quot;Content-Type: application/json&quot;</span><span class="w"> </span><span class="se">\</span>
+<span class="w">  </span>-H<span class="w"> </span><span class="s2">&quot;X-API-Key: </span><span class="nv">$KEY</span><span class="s2">&quot;</span><span class="w"> </span><span class="se">\</span>
+<span class="w">  </span>-d<span class="w"> </span><span class="s1">&#39;{&quot;query&quot;: &quot;charade&quot;, &quot;page&quot;: 1, &quot;page_size&quot;: 3}&#39;</span>
+</code></pre></div>
+
+<h4>Response (200)</h4>
+<div class="codehilite"><pre><span></span><code><span class="p">{</span>
+<span class="w">  </span><span class="nt">&quot;results&quot;</span><span class="p">:</span><span class="w"> </span><span class="p">[</span>
+<span class="w">    </span><span class="p">{</span>
+<span class="w">      </span><span class="nt">&quot;uuid&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;3a6c1865...&quot;</span><span class="p">,</span>
+<span class="w">      </span><span class="nt">&quot;chunk_id&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;sentence_0012&quot;</span><span class="p">,</span>
+<span class="w">      </span><span class="nt">&quot;chunk_type&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;sentence&quot;</span><span class="p">,</span>
+<span class="w">      </span><span class="nt">&quot;start_time&quot;</span><span class="p">:</span><span class="w"> </span><span class="mf">48.8</span><span class="p">,</span>
+<span class="w">      </span><span class="nt">&quot;end_time&quot;</span><span class="p">:</span><span class="w"> </span><span class="mf">55.4</span><span class="p">,</span>
+<span class="w">      </span><span class="nt">&quot;text&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;charade is a classic film...&quot;</span><span class="p">,</span>
+<span class="w">      </span><span class="nt">&quot;score&quot;</span><span class="p">:</span><span class="w"> </span><span class="mf">0.92</span>
+<span class="w">    </span><span class="p">}</span>
+<span class="w">  </span><span class="p">],</span>
+<span class="w">  </span><span class="nt">&quot;query&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;charade&quot;</span><span class="p">,</span>
+<span class="w">  </span><span class="nt">&quot;total&quot;</span><span class="p">:</span><span class="w"> </span><span class="mi">15</span><span class="p">,</span>
+<span class="w">  </span><span class="nt">&quot;page&quot;</span><span class="p">:</span><span class="w"> </span><span class="mi">1</span><span class="p">,</span>
+<span class="w">  </span><span class="nt">&quot;page_size&quot;</span><span class="p">:</span><span class="w"> </span><span class="mi">3</span>
+<span class="p">}</span>
+
+<span class="err">&gt;</span><span class="w"> </span><span class="err">Resul</span><span class="kc">ts</span><span class="w"> </span><span class="err">are</span><span class="w"> </span><span class="err">deduplica</span><span class="kc">te</span><span class="err">d</span><span class="w"> </span><span class="err">by</span><span class="w"> </span><span class="err">`chu</span><span class="kc">n</span><span class="err">k_id`</span><span class="w"> </span><span class="err">(highes</span><span class="kc">t</span><span class="w"> </span><span class="err">score</span><span class="w"> </span><span class="err">wi</span><span class="kc">ns</span><span class="err">)</span><span class="w"> </span><span class="err">be</span><span class="kc">f</span><span class="err">ore</span><span class="w"> </span><span class="err">pagi</span><span class="kc">nat</span><span class="err">io</span><span class="kc">n</span><span class="err">.</span>
+
+<span class="err">|</span><span class="w"> </span><span class="err">Field</span><span class="w"> </span><span class="err">|</span><span class="w"> </span><span class="err">Type</span><span class="w"> </span><span class="err">|</span><span class="w"> </span><span class="err">Descrip</span><span class="kc">t</span><span class="err">io</span><span class="kc">n</span><span class="w"> </span><span class="err">|</span>
+<span class="err">|</span><span class="mi">-------</span><span class="err">|</span><span class="mi">------</span><span class="err">|</span><span class="mi">-------------</span><span class="err">|</span>
+<span class="err">|</span><span class="w"> </span><span class="err">`resul</span><span class="kc">ts</span><span class="err">`</span><span class="w"> </span><span class="err">|</span><span class="w"> </span><span class="err">array</span><span class="w"> </span><span class="err">|</span><span class="w"> </span><span class="err">Array</span><span class="w"> </span><span class="err">o</span><span class="kc">f</span><span class="w"> </span><span class="err">ma</span><span class="kc">t</span><span class="err">ched</span><span class="w"> </span><span class="err">chu</span><span class="kc">n</span><span class="err">ks</span><span class="w"> </span><span class="err">(deduplica</span><span class="kc">te</span><span class="err">d)</span><span class="w"> </span><span class="err">|</span>
+<span class="err">|</span><span class="w"> </span><span class="err">`resul</span><span class="kc">ts</span><span class="p">[]</span><span class="err">.uuid`</span><span class="w"> </span><span class="err">|</span><span class="w"> </span><span class="err">s</span><span class="kc">tr</span><span class="err">i</span><span class="kc">n</span><span class="err">g</span><span class="w"> </span><span class="err">|</span><span class="w"> </span><span class="err">File</span><span class="w"> </span><span class="err">UUID</span><span class="w"> </span><span class="err">|</span>
+<span class="err">|</span><span class="w"> </span><span class="err">`resul</span><span class="kc">ts</span><span class="p">[]</span><span class="err">.chu</span><span class="kc">n</span><span class="err">k_id`</span><span class="w"> </span><span class="err">|</span><span class="w"> </span><span class="err">s</span><span class="kc">tr</span><span class="err">i</span><span class="kc">n</span><span class="err">g</span><span class="w"> </span><span class="err">|</span><span class="w"> </span><span class="err">Chu</span><span class="kc">n</span><span class="err">k</span><span class="w"> </span><span class="err">ide</span><span class="kc">nt</span><span class="err">i</span><span class="kc">f</span><span class="err">ier</span><span class="w"> </span><span class="err">|</span>
+<span class="err">|</span><span class="w"> </span><span class="err">`resul</span><span class="kc">ts</span><span class="p">[]</span><span class="err">.chu</span><span class="kc">n</span><span class="err">k_</span><span class="kc">t</span><span class="err">ype`</span><span class="w"> </span><span class="err">|</span><span class="w"> </span><span class="err">s</span><span class="kc">tr</span><span class="err">i</span><span class="kc">n</span><span class="err">g</span><span class="w"> </span><span class="err">|</span><span class="w"> </span><span class="err">`</span><span class="s2">&quot;sentence&quot;</span><span class="err">`</span><span class="p">,</span><span class="w"> </span><span class="err">`</span><span class="s2">&quot;cut&quot;</span><span class="err">`</span><span class="p">,</span><span class="w"> </span><span class="err">`</span><span class="s2">&quot;trace&quot;</span><span class="err">`</span><span class="p">,</span><span class="w"> </span><span class="err">`</span><span class="s2">&quot;visual&quot;</span><span class="err">`</span><span class="w"> </span><span class="err">|</span>
+<span class="err">|</span><span class="w"> </span><span class="err">`resul</span><span class="kc">ts</span><span class="p">[]</span><span class="err">.s</span><span class="kc">tart</span><span class="err">_</span><span class="kc">t</span><span class="err">ime`</span><span class="w"> </span><span class="err">|</span><span class="w"> </span><span class="kc">fl</span><span class="err">oa</span><span class="kc">t</span><span class="w"> </span><span class="err">|</span><span class="w"> </span><span class="err">S</span><span class="kc">tart</span><span class="w"> </span><span class="kc">t</span><span class="err">ime</span><span class="w"> </span><span class="err">i</span><span class="kc">n</span><span class="w"> </span><span class="err">seco</span><span class="kc">n</span><span class="err">ds</span><span class="w"> </span><span class="err">|</span>
+<span class="err">|</span><span class="w"> </span><span class="err">`resul</span><span class="kc">ts</span><span class="p">[]</span><span class="err">.e</span><span class="kc">n</span><span class="err">d_</span><span class="kc">t</span><span class="err">ime`</span><span class="w"> </span><span class="err">|</span><span class="w"> </span><span class="kc">fl</span><span class="err">oa</span><span class="kc">t</span><span class="w"> </span><span class="err">|</span><span class="w"> </span><span class="err">E</span><span class="kc">n</span><span class="err">d</span><span class="w"> </span><span class="kc">t</span><span class="err">ime</span><span class="w"> </span><span class="err">i</span><span class="kc">n</span><span class="w"> </span><span class="err">seco</span><span class="kc">n</span><span class="err">ds</span><span class="w"> </span><span class="err">|</span>
+<span class="err">|</span><span class="w"> </span><span class="err">`resul</span><span class="kc">ts</span><span class="p">[]</span><span class="err">.</span><span class="kc">te</span><span class="err">x</span><span class="kc">t</span><span class="err">`</span><span class="w"> </span><span class="err">|</span><span class="w"> </span><span class="err">s</span><span class="kc">tr</span><span class="err">i</span><span class="kc">n</span><span class="err">g</span><span class="w"> </span><span class="err">|</span><span class="w"> </span><span class="err">Chu</span><span class="kc">n</span><span class="err">k</span><span class="w"> </span><span class="kc">te</span><span class="err">x</span><span class="kc">t</span><span class="w"> </span><span class="err">co</span><span class="kc">ntent</span><span class="w"> </span><span class="err">|</span>
+<span class="err">|</span><span class="w"> </span><span class="err">`resul</span><span class="kc">ts</span><span class="p">[]</span><span class="err">.score`</span><span class="w"> </span><span class="err">|</span><span class="w"> </span><span class="kc">fl</span><span class="err">oa</span><span class="kc">t</span><span class="w"> </span><span class="err">|</span><span class="w"> </span><span class="err">Similari</span><span class="kc">t</span><span class="err">y</span><span class="w"> </span><span class="err">score</span><span class="w"> </span><span class="err">(</span><span class="mf">0.0</span><span class="err">–</span><span class="mf">1.0</span><span class="err">)</span><span class="w"> </span><span class="err">|</span>
+<span class="err">|</span><span class="w"> </span><span class="err">`query`</span><span class="w"> </span><span class="err">|</span><span class="w"> </span><span class="err">s</span><span class="kc">tr</span><span class="err">i</span><span class="kc">n</span><span class="err">g</span><span class="w"> </span><span class="err">|</span><span class="w"> </span><span class="err">Origi</span><span class="kc">nal</span><span class="w"> </span><span class="err">search</span><span class="w"> </span><span class="err">query</span><span class="w"> </span><span class="err">|</span>
+<span class="err">|</span><span class="w"> </span><span class="err">`</span><span class="kc">t</span><span class="err">o</span><span class="kc">tal</span><span class="err">`</span><span class="w"> </span><span class="err">|</span><span class="w"> </span><span class="err">i</span><span class="kc">nte</span><span class="err">ger</span><span class="w"> </span><span class="err">|</span><span class="w"> </span><span class="err">To</span><span class="kc">tal</span><span class="w"> </span><span class="err">ma</span><span class="kc">t</span><span class="err">chi</span><span class="kc">n</span><span class="err">g</span><span class="w"> </span><span class="err">resul</span><span class="kc">ts</span><span class="w"> </span><span class="err">|</span>
+<span class="err">|</span><span class="w"> </span><span class="err">`page`</span><span class="w"> </span><span class="err">|</span><span class="w"> </span><span class="err">i</span><span class="kc">nte</span><span class="err">ger</span><span class="w"> </span><span class="err">|</span><span class="w"> </span><span class="err">Curre</span><span class="kc">nt</span><span class="w"> </span><span class="err">page</span><span class="w"> </span><span class="kc">nu</span><span class="err">mber</span><span class="w"> </span><span class="err">|</span>
+<span class="err">|</span><span class="w"> </span><span class="err">`page_size`</span><span class="w"> </span><span class="err">|</span><span class="w"> </span><span class="err">i</span><span class="kc">nte</span><span class="err">ger</span><span class="w"> </span><span class="err">|</span><span class="w"> </span><span class="err">I</span><span class="kc">te</span><span class="err">ms</span><span class="w"> </span><span class="err">per</span><span class="w"> </span><span class="err">page</span><span class="w"> </span><span class="err">|</span>
+
+<span class="err">####</span><span class="w"> </span><span class="err">Error</span><span class="w"> </span><span class="err">Respo</span><span class="kc">nses</span>
+
+<span class="err">|</span><span class="w"> </span><span class="err">HTTP</span><span class="w"> </span><span class="err">|</span><span class="w"> </span><span class="err">Whe</span><span class="kc">n</span><span class="w"> </span><span class="err">|</span>
+<span class="err">|</span><span class="mi">------</span><span class="err">|</span><span class="mi">------</span><span class="err">|</span>
+<span class="err">|</span><span class="w"> </span><span class="err">`</span><span class="mi">401</span><span class="err">`</span><span class="w"> </span><span class="err">|</span><span class="w"> </span><span class="err">Missi</span><span class="kc">n</span><span class="err">g</span><span class="w"> </span><span class="err">or</span><span class="w"> </span><span class="err">i</span><span class="kc">n</span><span class="err">valid</span><span class="w"> </span><span class="err">API</span><span class="w"> </span><span class="err">key</span><span class="w"> </span><span class="err">|</span>
+
+<span class="mi">---</span>
+
+<span class="err">###</span><span class="w"> </span><span class="err">`POST</span><span class="w"> </span><span class="err">/api/v</span><span class="mi">1</span><span class="err">/search/hybrid`</span>
+
+<span class="err">**Au</span><span class="kc">t</span><span class="err">h**</span><span class="p">:</span><span class="w"> </span><span class="err">Required</span>
+<span class="err">**Scope**</span><span class="p">:</span><span class="w"> </span><span class="kc">f</span><span class="err">ile</span><span class="mi">-</span><span class="err">level</span>
+
+<span class="err">Hybrid</span><span class="w"> </span><span class="err">search</span><span class="w"> </span><span class="err">combi</span><span class="kc">n</span><span class="err">i</span><span class="kc">n</span><span class="err">g</span><span class="w"> </span><span class="err">vec</span><span class="kc">t</span><span class="err">or</span><span class="w"> </span><span class="err">similari</span><span class="kc">t</span><span class="err">y</span><span class="w"> </span><span class="err">score</span><span class="w"> </span><span class="err">a</span><span class="kc">n</span><span class="err">d</span><span class="w"> </span><span class="err">BM</span><span class="mi">25</span><span class="w"> </span><span class="kc">te</span><span class="err">x</span><span class="kc">t</span><span class="w"> </span><span class="err">score</span><span class="w"> </span><span class="err">i</span><span class="kc">nt</span><span class="err">o</span><span class="w"> </span><span class="err">a</span><span class="w"> </span><span class="err">combi</span><span class="kc">ne</span><span class="err">d</span><span class="w"> </span><span class="err">score.</span>
+
+<span class="err">####</span><span class="w"> </span><span class="err">Reques</span><span class="kc">t</span><span class="w"> </span><span class="err">Parame</span><span class="kc">ters</span>
+
+<span class="err">|</span><span class="w"> </span><span class="err">Field</span><span class="w"> </span><span class="err">|</span><span class="w"> </span><span class="err">Type</span><span class="w"> </span><span class="err">|</span><span class="w"> </span><span class="err">Required</span><span class="w"> </span><span class="err">|</span><span class="w"> </span><span class="err">De</span><span class="kc">fault</span><span class="w"> </span><span class="err">|</span><span class="w"> </span><span class="err">Descrip</span><span class="kc">t</span><span class="err">io</span><span class="kc">n</span><span class="w"> </span><span class="err">|</span>
+<span class="err">|</span><span class="mi">-------</span><span class="err">|</span><span class="mi">------</span><span class="err">|</span><span class="mi">----------</span><span class="err">|</span><span class="mi">---------</span><span class="err">|</span><span class="mi">-------------</span><span class="err">|</span>
+<span class="err">|</span><span class="w"> </span><span class="err">`query`</span><span class="w"> </span><span class="err">|</span><span class="w"> </span><span class="err">s</span><span class="kc">tr</span><span class="err">i</span><span class="kc">n</span><span class="err">g</span><span class="w"> </span><span class="err">|</span><span class="w"> </span><span class="err">Yes</span><span class="w"> </span><span class="err">|</span><span class="w"> </span><span class="err">—</span><span class="w"> </span><span class="err">|</span><span class="w"> </span><span class="err">Search</span><span class="w"> </span><span class="kc">te</span><span class="err">x</span><span class="kc">t</span><span class="w"> </span><span class="err">|</span>
+<span class="err">|</span><span class="w"> </span><span class="err">`</span><span class="kc">f</span><span class="err">ile_uuid`</span><span class="w"> </span><span class="err">|</span><span class="w"> </span><span class="err">s</span><span class="kc">tr</span><span class="err">i</span><span class="kc">n</span><span class="err">g</span><span class="w"> </span><span class="err">|</span><span class="w"> </span><span class="err">No</span><span class="w"> </span><span class="err">|</span><span class="w"> </span><span class="err">—</span><span class="w"> </span><span class="err">|</span><span class="w"> </span><span class="err">Res</span><span class="kc">tr</span><span class="err">ic</span><span class="kc">t</span><span class="w"> </span><span class="err">search</span><span class="w"> </span><span class="kc">t</span><span class="err">o</span><span class="w"> </span><span class="err">a</span><span class="w"> </span><span class="err">speci</span><span class="kc">f</span><span class="err">ic</span><span class="w"> </span><span class="kc">f</span><span class="err">ile</span><span class="w"> </span><span class="err">|</span>
+<span class="err">|</span><span class="w"> </span><span class="err">`limi</span><span class="kc">t</span><span class="err">`</span><span class="w"> </span><span class="err">|</span><span class="w"> </span><span class="err">i</span><span class="kc">nte</span><span class="err">ger</span><span class="w"> </span><span class="err">|</span><span class="w"> </span><span class="err">No</span><span class="w"> </span><span class="err">|</span><span class="w"> </span><span class="mi">10</span><span class="w"> </span><span class="err">|</span><span class="w"> </span><span class="err">Max</span><span class="w"> </span><span class="err">resul</span><span class="kc">ts</span><span class="w"> </span><span class="err">|</span>
+<span class="err">|</span><span class="w"> </span><span class="err">`page`</span><span class="w"> </span><span class="err">|</span><span class="w"> </span><span class="err">i</span><span class="kc">nte</span><span class="err">ger</span><span class="w"> </span><span class="err">|</span><span class="w"> </span><span class="err">No</span><span class="w"> </span><span class="err">|</span><span class="w"> </span><span class="mi">1</span><span class="w"> </span><span class="err">|</span><span class="w"> </span><span class="err">Page</span><span class="w"> </span><span class="kc">nu</span><span class="err">mber</span><span class="w"> </span><span class="err">(</span><span class="mi">1-</span><span class="err">based)</span><span class="w"> </span><span class="err">|</span>
+<span class="err">|</span><span class="w"> </span><span class="err">`page_size`</span><span class="w"> </span><span class="err">|</span><span class="w"> </span><span class="err">i</span><span class="kc">nte</span><span class="err">ger</span><span class="w"> </span><span class="err">|</span><span class="w"> </span><span class="err">No</span><span class="w"> </span><span class="err">|</span><span class="w"> </span><span class="err">`limi</span><span class="kc">t</span><span class="err">`</span><span class="w"> </span><span class="err">|</span><span class="w"> </span><span class="err">I</span><span class="kc">te</span><span class="err">ms</span><span class="w"> </span><span class="err">per</span><span class="w"> </span><span class="err">page</span><span class="w"> </span><span class="err">|</span>
+<span class="err">|</span><span class="w"> </span><span class="err">`vec</span><span class="kc">t</span><span class="err">or_weigh</span><span class="kc">t</span><span class="err">`</span><span class="w"> </span><span class="err">|</span><span class="w"> </span><span class="kc">fl</span><span class="err">oa</span><span class="kc">t</span><span class="w"> </span><span class="err">|</span><span class="w"> </span><span class="err">No</span><span class="w"> </span><span class="err">|</span><span class="w"> </span><span class="mf">0.5</span><span class="w"> </span><span class="err">|</span><span class="w"> </span><span class="err">Weigh</span><span class="kc">t</span><span class="w"> </span><span class="kc">f</span><span class="err">or</span><span class="w"> </span><span class="err">vec</span><span class="kc">t</span><span class="err">or</span><span class="w"> </span><span class="err">score</span><span class="w"> </span><span class="err">(</span><span class="mf">0.0</span><span class="err">–</span><span class="mf">1.0</span><span class="err">)</span><span class="w"> </span><span class="err">|</span>
+<span class="err">|</span><span class="w"> </span><span class="err">`bm</span><span class="mi">25</span><span class="err">_weigh</span><span class="kc">t</span><span class="err">`</span><span class="w"> </span><span class="err">|</span><span class="w"> </span><span class="kc">fl</span><span class="err">oa</span><span class="kc">t</span><span class="w"> </span><span class="err">|</span><span class="w"> </span><span class="err">No</span><span class="w"> </span><span class="err">|</span><span class="w"> </span><span class="mf">0.5</span><span class="w"> </span><span class="err">|</span><span class="w"> </span><span class="err">Weigh</span><span class="kc">t</span><span class="w"> </span><span class="kc">f</span><span class="err">or</span><span class="w"> </span><span class="err">BM</span><span class="mi">25</span><span class="w"> </span><span class="err">score</span><span class="w"> </span><span class="err">(</span><span class="mf">0.0</span><span class="err">–</span><span class="mf">1.0</span><span class="err">)</span><span class="w"> </span><span class="err">|</span>
+
+<span class="err">####</span><span class="w"> </span><span class="err">Respo</span><span class="kc">nse</span>
+
+<span class="err">```jso</span><span class="kc">n</span>
+<span class="p">{</span>
+<span class="w">  </span><span class="nt">&quot;results&quot;</span><span class="p">:</span><span class="w"> </span><span class="p">[</span>
+<span class="w">    </span><span class="p">{</span>
+<span class="w">      </span><span class="nt">&quot;uuid&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;3a6c1865...&quot;</span><span class="p">,</span>
+<span class="w">      </span><span class="nt">&quot;chunk_id&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;sentence_0012&quot;</span><span class="p">,</span>
+<span class="w">      </span><span class="nt">&quot;chunk_type&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;sentence&quot;</span><span class="p">,</span>
+<span class="w">      </span><span class="nt">&quot;start_time&quot;</span><span class="p">:</span><span class="w"> </span><span class="mf">48.8</span><span class="p">,</span>
+<span class="w">      </span><span class="nt">&quot;end_time&quot;</span><span class="p">:</span><span class="w"> </span><span class="mf">55.4</span><span class="p">,</span>
+<span class="w">      </span><span class="nt">&quot;text&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;charade is a classic film...&quot;</span><span class="p">,</span>
+<span class="w">      </span><span class="nt">&quot;vector_score&quot;</span><span class="p">:</span><span class="w"> </span><span class="mf">0.85</span><span class="p">,</span>
+<span class="w">      </span><span class="nt">&quot;bm25_score&quot;</span><span class="p">:</span><span class="w"> </span><span class="mf">0.72</span><span class="p">,</span>
+<span class="w">      </span><span class="nt">&quot;combined_score&quot;</span><span class="p">:</span><span class="w"> </span><span class="mf">0.79</span>
+<span class="w">    </span><span class="p">}</span>
+<span class="w">  </span><span class="p">],</span>
+<span class="w">  </span><span class="nt">&quot;query&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;charade&quot;</span>
+<span class="p">}</span>
+</code></pre></div>
+
+<table class="table">
+<thead>
+<tr>
+<th>Field</th>
+<th>Type</th>
+<th>Description</th>
+</tr>
+</thead>
+<tbody>
+<tr>
+<td><code>results[].vector_score</code></td>
+<td>float</td>
+<td>Vector similarity score</td>
+</tr>
+<tr>
+<td><code>results[].bm25_score</code></td>
+<td>float</td>
+<td>BM25 text score</td>
+</tr>
+<tr>
+<td><code>results[].combined_score</code></td>
+<td>float</td>
+<td>Weighted combination of both scores</td>
+</tr>
+</tbody>
+</table>
+<hr />
+<h3><code>POST /api/v1/search/bm25</code></h3>
+<p><strong>Auth</strong>: Required<br />
+<strong>Scope</strong>: file-level</p>
+<p>BM25 full-text keyword search. Good for exact term matching. Returns results with BM25 score only.</p>
+<h4>Request Parameters</h4>
+<p>Same as standard search: <code>query</code>, <code>file_uuid</code>, <code>limit</code>.</p>
+<h4>Response</h4>
+<p>Returns the same structure as standard search, with <code>score</code> representing the BM25 relevance score.</p>
+<hr />
+<h3>N8N Search</h3>
+<p>N8N-format search endpoints. Response format is optimized for n8n workflow consumption.</p>
+<table class="table">
+<thead>
+<tr>
+<th>Method</th>
+<th>Endpoint</th>
+<th>Description</th>
+</tr>
+</thead>
+<tbody>
+<tr>
+<td>POST</td>
+<td><code>/api/v1/n8n/search</code></td>
+<td>N8N-format vector search</td>
+</tr>
+<tr>
+<td>POST</td>
+<td><code>/api/v1/n8n/search/bm25</code></td>
+<td>N8N-format BM25 search</td>
+</tr>
+<tr>
+<td>POST</td>
+<td><code>/api/v1/n8n/search/hybrid</code></td>
+<td>N8N-format hybrid search</td>
+</tr>
+<tr>
+<td>POST</td>
+<td><code>/api/v1/n8n/search/smart</code></td>
+<td>N8N-format smart search</td>
+</tr>
+</tbody>
+</table>
+<h4>Request Parameters</h4>
+<table class="table">
+<thead>
+<tr>
+<th>Field</th>
+<th>Type</th>
+<th>Required</th>
+<th>Default</th>
+<th>Description</th>
+</tr>
+</thead>
+<tbody>
+<tr>
+<td><code>query</code></td>
+<td>string</td>
+<td>Yes</td>
+<td>—</td>
+<td>Search text</td>
+</tr>
+<tr>
+<td><code>file_uuid</code></td>
+<td>string</td>
+<td>No</td>
+<td>—</td>
+<td>Restrict to specific file</td>
+</tr>
+<tr>
+<td><code>types</code></td>
+<td>string[]</td>
+<td>No</td>
+<td><code>["chunk"]</code></td>
+<td>Search types: <code>chunk</code>, <code>frame</code>, <code>person</code></td>
+</tr>
+<tr>
+<td><code>filters</code></td>
+<td>object</td>
+<td>No</td>
+<td>—</td>
+<td>Filter criteria (confidence, object class, speaker, etc.)</td>
+</tr>
+<tr>
+<td><code>page</code></td>
+<td>integer</td>
+<td>No</td>
+<td>1</td>
+<td>Page number</td>
+</tr>
+<tr>
+<td><code>page_size</code></td>
+<td>integer</td>
+<td>No</td>
+<td>20</td>
+<td>Items per page</td>
+</tr>
+<tr>
+<td><code>time_range</code></td>
+<td>float[2]</td>
+<td>No</td>
+<td>—</td>
+<td>Time range <code>[start, end]</code> in seconds</td>
+</tr>
+</tbody>
+</table>
+<h4>Example</h4>
+<div class="codehilite"><pre><span></span><code>curl<span class="w"> </span>-s<span class="w"> </span>-X<span class="w"> </span>POST<span class="w"> </span><span class="s2">&quot;</span><span class="nv">$API</span><span class="s2">/api/v1/n8n/search&quot;</span><span class="w"> </span><span class="se">\</span>
+<span class="w">  </span>-H<span class="w"> </span><span class="s2">&quot;Content-Type: application/json&quot;</span><span class="w"> </span><span class="se">\</span>
+<span class="w">  </span>-H<span class="w"> </span><span class="s2">&quot;X-API-Key: </span><span class="nv">$KEY</span><span class="s2">&quot;</span><span class="w"> </span><span class="se">\</span>
+<span class="w">  </span>-d<span class="w"> </span><span class="s1">&#39;{&quot;query&quot;: &quot;charade&quot;, &quot;limit&quot;: 5}&#39;</span>
+</code></pre></div>
+
+<h4>Response (200)</h4>
+<div class="codehilite"><pre><span></span><code><span class="p">{</span>
+<span class="w">  </span><span class="nt">&quot;query&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;charade&quot;</span><span class="p">,</span>
+<span class="w">  </span><span class="nt">&quot;results&quot;</span><span class="p">:</span><span class="w"> </span><span class="p">[</span>
+<span class="w">    </span><span class="p">{</span>
+<span class="w">      </span><span class="nt">&quot;type&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;chunk&quot;</span><span class="p">,</span>
+<span class="w">      </span><span class="nt">&quot;chunk_id&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;sentence_0012&quot;</span><span class="p">,</span>
+<span class="w">      </span><span class="nt">&quot;chunk_type&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;sentence&quot;</span><span class="p">,</span>
+<span class="w">      </span><span class="nt">&quot;file_uuid&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;3a6c1865...&quot;</span><span class="p">,</span>
+<span class="w">      </span><span class="nt">&quot;start_time&quot;</span><span class="p">:</span><span class="w"> </span><span class="mf">48.8</span><span class="p">,</span>
+<span class="w">      </span><span class="nt">&quot;end_time&quot;</span><span class="p">:</span><span class="w"> </span><span class="mf">55.4</span><span class="p">,</span>
+<span class="w">      </span><span class="nt">&quot;text&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;charade is a classic film...&quot;</span><span class="p">,</span>
+<span class="w">      </span><span class="nt">&quot;score&quot;</span><span class="p">:</span><span class="w"> </span><span class="mf">0.92</span>
+<span class="w">    </span><span class="p">}</span>
+<span class="w">  </span><span class="p">],</span>
+<span class="w">  </span><span class="nt">&quot;total&quot;</span><span class="p">:</span><span class="w"> </span><span class="mi">15</span><span class="p">,</span>
+<span class="w">  </span><span class="nt">&quot;page&quot;</span><span class="p">:</span><span class="w"> </span><span class="mi">1</span><span class="p">,</span>
+<span class="w">  </span><span class="nt">&quot;page_size&quot;</span><span class="p">:</span><span class="w"> </span><span class="mi">20</span><span class="p">,</span>
+<span class="w">  </span><span class="nt">&quot;took_ms&quot;</span><span class="p">:</span><span class="w"> </span><span class="mi">42</span>
+<span class="p">}</span>
+</code></pre></div>
+
+<table class="table">
+<thead>
+<tr>
+<th>Field</th>
+<th>Type</th>
+<th>Description</th>
+</tr>
+</thead>
+<tbody>
+<tr>
+<td><code>results</code></td>
+<td>array</td>
+<td>Array of search results</td>
+</tr>
+<tr>
+<td><code>results[].type</code></td>
+<td>string</td>
+<td>Result type: <code>"chunk"</code>, <code>"frame"</code>, or <code>"person"</code></td>
+</tr>
+<tr>
+<td><code>results[].chunk_id</code></td>
+<td>string</td>
+<td>Chunk identifier</td>
+</tr>
+<tr>
+<td><code>results[].chunk_type</code></td>
+<td>string</td>
+<td>Chunk type</td>
+</tr>
+<tr>
+<td><code>results[].file_uuid</code></td>
+<td>string</td>
+<td>File UUID</td>
+</tr>
+<tr>
+<td><code>results[].start_time</code></td>
+<td>float</td>
+<td>Start time in seconds</td>
+</tr>
+<tr>
+<td><code>results[].end_time</code></td>
+<td>float</td>
+<td>End time in seconds</td>
+</tr>
+<tr>
+<td><code>results[].text</code></td>
+<td>string</td>
+<td>Content text</td>
+</tr>
+<tr>
+<td><code>results[].score</code></td>
+<td>float</td>
+<td>Relevance score</td>
+</tr>
+<tr>
+<td><code>total</code></td>
+<td>integer</td>
+<td>Total matching results</td>
+</tr>
+<tr>
+<td><code>page</code></td>
+<td>integer</td>
+<td>Current page</td>
+</tr>
+<tr>
+<td><code>page_size</code></td>
+<td>integer</td>
+<td>Items per page</td>
+</tr>
+<tr>
+<td><code>took_ms</code></td>
+<td>integer</td>
+<td>Query execution time in milliseconds</td>
+</tr>
+</tbody>
+</table>
+<hr />
+<h3>Identity Text Search</h3>
+<p>Two paths for searching identities by text.</p>
+<h4>Path A: <code>GET /api/v1/search/identity_text</code></h4>
+<p>Search chunk text content and return associated identities (if any).</p>
+<p><strong>Auth</strong>: Required<br />
+<strong>Scope</strong>: file-level</p>
+<table class="table">
+<thead>
+<tr>
+<th>Field</th>
+<th>Type</th>
+<th>Required</th>
+<th>Description</th>
+</tr>
+</thead>
+<tbody>
+<tr>
+<td><code>file_uuid</code></td>
+<td>string</td>
+<td>Yes</td>
+<td>File UUID to search within</td>
+</tr>
+<tr>
+<td><code>q</code></td>
+<td>string</td>
+<td>Yes</td>
+<td>Text search query</td>
+</tr>
+<tr>
+<td><code>limit</code></td>
+<td>integer</td>
+<td>No</td>
+<td>Max results (default 50)</td>
+</tr>
+<tr>
+<td><code>page</code></td>
+<td>integer</td>
+<td>No</td>
+<td>Page number (default 1)</td>
+</tr>
+<tr>
+<td><code>page_size</code></td>
+<td>integer</td>
+<td>No</td>
+<td>Items per page (defaults to <code>limit</code>)</td>
+</tr>
+</tbody>
+</table>
+<div class="codehilite"><pre><span></span><code>curl<span class="w"> </span>-s<span class="w"> </span><span class="s2">&quot;</span><span class="nv">$API</span><span class="s2">/api/v1/search/identity_text?file_uuid=</span><span class="nv">$FILE_UUID</span><span class="s2">&amp;q=charade&amp;page=1&amp;page_size=5&quot;</span><span class="w"> </span><span class="se">\</span>
+<span class="w">  </span>-H<span class="w"> </span><span class="s2">&quot;X-API-Key: </span><span class="nv">$KEY</span><span class="s2">&quot;</span>
+</code></pre></div>
+
+<h5>Response</h5>
+<div class="codehilite"><pre><span></span><code><span class="p">{</span>
+<span class="w">  </span><span class="nt">&quot;success&quot;</span><span class="p">:</span><span class="w"> </span><span class="kc">true</span><span class="p">,</span>
+<span class="w">  </span><span class="nt">&quot;total&quot;</span><span class="p">:</span><span class="w"> </span><span class="mi">0</span><span class="p">,</span>
+<span class="w">  </span><span class="nt">&quot;page&quot;</span><span class="p">:</span><span class="w"> </span><span class="mi">1</span><span class="p">,</span>
+<span class="w">  </span><span class="nt">&quot;page_size&quot;</span><span class="p">:</span><span class="w"> </span><span class="mi">5</span><span class="p">,</span>
+<span class="w">  </span><span class="nt">&quot;limit&quot;</span><span class="p">:</span><span class="w"> </span><span class="mi">50</span><span class="p">,</span>
+<span class="w">  </span><span class="nt">&quot;results&quot;</span><span class="p">:</span><span class="w"> </span><span class="p">[]</span>
+<span class="p">}</span>
+</code></pre></div>
+
+<p>Each result (IdentityTextHit):</p>
+<div class="codehilite"><pre><span></span><code><span class="p">{</span>
+<span class="w">  </span><span class="nt">&quot;file_uuid&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;3a6c1865...&quot;</span><span class="p">,</span>
+<span class="w">  </span><span class="nt">&quot;chunk_id&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;sentence_0012&quot;</span><span class="p">,</span>
+<span class="w">  </span><span class="nt">&quot;start_time&quot;</span><span class="p">:</span><span class="w"> </span><span class="mf">48.8</span><span class="p">,</span>
+<span class="w">  </span><span class="nt">&quot;end_time&quot;</span><span class="p">:</span><span class="w"> </span><span class="mf">55.4</span><span class="p">,</span>
+<span class="w">  </span><span class="nt">&quot;text_content&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;charade is a classic film...&quot;</span><span class="p">,</span>
+<span class="w">  </span><span class="nt">&quot;identity_id&quot;</span><span class="p">:</span><span class="w"> </span><span class="mi">42</span><span class="p">,</span>
+<span class="w">  </span><span class="nt">&quot;identity_name&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;Cary Grant&quot;</span><span class="p">,</span>
+<span class="w">  </span><span class="nt">&quot;identity_source&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;tmdb&quot;</span><span class="p">,</span>
+<span class="w">  </span><span class="nt">&quot;trace_id&quot;</span><span class="p">:</span><span class="w"> </span><span class="mi">10</span>
+<span class="p">}</span>
+</code></pre></div>
+
+<table class="table">
+<thead>
+<tr>
+<th>Field</th>
+<th>Type</th>
+<th>Description</th>
+</tr>
+</thead>
+<tbody>
+<tr>
+<td><code>file_uuid</code></td>
+<td>string</td>
+<td>File UUID</td>
+</tr>
+<tr>
+<td><code>chunk_id</code></td>
+<td>string</td>
+<td>Chunk identifier</td>
+</tr>
+<tr>
+<td><code>start_time</code></td>
+<td>float</td>
+<td>Start time in seconds</td>
+</tr>
+<tr>
+<td><code>end_time</code></td>
+<td>float</td>
+<td>End time in seconds</td>
+</tr>
+<tr>
+<td><code>text_content</code></td>
+<td>string</td>
+<td>Chunk text content</td>
+</tr>
+<tr>
+<td><code>identity_id</code></td>
+<td>integer</td>
+<td>Identity ID (null if no identity matched)</td>
+</tr>
+<tr>
+<td><code>identity_name</code></td>
+<td>string</td>
+<td>Identity name (null if no identity matched)</td>
+</tr>
+<tr>
+<td><code>identity_source</code></td>
+<td>string</td>
+<td>Identity origin. <code>.json</code> = established from identity.json files on disk (unified format for all sources). <code>tmdb</code> = from <code>.json</code> via TMDb enrichment probe, then matched against faces. <code>auto</code> = pipeline face matching result; only stranger identities are auto-created. <code>user_defined</code> = manual. <code>merged</code> = merged identities.</td>
+</tr>
+<tr>
+<td><code>trace_id</code></td>
+<td>integer</td>
+<td>Face trace ID (null if no trace matched)</td>
+</tr>
+</tbody>
+</table>
+<h4>Path B: <code>POST /api/v1/identities/search</code></h4>
+<p>Search identity names and return associated face detection text.</p>
+<p><strong>Auth</strong>: Required<br />
+<strong>Scope</strong>: identity-level</p>
+<table class="table">
+<thead>
+<tr>
+<th>Field</th>
+<th>Type</th>
+<th>Required</th>
+<th>Description</th>
+</tr>
+</thead>
+<tbody>
+<tr>
+<td><code>q</code></td>
+<td>string</td>
+<td>Yes</td>
+<td>Identity name search</td>
+</tr>
+<tr>
+<td><code>file_uuid</code></td>
+<td>string</td>
+<td>No</td>
+<td>Restrict to specific file</td>
+</tr>
+<tr>
+<td><code>limit</code></td>
+<td>integer</td>
+<td>No</td>
+<td>Max results (default 50)</td>
+</tr>
+</tbody>
+</table>
+<div class="codehilite"><pre><span></span><code>curl<span class="w"> </span>-s<span class="w"> </span>-X<span class="w"> </span>POST<span class="w"> </span><span class="s2">&quot;</span><span class="nv">$API</span><span class="s2">/api/v1/identities/search&quot;</span><span class="w"> </span><span class="se">\</span>
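+<span class="w">  </span>-H<span class="w"> </span><span class="s2">&quot;X-API-Key: </span><span class="nv">$KEY</span><span class="s2">&quot;</span><span class="w"> </span>-H<span class="w"> </span><span class="s2">&quot;Content-Type: application/json&quot;</span><span class="w"> </span><span class="se">\</span>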
+<span class="w">  </span>-d<span class="w"> </span><span class="s1">&#39;{&quot;q&quot;: &quot;Cary Grant&quot;}&#39;</span>
+</code></pre></div>
+
+<hr />
+<h3>Visual Chunk Search</h3>
+<p>Search video frames by visual content (object detection results).</p>
+<table class="table">
+<thead>
+<tr>
+<th>Method</th>
+<th>Endpoint</th>
+<th>Description</th>
+</tr>
+</thead>
+<tbody>
+<tr>
+<td>POST</td>
+<td><code>/api/v1/search/visual</code></td>
+<td>Search visual chunks by criteria (object classes, density)</td>
+</tr>
+<tr>
+<td>POST</td>
+<td><code>/api/v1/search/visual/class</code></td>
+<td>Search by specific object class</td>
+</tr>
+<tr>
+<td>POST</td>
+<td><code>/api/v1/search/visual/density</code></td>
+<td>Search by spatial density range</td>
+</tr>
+<tr>
+<td>POST</td>
+<td><code>/api/v1/search/visual/stats</code></td>
+<td>Get visual detection statistics</td>
+</tr>
+<tr>
+<td>POST</td>
+<td><code>/api/v1/search/visual/combination</code></td>
+<td>Search by object class combination</td>
+</tr>
+</tbody>
+</table>
+<h4>Request Parameters (Visual Search)</h4>
+<table class="table">
+<thead>
+<tr>
+<th>Field</th>
+<th>Type</th>
+<th>Required</th>
+<th>Description</th>
+</tr>
+</thead>
+<tbody>
+<tr>
+<td><code>file_uuid</code></td>
+<td>string</td>
+<td>Yes</td>
+<td>File UUID</td>
+</tr>
+<tr>
+<td><code>criteria.required_classes</code></td>
+<td>string[]</td>
+<td>No</td>
+<td>Required object classes (e.g., <code>["person", "car"]</code>)</td>
+</tr>
+<tr>
+<td><code>criteria.min_confidence</code></td>
+<td>float</td>
+<td>No</td>
+<td>Minimum confidence threshold</td>
+</tr>
+<tr>
+<td><code>criteria.min_spatial_density</code></td>
+<td>float</td>
+<td>No</td>
+<td>Minimum spatial density</td>
+</tr>
+<tr>
+<td><code>criteria.max_spatial_density</code></td>
+<td>float</td>
+<td>No</td>
+<td>Maximum spatial density</td>
+</tr>
+</tbody>
+</table>
+<h4>Example</h4>
+<div class="codehilite"><pre><span></span><code>curl<span class="w"> </span>-s<span class="w"> </span>-X<span class="w"> </span>POST<span class="w"> </span><span class="s2">&quot;</span><span class="nv">$API</span><span class="s2">/api/v1/search/visual&quot;</span><span class="w"> </span><span class="se">\</span>
+<span class="w">  </span>-H<span class="w"> </span><span class="s2">&quot;X-API-Key: </span><span class="nv">$KEY</span><span class="s2">&quot;</span><span class="w"> </span><span class="se">\</span>
+<span class="w">  </span>-H<span class="w"> </span><span class="s2">&quot;Content-Type: application/json&quot;</span><span class="w"> </span><span class="se">\</span>
+<span class="w">  </span>-d<span class="w"> </span><span class="s1">&#39;{&quot;file_uuid&quot;: &quot;&#39;</span><span class="s2">&quot;</span><span class="nv">$FILE_UUID</span><span class="s2">&quot;</span><span class="s1">&#39;&quot;, &quot;criteria&quot;: {&quot;required_classes&quot;: [&quot;person&quot;, &quot;car&quot;]}}&#39;</span>
+</code></pre></div>
+
+<h4>Response</h4>
+<div class="codehilite"><pre><span></span><code><span class="p">{</span>
+<span class="w">  </span><span class="nt">&quot;chunks&quot;</span><span class="p">:</span><span class="w"> </span><span class="p">[</span>
+<span class="w">    </span><span class="p">{</span>
+<span class="w">      </span><span class="nt">&quot;file_uuid&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;3a6c1865...&quot;</span><span class="p">,</span>
+<span class="w">      </span><span class="nt">&quot;chunk_id&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;visual_001&quot;</span><span class="p">,</span>
+<span class="w">      </span><span class="nt">&quot;chunk_type&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;visual&quot;</span><span class="p">,</span>
+<span class="w">      </span><span class="nt">&quot;detections&quot;</span><span class="p">:</span><span class="w"> </span><span class="p">[</span>
+<span class="w">        </span><span class="p">{</span><span class="nt">&quot;class&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;person&quot;</span><span class="p">,</span><span class="w"> </span><span class="nt">&quot;confidence&quot;</span><span class="p">:</span><span class="w"> </span><span class="mf">0.95</span><span class="p">,</span><span class="w"> </span><span class="nt">&quot;bbox&quot;</span><span class="p">:</span><span class="w"> </span><span class="p">[</span><span class="mi">100</span><span class="p">,</span><span class="w"> </span><span class="mi">200</span><span class="p">,</span><span class="w"> </span><span class="mi">150</span><span class="p">,</span><span class="w"> </span><span class="mi">350</span><span class="p">]}</span>
+<span class="w">      </span><span class="p">],</span>
+<span class="w">      </span><span class="nt">&quot;start_time&quot;</span><span class="p">:</span><span class="w"> </span><span class="mf">120.5</span><span class="p">,</span>
+<span class="w">      </span><span class="nt">&quot;end_time&quot;</span><span class="p">:</span><span class="w"> </span><span class="mf">125.3</span>
+<span class="w">    </span><span class="p">}</span>
+<span class="w">  </span><span class="p">],</span>
+<span class="w">  </span><span class="nt">&quot;total&quot;</span><span class="p">:</span><span class="w"> </span><span class="mi">42</span>
+<span class="p">}</span>
+</code></pre></div>
+
+<table class="table">
+<thead>
+<tr>
+<th>Field</th>
+<th>Type</th>
+<th>Description</th>
+</tr>
+</thead>
+<tbody>
+<tr>
+<td><code>chunks</code></td>
+<td>array</td>
+<td>Array of matching visual chunks</td>
+</tr>
+<tr>
+<td><code>chunks[].file_uuid</code></td>
+<td>string</td>
+<td>File UUID</td>
+</tr>
+<tr>
+<td><code>chunks[].chunk_id</code></td>
+<td>string</td>
+<td>Chunk identifier</td>
+</tr>
+<tr>
+<td><code>chunks[].detections</code></td>
+<td>array</td>
+<td>Object detections in this chunk</td>
+</tr>
+<tr>
+<td><code>total</code></td>
+<td>integer</td>
+<td>Total matching chunks</td>
+</tr>
+</tbody>
+</table>
+<hr />
+</div>
+</body>
+</html>
\ No newline at end of file
diff --git a/docs_v1.0/doc_user/Demo_EndToEnd.html b/docs_v1.0/doc_user/Demo_EndToEnd.html
new file mode 100644
index 0000000..527ce46
--- /dev/null
+++ b/docs_v1.0/doc_user/Demo_EndToEnd.html
@@ -0,0 +1,1084 @@
+<!DOCTYPE html>
+<html lang="en">
+<head>
+<meta charset="UTF-8">
+<title>Demo End-to-End - Momentry API Docs</title>
+<style>
+* { margin: 0; padding: 0; box-sizing: border-box; }
+body { font-family: -apple-system, BlinkMacSystemFont, 'Segoe UI', Roboto, sans-serif; background: #f5f5f5; color: #333; padding: 40px; }
+.container { max-width: 960px; margin: 0 auto; background: white; border-radius: 12px; box-shadow: 0 2px 12px rgba(0,0,0,0.08); padding: 40px; }
+h1 { font-size: 24px; margin: 24px 0 12px; }
+h2 { font-size: 20px; margin: 20px 0 10px; color: #222; }
+h3 { font-size: 16px; margin: 16px 0 8px; color: #444; }
+p { line-height: 1.6; margin: 8px 0; }
+table { border-collapse: collapse; width: 100%; margin: 12px 0; font-size: 14px; }
+th, td { border: 1px solid #ddd; padding: 8px 12px; text-align: left; }
+th { background: #f0f0f0; font-weight: 600; }
+code { background: #f0f0f0; padding: 2px 6px; border-radius: 3px; font-size: 13px; }
+pre { background: #f8f8f8; border: 1px solid #ddd; border-radius: 6px; padding: 12px; overflow-x: auto; margin: 12px 0; }
+pre code { background: none; padding: 0; }
+a { color: #0066cc; }
+.back { display: inline-block; margin-bottom: 20px; color: #666; }
+.back:hover { color: #333; }
+</style>
+</head>
+<body>
+<div class="container">
+<a class="back" href="index.html">&larr; Back to index</a>
+<hr />
+<pre><code>document_type: "demo_guide"
+service: "MOMENTRY_CORE"
+title: "Pipeline Demo End-to-End"
+date: "2026-05-15"
+version: "V1.0"
+status: "active"
+owner: "M5"
+created_by: "OpenCode"
+tags:
+  - "demo"
+  - "pipeline"
+  - "end-to-end"
+  - "api"
+ai_query_hints:
+  - "如何執行端到端 Pipeline demo"
+  - "Pipeline 處理流程"
+  - "註冊影片並觸發處理的完整流程"
+related_documents:
+  - "GUIDES/API_ENDPOINTS.md"
+  - "GUIDES/Pipeline_API_Demo.md"</code></pre>
+<hr />
+<h1>Momentry Core — Pipeline Demo End-to-End</h1>
+<table class="table">
+<thead>
+<tr>
+<th>項目</th>
+<th>內容</th>
+</tr>
+</thead>
+<tbody>
+<tr>
+<td>建立者</td>
+<td>OpenCode</td>
+</tr>
+<tr>
+<td>建立時間</td>
+<td>2026-05-15</td>
+</tr>
+<tr>
+<td>文件版本</td>
+<td>V1.0</td>
+</tr>
+<tr>
+<td>目標讀者</td>
+<td>developer</td>
+</tr>
+<tr>
+<td>預備知識</td>
+<td>需有 API Key、Pipeline 基本概念</td>
+</tr>
+</tbody>
+</table>
+<hr />
+<h2>Table of Contents</h2>
+<h3>Pipeline Phases</h3>
+<table class="table">
+<thead>
+<tr>
+<th>Phase</th>
+<th>Step</th>
+<th>What happens</th>
+</tr>
+</thead>
+<tbody>
+<tr>
+<td><strong>Pre</strong></td>
+<td>1–4</td>
+<td>System check, scan, register, probe</td>
+</tr>
+<tr>
+<td><strong>處理中</strong></td>
+<td>5–6</td>
+<td>Submit job → Worker picks up → Each processor runs (pending→running→completed)</td>
+</tr>
+<tr>
+<td><strong>處理後</strong></td>
+<td>7–9</td>
+<td>All results → Search → Identities → Schema verification</td>
+</tr>
+</tbody>
+</table>
+<hr />
+<h2>1. 檢查系統狀況</h2>
+<div class="codehilite"><pre><span></span><code><span class="nv">API</span><span class="o">=</span><span class="s2">&quot;http://m5api.momentry.ddns.net&quot;</span>
+<span class="nv">KEY</span><span class="o">=</span><span class="s2">&quot;YOUR_API_KEY&quot;</span>
+
+<span class="c1"># Basic health</span>
+curl<span class="w"> </span>-sf<span class="w"> </span><span class="s2">&quot;</span><span class="nv">$API</span><span class="s2">/health&quot;</span><span class="w"> </span><span class="p">|</span><span class="w"> </span>jq<span class="w"> </span><span class="s1">&#39;{status, version, build_git_hash, uptime_ms}&#39;</span>
+
+<span class="c1"># Detailed health</span>
+curl<span class="w"> </span>-sf<span class="w"> </span><span class="s2">&quot;</span><span class="nv">$API</span><span class="s2">/health/detailed&quot;</span><span class="w"> </span><span class="p">|</span><span class="w"> </span>jq<span class="w"> </span><span class="s1">&#39;{</span>
+<span class="s1">  services, </span>
+<span class="s1">  schema: .schema.ok, </span>
+<span class="s1">  scripts: .pipeline.scripts_count, </span>
+<span class="s1">  integrity: .pipeline.scripts_integrity,</span>
+<span class="s1">  procs: [.pipeline.processors | to_entries[] | select(.value == true and .key != &quot;total_py_files&quot;) | .key]</span>
+<span class="s1">}&#39;</span>
+</code></pre></div>
+
+<p>Output:</p>
+<div class="codehilite"><pre><span></span><code><span class="p">{</span>
+<span class="w">  </span><span class="nt">&quot;status&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;ok&quot;</span><span class="p">,</span>
+<span class="w">  </span><span class="nt">&quot;version&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;1.0.0&quot;</span><span class="p">,</span>
+<span class="w">  </span><span class="nt">&quot;build_git_hash&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;c41f7e0c&quot;</span><span class="p">,</span>
+<span class="w">  </span><span class="nt">&quot;uptime_ms&quot;</span><span class="p">:</span><span class="w"> </span><span class="mi">2756192</span>
+<span class="p">}</span>
+<span class="p">{</span>
+<span class="w">  </span><span class="nt">&quot;services&quot;</span><span class="p">:</span><span class="w"> </span><span class="p">{</span><span class="nt">&quot;postgres&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;ok&quot;</span><span class="p">,</span><span class="w"> </span><span class="nt">&quot;redis&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;ok&quot;</span><span class="p">,</span><span class="w"> </span><span class="nt">&quot;qdrant&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;ok&quot;</span><span class="p">},</span>
+<span class="w">  </span><span class="nt">&quot;schema&quot;</span><span class="p">:</span><span class="w"> </span><span class="kc">false</span><span class="p">,</span>
+<span class="w">  </span><span class="nt">&quot;scripts&quot;</span><span class="p">:</span><span class="w"> </span><span class="mi">291</span><span class="p">,</span>
+<span class="w">  </span><span class="nt">&quot;integrity&quot;</span><span class="p">:</span><span class="w"> </span><span class="p">{</span><span class="nt">&quot;matched&quot;</span><span class="p">:</span><span class="w"> </span><span class="mi">332</span><span class="p">,</span><span class="w"> </span><span class="nt">&quot;total&quot;</span><span class="p">:</span><span class="w"> </span><span class="mi">345</span><span class="p">,</span><span class="w"> </span><span class="nt">&quot;ok&quot;</span><span class="p">:</span><span class="w"> </span><span class="kc">false</span><span class="p">},</span>
+<span class="w">  </span><span class="nt">&quot;procs&quot;</span><span class="p">:</span><span class="w"> </span><span class="p">[</span><span class="s2">&quot;asr&quot;</span><span class="p">,</span><span class="s2">&quot;yolo&quot;</span><span class="p">,</span><span class="s2">&quot;face&quot;</span><span class="p">,</span><span class="s2">&quot;pose&quot;</span><span class="p">,</span><span class="s2">&quot;ocr&quot;</span><span class="p">,</span><span class="s2">&quot;cut&quot;</span><span class="p">,</span><span class="s2">&quot;caption&quot;</span><span class="p">,</span><span class="s2">&quot;scene&quot;</span><span class="p">,</span><span class="s2">&quot;story&quot;</span><span class="p">,</span><span class="s2">&quot;asrx&quot;</span><span class="p">,</span><span class="s2">&quot;probe&quot;</span><span class="p">,</span><span class="s2">&quot;visual_chunk&quot;</span><span class="p">]</span>
+<span class="p">}</span>
+</code></pre></div>
+
+<hr />
+<h2>2. 掃描檔案</h2>
+<p>掃描伺服器上所有與 <code>exasan</code> 相關的檔案（支援正規表達式）：</p>
+<div class="codehilite"><pre><span></span><code>curl<span class="w"> </span>-sf<span class="w"> </span>-H<span class="w"> </span><span class="s2">&quot;X-API-Key: </span><span class="nv">$KEY</span><span class="s2">&quot;</span><span class="w"> </span><span class="s2">&quot;</span><span class="nv">$API</span><span class="s2">/api/v1/files/scan?pattern=exasan&quot;</span><span class="w"> </span><span class="p">|</span><span class="w"> </span><span class="se">\</span>
+<span class="w">  </span>jq<span class="w"> </span><span class="s1">&#39;[.files[] | {uuid: .file_uuid, name: .file_name, size: .file_size}]&#39;</span>
+</code></pre></div>
+
+<p>輸出（節錄）：</p>
+<div class="codehilite"><pre><span></span><code><span class="p">[</span>
+<span class="w">  </span><span class="p">{</span><span class="nt">&quot;uuid&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;dd61fda85fee441f...&quot;</span><span class="p">,</span><span class="w"> </span><span class="nt">&quot;name&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;ExaSAN PCIe series - Director Ou Yu-Zhi Shares His Experience.mp4&quot;</span><span class="p">,</span><span class="w"> </span><span class="nt">&quot;size&quot;</span><span class="p">:</span><span class="w"> </span><span class="mi">6827600</span><span class="p">},</span>
+<span class="w">  </span><span class="p">{</span><span class="nt">&quot;uuid&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;8e2e98c49355935f...&quot;</span><span class="p">,</span><span class="w"> </span><span class="nt">&quot;name&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;ExaSAN Webinar by Blake Jones, Vision2see.mp4&quot;</span><span class="p">,</span><span class="w"> </span><span class="nt">&quot;size&quot;</span><span class="p">:</span><span class="w"> </span><span class="mi">38635889</span><span class="p">},</span>
+<span class="w">  </span><span class="p">{</span><span class="nt">&quot;uuid&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;477d8fa7bc0e1a7...&quot;</span><span class="p">,</span><span class="w"> </span><span class="nt">&quot;name&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;Thunderbolt ExaSAN at CCBN.mp4&quot;</span><span class="p">,</span><span class="w"> </span><span class="nt">&quot;size&quot;</span><span class="p">:</span><span class="w"> </span><span class="mi">13126748</span><span class="p">}</span>
+<span class="p">]</span>
+</code></pre></div>
+
+<p><strong>Note</strong>: <code>files/scan</code> 也可以掃所有檔案，或用於批次註冊。若不指定 pattern，回傳伺服器 <code>sftpgo/data/demo/</code> 目錄下所有檔案。</p>
+<hr />
+<h2>3. 註冊或確認</h2>
+<p>若檔案尚未註冊，使用 register API。若已存在（如本次示範），直接確認狀態：</p>
+<div class="codehilite"><pre><span></span><code><span class="nv">UUID</span><span class="o">=</span><span class="s2">&quot;dd61fda85fee441fdd00ab5528213ff7&quot;</span>
+
+<span class="c1"># 確認檔案狀態</span>
+curl<span class="w"> </span>-sf<span class="w"> </span>-H<span class="w"> </span><span class="s2">&quot;X-API-Key: </span><span class="nv">$KEY</span><span class="s2">&quot;</span><span class="w"> </span><span class="s2">&quot;</span><span class="nv">$API</span><span class="s2">/api/v1/file/</span><span class="si">${</span><span class="nv">UUID</span><span class="si">}</span><span class="s2">&quot;</span><span class="w"> </span><span class="p">|</span><span class="w"> </span>jq<span class="w"> </span><span class="s1">&#39;{uuid: .file_uuid[0:16], name: .file_name, status, duration, fps}&#39;</span>
+
+<span class="c1"># 若檔案不存在，使用註冊 API：</span>
+<span class="c1"># curl -sf -X POST -H &quot;X-API-Key: $KEY&quot; -H &quot;Content-Type: application/json&quot; \</span>
+<span class="c1">#   -d &#39;{&quot;file_path&quot;: &quot;/path/to/video.mp4&quot;}&#39; \</span>
+<span class="c1">#   &quot;$API/api/v1/files/register&quot; | jq &#39;.&#39;</span>
+</code></pre></div>
+
+<p><strong>註冊流程</strong>：</p>
+<div class="codehilite"><pre><span></span><code><span class="n">POST</span><span class="w"> </span><span class="o">/</span><span class="n">files</span><span class="o">/</span><span class="n">register</span>
+<span class="w">  </span><span class="err">├─</span><span class="w"> </span><span class="n">SHA256</span><span class="w"> </span><span class="n">content_hash</span><span class="w"> </span><span class="p">(</span><span class="n">dedup</span><span class="w"> </span><span class="err">檢查</span><span class="p">)</span>
+<span class="w">  </span><span class="err">├─</span><span class="w"> </span><span class="n">file_name</span><span class="w"> </span><span class="err">衝突檢查</span><span class="w"> </span><span class="p">(</span><span class="err">自動</span><span class="w"> </span><span class="n">rename</span><span class="p">)</span>
+<span class="w">  </span><span class="err">├─</span><span class="w"> </span><span class="n">Pre</span><span class="o">-</span><span class="n">process</span><span class="w"> </span><span class="p">(</span><span class="n">SHA256</span><span class="w"> </span><span class="o">+</span><span class="w"> </span><span class="n">ffprobe</span><span class="w"> </span><span class="o">+</span><span class="w"> </span><span class="n">UUID</span><span class="w"> </span><span class="err">→</span><span class="w"> </span><span class="p">.</span><span class="n">pre</span><span class="p">.</span><span class="n">json</span><span class="p">)</span>
+<span class="w">  </span><span class="err">├─</span><span class="w"> </span><span class="n">UUID</span><span class="w"> </span><span class="o">=</span><span class="w"> </span><span class="n">f</span><span class="p">(</span><span class="n">mac</span><span class="p">,</span><span class="w"> </span><span class="n">mtime</span><span class="p">,</span><span class="w"> </span><span class="n">path</span><span class="p">,</span><span class="w"> </span><span class="n">filename</span><span class="p">)</span>
+<span class="w">  </span><span class="err">├─</span><span class="w"> </span><span class="n">Unified</span><span class="w"> </span><span class="n">probe</span><span class="w"> </span><span class="p">(</span><span class="n">video</span><span class="err">→</span><span class="n">ffprobe</span><span class="p">,</span><span class="w"> </span><span class="n">doc</span><span class="err">→</span><span class="n">Python</span><span class="p">)</span>
+<span class="w">  </span><span class="err">└─</span><span class="w"> </span><span class="n">INSERT</span><span class="w"> </span><span class="n">INTO</span><span class="w"> </span><span class="n">videos</span>
+</code></pre></div>
+
+<hr />
+<h2>4. Probe 確認</h2>
+<p>The probe endpoint returns ffprobe metadata about the registered file.</p>
+<div class="codehilite"><pre><span></span><code><span class="c1"># Substitute the actual file_uuid from step 3</span>
+<span class="nv">FILE_UUID</span><span class="o">=</span><span class="s2">&quot;e1111111111111111111111111111111&quot;</span>
+
+curl<span class="w"> </span>-s<span class="w"> </span>-H<span class="w"> </span><span class="s2">&quot;X-API-Key: </span><span class="nv">$KEY</span><span class="s2">&quot;</span><span class="w"> </span><span class="se">\</span>
+<span class="w">    </span><span class="s2">&quot;http://m5api.momentry.ddns.net/api/v1/file/</span><span class="si">${</span><span class="nv">FILE_UUID</span><span class="si">}</span><span class="s2">/probe&quot;</span><span class="w"> </span><span class="p">|</span><span class="w"> </span>python3<span class="w"> </span>-m<span class="w"> </span>json.tool
+</code></pre></div>
+
+<p>Output (abbreviated):</p>
+<div class="codehilite"><pre><span></span><code><span class="p">{</span>
+<span class="w">    </span><span class="nt">&quot;file_uuid&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;e1111111111111111111111111111111&quot;</span><span class="p">,</span>
+<span class="w">    </span><span class="nt">&quot;file_name&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;demo_test_video.mp4&quot;</span><span class="p">,</span>
+<span class="w">    </span><span class="nt">&quot;duration&quot;</span><span class="p">:</span><span class="w"> </span><span class="mf">5.005</span><span class="p">,</span>
+<span class="w">    </span><span class="nt">&quot;width&quot;</span><span class="p">:</span><span class="w"> </span><span class="mi">640</span><span class="p">,</span>
+<span class="w">    </span><span class="nt">&quot;height&quot;</span><span class="p">:</span><span class="w"> </span><span class="mi">480</span><span class="p">,</span>
+<span class="w">    </span><span class="nt">&quot;fps&quot;</span><span class="p">:</span><span class="w"> </span><span class="mf">24.0</span><span class="p">,</span>
+<span class="w">    </span><span class="nt">&quot;total_frames&quot;</span><span class="p">:</span><span class="w"> </span><span class="mi">120</span><span class="p">,</span>
+<span class="w">    </span><span class="nt">&quot;cached&quot;</span><span class="p">:</span><span class="w"> </span><span class="kc">true</span><span class="p">,</span>
+<span class="w">    </span><span class="nt">&quot;format&quot;</span><span class="p">:</span><span class="w"> </span><span class="p">{</span>
+<span class="w">        </span><span class="nt">&quot;filename&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;/tmp/demo_test_video.mp4&quot;</span><span class="p">,</span>
+<span class="w">        </span><span class="nt">&quot;format_name&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;mov,mp4,m4a,3gp,3g2,mj2&quot;</span><span class="p">,</span>
+<span class="w">        </span><span class="nt">&quot;duration&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;5.005000&quot;</span><span class="p">,</span>
+<span class="w">        </span><span class="nt">&quot;size&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;98304&quot;</span><span class="p">,</span>
+<span class="w">        </span><span class="nt">&quot;bit_rate&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;157184&quot;</span>
+<span class="w">    </span><span class="p">},</span>
+<span class="w">    </span><span class="nt">&quot;streams&quot;</span><span class="p">:</span><span class="w"> </span><span class="p">[</span>
+<span class="w">        </span><span class="p">{</span><span class="nt">&quot;index&quot;</span><span class="p">:</span><span class="w"> </span><span class="mi">0</span><span class="p">,</span><span class="w"> </span><span class="nt">&quot;codec_type&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;video&quot;</span><span class="p">,</span><span class="w"> </span><span class="nt">&quot;codec_name&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;h264&quot;</span><span class="p">,</span><span class="w"> </span><span class="nt">&quot;width&quot;</span><span class="p">:</span><span class="w"> </span><span class="mi">640</span><span class="p">,</span><span class="w"> </span><span class="nt">&quot;height&quot;</span><span class="p">:</span><span class="w"> </span><span class="mi">480</span><span class="p">,</span><span class="w"> </span><span class="err">...</span><span class="p">},</span>
+<span class="w">        </span><span class="p">{</span><span class="nt">&quot;index&quot;</span><span class="p">:</span><span class="w"> </span><span class="mi">1</span><span class="p">,</span><span class="w"> </span><span class="nt">&quot;codec_type&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;audio&quot;</span><span class="p">,</span><span class="w"> </span><span class="nt">&quot;codec_name&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;aac&quot;</span><span class="p">,</span><span class="w"> </span><span class="err">...</span><span class="p">}</span>
+<span class="w">    </span><span class="p">]</span>
+<span class="p">}</span>
+</code></pre></div>
+
+<p><strong>Error handling</strong> (Bug #3 fix):</p><ul>
+<li>Non-existent UUID → <code>{"error":"Video not found"}</code> + HTTP 404</li>
+<li>File deleted from disk → <code>{"error":"File does not exist at registered path"}</code> + HTTP 404</li>
+<li>ffprobe failure → <code>{"error":"ffprobe failed: ..."}</code> + HTTP 500</li></ul>
+<h3>⚡ Intermediate Check — Bug #3: Probe Error Verification</h3>
+<p>Verify that both error cases return a proper JSON body and HTTP status code instead of a bare 500:</p>
+<div class="codehilite"><pre><span></span><code><span class="nb">echo</span><span class="w"> </span><span class="s2">&quot;=== Non-existent UUID → expect 404 ===&quot;</span>
+curl<span class="w"> </span>-s<span class="w"> </span>-w<span class="w"> </span><span class="s2">&quot;\nHTTP: %{http_code}\n&quot;</span><span class="w"> </span>-H<span class="w"> </span><span class="s2">&quot;X-API-Key: </span><span class="nv">$KEY</span><span class="s2">&quot;</span><span class="w"> </span><span class="se">\</span>
+<span class="w">    </span><span class="s2">&quot;http://m5api.momentry.ddns.net/api/v1/file/bad_uuid_12345/probe&quot;</span>
+<span class="c1"># Expect: {&quot;error&quot;:&quot;Video not found&quot;,&quot;file_uuid&quot;:&quot;bad_uuid_12345&quot;}  HTTP 404</span>
+
+<span class="nb">echo</span><span class="w"> </span><span class="s2">&quot;&quot;</span>
+<span class="nb">echo</span><span class="w"> </span><span class="s2">&quot;=== Non-existent file path → expect 404 ===&quot;</span>
+<span class="c1"># Temporarily change file_path to a non-existent location</span>
+<span class="s2">&quot;</span><span class="nv">$PG_BIN</span><span class="s2">/psql&quot;</span><span class="w"> </span>-U<span class="w"> </span>accusys<span class="w"> </span>-d<span class="w"> </span>momentry<span class="w"> </span>-c<span class="w"> </span><span class="se">\</span>
+<span class="w">    </span><span class="s2">&quot;UPDATE dev.videos SET file_path = &#39;/tmp/NONEXISTENT_FILE&#39; WHERE file_uuid = &#39;</span><span class="si">${</span><span class="nv">FILE_UUID</span><span class="si">}</span><span class="s2">&#39;&quot;</span>
+curl<span class="w"> </span>-s<span class="w"> </span>-w<span class="w"> </span><span class="s2">&quot;\nHTTP: %{http_code}\n&quot;</span><span class="w"> </span>-H<span class="w"> </span><span class="s2">&quot;X-API-Key: muser_68600856036340bcafc01930eb4bd839_1774418104_97221b69&quot;</span><span class="w"> </span><span class="se">\</span>
+<span class="w">    </span><span class="s2">&quot;http://m5api.momentry.ddns.net/api/v1/file/</span><span class="si">${</span><span class="nv">FILE_UUID</span><span class="si">}</span><span class="s2">/probe&quot;</span>
+<span class="c1"># Expect: {&quot;error&quot;:&quot;File does not exist at registered path&quot;,...}  HTTP 404</span>
+<span class="c1"># Restore path</span>
+<span class="s2">&quot;</span><span class="nv">$PG_BIN</span><span class="s2">/psql&quot;</span><span class="w"> </span>-U<span class="w"> </span>accusys<span class="w"> </span>-d<span class="w"> </span>momentry<span class="w"> </span>-c<span class="w"> </span><span class="se">\</span>
+<span class="w">    </span><span class="s2">&quot;UPDATE dev.videos SET file_path = &#39;/tmp/demo_test_video.mp4&#39; WHERE file_uuid = &#39;</span><span class="si">${</span><span class="nv">FILE_UUID</span><span class="si">}</span><span class="s2">&#39;&quot;</span>
+</code></pre></div>
+
+<p>Output:</p>
+<div class="codehilite"><pre><span></span><code><span class="o">===</span><span class="w"> </span><span class="n">Non</span><span class="o">-</span><span class="n">existent</span><span class="w"> </span><span class="n">UUID</span><span class="w"> </span><span class="err">→</span><span class="w"> </span><span class="n">expect</span><span class="w"> </span><span class="mh">404</span><span class="w"> </span><span class="o">===</span>
+<span class="p">{</span><span class="s">&quot;error&quot;</span><span class="o">:</span><span class="s">&quot;Video not found&quot;</span><span class="p">,</span><span class="s">&quot;file_uuid&quot;</span><span class="o">:</span><span class="s">&quot;bad_uuid_12345&quot;</span><span class="p">}</span>
+<span class="nl">HTTP:</span><span class="w"> </span><span class="mh">404</span>
+
+<span class="o">===</span><span class="w"> </span><span class="n">Non</span><span class="o">-</span><span class="n">existent</span><span class="w"> </span><span class="n">file</span><span class="w"> </span><span class="n">path</span><span class="w"> </span><span class="err">→</span><span class="w"> </span><span class="n">expect</span><span class="w"> </span><span class="mh">404</span><span class="w"> </span><span class="o">===</span>
+<span class="p">{</span><span class="s">&quot;error&quot;</span><span class="o">:</span><span class="s">&quot;File does not exist at registered path&quot;</span><span class="p">,</span><span class="s">&quot;file_uuid&quot;</span><span class="o">:</span><span class="s">&quot;e1111111111111111111111111111111&quot;</span><span class="p">,</span><span class="s">&quot;file_path&quot;</span><span class="o">:</span><span class="s">&quot;/tmp/NONEXISTENT_FILE&quot;</span><span class="p">}</span>
+<span class="nl">HTTP:</span><span class="w"> </span><span class="mh">404</span>
+</code></pre></div>
+
+<hr />
+<h2>5. Process Video</h2>
+<p>Trigger pipeline processing for specific processors. The available processors are:</p>
+<table class="table">
+<thead>
+<tr>
+<th>Processor</th>
+<th>Function</th>
+<th>Script</th>
+</tr>
+</thead>
+<tbody>
+<tr>
+<td><code>asr</code></td>
+<td>Speech-to-text (faster-whisper)</td>
+<td><code>asr_processor.py</code></td>
+</tr>
+<tr>
+<td><code>cut</code></td>
+<td>Scene detection (PySceneDetect)</td>
+<td><code>cut_processor.py</code></td>
+</tr>
+<tr>
+<td><code>yolo</code></td>
+<td>Object detection (YOLOv8)</td>
+<td><code>yolo_processor.py</code></td>
+</tr>
+<tr>
+<td><code>face</code></td>
+<td>Face detection (InsightFace)</td>
+<td><code>face_processor.py</code></td>
+</tr>
+<tr>
+<td><code>pose</code></td>
+<td>Pose estimation (MediaPipe)</td>
+<td><code>pose_processor.py</code></td>
+</tr>
+<tr>
+<td><code>ocr</code></td>
+<td>Text detection (PaddleOCR)</td>
+<td><code>ocr_processor.py</code></td>
+</tr>
+<tr>
+<td><code>asrx</code></td>
+<td>Speaker diarization</td>
+<td><code>asrx_processor.py</code></td>
+</tr>
+<tr>
+<td><code>visual_chunk</code></td>
+<td>Visual content analysis</td>
+<td><code>visual_chunk_processor.py</code></td>
+</tr>
+<tr>
+<td><code>scene</code></td>
+<td>Scene classification</td>
+<td><code>scene_classifier.py</code></td>
+</tr>
+<tr>
+<td><code>story</code></td>
+<td>Story generation (LLM)</td>
+<td><code>story_processor.py</code></td>
+</tr>
+<tr>
+<td><code>caption</code></td>
+<td>Caption generation</td>
+<td><code>caption_processor.py</code></td>
+</tr>
+</tbody>
+</table>
+<div class="codehilite"><pre><span></span><code><span class="c1"># Trigger only ASR + CUT for quick test</span>
+curl<span class="w"> </span>-s<span class="w"> </span>-X<span class="w"> </span>POST<span class="w"> </span><span class="s2">&quot;http://m5api.momentry.ddns.net/api/v1/file/</span><span class="si">${</span><span class="nv">FILE_UUID</span><span class="si">}</span><span class="s2">/process&quot;</span><span class="w"> </span><span class="se">\</span>
+<span class="w">    </span>-H<span class="w"> </span><span class="s2">&quot;X-API-Key: muser_68600856036340bcafc01930eb4bd839_1774418104_97221b69&quot;</span><span class="w"> </span><span class="se">\</span>
+<span class="w">    </span>-H<span class="w"> </span><span class="s2">&quot;Content-Type: application/json&quot;</span><span class="w"> </span><span class="se">\</span>
+<span class="w">    </span>-d<span class="w"> </span><span class="s1">&#39;{&quot;processors&quot;: [&quot;asr&quot;, &quot;cut&quot;]}&#39;</span><span class="w"> </span><span class="p">|</span><span class="w"> </span>python3<span class="w"> </span>-m<span class="w"> </span>json.tool
+</code></pre></div>
+
+<p>Output:</p>
+<div class="codehilite"><pre><span></span><code><span class="p">{</span>
+<span class="w">    </span><span class="nt">&quot;job_id&quot;</span><span class="p">:</span><span class="w"> </span><span class="mi">161</span><span class="p">,</span>
+<span class="w">    </span><span class="nt">&quot;file_uuid&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;e1111111111111111111111111111111&quot;</span><span class="p">,</span>
+<span class="w">    </span><span class="nt">&quot;status&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;PENDING&quot;</span><span class="p">,</span>
+<span class="w">    </span><span class="nt">&quot;pids&quot;</span><span class="p">:</span><span class="w"> </span><span class="p">[],</span>
+<span class="w">    </span><span class="nt">&quot;message&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;Processing triggered for demo_test_video.mp4&quot;</span>
+<span class="p">}</span>
+</code></pre></div>
+
+<p><strong>Processing flow</strong>:</p>
+<div class="codehilite"><pre><span></span><code><span class="n">POST</span> <span class="o">/</span><span class="n">process</span> <span class="err">→</span> <span class="n">trigger_processing</span><span class="p">()</span>
+  <span class="err">├─</span> <span class="n">Validate</span> <span class="n">file</span> <span class="n">exists</span> <span class="p">(</span><span class="n">DB</span> <span class="n">lookup</span><span class="p">)</span>
+  <span class="err">├─</span> <span class="n">Create</span> <span class="n">monitor_job</span> <span class="p">(</span><span class="n">status</span><span class="p">:</span> <span class="n">PENDING</span><span class="p">)</span>
+  <span class="err">├─</span> <span class="n">Create</span> <span class="n">processor_result</span> <span class="n">rows</span> <span class="n">for</span> <span class="n">each</span> <span class="n">requested</span> <span class="n">processor</span> <span class="p">(</span><span class="n">status</span><span class="p">:</span> <span class="n">pending</span><span class="p">)</span>
+  <span class="err">└─</span> <span class="n">Response</span> <span class="p">{</span> <span class="n">job_id</span><span class="p">,</span> <span class="n">status</span><span class="p">:</span> <span class="s">&quot;PENDING&quot;</span> <span class="p">}</span>
+</code></pre></div>
+
+<p><strong>Note</strong>: If no processors are specified, the following default set of processors is used:</p>
+<div class="codehilite"><pre><span></span><code><span class="p">{</span><span class="nt">&quot;processors&quot;</span><span class="p">:</span><span class="w"> </span><span class="p">[</span><span class="s2">&quot;asr&quot;</span><span class="p">,</span><span class="w"> </span><span class="s2">&quot;cut&quot;</span><span class="p">,</span><span class="w"> </span><span class="s2">&quot;yolo&quot;</span><span class="p">,</span><span class="w"> </span><span class="s2">&quot;ocr&quot;</span><span class="p">,</span><span class="w"> </span><span class="s2">&quot;face&quot;</span><span class="p">,</span><span class="w"> </span><span class="s2">&quot;pose&quot;</span><span class="p">,</span><span class="w"> </span><span class="s2">&quot;asrx&quot;</span><span class="p">,</span><span class="w"> </span><span class="s2">&quot;visual_chunk&quot;</span><span class="p">]}</span>
+</code></pre></div>
+
+<h3>⚡ Intermediate Check — Verify Job + Processor Results after Trigger</h3>
+<div class="codehilite"><pre><span></span><code><span class="nv">PG_BIN</span><span class="o">=</span><span class="s2">&quot;/Users/accusys/pgsql/18.3/bin&quot;</span>
+
+<span class="c1"># Check monitor_jobs table</span>
+<span class="s2">&quot;</span><span class="nv">$PG_BIN</span><span class="s2">/psql&quot;</span><span class="w"> </span>-U<span class="w"> </span>accusys<span class="w"> </span>-d<span class="w"> </span>momentry<span class="w"> </span>-x<span class="w"> </span>-c<span class="w"> </span><span class="s2">&quot;</span>
+<span class="s2">SELECT id, uuid, status, current_processor,</span>
+<span class="s2">       to_char(created_at, &#39;HH24:MI:SS&#39;) AS created</span>
+<span class="s2">FROM dev.monitor_jobs</span>
+<span class="s2">WHERE uuid = &#39;</span><span class="si">${</span><span class="nv">FILE_UUID</span><span class="si">}</span><span class="s2">&#39;</span>
+<span class="s2">ORDER BY id DESC</span>
+<span class="s2">LIMIT 1</span>
+<span class="s2">&quot;</span>
+
+<span class="c1"># Check processor_results table</span>
+<span class="s2">&quot;</span><span class="nv">$PG_BIN</span><span class="s2">/psql&quot;</span><span class="w"> </span>-U<span class="w"> </span>accusys<span class="w"> </span>-d<span class="w"> </span>momentry<span class="w"> </span>-c<span class="w"> </span><span class="s2">&quot;</span>
+<span class="s2">SELECT id, processor, status</span>
+<span class="s2">FROM dev.processor_results</span>
+<span class="s2">WHERE file_uuid = &#39;</span><span class="si">${</span><span class="nv">FILE_UUID</span><span class="si">}</span><span class="s2">&#39;</span>
+<span class="s2">ORDER BY id</span>
+<span class="s2">&quot;</span>
+</code></pre></div>
+
+<p>Output:</p>
+<div class="codehilite"><pre><span></span><code><span class="o">-</span><span class="p">[</span> <span class="kr">RECORD</span> <span class="mi">1</span> <span class="p">]</span><span class="o">------+-----------------------------</span>
+<span class="n">id</span>                 <span class="p">|</span> <span class="mi">161</span>
+<span class="n">uuid</span>               <span class="p">|</span> <span class="n">e1111111111111111111111111111111</span>
+<span class="n">status</span>             <span class="p">|</span> <span class="n">PENDING</span>
+<span class="n">current_processor</span>  <span class="p">|</span> <span class="p">(</span><span class="n">null</span><span class="p">)</span>
+<span class="n">created</span>            <span class="p">|</span> <span class="mi">19</span><span class="p">:</span><span class="mi">00</span><span class="p">:</span><span class="mi">30</span>
+
+ <span class="n">id</span> <span class="p">|</span> <span class="n">processor</span> <span class="p">|</span> <span class="n">status</span>
+<span class="o">----+-----------+---------</span>
+  <span class="mi">1</span> <span class="p">|</span> <span class="n">asr</span>       <span class="p">|</span> <span class="n">pending</span>
+  <span class="mi">2</span> <span class="p">|</span> <span class="n">cut</span>       <span class="p">|</span> <span class="n">pending</span>
+</code></pre></div>
+
+<p><strong>Checklist after trigger:</strong></p>
+<ul><li>[ ] <code>monitor_jobs.status = 'PENDING'</code> — job created, awaiting worker</li>
+<li>[ ] <code>processor_results</code> rows match requested processors (2 rows for <code>asr</code>, <code>cut</code>)</li>
+<li>[ ] Each <code>processor_results.status = 'pending'</code> — not yet executed</li></ul>
+<hr />
+<h2>6. Worker Execution</h2>
+<p>The worker polls for pending jobs and executes them one by one.</p>
+<div class="codehilite"><pre><span></span><code><span class="nv">DATABASE_SCHEMA</span><span class="o">=</span>dev<span class="w"> </span>cargo<span class="w"> </span>run<span class="w"> </span>--bin<span class="w"> </span>momentry_playground<span class="w"> </span>--<span class="w"> </span>worker<span class="w"> </span><span class="se">\</span>
+<span class="w">    </span>--max-concurrent<span class="w"> </span><span class="m">2</span><span class="w"> </span>--poll-interval<span class="w"> </span><span class="m">5</span>
+</code></pre></div>
+
+<p>Or run it in the background:</p>
+<div class="codehilite"><pre><span></span><code><span class="nv">DATABASE_SCHEMA</span><span class="o">=</span>dev<span class="w"> </span>nohup<span class="w"> </span>target/debug/momentry_playground<span class="w"> </span>worker<span class="w"> </span><span class="se">\</span>
+<span class="w">    </span>--max-concurrent<span class="w"> </span><span class="m">2</span><span class="w"> </span>--poll-interval<span class="w"> </span><span class="m">5</span><span class="w"> </span>&gt;<span class="w"> </span>/tmp/worker_demo.log<span class="w"> </span><span class="m">2</span>&gt;<span class="p">&amp;</span><span class="m">1</span><span class="w"> </span><span class="p">&amp;</span>
+</code></pre></div>
+
+<p><strong>Worker flow</strong>:</p>
+<div class="codehilite"><pre><span></span><code>Worker loop (every 5 seconds):
+  ├─ Poll: SELECT * FROM monitor_jobs WHERE status = &#39;PENDING&#39;
+  ├─ Set job status → RUNNING
+  ├─ For each pending processor:
+  │    ├─ SHA256 integrity check (verify_script_integrity)
+  │    │    └─ checksums.sha256 manifest lookup
+  │    ├─ Execute script via PythonExecutor
+  │    │    └─ Command: {MOMENTRY_PYTHON_PATH} scripts/&lt;processor&gt;.py &lt;args&gt;
+  │    ├─ Verify output (file exists, content valid)
+  │    └─ Update processor_result (completed/failed)
+  ├─ Check completion: all processors done?
+  ├─ Yes → Set job + video status → COMPLETED
+  └─ No → Wait for next poll cycle
+</code></pre></div>
+
+<p><strong>Worker log output</strong>:</p>
+<div class="codehilite"><pre><span></span><code><span class="o">[</span><span class="n">CHECKSUMS</span><span class="o">]</span><span class="w"> </span><span class="n">Loaded</span><span class="w"> </span><span class="mi">345</span><span class="w"> </span><span class="n">entries</span><span class="w"> </span><span class="k">from</span><span class="w"> </span><span class="n">checksums</span><span class="p">.</span><span class="n">sha256</span>
+<span class="o">[</span><span class="n">INTEGRITY</span><span class="o">]</span><span class="w"> </span><span class="n">asr_processor</span><span class="p">.</span><span class="n">py</span><span class="w"> </span><span class="nf">checksum</span><span class="w"> </span><span class="n">OK</span>
+<span class="o">[</span><span class="n">ASR</span><span class="o">]</span><span class="w"> </span><span class="n">Starting</span><span class="w"> </span><span class="n">asr_processor</span><span class="p">.</span><span class="n">py</span>
+<span class="o">[</span><span class="n">INTEGRITY</span><span class="o">]</span><span class="w"> </span><span class="n">cut_processor</span><span class="p">.</span><span class="n">py</span><span class="w"> </span><span class="nf">checksum</span><span class="w"> </span><span class="n">OK</span><span class="w">  </span>
+<span class="o">[</span><span class="n">CUT</span><span class="o">]</span><span class="w"> </span><span class="n">Starting</span><span class="w"> </span><span class="n">cut_processor</span><span class="p">.</span><span class="n">py</span>
+<span class="o">[</span><span class="n">ASR</span><span class="o">]</span><span class="w"> </span><span class="n">Completed</span><span class="w"> </span><span class="n">successfully</span>
+<span class="o">[</span><span class="n">CUT</span><span class="o">]</span><span class="w"> </span><span class="n">Completed</span><span class="w"> </span><span class="n">successfully</span>
+<span class="nl">check_and_complete_job</span><span class="p">:</span><span class="w"> </span><span class="n">results</span><span class="o">=</span><span class="mi">2</span><span class="o">/</span><span class="mi">2</span><span class="w"> </span><span class="err">→</span><span class="w"> </span><span class="n">Job</span><span class="w"> </span><span class="n">COMPLETED</span>
+</code></pre></div>
+
+<h3>⚡ Intermediate Check — Poll Progress During Worker Execution</h3>
+<p>While the worker is running, poll the progress endpoint to watch state transitions:</p>
+<div class="codehilite"><pre><span></span><code><span class="c1"># Poll every 5 seconds until completed</span>
+<span class="nv">FILE_UUID</span><span class="o">=</span><span class="s2">&quot;e1111111111111111111111111111111&quot;</span>
+<span class="k">for</span><span class="w"> </span>i<span class="w"> </span><span class="k">in</span><span class="w"> </span><span class="k">$(</span>seq<span class="w"> </span><span class="m">1</span><span class="w"> </span><span class="m">12</span><span class="k">)</span><span class="p">;</span><span class="w"> </span><span class="k">do</span>
+<span class="w">    </span>sleep<span class="w"> </span><span class="m">5</span>
+<span class="w">    </span><span class="nv">STATUS</span><span class="o">=</span><span class="k">$(</span>curl<span class="w"> </span>-sf<span class="w"> </span>-H<span class="w"> </span><span class="s2">&quot;X-API-Key: muser_68600856036340bcafc01930eb4bd839_1774418104_97221b69&quot;</span><span class="w"> </span><span class="se">\</span>
+<span class="w">        </span><span class="s2">&quot;http://m5api.momentry.ddns.net/api/v1/progress/</span><span class="si">${</span><span class="nv">FILE_UUID</span><span class="si">}</span><span class="s2">&quot;</span><span class="w"> </span><span class="se">\</span>
+<span class="w">        </span><span class="p">|</span><span class="w"> </span>python3<span class="w"> </span>-c<span class="w"> </span><span class="s2">&quot;import json,sys;d=json.load(sys.stdin);print(d.get(&#39;status&#39;,&#39;?&#39;))&quot;</span><span class="w"> </span><span class="m">2</span>&gt;/dev/null<span class="w"> </span><span class="o">||</span><span class="w"> </span><span class="nb">echo</span><span class="w"> </span><span class="s2">&quot;pending&quot;</span><span class="k">)</span>
+<span class="w">    </span><span class="nb">echo</span><span class="w"> </span><span class="s2">&quot;Poll </span><span class="nv">$i</span><span class="s2">: status=</span><span class="nv">$STATUS</span><span class="s2">&quot;</span>
+<span class="w">    </span><span class="o">[</span><span class="w"> </span><span class="s2">&quot;</span><span class="nv">$STATUS</span><span class="s2">&quot;</span><span class="w"> </span><span class="o">=</span><span class="w"> </span><span class="s2">&quot;completed&quot;</span><span class="w"> </span><span class="o">]</span><span class="w"> </span><span class="o">||</span><span class="w"> </span><span class="o">[</span><span class="w"> </span><span class="s2">&quot;</span><span class="nv">$STATUS</span><span class="s2">&quot;</span><span class="w"> </span><span class="o">=</span><span class="w"> </span><span class="s2">&quot;failed&quot;</span><span class="w"> </span><span class="o">]</span><span class="w"> </span><span class="o">&amp;&amp;</span><span class="w"> </span><span class="k">break</span>
+<span class="k">done</span>
+</code></pre></div>
+
+<p>Output (typical):</p>
+<div class="codehilite"><pre><span></span><code><span class="n">Poll</span><span class="w"> </span><span class="mh">1</span><span class="o">:</span><span class="w"> </span><span class="n">status</span><span class="o">=</span><span class="n">registered</span><span class="w">         </span><span class="err">←</span><span class="w"> </span><span class="n">worker</span><span class="w"> </span><span class="n">hasn</span><span class="p">&#39;</span><span class="n">t</span><span class="w"> </span><span class="n">picked</span><span class="w"> </span><span class="n">it</span><span class="w"> </span><span class="n">up</span><span class="w"> </span><span class="n">yet</span>
+<span class="n">Poll</span><span class="w"> </span><span class="mh">2</span><span class="o">:</span><span class="w"> </span><span class="n">status</span><span class="o">=</span><span class="n">pending</span><span class="w">            </span><span class="err">←</span><span class="w"> </span><span class="n">worker</span><span class="w"> </span><span class="n">picked</span><span class="w"> </span><span class="n">up</span><span class="p">,</span><span class="w"> </span><span class="n">job</span><span class="w"> </span><span class="n">status</span><span class="w"> </span><span class="n">changed</span>
+<span class="n">Poll</span><span class="w"> </span><span class="mh">3</span><span class="o">:</span><span class="w"> </span><span class="n">status</span><span class="o">=</span><span class="n">processing</span><span class="w">         </span><span class="err">←</span><span class="w"> </span><span class="n">worker</span><span class="w"> </span><span class="n">running</span><span class="w"> </span><span class="n">ASR</span>
+<span class="n">Poll</span><span class="w"> </span><span class="mh">4</span><span class="o">:</span><span class="w"> </span><span class="n">status</span><span class="o">=</span><span class="n">processing</span><span class="w">         </span><span class="err">←</span><span class="w"> </span><span class="n">worker</span><span class="w"> </span><span class="n">running</span><span class="w"> </span><span class="n">CUT</span>
+<span class="n">Poll</span><span class="w"> </span><span class="mh">5</span><span class="o">:</span><span class="w"> </span><span class="n">status</span><span class="o">=</span><span class="n">completed</span><span class="w">          </span><span class="err">←</span><span class="w"> </span><span class="n">all</span><span class="w"> </span><span class="n">done</span>
+</code></pre></div>
+
+<p>Check status transitions in DB:</p>
+<div class="codehilite"><pre><span></span><code><span class="s2">&quot;</span><span class="nv">$PG_BIN</span><span class="s2">/psql&quot;</span><span class="w"> </span>-U<span class="w"> </span>accusys<span class="w"> </span>-d<span class="w"> </span>momentry<span class="w"> </span>-c<span class="w"> </span><span class="s2">&quot;</span>
+<span class="s2">SELECT id, processor, status,</span>
+<span class="s2">       to_char(started_at, &#39;HH24:MI:SS&#39;) AS started,</span>
+<span class="s2">       to_char(completed_at, &#39;HH24:MI:SS&#39;) AS completed</span>
+<span class="s2">FROM dev.processor_results</span>
+<span class="s2">WHERE file_uuid = &#39;</span><span class="si">${</span><span class="nv">FILE_UUID</span><span class="si">}</span><span class="s2">&#39;</span>
+<span class="s2">ORDER BY id</span>
+<span class="s2">&quot;</span>
+</code></pre></div>
+
+<p>Output:</p>
+<div class="codehilite"><pre><span></span><code> id | processor |  status    | started   | completed
+----+-----------+------------+-----------+-----------
+  1 | asr       | completed  | 19:01:02  | 19:01:25
+  2 | cut       | completed  | 19:01:02  | 19:01:08
+</code></pre></div>
+
+<h3>⚡ Processing Checklist — Step-by-Step Verification</h3>
+<p>This checklist covers every stage of the pipeline processing flow:</p>
+<div class="codehilite"><pre><span></span><code><span class="c1"># ──────────────────────────────────────────────────────</span>
+<span class="c1"># Stage A: Before Worker Starts</span>
+<span class="c1"># ──────────────────────────────────────────────────────</span>
+<span class="nv">PG_BIN</span><span class="o">=</span><span class="s2">&quot;/Users/accusys/pgsql/18.3/bin&quot;</span>
+<span class="nv">FILE_UUID</span><span class="o">=</span><span class="s2">&quot;e1111111111111111111111111111111&quot;</span>
+<span class="nv">KEY</span><span class="o">=</span><span class="s2">&quot;muser_68600856036340bcafc01930eb4bd839_1774418104_97221b69&quot;</span>
+
+<span class="nb">echo</span><span class="w"> </span><span class="s2">&quot;=== A1. Job status = PENDING ===&quot;</span>
+<span class="s2">&quot;</span><span class="nv">$PG_BIN</span><span class="s2">/psql&quot;</span><span class="w"> </span>-U<span class="w"> </span>accusys<span class="w"> </span>-d<span class="w"> </span>momentry<span class="w"> </span>-c<span class="w"> </span><span class="s2">&quot;</span>
+<span class="s2">SELECT id, status, current_processor, created_at FROM dev.monitor_jobs WHERE uuid = &#39;</span><span class="si">${</span><span class="nv">FILE_UUID</span><span class="si">}</span><span class="s2">&#39;</span>
+<span class="s2">&quot;</span>
+
+<span class="nb">echo</span><span class="w"> </span><span class="s2">&quot;=== A2. Processor results = pending ===&quot;</span>
+<span class="s2">&quot;</span><span class="nv">$PG_BIN</span><span class="s2">/psql&quot;</span><span class="w"> </span>-U<span class="w"> </span>accusys<span class="w"> </span>-d<span class="w"> </span>momentry<span class="w"> </span>-c<span class="w"> </span><span class="s2">&quot;</span>
+<span class="s2">SELECT id, processor, status FROM dev.processor_results WHERE file_uuid = &#39;</span><span class="si">${</span><span class="nv">FILE_UUID</span><span class="si">}</span><span class="s2">&#39; ORDER BY id</span>
+<span class="s2">&quot;</span>
+
+<span class="c1"># ──────────────────────────────────────────────────────</span>
+<span class="c1"># Stage B: Worker Running</span>
+<span class="c1"># ──────────────────────────────────────────────────────</span>
+<span class="nb">echo</span><span class="w"> </span><span class="s2">&quot;=== Start worker ===&quot;</span>
+<span class="nv">DATABASE_SCHEMA</span><span class="o">=</span>dev<span class="w"> </span>nohup<span class="w"> </span>target/debug/momentry_playground<span class="w"> </span>worker<span class="w"> </span><span class="se">\</span>
+<span class="w">    </span>--max-concurrent<span class="w"> </span><span class="m">1</span><span class="w"> </span>--poll-interval<span class="w"> </span><span class="m">3</span><span class="w"> </span>&gt;<span class="w"> </span>/tmp/worker_check.log<span class="w"> </span><span class="m">2</span>&gt;<span class="p">&amp;</span><span class="m">1</span><span class="w"> </span><span class="p">&amp;</span>
+<span class="nv">WPID</span><span class="o">=</span><span class="nv">$!</span>
+
+<span class="nb">echo</span><span class="w"> </span><span class="s2">&quot;=== B1. Worker picks up job (within 3-10s) ===&quot;</span>
+<span class="k">for</span><span class="w"> </span>i<span class="w"> </span><span class="k">in</span><span class="w"> </span><span class="k">$(</span>seq<span class="w"> </span><span class="m">1</span><span class="w"> </span><span class="m">10</span><span class="k">)</span><span class="p">;</span><span class="w"> </span><span class="k">do</span>
+<span class="w">    </span>sleep<span class="w"> </span><span class="m">3</span>
+<span class="w">    </span><span class="nv">JOB_STATUS</span><span class="o">=</span><span class="k">$(</span><span class="s2">&quot;</span><span class="nv">$PG_BIN</span><span class="s2">/psql&quot;</span><span class="w"> </span>-U<span class="w"> </span>accusys<span class="w"> </span>-d<span class="w"> </span>momentry<span class="w"> </span>-t<span class="w"> </span>-A<span class="w"> </span>-c<span class="w"> </span><span class="se">\</span>
+<span class="w">        </span><span class="s2">&quot;SELECT status FROM dev.monitor_jobs WHERE uuid = &#39;</span><span class="si">${</span><span class="nv">FILE_UUID</span><span class="si">}</span><span class="s2">&#39;&quot;</span><span class="w"> </span><span class="m">2</span>&gt;/dev/null<span class="k">)</span>
+<span class="w">    </span><span class="nv">VIDEO_STATUS</span><span class="o">=</span><span class="k">$(</span><span class="s2">&quot;</span><span class="nv">$PG_BIN</span><span class="s2">/psql&quot;</span><span class="w"> </span>-U<span class="w"> </span>accusys<span class="w"> </span>-d<span class="w"> </span>momentry<span class="w"> </span>-t<span class="w"> </span>-A<span class="w"> </span>-c<span class="w"> </span><span class="se">\</span>
+<span class="w">        </span><span class="s2">&quot;SELECT status FROM dev.videos WHERE file_uuid = &#39;</span><span class="si">${</span><span class="nv">FILE_UUID</span><span class="si">}</span><span class="s2">&#39;&quot;</span><span class="w"> </span><span class="m">2</span>&gt;/dev/null<span class="k">)</span>
+<span class="w">    </span><span class="nb">echo</span><span class="w"> </span><span class="s2">&quot;  Poll </span><span class="nv">$i</span><span class="s2">: job=</span><span class="nv">$JOB_STATUS</span><span class="s2"> video=</span><span class="nv">$VIDEO_STATUS</span><span class="s2">&quot;</span>
+<span class="w">    </span><span class="nb">echo</span><span class="w"> </span><span class="s2">&quot;  </span><span class="k">$(</span>grep<span class="w"> </span><span class="s1">&#39;\[INTEGRITY\]\|\[SCHEMA\]\|Starting:\|Completed\|failed\|Job &#39;</span><span class="w"> </span>/tmp/worker_check.log<span class="w"> </span><span class="m">2</span>&gt;/dev/null<span class="w"> </span><span class="p">|</span><span class="w"> </span>tail<span class="w"> </span>-3<span class="k">)</span><span class="s2">&quot;</span>
+
+<span class="w">    </span><span class="c1"># Check alive</span>
+<span class="w">    </span><span class="nb">kill</span><span class="w"> </span>-0<span class="w"> </span><span class="nv">$WPID</span><span class="w"> </span><span class="m">2</span>&gt;/dev/null<span class="w"> </span><span class="o">||</span><span class="w"> </span><span class="o">{</span><span class="w"> </span><span class="nb">echo</span><span class="w"> </span><span class="s2">&quot;  Worker died unexpectedly&quot;</span><span class="p">;</span><span class="w"> </span><span class="k">break</span><span class="p">;</span><span class="w"> </span><span class="o">}</span>
+
+<span class="w">    </span><span class="k">if</span><span class="w"> </span><span class="o">[</span><span class="w"> </span><span class="s2">&quot;</span><span class="nv">$VIDEO_STATUS</span><span class="s2">&quot;</span><span class="w"> </span><span class="o">=</span><span class="w"> </span><span class="s2">&quot;completed&quot;</span><span class="w"> </span><span class="o">]</span><span class="w"> </span><span class="o">||</span><span class="w"> </span><span class="o">[</span><span class="w"> </span><span class="s2">&quot;</span><span class="nv">$VIDEO_STATUS</span><span class="s2">&quot;</span><span class="w"> </span><span class="o">=</span><span class="w"> </span><span class="s2">&quot;failed&quot;</span><span class="w"> </span><span class="o">]</span><span class="p">;</span><span class="w"> </span><span class="k">then</span><span class="w"> </span><span class="k">break</span><span class="p">;</span><span class="w"> </span><span class="k">fi</span>
+<span class="k">done</span>
+
+<span class="nb">echo</span><span class="w"> </span><span class="s2">&quot;=== B2. Each processor status ===&quot;</span>
+<span class="s2">&quot;</span><span class="nv">$PG_BIN</span><span class="s2">/psql&quot;</span><span class="w"> </span>-U<span class="w"> </span>accusys<span class="w"> </span>-d<span class="w"> </span>momentry<span class="w"> </span>-c<span class="w"> </span><span class="s2">&quot;</span>
+<span class="s2">SELECT id, processor, status,</span>
+<span class="s2">       to_char(started_at, &#39;HH24:MI:SS&#39;) AS started,</span>
+<span class="s2">       to_char(completed_at, &#39;HH24:MI:SS&#39;) AS completed,</span>
+<span class="s2">       COALESCE(chunks_produced, 0) AS chunks,</span>
+<span class="s2">       COALESCE(frames_processed, 0) AS frames,</span>
+<span class="s2">       COALESCE(error_message, &#39;&#39;) AS error</span>
+<span class="s2">FROM dev.processor_results</span>
+<span class="s2">WHERE file_uuid = &#39;</span><span class="si">${</span><span class="nv">FILE_UUID</span><span class="si">}</span><span class="s2">&#39;</span>
+<span class="s2">ORDER BY id</span>
+<span class="s2">&quot;</span>
+
+<span class="nb">kill</span><span class="w"> </span><span class="nv">$WPID</span><span class="w"> </span><span class="m">2</span>&gt;/dev/null<span class="w"> </span><span class="o">||</span><span class="w"> </span><span class="nb">true</span>
+
+<span class="c1"># ──────────────────────────────────────────────────────</span>
+<span class="c1"># Stage C: After Completion</span>
+<span class="c1"># ──────────────────────────────────────────────────────</span>
+<span class="nb">echo</span><span class="w"> </span><span class="s2">&quot;=== C1. Video final status ===&quot;</span>
+<span class="s2">&quot;</span><span class="nv">$PG_BIN</span><span class="s2">/psql&quot;</span><span class="w"> </span>-U<span class="w"> </span>accusys<span class="w"> </span>-d<span class="w"> </span>momentry<span class="w"> </span>-c<span class="w"> </span><span class="s2">&quot;</span>
+<span class="s2">SELECT file_uuid, file_name, status, duration, fps, total_frames FROM dev.videos WHERE file_uuid = &#39;</span><span class="si">${</span><span class="nv">FILE_UUID</span><span class="si">}</span><span class="s2">&#39;</span>
+<span class="s2">&quot;</span>
+
+<span class="nb">echo</span><span class="w"> </span><span class="s2">&quot;=== C2. Chunks produced ===&quot;</span>
+<span class="s2">&quot;</span><span class="nv">$PG_BIN</span><span class="s2">/psql&quot;</span><span class="w"> </span>-U<span class="w"> </span>accusys<span class="w"> </span>-d<span class="w"> </span>momentry<span class="w"> </span>-c<span class="w"> </span><span class="s2">&quot;</span>
+<span class="s2">SELECT chunk_type, count(*) FROM dev.chunk WHERE file_uuid = &#39;</span><span class="si">${</span><span class="nv">FILE_UUID</span><span class="si">}</span><span class="s2">&#39; GROUP BY chunk_type ORDER BY chunk_type</span>
+<span class="s2">&quot;</span>
+
+<span class="nb">echo</span><span class="w"> </span><span class="s2">&quot;=== C3. Job final status ===&quot;</span>
+<span class="s2">&quot;</span><span class="nv">$PG_BIN</span><span class="s2">/psql&quot;</span><span class="w"> </span>-U<span class="w"> </span>accusys<span class="w"> </span>-d<span class="w"> </span>momentry<span class="w"> </span>-c<span class="w"> </span><span class="s2">&quot;</span>
+<span class="s2">SELECT id, status, current_processor FROM dev.monitor_jobs WHERE uuid = &#39;</span><span class="si">${</span><span class="nv">FILE_UUID</span><span class="si">}</span><span class="s2">&#39;</span>
+<span class="s2">&quot;</span>
+</code></pre></div>
+
+<p>Expected output (all green):</p>
+<div class="codehilite"><pre><span></span><code><span class="o">===</span><span class="w"> </span><span class="n">A1</span><span class="p">.</span><span class="w"> </span><span class="n">Job</span><span class="w"> </span><span class="n">status</span><span class="w"> </span><span class="o">=</span><span class="w"> </span><span class="n">PENDING</span><span class="w"> </span><span class="o">===</span>
+<span class="w"> </span><span class="n">id</span><span class="w"> </span><span class="o">|</span><span class="w"> </span><span class="n">status</span><span class="w">  </span><span class="o">|</span><span class="w"> </span><span class="n">current_processor</span><span class="w"> </span><span class="o">|</span><span class="w"> </span><span class="n">created_at</span>
+<span class="c1">----+---------+-------------------+-------------------</span>
+<span class="w"> </span><span class="mi">161</span><span class="o">|</span><span class="w"> </span><span class="n">PENDING</span><span class="w"> </span><span class="o">|</span><span class="w">                   </span><span class="o">|</span><span class="w"> </span><span class="mi">2026</span><span class="o">-</span><span class="mi">05</span><span class="o">-</span><span class="mi">15</span><span class="w"> </span><span class="mi">19</span><span class="err">:</span><span class="mi">00</span><span class="err">:</span><span class="mi">30</span>
+
+<span class="o">===</span><span class="w"> </span><span class="n">A2</span><span class="p">.</span><span class="w"> </span><span class="n">Processor</span><span class="w"> </span><span class="n">results</span><span class="w"> </span><span class="o">=</span><span class="w"> </span><span class="n">pending</span><span class="w"> </span><span class="o">===</span>
+<span class="w"> </span><span class="n">id</span><span class="w"> </span><span class="o">|</span><span class="w"> </span><span class="n">processor</span><span class="w"> </span><span class="o">|</span><span class="w"> </span><span class="n">status</span>
+<span class="c1">----+-----------+---------</span>
+<span class="w">  </span><span class="mi">1</span><span class="w"> </span><span class="o">|</span><span class="w"> </span><span class="n">asr</span><span class="w">       </span><span class="o">|</span><span class="w"> </span><span class="n">pending</span>
+<span class="w">  </span><span class="mi">2</span><span class="w"> </span><span class="o">|</span><span class="w"> </span><span class="n">cut</span><span class="w">       </span><span class="o">|</span><span class="w"> </span><span class="n">pending</span>
+
+<span class="o">===</span><span class="w"> </span><span class="k">Start</span><span class="w"> </span><span class="n">worker</span><span class="w"> </span><span class="o">===</span>
+<span class="o">===</span><span class="w"> </span><span class="n">B1</span><span class="p">.</span><span class="w"> </span><span class="n">Worker</span><span class="w"> </span><span class="n">picks</span><span class="w"> </span><span class="n">up</span><span class="w"> </span><span class="n">job</span><span class="w"> </span><span class="p">(</span><span class="k">within</span><span class="w"> </span><span class="mi">3</span><span class="o">-</span><span class="mi">10</span><span class="n">s</span><span class="p">)</span><span class="w"> </span><span class="o">===</span>
+<span class="w">  </span><span class="n">Poll</span><span class="w"> </span><span class="mi">1</span><span class="err">:</span><span class="w"> </span><span class="n">job</span><span class="o">=</span><span class="n">PENDING</span><span class="w"> </span><span class="n">video</span><span class="o">=</span><span class="n">registered</span>
+<span class="w">  </span><span class="n">Poll</span><span class="w"> </span><span class="mi">2</span><span class="err">:</span><span class="w"> </span><span class="n">job</span><span class="o">=</span><span class="n">RUNNING</span><span class="w"> </span><span class="n">video</span><span class="o">=</span><span class="n">processing</span>
+<span class="w">  </span><span class="o">[</span><span class="n">INTEGRITY</span><span class="o">]</span><span class="w"> </span><span class="n">asr_processor</span><span class="p">.</span><span class="n">py</span><span class="w"> </span><span class="nf">checksum</span><span class="w"> </span><span class="n">OK</span>
+<span class="w">  </span><span class="n">Poll</span><span class="w"> </span><span class="mi">3</span><span class="err">:</span><span class="w"> </span><span class="n">job</span><span class="o">=</span><span class="n">RUNNING</span><span class="w"> </span><span class="n">video</span><span class="o">=</span><span class="n">processing</span>
+<span class="w">  </span><span class="o">[</span><span class="n">ASR</span><span class="o">]</span><span class="w"> </span><span class="nl">Starting</span><span class="p">:</span><span class="w"> </span><span class="n">asr_processor</span><span class="p">.</span><span class="n">py</span>
+<span class="w">  </span><span class="n">Poll</span><span class="w"> </span><span class="mi">4</span><span class="err">:</span><span class="w"> </span><span class="n">job</span><span class="o">=</span><span class="n">RUNNING</span><span class="w"> </span><span class="n">video</span><span class="o">=</span><span class="n">processing</span>
+<span class="w">  </span><span class="o">[</span><span class="n">ASR</span><span class="o">]</span><span class="w"> </span><span class="n">Completed</span><span class="w"> </span><span class="n">successfully</span>
+<span class="w">  </span><span class="n">Poll</span><span class="w"> </span><span class="mi">5</span><span class="err">:</span><span class="w"> </span><span class="n">job</span><span class="o">=</span><span class="n">RUNNING</span><span class="w"> </span><span class="n">video</span><span class="o">=</span><span class="n">processing</span>
+<span class="w">  </span><span class="o">[</span><span class="n">CUT</span><span class="o">]</span><span class="w"> </span><span class="n">Completed</span><span class="w"> </span><span class="n">successfully</span>
+<span class="w">  </span><span class="n">Poll</span><span class="w"> </span><span class="mi">6</span><span class="err">:</span><span class="w"> </span><span class="n">job</span><span class="o">=</span><span class="n">COMPLETED</span><span class="w"> </span><span class="n">video</span><span class="o">=</span><span class="n">completed</span>
+
+<span class="o">===</span><span class="w"> </span><span class="n">B2</span><span class="p">.</span><span class="w"> </span><span class="k">Each</span><span class="w"> </span><span class="n">processor</span><span class="w"> </span><span class="n">status</span><span class="w"> </span><span class="o">===</span>
+<span class="w"> </span><span class="n">id</span><span class="w"> </span><span class="o">|</span><span class="w"> </span><span class="n">processor</span><span class="w"> </span><span class="o">|</span><span class="w">  </span><span class="n">status</span><span class="w">   </span><span class="o">|</span><span class="w"> </span><span class="n">started</span><span class="w">   </span><span class="o">|</span><span class="w"> </span><span class="n">completed</span><span class="w"> </span><span class="o">|</span><span class="w"> </span><span class="n">chunks</span><span class="w"> </span><span class="o">|</span><span class="w"> </span><span class="n">frames</span><span class="w"> </span><span class="o">|</span><span class="w"> </span><span class="n">error</span>
+<span class="c1">----+-----------+-----------+-----------+-----------+--------+--------+-------</span>
+<span class="w">  </span><span class="mi">1</span><span class="w"> </span><span class="o">|</span><span class="w"> </span><span class="n">asr</span><span class="w">       </span><span class="o">|</span><span class="w"> </span><span class="n">completed</span><span class="w"> </span><span class="o">|</span><span class="w"> </span><span class="mi">19</span><span class="err">:</span><span class="mi">01</span><span class="err">:</span><span class="mi">02</span><span class="w">  </span><span class="o">|</span><span class="w"> </span><span class="mi">19</span><span class="err">:</span><span class="mi">01</span><span class="err">:</span><span class="mi">25</span><span class="w"> </span><span class="o">|</span><span class="w">      </span><span class="mi">3</span><span class="w"> </span><span class="o">|</span><span class="w">    </span><span class="mi">120</span><span class="w"> </span><span class="o">|</span>
+<span class="w">  </span><span class="mi">2</span><span class="w"> </span><span class="o">|</span><span class="w"> </span><span class="n">cut</span><span class="w">       </span><span class="o">|</span><span class="w"> </span><span class="n">completed</span><span class="w"> </span><span class="o">|</span><span class="w"> </span><span class="mi">19</span><span class="err">:</span><span class="mi">01</span><span class="err">:</span><span class="mi">02</span><span class="w">  </span><span class="o">|</span><span class="w"> </span><span class="mi">19</span><span class="err">:</span><span class="mi">01</span><span class="err">:</span><span class="mi">08</span><span class="w"> </span><span class="o">|</span><span class="w">      </span><span class="mi">1</span><span class="w"> </span><span class="o">|</span><span class="w">    </span><span class="mi">120</span><span class="w"> </span><span class="o">|</span>
+
+<span class="o">===</span><span class="w"> </span><span class="n">C1</span><span class="p">.</span><span class="w"> </span><span class="n">Video</span><span class="w"> </span><span class="n">final</span><span class="w"> </span><span class="n">status</span><span class="w"> </span><span class="o">===</span>
+<span class="w">  </span><span class="n">file_uuid</span><span class="w">   </span><span class="o">|</span><span class="w">      </span><span class="nf">file_name</span><span class="w">      </span><span class="o">|</span><span class="w">  </span><span class="n">status</span><span class="w">   </span><span class="o">|</span><span class="w"> </span><span class="n">duration</span><span class="w"> </span><span class="o">|</span><span class="w"> </span><span class="n">fps</span><span class="w"> </span><span class="o">|</span><span class="w"> </span><span class="n">total_frames</span>
+<span class="c1">--------------+---------------------+-----------+----------+-----+--------------</span>
+<span class="w"> </span><span class="n">e11111111</span><span class="p">...</span><span class="w"> </span><span class="o">|</span><span class="w"> </span><span class="n">demo_test_video</span><span class="p">.</span><span class="n">mp4</span><span class="w"> </span><span class="o">|</span><span class="w"> </span><span class="n">completed</span><span class="w"> </span><span class="o">|</span><span class="w">    </span><span class="mf">5.005</span><span class="w"> </span><span class="o">|</span><span class="w">  </span><span class="mi">24</span><span class="w"> </span><span class="o">|</span><span class="w">          </span><span class="mi">120</span>
+
+<span class="o">===</span><span class="w"> </span><span class="n">C2</span><span class="p">.</span><span class="w"> </span><span class="n">Chunks</span><span class="w"> </span><span class="n">produced</span><span class="w"> </span><span class="o">===</span>
+<span class="w"> </span><span class="n">chunk_type</span><span class="w"> </span><span class="o">|</span><span class="w"> </span><span class="nf">count</span>
+<span class="c1">------------+-------</span>
+<span class="w"> </span><span class="n">cut</span><span class="w">        </span><span class="o">|</span><span class="w">     </span><span class="mi">1</span>
+<span class="w"> </span><span class="n">sentence</span><span class="w">   </span><span class="o">|</span><span class="w">     </span><span class="mi">3</span>
+
+<span class="o">===</span><span class="w"> </span><span class="n">C3</span><span class="p">.</span><span class="w"> </span><span class="n">Job</span><span class="w"> </span><span class="n">final</span><span class="w"> </span><span class="n">status</span><span class="w"> </span><span class="o">===</span>
+<span class="w"> </span><span class="n">id</span><span class="w"> </span><span class="o">|</span><span class="w">  </span><span class="n">status</span><span class="w">   </span><span class="o">|</span><span class="w"> </span><span class="n">current_processor</span>
+<span class="c1">----+-----------+-------------------</span>
+<span class="w"> </span><span class="mi">161</span><span class="o">|</span><span class="w"> </span><span class="n">COMPLETED</span><span class="w"> </span><span class="o">|</span><span class="w"> </span><span class="p">(</span><span class="k">null</span><span class="p">)</span>
+</code></pre></div>
+
+<p><strong>Checklist during execution:</strong></p>
+<table class="table">
+<thead>
+<tr>
+<th>Stage</th>
+<th>#</th>
+<th>Check</th>
+<th>Expected</th>
+<th style="text-align: center;">Pass</th>
+</tr>
+</thead>
+<tbody>
+<tr>
+<td><strong>A. Pre-worker</strong></td>
+<td>A1</td>
+<td><code>monitor_jobs.status</code></td>
+<td><code>PENDING</code></td>
+<td style="text-align: center;">☐</td>
+</tr>
+<tr>
+<td></td>
+<td>A2</td>
+<td><code>processor_results</code> rows</td>
+<td>= requested processor count</td>
+<td style="text-align: center;">☐</td>
+</tr>
+<tr>
+<td></td>
+<td>A3</td>
+<td>Each <code>processor_results.status</code></td>
+<td><code>pending</code></td>
+<td style="text-align: center;">☐</td>
+</tr>
+<tr>
+<td><strong>B. Running</strong></td>
+<td>B1</td>
+<td>Job picked up (within poll interval)</td>
+<td>status → <code>RUNNING</code></td>
+<td style="text-align: center;">☐</td>
+</tr>
+<tr>
+<td></td>
+<td>B2</td>
+<td>SHA256 integrity check in logs</td>
+<td><code>[INTEGRITY] *.py checksum OK</code></td>
+<td style="text-align: center;">☐</td>
+</tr>
+<tr>
+<td></td>
+<td>B3</td>
+<td>Each processor transitions</td>
+<td><code>pending → running → completed</code></td>
+<td style="text-align: center;">☐</td>
+</tr>
+<tr>
+<td></td>
+<td>B4</td>
+<td><code>started_at</code> populated</td>
+<td>NOT NULL per processor</td>
+<td style="text-align: center;">☐</td>
+</tr>
+<tr>
+<td></td>
+<td>B5</td>
+<td>Processors complete without error</td>
+<td><code>error_message</code> is NULL</td>
+<td style="text-align: center;">☐</td>
+</tr>
+<tr>
+<td></td>
+<td>B6</td>
+<td>Max concurrent respected</td>
+<td>≤ <code>--max-concurrent</code> running at once</td>
+<td style="text-align: center;">☐</td>
+</tr>
+<tr>
+<td><strong>C. Post-completion</strong></td>
+<td>C1</td>
+<td><code>videos.status</code></td>
+<td><code>completed</code> (not <code>failed</code>)</td>
+<td style="text-align: center;">☐</td>
+</tr>
+<tr>
+<td></td>
+<td>C2</td>
+<td><code>chunks_produced</code> &gt; 0</td>
+<td>ASR has sentence chunks</td>
+<td style="text-align: center;">☐</td>
+</tr>
+<tr>
+<td></td>
+<td>C3</td>
+<td><code>monitor_jobs.status</code></td>
+<td><code>COMPLETED</code></td>
+<td style="text-align: center;">☐</td>
+</tr>
+<tr>
+<td></td>
+<td>C4</td>
+<td><code>chunk</code> table has data</td>
+<td>rows with this <code>file_uuid</code></td>
+<td style="text-align: center;">☐</td>
+</tr>
+<tr>
+<td></td>
+<td>C5</td>
+<td>Chunk IDs formatted correctly</td>
+<td><code>{file_uuid}_{start}_{end}</code></td>
+<td style="text-align: center;">☐</td>
+</tr>
+</tbody>
+</table>
+<hr />
+<h2>7. Check Results</h2>
+<p>Monitor job progress:</p>
+<div class="codehilite"><pre><span></span><code><span class="c1"># Check job status</span>
+curl<span class="w"> </span>-s<span class="w"> </span>-H<span class="w"> </span><span class="s2">&quot;X-API-Key: muser_68600856036340bcafc01930eb4bd839_1774418104_97221b69&quot;</span><span class="w"> </span><span class="se">\</span>
+<span class="w">    </span><span class="s2">&quot;http://m5api.momentry.ddns.net/api/v1/jobs?page=1&amp;page_size=5&amp;status=pending,running,completed,failed&quot;</span><span class="w"> </span><span class="se">\</span>
+<span class="w">    </span><span class="p">|</span><span class="w"> </span>python3<span class="w"> </span>-c<span class="w"> </span><span class="s2">&quot;import json,sys;d=json.load(sys.stdin);[print(f&#39;{j[\&quot;uuid\&quot;]}: {j[\&quot;status\&quot;]}&#39;) for j in d.get(&#39;jobs&#39;,[])]&quot;</span>
+</code></pre></div>
+
+<p>Output:</p>
+<div class="codehilite"><pre><span></span><code><span class="mf">9</span><span class="n">eca53f422f668dd59a9995d29dc9388</span><span class="p">:</span><span class="w"> </span><span class="n">completed</span>
+<span class="n">e1111111111111111111111111111111</span><span class="p">:</span><span class="w"> </span><span class="n">completed</span>
+</code></pre></div>
+
+<h3>⚡ Intermediate Check — Bug #2: Chunk Fallback Verification</h3>
+<p>Verify that both new and old chunk_id formats resolve correctly:</p>
+<div class="codehilite"><pre><span></span><code><span class="c1"># Pick a chunk_id from the DB</span>
+<span class="nv">CHUNK_INFO</span><span class="o">=</span><span class="k">$(</span><span class="s2">&quot;</span><span class="nv">$PG_BIN</span><span class="s2">/psql&quot;</span><span class="w"> </span>-U<span class="w"> </span>accusys<span class="w"> </span>-d<span class="w"> </span>momentry<span class="w"> </span>-t<span class="w"> </span>-A<span class="w"> </span>-c<span class="w"> </span><span class="s2">&quot;</span>
+<span class="s2">SELECT chunk_id, id FROM dev.chunk WHERE file_uuid = &#39;</span><span class="si">${</span><span class="nv">FILE_UUID</span><span class="si">}</span><span class="s2">&#39; LIMIT 1</span>
+<span class="s2">&quot;</span><span class="k">)</span>
+<span class="nv">NEW_ID</span><span class="o">=</span><span class="k">$(</span><span class="nb">echo</span><span class="w"> </span><span class="s2">&quot;</span><span class="nv">$CHUNK_INFO</span><span class="s2">&quot;</span><span class="w"> </span><span class="p">|</span><span class="w"> </span>cut<span class="w"> </span>-d<span class="s1">&#39;|&#39;</span><span class="w"> </span>-f1<span class="k">)</span>
+<span class="nv">DB_ID</span><span class="o">=</span><span class="k">$(</span><span class="nb">echo</span><span class="w"> </span><span class="s2">&quot;</span><span class="nv">$CHUNK_INFO</span><span class="s2">&quot;</span><span class="w"> </span><span class="p">|</span><span class="w"> </span>cut<span class="w"> </span>-d<span class="s1">&#39;|&#39;</span><span class="w"> </span>-f2<span class="k">)</span>
+
+<span class="nb">echo</span><span class="w"> </span><span class="s2">&quot;=== New format: </span><span class="nv">$NEW_ID</span><span class="s2"> ===&quot;</span>
+curl<span class="w"> </span>-s<span class="w"> </span>-w<span class="w"> </span><span class="s2">&quot; HTTP %{http_code}&quot;</span><span class="w"> </span>-H<span class="w"> </span><span class="s2">&quot;X-API-Key: muser_68600856036340bcafc01930eb4bd839_1774418104_97221b69&quot;</span><span class="w"> </span><span class="se">\</span>
+<span class="w">    </span><span class="s2">&quot;http://m5api.momentry.ddns.net/api/v1/file/</span><span class="si">${</span><span class="nv">FILE_UUID</span><span class="si">}</span><span class="s2">/chunk/</span><span class="si">${</span><span class="nv">NEW_ID</span><span class="si">}</span><span class="s2">&quot;</span><span class="w"> </span><span class="se">\</span>
+<span class="w">    </span><span class="p">|</span><span class="w"> </span>python3<span class="w"> </span>-c<span class="w"> </span><span class="s2">&quot;import json,sys;d=json.load(sys.stdin);print(f&#39;chunk_id={d.get(\&quot;chunk_id\&quot;)}&#39;)&quot;</span><span class="w"> </span><span class="m">2</span>&gt;/dev/null
+
+<span class="nb">echo</span><span class="w"> </span><span class="s2">&quot;&quot;</span>
+<span class="nb">echo</span><span class="w"> </span><span class="s2">&quot;=== Old integer fallback (id=</span><span class="nv">$DB_ID</span><span class="s2">) ===&quot;</span>
+curl<span class="w"> </span>-s<span class="w"> </span>-w<span class="w"> </span><span class="s2">&quot; HTTP %{http_code}&quot;</span><span class="w"> </span>-H<span class="w"> </span><span class="s2">&quot;X-API-Key: muser_68600856036340bcafc01930eb4bd839_1774418104_97221b69&quot;</span><span class="w"> </span><span class="se">\</span>
+<span class="w">    </span><span class="s2">&quot;http://m5api.momentry.ddns.net/api/v1/file/</span><span class="si">${</span><span class="nv">FILE_UUID</span><span class="si">}</span><span class="s2">/chunk/</span><span class="si">${</span><span class="nv">DB_ID</span><span class="si">}</span><span class="s2">&quot;</span><span class="w"> </span><span class="se">\</span>
+<span class="w">    </span><span class="p">|</span><span class="w"> </span>python3<span class="w"> </span>-c<span class="w"> </span><span class="s2">&quot;import json,sys;d=json.load(sys.stdin);print(f&#39;chunk_id={d.get(\&quot;chunk_id\&quot;)}&#39;)&quot;</span><span class="w"> </span><span class="m">2</span>&gt;/dev/null
+</code></pre></div>
+
+<p>Output:</p>
+<div class="codehilite"><pre><span></span><code>=== New format: e1111111111111111111111111111111_0_5 ===
+chunk_id=e1111111111111111111111111111111_0_5 HTTP 200
+
+=== Old integer fallback (id=1075655) ===
+chunk_id=e1111111111111111111111111111111_0_5 HTTP 200
+</code></pre></div>
+
+<p>Both return <code>chunk_id=e1111111111111111111111111111111_0_5</code> — the fallback correctly resolves <code>id=1075655</code> to the same chunk.</p>
+<h3>⚡ Intermediate Check — Verify Chunks after Processing</h3>
+<div class="codehilite"><pre><span></span><code><span class="nv">PG_BIN</span><span class="o">=</span><span class="s2">&quot;/Users/accusys/pgsql/18.3/bin&quot;</span>
+
+<span class="c1"># Count chunks produced</span>
+<span class="s2">&quot;</span><span class="nv">$PG_BIN</span><span class="s2">/psql&quot;</span><span class="w"> </span>-U<span class="w"> </span>accusys<span class="w"> </span>-d<span class="w"> </span>momentry<span class="w"> </span>-c<span class="w"> </span><span class="s2">&quot;</span>
+<span class="s2">SELECT chunk_type, count(*) AS count</span>
+<span class="s2">FROM dev.chunk</span>
+<span class="s2">WHERE file_uuid = &#39;</span><span class="si">${</span><span class="nv">FILE_UUID</span><span class="si">}</span><span class="s2">&#39;</span>
+<span class="s2">GROUP BY chunk_type</span>
+<span class="s2">ORDER BY chunk_type</span>
+<span class="s2">&quot;</span>
+
+<span class="c1"># Sample chunk content</span>
+<span class="s2">&quot;</span><span class="nv">$PG_BIN</span><span class="s2">/psql&quot;</span><span class="w"> </span>-U<span class="w"> </span>accusys<span class="w"> </span>-d<span class="w"> </span>momentry<span class="w"> </span>-c<span class="w"> </span><span class="s2">&quot;</span>
+<span class="s2">SELECT chunk_id, chunk_type, start_frame, end_frame,</span>
+<span class="s2">       substring(text_content, 1, 60) AS text_preview</span>
+<span class="s2">FROM dev.chunk</span>
+<span class="s2">WHERE file_uuid = &#39;</span><span class="si">${</span><span class="nv">FILE_UUID</span><span class="si">}</span><span class="s2">&#39;</span>
+<span class="s2">ORDER BY start_frame</span>
+<span class="s2">LIMIT 5</span>
+<span class="s2">&quot;</span>
+</code></pre></div>
+
+<p>Output:</p>
+<div class="codehilite"><pre><span></span><code><span class="c"> chunk_type | count</span>
+<span class="nb">------------+-------</span>
+<span class="c"> cut        |     1</span>
+<span class="c"> sentence   |     3</span>
+
+<span class="c">                     chunk_id                     | chunk_type | start_frame | end_frame |                    text_preview</span>
+<span class="nb">--------------------------------------------------+------------+-------------+-----------+-----------------------------------------------------</span>
+<span class="c"> e1111111111111111111111111111111_0_5              | cut        |           0 |       120 | demo_test_video_auto_demo</span><span class="nt">.</span><span class="c">mp4</span>
+<span class="c"> e1111111111111111111111111111111_0_0              | sentence   |           0 |       120 | test pattern test pattern color bars test pattern </span><span class="nt">...</span>
+</code></pre></div>
+
+<p>Check per-processor results in DB:</p>
+<div class="codehilite"><pre><span></span><code><span class="s2">&quot;</span><span class="nv">$PG_BIN</span><span class="s2">/psql&quot;</span><span class="w"> </span>-U<span class="w"> </span>accusys<span class="w"> </span>-d<span class="w"> </span>momentry<span class="w"> </span>-c<span class="w"> </span><span class="s2">&quot;</span>
+<span class="s2">SELECT processor, status, error_message,</span>
+<span class="s2">       to_char(started_at, &#39;HH24:MI:SS&#39;) AS started,</span>
+<span class="s2">       to_char(completed_at, &#39;HH24:MI:SS&#39;) AS completed,</span>
+<span class="s2">       COALESCE(chunks_produced, 0) AS chunks</span>
+<span class="s2">FROM dev.processor_results</span>
+<span class="s2">WHERE file_uuid=&#39;</span><span class="si">${</span><span class="nv">FILE_UUID</span><span class="si">}</span><span class="s2">&#39;</span>
+<span class="s2">ORDER BY id;</span>
+<span class="s2">&quot;</span>
+</code></pre></div>
+
+<p>Output:</p>
+<div class="codehilite"><pre><span></span><code><span class="c"> processor |  status   | error_message | started   | completed | chunks</span>
+<span class="nb">-----------+-----------+---------------+-----------+-----------+--------</span>
+<span class="c"> asr       | completed |               | 19:01:02  | 19:01:25 |      3</span>
+<span class="c"> cut       | completed |               | 19:01:02  | 19:01:08 |      1</span>
+</code></pre></div>
+
+<p><strong>Checklist after processing:</strong></p><ul>
+<li>☐ <code>videos.status = 'completed'</code> — pipeline finished</li>
+<li>☐ <code>processor_results</code> all show <code>status = 'completed'</code></li>
+<li>☐ <code>chunks_produced &gt; 0</code> — each processor produced output</li>
+<li>☐ <code>chunk</code> table has rows with correct chunk_type (<code>cut</code>, <code>sentence</code>)</li>
+<li>☐ <code>chunk_id</code> format is <code>{file_uuid}_{start}_{end}</code> (Bug #2 fix verified)</li></ul>
+<hr />
+<h2>8. Search Chunks</h2>
+<p>After processing, search the generated chunks:</p>
+<div class="codehilite"><pre><span></span><code><span class="c1"># Text search (ASR output)</span>
+curl<span class="w"> </span>-s<span class="w"> </span>-X<span class="w"> </span>POST<span class="w"> </span><span class="s2">&quot;http://m5api.momentry.ddns.net/api/v1/search/universal&quot;</span><span class="w"> </span><span class="se">\</span>
+<span class="w">    </span>-H<span class="w"> </span><span class="s2">&quot;X-API-Key: muser_68600856036340bcafc01930eb4bd839_1774418104_97221b69&quot;</span><span class="w"> </span><span class="se">\</span>
+<span class="w">    </span>-H<span class="w"> </span><span class="s2">&quot;Content-Type: application/json&quot;</span><span class="w"> </span><span class="se">\</span>
+<span class="w">    </span>-d<span class="w"> </span><span class="s2">&quot;{\&quot;query\&quot;: \&quot;test\&quot;, \&quot;uuid\&quot;: \&quot;</span><span class="si">${</span><span class="nv">FILE_UUID</span><span class="si">}</span><span class="s2">\&quot;, \&quot;limit\&quot;: 5}&quot;</span><span class="w"> </span><span class="se">\</span>
+<span class="w">    </span><span class="p">|</span><span class="w"> </span>python3<span class="w"> </span>-c<span class="w"> </span><span class="s2">&quot;</span>
+<span class="s2">import json,sys;d=json.load(sys.stdin)</span>
+<span class="s2">print(f&#39;Total hits: {d[\&quot;total\&quot;]}&#39;)</span>
+<span class="s2">for r in d[&#39;results&#39;]:</span>
+<span class="s2">    if r.get(&#39;chunk_id&#39;):</span>
+<span class="s2">        print(f&#39;  {r[\&quot;chunk_id\&quot;]}: \&quot;{r.get(\&quot;text\&quot;,\&quot;\&quot;)[:60]}\&quot; score={r.get(\&quot;score\&quot;,0):.3f}&#39;)</span>
+<span class="s2">&quot;</span>
+</code></pre></div>
+
+<p>Output:</p>
+<div class="codehilite"><pre><span></span><code>Total hits: 3
+  e1111111111111111111111111111111_0_5: &quot;test pattern test pattern...&quot; score=0.423
+  e1111111111111111111111111111111_5_10: &quot;silence&quot; score=0.215
+</code></pre></div>
+
+<p>Get a specific chunk by ID:</p>
+<div class="codehilite"><pre><span></span><code><span class="c1"># Single chunk detail  </span>
+curl<span class="w"> </span>-s<span class="w"> </span>-H<span class="w"> </span><span class="s2">&quot;X-API-Key: muser_68600856036340bcafc01930eb4bd839_1774418104_97221b69&quot;</span><span class="w"> </span><span class="se">\</span>
+<span class="w">    </span><span class="s2">&quot;http://m5api.momentry.ddns.net/api/v1/file/</span><span class="si">${</span><span class="nv">FILE_UUID</span><span class="si">}</span><span class="s2">/chunk/</span><span class="si">${</span><span class="nv">FILE_UUID</span><span class="si">}</span><span class="s2">_0_5&quot;</span><span class="w"> </span><span class="se">\</span>
+<span class="w">    </span><span class="p">|</span><span class="w"> </span>python3<span class="w"> </span>-c<span class="w"> </span><span class="s2">&quot;</span>
+<span class="s2">import json,sys;d=json.load(sys.stdin)</span>
+<span class="s2">print(f&#39;Type: {d[\&quot;chunk_type\&quot;]}  Rule: {d[\&quot;rule\&quot;]}&#39;)</span>
+<span class="s2">print(f&#39;Frame: {d[\&quot;start_frame\&quot;]}–{d[\&quot;end_frame\&quot;]}  FPS: {d[\&quot;fps\&quot;]}&#39;)</span>
+<span class="s2">print(f&#39;Text: {d[\&quot;text_content\&quot;][:100]}&#39;)</span>
+<span class="s2">&quot;</span>
+</code></pre></div>
+
+<hr />
+<h2>9. Health Check</h2>
+<div class="codehilite"><pre><span></span><code><span class="c1"># Basic health</span>
+curl<span class="w"> </span>-sf<span class="w"> </span>http://m5api.momentry.ddns.net/health<span class="w"> </span><span class="p">|</span><span class="w"> </span>python3<span class="w"> </span>-m<span class="w"> </span>json.tool
+
+<span class="c1"># Detailed health (services + pipeline + schema + resources)</span>
+curl<span class="w"> </span>-sf<span class="w"> </span>http://m5api.momentry.ddns.net/health/detailed<span class="w"> </span><span class="p">|</span><span class="w"> </span>python3<span class="w"> </span>-c<span class="w"> </span><span class="s2">&quot;</span>
+<span class="s2">import json,sys;d=json.load(sys.stdin)</span>
+<span class="s2">p=d[&#39;pipeline&#39;];s=d[&#39;schema&#39;]</span>
+<span class="s2">print(f&#39;Status:   {d[\&quot;status\&quot;]}&#39;)</span>
+<span class="s2">print(f&#39;Build:    {d[\&quot;build_git_hash\&quot;]}&#39;)</span>
+<span class="s2">print(f&#39;Services: postgres={d[\&quot;services\&quot;][\&quot;postgres\&quot;][\&quot;status\&quot;]} redis={d[\&quot;services\&quot;][\&quot;redis\&quot;][\&quot;status\&quot;]}&#39;)</span>
+<span class="s2">print(f&#39;Schema:   {s[\&quot;applied\&quot;][-1][\&quot;filename\&quot;] if s[\&quot;applied\&quot;] else \&quot;none\&quot;} ({len(s[\&quot;applied\&quot;])}/{len(s[\&quot;required\&quot;])} applied, ok={s[\&quot;ok\&quot;]})&#39;)</span>
+<span class="s2">print(f&#39;Scripts:  {p[\&quot;scripts_count\&quot;]} files, integrity={p[\&quot;scripts_integrity\&quot;][\&quot;matched\&quot;]}/{p[\&quot;scripts_integrity\&quot;][\&quot;total\&quot;]}&#39;)</span>
+<span class="s2">print(f&#39;Procs:    &#39; + &#39; &#39;.join([k for k,v in p[&#39;processors&#39;].items() if v and k != &#39;total_py_files&#39;]))</span>
+<span class="s2">&quot;</span>
+</code></pre></div>
+
+<p>Output:</p>
+<div class="codehilite"><pre><span></span><code>Status:   ok
+Build:    0e73d2a
+Services: postgres=ok redis=ok
+Schema:   migrate_fix_chunk_id_format.sql (8/8 applied, ok=True)
+Scripts:  286 files, integrity=345/345
+Procs:    asr yolo face pose ocr cut caption scene story asrx probe visual_chunk
+</code></pre></div>
+
+<hr />
+<h2>10. Schema Version</h2>
+<p>Each binary embeds a list of required migrations. At startup and via <code>/health/detailed</code>, the server verifies all migrations are applied.</p>
+<div class="codehilite"><pre><span></span><code><span class="c1"># Check schema version via API</span>
+curl<span class="w"> </span>-sf<span class="w"> </span>http://m5api.momentry.ddns.net/health/detailed<span class="w"> </span><span class="p">|</span><span class="w"> </span>python3<span class="w"> </span>-c<span class="w"> </span><span class="s2">&quot;</span>
+<span class="s2">import json,sys;d=json.load(sys.stdin)[&#39;schema&#39;]</span>
+<span class="s2">print(f&#39;Table exists: {d[\&quot;table_exists\&quot;]}&#39;)</span>
+<span class="s2">print(f&#39;All OK:       {d[\&quot;ok\&quot;]}&#39;)</span>
+<span class="s2">for m in d[&#39;required&#39;]:</span>
+<span class="s2">    match = &#39;✓&#39; if any(a[&#39;filename&#39;]==m[&#39;filename&#39;] and a[&#39;checksum&#39;]==m[&#39;checksum&#39;] for a in d[&#39;applied&#39;]) else &#39;✗&#39;</span>
+<span class="s2">    print(f&#39;  {match} {m[\&quot;filename\&quot;]}  {m[\&quot;checksum\&quot;][:16]}&#39;)</span>
+<span class="s2">&quot;</span>
+</code></pre></div>
+
+<p>Output:</p>
+<div class="codehilite"><pre><span></span><code>Table exists: True
+All OK:       True
+  ✓ migrate_add_content_hash.sql  42b81554248c4bec
+  ✓ migrate_add_registered_status.sql  566fdfcdc624f6fa
+  ✓ migrate_add_schema_version.sql  585b31df6056a937
+  ✓ migrate_cleanup_inactive_identities.sql  daa52a0827b24a77
+  ✓ migrate_fix_chunk_id_format.sql  a1b2c3d4e5f6a7b8
+  ✓ migrate_public_schema_v4.sql  973908076c614363
+  ✓ migrate_public_schema_v4_tables.sql  1d62dc42e4dec8f4
+  ✓ migrate_public_v4_complete.sql  2a6fda7d2c5660e4
+</code></pre></div>
+
+<p>If a migration is missing at startup:</p>
+<div class="codehilite"><pre><span></span><code>[SCHEMA] 7/8 migrations applied. Missing: migrate_fix_chunk_id_format.sql
+</code></pre></div>
+
+<hr />
+<hr />
+<h2>Summary Checklist</h2>
+<p>After completing a pipeline run, verify all items:</p>
+<h3>Registration</h3>
+<table class="table">
+<thead>
+<tr>
+<th>#</th>
+<th>Check</th>
+<th>Expected</th>
+<th style="text-align: center;">Pass</th>
+</tr>
+</thead>
+<tbody>
+<tr>
+<td>1</td>
+<td><code>videos.status</code></td>
+<td><code>registered</code></td>
+<td style="text-align: center;">☐</td>
+</tr>
+<tr>
+<td>2</td>
+<td>file_uuid consistency</td>
+<td>API response uuid = DB uuid</td>
+<td style="text-align: center;">☐</td>
+</tr>
+<tr>
+<td>3</td>
+<td>Probe returns metadata</td>
+<td><code>duration &gt; 0</code>, <code>fps &gt; 0</code></td>
+<td style="text-align: center;">☐</td>
+</tr>
+<tr>
+<td>4</td>
+<td>Probe error (Bug #3)</td>
+<td>Bad UUID → JSON error + 404</td>
+<td style="text-align: center;">☐</td>
+</tr>
+</tbody>
+</table>
+<h3>Processing</h3>
+<table class="table">
+<thead>
+<tr>
+<th>#</th>
+<th>Check</th>
+<th>Expected</th>
+<th style="text-align: center;">Pass</th>
+</tr>
+</thead>
+<tbody>
+<tr>
+<td>5</td>
+<td>Job created</td>
+<td><code>monitor_jobs.status = PENDING</code></td>
+<td style="text-align: center;">☐</td>
+</tr>
+<tr>
+<td>6</td>
+<td>Processors queued</td>
+<td><code>processor_results</code> rows = requested count</td>
+<td style="text-align: center;">☐</td>
+</tr>
+<tr>
+<td>7</td>
+<td>Worker picks up job</td>
+<td><code>monitor_jobs.status → RUNNING</code></td>
+<td style="text-align: center;">☐</td>
+</tr>
+<tr>
+<td>8</td>
+<td>SHA256 integrity (Bug #2)</td>
+<td><code>[INTEGRITY] *.py checksum OK</code></td>
+<td style="text-align: center;">☐</td>
+</tr>
+<tr>
+<td>9</td>
+<td>Each processor completes</td>
+<td><code>processor_results.status = completed</code></td>
+<td style="text-align: center;">☐</td>
+</tr>
+<tr>
+<td>10</td>
+<td>No processor errors</td>
+<td><code>error_message</code> all NULL</td>
+<td style="text-align: center;">☐</td>
+</tr>
+<tr>
+<td>11</td>
+<td>Pipeline completes</td>
+<td><code>videos.status = completed</code></td>
+<td style="text-align: center;">☐</td>
+</tr>
+</tbody>
+</table>
+<h3>Results</h3>
+<table class="table">
+<thead>
+<tr>
+<th>#</th>
+<th>Check</th>
+<th>Expected</th>
+<th style="text-align: center;">Pass</th>
+</tr>
+</thead>
+<tbody>
+<tr>
+<td>12</td>
+<td>Chunks produced</td>
+<td><code>chunk</code> table has &gt; 0 rows</td>
+<td style="text-align: center;">☐</td>
+</tr>
+<tr>
+<td>13</td>
+<td>Chunk ID format</td>
+<td><code>chunk_id = {uuid}_{start}_{end}</code></td>
+<td style="text-align: center;">☐</td>
+</tr>
+<tr>
+<td>14</td>
+<td>Chunk fallback (Bug #2)</td>
+<td>Old integer ID → 200 via handler fallback</td>
+<td style="text-align: center;">☐</td>
+</tr>
+<tr>
+<td>15</td>
+<td>Search works</td>
+<td><code>POST /search/universal</code> returns hits</td>
+<td style="text-align: center;">☐</td>
+</tr>
+<tr>
+<td>16</td>
+<td>Schema version</td>
+<td><code>schema.ok = true</code> in <code>/health/detailed</code></td>
+<td style="text-align: center;">☐</td>
+</tr>
+</tbody>
+</table>
+<hr />
+<h2>Full Automation Script</h2>
+<p>Save as <code>demo_full_cycle.sh</code>:</p>
+<div class="codehilite"><pre><span></span><code><span class="ch">#!/bin/bash</span>
+<span class="nb">set</span><span class="w"> </span>-euo<span class="w"> </span>pipefail
+
+<span class="nv">API</span><span class="o">=</span><span class="s2">&quot;http://m5api.momentry.ddns.net&quot;</span>
+<span class="nv">KEY</span><span class="o">=</span><span class="s2">&quot;muser_68600856036340bcafc01930eb4bd839_1774418104_97221b69&quot;</span>
+<span class="nv">PG</span><span class="o">=</span><span class="s2">&quot;/Users/accusys/pgsql/18.3/bin&quot;</span>
+
+<span class="c1"># Generate test video</span>
+ffmpeg<span class="w"> </span>-y<span class="w"> </span>-f<span class="w"> </span>lavfi<span class="w"> </span>-i<span class="w"> </span><span class="s2">&quot;testsrc=duration=5:size=640x480:rate=24&quot;</span><span class="w"> </span><span class="se">\</span>
+<span class="w">    </span>-f<span class="w"> </span>lavfi<span class="w"> </span>-i<span class="w"> </span><span class="s2">&quot;anullsrc=r=44100:cl=mono&quot;</span><span class="w"> </span><span class="se">\</span>
+<span class="w">    </span>-c:v<span class="w"> </span>libx264<span class="w"> </span>-preset<span class="w"> </span>ultrafast<span class="w"> </span>-crf<span class="w"> </span><span class="m">28</span><span class="w"> </span>-c:a<span class="w"> </span>aac<span class="w"> </span>-shortest<span class="w"> </span><span class="se">\</span>
+<span class="w">    </span>/tmp/auto_demo.mp4<span class="w"> </span><span class="m">2</span>&gt;/dev/null
+
+<span class="c1"># Register</span>
+<span class="nv">UUID</span><span class="o">=</span><span class="k">$(</span>curl<span class="w"> </span>-sf<span class="w"> </span>-X<span class="w"> </span>POST<span class="w"> </span><span class="s2">&quot;</span><span class="nv">$API</span><span class="s2">/api/v1/files/register&quot;</span><span class="w"> </span><span class="se">\</span>
+<span class="w">    </span>-H<span class="w"> </span><span class="s2">&quot;X-API-Key: </span><span class="nv">$KEY</span><span class="s2">&quot;</span><span class="w"> </span>-H<span class="w"> </span><span class="s2">&quot;Content-Type: application/json&quot;</span><span class="w"> </span><span class="se">\</span>
+<span class="w">    </span>-d<span class="w"> </span><span class="s1">&#39;{&quot;file_path&quot;: &quot;/tmp/auto_demo.mp4&quot;}&#39;</span><span class="w"> </span><span class="p">|</span><span class="w"> </span>python3<span class="w"> </span>-c<span class="w"> </span><span class="s2">&quot;import json,sys;print(json.load(sys.stdin)[&#39;file_uuid&#39;])&quot;</span><span class="k">)</span>
+<span class="nb">echo</span><span class="w"> </span><span class="s2">&quot;Registered: </span><span class="nv">$UUID</span><span class="s2">&quot;</span>
+
+<span class="c1"># Process</span>
+curl<span class="w"> </span>-sf<span class="w"> </span>-X<span class="w"> </span>POST<span class="w"> </span><span class="s2">&quot;</span><span class="nv">$API</span><span class="s2">/api/v1/file/</span><span class="nv">$UUID</span><span class="s2">/process&quot;</span><span class="w"> </span><span class="se">\</span>
+<span class="w">    </span>-H<span class="w"> </span><span class="s2">&quot;X-API-Key: </span><span class="nv">$KEY</span><span class="s2">&quot;</span><span class="w"> </span>-H<span class="w"> </span><span class="s2">&quot;Content-Type: application/json&quot;</span><span class="w"> </span><span class="se">\</span>
+<span class="w">    </span>-d<span class="w"> </span><span class="s1">&#39;{&quot;processors&quot;:[&quot;asr&quot;,&quot;cut&quot;]}&#39;</span><span class="w"> </span>&gt;<span class="w"> </span>/dev/null
+<span class="nb">echo</span><span class="w"> </span><span class="s2">&quot;Processing triggered&quot;</span>
+
+<span class="c1"># Run worker</span>
+<span class="nv">DATABASE_SCHEMA</span><span class="o">=</span>dev<span class="w"> </span>target/debug/momentry_playground<span class="w"> </span>worker<span class="w"> </span><span class="se">\</span>
+<span class="w">    </span>--max-concurrent<span class="w"> </span><span class="m">1</span><span class="w"> </span>--poll-interval<span class="w"> </span><span class="m">3</span><span class="w"> </span><span class="p">&amp;</span>
+<span class="nv">WPID</span><span class="o">=</span><span class="nv">$!</span>
+sleep<span class="w"> </span><span class="m">30</span>
+<span class="nb">kill</span><span class="w"> </span><span class="nv">$WPID</span><span class="w"> </span><span class="m">2</span>&gt;/dev/null<span class="w"> </span><span class="o">||</span><span class="w"> </span><span class="nb">true</span>
+
+<span class="c1"># Results</span>
+<span class="s2">&quot;</span><span class="nv">$PG</span><span class="s2">/psql&quot;</span><span class="w"> </span>-U<span class="w"> </span>accusys<span class="w"> </span>-d<span class="w"> </span>momentry<span class="w"> </span>-c<span class="w"> </span><span class="s2">&quot;</span>
+<span class="s2">SELECT processor, status FROM dev.processor_results WHERE file_uuid=&#39;</span><span class="nv">$UUID</span><span class="s2">&#39; ORDER BY id&quot;</span>
+<span class="nb">echo</span><span class="w"> </span><span class="s2">&quot;Done: </span><span class="nv">$UUID</span><span class="s2">&quot;</span>
+</code></pre></div>
+</div>
+</body>
+</html>
\ No newline at end of file
diff --git a/docs_v1.0/doc_user/M5API_Pipeline_Demo.html b/docs_v1.0/doc_user/M5API_Pipeline_Demo.html
new file mode 100644
index 0000000..141ef3f
--- /dev/null
+++ b/docs_v1.0/doc_user/M5API_Pipeline_Demo.html
@@ -0,0 +1,472 @@
+<!DOCTYPE html>
+<html lang="en">
+<head>
+<meta charset="UTF-8">
+<title>M5API Pipeline Demo - Momentry API Docs</title>
+<style>
+* { margin: 0; padding: 0; box-sizing: border-box; }
+body { font-family: -apple-system, BlinkMacSystemFont, 'Segoe UI', Roboto, sans-serif; background: #f5f5f5; color: #333; padding: 40px; }
+.container { max-width: 960px; margin: 0 auto; background: white; border-radius: 12px; box-shadow: 0 2px 12px rgba(0,0,0,0.08); padding: 40px; }
+h1 { font-size: 24px; margin: 24px 0 12px; }
+h2 { font-size: 20px; margin: 20px 0 10px; color: #222; }
+h3 { font-size: 16px; margin: 16px 0 8px; color: #444; }
+p { line-height: 1.6; margin: 8px 0; }
+table { border-collapse: collapse; width: 100%; margin: 12px 0; font-size: 14px; }
+th, td { border: 1px solid #ddd; padding: 8px 12px; text-align: left; }
+th { background: #f0f0f0; font-weight: 600; }
+code { background: #f0f0f0; padding: 2px 6px; border-radius: 3px; font-size: 13px; }
+pre { background: #f8f8f8; border: 1px solid #ddd; border-radius: 6px; padding: 12px; overflow-x: auto; margin: 12px 0; }
+pre code { background: none; padding: 0; }
+a { color: #0066cc; }
+.back { display: inline-block; margin-bottom: 20px; color: #666; }
+.back:hover { color: #333; }
+</style>
+</head>
+<body>
+<div class="container">
+<a class="back" href="index.html">&larr; Back to index</a>
+<hr />
+<pre><code>document_type: "demo_guide"
+service: "MOMENTRY_CORE"
+title: "M5API Pipeline Demo"
+date: "2026-05-16"
+version: "V1.0"
+status: "active"
+owner: "M5"
+created_by: "OpenCode"
+tags:
+  - "demo"
+  - "pipeline"
+  - "api"
+  - "m5api"
+ai_query_hints:
+  - "M5API Pipeline demo"
+  - "如何透過 M5 的 API 執行 Pipeline"
+related_documents:
+  - "GUIDES/Demo_EndToEnd.md"
+  - "GUIDES/API_ENDPOINTS.md"</code></pre>
+<hr />
+<h1>Momentry Core — M5API Pipeline Demo</h1>
+<table class="table">
+<thead>
+<tr>
+<th>項目</th>
+<th>內容</th>
+</tr>
+</thead>
+<tbody>
+<tr>
+<td>建立者</td>
+<td>OpenCode</td>
+</tr>
+<tr>
+<td>建立時間</td>
+<td>2026-05-16</td>
+</tr>
+<tr>
+<td>文件版本</td>
+<td>V1.0</td>
+</tr>
+<tr>
+<td>目標讀者</td>
+<td>developer</td>
+</tr>
+<tr>
+<td>預備知識</td>
+<td>需有 API Key、M5 服務已啟動</td>
+</tr>
+</tbody>
+</table>
+<hr />
+<h2>Prerequisites</h2>
+<div class="codehilite"><pre><span></span><code><span class="nv">API</span><span class="o">=</span><span class="s2">&quot;https://m5api.momentry.ddns.net&quot;</span>
+<span class="nv">KEY</span><span class="o">=</span><span class="s2">&quot;muser_68600856036340bcafc01930eb4bd839_1774418104_97221b69&quot;</span>
+</code></pre></div>
+
+<hr />
+<h2>Step 1: System Health Check</h2>
+<div class="codehilite"><pre><span></span><code>curl<span class="w"> </span>-sf<span class="w"> </span><span class="s2">&quot;</span><span class="nv">$API</span><span class="s2">/health&quot;</span><span class="w"> </span><span class="p">|</span><span class="w"> </span>jq<span class="w"> </span><span class="s1">&#39;{ip, port, status, version, build_git_hash}&#39;</span>
+</code></pre></div>
+
+<p>Response:</p>
+<div class="codehilite"><pre><span></span><code><span class="p">{</span>
+<span class="w">  </span><span class="nt">&quot;ip&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;192.168.110.201&quot;</span><span class="p">,</span>
+<span class="w">  </span><span class="nt">&quot;port&quot;</span><span class="p">:</span><span class="w"> </span><span class="mi">3002</span><span class="p">,</span>
+<span class="w">  </span><span class="nt">&quot;status&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;ok&quot;</span><span class="p">,</span>
+<span class="w">  </span><span class="nt">&quot;version&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;1.0.0&quot;</span><span class="p">,</span>
+<span class="w">  </span><span class="nt">&quot;build_git_hash&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;c41f7e0c&quot;</span>
+<span class="p">}</span>
+</code></pre></div>
+
+<p>Verify all core services:</p>
+<div class="codehilite"><pre><span></span><code>curl<span class="w"> </span>-sf<span class="w"> </span><span class="s2">&quot;</span><span class="nv">$API</span><span class="s2">/health/detailed&quot;</span><span class="w"> </span><span class="p">|</span><span class="w"> </span>jq<span class="w"> </span><span class="s1">&#39;{</span>
+<span class="s1">  services, schema: .schema.ok,</span>
+<span class="s1">  scripts: .pipeline.scripts_count,</span>
+<span class="s1">  integrity: .pipeline.scripts_integrity,</span>
+<span class="s1">  procs: [.pipeline.processors | to_entries[] | select(.value==true and .key!=&quot;total_py_files&quot;) | .key]</span>
+<span class="s1">}&#39;</span>
+</code></pre></div>
+
+<p>Response:</p>
+<div class="codehilite"><pre><span></span><code><span class="p">{</span>
+<span class="w">  </span><span class="nt">&quot;services&quot;</span><span class="p">:</span><span class="w"> </span><span class="p">{</span>
+<span class="w">    </span><span class="nt">&quot;postgres&quot;</span><span class="p">:</span><span class="w"> </span><span class="p">{</span><span class="nt">&quot;status&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;ok&quot;</span><span class="p">},</span>
+<span class="w">    </span><span class="nt">&quot;redis&quot;</span><span class="p">:</span><span class="w"> </span><span class="p">{</span><span class="nt">&quot;status&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;ok&quot;</span><span class="p">},</span>
+<span class="w">    </span><span class="nt">&quot;qdrant&quot;</span><span class="p">:</span><span class="w"> </span><span class="p">{</span><span class="nt">&quot;status&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;ok&quot;</span><span class="p">},</span>
+<span class="w">    </span><span class="nt">&quot;mongodb&quot;</span><span class="p">:</span><span class="w"> </span><span class="p">{</span><span class="nt">&quot;status&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;ok&quot;</span><span class="p">}</span>
+<span class="w">  </span><span class="p">},</span>
+<span class="w">  </span><span class="nt">&quot;schema&quot;</span><span class="p">:</span><span class="w"> </span><span class="kc">true</span><span class="p">,</span>
+<span class="w">  </span><span class="nt">&quot;scripts&quot;</span><span class="p">:</span><span class="w"> </span><span class="mi">286</span><span class="p">,</span>
+<span class="w">  </span><span class="nt">&quot;integrity&quot;</span><span class="p">:</span><span class="w"> </span><span class="p">{</span><span class="nt">&quot;matched&quot;</span><span class="p">:</span><span class="w"> </span><span class="mi">345</span><span class="p">,</span><span class="w"> </span><span class="nt">&quot;total&quot;</span><span class="p">:</span><span class="w"> </span><span class="mi">345</span><span class="p">,</span><span class="w"> </span><span class="nt">&quot;ok&quot;</span><span class="p">:</span><span class="w"> </span><span class="kc">true</span><span class="p">},</span>
+<span class="w">  </span><span class="nt">&quot;procs&quot;</span><span class="p">:</span><span class="w"> </span><span class="p">[</span><span class="s2">&quot;asr&quot;</span><span class="p">,</span><span class="s2">&quot;yolo&quot;</span><span class="p">,</span><span class="s2">&quot;face&quot;</span><span class="p">,</span><span class="s2">&quot;pose&quot;</span><span class="p">,</span><span class="s2">&quot;ocr&quot;</span><span class="p">,</span><span class="s2">&quot;cut&quot;</span><span class="p">,</span><span class="s2">&quot;caption&quot;</span><span class="p">,</span><span class="s2">&quot;scene&quot;</span><span class="p">,</span><span class="s2">&quot;story&quot;</span><span class="p">,</span><span class="s2">&quot;asrx&quot;</span><span class="p">,</span><span class="s2">&quot;probe&quot;</span><span class="p">,</span><span class="s2">&quot;visual_chunk&quot;</span><span class="p">]</span>
+<span class="p">}</span>
+</code></pre></div>
+
+<hr />
+<h2>Step 2: List Registered Files</h2>
+<div class="codehilite"><pre><span></span><code>curl<span class="w"> </span>-sf<span class="w"> </span>-H<span class="w"> </span><span class="s2">&quot;X-API-Key: </span><span class="nv">$KEY</span><span class="s2">&quot;</span><span class="w"> </span><span class="s2">&quot;</span><span class="nv">$API</span><span class="s2">/api/v1/files?page=1&amp;page_size=5&quot;</span><span class="w"> </span><span class="p">|</span><span class="w"> </span><span class="se">\</span>
+<span class="w">  </span>jq<span class="w"> </span><span class="s1">&#39;{total, files: [.data[]? | {name: .file_name[0:50], status}]}&#39;</span>
+</code></pre></div>
+
+<p>Response:</p>
+<div class="codehilite"><pre><span></span><code><span class="p">{</span>
+<span class="w">  </span><span class="nt">&quot;total&quot;</span><span class="p">:</span><span class="w"> </span><span class="mi">56</span><span class="p">,</span>
+<span class="w">  </span><span class="nt">&quot;files&quot;</span><span class="p">:</span><span class="w"> </span><span class="p">[</span>
+<span class="w">    </span><span class="p">{</span><span class="nt">&quot;name&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;Charade (1963) Cary Grant &amp; Audrey Hepburn ...&quot;</span><span class="p">,</span><span class="w"> </span><span class="nt">&quot;status&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;completed&quot;</span><span class="p">},</span>
+<span class="w">    </span><span class="p">{</span><span class="nt">&quot;name&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;ExaSAN PCIe series - Director Ou Yu-Zhi ...&quot;</span><span class="p">,</span><span class="w"> </span><span class="nt">&quot;status&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;completed&quot;</span><span class="p">},</span>
+<span class="w">    </span><span class="p">{</span><span class="nt">&quot;name&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;Old_Time_Movie_Show_-_Charade_1963.HD.mov&quot;</span><span class="p">,</span><span class="w"> </span><span class="nt">&quot;status&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;completed&quot;</span><span class="p">},</span>
+<span class="w">    </span><span class="p">{</span><span class="nt">&quot;name&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;Old Felix the Cat Cartoon.mp4&quot;</span><span class="p">,</span><span class="w"> </span><span class="nt">&quot;status&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;unregistered&quot;</span><span class="p">},</span>
+<span class="w">    </span><span class="p">{</span><span class="nt">&quot;name&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;short_clip.mov&quot;</span><span class="p">,</span><span class="w"> </span><span class="nt">&quot;status&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;completed&quot;</span><span class="p">}</span>
+<span class="w">  </span><span class="p">]</span>
+<span class="p">}</span>
+</code></pre></div>
+
+<hr />
+<h2>Step 3: Register a New File</h2>
+<div class="codehilite"><pre><span></span><code><span class="c1"># POST with file_path (must exist on server filesystem)</span>
+curl<span class="w"> </span>-sf<span class="w"> </span>-X<span class="w"> </span>POST<span class="w"> </span>-H<span class="w"> </span><span class="s2">&quot;X-API-Key: </span><span class="nv">$KEY</span><span class="s2">&quot;</span><span class="w"> </span>-H<span class="w"> </span><span class="s2">&quot;Content-Type: application/json&quot;</span><span class="w"> </span><span class="se">\</span>
+<span class="w">  </span>-d<span class="w"> </span><span class="s1">&#39;{&quot;file_path&quot;: &quot;/path/to/video.mp4&quot;}&#39;</span><span class="w"> </span><span class="se">\</span>
+<span class="w">  </span><span class="s2">&quot;</span><span class="nv">$API</span><span class="s2">/api/v1/files/register&quot;</span><span class="w"> </span><span class="p">|</span><span class="w"> </span>jq<span class="w"> </span><span class="s1">&#39;{success, file_uuid, file_name, file_type, duration, fps, already_exists}&#39;</span>
+</code></pre></div>
+
+<p>Response (new registration):</p>
+<div class="codehilite"><pre><span></span><code><span class="p">{</span>
+<span class="w">  </span><span class="nt">&quot;success&quot;</span><span class="p">:</span><span class="w"> </span><span class="kc">true</span><span class="p">,</span>
+<span class="w">  </span><span class="nt">&quot;file_uuid&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;3abeee81d94597629ed8cb943f182e94&quot;</span><span class="p">,</span>
+<span class="w">  </span><span class="nt">&quot;file_name&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;Charade (1963) Cary Grant &amp; Audrey Hepburn ...mp4&quot;</span><span class="p">,</span>
+<span class="w">  </span><span class="nt">&quot;file_type&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;video&quot;</span><span class="p">,</span>
+<span class="w">  </span><span class="nt">&quot;duration&quot;</span><span class="p">:</span><span class="w"> </span><span class="mf">6785.014</span><span class="p">,</span>
+<span class="w">  </span><span class="nt">&quot;fps&quot;</span><span class="p">:</span><span class="w"> </span><span class="mf">23.976</span><span class="p">,</span>
+<span class="w">  </span><span class="nt">&quot;already_exists&quot;</span><span class="p">:</span><span class="w"> </span><span class="kc">false</span>
+<span class="p">}</span>
+</code></pre></div>
+
+<p>Response (duplicate content — SHA256 dedup):</p>
+<div class="codehilite"><pre><span></span><code><span class="p">{</span>
+<span class="w">  </span><span class="nt">&quot;success&quot;</span><span class="p">:</span><span class="w"> </span><span class="kc">true</span><span class="p">,</span>
+<span class="w">  </span><span class="nt">&quot;already_exists&quot;</span><span class="p">:</span><span class="w"> </span><span class="kc">true</span><span class="p">,</span>
+<span class="w">  </span><span class="nt">&quot;message&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;Content already registered (identical file)&quot;</span>
+<span class="p">}</span>
+</code></pre></div>
+
+<hr />
+<h2>Step 4: Probe (ffprobe Metadata)</h2>
+<div class="codehilite"><pre><span></span><code><span class="nv">UUID</span><span class="o">=</span><span class="s2">&quot;3abeee81d94597629ed8cb943f182e94&quot;</span>
+
+curl<span class="w"> </span>-sf<span class="w"> </span>-H<span class="w"> </span><span class="s2">&quot;X-API-Key: </span><span class="nv">$KEY</span><span class="s2">&quot;</span><span class="w"> </span><span class="s2">&quot;</span><span class="nv">$API</span><span class="s2">/api/v1/file/</span><span class="si">${</span><span class="nv">UUID</span><span class="si">}</span><span class="s2">/probe&quot;</span><span class="w"> </span><span class="p">|</span><span class="w"> </span><span class="se">\</span>
+<span class="w">  </span>jq<span class="w"> </span><span class="s1">&#39;{name: .file_name, video: &quot;\(.width)x\(.height)&quot;, fps, duration, cached, streams: [.streams[] | {type: .codec_type, codec: .codec_name}]}&#39;</span>
+</code></pre></div>
+
+<p>Response:</p>
+<div class="codehilite"><pre><span></span><code><span class="p">{</span>
+<span class="w">  </span><span class="nt">&quot;name&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;Charade (1963) Cary Grant &amp; Audrey Hepburn ...mp4&quot;</span><span class="p">,</span>
+<span class="w">  </span><span class="nt">&quot;video&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;720x304&quot;</span><span class="p">,</span>
+<span class="w">  </span><span class="nt">&quot;fps&quot;</span><span class="p">:</span><span class="w"> </span><span class="mf">23.976</span><span class="p">,</span>
+<span class="w">  </span><span class="nt">&quot;duration&quot;</span><span class="p">:</span><span class="w"> </span><span class="mf">6785.014</span><span class="p">,</span>
+<span class="w">  </span><span class="nt">&quot;cached&quot;</span><span class="p">:</span><span class="w"> </span><span class="kc">true</span><span class="p">,</span>
+<span class="w">  </span><span class="nt">&quot;streams&quot;</span><span class="p">:</span><span class="w"> </span><span class="p">[</span>
+<span class="w">    </span><span class="p">{</span><span class="nt">&quot;type&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;video&quot;</span><span class="p">,</span><span class="w"> </span><span class="nt">&quot;codec&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;h264&quot;</span><span class="p">},</span>
+<span class="w">    </span><span class="p">{</span><span class="nt">&quot;type&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;audio&quot;</span><span class="p">,</span><span class="w"> </span><span class="nt">&quot;codec&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;aac&quot;</span><span class="p">}</span>
+<span class="w">  </span><span class="p">]</span>
+<span class="p">}</span>
+</code></pre></div>
+
+<p>Error cases:</p>
+<div class="codehilite"><pre><span></span><code><span class="c1"># Non-existent UUID</span>
+curl<span class="w"> </span>-s<span class="w"> </span><span class="s2">&quot;https://m5api.momentry.ddns.net/api/v1/file/bad_uuid/probe&quot;</span>
+<span class="c1"># → {&quot;error&quot;:&quot;Video not found&quot;,&quot;file_uuid&quot;:&quot;bad_uuid&quot;}  HTTP 404</span>
+
+<span class="c1"># File deleted from disk</span>
+<span class="c1"># → {&quot;error&quot;:&quot;File does not exist at registered path&quot;,&quot;file_uuid&quot;:&quot;...&quot;,&quot;file_path&quot;:&quot;...&quot;}  HTTP 404</span>
+</code></pre></div>
+
+<hr />
+<h2>Step 5: Submit Processing Job</h2>
+<div class="codehilite"><pre><span></span><code><span class="c1"># Specific processors</span>
+curl<span class="w"> </span>-sf<span class="w"> </span>-X<span class="w"> </span>POST<span class="w"> </span>-H<span class="w"> </span><span class="s2">&quot;X-API-Key: </span><span class="nv">$KEY</span><span class="s2">&quot;</span><span class="w"> </span>-H<span class="w"> </span><span class="s2">&quot;Content-Type: application/json&quot;</span><span class="w"> </span><span class="se">\</span>
+<span class="w">  </span>-d<span class="w"> </span><span class="s1">&#39;{&quot;processors&quot;:[&quot;asr&quot;,&quot;cut&quot;,&quot;yolo&quot;,&quot;face&quot;,&quot;pose&quot;,&quot;ocr&quot;]}&#39;</span><span class="w"> </span><span class="se">\</span>
+<span class="w">  </span><span class="s2">&quot;</span><span class="nv">$API</span><span class="s2">/api/v1/file/</span><span class="si">${</span><span class="nv">UUID</span><span class="si">}</span><span class="s2">/process&quot;</span><span class="w"> </span><span class="p">|</span><span class="w"> </span>jq<span class="w"> </span><span class="s1">&#39;{job_id, file_uuid: .file_uuid[0:16], status}&#39;</span>
+</code></pre></div>
+
+<p>Response:</p>
+<div class="codehilite"><pre><span></span><code><span class="p">{</span>
+<span class="w">  </span><span class="nt">&quot;job_id&quot;</span><span class="p">:</span><span class="w"> </span><span class="mi">167</span><span class="p">,</span>
+<span class="w">  </span><span class="nt">&quot;file_uuid&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;3abeee81d9459762&quot;</span><span class="p">,</span>
+<span class="w">  </span><span class="nt">&quot;status&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;PENDING&quot;</span>
+<span class="p">}</span>
+</code></pre></div>
+
+<blockquote>
+<p><strong>All processors</strong>: Send <code>{}</code> (an empty JSON object) to run all 12 processors.
+Available processors include: <code>asr</code>, <code>cut</code>, <code>yolo</code>, <code>face</code>, <code>pose</code>, <code>ocr</code>, <code>asrx</code>, <code>visual_chunk</code>, <code>scene</code>, <code>story</code>, <code>caption</code></p>
+</blockquote>
+<hr />
+<h2>Step 6: Monitor Progress</h2>
+<div class="codehilite"><pre><span></span><code><span class="k">while</span><span class="w"> </span>true<span class="p">;</span><span class="w"> </span><span class="k">do</span>
+<span class="w">  </span><span class="nv">PROGRESS</span><span class="o">=</span><span class="k">$(</span>curl<span class="w"> </span>-sf<span class="w"> </span>-H<span class="w"> </span><span class="s2">&quot;X-API-Key: </span><span class="nv">$KEY</span><span class="s2">&quot;</span><span class="w"> </span><span class="s2">&quot;</span><span class="nv">$API</span><span class="s2">/api/v1/progress/</span><span class="si">${</span><span class="nv">UUID</span><span class="si">}</span><span class="s2">&quot;</span><span class="k">)</span>
+<span class="w">  </span><span class="nv">STATUS</span><span class="o">=</span><span class="k">$(</span><span class="nb">echo</span><span class="w"> </span><span class="s2">&quot;</span><span class="nv">$PROGRESS</span><span class="s2">&quot;</span><span class="w"> </span><span class="p">|</span><span class="w"> </span>jq<span class="w"> </span>-r<span class="w"> </span><span class="s1">&#39;.status // &quot;?&quot;&#39;</span><span class="k">)</span>
+<span class="w">  </span><span class="nv">PROCS</span><span class="o">=</span><span class="k">$(</span><span class="nb">echo</span><span class="w"> </span><span class="s2">&quot;</span><span class="nv">$PROGRESS</span><span class="s2">&quot;</span><span class="w"> </span><span class="p">|</span><span class="w"> </span>jq<span class="w"> </span>-r<span class="w"> </span><span class="s1">&#39;[.processors[]? | &quot;\(.name)=\(.status)(\(.frames_processed))&quot;] | join(&quot;  &quot;)&#39;</span><span class="k">)</span>
+<span class="w">  </span><span class="nb">echo</span><span class="w"> </span><span class="s2">&quot;</span><span class="k">$(</span>date<span class="w"> </span>+%H:%M:%S<span class="k">)</span><span class="s2">: </span><span class="nv">$PROCS</span><span class="s2">&quot;</span>
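+<span class="w">  </span><span class="o">[</span><span class="w"> </span>-n<span class="w"> </span><span class="s2">&quot;</span><span class="nv">$PROCS</span><span class="s2">&quot;</span><span class="w"> </span><span class="o">]</span><span class="w"> </span><span class="o">&amp;&amp;</span><span class="w"> </span>!<span class="w"> </span><span class="nb">echo</span><span class="w"> </span><span class="s2">&quot;</span><span class="nv">$PROCS</span><span class="s2">&quot;</span><span class="w"> </span><span class="p">|</span><span class="w"> </span>grep<span class="w"> </span>-qE<span class="w"> </span><span class="s2">&quot;=(pending|running)&quot;</span><span class="w"> </span><span class="o">&amp;&amp;</span><span class="w"> </span><span class="k">break</span>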
+<span class="w">  </span>sleep<span class="w"> </span><span class="m">10</span>
+<span class="k">done</span>
+</code></pre></div>
+
+<p>Typical output:</p>
+<div class="codehilite"><pre><span></span><code><span class="mf">12</span><span class="p">:</span><span class="mf">30</span><span class="p">:</span><span class="mf">01</span><span class="p">:</span><span class="w"> </span><span class="n">asr</span><span class="o">=</span><span class="n">pending</span><span class="p">(</span><span class="mf">0</span><span class="p">)</span><span class="w">  </span><span class="n">cut</span><span class="o">=</span><span class="n">pending</span><span class="p">(</span><span class="mf">0</span><span class="p">)</span><span class="w">  </span><span class="n">yolo</span><span class="o">=</span><span class="n">pending</span><span class="p">(</span><span class="mf">0</span><span class="p">)</span><span class="w">  </span><span class="n">face</span><span class="o">=</span><span class="n">pending</span><span class="p">(</span><span class="mf">0</span><span class="p">)</span><span class="w">  </span><span class="nb">pos</span><span class="n">e</span><span class="o">=</span><span class="n">pending</span><span class="p">(</span><span class="mf">0</span><span class="p">)</span><span class="w">  </span><span class="n">ocr</span><span class="o">=</span><span class="n">pending</span><span class="p">(</span><span class="mf">0</span><span class="p">)</span>
+<span class="mf">12</span><span class="p">:</span><span class="mf">30</span><span class="p">:</span><span class="mf">11</span><span class="p">:</span><span class="w"> </span><span class="n">asr</span><span class="o">=</span><span class="kr">run</span><span class="n">ning</span><span class="p">(</span><span class="mf">0</span><span class="p">)</span><span class="w">  </span><span class="n">cut</span><span class="o">=</span><span class="kr">run</span><span class="n">ning</span><span class="p">(</span><span class="mf">0</span><span class="p">)</span><span class="w">  </span><span class="n">yolo</span><span class="o">=</span><span class="n">pending</span><span class="p">(</span><span class="mf">0</span><span class="p">)</span><span class="w">  </span><span class="n">face</span><span class="o">=</span><span class="n">pending</span><span class="p">(</span><span class="mf">0</span><span class="p">)</span><span class="w">  </span><span class="nb">pos</span><span class="n">e</span><span class="o">=</span><span class="n">pending</span><span class="p">(</span><span class="mf">0</span><span class="p">)</span><span class="w">  </span><span class="n">ocr</span><span class="o">=</span><span class="n">pending</span><span class="p">(</span><span class="mf">0</span><span class="p">)</span>
+<span class="mf">12</span><span class="p">:</span><span class="mf">30</span><span class="p">:</span><span class="mf">21</span><span class="p">:</span><span class="w"> </span><span class="n">asr</span><span class="o">=</span><span class="kr">run</span><span class="n">ning</span><span class="p">(</span><span class="mf">0</span><span class="p">)</span><span class="w">  </span><span class="n">cut</span><span class="o">=</span><span class="n">completed</span><span class="p">(</span><span class="mf">8951</span><span class="p">)</span><span class="w">  </span><span class="n">yolo</span><span class="o">=</span><span class="kr">run</span><span class="n">ning</span><span class="p">(</span><span class="mf">0</span><span class="p">)</span><span class="w">  </span><span class="n">face</span><span class="o">=</span><span class="n">pending</span><span class="p">(</span><span class="mf">0</span><span class="p">)</span><span class="w">  </span><span class="nb">pos</span><span class="n">e</span><span class="o">=</span><span class="n">pending</span><span class="p">(</span><span class="mf">0</span><span class="p">)</span><span class="w">  </span><span class="n">ocr</span><span class="o">=</span><span class="n">pending</span><span class="p">(</span><span class="mf">0</span><span class="p">)</span>
+<span class="mf">12</span><span class="p">:</span><span class="mf">30</span><span class="p">:</span><span class="mf">31</span><span class="p">:</span><span class="w"> </span><span class="n">asr</span><span class="o">=</span><span class="kr">run</span><span class="n">ning</span><span class="p">(</span><span class="mf">0</span><span class="p">)</span><span class="w">  </span><span class="n">cut</span><span class="o">=</span><span class="n">completed</span><span class="p">(</span><span class="mf">8951</span><span class="p">)</span><span class="w">  </span><span class="n">yolo</span><span class="o">=</span><span class="n">completed</span><span class="p">(</span><span class="mf">8951</span><span class="p">)</span><span class="w">  </span><span class="n">face</span><span class="o">=</span><span class="kr">run</span><span class="n">ning</span><span class="p">(</span><span class="mf">0</span><span class="p">)</span><span class="w">  </span><span class="nb">pos</span><span class="n">e</span><span class="o">=</span><span class="n">pending</span><span class="p">(</span><span class="mf">0</span><span class="p">)</span><span class="w">  </span><span class="n">ocr</span><span class="o">=</span><span class="n">pending</span><span class="p">(</span><span class="mf">0</span><span class="p">)</span>
+<span class="mf">12</span><span class="p">:</span><span class="mf">30</span><span class="p">:</span><span class="mf">41</span><span class="p">:</span><span class="w"> </span><span class="n">asr</span><span class="o">=</span><span class="kr">run</span><span class="n">ning</span><span class="p">(</span><span class="mf">0</span><span class="p">)</span><span class="w">  </span><span class="n">cut</span><span class="o">=</span><span class="n">completed</span><span class="p">(</span><span class="mf">8951</span><span class="p">)</span><span class="w">  </span><span class="n">yolo</span><span class="o">=</span><span class="n">completed</span><span class="p">(</span><span class="mf">8951</span><span class="p">)</span><span class="w">  </span><span class="n">face</span><span class="o">=</span><span class="n">completed</span><span class="p">(</span><span class="mf">8951</span><span class="p">)</span><span class="w">  </span><span class="nb">pos</span><span class="n">e</span><span class="o">=</span><span class="kr">run</span><span class="n">ning</span><span class="p">(</span><span class="mf">0</span><span class="p">)</span><span class="w">  </span><span class="n">ocr</span><span class="o">=</span><span class="n">pending</span><span class="p">(</span><span class="mf">0</span><span class="p">)</span>
+<span class="mf">12</span><span class="p">:</span><span class="mf">30</span><span class="p">:</span><span class="mf">51</span><span class="p">:</span><span class="w"> </span><span class="n">asr</span><span class="o">=</span><span class="n">completed</span><span class="p">(</span><span class="mf">8951</span><span class="p">)</span><span class="w">  </span><span class="n">cut</span><span class="o">=</span><span class="n">completed</span><span class="p">(</span><span class="mf">8951</span><span class="p">)</span><span class="w">  </span><span class="n">yolo</span><span class="o">=</span><span class="n">completed</span><span class="p">(</span><span class="mf">8951</span><span class="p">)</span><span class="w">  </span><span class="n">face</span><span class="o">=</span><span class="n">completed</span><span class="p">(</span><span class="mf">8951</span><span class="p">)</span><span class="w">  </span><span class="nb">pos</span><span class="n">e</span><span class="o">=</span><span class="n">completed</span><span class="p">(</span><span class="mf">8951</span><span class="p">)</span><span class="w">  </span><span class="n">ocr</span><span class="o">=</span><span class="kr">run</span><span class="n">ning</span><span class="p">(</span><span class="mf">0</span><span class="p">)</span>
+<span class="mf">12</span><span class="p">:</span><span class="mf">31</span><span class="p">:</span><span class="mf">01</span><span class="p">:</span><span class="w"> </span><span class="n">asr</span><span class="o">=</span><span class="n">completed</span><span class="p">(</span><span class="mf">8951</span><span class="p">)</span><span class="w">  </span><span class="n">cut</span><span class="o">=</span><span class="n">completed</span><span class="p">(</span><span class="mf">8951</span><span class="p">)</span><span class="w">  </span><span class="n">yolo</span><span class="o">=</span><span class="n">completed</span><span class="p">(</span><span class="mf">8951</span><span class="p">)</span><span class="w">  </span><span class="n">face</span><span class="o">=</span><span class="n">completed</span><span class="p">(</span><span class="mf">8951</span><span class="p">)</span><span class="w">  </span><span class="nb">pos</span><span class="n">e</span><span class="o">=</span><span class="n">completed</span><span class="p">(</span><span class="mf">8951</span><span class="p">)</span><span class="w">  </span><span class="n">ocr</span><span class="o">=</span><span class="n">completed</span><span class="p">(</span><span class="mf">8951</span><span class="p">)</span>
+</code></pre></div>
+
+<p><strong>Status transition chain</strong>: <code>pending → running → completed</code></p>
+<p>Check job state:</p>
+<div class="codehilite"><pre><span></span><code>curl<span class="w"> </span>-sf<span class="w"> </span>-H<span class="w"> </span><span class="s2">&quot;X-API-Key: </span><span class="nv">$KEY</span><span class="s2">&quot;</span><span class="w"> </span><span class="s2">&quot;</span><span class="nv">$API</span><span class="s2">/api/v1/jobs?uuid=</span><span class="si">${</span><span class="nv">UUID</span><span class="si">}</span><span class="s2">&quot;</span><span class="w"> </span><span class="p">|</span><span class="w"> </span><span class="se">\</span>
+<span class="w">  </span>jq<span class="w"> </span><span class="s1">&#39;[.jobs[]? | {id, status}]&#39;</span>
+</code></pre></div>
+
+<hr />
+<h2>Step 7: Verify Results</h2>
+<div class="codehilite"><pre><span></span><code>curl<span class="w"> </span>-sf<span class="w"> </span>-H<span class="w"> </span><span class="s2">&quot;X-API-Key: </span><span class="nv">$KEY</span><span class="s2">&quot;</span><span class="w"> </span><span class="s2">&quot;</span><span class="nv">$API</span><span class="s2">/api/v1/progress/</span><span class="si">${</span><span class="nv">UUID</span><span class="si">}</span><span class="s2">&quot;</span><span class="w"> </span><span class="p">|</span><span class="w"> </span><span class="se">\</span>
+<span class="w">  </span>jq<span class="w"> </span><span class="s1">&#39;{processors: [.processors[] | {name, status, frames: .frames_processed}]}&#39;</span>
+</code></pre></div>
+
+<p>Response:</p>
+<div class="codehilite"><pre><span></span><code><span class="p">{</span>
+<span class="w">  </span><span class="nt">&quot;processors&quot;</span><span class="p">:</span><span class="w"> </span><span class="p">[</span>
+<span class="w">    </span><span class="p">{</span><span class="nt">&quot;name&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;asr&quot;</span><span class="p">,</span><span class="w"> </span><span class="nt">&quot;status&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;completed&quot;</span><span class="p">,</span><span class="w"> </span><span class="nt">&quot;frames&quot;</span><span class="p">:</span><span class="w"> </span><span class="mi">162568</span><span class="p">},</span>
+<span class="w">    </span><span class="p">{</span><span class="nt">&quot;name&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;cut&quot;</span><span class="p">,</span><span class="w"> </span><span class="nt">&quot;status&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;completed&quot;</span><span class="p">,</span><span class="w"> </span><span class="nt">&quot;frames&quot;</span><span class="p">:</span><span class="w"> </span><span class="mi">162568</span><span class="p">},</span>
+<span class="w">    </span><span class="p">{</span><span class="nt">&quot;name&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;yolo&quot;</span><span class="p">,</span><span class="w"> </span><span class="nt">&quot;status&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;completed&quot;</span><span class="p">,</span><span class="w"> </span><span class="nt">&quot;frames&quot;</span><span class="p">:</span><span class="w"> </span><span class="mi">162568</span><span class="p">},</span>
+<span class="w">    </span><span class="p">{</span><span class="nt">&quot;name&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;face&quot;</span><span class="p">,</span><span class="w"> </span><span class="nt">&quot;status&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;completed&quot;</span><span class="p">,</span><span class="w"> </span><span class="nt">&quot;frames&quot;</span><span class="p">:</span><span class="w"> </span><span class="mi">162568</span><span class="p">},</span>
+<span class="w">    </span><span class="p">{</span><span class="nt">&quot;name&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;pose&quot;</span><span class="p">,</span><span class="w"> </span><span class="nt">&quot;status&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;completed&quot;</span><span class="p">,</span><span class="w"> </span><span class="nt">&quot;frames&quot;</span><span class="p">:</span><span class="w"> </span><span class="mi">162568</span><span class="p">},</span>
+<span class="w">    </span><span class="p">{</span><span class="nt">&quot;name&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;ocr&quot;</span><span class="p">,</span><span class="w"> </span><span class="nt">&quot;status&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;completed&quot;</span><span class="p">,</span><span class="w"> </span><span class="nt">&quot;frames&quot;</span><span class="p">:</span><span class="w"> </span><span class="mi">162568</span><span class="p">}</span>
+<span class="w">  </span><span class="p">]</span>
+<span class="p">}</span>
+</code></pre></div>
+
+<hr />
+<h2>Step 8: Universal Search</h2>
+<div class="codehilite"><pre><span></span><code><span class="c1"># Search for a person name</span>
+curl<span class="w"> </span>-sf<span class="w"> </span>-X<span class="w"> </span>POST<span class="w"> </span>-H<span class="w"> </span><span class="s2">&quot;X-API-Key: </span><span class="nv">$KEY</span><span class="s2">&quot;</span><span class="w"> </span>-H<span class="w"> </span><span class="s2">&quot;Content-Type: application/json&quot;</span><span class="w"> </span><span class="se">\</span>
+<span class="w">  </span>-d<span class="w"> </span><span class="s2">&quot;{\&quot;query\&quot;:\&quot;Audrey\&quot;,\&quot;uuid\&quot;:\&quot;</span><span class="si">${</span><span class="nv">UUID</span><span class="si">}</span><span class="s2">\&quot;,\&quot;limit\&quot;:3}&quot;</span><span class="w"> </span><span class="se">\</span>
+<span class="w">  </span><span class="s2">&quot;</span><span class="nv">$API</span><span class="s2">/api/v1/search/universal&quot;</span><span class="w"> </span><span class="p">|</span><span class="w"> </span><span class="se">\</span>
+<span class="w">  </span>jq<span class="w"> </span><span class="s1">&#39;{total, hits: [.results[]? | {chunk_id: .chunk_id[0:40], text: .text[0:80], score}]}&#39;</span>
+</code></pre></div>
+
+<p>Response:</p>
+<div class="codehilite"><pre><span></span><code><span class="p">{</span>
+<span class="w">  </span><span class="nt">&quot;total&quot;</span><span class="p">:</span><span class="w"> </span><span class="mi">2</span><span class="p">,</span>
+<span class="w">  </span><span class="nt">&quot;hits&quot;</span><span class="p">:</span><span class="w"> </span><span class="p">[</span>
+<span class="w">    </span><span class="p">{</span>
+<span class="w">      </span><span class="nt">&quot;chunk_id&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;3abeee81d94597629ed8cb943f182e94_998192&quot;</span><span class="p">,</span>
+<span class="w">      </span><span class="nt">&quot;text&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;Shorede stars two legends of classical Hollywood, Audrey Hepburn and Carrie Gran&quot;</span><span class="p">,</span>
+<span class="w">      </span><span class="nt">&quot;score&quot;</span><span class="p">:</span><span class="w"> </span><span class="mf">0.9</span>
+<span class="w">    </span><span class="p">},</span>
+<span class="w">    </span><span class="p">{</span>
+<span class="w">      </span><span class="nt">&quot;chunk_id&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;3abeee81d94597629ed8cb943f182e94_998193&quot;</span><span class="p">,</span>
+<span class="w">      </span><span class="nt">&quot;text&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;Shorede stars two legends of classical Hollywood, Audrey Hepburn and Carrie Gran&quot;</span><span class="p">,</span>
+<span class="w">      </span><span class="nt">&quot;score&quot;</span><span class="p">:</span><span class="w"> </span><span class="mf">0.9</span>
+<span class="w">    </span><span class="p">}</span>
+<span class="w">  </span><span class="p">]</span>
+<span class="p">}</span>
+</code></pre></div>
+
+<div class="codehilite"><pre><span></span><code><span class="c1"># Search Chinese text</span>
+curl<span class="w"> </span>-sf<span class="w"> </span>-X<span class="w"> </span>POST<span class="w"> </span>-H<span class="w"> </span><span class="s2">&quot;X-API-Key: </span><span class="nv">$KEY</span><span class="s2">&quot;</span><span class="w"> </span>-H<span class="w"> </span><span class="s2">&quot;Content-Type: application/json&quot;</span><span class="w"> </span><span class="se">\</span>
+<span class="w">  </span>-d<span class="w"> </span><span class="s2">&quot;{\&quot;query\&quot;:\&quot;導演\&quot;,\&quot;uuid\&quot;:\&quot;</span><span class="si">${</span><span class="nv">UUID</span><span class="si">}</span><span class="s2">\&quot;,\&quot;limit\&quot;:3}&quot;</span><span class="w"> </span><span class="se">\</span>
+<span class="w">  </span><span class="s2">&quot;</span><span class="nv">$API</span><span class="s2">/api/v1/search/universal&quot;</span><span class="w"> </span><span class="p">|</span><span class="w"> </span>jq<span class="w"> </span><span class="s1">&#39;{total}&#39;</span>
+</code></pre></div>
+
+<p><strong>Search modes</strong>: The universal search endpoint supports:</p><ul>
+<li>Text match (ILIKE on <code>text_content</code> and <code>content</code> columns)</li>
+<li>Time range filtering (<code>time_range: [start, end]</code>)</li>
+<li>Speaker/person ID filtering</li>
+<li>Chunk type filtering</li>
+<li>Visual content filtering (objects, density, classes)</li></ul>
+<hr />
+<h2>Step 9: Get Chunk Detail</h2>
+<div class="codehilite"><pre><span></span><code><span class="nv">CHUNK_ID</span><span class="o">=</span><span class="s2">&quot;3abeee81d94597629ed8cb943f182e94_998192&quot;</span>
+
+curl<span class="w"> </span>-sf<span class="w"> </span>-H<span class="w"> </span><span class="s2">&quot;X-API-Key: </span><span class="nv">$KEY</span><span class="s2">&quot;</span><span class="w"> </span><span class="s2">&quot;</span><span class="nv">$API</span><span class="s2">/api/v1/file/</span><span class="si">${</span><span class="nv">UUID</span><span class="si">}</span><span class="s2">/chunk/</span><span class="si">${</span><span class="nv">CHUNK_ID</span><span class="si">}</span><span class="s2">&quot;</span><span class="w"> </span><span class="p">|</span><span class="w"> </span><span class="se">\</span>
+<span class="w">  </span>jq<span class="w"> </span><span class="s1">&#39;{chunk_id, chunk_type, text: .text_content, fps, start_frame, end_frame}&#39;</span>
+</code></pre></div>
+
+<p>Response:</p>
+<div class="codehilite"><pre><span></span><code><span class="p">{</span>
+<span class="w">  </span><span class="nt">&quot;chunk_id&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;3abeee81d94597629ed8cb943f182e94_998192&quot;</span><span class="p">,</span>
+<span class="w">  </span><span class="nt">&quot;chunk_type&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;sentence&quot;</span><span class="p">,</span>
+<span class="w">  </span><span class="nt">&quot;text&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;Shorede stars two legends of classical Hollywood, Audrey Hepburn and Carrie Gran&quot;</span><span class="p">,</span>
+<span class="w">  </span><span class="nt">&quot;fps&quot;</span><span class="p">:</span><span class="w"> </span><span class="mf">23.976</span><span class="p">,</span>
+<span class="w">  </span><span class="nt">&quot;start_frame&quot;</span><span class="p">:</span><span class="w"> </span><span class="mi">2395281</span><span class="p">,</span>
+<span class="w">  </span><span class="nt">&quot;end_frame&quot;</span><span class="p">:</span><span class="w"> </span><span class="mi">2395341</span>
+<span class="p">}</span>
+</code></pre></div>
+
+<hr />
+<h2>Step 10: Chunk Fallback (Stale Qdrant Compatibility)</h2>
+<p>Old integer-format chunk_ids from stale Qdrant payloads are automatically resolved via <code>WHERE id = int(chunk_id)</code>:</p>
+<div class="codehilite"><pre><span></span><code><span class="c1"># Integer format (old Qdrant payload)</span>
+curl<span class="w"> </span>-sf<span class="w"> </span>-H<span class="w"> </span><span class="s2">&quot;X-API-Key: </span><span class="nv">$KEY</span><span class="s2">&quot;</span><span class="w"> </span><span class="s2">&quot;</span><span class="nv">$API</span><span class="s2">/api/v1/file/</span><span class="si">${</span><span class="nv">UUID</span><span class="si">}</span><span class="s2">/chunk/998192&quot;</span><span class="w"> </span><span class="p">|</span><span class="w"> </span><span class="se">\</span>
+<span class="w">  </span>jq<span class="w"> </span><span class="s1">&#39;{chunk_id, text: .text_content}&#39;</span>
+</code></pre></div>
+
+<p>Response (same chunk as above):</p>
+<div class="codehilite"><pre><span></span><code><span class="p">{</span>
+<span class="w">  </span><span class="nt">&quot;chunk_id&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;3abeee81d94597629ed8cb943f182e94_998192&quot;</span><span class="p">,</span>
+<span class="w">  </span><span class="nt">&quot;text&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;Shorede stars two legends of classical Hollywood, Audrey Hepburn and Carrie Gran&quot;</span>
+<span class="p">}</span>
+</code></pre></div>
+
+<p><strong>Both formats work:</strong></p><ul>
+<li><code>chunk/{uuid}_{id}</code> → exact <code>chunk_id</code> match</li>
+<li><code>chunk/{id}</code> → fallback by primary key <code>id</code></li></ul>
+<hr />
+<h2>Step 11: File Detail</h2>
+<div class="codehilite"><pre><span></span><code>curl<span class="w"> </span>-sf<span class="w"> </span>-H<span class="w"> </span><span class="s2">&quot;X-API-Key: </span><span class="nv">$KEY</span><span class="s2">&quot;</span><span class="w"> </span><span class="s2">&quot;</span><span class="nv">$API</span><span class="s2">/api/v1/file/</span><span class="si">${</span><span class="nv">UUID</span><span class="si">}</span><span class="s2">&quot;</span><span class="w"> </span><span class="p">|</span><span class="w"> </span><span class="se">\</span>
+<span class="w">  </span>jq<span class="w"> </span><span class="s1">&#39;{file_name, status, file_type, file_path}&#39;</span>
+</code></pre></div>
+
+<p>Response:</p>
+<div class="codehilite"><pre><span></span><code><span class="p">{</span>
+<span class="w">  </span><span class="nt">&quot;file_name&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;Charade (1963) Cary Grant &amp; Audrey Hepburn ...mp4&quot;</span><span class="p">,</span>
+<span class="w">  </span><span class="nt">&quot;status&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;completed&quot;</span><span class="p">,</span>
+<span class="w">  </span><span class="nt">&quot;file_type&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;video&quot;</span><span class="p">,</span>
+<span class="w">  </span><span class="nt">&quot;file_path&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;/Users/accusys/momentry/var/sftpgo/data/demo/Charade...&quot;</span>
+<span class="p">}</span>
+</code></pre></div>
+
+<hr />
+<h2>Step 12: File Identities</h2>
+<div class="codehilite"><pre><span></span><code>curl<span class="w"> </span>-sf<span class="w"> </span>-H<span class="w"> </span><span class="s2">&quot;X-API-Key: </span><span class="nv">$KEY</span><span class="s2">&quot;</span><span class="w"> </span><span class="s2">&quot;</span><span class="nv">$API</span><span class="s2">/api/v1/file/</span><span class="si">${</span><span class="nv">UUID</span><span class="si">}</span><span class="s2">/identities&quot;</span><span class="w"> </span><span class="p">|</span><span class="w"> </span><span class="se">\</span>
+<span class="w">  </span>jq<span class="w"> </span><span class="s1">&#39;{total, identities: [.data[]? | {name, face_count, confidence}]}&#39;</span>
+</code></pre></div>
+
+<p>Response:</p>
+<div class="codehilite"><pre><span></span><code><span class="p">{</span>
+<span class="w">  </span><span class="nt">&quot;total&quot;</span><span class="p">:</span><span class="w"> </span><span class="mi">2</span><span class="p">,</span>
+<span class="w">  </span><span class="nt">&quot;identities&quot;</span><span class="p">:</span><span class="w"> </span><span class="p">[</span>
+<span class="w">    </span><span class="p">{</span><span class="nt">&quot;name&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;Audrey Hepburn&quot;</span><span class="p">,</span><span class="w"> </span><span class="nt">&quot;face_count&quot;</span><span class="p">:</span><span class="w"> </span><span class="mi">22082</span><span class="p">,</span><span class="w"> </span><span class="nt">&quot;confidence&quot;</span><span class="p">:</span><span class="w"> </span><span class="mf">0.93</span><span class="p">},</span>
+<span class="w">    </span><span class="p">{</span><span class="nt">&quot;name&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;Cary Grant&quot;</span><span class="p">,</span><span class="w"> </span><span class="nt">&quot;face_count&quot;</span><span class="p">:</span><span class="w"> </span><span class="mi">15334</span><span class="p">,</span><span class="w"> </span><span class="nt">&quot;confidence&quot;</span><span class="p">:</span><span class="w"> </span><span class="mf">0.91</span><span class="p">}</span>
+<span class="w">  </span><span class="p">]</span>
+<span class="p">}</span>
+</code></pre></div>
+
+<hr />
+<h2>Step 13: Identity Detail</h2>
+<div class="codehilite"><pre><span></span><code><span class="c1"># List all global identities</span>
+curl<span class="w"> </span>-sf<span class="w"> </span>-H<span class="w"> </span><span class="s2">&quot;X-API-Key: </span><span class="nv">$KEY</span><span class="s2">&quot;</span><span class="w"> </span><span class="s2">&quot;</span><span class="nv">$API</span><span class="s2">/api/v1/identities?page=1&amp;page_size=3&quot;</span><span class="w"> </span><span class="p">|</span><span class="w"> </span><span class="se">\</span>
+<span class="w">  </span>jq<span class="w"> </span><span class="s1">&#39;{total, identities: [.data[]? | {name, type: .identity_type, source}]}&#39;</span>
+</code></pre></div>
+
+<div class="codehilite"><pre><span></span><code><span class="c1"># Get identity files (cross-file faces)</span>
+<span class="nv">IDENTITY_UUID</span><span class="o">=</span><span class="s2">&quot;c3545906-c82d-4b66-aa1d-150bc02decce&quot;</span>
+curl<span class="w"> </span>-sf<span class="w"> </span>-H<span class="w"> </span><span class="s2">&quot;X-API-Key: </span><span class="nv">$KEY</span><span class="s2">&quot;</span><span class="w"> </span><span class="s2">&quot;</span><span class="nv">$API</span><span class="s2">/api/v1/identity/</span><span class="si">${</span><span class="nv">IDENTITY_UUID</span><span class="si">}</span><span class="s2">/files&quot;</span><span class="w"> </span><span class="p">|</span><span class="w"> </span><span class="se">\</span>
+<span class="w">  </span>jq<span class="w"> </span><span class="s1">&#39;{total, files: [.data[]? | {file_uuid: .file_uuid[0:16], face_count}]}&#39;</span>
+</code></pre></div>
+
+<hr />
+<h2>Step 14: Schema &amp; Integrity Verification</h2>
+<div class="codehilite"><pre><span></span><code>curl<span class="w"> </span>-sf<span class="w"> </span><span class="s2">&quot;</span><span class="nv">$API</span><span class="s2">/health/detailed&quot;</span><span class="w"> </span><span class="p">|</span><span class="w"> </span>jq<span class="w"> </span><span class="s1">&#39;{</span>
+<span class="s1">  ip, port,</span>
+<span class="s1">  schema: .schema.ok,</span>
+<span class="s1">  migrations: [.schema.applied[]?.filename],</span>
+<span class="s1">  integrity: .pipeline.scripts_integrity</span>
+<span class="s1">}&#39;</span>
+</code></pre></div>
+
+<p>Response:</p>
+<div class="codehilite"><pre><span></span><code><span class="p">{</span>
+<span class="w">  </span><span class="nt">&quot;ip&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;192.168.110.201&quot;</span><span class="p">,</span>
+<span class="w">  </span><span class="nt">&quot;port&quot;</span><span class="p">:</span><span class="w"> </span><span class="mi">3002</span><span class="p">,</span>
+<span class="w">  </span><span class="nt">&quot;schema&quot;</span><span class="p">:</span><span class="w"> </span><span class="kc">true</span><span class="p">,</span>
+<span class="w">  </span><span class="nt">&quot;migrations&quot;</span><span class="p">:</span><span class="w"> </span><span class="p">[</span>
+<span class="w">    </span><span class="s2">&quot;migrate_add_content_hash.sql&quot;</span><span class="p">,</span>
+<span class="w">    </span><span class="s2">&quot;migrate_add_registered_status.sql&quot;</span><span class="p">,</span>
+<span class="w">    </span><span class="s2">&quot;migrate_add_schema_version.sql&quot;</span><span class="p">,</span>
+<span class="w">    </span><span class="s2">&quot;migrate_cleanup_inactive_identities.sql&quot;</span><span class="p">,</span>
+<span class="w">    </span><span class="s2">&quot;migrate_public_schema_v4_tables.sql&quot;</span><span class="p">,</span>
+<span class="w">    </span><span class="s2">&quot;migrate_public_schema_v4.sql&quot;</span><span class="p">,</span>
+<span class="w">    </span><span class="s2">&quot;migrate_public_v4_complete.sql&quot;</span><span class="p">,</span>
+<span class="w">    </span><span class="s2">&quot;migrate_fix_chunk_id_format.sql&quot;</span><span class="p">,</span>
+<span class="w">    </span><span class="s2">&quot;migrate_add_identity_indexes.sql&quot;</span>
+<span class="w">  </span><span class="p">],</span>
+<span class="w">  </span><span class="nt">&quot;integrity&quot;</span><span class="p">:</span><span class="w"> </span><span class="p">{</span><span class="nt">&quot;matched&quot;</span><span class="p">:</span><span class="w"> </span><span class="mi">345</span><span class="p">,</span><span class="w"> </span><span class="nt">&quot;total&quot;</span><span class="p">:</span><span class="w"> </span><span class="mi">345</span><span class="p">,</span><span class="w"> </span><span class="nt">&quot;ok&quot;</span><span class="p">:</span><span class="w"> </span><span class="kc">true</span><span class="p">}</span>
+<span class="p">}</span>
+</code></pre></div>
+
+<hr />
+<h2>Full Automation Script</h2>
+<div class="codehilite"><pre><span></span><code><span class="ch">#!/bin/bash</span>
+<span class="nb">set</span><span class="w"> </span>-euo<span class="w"> </span>pipefail
+
+<span class="nv">API</span><span class="o">=</span><span class="s2">&quot;</span><span class="si">${</span><span class="nv">API</span><span class="k">:-</span><span class="nv">https</span><span class="p">://m5api.momentry.ddns.net</span><span class="si">}</span><span class="s2">&quot;</span>
+<span class="nv">KEY</span><span class="o">=</span><span class="s2">&quot;</span><span class="si">${</span><span class="nv">KEY</span><span class="k">:-</span><span class="nv">muser_68600856036340bcafc01930eb4bd839_1774418104_97221b69</span><span class="si">}</span><span class="s2">&quot;</span>
+
+<span class="c1"># 1. Health</span>
+<span class="nb">echo</span><span class="w"> </span><span class="s2">&quot;=== Health ===&quot;</span>
+curl<span class="w"> </span>-sf<span class="w"> </span><span class="s2">&quot;</span><span class="nv">$API</span><span class="s2">/health&quot;</span><span class="w"> </span><span class="p">|</span><span class="w"> </span>jq<span class="w"> </span><span class="s1">&#39;{status, version, build_git_hash}&#39;</span>
+
+<span class="c1"># 2. Register file (argument: file path)</span>
+<span class="nv">FILE_PATH</span><span class="o">=</span><span class="s2">&quot;</span><span class="si">${</span><span class="nv">1</span><span class="p">:?Usage: </span><span class="nv">$0</span><span class="p"> &lt;file_path&gt;</span><span class="si">}</span><span class="s2">&quot;</span>
+<span class="nb">echo</span><span class="w"> </span><span class="s2">&quot;=== Register ===&quot;</span>
+<span class="nv">REG</span><span class="o">=</span><span class="k">$(</span>curl<span class="w"> </span>-sf<span class="w"> </span>-X<span class="w"> </span>POST<span class="w"> </span>-H<span class="w"> </span><span class="s2">&quot;X-API-Key: </span><span class="nv">$KEY</span><span class="s2">&quot;</span><span class="w"> </span>-H<span class="w"> </span><span class="s2">&quot;Content-Type: application/json&quot;</span><span class="w"> </span><span class="se">\</span>
+<span class="w">  </span>-d<span class="w"> </span><span class="s2">&quot;{\&quot;file_path\&quot;:\&quot;</span><span class="nv">$FILE_PATH</span><span class="s2">\&quot;}&quot;</span><span class="w"> </span><span class="s2">&quot;</span><span class="nv">$API</span><span class="s2">/api/v1/files/register&quot;</span><span class="k">)</span>
+<span class="nb">echo</span><span class="w"> </span><span class="s2">&quot;</span><span class="nv">$REG</span><span class="s2">&quot;</span><span class="w"> </span><span class="p">|</span><span class="w"> </span>jq<span class="w"> </span><span class="s1">&#39;{success, file_uuid, file_name}&#39;</span>
+<span class="nv">UUID</span><span class="o">=</span><span class="k">$(</span><span class="nb">echo</span><span class="w"> </span><span class="s2">&quot;</span><span class="nv">$REG</span><span class="s2">&quot;</span><span class="w"> </span><span class="p">|</span><span class="w"> </span>jq<span class="w"> </span>-r<span class="w"> </span><span class="s1">&#39;.file_uuid // empty&#39;</span><span class="k">)</span>
+<span class="o">[</span><span class="w"> </span>-z<span class="w"> </span><span class="s2">&quot;</span><span class="nv">$UUID</span><span class="s2">&quot;</span><span class="w"> </span><span class="o">]</span><span class="w"> </span><span class="o">&amp;&amp;</span><span class="w"> </span><span class="o">{</span><span class="w"> </span><span class="nb">echo</span><span class="w"> </span><span class="s2">&quot;Registration failed&quot;</span><span class="p">;</span><span class="w"> </span><span class="nb">exit</span><span class="w"> </span><span class="m">1</span><span class="p">;</span><span class="w"> </span><span class="o">}</span>
+
+<span class="c1"># 3. Probe</span>
+<span class="nb">echo</span><span class="w"> </span><span class="s2">&quot;=== Probe ===&quot;</span>
+curl<span class="w"> </span>-sf<span class="w"> </span>-H<span class="w"> </span><span class="s2">&quot;X-API-Key: </span><span class="nv">$KEY</span><span class="s2">&quot;</span><span class="w"> </span><span class="s2">&quot;</span><span class="nv">$API</span><span class="s2">/api/v1/file/</span><span class="si">${</span><span class="nv">UUID</span><span class="si">}</span><span class="s2">/probe&quot;</span><span class="w"> </span><span class="p">|</span><span class="w"> </span><span class="se">\</span>
+<span class="w">  </span>jq<span class="w"> </span><span class="s1">&#39;{name, fps, duration}&#39;</span>
+
+<span class="c1"># 4. Submit job</span>
+<span class="nb">echo</span><span class="w"> </span><span class="s2">&quot;=== Process ===&quot;</span>
+curl<span class="w"> </span>-sf<span class="w"> </span>-X<span class="w"> </span>POST<span class="w"> </span>-H<span class="w"> </span><span class="s2">&quot;X-API-Key: </span><span class="nv">$KEY</span><span class="s2">&quot;</span><span class="w"> </span>-H<span class="w"> </span><span class="s2">&quot;Content-Type: application/json&quot;</span><span class="w"> </span><span class="se">\</span>
+<span class="w">  </span>-d<span class="w"> </span><span class="s1">&#39;{}&#39;</span><span class="w"> </span><span class="s2">&quot;</span><span class="nv">$API</span><span class="s2">/api/v1/file/</span><span class="si">${</span><span class="nv">UUID</span><span class="si">}</span><span class="s2">/process&quot;</span><span class="w"> </span><span class="p">|</span><span class="w"> </span>jq<span class="w"> </span><span class="s1">&#39;{job_id, status}&#39;</span>
+
+<span class="c1"># 5. Poll progress</span>
+<span class="nb">echo</span><span class="w"> </span><span class="s2">&quot;=== Waiting for pipeline... ===&quot;</span>
+<span class="k">while</span><span class="w"> </span>true<span class="p">;</span><span class="w"> </span><span class="k">do</span>
+<span class="w">  </span><span class="nv">PROGRESS</span><span class="o">=</span><span class="k">$(</span>curl<span class="w"> </span>-sf<span class="w"> </span>-H<span class="w"> </span><span class="s2">&quot;X-API-Key: </span><span class="nv">$KEY</span><span class="s2">&quot;</span><span class="w"> </span><span class="s2">&quot;</span><span class="nv">$API</span><span class="s2">/api/v1/progress/</span><span class="si">${</span><span class="nv">UUID</span><span class="si">}</span><span class="s2">&quot;</span><span class="k">)</span>
+<span class="w">  </span><span class="nv">STATUS</span><span class="o">=</span><span class="k">$(</span><span class="nb">echo</span><span class="w"> </span><span class="s2">&quot;</span><span class="nv">$PROGRESS</span><span class="s2">&quot;</span><span class="w"> </span><span class="p">|</span><span class="w"> </span>jq<span class="w"> </span>-r<span class="w"> </span><span class="s1">&#39;.status // &quot;?&quot;&#39;</span><span class="k">)</span>
+<span class="w">  </span><span class="nb">echo</span><span class="w"> </span><span class="s2">&quot;</span><span class="k">$(</span>date<span class="w"> </span>+%H:%M:%S<span class="k">)</span><span class="s2">: </span><span class="k">$(</span><span class="nb">echo</span><span class="w"> </span><span class="s2">&quot;</span><span class="nv">$PROGRESS</span><span class="s2">&quot;</span><span class="w"> </span><span class="p">|</span><span class="w"> </span>jq<span class="w"> </span>-r<span class="w"> </span><span class="s1">&#39;[.processors[]? | &quot;\(.name)=\(.status)(\(.frames_processed))&quot;] | join(&quot;  &quot;)&#39;</span><span class="k">)</span><span class="s2">&quot;</span>
+<span class="w">  </span><span class="nb">echo</span><span class="w"> </span><span class="s2">&quot;</span><span class="nv">$PROGRESS</span><span class="s2">&quot;</span><span class="w"> </span><span class="p">|</span><span class="w"> </span>jq<span class="w"> </span>-e<span class="w"> </span><span class="s1">&#39;[.processors[]? | select(.status == &quot;pending&quot;)] | length == 0&#39;</span><span class="w"> </span>&gt;/dev/null<span class="w"> </span><span class="o">&amp;&amp;</span><span class="w"> </span><span class="k">break</span>
+<span class="w">  </span>sleep<span class="w"> </span><span class="m">10</span>
+<span class="k">done</span>
+
+<span class="c1"># 6. Search</span>
+<span class="nb">echo</span><span class="w"> </span><span class="s2">&quot;=== Search ===&quot;</span>
+curl<span class="w"> </span>-sf<span class="w"> </span>-X<span class="w"> </span>POST<span class="w"> </span>-H<span class="w"> </span><span class="s2">&quot;X-API-Key: </span><span class="nv">$KEY</span><span class="s2">&quot;</span><span class="w"> </span>-H<span class="w"> </span><span class="s2">&quot;Content-Type: application/json&quot;</span><span class="w"> </span><span class="se">\</span>
+<span class="w">  </span>-d<span class="w"> </span><span class="s2">&quot;{\&quot;query\&quot;:\&quot;test\&quot;,\&quot;uuid\&quot;:\&quot;</span><span class="si">${</span><span class="nv">UUID</span><span class="si">}</span><span class="s2">\&quot;,\&quot;limit\&quot;:3}&quot;</span><span class="w"> </span><span class="se">\</span>
+<span class="w">  </span><span class="s2">&quot;</span><span class="nv">$API</span><span class="s2">/api/v1/search/universal&quot;</span><span class="w"> </span><span class="p">|</span><span class="w"> </span>jq<span class="w"> </span><span class="s1">&#39;{total, hits: [.results[]? | {chunk_id: .chunk_id[0:30], text: .text[0:60]}]}&#39;</span>
+
+<span class="nb">echo</span><span class="w"> </span><span class="s2">&quot;&quot;</span>
+<span class="nb">echo</span><span class="w"> </span><span class="s2">&quot;✅ Done: </span><span class="nv">$UUID</span><span class="s2">&quot;</span>
+</code></pre></div>
+</div>
+</body>
+</html>
\ No newline at end of file
diff --git a/docs_v1.0/doc_user/TMDb_User_Guide.html b/docs_v1.0/doc_user/TMDb_User_Guide.html
new file mode 100644
index 0000000..9c1e1d1
--- /dev/null
+++ b/docs_v1.0/doc_user/TMDb_User_Guide.html
@@ -0,0 +1,923 @@
+<!DOCTYPE html>
+<html lang="en">
+<head>
+<meta charset="UTF-8">
+<title>TMDb User Guide - Momentry API Docs</title>
+<style>
+* { margin: 0; padding: 0; box-sizing: border-box; }
+body { font-family: -apple-system, BlinkMacSystemFont, 'Segoe UI', Roboto, sans-serif; background: #f5f5f5; color: #333; padding: 40px; }
+.container { max-width: 960px; margin: 0 auto; background: white; border-radius: 12px; box-shadow: 0 2px 12px rgba(0,0,0,0.08); padding: 40px; }
+h1 { font-size: 24px; margin: 24px 0 12px; }
+h2 { font-size: 20px; margin: 20px 0 10px; color: #222; }
+h3 { font-size: 16px; margin: 16px 0 8px; color: #444; }
+p { line-height: 1.6; margin: 8px 0; }
+table { border-collapse: collapse; width: 100%; margin: 12px 0; font-size: 14px; }
+th, td { border: 1px solid #ddd; padding: 8px 12px; text-align: left; }
+th { background: #f0f0f0; font-weight: 600; }
+code { background: #f0f0f0; padding: 2px 6px; border-radius: 3px; font-size: 13px; }
+pre { background: #f8f8f8; border: 1px solid #ddd; border-radius: 6px; padding: 12px; overflow-x: auto; margin: 12px 0; }
+pre code { background: none; padding: 0; }
+a { color: #0066cc; }
+.back { display: inline-block; margin-bottom: 20px; color: #666; }
+.back:hover { color: #333; }
+</style>
+</head>
+<body>
+<div class="container">
+<a class="back" href="index.html">&larr; Back to index</a>
+<hr />
+<pre><code>document_type: "user_manual"
+service: "MOMENTRY_CORE"
+title: "TMDb Enrichment 使用指南"
+date: "2026-05-17"
+version: "V1.0"
+status: "active"
+owner: "M5"
+created_by: "OpenCode"</code></pre>
+<hr />
+<h1>TMDb Enrichment 使用指南</h1>
+<table class="table">
+<thead>
+<tr>
+<th>項目</th>
+<th>內容</th>
+</tr>
+</thead>
+<tbody>
+<tr>
+<td>目標讀者</td>
+<td>developer</td>
+</tr>
+<tr>
+<td>預備知識</td>
+<td>需有 API Key</td>
+</tr>
+</tbody>
+</table>
+<hr />
+<h2>Base URL</h2>
+<table class="table">
+<thead>
+<tr>
+<th>Environment</th>
+<th>URL</th>
+<th>Purpose</th>
+</tr>
+</thead>
+<tbody>
+<tr>
+<td>Playground (Dev)</td>
+<td><code>http://localhost:3003</code></td>
+<td>Development and testing</td>
+</tr>
+<tr>
+<td>Production</td>
+<td><code>http://localhost:3002</code></td>
+<td>Production deployment</td>
+</tr>
+<tr>
+<td>External (M5)</td>
+<td><code>https://m5api.momentry.ddns.net</code></td>
+<td>Remote access</td>
+</tr>
+</tbody>
+</table>
+<h2>Variables</h2>
+<p>All examples in this documentation use these environment variables:</p>
+<div class="codehilite"><pre><span></span><code><span class="nv">API</span><span class="o">=</span><span class="s2">&quot;http://localhost:3003&quot;</span>
+<span class="nv">KEY</span><span class="o">=</span><span class="s2">&quot;your-api-key-here&quot;</span>
+</code></pre></div>
+
+<h2>Authentication</h2>
+<p>All endpoints under <code>/api/v1/*</code> require authentication, except the login and logout endpoints.
+The following endpoints are public (no auth needed):</p>
+<ul>
+<li><code>GET /health</code></li>
+<li><code>POST /api/v1/auth/login</code></li>
+<li><code>POST /api/v1/auth/logout</code></li>
+</ul>
+<h3>Three Authentication Modes</h3>
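+<p>The system supports three authentication methods, checked in <strong>priority order</strong> by the middleware (an API key may be sent either as a header or as a query parameter, so the list below has four entries):</p>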
+<div class="codehilite"><pre><span></span><code>Middleware priority:
+  1. Session Cookie (Portal/browser)
+  2. JWT Bearer (API clients: n8n, CLI)
+  3. API Key Header (legacy compatibility)
+  4. API Key Query Param (?api_key=)
+</code></pre></div>
+
+<table class="table">
+<thead>
+<tr>
+<th>Mode</th>
+<th>Transport</th>
+<th>Expiry</th>
+<th>Scope</th>
+<th>Best for</th>
+</tr>
+</thead>
+<tbody>
+<tr>
+<td><strong>Session Cookie</strong></td>
+<td><code>Cookie: session_id=&lt;uuid&gt;</code></td>
+<td>24h</td>
+<td>per-browser session</td>
+<td>Portal (browser)</td>
+</tr>
+<tr>
+<td><strong>JWT</strong></td>
+<td><code>Authorization: Bearer &lt;token&gt;</code></td>
+<td>1h</td>
+<td>per-login token</td>
+<td>API clients (n8n, CLI, scripts)</td>
+</tr>
+<tr>
+<td><strong>API Key</strong></td>
+<td><code>X-API-Key: &lt;key&gt;</code></td>
+<td>90d</td>
+<td>fixed key for automation</td>
+<td>Legacy scripts, WordPress</td>
+</tr>
+</tbody>
+</table>
+<hr />
+<h3>Login</h3>
+<p><strong>Default accounts &amp; API keys:</strong></p>
+<table class="table">
+<thead>
+<tr>
+<th>Username</th>
+<th>Password</th>
+<th>API Key</th>
+<th>Role</th>
+</tr>
+</thead>
+<tbody>
+<tr>
+<td><code>admin</code></td>
+<td><code>admin</code></td>
+<td>—</td>
+<td>admin</td>
+</tr>
+<tr>
+<td><code>demo</code></td>
+<td><code>demo</code></td>
+<td><code>muser_demo_key_32chars_abcdef1234567890</code></td>
+<td>user</td>
+</tr>
+</tbody>
+</table>
+<p>The demo API key is set via <code>MOMENTRY_DEMO_API_KEY</code> env var and can be used in place of JWT for marcom integrations:</p>
+<div class="codehilite"><pre><span></span><code><span class="c1"># Using API key instead of JWT</span>
+curl<span class="w"> </span>-s<span class="w"> </span><span class="s2">&quot;</span><span class="nv">$API</span><span class="s2">/api/v1/files/scan&quot;</span><span class="w"> </span>-H<span class="w"> </span><span class="s2">&quot;X-API-Key: muser_demo_key_32chars_abcdef1234567890&quot;</span>
+</code></pre></div>
+
+<div class="codehilite"><pre><span></span><code><span class="c1"># Login as admin</span>
+curl<span class="w"> </span>-s<span class="w"> </span>-X<span class="w"> </span>POST<span class="w"> </span><span class="s2">&quot;</span><span class="nv">$API</span><span class="s2">/api/v1/auth/login&quot;</span><span class="w"> </span><span class="se">\</span>
+<span class="w">  </span>-H<span class="w"> </span><span class="s2">&quot;Content-Type: application/json&quot;</span><span class="w"> </span><span class="se">\</span>
+<span class="w">  </span>-d<span class="w"> </span><span class="s1">&#39;{&quot;username&quot;: &quot;admin&quot;, &quot;password&quot;: &quot;admin&quot;}&#39;</span>
+
+<span class="c1"># Login as demo user</span>
+curl<span class="w"> </span>-s<span class="w"> </span>-X<span class="w"> </span>POST<span class="w"> </span><span class="s2">&quot;</span><span class="nv">$API</span><span class="s2">/api/v1/auth/login&quot;</span><span class="w"> </span><span class="se">\</span>
+<span class="w">  </span>-H<span class="w"> </span><span class="s2">&quot;Content-Type: application/json&quot;</span><span class="w"> </span><span class="se">\</span>
+<span class="w">  </span>-d<span class="w"> </span><span class="s1">&#39;{&quot;username&quot;: &quot;demo&quot;, &quot;password&quot;: &quot;demo&quot;}&#39;</span>
+</code></pre></div>
+
+<h4>Success Response</h4>
+<div class="codehilite"><pre><span></span><code><span class="p">{</span>
+<span class="w">  </span><span class="nt">&quot;success&quot;</span><span class="p">:</span><span class="w"> </span><span class="kc">true</span><span class="p">,</span>
+<span class="w">  </span><span class="nt">&quot;jwt&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;eyJhbGciOiJIUzI1NiIs...&quot;</span><span class="p">,</span>
+<span class="w">  </span><span class="nt">&quot;api_key&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;muser_...&quot;</span><span class="p">,</span>
+<span class="w">  </span><span class="nt">&quot;user&quot;</span><span class="p">:</span><span class="w"> </span><span class="p">{</span>
+<span class="w">    </span><span class="nt">&quot;username&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;admin&quot;</span><span class="p">,</span>
+<span class="w">    </span><span class="nt">&quot;role&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;admin&quot;</span>
+<span class="w">  </span><span class="p">},</span>
+<span class="w">  </span><span class="nt">&quot;expires_at&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;2026-05-18T13:00:00Z&quot;</span>
+<span class="p">}</span>
+</code></pre></div>
+
+<table class="table">
+<thead>
+<tr>
+<th>Field</th>
+<th>Type</th>
+<th>Description</th>
+</tr>
+</thead>
+<tbody>
+<tr>
+<td><code>jwt</code></td>
+<td>string</td>
+<td>JWT access token. Use as <code>Authorization: Bearer &lt;jwt&gt;</code>. Expires in 1 hour.</td>
+</tr>
+<tr>
+<td><code>api_key</code></td>
+<td>string</td>
+<td>Legacy API key. Use as <code>X-API-Key: &lt;key&gt;</code>. Good for 90 days.</td>
+</tr>
+<tr>
+<td><code>user.username</code></td>
+<td>string</td>
+<td>Username</td>
+</tr>
+<tr>
+<td><code>user.role</code></td>
+<td>string</td>
+<td>Role: <code>admin</code>, <code>user</code>, or <code>readonly</code></td>
+</tr>
+<tr>
+<td><code>expires_at</code></td>
+<td>string</td>
+<td>ISO8601 timestamp of JWT expiration</td>
+</tr>
+</tbody>
+</table>
+<p>The login endpoint also sets a <code>Set-Cookie</code> header for browser-based clients:</p>
+<div class="codehilite"><pre><span></span><code><span class="nt">Set-Cookie</span><span class="o">:</span><span class="w"> </span><span class="nt">session_id</span><span class="o">=&lt;</span><span class="nt">uuid</span><span class="o">&gt;;</span><span class="w"> </span><span class="nt">Path</span><span class="o">=/</span><span class="nt">api</span><span class="o">;</span><span class="w"> </span><span class="nt">HttpOnly</span><span class="o">;</span><span class="w"> </span><span class="nt">SameSite</span><span class="o">=</span><span class="nt">Strict</span><span class="o">;</span><span class="w"> </span><span class="nt">Max-Age</span><span class="o">=</span><span class="nt">86400</span>
+</code></pre></div>
+
+<h4>Error Response (401)</h4>
+<div class="codehilite"><pre><span></span><code><span class="p">{</span>
+<span class="w">  </span><span class="nt">&quot;success&quot;</span><span class="p">:</span><span class="w"> </span><span class="kc">false</span><span class="p">,</span>
+<span class="w">  </span><span class="nt">&quot;message&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;Invalid username or password&quot;</span>
+<span class="p">}</span>
+</code></pre></div>
+
+<hr />
+<h3>Using JWT</h3>
+<p>JWT is preferred for API clients (n8n, CLI scripts, WordPress). It is validated by the middleware without a database lookup (stateless).</p>
+<div class="codehilite"><pre><span></span><code><span class="c1"># Login and capture JWT</span>
+<span class="nv">JWT</span><span class="o">=</span><span class="k">$(</span>curl<span class="w"> </span>-s<span class="w"> </span>-X<span class="w"> </span>POST<span class="w"> </span><span class="s2">&quot;</span><span class="nv">$API</span><span class="s2">/api/v1/auth/login&quot;</span><span class="w"> </span><span class="se">\</span>
+<span class="w">  </span>-H<span class="w"> </span><span class="s2">&quot;Content-Type: application/json&quot;</span><span class="w"> </span><span class="se">\</span>
+<span class="w">  </span>-d<span class="w"> </span><span class="s1">&#39;{&quot;username&quot;:&quot;admin&quot;,&quot;password&quot;:&quot;admin&quot;}&#39;</span><span class="w"> </span><span class="p">|</span><span class="w"> </span>python3<span class="w"> </span>-c<span class="w"> </span><span class="s2">&quot;import json,sys;print(json.load(sys.stdin)[&#39;jwt&#39;])&quot;</span><span class="k">)</span>
+
+<span class="c1"># Use JWT for all subsequent requests</span>
+curl<span class="w"> </span>-H<span class="w"> </span><span class="s2">&quot;Authorization: Bearer </span><span class="nv">$JWT</span><span class="s2">&quot;</span><span class="w"> </span><span class="s2">&quot;</span><span class="nv">$API</span><span class="s2">/api/v1/files/scan&quot;</span>
+curl<span class="w"> </span>-H<span class="w"> </span><span class="s2">&quot;Authorization: Bearer </span><span class="nv">$JWT</span><span class="s2">&quot;</span><span class="w"> </span><span class="s2">&quot;</span><span class="nv">$API</span><span class="s2">/api/v1/resource/tmdb&quot;</span>
+</code></pre></div>
+
+<p>JWT is short-lived (1 hour). When it expires, request a new one via login.</p>
+<hr />
+<h3>Using Session Cookie (Browser)</h3>
+<p>Browser-based clients (Portal) get a session cookie automatically after login. The browser sends the cookie with every request—no manual header needed.</p>
+<div class="codehilite"><pre><span></span><code><span class="c1"># Login captures the session cookie from Set-Cookie header</span>
+curl<span class="w"> </span>-v<span class="w"> </span>-X<span class="w"> </span>POST<span class="w"> </span><span class="s2">&quot;</span><span class="nv">$API</span><span class="s2">/api/v1/auth/login&quot;</span><span class="w"> </span><span class="se">\</span>
+<span class="w">  </span>-H<span class="w"> </span><span class="s2">&quot;Content-Type: application/json&quot;</span><span class="w"> </span><span class="se">\</span>
+<span class="w">  </span>-d<span class="w"> </span><span class="s1">&#39;{&quot;username&quot;:&quot;admin&quot;,&quot;password&quot;:&quot;admin&quot;}&#39;</span><span class="w"> </span><span class="m">2</span>&gt;<span class="p">&amp;</span><span class="m">1</span><span class="w"> </span><span class="p">|</span><span class="w"> </span>grep<span class="w"> </span><span class="s2">&quot;Set-Cookie&quot;</span>
+
+<span class="c1"># Browser automatically sends: Cookie: session_id=&lt;uuid&gt;</span>
+<span class="c1"># No manual header needed for subsequent requests</span>
+</code></pre></div>
+
+<p>The session cookie is HttpOnly (not accessible from JavaScript) and SameSite=Strict (protected against CSRF).</p>
+<hr />
+<h3>Using Legacy API Key</h3>
+<div class="codehilite"><pre><span></span><code>curl<span class="w"> </span>-H<span class="w"> </span><span class="s2">&quot;X-API-Key: </span><span class="nv">$KEY</span><span class="s2">&quot;</span><span class="w"> </span><span class="s2">&quot;</span><span class="nv">$API</span><span class="s2">/api/v1/files/scan&quot;</span>
+
+<span class="c1"># Also accepted via Bearer header (non-JWT format) or query parameter:</span>
+curl<span class="w"> </span>-H<span class="w"> </span><span class="s2">&quot;Authorization: Bearer </span><span class="nv">$KEY</span><span class="s2">&quot;</span><span class="w"> </span><span class="s2">&quot;</span><span class="nv">$API</span><span class="s2">/api/v1/files/scan&quot;</span>
+curl<span class="w"> </span><span class="s2">&quot;</span><span class="nv">$API</span><span class="s2">/api/v1/files/scan?api_key=</span><span class="nv">$KEY</span><span class="s2">&quot;</span>
+</code></pre></div>
+
+<p>API keys are validated via SHA256 hash lookup in the database. They are long-lived (90 days) and intended for automation.</p>
+<h3>Obtaining an API Key (CLI)</h3>
+<div class="codehilite"><pre><span></span><code>momentry<span class="w"> </span>api-key<span class="w"> </span>create<span class="w"> </span><span class="s2">&quot;My API Key&quot;</span><span class="w"> </span>--key-type<span class="w"> </span>user
+</code></pre></div>
+
+<hr />
+<h3>Logout</h3>
+<div class="codehilite"><pre><span></span><code><span class="c1"># Logout using the session cookie (browser)</span>
+curl<span class="w"> </span>-X<span class="w"> </span>POST<span class="w"> </span><span class="s2">&quot;</span><span class="nv">$API</span><span class="s2">/api/v1/auth/logout&quot;</span><span class="w"> </span><span class="se">\</span>
+<span class="w">  </span>-H<span class="w"> </span><span class="s2">&quot;Cookie: session_id=&lt;uuid&gt;&quot;</span>
+</code></pre></div>
+
+<h4>What logout does</h4>
+<table class="table">
+<thead>
+<tr>
+<th>Auth mode</th>
+<th>Effect</th>
+</tr>
+</thead>
+<tbody>
+<tr>
+<td><strong>Session Cookie</strong></td>
+<td>Session deleted from database. Same cookie returns 401 on subsequent requests.</td>
+</tr>
+<tr>
+<td><strong>JWT</strong></td>
+<td>JWT remains valid until expiry. (JWT is stateless — logout adds JWT to a blacklist only if API key mode is used.)</td>
+</tr>
+<tr>
+<td><strong>API Key</strong></td>
+<td>API key remains valid. (Legacy keys are shared across sessions — revoking would break other clients.)</td>
+</tr>
+</tbody>
+</table>
+<h4>Example: full session lifecycle</h4>
+<div class="codehilite"><pre><span></span><code><span class="c1"># 1. Login</span>
+<span class="nv">SESSION_ID</span><span class="o">=</span><span class="k">$(</span>curl<span class="w"> </span>-s<span class="w"> </span>-D<span class="w"> </span>-<span class="w"> </span>-X<span class="w"> </span>POST<span class="w"> </span><span class="s2">&quot;</span><span class="nv">$API</span><span class="s2">/api/v1/auth/login&quot;</span><span class="w"> </span><span class="se">\</span>
+<span class="w">  </span>-H<span class="w"> </span><span class="s2">&quot;Content-Type: application/json&quot;</span><span class="w"> </span><span class="se">\</span>
+<span class="w">  </span>-d<span class="w"> </span><span class="s1">&#39;{&quot;username&quot;:&quot;admin&quot;,&quot;password&quot;:&quot;admin&quot;}&#39;</span><span class="w"> </span><span class="p">|</span><span class="w"> </span>grep<span class="w"> </span><span class="s2">&quot;Set-Cookie&quot;</span><span class="w"> </span><span class="p">|</span><span class="w"> </span>sed<span class="w"> </span><span class="s1">&#39;s/.*session_id=\([^;]*\).*/\1/&#39;</span><span class="k">)</span>
+
+<span class="c1"># 2. Use session (works)</span>
+curl<span class="w"> </span>-s<span class="w"> </span>-o<span class="w"> </span>/dev/null<span class="w"> </span>-w<span class="w"> </span><span class="s2">&quot;HTTP %{http_code}\n&quot;</span><span class="w"> </span><span class="s2">&quot;</span><span class="nv">$API</span><span class="s2">/api/v1/resource/tmdb&quot;</span><span class="w"> </span><span class="se">\</span>
+<span class="w">  </span>-H<span class="w"> </span><span class="s2">&quot;Cookie: session_id=</span><span class="nv">$SESSION_ID</span><span class="s2">&quot;</span>
+<span class="c1"># → HTTP 200</span>
+
+<span class="c1"># 3. Logout</span>
+curl<span class="w"> </span>-s<span class="w"> </span>-X<span class="w"> </span>POST<span class="w"> </span><span class="s2">&quot;</span><span class="nv">$API</span><span class="s2">/api/v1/auth/logout&quot;</span><span class="w"> </span><span class="se">\</span>
+<span class="w">  </span>-H<span class="w"> </span><span class="s2">&quot;Cookie: session_id=</span><span class="nv">$SESSION_ID</span><span class="s2">&quot;</span>
+<span class="c1"># → {&quot;success&quot;: true}</span>
+
+<span class="c1"># 4. Use session again (rejected)</span>
+curl<span class="w"> </span>-s<span class="w"> </span>-o<span class="w"> </span>/dev/null<span class="w"> </span>-w<span class="w"> </span><span class="s2">&quot;HTTP %{http_code}\n&quot;</span><span class="w"> </span><span class="s2">&quot;</span><span class="nv">$API</span><span class="s2">/api/v1/resource/tmdb&quot;</span><span class="w"> </span><span class="se">\</span>
+<span class="w">  </span>-H<span class="w"> </span><span class="s2">&quot;Cookie: session_id=</span><span class="nv">$SESSION_ID</span><span class="s2">&quot;</span>
+<span class="c1"># → HTTP 401</span>
+</code></pre></div>
+
+<hr />
+<h3>Authentication Flow Summary</h3>
+<div class="codehilite"><pre><span></span><code>Login Request
+     │
+     ▼
+┌──────────────────┐
+│  1. Check users  │ ← users table (argon2 password verify)
+│     table        │
+└──────┬───────────┘
+       │
+   ┌───┴───┐
+   │ match │
+   └───┬───┘
+       │
+       ▼
+┌──────────────────┐
+│  2. Create JWT   │ ← 1h expiry, signed with JWT_SECRET
+├──────────────────┤
+│  3. Create       │ ← 24h expiry, stored in sessions table
+│     session      │
+├──────────────────┤
+│  4. Set-Cookie   │ ← HttpOnly, SameSite=Strict, Path=/api
+├──────────────────┤
+│  5. Return       │ ← JWT + api_key + user info to client
+└──────────────────┘
+</code></pre></div>
+
+<div class="codehilite"><pre><span></span><code>Protected Request
+     │
+     ▼
+┌──────────────────────┐
+│  Middleware checks:  │
+│                      │
+│  1. Cookie session?  │ → DB lookup session → get api_key → verify
+│                      │
+│  2. JWT Bearer?      │ → verify JWT signature → decode claims
+│                      │
+│  3. X-API-Key?       │ → SHA256 hash → DB lookup → verify
+│                      │
+│  4. ?api_key=?       │ → same as #3
+│                      │
+│  5. None → 401       │
+└──────────────────────┘
+</code></pre></div>
+
+<hr />
+<h3>Error Responses</h3>
+<table class="table">
+<thead>
+<tr>
+<th>HTTP</th>
+<th>When</th>
+</tr>
+</thead>
+<tbody>
+<tr>
+<td><code>401</code></td>
+<td>Missing or invalid authentication</td>
+</tr>
+<tr>
+<td><code>401</code></td>
+<td>Session expired or logged out</td>
+</tr>
+<tr>
+<td><code>401</code></td>
+<td>JWT expired</td>
+</tr>
+<tr>
+<td><code>401</code></td>
+<td>API key revoked or inactive</td>
+</tr>
+</tbody>
+</table>
+<hr />
+<h3>Related</h3>
+<ul>
+<li><code>POST /api/v1/resource/tmdb/check</code> — test authentication + TMDb API connectivity</li>
+<li><code>GET /health/detailed</code> — view auth status (integrations section)</li>
+</ul>
+<hr />
+<h2>File Registration</h2>
+<h3><code>POST /api/v1/files/register</code></h3>
+<p><strong>Auth</strong>: Required<br />
+<strong>Scope</strong>: file-level</p>
+<p>Register a video file for processing. Returns the file's metadata and UUID.</p>
+<p><strong>New in v0.1.2</strong>: Registration now <strong>automatically triggers the processing pipeline</strong> — no need to call <code>POST /api/v1/file/:uuid/process</code> separately. The system will:</p>
+<ol><li>Register the file and run ffprobe</li>
+<li>Auto-run offline TMDb probe (reads local identity files, no API calls)</li>
+<li>Create a monitor job for the worker</li>
+<li>Worker starts all 10 processors (Cut → ASR → ASRX → YOLO → OCR → Face → Pose → VisualChunk → Story → 5W1H)</li></ol>
+<p>If the file already exists (same content hash), returns the existing record with <code>already_exists: true</code>.</p>
+<h4>Request Parameters</h4>
+<table class="table">
+<thead>
+<tr>
+<th>Field</th>
+<th>Type</th>
+<th>Required</th>
+<th>Default</th>
+<th>Description</th>
+</tr>
+</thead>
+<tbody>
+<tr>
+<td><code>file_path</code></td>
+<td>string</td>
+<td>Yes</td>
+<td>—</td>
+<td>Path to video file on disk</td>
+</tr>
+<tr>
+<td><code>pattern</code></td>
+<td>string</td>
+<td>No</td>
+<td>—</td>
+<td>Regex pattern for batch register (requires <code>file_path</code> to be a directory)</td>
+</tr>
+<tr>
+<td><code>user_id</code></td>
+<td>integer</td>
+<td>No</td>
+<td>—</td>
+<td>User ID to associate with registration</td>
+</tr>
+<tr>
+<td><code>content_hash</code></td>
+<td>string</td>
+<td>No</td>
+<td>—</td>
+<td>Pre-computed SHA-256 hash (skips computation)</td>
+</tr>
+</tbody>
+</table>
+<h4>Example</h4>
+<div class="codehilite"><pre><span></span><code><span class="c1"># Register a single file</span>
+curl<span class="w"> </span>-s<span class="w"> </span>-X<span class="w"> </span>POST<span class="w"> </span><span class="s2">&quot;</span><span class="nv">$API</span><span class="s2">/api/v1/files/register&quot;</span><span class="w"> </span><span class="se">\</span>
+<span class="w">  </span>-H<span class="w"> </span><span class="s2">&quot;Content-Type: application/json&quot;</span><span class="w"> </span><span class="se">\</span>
+<span class="w">  </span>-H<span class="w"> </span><span class="s2">&quot;X-API-Key: </span><span class="nv">$KEY</span><span class="s2">&quot;</span><span class="w"> </span><span class="se">\</span>
+<span class="w">  </span>-d<span class="w"> </span><span class="s1">&#39;{&quot;file_path&quot;: &quot;/path/to/video.mp4&quot;}&#39;</span>
+
+<span class="c1"># Batch register files matching a pattern in a directory</span>
+curl<span class="w"> </span>-s<span class="w"> </span>-X<span class="w"> </span>POST<span class="w"> </span><span class="s2">&quot;</span><span class="nv">$API</span><span class="s2">/api/v1/files/register&quot;</span><span class="w"> </span><span class="se">\</span>
+<span class="w">  </span>-H<span class="w"> </span><span class="s2">&quot;Content-Type: application/json&quot;</span><span class="w"> </span><span class="se">\</span>
+<span class="w">  </span>-H<span class="w"> </span><span class="s2">&quot;X-API-Key: </span><span class="nv">$KEY</span><span class="s2">&quot;</span><span class="w"> </span><span class="se">\</span>
+<span class="w">  </span>-d<span class="w"> </span><span class="s1">&#39;{&quot;file_path&quot;: &quot;/path/to/dir&quot;, &quot;pattern&quot;: &quot;.*\\.mp4$&quot;}&#39;</span>
+</code></pre></div>
+
+<h4>Response (200)</h4>
+<div class="codehilite"><pre><span></span><code><span class="p">{</span>
+<span class="w">  </span><span class="nt">&quot;success&quot;</span><span class="p">:</span><span class="w"> </span><span class="kc">true</span><span class="p">,</span>
+<span class="w">  </span><span class="nt">&quot;file_uuid&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;3a6c1865...&quot;</span><span class="p">,</span>
+<span class="w">  </span><span class="nt">&quot;file_name&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;video.mp4&quot;</span><span class="p">,</span>
+<span class="w">  </span><span class="nt">&quot;file_path&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;/path/to/video.mp4&quot;</span><span class="p">,</span>
+<span class="w">  </span><span class="nt">&quot;file_type&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;video&quot;</span><span class="p">,</span>
+<span class="w">  </span><span class="nt">&quot;duration&quot;</span><span class="p">:</span><span class="w"> </span><span class="mf">120.5</span><span class="p">,</span>
+<span class="w">  </span><span class="nt">&quot;width&quot;</span><span class="p">:</span><span class="w"> </span><span class="mi">1920</span><span class="p">,</span>
+<span class="w">  </span><span class="nt">&quot;height&quot;</span><span class="p">:</span><span class="w"> </span><span class="mi">1080</span><span class="p">,</span>
+<span class="w">  </span><span class="nt">&quot;fps&quot;</span><span class="p">:</span><span class="w"> </span><span class="mf">24.0</span><span class="p">,</span>
+<span class="w">  </span><span class="nt">&quot;total_frames&quot;</span><span class="p">:</span><span class="w"> </span><span class="mi">2892</span><span class="p">,</span>
+<span class="w">  </span><span class="nt">&quot;already_exists&quot;</span><span class="p">:</span><span class="w"> </span><span class="kc">false</span><span class="p">,</span>
+<span class="w">  </span><span class="nt">&quot;message&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;File registered successfully&quot;</span>
+<span class="p">}</span>
+</code></pre></div>
+
+<table class="table">
+<thead>
+<tr>
+<th>Field</th>
+<th>Type</th>
+<th>Description</th>
+</tr>
+</thead>
+<tbody>
+<tr>
+<td><code>success</code></td>
+<td>boolean</td>
+<td>Always true on 200</td>
+</tr>
+<tr>
+<td><code>file_uuid</code></td>
+<td>string</td>
+<td>32-char hex UUID of the registered file</td>
+</tr>
+<tr>
+<td><code>file_name</code></td>
+<td>string</td>
+<td>File name (auto-renamed if name conflict)</td>
+</tr>
+<tr>
+<td><code>file_path</code></td>
+<td>string</td>
+<td>Canonical path on disk</td>
+</tr>
+<tr>
+<td><code>file_type</code></td>
+<td>string</td>
+<td><code>"video"</code>, <code>"audio"</code>, or <code>"unknown"</code></td>
+</tr>
+<tr>
+<td><code>duration</code></td>
+<td>float</td>
+<td>Duration in seconds</td>
+</tr>
+<tr>
+<td><code>width</code></td>
+<td>integer</td>
+<td>Video width in pixels</td>
+</tr>
+<tr>
+<td><code>height</code></td>
+<td>integer</td>
+<td>Video height in pixels</td>
+</tr>
+<tr>
+<td><code>fps</code></td>
+<td>float</td>
+<td>Frames per second</td>
+</tr>
+<tr>
+<td><code>total_frames</code></td>
+<td>integer</td>
+<td>Total frame count</td>
+</tr>
+<tr>
+<td><code>already_exists</code></td>
+<td>boolean</td>
+<td>True if same content was already registered</td>
+</tr>
+<tr>
+<td><code>message</code></td>
+<td>string</td>
+<td>Human-readable status</td>
+</tr>
+</tbody>
+</table>
+<h4>Error Responses</h4>
+<table class="table">
+<thead>
+<tr>
+<th>HTTP</th>
+<th>When</th>
+</tr>
+</thead>
+<tbody>
+<tr>
+<td><code>401</code></td>
+<td>Missing or invalid API key</td>
+</tr>
+<tr>
+<td><code>400</code></td>
+<td>Invalid request body</td>
+</tr>
+<tr>
+<td><code>404</code></td>
+<td>File path does not exist</td>
+</tr>
+</tbody>
+</table>
+<hr />
+<h3><code>GET /api/v1/files/scan</code></h3>
+<p><strong>Auth</strong>: Required<br />
+<strong>Scope</strong>: file-level</p>
+<p>Scan the filesystem directory and list all media files, showing which are registered, processing, or unregistered.</p>
+<h4>Query Parameters</h4>
+<table class="table">
+<thead>
+<tr>
+<th>Field</th>
+<th>Type</th>
+<th>Required</th>
+<th>Default</th>
+<th>Description</th>
+</tr>
+</thead>
+<tbody>
+<tr>
+<td><code>page</code></td>
+<td>integer</td>
+<td>No</td>
+<td>1</td>
+<td>Page number (1-based)</td>
+</tr>
+<tr>
+<td><code>page_size</code></td>
+<td>integer</td>
+<td>No</td>
+<td>all</td>
+<td>Items per page (alias: <code>limit</code>)</td>
+</tr>
+<tr>
+<td><code>limit</code></td>
+<td>integer</td>
+<td>No</td>
+<td>all</td>
+<td>Max items (alias for <code>page_size</code>)</td>
+</tr>
+<tr>
+<td><code>pattern</code></td>
+<td>string</td>
+<td>No</td>
+<td>—</td>
+<td>Regex filter on file name (e.g., <code>.*\.mp4$</code>)</td>
+</tr>
+<tr>
+<td><code>sort_by</code></td>
+<td>string</td>
+<td>No</td>
+<td><code>name</code></td>
+<td>Sort field: <code>name</code>, <code>size</code>, <code>modified</code>, <code>status</code></td>
+</tr>
+<tr>
+<td><code>sort_order</code></td>
+<td>string</td>
+<td>No</td>
+<td><code>asc</code></td>
+<td>Sort direction: <code>asc</code> or <code>desc</code></td>
+</tr>
+</tbody>
+</table>
+<h4>Example</h4>
+<div class="codehilite"><pre><span></span><code><span class="c1"># Full scan</span>
+curl<span class="w"> </span>-s<span class="w"> </span><span class="s2">&quot;</span><span class="nv">$API</span><span class="s2">/api/v1/files/scan&quot;</span><span class="w"> </span>-H<span class="w"> </span><span class="s2">&quot;X-API-Key: </span><span class="nv">$KEY</span><span class="s2">&quot;</span><span class="w"> </span><span class="p">|</span><span class="w"> </span>jq<span class="w"> </span><span class="s1">&#39;{total, registered_count, unregistered_count}&#39;</span>
+
+<span class="c1"># Paginated (page 1, 5 per page)</span>
+curl<span class="w"> </span>-s<span class="w"> </span><span class="s2">&quot;</span><span class="nv">$API</span><span class="s2">/api/v1/files/scan?page=1&amp;page_size=5&quot;</span><span class="w"> </span>-H<span class="w"> </span><span class="s2">&quot;X-API-Key: </span><span class="nv">$KEY</span><span class="s2">&quot;</span><span class="w"> </span><span class="p">|</span><span class="w"> </span>jq<span class="w"> </span><span class="s1">&#39;{page, total_pages, files: [.files[].file_name]}&#39;</span>
+
+<span class="c1"># Regex filter: only mp4 files</span>
+curl<span class="w"> </span>-s<span class="w"> </span><span class="s2">&quot;</span><span class="nv">$API</span><span class="s2">/api/v1/files/scan?pattern=.*\\.mp4</span>$<span class="s2">&quot;</span><span class="w"> </span>-H<span class="w"> </span><span class="s2">&quot;X-API-Key: </span><span class="nv">$KEY</span><span class="s2">&quot;</span><span class="w"> </span><span class="p">|</span><span class="w"> </span>jq<span class="w"> </span><span class="s1">&#39;{filtered_total, files: [.files[].file_name]}&#39;</span>
+
+<span class="c1"># Sort by file size (largest first)</span>
+curl<span class="w"> </span>-s<span class="w"> </span><span class="s2">&quot;</span><span class="nv">$API</span><span class="s2">/api/v1/files/scan?sort_by=size&amp;sort_order=desc&amp;page_size=5&quot;</span><span class="w"> </span>-H<span class="w"> </span><span class="s2">&quot;X-API-Key: </span><span class="nv">$KEY</span><span class="s2">&quot;</span><span class="w"> </span><span class="p">|</span><span class="w"> </span>jq<span class="w"> </span><span class="s1">&#39;[.files[] | {file_name, file_size}]&#39;</span>
+
+<span class="c1"># Sort by modified time (most recent first)</span>
+curl<span class="w"> </span>-s<span class="w"> </span><span class="s2">&quot;</span><span class="nv">$API</span><span class="s2">/api/v1/files/scan?sort_by=modified&amp;sort_order=desc&amp;page_size=5&quot;</span><span class="w"> </span>-H<span class="w"> </span><span class="s2">&quot;X-API-Key: </span><span class="nv">$KEY</span><span class="s2">&quot;</span><span class="w"> </span><span class="p">|</span><span class="w"> </span>jq<span class="w"> </span><span class="s1">&#39;[.files[] | {file_name, modified_time}]&#39;</span>
+
+<span class="c1"># Sort by status</span>
+curl<span class="w"> </span>-s<span class="w"> </span><span class="s2">&quot;</span><span class="nv">$API</span><span class="s2">/api/v1/files/scan?sort_by=status&amp;page_size=5&quot;</span><span class="w"> </span>-H<span class="w"> </span><span class="s2">&quot;X-API-Key: </span><span class="nv">$KEY</span><span class="s2">&quot;</span><span class="w"> </span><span class="p">|</span><span class="w"> </span>jq<span class="w"> </span><span class="s1">&#39;[.files[] | {file_name, status}]&#39;</span>
+</code></pre></div>
+
+<h4>Response (200)</h4>
+<div class="codehilite"><pre><span></span><code><span class="p">{</span>
+<span class="w">  </span><span class="nt">&quot;files&quot;</span><span class="p">:</span><span class="w"> </span><span class="p">[</span>
+<span class="w">    </span><span class="p">{</span>
+<span class="w">      </span><span class="nt">&quot;file_name&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;video.mp4&quot;</span><span class="p">,</span>
+<span class="w">      </span><span class="nt">&quot;file_size&quot;</span><span class="p">:</span><span class="w"> </span><span class="mi">12345678</span><span class="p">,</span>
+<span class="w">      </span><span class="nt">&quot;is_registered&quot;</span><span class="p">:</span><span class="w"> </span><span class="kc">true</span><span class="p">,</span>
+<span class="w">      </span><span class="nt">&quot;file_uuid&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;3a6c1865...&quot;</span><span class="p">,</span>
+<span class="w">      </span><span class="nt">&quot;status&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;completed&quot;</span><span class="p">,</span>
+<span class="w">      </span><span class="nt">&quot;registration_time&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;2026-05-16T12:00:00Z&quot;</span><span class="p">,</span>
+<span class="w">      </span><span class="nt">&quot;job_id&quot;</span><span class="p">:</span><span class="w"> </span><span class="mi">42</span>
+<span class="w">    </span><span class="p">}</span>
+<span class="w">  </span><span class="p">],</span>
+<span class="w">  </span><span class="nt">&quot;total&quot;</span><span class="p">:</span><span class="w"> </span><span class="mi">107</span><span class="p">,</span>
+<span class="w">  </span><span class="nt">&quot;filtered_total&quot;</span><span class="p">:</span><span class="w"> </span><span class="mi">80</span><span class="p">,</span>
+<span class="w">  </span><span class="nt">&quot;page&quot;</span><span class="p">:</span><span class="w"> </span><span class="mi">1</span><span class="p">,</span>
+<span class="w">  </span><span class="nt">&quot;page_size&quot;</span><span class="p">:</span><span class="w"> </span><span class="mi">20</span><span class="p">,</span>
+<span class="w">  </span><span class="nt">&quot;total_pages&quot;</span><span class="p">:</span><span class="w"> </span><span class="mi">4</span><span class="p">,</span>
+<span class="w">  </span><span class="nt">&quot;registered_count&quot;</span><span class="p">:</span><span class="w"> </span><span class="mi">26</span><span class="p">,</span>
+<span class="w">  </span><span class="nt">&quot;unregistered_count&quot;</span><span class="p">:</span><span class="w"> </span><span class="mi">81</span>
+<span class="p">}</span>
+</code></pre></div>
+
+<table class="table">
+<thead>
+<tr>
+<th>Field</th>
+<th>Type</th>
+<th>Description</th>
+</tr>
+</thead>
+<tbody>
+<tr>
+<td><code>files</code></td>
+<td>array</td>
+<td>Array of file info objects (paginated)</td>
+</tr>
+<tr>
+<td><code>files[].file_name</code></td>
+<td>string</td>
+<td>File name</td>
+</tr>
+<tr>
+<td><code>files[].relative_path</code></td>
+<td>string</td>
+<td>Path relative to scan root</td>
+</tr>
+<tr>
+<td><code>files[].file_path</code></td>
+<td>string</td>
+<td>Absolute path on disk</td>
+</tr>
+<tr>
+<td><code>files[].file_size</code></td>
+<td>integer</td>
+<td>File size in bytes</td>
+</tr>
+<tr>
+<td><code>files[].modified_time</code></td>
+<td>string</td>
+<td>Last modified timestamp (ISO8601)</td>
+</tr>
+<tr>
+<td><code>files[].is_registered</code></td>
+<td>boolean</td>
+<td>Whether file is registered in DB</td>
+</tr>
+<tr>
+<td><code>files[].file_uuid</code></td>
+<td>string</td>
+<td>32-char hex UUID (only if registered)</td>
+</tr>
+<tr>
+<td><code>files[].status</code></td>
+<td>string</td>
+<td><code>"completed"</code>, <code>"processing"</code>, <code>"registered"</code>, <code>"unregistered"</code>, or <code>null</code></td>
+</tr>
+<tr>
+<td><code>files[].registration_time</code></td>
+<td>string</td>
+<td>DB registration timestamp (only if registered)</td>
+</tr>
+<tr>
+<td><code>files[].job_id</code></td>
+<td>integer</td>
+<td>Processing job ID (only if a job exists)</td>
+</tr>
+<tr>
+<td><code>total</code></td>
+<td>integer</td>
+<td>Total files found on disk (unfiltered)</td>
+</tr>
+<tr>
+<td><code>filtered_total</code></td>
+<td>integer</td>
+<td>Files matching regex filter</td>
+</tr>
+<tr>
+<td><code>page</code></td>
+<td>integer</td>
+<td>Current page number</td>
+</tr>
+<tr>
+<td><code>page_size</code></td>
+<td>integer</td>
+<td>Items per page</td>
+</tr>
+<tr>
+<td><code>total_pages</code></td>
+<td>integer</td>
+<td>Total pages</td>
+</tr>
+<tr>
+<td><code>registered_count</code></td>
+<td>integer</td>
+<td>Files registered in DB</td>
+</tr>
+<tr>
+<td><code>unregistered_count</code></td>
+<td>integer</td>
+<td>Files not yet registered</td>
+</tr>
+</tbody>
+</table>
+<h4>Notes</h4>
+<table class="table">
+<thead>
+<tr>
+<th>Feature</th>
+<th>Behavior</th>
+</tr>
+</thead>
+<tbody>
+<tr>
+<td><strong>Regex</strong></td>
+<td>Case-insensitive (<code>(?i)</code> prefix auto-applied). Applied to <code>file_name</code>.</td>
+</tr>
+<tr>
+<td><strong>Sort order</strong></td>
+<td>Default (<code>sort_by=name</code>): registered files first, then alphabetically. <code>sort_by=status</code>: alphabetical by status string.</td>
+</tr>
+<tr>
+<td><strong>Pagination</strong></td>
+<td><code>page_size</code> and <code>limit</code> are aliases. Default: show all results.</td>
+</tr>
+<tr>
+<td><strong>Processing order</strong></td>
+<td><code>pattern</code> regex filter → <code>sort_by</code>/<code>sort_order</code> → <code>page</code>/<code>page_size</code> slice.</td>
+</tr>
+</tbody>
+</table>
+<hr />
+<h2>TMDb Enrichment</h2>
+<blockquote>
+<p>⚠️ <strong>External resource</strong>: TMDb requires internet access, violating Momentry's local-only principle.
+All core processing (ASR, YOLO, Face, OCR, Pose, embeddings) runs fully offline.
+TMDb enrichment is <strong>optional</strong> and gated behind <code>TMDB_API_KEY</code> + <code>MOMENTRY_TMDB_PROBE_ENABLED</code>.</p>
+</blockquote>
+<h3>Overview</h3>
+<p>TMDb enrichment is an optional identity enrichment step that can be run after Pipeline face detection completes. The workflow is:</p>
+<ol>
+<li><strong>Prefetch</strong> (requires internet): Download movie cast data from TMDb API → cache to <code>{file_uuid}.tmdb.json</code></li>
+<li><strong>Probe</strong>: Read local cache → create identities for <strong>all</strong> cast members (<code>source='tmdb'</code>) + save <code>identity.json</code> + download profile image to <code>{OUTPUT}/identities/{uuid}/profile.jpg</code></li>
+<li><strong>Match</strong>: The worker automatically matches video faces against TMDb identities when <code>MOMENTRY_TMDB_PROBE_ENABLED=true</code></li>
+</ol>
+<h3><code>POST /api/v1/agents/tmdb/prefetch</code></h3>
+<p><strong>Auth</strong>: Required<br />
+<strong>Scope</strong>: file-level</p>
+<p>Fetch TMDb cast data for a registered file and cache it locally. This is the only step requiring internet access.</p>
+<h4>Request Parameters</h4>
+<table class="table">
+<thead>
+<tr>
+<th>Field</th>
+<th>Type</th>
+<th>Required</th>
+<th>Description</th>
+</tr>
+</thead>
+<tbody>
+<tr>
+<td><code>file_uuid</code></td>
+<td>string</td>
+<td>Yes</td>
+<td>File UUID to enrich</td>
+</tr>
+</tbody>
+</table>
+<h4>Example</h4>
+<div class="codehilite"><pre><span></span><code>curl<span class="w"> </span>-s<span class="w"> </span>-X<span class="w"> </span>POST<span class="w"> </span><span class="s2">&quot;</span><span class="nv">$API</span><span class="s2">/api/v1/agents/tmdb/prefetch&quot;</span><span class="w"> </span><span class="se">\</span>
+<span class="w">  </span>-H<span class="w"> </span><span class="s2">&quot;Content-Type: application/json&quot;</span><span class="w"> </span><span class="se">\</span>
+<span class="w">  </span>-H<span class="w"> </span><span class="s2">&quot;X-API-Key: </span><span class="nv">$KEY</span><span class="s2">&quot;</span><span class="w"> </span><span class="se">\</span>
+<span class="w">  </span>-d<span class="w"> </span><span class="s1">&#39;{&quot;file_uuid&quot;: &quot;&#39;</span><span class="s2">&quot;</span><span class="nv">$FILE_UUID</span><span class="s2">&quot;</span><span class="s1">&#39;&quot;}&#39;</span>
+</code></pre></div>
+
+<h4>Response (200)</h4>
+<div class="codehilite"><pre><span></span><code><span class="p">{</span><span class="nt">&quot;success&quot;</span><span class="p">:</span><span class="w"> </span><span class="kc">true</span><span class="p">,</span><span class="w"> </span><span class="nt">&quot;file_uuid&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;...&quot;</span><span class="p">,</span><span class="w"> </span><span class="nt">&quot;cache_path&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;/output/...tmdb.json&quot;</span><span class="p">}</span>
+</code></pre></div>
+
+<h3><code>POST /api/v1/file/:file_uuid/tmdb-probe</code></h3>
+<p><strong>Auth</strong>: Required<br />
+<strong>Scope</strong>: file-level</p>
+<p>Read local TMDb cache and create/update identities. Requires prefetch to have been run first.</p>
+<h4>Example</h4>
+<div class="codehilite"><pre><span></span><code>curl<span class="w"> </span>-s<span class="w"> </span>-X<span class="w"> </span>POST<span class="w"> </span><span class="s2">&quot;</span><span class="nv">$API</span><span class="s2">/api/v1/file/</span><span class="nv">$FILE_UUID</span><span class="s2">/tmdb-probe&quot;</span><span class="w"> </span><span class="se">\</span>
+<span class="w">  </span>-H<span class="w"> </span><span class="s2">&quot;X-API-Key: </span><span class="nv">$KEY</span><span class="s2">&quot;</span><span class="w"> </span><span class="p">|</span><span class="w"> </span>jq<span class="w"> </span><span class="s1">&#39;{identities_created, movie_title}&#39;</span>
+</code></pre></div>
+
+<h4>Response (200 — identities created)</h4>
+<div class="codehilite"><pre><span></span><code><span class="p">{</span><span class="nt">&quot;success&quot;</span><span class="p">:</span><span class="w"> </span><span class="kc">true</span><span class="p">,</span><span class="w"> </span><span class="nt">&quot;identities_created&quot;</span><span class="p">:</span><span class="w"> </span><span class="mi">15</span><span class="p">,</span><span class="w"> </span><span class="nt">&quot;movie_title&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;Charade&quot;</span><span class="p">}</span>
+</code></pre></div>
+
+<h4>Response (200 — no cache)</h4>
+<div class="codehilite"><pre><span></span><code><span class="p">{</span><span class="nt">&quot;success&quot;</span><span class="p">:</span><span class="w"> </span><span class="kc">false</span><span class="p">,</span><span class="w"> </span><span class="nt">&quot;message&quot;</span><span class="p">:</span><span class="w"> </span><span class="s2">&quot;No TMDb cache found. Run tmdb-prefetch first.&quot;</span><span class="p">}</span>
+</code></pre></div>
+
+<h3><code>GET /api/v1/resource/tmdb</code></h3>
+<p><strong>Auth</strong>: Required<br />
+<strong>Scope</strong>: system-level</p>
+<p>View TMDb resource status including configuration, identity counts, and cache file count.</p>
+<h4>Example</h4>
+<div class="codehilite"><pre><span></span><code>curl<span class="w"> </span>-s<span class="w"> </span><span class="s2">&quot;</span><span class="nv">$API</span><span class="s2">/api/v1/resource/tmdb&quot;</span><span class="w"> </span>-H<span class="w"> </span><span class="s2">&quot;X-API-Key: </span><span class="nv">$KEY</span><span class="s2">&quot;</span><span class="w"> </span><span class="se">\</span>
+<span class="w">  </span><span class="p">|</span><span class="w"> </span>jq<span class="w"> </span><span class="s1">&#39;{identities_seeded, cache_files}&#39;</span>
+</code></pre></div>
+
+<h3><code>POST /api/v1/resource/tmdb/check</code></h3>
+<p><strong>Auth</strong>: Required<br />
+<strong>Scope</strong>: system-level</p>
+<p>Ping the TMDb API to verify connectivity and measure latency.</p>
+<h4>Example</h4>
+<div class="codehilite"><pre><span></span><code>curl<span class="w"> </span>-s<span class="w"> </span>-X<span class="w"> </span>POST<span class="w"> </span><span class="s2">&quot;</span><span class="nv">$API</span><span class="s2">/api/v1/resource/tmdb/check&quot;</span><span class="w"> </span><span class="se">\</span>
+<span class="w">  </span>-H<span class="w"> </span><span class="s2">&quot;X-API-Key: </span><span class="nv">$KEY</span><span class="s2">&quot;</span><span class="w"> </span><span class="p">|</span><span class="w"> </span>jq<span class="w"> </span><span class="s1">&#39;{api_reachable, api_latency_ms}&#39;</span>
+</code></pre></div>
+
+<h4>Response</h4>
+<div class="codehilite"><pre><span></span><code><span class="p">{</span>
+<span class="w">  </span><span class="nt">&quot;api_key_configured&quot;</span><span class="p">:</span><span class="w"> </span><span class="kc">true</span><span class="p">,</span>
+<span class="w">  </span><span class="nt">&quot;enabled&quot;</span><span class="p">:</span><span class="w"> </span><span class="kc">false</span><span class="p">,</span>
+<span class="w">  </span><span class="nt">&quot;api_reachable&quot;</span><span class="p">:</span><span class="w"> </span><span class="kc">true</span><span class="p">,</span>
+<span class="w">  </span><span class="nt">&quot;api_latency_ms&quot;</span><span class="p">:</span><span class="w"> </span><span class="mi">120</span>
+<span class="p">}</span>
+</code></pre></div>
+
+<hr />
+</div>
+</body>
+</html>
\ No newline at end of file
diff --git a/docs_v1.0/doc_user/index.html b/docs_v1.0/doc_user/index.html
new file mode 100644
index 0000000..a1019c2
--- /dev/null
+++ b/docs_v1.0/doc_user/index.html
@@ -0,0 +1,26 @@
+<!DOCTYPE html>
+<html lang="en">
+<head>
+<meta charset="UTF-8">
+<title>Momentry API Docs</title>
+<style>
+* { margin: 0; padding: 0; box-sizing: border-box; }
+body { font-family: -apple-system, BlinkMacSystemFont, 'Segoe UI', Roboto, sans-serif; background: #f5f5f5; color: #333; padding: 40px; }
+.container { max-width: 900px; margin: 0 auto; background: white; border-radius: 12px; box-shadow: 0 2px 12px rgba(0,0,0,0.08); padding: 40px; }
+h1 { font-size: 28px; margin-bottom: 8px; }
+p.subtitle { color: #666; margin-bottom: 24px; }
+ul { list-style: none; }
+li { padding: 8px 0; border-bottom: 1px solid #eee; }
+li:last-child { border: none; }
+a { color: #0066cc; text-decoration: none; font-size: 16px; }
+a:hover { text-decoration: underline; }
+</style>
+</head>
+<body>
+<div class="container">
+<h1>Momentry API Documentation</h1>
+<p class="subtitle">Generated from API_WORKSPACE modules</p>
+<ul><li><a href="API_ACCESS.html">API Access</a></li><li><a href="API_ENDPOINTS.html">API Endpoints</a></li><li><a href="API_ERROR_CODES.html">API Error Codes</a></li><li><a href="API_INDEX.html">API Index</a></li><li><a href="API_QUICK_REFERENCE.html">API Quick Reference</a></li><li><a href="API_REFERENCE.html">API Reference</a></li><li><a href="API_TRAINING_MARCOM.html">API Training Marcom</a></li><li><a href="Demo_EndToEnd.html">Demo End-to-End</a></li><li><a href="M5API_Pipeline_Demo.html">M5API Pipeline Demo</a></li><li><a href="TMDb_User_Guide.html">TMDb User Guide</a></li></ul>
+</div>
+</body>
+</html>
\ No newline at end of file
diff --git a/docs_v1.0/doc_user/login.html b/docs_v1.0/doc_user/login.html
new file mode 100644
index 0000000..c199107
--- /dev/null
+++ b/docs_v1.0/doc_user/login.html
@@ -0,0 +1,46 @@
+<!DOCTYPE html>
+<html lang="en">
+<head>
+<meta charset="UTF-8">
+<title>Login - Momentry Docs</title>
+<style>
+* { margin: 0; padding: 0; box-sizing: border-box; }
+body { font-family: -apple-system, BlinkMacSystemFont, 'Segoe UI', Roboto, sans-serif; background: #f5f5f5; display: flex; justify-content: center; align-items: center; height: 100vh; }
+.card { background: white; border-radius: 12px; box-shadow: 0 2px 12px rgba(0,0,0,0.08); padding: 40px; width: 360px; }
+h1 { font-size: 24px; margin-bottom: 24px; text-align: center; }
+input { width: 100%; padding: 10px 12px; margin-bottom: 12px; border: 1px solid #ddd; border-radius: 6px; font-size: 14px; }
+button { width: 100%; padding: 10px; background: #0066cc; color: white; border: none; border-radius: 6px; font-size: 16px; cursor: pointer; }
+button:hover { background: #0052a3; }
+.error { color: #cc0000; font-size: 13px; margin-bottom: 12px; display: none; }
+</style>
+</head>
+<body>
+<div class="card">
+<h1>Momentry Docs</h1>
+<form id="loginForm">
+<input type="text" id="username" placeholder="Username" value="demo" required>
+<input type="password" id="password" placeholder="Password" value="demo" required>
+<div class="error" id="error">Invalid credentials</div>
+<button type="submit">Login</button>
+</form>
+</div>
+<script>
+document.getElementById('loginForm').onsubmit = async function(e) {
+    e.preventDefault();
+    const resp = await fetch('/api/v1/auth/login', {
+        method: 'POST',
+        headers: {'Content-Type': 'application/json'},
+        body: JSON.stringify({
+            username: document.getElementById('username').value,
+            password: document.getElementById('password').value
+        })
+    });
+    if (resp.ok) {
+        window.location.href = '/doc/index.html';
+    } else {
+        document.getElementById('error').style.display = 'block';
+    }
+};
+</script>
+</body>
+</html>
\ No newline at end of file
diff --git a/docs_v1.0/doc_wasm/index.html b/docs_v1.0/doc_wasm/index.html
index 9b0f3f9..3e1f5f0 100644
--- a/docs_v1.0/doc_wasm/index.html
+++ b/docs_v1.0/doc_wasm/index.html
@@ -66,6 +66,7 @@ const MODULES = [
   ["10_pipeline","生產線","Pipeline"],
   ["12_agent","智慧代理","AI Agents"],
   ["13_config","系統設定","System Config"],
+  ["14_identity_history","操作歷史","Operation History (Undo/Redo)"],
 ];
 
 const el = document.getElementById('content');
diff --git a/docs_v1.0/doc_wasm/modules/06_search.md b/docs_v1.0/doc_wasm/modules/06_search.md
index 0fad9df..3d2d83a 100644
--- a/docs_v1.0/doc_wasm/modules/06_search.md
+++ b/docs_v1.0/doc_wasm/modules/06_search.md
@@ -7,7 +7,7 @@
 ### `POST /api/v1/search/smart`
 
 **Auth**: Required
-**Scope**: file-level
+**Scope**: global / file-level
 
 Semantic vector search using EmbeddingGemma-300m. Generates a query embedding via EmbeddingGemma (port 11436), then searches pgvector `story_parent` and `llm_parent` chunks by cosine similarity.
 
@@ -15,13 +15,22 @@ Semantic vector search using EmbeddingGemma-300m. Generates a query embedding vi
 
 | Field | Type | Required | Default | Description |
 |-------|------|----------|---------|-------------|
-| `file_uuid` | string | Yes | — | File UUID to search within |
 | `query` | string | Yes | — | Search text |
+| `file_uuid` | string | No | — | File UUID to search within. If omitted, searches all files (global search) |
 | `limit` | integer | No | 5 | Max results to return |
 | `page` | integer | No | 1 | Page number |
 | `page_size` | integer | No | 5 | Items per page |
 
-#### Example
+#### Example (Global Search)
+
+```bash
+curl -s -X POST "$API/api/v1/search/smart" \
+  -H "Content-Type: application/json" \
+  -H "Authorization: Bearer $JWT" \
+  -d '{"query": "Audrey Hepburn"}'
+```
+
+#### Example (File-specific Search)
 
 ```bash
 curl -s -X POST "$API/api/v1/search/smart" \
@@ -37,6 +46,7 @@ curl -s -X POST "$API/api/v1/search/smart" \
   "query": "Audrey Hepburn",
   "results": [
     {
+      "file_uuid": "a6fb22eebefaef17e62af874997c5944",
       "parent_id": 1087822,
       "scene_order": 1087822,
       "start_frame": 104438,
@@ -54,12 +64,16 @@ curl -s -X POST "$API/api/v1/search/smart" \
 }
 ```
 
+| Field | Type | Description |
+|-------|------|-------------|
+| `results[].file_uuid` | string | File UUID where result was found |
+
 ---
 
 ### `POST /api/v1/search/universal`
 
 **Auth**: Required
-**Scope**: file-level
+**Scope**: global / file-level
 
 Multi-type BM25 full-text search across chunks, frames, and persons. Uses PostgreSQL `tsvector`.
 
@@ -68,13 +82,22 @@ Multi-type BM25 full-text search across chunks, frames, and persons. Uses Postgr
 | Field | Type | Required | Default | Description |
 |-------|------|----------|---------|-------------|
 | `query` | string | Yes | — | Search text |
-| `file_uuid` | string | No | — | Restrict to specific file |
+| `file_uuid` | string | No | — | Restrict to specific file. If omitted, searches all files (global search) |
 | `types` | string[] | No | `["chunk","frame","person"]` | Search types |
 | `limit` | integer | No | 10 | Max results per type |
 | `page` | integer | No | 1 | Page number |
 | `page_size` | integer | No | 20 | Items per page |
 
-#### Example
+#### Example (Global Search)
+
+```bash
+curl -s -X POST "$API/api/v1/search/universal" \
+  -H "Content-Type: application/json" \
+  -H "Authorization: Bearer $JWT" \
+  -d '{"query": "Cary Grant"}'
+```
+
+#### Example (File-specific Search)
 
 ```bash
 curl -s -X POST "$API/api/v1/search/universal" \
@@ -90,6 +113,7 @@ curl -s -X POST "$API/api/v1/search/universal" \
   "results": [
     {
       "type": "chunk",
+      "file_uuid": "a6fb22eebefaef17e62af874997c5944",
       "chunk_id": "bd80fec92b0b6963d177a2c55bf713e2_2",
       "chunk_type": "story_child",
       "start_frame": 5103,
@@ -98,6 +122,25 @@ curl -s -X POST "$API/api/v1/search/universal" \
       "end_time": 213.64,
       "text": "[213s-214s] Cary Grant: \"Olá!\"",
       "score": 0.9
+    },
+    {
+      "type": "frame",
+      "file_uuid": "a6fb22eebefaef17e62af874997c5944",
+      "frame_number": 5105,
+      "timestamp": 212.72,
+      "score": 0.7,
+      "objects": null,
+      "ocr_texts": null,
+      "faces": null
+    },
+    {
+      "type": "person",
+      "file_uuid": "a6fb22eebefaef17e62af874997c5944",
+      "identity_id": 12,
+      "identity_uuid": "a9a901056d6b46ff92da0c3c1a57dff4",
+      "name": "Cary Grant",
+      "appearance_count": 542,
+      "score": 0.95
     }
   ],
   "total": 20,
@@ -105,23 +148,78 @@ curl -s -X POST "$API/api/v1/search/universal" \
 }
 ```
 
+| Field | Type | Description |
+|-------|------|-------------|
+| `results[].type` | string | Result type: `chunk`, `frame`, or `person` |
+| `results[].file_uuid` | string | File UUID where result was found (all types) |
+
 ---
 
 ### `POST /api/v1/search/frames`
 
 **Auth**: Required
-**Scope**: file-level
+**Scope**: global / file-level
 
 Search face detection frames by identity name or trace ID.
 
 ---
 
-### `POST /api/v1/search/identity_text`
+### `GET /api/v1/search/identity_text`
 
 **Auth**: Required
-**Scope**: file-level
+**Scope**: global / file-level
 
-Search text chunks spoken by a specific identity.
+Search text chunks and find the identities associated with them. Returns chunks where face detections overlap with the text content.
+
+#### Query Parameters
+
+| Field | Type | Required | Default | Description |
+|-------|------|----------|---------|-------------|
+| `q` | string | Yes | — | Search text (ILIKE match) |
+| `file_uuid` | string | No | — | Restrict to specific file. If omitted, searches all files (global search) |
+| `limit` | integer | No | 50 | Max results |
+| `page` | integer | No | 1 | Page number |
+| `page_size` | integer | No | 50 | Items per page |
+
+#### Example (Global Search)
+
+```bash
+curl -s "$API/api/v1/search/identity_text?q=love" -H "X-API-Key: $KEY"
+```
+
+#### Example (File-specific Search)
+
+```bash
+curl -s "$API/api/v1/search/identity_text?file_uuid=$FILE_UUID&q=love" -H "X-API-Key: $KEY"
+```
+
+#### Response (200)
+
+```json
+{
+  "success": true,
+  "total": 5,
+  "results": [
+    {
+      "file_uuid": "a6fb22eebefaef17e62af874997c5944",
+      "chunk_id": "llm_parent_..._256_270",
+      "start_time": 256.256,
+      "end_time": 270.228,
+      "text_content": "...lack of affection...",
+      "identity_id": 9,
+      "identity_name": "Audrey Hepburn",
+      "identity_source": "tmdb",
+      "trace_id": 94
+    }
+  ]
+}
+```
+
+| Field | Type | Description |
+|-------|------|-------------|
+| `results[].file_uuid` | string | File UUID where chunk was found |
+| `results[].identity_id` | integer | Identity ID if face was detected |
+| `results[].trace_id` | integer | Face trace ID |
 
 ---
 
@@ -145,4 +243,4 @@ Search text chunks spoken by a specific identity.
 | **Storage** | pgvector (`chunk.embedding` column) |
 
 ---
-*Updated: 2026-05-19 12:49:24*
+*Updated: 2026-05-27 — Added global search support for smart, universal, identity_text APIs*
diff --git a/docs_v1.0/doc_wasm/modules/07_identity.md b/docs_v1.0/doc_wasm/modules/07_identity.md
index f662b2f..3178ba9 100644
--- a/docs_v1.0/doc_wasm/modules/07_identity.md
+++ b/docs_v1.0/doc_wasm/modules/07_identity.md
@@ -70,7 +70,16 @@ curl -s "$API/api/v1/identity/$IDENTITY_UUID" -H "X-API-Key: $KEY"
 **Auth**: Required
 **Scope**: identity-level
 
-Delete an identity permanently.
+Delete an identity permanently. All face detections bound to this identity are unbound (`identity_id` set to `NULL`). The identity JSON file is deleted from disk.
+
+#### History & Undo/Redo
+
+Every DELETE records a full snapshot of the identity and its unbound faces. See [`14_identity_history.md`](14_identity_history.md#4-delete-history--undoredo) for:
+
+- Undo via `POST /api/v1/identity/:identity_uuid/undo` — recreates identity and re-binds faces
+- Redo via `POST /api/v1/identity/:identity_uuid/redo` — re-deletes the identity
+
+**Note**: Delete undo/redo reuses the same endpoints as PATCH undo/redo. The endpoint automatically detects whether the identity was deleted (undo) or needs to be re-deleted (redo) based on the history record.
 
 ---
 
@@ -129,124 +138,75 @@ curl -s -X PATCH "$API/api/v1/identity/$IDENTITY_UUID" \
 
 | HTTP | When |
 |------|------|
-| `400` | No fields to update or invalid UUID format |
 | `404` | Identity not found |
+| `500` | Database error |
+
+#### History & Undo/Redo
+
+Every bind records a before/after snapshot. See [`14_identity_history.md`](14_identity_history.md#2-bindunbindtrace-history--undoredo) for:
+
+- `POST /api/v1/identity/:identity_uuid/bind/undo` — Revert a bind
+- `POST /api/v1/identity/:identity_uuid/bind/redo` — Reapply an undone bind
+- `GET /api/v1/identity/:identity_uuid/bind/history` — Query bind operations
 
 ---
 
-### `GET /api/v1/identity/:identity_uuid/files`
+## Metadata (Embedded JSON)
 
-**Auth**: Required
-**Scope**: identity-level
+The `identities.metadata` column is a **JSONB** field that stores arbitrary structured data alongside the identity's core fields (name, status, identity_type). No schema is enforced — any valid JSON object is accepted.
 
-Get all files where this identity appears. Returns per-file summary including face count, confidence, and appearance time range.
+### Merge Behavior
 
-#### Example
+| Operation | Strategy | Example |
+|-----------|----------|---------|
+| **PATCH** | Shallow top-level merge: `COALESCE(metadata,'{}'::jsonb) \|\| $1::jsonb` | Sending `{"tmdb_rating": 8.5}` only adds/overwrites `tmdb_rating`; all other existing keys are preserved. |
+| **mergeinto** | Recursive deep merge — nested sub-keys are merged individually, not replaced wholesale | Target has `{"tmdb": {"biography": "..."}}`, source has `{"tmdb": {"birthday": "1904-01-18"}}` → result is `{"tmdb": {"biography": "...", "birthday": "1904-01-18"}}`. |
+| **Upload (`POST`)** | Direct overwrite — the entire `metadata` field is replaced with the request value. | |
 
-```bash
-curl -s "$API/api/v1/identity/$IDENTITY_UUID/files" -H "X-API-Key: $KEY"
-```
+### Validation
 
----
+| Scenario | Result |
+|----------|--------|
+| PATCH with non-object metadata (`string`, `array`, `number`, `null`) | `400 Bad Request: "metadata must be a JSON object"` |
+| mergeinto with non-object metadata | Accepted (mergeinto validates at application level) |
+| Upload with non-object metadata | Accepted (upload replaces directly) |
 
-### `GET /api/v1/identity/:identity_uuid/faces`
+### Conventional Keys
 
-**Auth**: Required
-**Scope**: identity-level
+| Key | Type | Writer | Purpose |
+|-----|------|--------|---------|
+| `aliases` | `[{locale, name}]` | PATCH, mergeinto | Multilingual display names (see [Alias System](#alias-system-bcp-47-locale-tags)) |
+| `merged_into` | `{uuid, at}` | mergeinto | Marks an identity as merged (undo mechanism reads this) |
+| `tmdb_*` | various | TMDb probe | Movie metadata (biography, birthday, known_for, etc.). Written only when `MOMENTRY_TMDB_PROBE_ENABLED=true`. |
+| `source` | string | mergeinto | Tagged on aliases/metadata when added by merge (`"merge"` value) |
 
-Get all face detection records associated with this identity.
+Custom keys are fully supported — no registration required.
 
-#### Example
+### Search Coverage
 
-```bash
-curl -s "$API/api/v1/identity/$IDENTITY_UUID/faces" -H "X-API-Key: $KEY"
-```
+The identity search endpoint (`GET /api/v1/identity/search`) matches across three scopes:
 
-| Field | Type | Description |
-|-------|------|-------------|
-| `file_uuid` | string | File where face was detected |
-| `frame_number` | integer | Frame number of detection |
-| `face_id` | string | Face ID (format: `face_{frame_number}`) |
-| `confidence` | float | Detection confidence |
+1. `i.name` — exact and ILIKE against display name
+2. `jsonb_array_elements(i.metadata->'aliases')->>'name'` — locale-tagged alias names
+3. `i.metadata::text ILIKE $1` — raw string search across the entire JSON blob (all keys, all values)
 
----
+This means searching for `"1904-01-18"` or `"biography"` will match identities whose metadata contains those strings anywhere.
 
-### `GET /api/v1/identity/:identity_uuid/chunks`
+### History Snapshots
 
-**Auth**: Required
-**Scope**: identity-level
+Every `identity_history` record captures the **full metadata** in both `before_snapshot` and `after_snapshot` (as part of the complete identity JSONB dump). Undo restores the identity row — including metadata — to the `before_snapshot` state.
 
-Get all text chunks (sentences) spoken while this identity's face was on screen. Useful for finding what a person said.
+For merge operations, the MongoDB merge history records `metadata_fields_added` and `metadata_fields_added_paths` (dot-separated paths like `"tmdb.biography"`). Merge undo removes only those specific paths, preserving subsequent manual edits to other metadata keys.
 
-#### Example
+### Best Practices
 
-```bash
-curl -s "$API/api/v1/identity/$IDENTITY_UUID/chunks" -H "X-API-Key: $KEY"
-```
-
-#### Response (200)
-
-```json
-{
-  "success": true,
-  "identity_uuid": "a9a901056d6b46ff92da0c3c1a57dff4",
-  "data": [
-    {
-      "id": 0,
-      "file_uuid": "bd80fec92b0b6963d177a2c55bf713e2",
-      "chunk_id": "bd80fec92b0b6963d177a2c55bf713e2_2",
-      "chunk_type": "sentence",
-      "start_frame": 5103,
-      "end_frame": 5127,
-      "fps": 24.0,
-      "start_time": 212.64,
-      "end_time": 213.64,
-      "text_content": "[213s-214s] Cary Grant: \"Olá!\""
-    }
-  ]
-}
-```
-
-| Field | Type | Description |
-|-------|------|-------------|
-| `file_uuid` | string | File identifier |
-| `chunk_id` | string | Sentence chunk identifier |
-| `start_frame` | integer | Frame-accurate start position |
-| `end_frame` | integer | Frame-accurate end position |
-| `fps` | float | Frames per second |
-| `start_time` | float | Start time in seconds |
-| `end_time` | float | End time in seconds |
-| `text_content` | string | Spoken text content |
-
----
-
-### `POST /api/v1/identity/:identity_uuid/bind`
-
-**Auth**: Required
-**Scope**: identity-level
-
-Bind a face detection to an identity. Associates the face trace with the identity for future search and recognition.
-
-#### Request Parameters
-
-| Field | Type | Required | Description |
-|-------|------|----------|-------------|
-| `file_uuid` | string | Yes | File where face is detected |
-| `face_id` | string | Yes | Face ID (format: `{frame}_{idx}`) |
-
-#### Side Effects
-
-- 清除該 face detection row 的 `stranger_id`（設為 NULL）
-- 不影響 `identities` 表中原有的 stranger auto-identity 記錄
-
-#### Example
-
-```bash
-curl -s -X POST "$API/api/v1/identity/$IDENTITY_UUID/bind" \
-  -H "X-API-Key: $KEY" \
-  -H "Content-Type: application/json" \
-  -d '{"file_uuid": "'"$FILE_UUID"'", "face_id": "1_5"}'
-```
+| Guideline | Reason |
+|-----------|--------|
+| Deep nesting is allowed in metadata | `mergeinto` merges nested sub-keys recursively. PATCH, however, merges only top-level keys (see [Merge Behavior](#merge-behavior)), so a nested object sent via PATCH replaces the existing one wholesale |
+| Use `aliases` for display names | Frontend has built-in locale fallback logic (see [Alias System](#alias-system-bcp-47-locale-tags)) |
+| Avoid >1MB per identity | Metadata is included in search indexing (`metadata::text ILIKE`); large blobs degrade query performance |
+| Don't rely on metadata ordering | JSONB does not preserve object key order — PostgreSQL stores keys in its own internal order, so keys may be returned in a different order than they were written |
+| No LLM/Gemma4 agent writes to metadata | Only API endpoints (PATCH, mergeinto, upload) and TMDb probe modify `identities.metadata` |
 
 ---
 
@@ -295,6 +255,10 @@ curl -s -X POST "$API/api/v1/identity/$IDENTITY_UUID/bind/trace" \
 | `404` | Identity not found |
 | `500` | Database error |
 
+#### History & Undo/Redo
+
+Trace bind operations share the same history/undo/redo system as single-face binds. See [`14_identity_history.md`](14_identity_history.md#2-bindunbindtrace-history--undoredo) for endpoints.
+
 ---
 
 ### `GET /api/v1/identity/:identity_uuid/traces`
@@ -382,6 +346,13 @@ Unbind a face detection from an identity. Removes the identity association from
 - 被 unbind 的 face 不會自動成為 stranger
 - 要重新標記為 stranger 需重新跑 Agent API（`identity/analyze`）
 
+#### History & Undo/Redo
+
+Unbind records a before/after snapshot. See [`14_identity_history.md`](14_identity_history.md#2-bindunbindtrace-history--undoredo) for:
+
+- `POST /api/v1/identity/:identity_uuid/bind/undo` — Revert an unbind
+- `POST /api/v1/identity/:identity_uuid/bind/redo` — Reapply an undone unbind
+
 ---
 
 ### `POST /api/v1/identity/:identity_uuid/mergeinto`
@@ -391,6 +362,13 @@ Unbind a face detection from an identity. Removes the identity association from
 
 Transfer all face bindings from this identity to another identity, then optionally delete or mark the source as merged.
 
+#### Two Merge Cases
+
+| Case | Description | Undo/Redo Support |
+|------|-------------|-------------------|
+| **stranger → identity** | Merge an auto-generated stranger identity into a known identity (TMDb or user-defined) | ✅ 24hr undo/redo |
+| **identity A → identity B** | Merge two known identities (e.g., duplicate entries) | ✅ 24hr undo/redo |
+
 #### Request Parameters
 
 | Field | Type | Required | Default | Description |
@@ -402,8 +380,12 @@ Transfer all face bindings from this identity to another identity, then optional
 
 - 轉移所有 `face_detections.identity_id` 到目標 identity
 - 同時清除所有被轉移 rows 的 `stranger_id`
+- 將 source name 加入 target aliases (with `source: "merge"` tag)
+- 將 source aliases 加入 target aliases (if not already present)
+- 將 source metadata fields 加入 target metadata (if not already present)
 - `keep_history: true`（預設）：source identity 設為 `status='merged'`，保留記錄
 - `keep_history: false`：**刪除** source identity 及其 identity JSON 檔案
+- **記錄 merge history 到 MongoDB**（支援 undo/redo）
 
 #### Example
 
@@ -411,7 +393,7 @@ Transfer all face bindings from this identity to another identity, then optional
 curl -s -X POST "$API/api/v1/identity/$SOURCE_UUID/mergeinto" \
   -H "X-API-Key: $KEY" \
   -H "Content-Type: application/json" \
-  -d '{"into_uuid": "'"$TARGET_UUID"'", "keep_history": false}'
+  -d '{"into_uuid": "'"$TARGET_UUID"'", "keep_history": true}'
 ```
 
 #### Response (200)
@@ -419,11 +401,23 @@ curl -s -X POST "$API/api/v1/identity/$SOURCE_UUID/mergeinto" \
 ```json
 {
   "success": true,
-  "message": "Merged 'stranger_13894' into 'Louis Viret' (52 faces transferred, source deleted)",
-  "data": { "faces_transferred": 52 }
+  "message": "Merged 'stranger_13894' into 'Louis Viret' (52 faces transferred, history kept)",
+  "data": {
+    "merge_id": "550e8400-e29b-41d4-a716-446655440000",
+    "faces_transferred": 52,
+    "aliases_added": 1,
+    "metadata_fields_added": 2
+  }
 }
 ```
 
+| Field | Type | Description |
+|-------|------|-------------|
+| `merge_id` | string | Unique merge operation ID (for undo) |
+| `faces_transferred` | integer | Number of face detections transferred |
+| `aliases_added` | integer | Number of aliases added to target |
+| `metadata_fields_added` | integer | Number of metadata fields added to target |
+
 #### Error Responses
 
 | HTTP | When |
@@ -433,25 +427,189 @@ curl -s -X POST "$API/api/v1/identity/$SOURCE_UUID/mergeinto" \
 
 ---
 
-### `GET /api/v1/identities/search`
+### `POST /api/v1/identity/merge/:merge_id/undo`
 
 **Auth**: Required
 **Scope**: identity-level
 
-Search identities by name (ILIKE search). Returns matching identity records.
+Undo a merge operation within 24 hours. Restores the source identity and reverts face bindings.
+
+#### Undo Behavior
+
+| Action | Description |
+|--------|-------------|
+| Restore source identity | If `keep_history=true`: restore status to `confirmed`<br>If `keep_history=false`: recreate identity from MongoDB snapshot |
+| Restore faces | Transfer faces back to source identity |
+| Remove aliases from target | Remove aliases with `source: "merge"` tag |
+| Remove metadata fields from target | Remove fields that were added from source |
+| **Preserve manual changes** | Keep aliases/metadata manually added after merge |
 
 #### Example
 
 ```bash
-curl -s "$API/api/v1/identities/search?q=Cary" -H "X-API-Key: $KEY"
+curl -s -X POST "$API/api/v1/identity/merge/550e8400-e29b-41d4-a716-446655440000/undo" \
+  -H "X-API-Key: $KEY"
+```
+
+#### Response (200)
+
+```json
+{
+  "success": true,
+  "message": "Undo merge completed: 'stranger_13894' restored, 52 faces reverted",
+  "data": {
+    "source_identity_restored": {
+      "uuid": "a9a90105...",
+      "name": "stranger_13894",
+      "status": "confirmed"
+    },
+    "faces_reverted": 52,
+    "aliases_removed_from_target": 1,
+    "metadata_fields_removed_from_target": 2
+  }
+}
+```
+
+#### Error Responses
+
+| HTTP | When |
+|------|------|
+| `400` | Undo deadline expired (>24hr) or already undone |
+| `404` | Merge record not found |
+| `500` | Database error |
+
+---
+
+### `POST /api/v1/identity/merge/:merge_id/redo`
+
+**Auth**: Required
+**Scope**: identity-level
+
+Redo a previously undone merge operation. See [`14_identity_history.md`](14_identity_history.md#post-apiv1identitymergemerge_idredo) for full details.
+
+---
+
+### `GET /api/v1/identity/merge/history`
+
+**Auth**: Required
+**Scope**: identity-level
+
+Query merge history records from MongoDB.
+
+#### Query Parameters
+
+| Field | Type | Required | Default | Description |
+|-------|------|----------|---------|-------------|
+| `source_uuid` | string | No | — | Filter by source identity UUID |
+| `target_uuid` | string | No | — | Filter by target identity UUID |
+| `merge_id` | string | No | — | Filter by specific merge ID |
+| `undone` | bool | No | — | Filter by undone status |
+| `page` | int | No | 1 | Page number |
+| `page_size` | int | No | 20 | Items per page |
+
+#### Example
+
+```bash
+curl -s "$API/api/v1/identity/merge/history?page=1&page_size=10" \
+  -H "X-API-Key: $KEY"
+```
+
+#### Response (200)
+
+```json
+{
+  "success": true,
+  "total": 5,
+  "page": 1,
+  "page_size": 10,
+  "results": [
+    {
+      "merge_id": "550e8400-e29b-41d4-a716-446655440000",
+      "source_name": "stranger_13894",
+      "target_name": "Louis Viret",
+      "faces_transferred": 52,
+      "merged_at": "2026-05-27T10:00:00Z",
+      "undo_deadline": "2026-05-28T10:00:00Z",
+      "undone": false,
+      "undo_expired": false
+    }
+  ]
+}
 ```
 
 | Field | Type | Description |
 |-------|------|-------------|
-| `name` | string | Identity name |
-| `source` | string | Identity source |
-| `tmdb_id` | integer | TMDb ID (if source = tmdb) |
-| `file_uuid` | string | Associated file |
+| `merge_id` | string | Unique merge operation ID |
+| `source_name` | string | Source identity name |
+| `target_name` | string | Target identity name |
+| `faces_transferred` | integer | Number of faces transferred |
+| `merged_at` | datetime | When merge occurred |
+| `undo_deadline` | datetime | 24hr deadline for undo |
+| `undone` | bool | Whether merge was undone |
+| `undo_expired` | bool | Whether undo deadline passed |
+
+---
+
+### `GET /api/v1/identities/search`
+
+**Auth**: Required
+**Scope**: global / file-level
+
+Search identities by name and find their associated chunks. Matches the identity name and aliases, and returns identities together with their associated text chunks.
+
+#### Query Parameters
+
+| Field | Type | Required | Default | Description |
+|-------|------|----------|---------|-------------|
+| `q` | string | Yes | — | Search text (ILIKE match on name and aliases) |
+| `file_uuid` | string | No | — | Restrict to specific file. If omitted, searches all files (global search) |
+| `limit` | integer | No | 50 | Max results |
+
+#### Example (Global Search)
+
+```bash
+curl -s "$API/api/v1/identities/search?q=Audrey" -H "X-API-Key: $KEY"
+```
+
+#### Example (File-specific Search)
+
+```bash
+curl -s "$API/api/v1/identities/search?q=Audrey&file_uuid=$FILE_UUID" -H "X-API-Key: $KEY"
+```
+
+#### Response (200)
+
+```json
+{
+  "success": true,
+  "total": 5,
+  "results": [
+    {
+      "identity_id": 9,
+      "name": "Audrey Hepburn",
+      "source": "tmdb",
+      "tmdb_id": 1932,
+      "file_uuid": "a6fb22eebefaef17e62af874997c5944",
+      "trace_id": 41,
+      "chunk_id": "llm_parent_..._204_207",
+      "start_time": 204.162,
+      "text_content": "...confrontation..."
+    }
+  ]
+}
+```
+
+| Field | Type | Description |
+|-------|------|-------------|
+| `results[].identity_id` | integer | Identity ID |
+| `results[].name` | string | Identity name |
+| `results[].source` | string | Identity source (`tmdb`, `user_defined`, etc.) |
+| `results[].tmdb_id` | integer | TMDb person ID (if source = tmdb) |
+| `results[].file_uuid` | string | File where identity appears |
+| `results[].trace_id` | integer | Face trace ID |
+| `results[].chunk_id` | string | Associated chunk ID |
+| `results[].start_time` | float | Chunk start time |
+| `results[].text_content` | string | Chunk text content |
 
 ---
 
@@ -628,4 +786,4 @@ PATCH /api/v1/identity/:identity_uuid
 This **replaces** the entire `aliases` array. To add to existing aliases, include all existing entries in the request.
 
 ---
-*Updated: 2026-05-25
+*Updated: 2026-05-25 — Added `GET /api/v1/file/:file_uuid/faces` with 4 binding states, filters, strangers table split*
diff --git a/docs_v1.0/doc_wasm/modules/14_identity_history.md b/docs_v1.0/doc_wasm/modules/14_identity_history.md
new file mode 100644
index 0000000..d61df17
--- /dev/null
+++ b/docs_v1.0/doc_wasm/modules/14_identity_history.md
@@ -0,0 +1,696 @@
+<!-- module: identity_history -->
+<!-- description: Identity operation history, undo, and redo (PATCH, bind, unbind, bind_trace, mergeinto) -->
+<!-- depends: 01_auth, 07_identity -->
+
+## Identity Operation History
+
+Every mutation on an identity automatically records a before/after snapshot. Use undo/redo to revert or reapply changes, and history to inspect the operation log.
+
+Four independent undo/redo systems exist:
+
+| System | Storage | Operations Covered |
+|--------|---------|-------------------|
+| **PATCH** | PostgreSQL `identity_history` | `update` |
+| **Bind** | PostgreSQL `identity_history` | `bind`, `unbind`, `bind_trace` |
+| **Merge** | MongoDB `identity_merge_history` | `mergeinto` |
+| **Delete** | PostgreSQL `identity_history` | `delete` |
+
+---
+
+### 1. PATCH History & Undo/Redo
+
+#### Overview
+
+| Property | Value |
+|----------|-------|
+| Storage | PostgreSQL `identity_history` table |
+| Snapshot | Full identity record (all fields) before and after each PATCH |
+| Max records | 256 per identity (oldest auto-deleted when limit exceeded) |
+| Undo steps | Unlimited (no expiry, no step limit) |
+| Redo stack | Cleared on new PATCH (`is_undone=true` + `operation='update'` records are deleted) |
+
+##### Stack Model
+
+```
+PATCH 1 → PATCH 2 → PATCH 3         (undo stack, is_undone=false)
+                           ↓ undo
+PATCH 1 → PATCH 2                   (undo stack)
+           PATCH 3                   (redo stack, is_undone=true)
+                           ↓ redo
+PATCH 1 → PATCH 2 → PATCH 3         (undo stack)
+```
+
+A new PATCH after undo clears only the `operation='update'` redo stack (PATCH 3 is lost). Bind/merge redo stacks are not affected.
+
+---
+
+#### `POST /api/v1/identity/:identity_uuid/undo`
+
+**Auth**: Required
+**Scope**: identity-level
+
+Undo the most recent PATCH operations. Restores the identity's `before_snapshot` and marks the history records as undone.
+
+##### Request (JSON)
+
+| Field | Type | Required | Default | Description |
+|-------|------|----------|---------|-------------|
+| `steps` | integer | No | `1` | Number of undo steps to apply (max records undone in one call) |
+
+##### Behavior
+
+- Queries `is_undone=false` records with `operation='update'`, ordered by `created_at DESC`
+- Restores `name`, `identity_type`, `source`, `status`, `metadata`, `tmdb_id`, `tmdb_profile` from the last record's `before_snapshot`
+- Marks the undone records as `is_undone=true` with `undone_at=NOW()`
+- Syncs `identity.json` to disk
+- Updates `_index.json` if name changed
+
+##### Example
+
+```bash
+curl -s -X POST "$API/api/v1/identity/$IDENTITY_UUID/undo" \
+  -H "X-API-Key: $KEY" \
+  -H "Content-Type: application/json" \
+  -d '{"steps": 1}'
+```
+
+##### Response (200)
+
+```json
+{
+  "success": true,
+  "identity_uuid": "a9a901056d6b46ff92da0c3c1a57dff4",
+  "undone_count": 1,
+  "current_state": {
+    "id": 9,
+    "uuid": "a9a901056d6b46ff92da0c3c1a57dff4",
+    "name": "Cary Grant",
+    "identity_type": "people",
+    "source": "tmdb",
+    "status": "confirmed",
+    "metadata": {},
+    "tmdb_id": 112,
+    "tmdb_profile": null
+  }
+}
+```
+
+| Field | Type | Description |
+|-------|------|-------------|
+| `undone_count` | integer | Number of history records undone |
+| `current_state` | object | Full identity state after undo |
+
+##### Error Responses
+
+| HTTP | When |
+|------|------|
+| `400` | No undo operations available |
+| `404` | Identity not found |
+| `500` | Database error |
+
+---
+
+#### `POST /api/v1/identity/:identity_uuid/redo`
+
+**Auth**: Required
+**Scope**: identity-level
+
+Redo previously undone PATCH operations. Restores the identity's `after_snapshot` and marks the history records as no longer undone.
+
+##### Request (JSON)
+
+| Field | Type | Required | Default | Description |
+|-------|------|----------|---------|-------------|
+| `steps` | integer | No | `1` | Number of redo steps to apply |
+
+##### Behavior
+
+- Queries `is_undone=true` records with `operation='update'`, ordered by `created_at DESC`
+- Restores all identity fields from the last record's `after_snapshot`
+- Marks records as `is_undone=false` with `undone_at=NULL`
+- Syncs `identity.json` to disk
+- Updates `_index.json` if name changed
+
+##### Example
+
+```bash
+curl -s -X POST "$API/api/v1/identity/$IDENTITY_UUID/redo" \
+  -H "X-API-Key: $KEY" \
+  -H "Content-Type: application/json" \
+  -d '{"steps": 1}'
+```
+
+##### Response (200)
+
+```json
+{
+  "success": true,
+  "identity_uuid": "a9a901056d6b46ff92da0c3c1a57dff4",
+  "redone_count": 1,
+  "current_state": {
+    "id": 9,
+    "uuid": "a9a901056d6b46ff92da0c3c1a57dff4",
+    "name": "John Smith",
+    "identity_type": "people",
+    "source": "tmdb",
+    "status": "confirmed",
+    "metadata": { "aliases": [...] },
+    "tmdb_id": 112,
+    "tmdb_profile": null
+  }
+}
+```
+
+| Field | Type | Description |
+|-------|------|-------------|
+| `redone_count` | integer | Number of history records redone |
+| `current_state` | object | Full identity state after redo |
+
+##### Error Responses
+
+| HTTP | When |
+|------|------|
+| `400` | No redo operations available |
+| `404` | Identity not found |
+| `500` | Database error |
+
+---
+
+#### `GET /api/v1/identity/:identity_uuid/history`
+
+**Auth**: Required
+**Scope**: identity-level
+
+Query the PATCH operation history for an identity. Returns paginated records with undo/redo stack counts (filtered to `operation='update'`).
+
+##### Query Parameters
+
+| Field | Type | Required | Default | Description |
+|-------|------|----------|---------|-------------|
+| `page` | integer | No | `1` | Page number (1-indexed) |
+| `limit` | integer | No | `20` | Items per page (max 100) |
+
+##### Response (200)
+
+```json
+{
+  "success": true,
+  "identity_uuid": "a9a901056d6b46ff92da0c3c1a57dff4",
+  "total": 5,
+  "undo_stack_count": 3,
+  "redo_stack_count": 2,
+  "results": [
+    {
+      "history_id": 42,
+      "operation": "update",
+      "is_undone": false,
+      "created_at": "2026-05-27T12:00:00Z",
+      "undone_at": null
+    },
+    {
+      "history_id": 41,
+      "operation": "update",
+      "is_undone": true,
+      "created_at": "2026-05-27T11:30:00Z",
+      "undone_at": "2026-05-27T13:00:00Z"
+    }
+  ]
+}
+```
+
+| Field | Type | Description |
+|-------|------|-------------|
+| `total` | integer | Total PATCH history records for this identity |
+| `undo_stack_count` | integer | Records available for undo (`is_undone=false`) |
+| `redo_stack_count` | integer | Records available for redo (`is_undone=true`) |
+| `results[].history_id` | integer | History record ID |
+| `results[].operation` | string | Operation type (`"update"` for PATCH) |
+| `results[].is_undone` | boolean | Whether the operation has been undone |
+| `results[].created_at` | string | When the PATCH was applied |
+| `results[].undone_at` | string | When the undo occurred (null if not undone) |
+
+##### Example
+
+```bash
+curl -s "$API/api/v1/identity/$IDENTITY_UUID/history?page=1&limit=10" \
+  -H "X-API-Key: $KEY"
+```
+
+##### Error Responses
+
+| HTTP | When |
+|------|------|
+| `404` | Identity not found |
+| `500` | Database error |
+
+---
+
+### 2. Bind/Unbind/Trace History & Undo/Redo
+
+All three operations (`bind`, `unbind`, `bind_trace`) share a single history table and undo/redo stack.
+
+#### Bind Operation Overview
+
+| Property | Value |
+|----------|-------|
+| Storage | PostgreSQL `identity_history` table (same table as PATCH) |
+| Snapshot | `{"file_uuid", "face_id" (or "trace_id"), "identity_id_before/after"}` |
+| Max records | 256 per identity (shared limit across all operation types) |
+| Undo steps | Unlimited (`steps` param) |
+| Redo stack | Cleared on new bind/unbind/bind_trace (`operation IN ('bind','unbind','bind_trace')` + `is_undone=true` records deleted) |
+| Stack isolation | Bind redo stack is **independent** from PATCH redo stack — clearing one does not affect the other |
+
+##### Stack Model
+
+```
+bind face_1 (to id=9)              → unbind face_1          → bind trace 906 (to id=9)
+(undo stack, is_undone=false)         (undo stack)              (undo stack)
+                                                               ↓ undo (first undone: bind_trace)
+                                     bind trace 906 (is_undone=true)
+                                     (redo stack)
+                                                               ↓ redo
+bind face_1 → unbind face_1 → bind trace 906
+(undo stack)
+```
+
+A new bind/unbind/trace after undo clears only the bind redo stack (records with `operation IN ('bind','unbind','bind_trace')` and `is_undone=true`).
+
+##### Snapshot Format
+
+**Before (bind):**
+```json
+{
+  "file_uuid": "aeed71342a899fe4b4c57b7d41bcb692",
+  "face_id": "1_5",
+  "identity_id_before": null
+}
+```
+
+**After (bind):**
+```json
+{
+  "file_uuid": "aeed71342a899fe4b4c57b7d41bcb692",
+  "face_id": "1_5",
+  "identity_id_after": 9
+}
+```
+
+**Before (unbind) — binding existed before:**
+```json
+{
+  "file_uuid": "aeed71342a899fe4b4c57b7d41bcb692",
+  "face_id": "1_5",
+  "identity_id_before": 9
+}
+```
+
+**After (unbind):**
+```json
+{
+  "file_uuid": "aeed71342a899fe4b4c57b7d41bcb692",
+  "face_id": "1_5",
+  "identity_id_after": null
+}
+```
+
+For `bind_trace`, the snapshot uses `trace_id` instead of `face_id`, with `identity_id_before` capturing the first face's identity in that trace.
+
+---
+
+#### `POST /api/v1/identity/:identity_uuid/bind/undo`
+
+**Auth**: Required
+**Scope**: identity-level
+
+Undo the most recent bind/unbind/bind_trace operations. Restores `identity_id_before` from the snapshot and marks records as undone.
+
+##### Request (JSON)
+
+| Field | Type | Required | Default | Description |
+|-------|------|----------|---------|-------------|
+| `steps` | integer | No | `1` | Number of undo steps to apply |
+
+##### Behavior
+
+- Queries `is_undone=false` records with `operation IN ('bind','unbind','bind_trace')`, ordered by `created_at DESC`
+- Restores `identity_id_before` — for bind this is `null` (face was unbound), for unbind this is the original identity (face goes back), for bind_trace this is the trace's previous identity
+- Marks the undone records as `is_undone=true` with `undone_at=NOW()`
+
+##### Example
+
+```bash
+curl -s -X POST "$API/api/v1/identity/$IDENTITY_UUID/bind/undo" \
+  -H "X-API-Key: $KEY" \
+  -H "Content-Type: application/json" \
+  -d '{"steps": 1}'
+```
+
+##### Response (200)
+
+```json
+{
+  "success": true,
+  "identity_uuid": "a9a901056d6b46ff92da0c3c1a57dff4",
+  "operation": "bind",
+  "undone_count": 1,
+  "affected_rows": 53
+}
+```
+
+| Field | Type | Description |
+|-------|------|-------------|
+| `operation` | string | The actual operation undone (`bind`, `unbind`, or `bind_trace`) |
+| `undone_count` | integer | Number of history records undone |
+| `affected_rows` | integer | Number of `face_detections` rows updated |
+
+##### Error Responses
+
+| HTTP | When |
+|------|------|
+| `400` | No bind undo operations available |
+| `404` | Identity not found |
+| `500` | Database error |
+
+---
+
+#### `POST /api/v1/identity/:identity_uuid/bind/redo`
+
+**Auth**: Required
+**Scope**: identity-level
+
+Redo previously undone bind/unbind/bind_trace operations. Restores `identity_id_after` from the snapshot.
+
+##### Request (JSON)
+
+| Field | Type | Required | Default | Description |
+|-------|------|----------|---------|-------------|
+| `steps` | integer | No | `1` | Number of redo steps to apply |
+
+##### Behavior
+
+- Queries `is_undone=true` records with `operation IN ('bind','unbind','bind_trace')`, ordered by `created_at DESC`
+- Restores `identity_id_after` — for bind this is the identity the face was bound to, for unbind this is `null`
+- Marks records as `is_undone=false` with `undone_at=NULL`
+
+##### Example
+
+```bash
+curl -s -X POST "$API/api/v1/identity/$IDENTITY_UUID/bind/redo" \
+  -H "X-API-Key: $KEY" \
+  -H "Content-Type: application/json" \
+  -d '{"steps": 1}'
+```
+
+##### Response (200)
+
+```json
+{
+  "success": true,
+  "identity_uuid": "a9a901056d6b46ff92da0c3c1a57dff4",
+  "operation": "unbind",
+  "redone_count": 1,
+  "affected_rows": 1
+}
+```
+
+| Field | Type | Description |
+|-------|------|-------------|
+| `operation` | string | The actual operation redone (`bind`, `unbind`, or `bind_trace`) |
+| `redone_count` | integer | Number of history records redone |
+| `affected_rows` | integer | Number of `face_detections` rows updated |
+
+##### Error Responses
+
+| HTTP | When |
+|------|------|
+| `400` | No bind redo operations available |
+| `404` | Identity not found |
+| `500` | Database error |
+
+---
+
+#### `GET /api/v1/identity/:identity_uuid/bind/history`
+
+**Auth**: Required
+**Scope**: identity-level
+
+Query the bind/unbind/bind_trace operation history for an identity. Returns paginated records with undo/redo stack counts.
+
+##### Query Parameters
+
+| Field | Type | Required | Default | Description |
+|-------|------|----------|---------|-------------|
+| `page` | integer | No | `1` | Page number (1-indexed) |
+| `limit` | integer | No | `20` | Items per page (max 100) |
+
+##### Response (200)
+
+```json
+{
+  "success": true,
+  "identity_uuid": "a9a901056d6b46ff92da0c3c1a57dff4",
+  "total": 3,
+  "undo_stack_count": 2,
+  "redo_stack_count": 1,
+  "results": [
+    {
+      "history_id": 52,
+      "operation": "bind_trace",
+      "is_undone": false,
+      "created_at": "2026-05-27T14:00:00Z",
+      "undone_at": null
+    },
+    {
+      "history_id": 51,
+      "operation": "unbind",
+      "is_undone": true,
+      "created_at": "2026-05-27T13:00:00Z",
+      "undone_at": "2026-05-27T14:30:00Z"
+    },
+    {
+      "history_id": 50,
+      "operation": "bind",
+      "is_undone": false,
+      "created_at": "2026-05-27T12:00:00Z",
+      "undone_at": null
+    }
+  ]
+}
+```
+
+| Field | Type | Description |
+|-------|------|-------------|
+| `total` | integer | Total bind history records for this identity |
+| `undo_stack_count` | integer | Records available for undo (`is_undone=false`) |
+| `redo_stack_count` | integer | Records available for redo (`is_undone=true`) |
+| `results[].history_id` | integer | History record ID |
+| `results[].operation` | string | Operation type (`bind`, `unbind`, or `bind_trace`) |
+| `results[].is_undone` | boolean | Whether the operation has been undone |
+| `results[].created_at` | string | When the operation was applied |
+| `results[].undone_at` | string | When the undo occurred (null if not undone) |
+
+##### Example
+
+```bash
+curl -s "$API/api/v1/identity/$IDENTITY_UUID/bind/history?page=1&limit=10" \
+  -H "X-API-Key: $KEY"
+```
+
+##### Error Responses
+
+| HTTP | When |
+|------|------|
+| `404` | Identity not found |
+| `500` | Database error |
+
+---
+
+### 3. Merge History & Undo/Redo
+
+Merge operations use MongoDB for richer record-keeping, with a 24-hour undo deadline.
+
+#### Merge Operation Overview
+
+| Property | Value |
+|----------|-------|
+| Storage | MongoDB `identity_merge_history` collection |
+| Snapshot | Full source identity state + target identity state + aliases/metadata diffs |
+| Trigger | Every mergeinto with `keep_history=true` |
+| Undo deadline | 24 hours (renewed on redo) |
+| Redo support | Yes — restores undone merges with new 24hr deadline |
+| Max records | Unlimited |
+
+---
+
+#### `POST /api/v1/identity/merge/:merge_id/undo`
+
+Already documented in [`07_identity.md`](07_identity.md#post-apiv1identitymergemerge_idundo). See that document for full details.
+
+---
+
+#### `POST /api/v1/identity/merge/:merge_id/redo`
+
+**Auth**: Required
+**Scope**: identity-level
+
+Redo a previously undone merge operation within the renewed 24-hour deadline.
+
+##### Request
+
+No body required. The merge ID is taken from the URL path.
+
+##### Behavior
+
+1. Validates the merge record exists and `undone=true` (not already active)
+2. Checks the 24-hour undo deadline (if expired, the redo is rejected)
+3. Re-applies face bindings: moves all faces from `source_identity` to `target_identity` again
+4. Re-adds aliases that were removed by the undo (aliases with `source: "merge"` tag)
+5. Re-adds metadata fields that were removed by the undo
+6. If `keep_history=true`: sets `source_identity.status = 'merged'` again
+7. If `keep_history=false`: recreates source identity from the `undone_snapshot` stored at undo time
+8. Syncs both identity JSON files to disk
+9. Sets `undone=false`, clears `undone_snapshot`, renews `undo_deadline = NOW() + 24h`
+10. Records `redone_by` user for audit
+
+##### Example
+
+```bash
+curl -s -X POST "$API/api/v1/identity/merge/550e8400-e29b-41d4-a716-446655440000/redo" \
+  -H "X-API-Key: $KEY"
+```
+
+##### Response (200)
+
+```json
+{
+  "success": true,
+  "message": "Redo merge completed: merged 'stranger_13894' into 'Louis Viret' (52 faces transferred)",
+  "data": {
+    "merge_id": "550e8400-e29b-41d4-a716-446655440000",
+    "faces_transferred": 52,
+    "aliases_re_added": 1,
+    "metadata_fields_re_added": 2
+  }
+}
+```
+
+| Field | Type | Description |
+|-------|------|-------------|
+| `merge_id` | string | The merge operation ID |
+| `faces_transferred` | integer | Number of faces transferred from source to target |
+| `aliases_re_added` | integer | Number of aliases restored to target |
+| `metadata_fields_re_added` | integer | Number of metadata fields restored to target |
+
+##### Error Responses
+
+| HTTP | When |
+|------|------|
+| `400` | Merge not undone, deadline expired, or cannot redo |
+| `404` | Merge record not found |
+| `500` | Database error |
+
+---
+
+### 4. Delete History & Undo/Redo
+
+#### Delete Operation Overview
+
+| Property | Value |
+|----------|-------|
+| Storage | PostgreSQL `identity_history` table |
+| Snapshot | `{"identity": {...full row...}, "unbound_faces": [{file_uuid, face_id, trace_id}, ...]}` |
+| Max records | 1 active delete record per identity (redo stack cleared on new delete) |
+| Undo support | Yes — recreates identity row, re-binds faces |
+| Redo support | Yes — re-deletes the identity |
+| Identity file | Deleted on delete, recreated on undo |
+
+#### Snapshot Format
+
+```json
+{
+  "identity": {
+    "id": 9,
+    "uuid": "a9a90105-6d6b-46ff-92da-0c3c1a57dff4",
+    "name": "Cary Grant",
+    "identity_type": "people",
+    "source": "tmdb",
+    "status": "confirmed",
+    "metadata": {},
+    "tmdb_id": 112,
+    "tmdb_profile": null
+  },
+  "unbound_faces": [
+    {
+      "file_uuid": "aeed71342a899fe4b4c57b7d41bcb692",
+      "face_id": "1_5",
+      "trace_id": null
+    },
+    {
+      "file_uuid": "aeed71342a899fe4b4c57b7d41bcb692",
+      "face_id": "1_6",
+      "trace_id": 906
+    }
+  ]
+}
+```
+
+#### Stack Model
+
+```
+DELETE identity                          (undo stack, is_undone=false)
+               ↓ undo
+Identity recreated, faces re-bound
+               → delete history marked is_undone=true
+               ↓ redo (re-delete)
+Identity deleted again, faces unbound
+               → delete history marked is_undone=false
+```
+
+A new delete after an undo clears the delete redo stack (no redo possible for the old delete).
+
+#### Undo Behavior (via existing `POST /api/v1/identity/:identity_uuid/undo`)
+
+1. Normal identity lookup fails (row was deleted)
+2. Checks `identity_history` for `operation='delete' AND is_undone=false` matching the UUID in the snapshot
+3. Recreates the identity row (new internal `id`, same UUID)
+4. Re-binds all faces listed in `unbound_faces` to the new identity
+5. Marks the `identity_history` delete record as `is_undone=true` with `undone_at=NOW()`
+6. Syncs `identity.json` to disk
+7. Updates `_index.json`
+
+#### Redo Behavior (via existing `POST /api/v1/identity/:identity_uuid/redo`)
+
+1. Identity lookup succeeds (identity was restored by prior undo)
+2. Checks `identity_history` for `operation='delete' AND is_undone=true` matching the identity_id
+3. Deletes `identity.json` from disk
+4. Unbinds all faces (`identity_id = NULL`)
+5. Deletes the identity row
+6. Marks the delete history record as `is_undone=false`
+7. Returns success
+
+#### Error Responses (delete undo/redo)
+
+| HTTP | Scenario |
+|------|----------|
+| `400` | No delete history available (either no delete or already undone/redone) |
+| `404` | Identity not found (for redo — identity wasn't restored) |
+| `500` | Database error |
+
+---
+
+### Comparison: PATCH vs Bind vs Merge vs Delete Undo/Redo
+
+| Aspect | PATCH Undo/Redo | Bind Undo/Redo | Merge Undo/Redo | Delete Undo/Redo |
+|--------|----------------|----------------|-----------------|------------------|
+| Storage | PostgreSQL `identity_history` | PostgreSQL `identity_history` | MongoDB `identity_merge_history` | PostgreSQL `identity_history` |
+| Operation filter | `operation='update'` | `operation IN ('bind','unbind','bind_trace')` | — | `operation='delete'` |
+| Trigger | Every PATCH | Every bind/unbind/bind_trace | Every mergeinto with `keep_history=true` | Every DELETE |
+| Undo deadline | None (unlimited) | None (unlimited) | 24 hours (renewed on redo) | None (unlimited) |
+| Redo support | Yes | Yes | Yes | Yes |
+| Step undo | Yes (`steps` param) | Yes (`steps` param) | No (full undo/redo only) | No (single record) |
+| Max records | 256 per identity | 256 per identity (shared) | Unlimited | 256 per identity (shared) |
+| User tracking | `user_id` + `user_source` | `user_id` + `user_source` | `performed_by_user` + `undone_by` / `redone_by` | `user_id` + `user_source` |
+
+---
+
+*Updated: 2026-05-28*
diff --git a/docs_v1.0/doc_wasm/pkg/md_wasm_bg.wasm b/docs_v1.0/doc_wasm/pkg/md_wasm_bg.wasm
index c1fdac7..bad117d 100644
Binary files a/docs_v1.0/doc_wasm/pkg/md_wasm_bg.wasm and b/docs_v1.0/doc_wasm/pkg/md_wasm_bg.wasm differ
diff --git a/migrations/033_create_identity_history_table.sql b/migrations/033_create_identity_history_table.sql
new file mode 100644
index 0000000..2755dc7
--- /dev/null
+++ b/migrations/033_create_identity_history_table.sql
@@ -0,0 +1,28 @@
+-- Migration: Create identity_history table for undo/redo support
+-- Description: Stores identity operation history for undo/redo (PATCH 'update'; the module docs also list bind/unbind/bind_trace/delete)
+-- Date: 2026-05-28
+
+-- Create identity_history table: one row per recorded operation, with before/after JSONB snapshots
+CREATE TABLE IF NOT EXISTS identity_history (
+    id BIGSERIAL PRIMARY KEY,
+    identity_id INTEGER NOT NULL REFERENCES identities(id) ON DELETE CASCADE,  -- NOTE(review): CASCADE removes history rows with the identity row; the documented delete-undo reads history after that row is gone — confirm
+    operation VARCHAR(20) NOT NULL,           -- 'update', 'create', 'delete' (module docs also use 'bind', 'unbind', 'bind_trace')
+    before_snapshot JSONB,                    -- full state before the operation
+    after_snapshot JSONB,                     -- full state after the operation
+    is_undone BOOLEAN DEFAULT FALSE,          -- whether this operation has been undone
+    undone_at TIMESTAMPTZ,                    -- time of the undo
+    user_id VARCHAR(100),                     -- operator who performed the operation
+    user_source VARCHAR(50),                  -- 'wordpress', 'api', 'cli'
+    created_at TIMESTAMPTZ DEFAULT NOW()
+);
+
+-- Create indexes for efficient undo/redo operations (per-identity lookup, newest first)
+CREATE INDEX IF NOT EXISTS idx_identity_history_identity_time 
+    ON identity_history(identity_id, created_at DESC);
+
+CREATE INDEX IF NOT EXISTS idx_identity_history_not_undone 
+    ON identity_history(identity_id, created_at DESC) 
+    WHERE NOT is_undone;  -- partial index: covers only rows where is_undone is FALSE
+
+-- Table-level description stored in the catalog; the text mentions PATCH only, and the 256-record cap is not enforced by this DDL
+COMMENT ON TABLE identity_history IS 'Stores identity PATCH operation history for undo/redo support. Max 256 records per identity.';
\ No newline at end of file
diff --git a/migrations/3002_public_schema_pipeline_tables.sql b/migrations/3002_public_schema_pipeline_tables.sql
new file mode 100644
index 0000000..ada9e26
--- /dev/null
+++ b/migrations/3002_public_schema_pipeline_tables.sql
@@ -0,0 +1,314 @@
+-- ============================================================
+-- 3002/3003 Schema Separation: Create pipeline tables in public
+-- Generated: 2026-05-17
+-- ============================================================
+-- Run (paths and connection string are machine-specific; adjust for your host): /Users/accusys/pgsql/18.3/bin/psql "postgres://accusys@localhost:5432/momentry" -f migrations/3002_public_schema_pipeline_tables.sql
+-- ============================================================
+
+BEGIN;  -- open a transaction for the DDL statements that follow
+
+-- ============================================================
+-- 1. videos: id sequence, table definition, and sequence ownership
+-- ============================================================
+CREATE SEQUENCE IF NOT EXISTS public.videos_id_seq AS integer START WITH 1;  -- created first: the id DEFAULT below references it
+
+CREATE TABLE IF NOT EXISTS public.videos (
+    id integer DEFAULT nextval('public.videos_id_seq') NOT NULL,  -- NOTE(review): no PRIMARY KEY declared inline — confirm it is added later in this migration
+    file_uuid character varying(32) NOT NULL,
+    file_path text NOT NULL,
+    file_name text NOT NULL,
+    duration double precision,
+    width integer,
+    height integer,
+    fps double precision,
+    probe_json jsonb,
+    created_at timestamp with time zone DEFAULT CURRENT_TIMESTAMP,
+    updated_at timestamp with time zone DEFAULT CURRENT_TIMESTAMP,
+    fs_video boolean DEFAULT false,
+    fs_json boolean DEFAULT false,
+    psql_chunk boolean DEFAULT false,
+    pobject_chunk boolean DEFAULT false,
+    mobject_chunk boolean DEFAULT false,
+    pvector_chunk boolean DEFAULT false,
+    qvector_chunk boolean DEFAULT false,
+    status character varying(20) DEFAULT 'pending'::character varying,
+    user_id bigint,
+    job_id integer,
+    registration_time timestamp with time zone DEFAULT CURRENT_TIMESTAMP,
+    file_type character varying(20),
+    processing_status jsonb DEFAULT '{}'::jsonb,
+    birth_registration jsonb,
+    total_frames bigint DEFAULT 0,
+    parent_uuid character varying(32),
+    cut_done boolean DEFAULT false,
+    scene_done boolean DEFAULT false,
+    audio_tracks jsonb DEFAULT '[]'::jsonb,
+    cut_count integer DEFAULT 0,
+    cut_max_duration double precision DEFAULT 0,
+    content_hash text
+);
+
+ALTER SEQUENCE public.videos_id_seq OWNED BY public.videos.id;  -- sequence is dropped together with the column/table
+
+-- ============================================================
+-- 2. chunk (with pgvector support): id sequence, table definition, and sequence ownership
+-- ============================================================
+CREATE SEQUENCE IF NOT EXISTS public.chunks_id_seq AS integer START WITH 1;  -- note: sequence name is plural (chunks) while the table is chunk
+
+CREATE TABLE IF NOT EXISTS public.chunk (
+    id integer DEFAULT nextval('public.chunks_id_seq') NOT NULL,
+    file_uuid character varying(32) NOT NULL,
+    chunk_type character varying(32) NOT NULL,
+    start_time double precision NOT NULL,
+    end_time double precision NOT NULL,
+    content jsonb NOT NULL,
+    vector_id character varying(64),
+    created_at timestamp without time zone DEFAULT CURRENT_TIMESTAMP,  -- NOTE(review): without time zone, unlike updated_at below — confirm intended
+    file_id integer,
+    text_content text,
+    frame_count integer DEFAULT 0,
+    pre_chunk_ids integer[],
+    parent_chunk_id character varying(64),  -- NOTE(review): narrower than chunk_id (128) below — confirm parent ids fit
+    child_chunk_ids text[],
+    search_vector tsvector,
+    fps double precision DEFAULT 24.0,
+    start_frame bigint DEFAULT 0,
+    end_frame bigint DEFAULT 0,
+    metadata jsonb,
+    updated_at timestamp with time zone DEFAULT now(),
+    visual_stats jsonb,
+    summary_text text,
+    chunk_id character varying(128) NOT NULL,
+    embedding public.vector,  -- requires the vector type to exist in schema public; no dimension is specified here
+    old_chunk_id character varying(128),
+    chunk_index integer DEFAULT 0,
+    unique_key character varying  -- varchar with no length limit
+);
+
+ALTER SEQUENCE public.chunks_id_seq OWNED BY public.chunk.id;  -- sequence is dropped together with the column/table
+
+-- ============================================================
+-- 3. chunk_vectors: id sequence, table definition, and sequence ownership
+-- ============================================================
+CREATE SEQUENCE IF NOT EXISTS public.chunk_vectors_id_seq AS integer START WITH 1;  -- created first: the id DEFAULT below references it
+
+CREATE TABLE IF NOT EXISTS public.chunk_vectors (
+    id integer DEFAULT nextval('public.chunk_vectors_id_seq') NOT NULL,
+    chunk_id character varying(64) NOT NULL,  -- NOTE(review): public.chunk.chunk_id is varchar(128) — confirm 64 is wide enough
+    uuid character varying(64) NOT NULL,
+    chunk_type character varying(32) DEFAULT 'sentence'::character varying NOT NULL,
+    embedding jsonb,  -- stored as JSONB here, not as a vector type
+    created_at timestamp with time zone DEFAULT now()
+);
+
+ALTER SEQUENCE public.chunk_vectors_id_seq OWNED BY public.chunk_vectors.id;  -- sequence is dropped together with the column/table
+
+-- ============================================================
+-- 4. cuts: id sequence, table definition, and sequence ownership
+-- ============================================================
+CREATE SEQUENCE IF NOT EXISTS public.cuts_id_seq AS integer START WITH 1;  -- created first: the id DEFAULT below references it
+
+CREATE TABLE IF NOT EXISTS public.cuts (
+    id integer DEFAULT nextval('public.cuts_id_seq') NOT NULL,
+    file_uuid character varying(32) NOT NULL,
+    cut_number integer NOT NULL,
+    start_frame bigint NOT NULL,  -- frame bounds are required; the time bounds below are nullable
+    end_frame bigint NOT NULL,
+    start_time double precision,
+    end_time double precision,
+    fps double precision,
+    metadata jsonb DEFAULT '{}'::jsonb,
+    created_at timestamp with time zone DEFAULT now()
+);
+
+ALTER SEQUENCE public.cuts_id_seq OWNED BY public.cuts.id;  -- sequence is dropped together with the column/table
+
+-- ============================================================
+-- 5. frames: id sequence, table definition, and sequence ownership
+-- ============================================================
+CREATE SEQUENCE IF NOT EXISTS public.frames_id_seq AS integer START WITH 1;  -- created first: the id DEFAULT below references it
+
+CREATE TABLE IF NOT EXISTS public.frames (
+    id integer DEFAULT nextval('public.frames_id_seq') NOT NULL,
+    file_id integer NOT NULL,
+    frame_number bigint NOT NULL,
+    timestamp double precision NOT NULL,  -- a numeric (double) value despite the column name; not a SQL timestamp type
+    fps double precision DEFAULT 24.0,
+    yolo_objects jsonb,
+    ocr_results jsonb,
+    face_results jsonb,
+    frame_path text,
+    created_at timestamp without time zone DEFAULT CURRENT_TIMESTAMP  -- NOTE(review): without time zone, unlike most created_at columns in this migration — confirm intended
+);
+
+ALTER SEQUENCE public.frames_id_seq OWNED BY public.frames.id;  -- sequence is dropped together with the column/table
+
+-- ============================================================
+-- 6. monitor_jobs: id sequence, table definition, and sequence ownership
+-- ============================================================
+CREATE SEQUENCE IF NOT EXISTS public.monitor_jobs_id_seq AS integer START WITH 1;  -- created first: the id DEFAULT below references it
+
+CREATE TABLE IF NOT EXISTS public.monitor_jobs (
+    id integer DEFAULT nextval('public.monitor_jobs_id_seq') NOT NULL,
+    uuid character varying(32) NOT NULL,
+    video_path character varying(512),
+    status character varying(20) DEFAULT 'pending'::character varying NOT NULL,
+    current_processor character varying(20),
+    progress_total integer DEFAULT 0,
+    progress_current integer DEFAULT 0,
+    error_count integer DEFAULT 0,
+    last_error text,
+    started_at timestamp without time zone,  -- NOTE(review): without time zone, unlike updated_at/created_at below — confirm intended
+    updated_at timestamp with time zone,  -- no DEFAULT: stays NULL unless the writer sets it
+    created_at timestamp with time zone DEFAULT CURRENT_TIMESTAMP,
+    video_id bigint,
+    user_id bigint,
+    processors text[],
+    completed_processors text[],
+    failed_processors text[]
+);
+
+ALTER SEQUENCE public.monitor_jobs_id_seq OWNED BY public.monitor_jobs.id;  -- sequence is dropped together with the column/table
+
+-- ============================================================
+-- 7. processor_results: id sequence, table definition, and sequence ownership
+-- ============================================================
+CREATE SEQUENCE IF NOT EXISTS public.processor_results_id_seq AS integer START WITH 1;  -- created first: the id DEFAULT below references it
+
+CREATE TABLE IF NOT EXISTS public.processor_results (
+    id integer DEFAULT nextval('public.processor_results_id_seq') NOT NULL,
+    job_id integer,
+    video_id bigint,
+    processor character varying(20),  -- NOTE(review): a separate processor_type varchar(64) column exists below — confirm how the two differ
+    status character varying(20) DEFAULT 'pending'::character varying NOT NULL,
+    output_path text,
+    started_at timestamp with time zone,
+    completed_at timestamp with time zone,
+    error_message text,
+    progress_total integer DEFAULT 0,
+    progress_current integer DEFAULT 0,
+    last_checkpoint jsonb,
+    created_at timestamp with time zone DEFAULT CURRENT_TIMESTAMP,
+    updated_at timestamp with time zone DEFAULT CURRENT_TIMESTAMP,
+    duration_secs double precision,
+    chunks_produced integer DEFAULT 0,
+    frames_processed integer DEFAULT 0,
+    output_size_bytes bigint DEFAULT 0,
+    file_uuid character varying(32),
+    result jsonb,
+    output_data jsonb,
+    retry_count integer DEFAULT 0,
+    processor_type character varying(64),
+    uuid character varying(255)  -- NOTE(review): much wider than file_uuid (32) above — confirm what this column holds
+);
+
+ALTER SEQUENCE public.processor_results_id_seq OWNED BY public.processor_results.id;  -- sequence is dropped together with the column/table
+
+-- ============================================================
+-- 8. processor_versions: table only (no id column or sequence, unlike the other tables in this migration)
+-- ============================================================
+CREATE TABLE IF NOT EXISTS public.processor_versions (
+    processor character varying(64) NOT NULL,  -- NOTE(review): no key/unique constraint declared inline — confirm one is added later in this migration
+    model_version character varying(128) NOT NULL,
+    processor_type character varying(32) DEFAULT 'processor'::character varying NOT NULL,
+    dependencies text[] DEFAULT '{}'::text[],
+    updated_at timestamp with time zone DEFAULT CURRENT_TIMESTAMP,
+    file_uuid character varying(64)  -- NOTE(review): 64 wide here vs 32 in videos/cuts — confirm intended
+);
+
+-- ============================================================
+-- 9. parent_chunks
+-- ============================================================
+CREATE SEQUENCE IF NOT EXISTS public.parent_chunks_id_seq AS integer START WITH 1;
+-- Summary rows keyed by uuid (indexed as idx_parent_chunks_uuid); metadata defaults to an empty JSON object.
+CREATE TABLE IF NOT EXISTS public.parent_chunks (
+    id integer DEFAULT nextval('public.parent_chunks_id_seq') NOT NULL,
+    uuid character varying(32) NOT NULL,
+    chunk_id character varying(64),
+    summary_text text,
+    summary_tsvector tsvector,  -- NOTE(review): nothing visible here fills this from summary_text or indexes it (no GIN index); confirm it is maintained elsewhere
+    metadata jsonb DEFAULT '{}'::jsonb
+);
+-- Make the sequence owned by the id column so it is dropped together with the column/table.
+ALTER SEQUENCE public.parent_chunks_id_seq OWNED BY public.parent_chunks.id;
+
+-- ============================================================
+-- 10. tkg_edges
+-- ============================================================
+CREATE SEQUENCE IF NOT EXISTS public.tkg_edges_id_seq AS bigint START WITH 1;
+-- Typed edges between two node ids, scoped by file_uuid; properties defaults to an empty JSON object.
+CREATE TABLE IF NOT EXISTS public.tkg_edges (
+    id bigint DEFAULT nextval('public.tkg_edges_id_seq') NOT NULL,
+    edge_type character varying(64) NOT NULL,
+    source_node_id bigint NOT NULL,  -- presumably tkg_nodes.id; no FOREIGN KEY is declared here, verify against the writer
+    target_node_id bigint NOT NULL,  -- presumably tkg_nodes.id; no FOREIGN KEY is declared here, verify against the writer
+    file_uuid character varying(64) NOT NULL,
+    properties jsonb NOT NULL DEFAULT '{}'::jsonb,
+    created_at timestamp with time zone DEFAULT CURRENT_TIMESTAMP
+);
+-- Make the sequence owned by the id column so it is dropped together with the column/table.
+ALTER SEQUENCE public.tkg_edges_id_seq OWNED BY public.tkg_edges.id;
+
+-- ============================================================
+-- 11. tkg_nodes
+-- ============================================================
+CREATE SEQUENCE IF NOT EXISTS public.tkg_nodes_id_seq AS bigint START WITH 1;
+-- Typed nodes identified by an external_id within a file_uuid; label is optional, properties defaults to '{}'.
+CREATE TABLE IF NOT EXISTS public.tkg_nodes (
+    id bigint DEFAULT nextval('public.tkg_nodes_id_seq') NOT NULL,  -- NOTE(review): no PRIMARY KEY is declared in the visible part of this script
+    node_type character varying(64) NOT NULL,
+    external_id character varying(256) NOT NULL,  -- indexed below, but not uniquely
+    file_uuid character varying(64) NOT NULL,
+    label character varying(512),
+    properties jsonb NOT NULL DEFAULT '{}'::jsonb,
+    created_at timestamp with time zone DEFAULT CURRENT_TIMESTAMP
+);
+-- Make the sequence owned by the id column so it is dropped together with the column/table.
+ALTER SEQUENCE public.tkg_nodes_id_seq OWNED BY public.tkg_nodes.id;
+
+-- ============================================================
+-- Indexes & Constraints
+-- ============================================================
+
+-- videos: at most one row per file_uuid
+CREATE UNIQUE INDEX IF NOT EXISTS idx_videos_file_uuid ON public.videos (file_uuid);
+
+-- chunk: lookups by file, type, parent and (file, type); old_chunk_id is unique per file only where it is set (partial index)
+CREATE INDEX IF NOT EXISTS idx_chunk_file_uuid ON public.chunk (file_uuid);
+CREATE INDEX IF NOT EXISTS idx_chunk_type ON public.chunk (chunk_type);
+CREATE INDEX IF NOT EXISTS idx_chunk_parent ON public.chunk (parent_chunk_id);
+CREATE INDEX IF NOT EXISTS idx_chunk_file_type ON public.chunk (file_uuid, chunk_type);
+CREATE UNIQUE INDEX IF NOT EXISTS idx_chunk_file_old_id ON public.chunk (file_uuid, old_chunk_id) WHERE old_chunk_id IS NOT NULL;
+
+-- chunk_vectors: lookups by uuid and by chunk_id
+CREATE INDEX IF NOT EXISTS idx_chunk_vec_uuid ON public.chunk_vectors (uuid);
+CREATE INDEX IF NOT EXISTS idx_chunk_vec_chunk ON public.chunk_vectors (chunk_id);
+
+-- cuts: lookups by file_uuid
+CREATE INDEX IF NOT EXISTS idx_cuts_file_uuid ON public.cuts (file_uuid);
+
+-- frames: lookups by file_id
+CREATE INDEX IF NOT EXISTS idx_frames_file_id ON public.frames (file_id);
+
+-- monitor_jobs: at most one job per uuid; status is indexed for filtering
+CREATE UNIQUE INDEX IF NOT EXISTS idx_monitor_jobs_uuid ON public.monitor_jobs (uuid);
+CREATE INDEX IF NOT EXISTS idx_monitor_jobs_status ON public.monitor_jobs (status);
+
+-- processor_results: job_id and processor_type are both nullable, and NULLs never collide in a unique index, so rows missing either value are not deduplicated
+CREATE INDEX IF NOT EXISTS idx_pr_job_id ON public.processor_results (job_id);
+CREATE INDEX IF NOT EXISTS idx_pr_uuid ON public.processor_results (uuid);
+CREATE UNIQUE INDEX IF NOT EXISTS idx_pr_job_processor_type ON public.processor_results (job_id, processor_type);
+
+-- parent_chunks: lookups by uuid (non-unique)
+CREATE INDEX IF NOT EXISTS idx_parent_chunks_uuid ON public.parent_chunks (uuid);
+
+-- tkg_edges: NOTE(review) no index on source_node_id/target_node_id is created here; confirm edge lookups by node are not needed
+CREATE INDEX IF NOT EXISTS idx_tkg_edges_file_uuid ON public.tkg_edges (file_uuid);
+CREATE INDEX IF NOT EXISTS idx_tkg_edges_type ON public.tkg_edges (edge_type);
+
+-- tkg_nodes: lookups by file, node type and external id (all non-unique)
+CREATE INDEX IF NOT EXISTS idx_tkg_nodes_file_uuid ON public.tkg_nodes (file_uuid);
+CREATE INDEX IF NOT EXISTS idx_tkg_nodes_type ON public.tkg_nodes (node_type);
+CREATE INDEX IF NOT EXISTS idx_tkg_nodes_external ON public.tkg_nodes (external_id);
+
+COMMIT;
diff --git a/momentry_runtime/plist/com.momentry.api.plist b/momentry_runtime/plist/com.momentry.api.plist
index 78a0b78..7a327be 100644
--- a/momentry_runtime/plist/com.momentry.api.plist
+++ b/momentry_runtime/plist/com.momentry.api.plist
@@ -12,43 +12,13 @@
     <string>staff</string>
     
     <key>WorkingDirectory</key>
-    <string>/Users/accusys/momentry_core_0.1</string>
+    <string>/Users/accusys/momentry_core</string>
     
     <key>ProgramArguments</key>
     <array>
-        <string>/Users/accusys/momentry_core_0.1/target/release/momentry</string>
-        <string>server</string>
-        <string>--port</string>
-        <string>3002</string>
+        <string>/Users/accusys/momentry_core/scripts/wrapper_production.sh</string>
     </array>
     
-    <key>EnvironmentVariables</key>
-    <dict>
-        <key>PATH</key>
-        <string>/opt/homebrew/bin:/usr/local/bin:/usr/bin:/bin:/usr/sbin:/sbin</string>
-        
-        <key>DATABASE_URL</key>
-        <string>postgres://accusys@localhost:5432/momentry</string>
-        
-        <key>DB_MAX_CONNECTIONS</key>
-        <string>50</string>
-        
-        <key>DB_ACQUIRE_TIMEOUT</key>
-        <string>30</string>
-        
-        <key>REDIS_URL</key>
-        <string>redis://:accusys@localhost:6379</string>
-        
-        <key>REDIS_PASSWORD</key>
-        <string>accusys</string>
-        
-        <key>OLLAMA_HOST</key>
-        <string>http://localhost:11434</string>
-        
-        <key>QDRANT_URL</key>
-        <string>http://127.0.0.1:6333</string>
-    </dict>
-    
     <key>RunAtLoad</key>
     <true/>
     
diff --git a/momentry_runtime/plist/com.momentry.embedding.plist b/momentry_runtime/plist/com.momentry.embedding.plist
new file mode 100644
index 0000000..6b34587
--- /dev/null
+++ b/momentry_runtime/plist/com.momentry.embedding.plist
@@ -0,0 +1,34 @@
+<?xml version="1.0" encoding="UTF-8"?>
+<!DOCTYPE plist PUBLIC "-//Apple//DTD PLIST 1.0//EN" "http://www.apple.com/DTDs/PropertyList-1.0.dtd">
+<plist version="1.0">
+<dict>
+    <key>Label</key>
+    <string>com.momentry.embedding</string>
+
+    <key>UserName</key>
+    <string>accusys</string>
+
+    <key>GroupName</key>
+    <string>staff</string>
+
+    <key>WorkingDirectory</key>
+    <string>/Users/accusys/momentry_core</string>
+    <!-- The job only runs the wrapper script; what the script starts is not visible in this plist. -->
+    <key>ProgramArguments</key>
+    <array>
+        <string>/Users/accusys/momentry_core/scripts/wrapper_embedding.sh</string>
+    </array>
+    <!-- Start when the job is loaded and restart it whenever it exits. -->
+    <key>RunAtLoad</key>
+    <true/>
+
+    <key>KeepAlive</key>
+    <true/>
+    <!-- NOTE(review): logs go to .../momentry/log while .env.development sets MOMENTRY_LOG_DIR=.../momentry/logs; confirm which directory is intended. -->
+    <key>StandardOutPath</key>
+    <string>/Users/accusys/momentry/log/embedding.log</string>
+
+    <key>StandardErrorPath</key>
+    <string>/Users/accusys/momentry/log/embedding.error.log</string>
+</dict>
+</plist>
diff --git a/momentry_runtime/plist/com.momentry.gitea.plist b/momentry_runtime/plist/com.momentry.gitea.plist
index cc719cc..ec1d667 100644
--- a/momentry_runtime/plist/com.momentry.gitea.plist
+++ b/momentry_runtime/plist/com.momentry.gitea.plist
@@ -13,7 +13,7 @@
     
     <key>ProgramArguments</key>
     <array>
-        <string>/opt/homebrew/opt/gitea/bin/gitea</string>
+        <string>/Users/accusys/gitea/bin/gitea</string>
         <string>web</string>
         <string>--config</string>
         <string>/Users/accusys/momentry/etc/gitea/app.ini</string>
diff --git a/momentry_runtime/plist/com.momentry.llamacpp-a4b.plist b/momentry_runtime/plist/com.momentry.llamacpp-a4b.plist
new file mode 100644
index 0000000..ea1cf4a
--- /dev/null
+++ b/momentry_runtime/plist/com.momentry.llamacpp-a4b.plist
@@ -0,0 +1,48 @@
+<?xml version="1.0" encoding="UTF-8"?>
+<!DOCTYPE plist PUBLIC "-//Apple//DTD PLIST 1.0//EN" "http://www.apple.com/DTDs/PropertyList-1.0.dtd">
+<plist version="1.0">
+<dict>
+    <key>Label</key>
+    <string>com.momentry.llamacpp-a4b</string>
+
+    <key>UserName</key>
+    <string>accusys</string>
+
+    <key>WorkingDirectory</key>
+    <string>/Users/accusys</string>
+    <!-- llama-server for the A4B model with its mmproj file on port 8082 (the port the MOMENTRY_LLM_CHAT_URL / SUMMARY_URL settings point at). -->
+    <key>ProgramArguments</key>
+    <array>
+        <string>/Users/accusys/llama/bin/llama-server</string>
+        <string>-m</string>
+        <string>/Users/accusys/models/google_gemma-4-26B-A4B-it-Q5_K_M.gguf</string>
+        <string>--mmproj</string>
+        <string>/Users/accusys/models/gemma-4-26B-A4B-it.mmproj-f16.gguf</string>
+        <string>--host</string>
+        <string>0.0.0.0</string> <!-- NOTE(review): binds every interface, while the .env URLs use 127.0.0.1; confirm remote access is intended -->
+        <string>--port</string>
+        <string>8082</string>
+        <string>-ngl</string>
+        <string>99</string>
+        <string>-c</string>
+        <string>16384</string>
+        <string>--temp</string>
+        <string>0.1</string>
+        <string>--mlock</string>
+        <string>--reasoning</string>
+        <string>off</string>
+    </array>
+    <!-- Start when the job is loaded and restart it whenever it exits. -->
+    <key>RunAtLoad</key>
+    <true/>
+
+    <key>KeepAlive</key>
+    <true/>
+    <!-- NOTE(review): logs go to .../momentry/log while .env.development sets MOMENTRY_LOG_DIR=.../momentry/logs; confirm which directory is intended. -->
+    <key>StandardOutPath</key>
+    <string>/Users/accusys/momentry/log/llamacpp-a4b.log</string>
+
+    <key>StandardErrorPath</key>
+    <string>/Users/accusys/momentry/log/llamacpp-a4b.error.log</string>
+</dict>
+</plist>
diff --git a/momentry_runtime/plist/com.momentry.llamacpp-e4b.plist b/momentry_runtime/plist/com.momentry.llamacpp-e4b.plist
new file mode 100644
index 0000000..8c27cfb
--- /dev/null
+++ b/momentry_runtime/plist/com.momentry.llamacpp-e4b.plist
@@ -0,0 +1,46 @@
+<?xml version="1.0" encoding="UTF-8"?>
+<!DOCTYPE plist PUBLIC "-//Apple//DTD PLIST 1.0//EN" "http://www.apple.com/DTDs/PropertyList-1.0.dtd">
+<plist version="1.0">
+<dict>
+    <key>Label</key>
+    <string>com.momentry.llamacpp-e4b</string>
+
+    <key>UserName</key>
+    <string>accusys</string>
+
+    <key>WorkingDirectory</key>
+    <string>/Users/accusys</string>
+    <!-- llama-server for the E4B model with its mmproj file on port 8083 (the port MOMENTRY_LLM_VISION_URL points at). -->
+    <key>ProgramArguments</key>
+    <array>
+        <string>/Users/accusys/llama/bin/llama-server</string>
+        <string>-m</string>
+        <string>/Users/accusys/models/gemma-4-E4B-it-Q4_K_M.gguf</string>
+        <string>--mmproj</string>
+        <string>/Users/accusys/models/mmproj-gemma-4-E4B-it-BF16.gguf</string>
+        <string>--host</string>
+        <string>0.0.0.0</string> <!-- NOTE(review): binds every interface, while the .env URL uses 127.0.0.1; confirm remote access is intended -->
+        <string>--port</string>
+        <string>8083</string>
+        <string>-ngl</string>
+        <string>99</string>
+        <string>-c</string>
+        <string>16384</string>
+        <string>--temp</string>
+        <string>0.1</string>
+        <string>--mlock</string>
+    </array>
+    <!-- Start when the job is loaded and restart it whenever it exits. -->
+    <key>RunAtLoad</key>
+    <true/>
+
+    <key>KeepAlive</key>
+    <true/>
+    <!-- NOTE(review): logs go to .../momentry/log while .env.development sets MOMENTRY_LOG_DIR=.../momentry/logs; confirm which directory is intended. -->
+    <key>StandardOutPath</key>
+    <string>/Users/accusys/momentry/log/llamacpp-e4b.log</string>
+
+    <key>StandardErrorPath</key>
+    <string>/Users/accusys/momentry/log/llamacpp-e4b.error.log</string>
+</dict>
+</plist>
diff --git a/momentry_runtime/plist/com.momentry.postgresql.plist b/momentry_runtime/plist/com.momentry.postgresql.plist
index d799ab2..8a4dcf2 100644
--- a/momentry_runtime/plist/com.momentry.postgresql.plist
+++ b/momentry_runtime/plist/com.momentry.postgresql.plist
@@ -15,13 +15,13 @@
     </dict>
 
     <key>WorkingDirectory</key>
-    <string>/Users/accusys/momentry/var/postgresql</string>
+    <string>/Users/accusys</string>
     
     <key>ProgramArguments</key>
     <array>
-        <string>/opt/homebrew/opt/postgresql@18/bin/postgres</string>
+        <string>/Users/accusys/pgsql/18.3/bin/postgres</string>
         <string>-D</string>
-        <string>/Users/accusys/momentry/var/postgresql</string>
+        <string>/Users/accusys/pgsql/data</string>
     </array>
     
     <key>RunAtLoad</key>
diff --git a/momentry_runtime/plist/com.momentry.sftpgo.plist b/momentry_runtime/plist/com.momentry.sftpgo.plist
index e6c3c60..fc3c9c9 100644
--- a/momentry_runtime/plist/com.momentry.sftpgo.plist
+++ b/momentry_runtime/plist/com.momentry.sftpgo.plist
@@ -9,14 +9,14 @@
     <string>accusys</string>
 
     <key>WorkingDirectory</key>
-    <string>/Users/accusys/workspace/sftpgo</string>
+    <string>/Users/accusys/momentry/var/sftpgo</string>
     
     <key>ProgramArguments</key>
     <array>
         <string>/Users/accusys/bin/sftpgo</string>
         <string>serve</string>
-        <string>--config-file</string>
-        <string>/Users/accusys/momentry/etc/sftpgo/sftpgo.json</string>
+        <string>-c</string>
+        <string>/Users/accusys/momentry/etc/sftpgo</string>
     </array>
     
     <key>EnvironmentVariables</key>
diff --git a/portal/src/components/Face3DViewer.vue b/portal/src/components/Face3DViewer.vue
new file mode 100644
index 0000000..83a80db
--- /dev/null
+++ b/portal/src/components/Face3DViewer.vue
@@ -0,0 +1,174 @@
+<template>
+  <div ref="container" class="w-full h-full min-h-[300px] bg-gray-900 rounded-lg overflow-hidden"></div>
+</template>
+
+<script setup lang="ts">
+import { ref, onMounted, onBeforeUnmount } from 'vue'
+import * as THREE from 'three'
+import { OrbitControls } from 'three/examples/jsm/controls/OrbitControls.js'
+
+const props = defineProps<{
+  landmarks: number[][]  // 468 x [x, y, z]
+}>()
+
+const container = ref<HTMLElement>()
+let renderer: THREE.WebGLRenderer | null = null
+let scene: THREE.Scene | null = null
+let camera: THREE.PerspectiveCamera | null = null
+let controls: OrbitControls | null = null
+let animId: number
+let objects: THREE.Object3D[] = []
+
+/** Releases everything init() created (observer, objects, controls, renderer, canvas) so the viewer can be rebuilt or unmounted. */
+function disposeScene() {
+  cancelAnimationFrame(animId)
+  // init() stores a ResizeObserver on the container element; stop it together with the scene.
+  ;(container.value as any)?.__resizeObserver?.disconnect()
+  for (const obj of objects) {
+    scene?.remove(obj)
+    // The mesh and the point cloud each own a geometry and one or more materials.
+    if (obj instanceof THREE.Mesh || obj instanceof THREE.Points) {
+      obj.geometry?.dispose()
+      const mats = Array.isArray(obj.material) ? obj.material : [obj.material]
+      mats.forEach(m => m?.dispose())
+    }
+  }
+  objects = []
+  controls?.dispose()
+  controls = null
+  // Detach the canvas as well; otherwise a second init() would stack another <canvas> in the container.
+  renderer?.domElement.remove()
+  renderer?.dispose()
+  renderer = null
+  scene = null
+  camera = null
+}
+
+// Sparse triangle list over face-landmark indices (presumably the 468-point MediaPipe Face Mesh layout; confirm with the producer).
+// Each triple appears once: the mesh material is semi-transparent, so a repeated triangle would be blended twice.
+const FACES_TRI = [
+  // Eyes
+  [33, 133, 7], [33, 7, 163], [160, 159, 158], [159, 158, 157],
+  // Nose
+  [168, 6, 197], [6, 197, 195], [197, 195, 5],
+  // Mouth outer
+  [61, 146, 91], [91, 181, 84], [84, 17, 314], [314, 405, 321],
+  // Mouth inner
+  [78, 95, 88], [95, 88, 178], [87, 14, 317], [14, 317, 402],
+  // Left eye brow
+  [46, 53, 52], [53, 52, 65],
+  // Right eye brow
+  [276, 283, 282], [283, 282, 295],
+  // Face oval (its first three triangles were previously also listed under a separate "Jaw" heading)
+  [10, 338, 297], [297, 332, 284], [284, 251, 389], [389, 356, 454],
+  [454, 323, 361], [361, 288, 397], [397, 365, 379], [379, 378, 400],
+  [400, 377, 152], [152, 148, 176], [176, 149, 150], [150, 136, 172],
+  [172, 58, 132], [132, 93, 234], [234, 127, 162], [162, 21, 54],
+  [54, 103, 67], [67, 109, 10]
+]
+
+/**
+ * Builds an indexed BufferGeometry from landmark triples.
+ * x and y are re-centred around 0.5 and doubled (y is flipped), z is doubled.
+ */
+function buildMesh(pts: number[][]): THREE.BufferGeometry {
+  const count = pts.length
+  const coords = new Float32Array(count * 3)
+  pts.forEach(([px, py, pz], n) => {
+    coords.set([(px - 0.5) * 2, -(py - 0.5) * 2, pz * 2], n * 3)
+  })
+  // Keep only the triangles whose three landmark indices all exist in this input.
+  const triIndices = FACES_TRI.filter(tri => tri.every(v => v < count)).flat()
+  const geometry = new THREE.BufferGeometry()
+  geometry.setAttribute('position', new THREE.BufferAttribute(coords, 3))
+  geometry.setIndex(triIndices)
+  geometry.computeVertexNormals()
+  return geometry }
+
+/** Creates the renderer, camera, orbit controls, landmark mesh/points and lights inside the container, then starts the render loop. */
+function init() {
+  if (!container.value) return
+  // Dispose previous scene if re-initializing
+  disposeScene()
+
+  const rect = container.value.getBoundingClientRect()
+  const w = rect.width || 400, h = rect.height || 300  // fall back to 400x300 when the container reports a zero size
+
+  scene = new THREE.Scene()
+  camera = new THREE.PerspectiveCamera(45, w / h, 0.1, 10)
+  camera.position.set(0, 0, 2.5)
+
+  renderer = new THREE.WebGLRenderer({ antialias: true, alpha: true })
+  renderer.setSize(w, h)
+  renderer.setPixelRatio(Math.min(window.devicePixelRatio, 2))  // cap the pixel ratio at 2
+  container.value.appendChild(renderer.domElement)
+
+  controls = new OrbitControls(camera, renderer.domElement)
+  controls.enableDamping = true
+  controls.dampingFactor = 0.05
+  controls.autoRotate = true
+  controls.autoRotateSpeed = 2
+
+  // Mesh: only built when landmarks were passed in; both objects are tracked in `objects` for disposal
+  if (props.landmarks?.length) {
+    const geo = buildMesh(props.landmarks)
+    const mat = new THREE.MeshPhongMaterial({
+      color: 0x4488ff,
+      flatShading: false,
+      transparent: true,
+      opacity: 0.85,
+      side: THREE.DoubleSide
+    })
+    const mesh = new THREE.Mesh(geo, mat)
+    scene.add(mesh)
+    objects.push(mesh)
+
+    // Points: a second geometry that reuses the mesh's position attribute (no copy of the vertex data)
+    const ptGeo = new THREE.BufferGeometry()
+    ptGeo.setAttribute('position', geo.getAttribute('position')!)
+    const ptMat = new THREE.PointsMaterial({ color: 0x88bbff, size: 0.008 })
+    const points = new THREE.Points(ptGeo, ptMat)
+    scene.add(points)
+    objects.push(points)
+  }
+
+  // Lights: one ambient plus two directional lights (these are not added to `objects`)
+  const ambient = new THREE.AmbientLight(0x404060)
+  scene.add(ambient)
+  const dir = new THREE.DirectionalLight(0xffffff, 1)
+  dir.position.set(1, 1, 1)
+  scene.add(dir)
+  const dir2 = new THREE.DirectionalLight(0x8888ff, 0.5)
+  dir2.position.set(-1, -1, 0.5)
+  scene.add(dir2)
+
+  // Resize observer: keeps the renderer size and camera aspect in sync with the container
+  const resizeObserver = new ResizeObserver(() => {
+    if (!container.value || !renderer || !camera) return
+    const r = container.value.getBoundingClientRect()
+    const w = r.width || 400, h = r.height || 300
+    renderer.setSize(w, h)
+    camera.aspect = w / h
+    camera.updateProjectionMatrix()
+  })
+  resizeObserver.observe(container.value)
+  ;(container.value as any).__resizeObserver = resizeObserver  // stashed on the element so the unmount hook can disconnect it
+
+  animate()
+}
+
+function animate() {  // render loop: re-schedules itself on every animation frame
+  animId = requestAnimationFrame(animate)  // id is kept so cancelAnimationFrame() can stop the loop
+  controls?.update()
+  if (renderer && scene && camera) renderer.render(scene, camera)  // skip drawing once the scene has been disposed
+}
+
+onMounted(() => init())  // the scene is built once on mount; there is no watcher on `landmarks` in this component
+onBeforeUnmount(() => {
+  cancelAnimationFrame(animId)
+  if ((container.value as any)?.__resizeObserver) {  // observer that init() stored on the container element
+    (container.value as any).__resizeObserver.disconnect()
+  }
+  disposeScene()
+})
+</script>
diff --git a/portal/src/components/IdentitySwimlane.vue b/portal/src/components/IdentitySwimlane.vue
new file mode 100644
index 0000000..25dbfbc
--- /dev/null
+++ b/portal/src/components/IdentitySwimlane.vue
@@ -0,0 +1,80 @@
+<template>
+  <div class="space-y-2">
+    <div class="flex items-center justify-between">
+      <h3 class="text-sm font-semibold text-gray-300">身分泳道圖 V2</h3>
+      <span class="text-xs text-gray-500">{{ identities.length }} identities</span>
+    </div>
+    <div class="relative overflow-x-auto" ref="scrollRef">
+      <svg :width="svgW" :height="rowH * identities.length + 30" class="block">
+        <!-- time axis -->
+        <line x1="80" :y1="rowH * identities.length + 5" :x2="svgW" :y2="rowH * identities.length + 5" stroke="#4b5563" stroke-width="1" />
+        <g v-for="t in ticks" :key="t">
+          <line :x1="xPos(t)" :y1="rowH * identities.length + 1" :x2="xPos(t)" :y2="rowH * identities.length + 5" stroke="#6b7280" stroke-width="1" />
+          <text :x="xPos(t)" :y="rowH * identities.length + 16" fill="#9ca3af" font-size="9" text-anchor="middle">{{ t }}s</text>
+        </g>
+        <!-- swimlanes -->
+        <g v-for="(ident, i) in identities" :key="ident.name">
+          <text x="4" :y="rowH * i + rowH / 2 + 5" fill="#d1d5db" font-size="11" class="select-none">{{ ident.name }}</text>
+          <rect x="78" :y="rowH * i + 4" width="2" :height="rowH - 8" fill="#374151" rx="2" />
+          <rect
+            v-for="seg in ident.segments" :key="seg.start"
+            :x="xPos(seg.start)" :y="rowH * i + 6"
+            :width="Math.max(2, xPos(seg.end) - xPos(seg.start))"
+            :height="rowH - 12"
+            :fill="ident.color"
+            :opacity="0.7"
+            rx="3"
+            class="cursor-pointer hover:opacity-100"
+            @click="$emit('selectTrace', seg.trace_id)"
+          />
+        </g>
+      </svg>
+    </div>
+  </div>
+</template>
+
+<script setup lang="ts">
+import { computed } from 'vue'
+
+const props = defineProps<{
+  identities: SwimlaneIdentity[]
+  totalDuration: number
+}>()
+
+defineEmits<{ selectTrace: [traceId: number] }>()
+
+export interface SwimlaneSegment {  // one coloured bar inside a lane
+  trace_id: number  // emitted through `selectTrace` when the bar is clicked
+  start: number  // passed to xPos(); presumably seconds, matching the "s" axis labels (verify against the caller)
+  end: number  // passed to xPos(); bars are drawn at least 2px wide
+  face_count: number  // not read anywhere in this component
+}
+// One lane of the chart.
+export interface SwimlaneIdentity {
+  name: string  // lane label; also used as the v-for key
+  color: string  // fill colour of every segment in the lane
+  segments: SwimlaneSegment[]
+}
+
+const rowH = 28
+const labelW = 80
+const padR = 20
+
+// SVG width in px: label column plus duration / 8, never below 500; a missing or zero duration counts as 6000.
+const svgW = computed(
+  () => Math.max(500, labelW + (props.totalDuration || 6000) / 8)
+)
+
+function xPos(sec: number): number {  // time value -> x pixel between the label column and the right padding
+  const plotW = svgW.value - labelW - padR
+  return labelW + (sec / (props.totalDuration || 6000)) * plotW
+}
+
+// Axis tick values: start at 0 and advance by a multiple of 30 (at least 30, about a sixth of the duration) up to the duration.
+const ticks = computed(() => {
+  const total = props.totalDuration || 6000
+  const marks: number[] = []
+  for (let at = 0, gap = Math.max(30, Math.round(total / 6 / 30) * 30); at <= total; at += gap) marks.push(at)
+  return marks
+})
+</script>
diff --git a/portal/src/components/ServiceStatusCard.vue b/portal/src/components/ServiceStatusCard.vue
new file mode 100644
index 0000000..4195d2a
--- /dev/null
+++ b/portal/src/components/ServiceStatusCard.vue
@@ -0,0 +1,33 @@
+<template>
+  <div :class="['rounded-lg p-3 border', bgColor]">
+    <div class="flex items-center justify-between">
+      <span class="font-semibold">{{ name }}</span>
+      <span :class="statusColor">{{ status === 'ok' ? '●' : '○' }}</span>
+    </div>
+    <div v-if="latency != null" class="text-xs text-gray-400 mt-1">{{ latency }}ms</div> <!-- 0 ms is a valid reading; hide only when no latency was given -->
+    <div v-if="error" class="text-xs text-red-400 mt-1 truncate">{{ error }}</div>
+  </div>
+</template>
+
+<script setup lang="ts">
+import { computed } from 'vue'
+
+const props = defineProps<{
+  name?: string
+  status?: string
+  latency?: number | null
+  error?: string | null
+}>()
+
+// Text colour class of the status dot: green for 'ok', yellow for 'degraded', red for anything else.
+const statusColor = computed(() =>
+  props.status === 'ok' ? 'text-green-400'
+    : props.status === 'degraded' ? 'text-yellow-400'
+    : 'text-red-400')
+
+// Card background/border classes: green for 'ok', yellow for 'degraded', red for anything else.
+const bgColor = computed(() =>
+  props.status === 'ok' ? 'bg-green-900/20 border-green-700'
+    : props.status === 'degraded' ? 'bg-yellow-900/20 border-yellow-700'
+    : 'bg-red-900/20 border-red-700')
+</script>
\ No newline at end of file
diff --git a/portal/src/components/SpaceTimeCube.vue b/portal/src/components/SpaceTimeCube.vue
new file mode 100644
index 0000000..a427ae1
--- /dev/null
+++ b/portal/src/components/SpaceTimeCube.vue
@@ -0,0 +1,354 @@
+<template>
+  <div class="bg-gray-800 rounded-lg p-6 border border-gray-700">
+    <h3 class="text-lg font-semibold mb-4 text-blue-400">V5: 3D Space-Time Cube</h3>
+    <div class="text-xs text-gray-500 mb-3 flex gap-2 items-center">
+      <span>X/Y = 畫面位置</span>
+      <span>Z = 深度（bbox 大小）</span>
+      <span>T = 時間</span>
+    </div>
+
+    <!-- Trace selector -->
+    <div class="flex gap-2 mb-3">
+      <select v-model="selectedTraceId"
+              class="bg-gray-700 text-white px-3 py-1.5 rounded text-sm flex-1">
+        <option :value="null" disabled>選擇 Trace</option>
+        <option v-for="t in traceOptions" :key="t.id"
+                :value="t.id">{{ t.label }}</option>
+      </select>
+      <button @click="loadData"
+              class="bg-blue-600 hover:bg-blue-500 text-white px-4 py-1.5 rounded text-sm"
+              :disabled="!selectedTraceId || loading">
+        {{ loading ? '載入中...' : '載入' }}
+      </button>
+    </div>
+
+    <div ref="container" class="w-full h-[400px] bg-gray-900 rounded-lg overflow-hidden"></div>
+
+    <div class="text-xs text-gray-500 mt-2 flex gap-4">
+      <span>🖱 拖曳旋轉</span>
+      <span>🔍 滾輪縮放</span>
+      <span v-if="faceCount">{{ faceCount }} 個檢測點</span>
+    </div>
+  </div>
+</template>
+
+<script setup lang="ts">
+import { ref, onMounted, onBeforeUnmount, computed, watch } from 'vue'
+import * as THREE from 'three'
+import { OrbitControls } from 'three/examples/jsm/controls/OrbitControls.js'
+import { httpFetch, getCurrentConfig } from '@/api/client'
+
+const props = defineProps<{
+  fileUuid: string
+  traces?: any[]
+  frameWidth?: number
+  frameHeight?: number
+}>()
+
+const container = ref<HTMLElement>()
+const selectedTraceId = ref<number | null>(null)
+const loading = ref(false)
+const faceCount = ref(0)
+
+// Dropdown entries built from the `traces` prop; the label shows id, face count and duration with one decimal.
+const traceOptions = computed(() =>
+  (props.traces || []).map((trace: any) => {
+    const seconds = (trace.duration_sec || 0).toFixed(1)
+    return { id: trace.trace_id, label: `#${trace.trace_id} (${trace.face_count} faces, ${seconds}s)` }
+  }))
+
+let renderer: THREE.WebGLRenderer | null = null
+let scene: THREE.Scene | null = null
+let camera: THREE.PerspectiveCamera | null = null
+let controls: OrbitControls | null = null
+let animId: number
+let objects: THREE.Object3D[] = []
+
+/** Tears down everything buildScene() created (observer, objects, controls, renderer, canvas) so it can safely run again. */
+function disposeScene() {
+  cancelAnimationFrame(animId)
+  // buildScene() attaches a new ResizeObserver on every call; stop the previous one instead of leaking it.
+  ;(container.value as any)?.__resizeObserver?.disconnect()
+  for (const obj of objects) {
+    scene?.remove(obj)
+    if (obj instanceof THREE.Mesh || obj instanceof THREE.Points || obj instanceof THREE.Line) {
+      obj.geometry?.dispose()
+      const mats = [(obj as any).material].flat()  // a single material or an array of them
+      mats.forEach((m: any) => m?.dispose())
+    }
+  }
+  objects = []
+  controls?.dispose()
+  controls = null
+  // Remove the old canvas too; otherwise every reload stacks another <canvas> inside the container.
+  renderer?.domElement.remove()
+  renderer?.dispose()
+  renderer = null
+  scene = null
+  camera = null
+}
+
+type FacePoint = {  // one face detection as consumed by buildScene()
+  frame: number  // from start_frame (0 when missing)
+  t: number  // from start_time (0 when missing); presumably seconds, verify against the API
+  x: number  // divided by the frame width in buildScene(), so expected in source-frame pixels
+  y: number  // divided by the frame height in buildScene(), so expected in source-frame pixels
+  w: number  // bbox width (1 when missing)
+  h: number  // bbox height (1 when missing)
+  z: number  // z_rel from the API, else an estimate derived from the bbox area share of the frame
+}
+
+/** Fetches the selected trace's faces (interpolate=true, limit=2000, dimension=3d) and rebuilds the scene from them. */
+function loadData() {
+  if (!selectedTraceId.value) return
+  loading.value = true
+
+  // Converts one API face record into a FacePoint; depth falls back to a bbox-area estimate when z_rel is absent.
+  const toPoint = (f: any, fw: number, fh: number): FacePoint => {
+    const w = f.width || 1
+    const h = f.height || 1
+    const areaShare = (w * h) / (fw * fh)
+    return {
+      frame: f.start_frame || 0,
+      t: f.start_time || 0,
+      x: f.x || 0,
+      y: f.y || 0,
+      w,
+      h,
+      z: f.z_rel ?? (1.0 - Math.min(areaShare * 50, 1.0))
+    }
+  }
+
+  const { api_base_url } = getCurrentConfig()
+  const url = `${api_base_url}/api/v1/file/${props.fileUuid}/trace/${selectedTraceId.value}/faces?interpolate=true&limit=2000&dimension=3d`
+  httpFetch(url)
+    .then((res: any) => {
+      const fw = props.frameWidth || 1920
+      const fh = props.frameHeight || 1080
+      const points: FacePoint[] = (res?.faces || []).map((f: any) => toPoint(f, fw, fh))
+      faceCount.value = points.length
+      buildScene(points)
+    })
+    .catch((err: any) => {
+      console.error('Failed to load trace faces:', err)
+    })
+    .finally(() => {
+      loading.value = false
+    })
+}
+
+/** Rebuilds the three.js scene (axes, cube frame, time-coloured points, trajectory line, grid) for the given face points. */
+function buildScene(points: FacePoint[]) {
+  if (!container.value) return
+  disposeScene()
+  // Normalize coordinates to [-1, 1] range
+  const fw = props.frameWidth || 1920
+  const fh = props.frameHeight || 1080
+  const maxT = points.reduce((m, p) => Math.max(m, p.t), 0) || 1  // largest timestamp; never 0, so p.t / maxT cannot become NaN
+
+  const vertexData = points.map(p => ({
+    x: (p.x / fw) * 2 - 1,
+    y: -((p.y / fh) * 2 - 1),
+    z: p.z * 2 - 1,
+    t: (p.t / maxT) * 2 - 1
+  }))
+
+  const rect = container.value.getBoundingClientRect()
+  const w = rect.width || 600, h = rect.height || 400
+
+  scene = new THREE.Scene()
+  scene.background = new THREE.Color(0x111827)
+
+  camera = new THREE.PerspectiveCamera(50, w / h, 0.1, 10)
+  camera.position.set(2.5, 1.8, 3)
+  camera.lookAt(0, 0, 0)
+
+  renderer = new THREE.WebGLRenderer({ antialias: true })
+  renderer.setSize(w, h)
+  renderer.setPixelRatio(Math.min(window.devicePixelRatio, 2))
+  container.value.appendChild(renderer.domElement)
+
+  controls = new OrbitControls(camera, renderer.domElement)
+  controls.enableDamping = true
+  controls.dampingFactor = 0.08
+  controls.target.set(0, 0, 0)
+  controls.update()
+
+  // ---- Axis lines (coloured lines only; no text labels are drawn) ----
+  const axesLen = 1.2
+  const axesMat = (color: number) => new THREE.LineBasicMaterial({ color })
+
+  // X axis (red) — screen x
+  const xLine = new THREE.Line(
+    new THREE.BufferGeometry().setFromPoints([
+      new THREE.Vector3(-axesLen, -axesLen, -axesLen),
+      new THREE.Vector3(axesLen, -axesLen, -axesLen)
+    ]),
+    axesMat(0xff4444)
+  )
+  scene.add(xLine)
+  objects.push(xLine)
+
+  // Y axis (green) — screen y
+  const yLine = new THREE.Line(
+    new THREE.BufferGeometry().setFromPoints([
+      new THREE.Vector3(-axesLen, -axesLen, -axesLen),
+      new THREE.Vector3(-axesLen, axesLen, -axesLen)
+    ]),
+    axesMat(0x44ff44)
+  )
+  scene.add(yLine)
+  objects.push(yLine)
+
+  // Z axis (blue) — depth
+  const zLine = new THREE.Line(
+    new THREE.BufferGeometry().setFromPoints([
+      new THREE.Vector3(-axesLen, -axesLen, -axesLen),
+      new THREE.Vector3(-axesLen, -axesLen, axesLen)
+    ]),
+    axesMat(0x4488ff)
+  )
+  scene.add(zLine)
+  objects.push(zLine)
+
+  // T axis (yellow) — time (at an angle for 3D effect)
+  const tLine = new THREE.Line(
+    new THREE.BufferGeometry().setFromPoints([
+      new THREE.Vector3(-axesLen, -axesLen, -axesLen),
+      new THREE.Vector3(axesLen, axesLen, axesLen)
+    ]),
+    axesMat(0xffdd44)
+  )
+  scene.add(tLine)
+  objects.push(tLine)
+
+  // ---- Cube wireframe ----
+  const cubeSize = axesLen * 2
+  const cubeGeo = new THREE.BoxGeometry(cubeSize, cubeSize, cubeSize)
+  const cubeWire = new THREE.LineSegments(
+    new THREE.EdgesGeometry(cubeGeo),
+    new THREE.LineBasicMaterial({ color: 0x444466, transparent: true, opacity: 0.3 })
+  )
+  cubeWire.position.set(0, 0, 0)
+  scene.add(cubeWire)
+  objects.push(cubeWire)
+
+  // ---- Points: color by time (t) ----
+  if (vertexData.length > 0) {
+    const positions = new Float32Array(vertexData.length * 3)
+    const colors = new Float32Array(vertexData.length * 3)
+    const color = new THREE.Color()
+
+    for (let i = 0; i < vertexData.length; i++) {
+      const p = vertexData[i]
+      // Position: screen x/y, with normalized time on the scene's z axis; the depth value p.z is currently not used
+      positions[i * 3] = p.x
+      positions[i * 3 + 1] = p.y
+      positions[i * 3 + 2] = p.t * 0.5  // compress time a bit
+
+      // Color gradient: blue (early) → cyan → yellow → red (late)
+      const tNorm = (p.t + 1) / 2  // 0..1
+      color.setHSL(0.6 - tNorm * 0.6, 0.9, 0.5)
+      colors[i * 3] = color.r
+      colors[i * 3 + 1] = color.g
+      colors[i * 3 + 2] = color.b
+    }
+
+    const ptGeo = new THREE.BufferGeometry()
+    ptGeo.setAttribute('position', new THREE.BufferAttribute(positions, 3))
+    ptGeo.setAttribute('color', new THREE.BufferAttribute(colors, 3))
+
+    const ptMat = new THREE.PointsMaterial({
+      size: 0.03,
+      vertexColors: true,
+      transparent: true,
+      opacity: 0.8,
+      sizeAttenuation: true
+    })
+    const pointsObj = new THREE.Points(ptGeo, ptMat)
+    scene.add(pointsObj)
+    objects.push(pointsObj)
+
+    // ---- Trajectory line (same coordinates as the points, joined in input order) ----
+    const linePositions = new Float32Array(vertexData.length * 3)
+    for (let i = 0; i < vertexData.length; i++) {
+      const p = vertexData[i]
+      linePositions[i * 3] = p.x
+      linePositions[i * 3 + 1] = p.y
+      linePositions[i * 3 + 2] = p.t * 0.5
+    }
+    const lineGeo = new THREE.BufferGeometry()
+    lineGeo.setAttribute('position', new THREE.BufferAttribute(linePositions, 3))
+    const lineMat = new THREE.LineBasicMaterial({
+      color: 0x88ccff,
+      transparent: true,
+      opacity: 0.35
+    })
+    const line = new THREE.Line(lineGeo, lineMat)
+    scene.add(line)
+    objects.push(line)
+  }
+
+  // ---- Lights ----
+  const ambient = new THREE.AmbientLight(0x404060)
+  scene.add(ambient)
+  const dir = new THREE.DirectionalLight(0xffffff, 0.8)
+  dir.position.set(1, 2, 1)
+  scene.add(dir)
+
+  // ---- Grid helper (subtle) ----
+  const gridHelper = new THREE.GridHelper(2.5, 10, 0x444466, 0x333355)
+  gridHelper.position.y = -axesLen - 0.05
+  scene.add(gridHelper)
+  objects.push(gridHelper)
+
+  // Resize: keep the renderer size and camera aspect in sync with the container
+  const resizeObserver = new ResizeObserver(() => {
+    if (!container.value || !renderer || !camera) return
+    const r = container.value.getBoundingClientRect()
+    const rw = r.width || 600, rh = r.height || 400
+    renderer.setSize(rw, rh)
+    camera.aspect = rw / rh
+    camera.updateProjectionMatrix()
+  })
+  resizeObserver.observe(container.value)
+  ;(container.value as any).__resizeObserver = resizeObserver
+
+  animate()
+
+  // NOTE(review): fetches an arbitrary URL taken from the `_callback` query parameter (demo-runner hook); restrict or remove before production use
+  const cb = new URLSearchParams(window.location.search).get("_callback")
+  if (cb) {
+    fetch(cb, { mode: "no-cors" }).catch(() => {})
+  }
+}
+
+function animate() {  // render loop: re-schedules itself on every animation frame
+  animId = requestAnimationFrame(animate)  // id is kept so cancelAnimationFrame() can stop the loop
+  controls?.update()
+  if (renderer && scene && camera) renderer.render(scene, camera)  // skip drawing once the scene has been disposed
+}
+
+onMounted(() => {
+  tryAutoLoad()
+})
+// Re-check when the `traces` prop is replaced (shallow watch: in-place mutations of the array are not observed).
+watch(() => props.traces, () => {
+  tryAutoLoad()
+}, { deep: false })
+
+function tryAutoLoad() {  // selects and loads the first trace when traces exist and nothing is selected or loading yet
+  const busy = Boolean(selectedTraceId.value) || loading.value
+  if (busy || !props.traces?.length) return
+  selectedTraceId.value = props.traces[0].trace_id
+  loadData()
+}
+
+onBeforeUnmount(() => {  // stop the render loop, the resize observer and release the three.js resources
+  cancelAnimationFrame(animId)
+  if ((container.value as any)?.__resizeObserver) {  // observer that buildScene() stored on the container element
+    (container.value as any).__resizeObserver.disconnect()
+  }
+  disposeScene()
+})
+</script>
\ No newline at end of file
diff --git a/portal/src/components/TraceDurationHistogram.vue b/portal/src/components/TraceDurationHistogram.vue
new file mode 100644
index 0000000..4a49710
--- /dev/null
+++ b/portal/src/components/TraceDurationHistogram.vue
@@ -0,0 +1,41 @@
+<template>
+  <div class="space-y-2">
+    <div class="flex items-center justify-between">
+      <h3 class="text-sm font-semibold text-gray-300">持續時間分布圖 V3</h3>
+      <span class="text-xs text-gray-500">{{ traces.length }} traces</span>
+    </div>
+    <div class="bg-gray-900 rounded p-4" v-if="bars.length">
+      <svg :width="barW * bars.length + 4" :height="maxH + 30" class="block">
+        <g v-for="(b, i) in bars" :key="i">
+          <rect :x="i * barW + 2" :y="maxH - b.h" :width="barW - 4" :height="b.h" fill="#4488ff" :opacity="0.6 + 0.4 * b.r" rx="2" />
+          <text :x="i * barW + barW / 2" :y="maxH - b.h - 4" fill="#9ca3af" font-size="9" text-anchor="middle" v-if="b.c > 0">{{ b.c }}</text>
+          <text :x="i * barW + barW / 2" :y="maxH + 16" fill="#6b7280" font-size="8" text-anchor="middle">{{ b.l }}</text>
+        </g>
+      </svg>
+    </div>
+    <div v-else class="text-center text-gray-500 text-sm py-8">no data</div>
+  </div>
+</template>
+
+<script setup lang="ts">
+import { computed } from 'vue'
+
+const props = defineProps<{ traces: any[] }>()  // trace records; only `duration_sec` is read here
+const barW = 44  // horizontal slot per bar in SVG units (the rect is drawn 4 units narrower)
+const maxBars = 20  // target bin count used to derive the bin width
+const maxH = 200  // height of the tallest bar in SVG units
+
+const bars = computed(() => {  // Histogram bins over the positive `duration_sec` values; [] when there are none.
+  const d = props.traces.map((t: any) => t.duration_sec).filter((x: number) => x > 0)
+  if (!d.length) return []
+  const mx = Math.ceil(Math.max(...d))
+  const st = Math.max(1, Math.ceil(mx / maxBars))  // whole-number bin width, at least 1
+  const bins: { l: string; c: number; r: number; h: number }[] = []  // l = label, c = count, r = count / max count, h = bar height
+  for (let s = 0; s <= mx; s += st) {  // `<=` (not `<`) so a value exactly equal to mx still falls inside a bin
+    bins.push({ l: `${s}-${s + st}s`, c: d.filter((x: number) => x >= s && x < s + st).length, r: 0, h: 0 })
+  }
+  const mc = Math.max(...bins.map(b => b.c), 1)
+  bins.forEach(b => { b.r = b.c / mc; b.h = Math.max(4, b.r * maxH) })  // empty bins still get a 4-unit stub
+  return bins
+})
+</script>
diff --git a/portal/src/components/TraceSimilarityMatrix.vue b/portal/src/components/TraceSimilarityMatrix.vue
new file mode 100644
index 0000000..5ae7a96
--- /dev/null
+++ b/portal/src/components/TraceSimilarityMatrix.vue
@@ -0,0 +1,63 @@
+<template>
+  <div class="space-y-2">
+    <div class="flex items-center justify-between">
+      <h3 class="text-sm font-semibold text-gray-300">相似度矩陣 V4</h3>
+      <span class="text-xs text-gray-500">{{ traces.length }} traces</span>
+    </div>
+    <div class="bg-gray-900 rounded p-4 overflow-x-auto" v-if="matrix.length">
+      <svg :width="cellS * matrix.length + 60" :height="cellS * matrix.length + 40" class="block">
+        <!-- labels -->
+        <text v-for="(_, i) in matrix" :key="'l'+i"
+          :x="cellS * i + cellS / 2 + 50" :y="14" fill="#9ca3af" font-size="7" text-anchor="end"
+          transform="rotate(-60, 10, 10)">{{ traces[i]?.trace_id }}</text>
+        <text v-for="(_, i) in matrix" :key="'r'+i"
+          :x="44" :y="cellS * i + cellS / 2 + 24" fill="#9ca3af" font-size="7">{{ traces[i]?.trace_id }}</text>
+        <!-- cells -->
+        <g v-for="(row, i) in matrix" :key="i">
+          <rect v-for="(v, j) in row" :key="j"
+            :x="cellS * j + 50" :y="cellS * i + 20"
+            :width="cellS" :height="cellS"
+            :fill="color(v)" stroke="#374151" stroke-width="0.5" />
+        </g>
+      </svg>
+    </div>
+    <div v-else class="text-center text-gray-500 text-sm py-8">no data</div>
+  </div>
+</template>
+
+<script setup lang="ts">
+import { computed } from 'vue'
+
+const props = defineProps<{ traces: any[] }>()  // trace records; `trace_id`, `duration_sec` and `face_count` are read
+const cellS = 14  // edge length of one matrix cell in SVG units
+const maxN = 40  // only the first maxN traces are compared
+
+const matrix = computed(() => {  // Pairwise similarity matrix for the first `maxN` traces; [] with fewer than two.
+  const t = props.traces.slice(0, maxN)
+  if (t.length < 2) return []
+  const durs = t.map(x => x.duration_sec || 0)  // a missing value counts as 0
+  const cnt = t.map(x => x.face_count || 0)
+  const maxDur = Math.max(...durs, 1)  // the extra 1 keeps the divisors below from being 0
+  const maxCnt = Math.max(...cnt, 1)
+  const m: number[][] = []
+  for (let i = 0; i < t.length; i++) {
+    const row: number[] = []
+    for (let j = 0; j < t.length; j++) {
+      if (i === j) { row.push(1); continue }  // the diagonal is fixed at 1
+      // Simple similarity: duration + face_count proximity
+      const durSim = 1 - Math.abs(durs[i] - durs[j]) / maxDur
+      const cntSim = 1 - Math.abs(cnt[i] - cnt[j]) / maxCnt
+      row.push((durSim + cntSim) / 2)  // mean of the two proximity scores
+    }
+    m.push(row)
+  }
+  return m
+})
+
+function color(v: number): string {
+  // Brighter green means more similar; a score at or below 0.5 (or NaN) gets the dark fill.
+  return v > 0.85 ? 'rgba(68, 255, 68, 0.8)'
+    : v > 0.7 ? 'rgba(68, 200, 68, 0.6)'
+    : v > 0.5 ? 'rgba(100, 100, 100, 0.4)' : 'rgba(40, 40, 50, 0.3)'
+}
+</script>
diff --git a/portal/src/components/TraceThumbnailTimeline.vue b/portal/src/components/TraceThumbnailTimeline.vue
new file mode 100644
index 0000000..f38dc7f
--- /dev/null
+++ b/portal/src/components/TraceThumbnailTimeline.vue
@@ -0,0 +1,86 @@
+<template>
+  <div class="space-y-2">
+    <div class="flex items-center justify-between">
+      <h3 class="text-sm font-semibold text-gray-300">臉孔縮圖時間軸 V1</h3>
+      <span class="text-xs text-gray-500">{{ traces.length }} traces</span>
+    </div>
+    <div class="relative overflow-x-auto py-4" ref="scrollRef">
+      <svg :width="svgW" :height="80" class="block">
+        <!-- time axis -->
+        <line x1="0" y1="70" :x2="svgW" y2="70" stroke="#4b5563" stroke-width="1" />
+        <!-- time ticks -->
+        <g v-for="t in ticks" :key="t">
+          <line :x1="xPos(t)" y1="66" :x2="xPos(t)" y2="70" stroke="#6b7280" stroke-width="1" />
+          <text :x="xPos(t)" y="78" fill="#9ca3af" font-size="9" text-anchor="middle">{{ t }}s</text>
+        </g>
+        <!-- trace thumbnails -->
+        <g v-for="(tr, idx) in topTraces" :key="tr.trace_id">
+          <image
+            :x="thumbX(tr, idx)" :y="thumbY(idx)"
+            :width="thumbSize" :height="thumbSize"
+            :href="thumbUrl(tr)"
+            preserveAspectRatio="xMidYMid slice"
+            class="cursor-pointer hover:opacity-80"
+            @click="$emit('select', tr.trace_id)"
+          />
+          <text
+            :x="thumbX(tr, idx) + thumbSize / 2" :y="thumbY(idx) + thumbSize + 10"
+            fill="#9ca3af" font-size="8" text-anchor="middle"
+          >#{{ tr.trace_id }}</text>
+        </g>
+      </svg>
+    </div>
+  </div>
+</template>
+
+<script setup lang="ts">
+import { computed } from 'vue'
+import { getCurrentConfig } from '@/api/client'
+
+const props = defineProps<{
+  fileUuid: string  // file identifier interpolated into the thumbnail URL
+  traces: any[]  // trace records; trace_id, face_count, first_sec, last_sec and first_frame are read
+  totalDuration: number  // timeline length (presumably seconds); a falsy value falls back to 6000
+}>()
+
+defineEmits<{ select: [traceId: number] }>()  // fired with the trace_id when a thumbnail is clicked
+
+const config = getCurrentConfig()
+const thumbSize = 40  // thumbnail width and height in SVG units
+const maxTraces = 15  // upper bound on the number of thumbnails drawn
+const timelinePad = 60  // horizontal padding on each side of the axis
+
+const topTraces = computed(() =>  // The `maxTraces` traces with the most detections, largest first.
+  [...props.traces].sort((a, b) => (b.face_count || 0) - (a.face_count || 0)).slice(0, maxTraces)  // sort a copy (the prop is not mutated); a missing face_count sorts as 0 instead of yielding NaN
+)
+
+const svgW = computed(() => {  // SVG width: padding on both sides plus duration / 10, never below 600.
+  const dur = props.totalDuration || 6000  // falsy duration falls back to 6000
+  return Math.max(600, timelinePad * 2 + dur / 10)
+})
+
+function xPos(sec: number): number {  // Map a time offset to an x coordinate between the two paddings.
+  const dur = props.totalDuration || 6000  // same fallback as svgW
+  return timelinePad + (sec / dur) * (svgW.value - timelinePad * 2)  // linear interpolation across the padded width
+}
+
+function thumbY(_index: number): number {  // Stagger thumbnails over three rows by list index.
+  return 15 + (_index % 3) * (thumbSize + 8)  // NOTE(review): yields y = 15 / 63 / 111, but the template's <svg> is 80 tall with the axis at y = 70 - rows 1 and 2 look clipped; confirm
+}
+
+function thumbX(tr: any, _index: number): number {  // Left edge that centres the thumbnail on the trace's midpoint; `_index` is unused.
+  return xPos((tr.first_sec + tr.last_sec) / 2) - thumbSize / 2
+}
+
+function thumbUrl(tr: any): string {  // Thumbnail endpoint URL for the trace's first frame.
+  return `${config.api_base_url}/api/v1/file/${props.fileUuid}/thumbnail?frame=${tr.first_frame}`  // values are interpolated without URL-encoding
+}
+
+const ticks = computed(() => {  // Axis tick positions from 0 up to the duration.
+  const dur = props.totalDuration || 6000
+  const step = Math.max(30, Math.round(dur / 8 / 30) * 30)  // roughly eight ticks, step a multiple of 30 and at least 30
+  const tks: number[] = []
+  for (let t = 0; t <= dur; t += step) tks.push(t)
+  return tks
+})
+</script>
diff --git a/portal/src/test-setup.ts b/portal/src/test-setup.ts
new file mode 100644
index 0000000..57a3826
--- /dev/null
+++ b/portal/src/test-setup.ts
@@ -0,0 +1,16 @@
+import { vi } from 'vitest'
+
+const mockStorage = new Map<string, string>()  // backing store for the fake localStorage below
+
+Object.defineProperty(globalThis, 'localStorage', {  // install a Map-backed stand-in as globalThis.localStorage
+  value: {
+    getItem: (key: string) => mockStorage.get(key) ?? null,  // null for a missing key
+    setItem: (key: string, value: string) => mockStorage.set(key, String(value)),  // values are coerced to strings
+    removeItem: (key: string) => mockStorage.delete(key),
+    clear: () => mockStorage.clear(),
+    get length() { return mockStorage.size },
+    key: (index: number) => [...mockStorage.keys()][index] ?? null,  // keys in Map insertion order
+  },
+  configurable: true,
+  writable: true,
+})
diff --git a/portal/src/views/LoginView.test.ts b/portal/src/views/LoginView.test.ts
new file mode 100644
index 0000000..8717128
--- /dev/null
+++ b/portal/src/views/LoginView.test.ts
@@ -0,0 +1,184 @@
+import { describe, it, expect, vi, beforeEach } from 'vitest'
+import { mount } from '@vue/test-utils'
+import { nextTick } from 'vue'
+
+const mockPush = vi.fn()  // spy behind router.push
+const mockReplace = vi.fn()  // spy behind router.replace
+const mockUseRoute = vi.fn(() => ({  // default route: the login page with empty credentials in the query
+  query: { username: '', password: '' },
+  path: '/login',
+}))
+
+vi.mock('vue-router', () => ({  // NOTE(review): relies on this factory not running before the consts above are initialised - confirm
+  useRouter: () => ({ push: mockPush, replace: mockReplace }),
+  useRoute: mockUseRoute,
+}))
+
+const mockHttpFetch = vi.fn()  // each test decides how the login request resolves or rejects
+vi.mock('@/api/client', () => ({  // replace the API client with the spy and a fixed config
+  httpFetch: mockHttpFetch,
+  getCurrentConfig: () => ({
+    api_base_url: 'http://localhost:3003',
+    api_key: '',
+    timeout_secs: 30,
+  }),
+  saveConfig: vi.fn(),
+}))
+
+beforeEach(() => {  // Reset spies, storage and the route before every test.
+  vi.clearAllMocks()
+  localStorage.clear()
+  mockUseRoute.mockReturnValue({  // back to the empty-query login route
+    query: { username: '', password: '' },
+    path: '/login',
+  })
+})
+
+async function createWrapper() {  // Import LoginView on demand and mount it into document.body.
+  const { default: LoginView } = await import('./LoginView.vue')  // dynamic import, evaluated when the helper is called
+  return mount(LoginView, {
+    attachTo: document.body,
+  })
+}
+
+describe('LoginView', () => {  // Behavioural tests for the login form, driven through the mocked router and API client.
+  it('renders login form', async () => {  // static markup: title, both inputs, submit label
+    const wrapper = await createWrapper()
+    expect(wrapper.find('h1').text()).toBe('Momentry')
+    expect(wrapper.find('input[type="text"]').exists()).toBe(true)
+    expect(wrapper.find('input[type="password"]').exists()).toBe(true)
+    expect(wrapper.find('button[type="submit"]').text()).toBe('Login')
+  })
+
+  it('updates username and password on input', async () => {  // typed values end up in the DOM inputs
+    const wrapper = await createWrapper()
+    const usernameInput = wrapper.find('input[type="text"]')
+    const passwordInput = wrapper.find('input[type="password"]')
+
+    await usernameInput.setValue('demo')
+    await passwordInput.setValue('secret')
+
+    expect((usernameInput.element as HTMLInputElement).value).toBe('demo')
+    expect((passwordInput.element as HTMLInputElement).value).toBe('secret')
+  })
+
+  it('toggles password visibility', async () => {  // the type attribute flips password -> text -> password
+    const wrapper = await createWrapper()
+    const toggleBtn = wrapper.find('button[type="button"]')
+    const passwordInput = wrapper.find('input[type="password"]')  // looked up once; later assertions read the same element
+
+    expect(passwordInput.attributes('type')).toBe('password')
+    await toggleBtn.trigger('click')
+    expect(passwordInput.attributes('type')).toBe('text')
+    await toggleBtn.trigger('click')
+    expect(passwordInput.attributes('type')).toBe('password')
+  })
+
+  it('shows loading state on submit', async () => {  // submit button shows progress text and is disabled
+    mockHttpFetch.mockImplementation(() => new Promise(() => {}))  // never settles, so the request stays pending
+    const wrapper = await createWrapper()
+
+    await wrapper.find('input[type="text"]').setValue('demo')
+    await wrapper.find('input[type="password"]').setValue('demo')
+    await wrapper.find('form').trigger('submit.prevent')
+    await nextTick()
+
+    expect(wrapper.find('button[type="submit"]').text()).toBe('Logging in...')
+    expect(wrapper.find('button[type="submit"]').attributes('disabled')).toBeDefined()
+  })
+
+  it('shows error on login failure with message', async () => {  // the response's message is rendered
+    mockHttpFetch.mockResolvedValue({ success: false, message: 'Account disabled' })
+    const wrapper = await createWrapper()
+
+    await wrapper.find('input[type="text"]').setValue('demo')
+    await wrapper.find('input[type="password"]').setValue('demo')
+    await wrapper.find('form').trigger('submit.prevent')
+    await nextTick()
+
+    expect(wrapper.text()).toContain('Account disabled')
+  })
+
+  it('shows generic error for 401', async () => {  // a rejection mentioning 401 maps to the credentials message
+    mockHttpFetch.mockRejectedValue(new Error('401 Unauthorized'))
+    const wrapper = await createWrapper()
+
+    await wrapper.find('input[type="text"]').setValue('bad')
+    await wrapper.find('input[type="password"]').setValue('creds')
+    await wrapper.find('form').trigger('submit.prevent')
+    await nextTick()
+
+    expect(wrapper.text()).toContain('Invalid username or password')
+  })
+
+  it('shows connection error on network failure', async () => {  // any other rejection maps to the connection message
+    mockHttpFetch.mockRejectedValue(new Error('NetworkError'))
+    const wrapper = await createWrapper()
+
+    await wrapper.find('input[type="text"]').setValue('demo')
+    await wrapper.find('input[type="password"]').setValue('demo')
+    await wrapper.find('form').trigger('submit.prevent')
+    await nextTick()
+
+    expect(wrapper.text()).toContain('Connection error')
+  })
+
+  it('redirects on successful login', async () => {  // user and API key are persisted, then navigation goes to /home
+    mockHttpFetch.mockResolvedValue({
+      success: true,
+      api_key: 'test_key_123',
+      user: { name: 'demo', role: 'admin' },
+    })
+    const wrapper = await createWrapper()
+
+    await wrapper.find('input[type="text"]').setValue('admin')
+    await wrapper.find('input[type="password"]').setValue('admin')
+    await wrapper.find('form').trigger('submit.prevent')
+    await nextTick()
+
+    expect(localStorage.getItem('momentry_user')).toBe(
+      JSON.stringify({ name: 'demo', role: 'admin' }),
+    )
+    expect(localStorage.getItem('momentry_api_key')).toBe('test_key_123')
+    expect(mockPush).toHaveBeenCalledWith('/home')
+  })
+
+  it('redirects to original redirect path after login', async () => {  // the `redirect` query value wins over /home
+    mockUseRoute.mockReturnValue({
+      query: { redirect: '/search?q=test' },
+      path: '/login',
+    })
+    mockHttpFetch.mockResolvedValue({
+      success: true,
+      api_key: 'key',
+      user: { name: 'demo' },
+    })
+    const wrapper = await createWrapper()
+
+    await wrapper.find('input[type="text"]').setValue('demo')
+    await wrapper.find('input[type="password"]').setValue('demo')
+    await wrapper.find('form').trigger('submit.prevent')
+    await nextTick()
+
+    expect(mockPush).toHaveBeenCalledWith('/search?q=test')
+  })
+
+  it('auto-submits when query params are present', async () => {  // credentials in the query trigger a login without interaction
+    mockUseRoute.mockReturnValue({
+      query: { username: 'auto', password: 'login' },
+      path: '/login',
+    })
+    mockHttpFetch.mockResolvedValue({
+      success: true,
+      api_key: 'auto_key',
+      user: { name: 'auto_user' },
+    })
+
+    await createWrapper()
+    await nextTick()  // two ticks are awaited before asserting on the request and the stored key
+    await nextTick()
+
+    expect(mockHttpFetch).toHaveBeenCalled()
+    expect(localStorage.getItem('momentry_api_key')).toBe('auto_key')
+  })
+})
diff --git a/portal/src/views/NotFoundView.vue b/portal/src/views/NotFoundView.vue
new file mode 100644
index 0000000..df26672
--- /dev/null
+++ b/portal/src/views/NotFoundView.vue
@@ -0,0 +1,11 @@
+<template>
+  <div class="flex flex-col items-center justify-center min-h-[60vh] text-center">
+    <div class="text-8xl font-bold text-gray-600 mb-4">404</div>
+    <h2 class="text-2xl font-semibold text-gray-300 mb-2">頁面不存在</h2>
+    <p class="text-gray-500 mb-8">您要尋找的頁面不存在或已被移除</p>
+    <router-link to="/home"
+      class="bg-blue-600 hover:bg-blue-500 text-white px-6 py-2 rounded-lg transition">
+      回到首頁
+    </router-link>
+  </div>
+</template>
\ No newline at end of file
diff --git a/portal/src/views/PipelineProgressView.vue b/portal/src/views/PipelineProgressView.vue
new file mode 100644
index 0000000..a3d57d1
--- /dev/null
+++ b/portal/src/views/PipelineProgressView.vue
@@ -0,0 +1,370 @@
+<template>
+  <div class="min-h-screen bg-gray-900 text-gray-100 p-6">
+
+    <div v-if="loading" class="text-center py-12"><p class="text-gray-400">載入中...</p></div>
+    <div v-else-if="error" class="bg-red-900/50 border border-red-700 rounded p-4 mb-4">
+      <p class="text-red-300">{{ error }}</p>
+    </div>
+
+    <div v-else>
+      <!-- ═══ 頂部：標題 + 篩選 + 搜尋 ═══ -->
+      <div class="flex flex-wrap items-center justify-between mb-4 gap-3">
+        <h1 class="text-2xl font-bold">📋 檔案歷程</h1>
+        <div class="flex items-center gap-2">
+          <!-- 狀態篩選 -->
+          <button v-for="f in filterOptions" :key="f.key"
+            @click="activeFilter = f.key"
+            class="px-3 py-1 rounded text-sm transition"
+            :class="activeFilter === f.key ? 'bg-blue-700 text-white' : 'bg-gray-700 text-gray-300 hover:bg-gray-600'">
+            {{ f.label }}
+          </button>
+          <!-- 搜尋 -->
+          <input v-model="searchQuery" placeholder="搜尋 UUID 或檔名..."
+            class="bg-gray-700 border border-gray-600 rounded px-3 py-1.5 text-sm w-48 focus:border-blue-500 outline-none" />
+        </div>
+      </div>
+
+      <!-- ═══ Job 清單（摺疊） ═══ -->
+      <div class="bg-gray-800 rounded-lg mb-4 overflow-hidden">
+        <table class="w-full text-sm">
+          <thead>
+            <tr class="text-gray-400 border-b border-gray-700 text-xs">
+              <th class="text-left py-2 px-3 w-12">#</th>
+              <th class="text-left py-2">檔案名稱</th>
+              <th class="text-left py-2 w-16">狀態</th>
+              <th class="text-left py-2 w-20">時間</th>
+              <th class="text-left py-2 w-16">進度</th>
+              <th class="text-left py-2 w-12"></th>
+            </tr>
+          </thead>
+          <tbody>
+            <tr v-for="job in filteredJobs" :key="job.id"
+              @click="selectedId = job.id"
+              class="border-b border-gray-700/30 cursor-pointer transition"
+              :class="selectedId === job.id ? 'bg-blue-900/30' : 'hover:bg-gray-700/30'">
+              <td class="py-2 px-3 font-mono text-xs text-gray-500">{{ job.id }}</td>
+              <td class="py-2 truncate max-w-64">{{ job.file_name || '未知' }}</td>
+              <td class="py-2"><span :class="statusBadge(job.status)" class="px-2 py-0.5 rounded text-xs">{{ job.status }}</span></td>
+              <td class="py-2 font-mono text-xs text-gray-400">{{ job.createdAt || '-' }}</td>
+              <td class="py-2">{{ completedCount(job) }}/{{ job.processorList?.length || 0 }}</td>
+              <td class="py-2 text-xs text-gray-500">{{ selectedId === job.id ? '◀' : '▶' }}</td>
+            </tr>
+          </tbody>
+        </table>
+      </div>
+
+      <!-- ═══ 選中的 Job 詳細資料 ═══ -->
+      <div v-if="selectedJob">
+        <!-- ① 檔案基本資料 -->
+        <div class="bg-gray-800 rounded-lg p-5 mb-4">
+          <div class="flex items-start justify-between mb-3">
+            <div>
+              <h2 class="text-xl font-semibold flex items-center gap-2">
+                {{ selectedJob.file_name || '未知檔案' }}
+                <span :class="statusBadge(selectedJob.status)" class="px-2 py-0.5 rounded text-xs">{{ selectedJob.status }}</span>
+              </h2>
+              <p class="text-gray-400 text-xs mt-1 font-mono">UUID: {{ selectedJob.uuid || '-' }}</p>
+            </div>
+            <div class="text-right text-xs text-gray-500">
+              <div>Job #{{ selectedJob.id }}</div>
+              <div v-if="selectedJob.metadata && selectedJob.metadata['duration']">{{ Math.round(selectedJob.metadata['duration']/60) }}min</div>
+            </div>
+          </div>
+
+          <div v-if="selectedJob.metadata" class="grid grid-cols-4 gap-3 text-sm bg-gray-900/50 rounded p-3 mb-3">
+            <div><span class="text-gray-500">長度</span><br>{{ selectedJob.metadata['duration'] ? Math.round(selectedJob.metadata['duration']) + 's' : '-' }}</div>
+            <div><span class="text-gray-500">解析度</span><br>{{ selectedJob.metadata['width'] || '?' }}x{{ selectedJob.metadata['height'] || '?' }}</div>
+            <div><span class="text-gray-500">FPS</span><br>{{ selectedJob.metadata['fps'] || '?' }}</div>
+            <div><span class="text-gray-500">總幀數</span><br>{{ selectedJob.metadata['total_frames'] || '?' }}</div>
+          </div>
+
+          <div class="flex gap-2 flex-wrap mb-3" v-if="selectedJob.uuid">
+            <a :href="baseURL + '/api/v1/file/' + selectedJob.uuid + '/video'" target="_blank" class="px-3 py-1 bg-blue-700 hover:bg-blue-600 rounded text-xs">🎬 串流</a>
+            <a :href="baseURL + '/api/v1/file/' + selectedJob.uuid + '/thumbnail?frame=0'" target="_blank" class="px-3 py-1 bg-green-700 hover:bg-green-600 rounded text-xs">🖼️ 縮圖</a>
+            <router-link :to="'/search?uuid=' + selectedJob.uuid" class="px-3 py-1 bg-purple-700 hover:bg-purple-600 rounded text-xs">🔍 搜尋</router-link>
+          </div>
+
+          <!-- ② 時間軸 -->
+          <div v-if="selectedJob.timeline && selectedJob.timeline.length" class="mb-4">
+            <h3 class="text-sm font-semibold text-gray-300 mb-2">⏱️ 處理時間軸</h3>
+            <div class="relative h-8 bg-gray-900 rounded overflow-hidden">
+              <div v-for="(seg, i) in selectedJob.timeline" :key="i"
+                   :title="seg.label + ': ' + seg.duration"
+                   class="absolute h-full flex items-center justify-center text-xs font-bold text-white truncate"
+                   :style="{ left: seg.left + '%', width: seg.width + '%', background: seg.color }">
+                {{ seg.width > 8 ? seg.label : '' }}
+              </div>
+            </div>
+            <div class="flex gap-3 mt-1 text-xs text-gray-500 flex-wrap">
+              <span v-for="(seg, i) in selectedJob.timeline" :key="'l'+i"><span :style="{ color: seg.color }">●</span> {{ seg.label }} ({{ seg.duration }})</span>
+            </div>
+          </div>
+
+          <!-- ③ Processors -->
+          <table class="w-full text-sm mb-3">
+            <thead>
+              <tr class="text-gray-400 border-b border-gray-700">
+                <th class="text-left py-2 w-20">Proc</th>
+                <th class="text-left py-2 w-10">St</th>
+                <th class="text-left py-2 w-14">Start</th>
+                <th class="text-left py-2 w-14">End</th>
+                <th class="text-left py-2 w-16">耗時</th>
+                <th class="text-right py-2">已產出</th>
+                <th class="text-right py-2">已處理</th>
+              </tr>
+            </thead>
+            <tbody>
+              <tr v-for="p in selectedJob.processorList" :key="p.name" class="border-b border-gray-700/50 hover:bg-gray-700/30">
+                <td class="py-1.5 font-mono text-sm">{{ p.name }}</td>
+                <td class="py-1.5">{{ statusIcon(p.status) }}</td>
+                <td class="py-1.5 font-mono text-xs text-gray-400">{{ p.start }}</td>
+                <td class="py-1.5 font-mono text-xs text-gray-400">{{ p.end }}</td>
+                <td class="py-1.5 font-mono text-xs text-gray-400">{{ p.duration || '-' }}</td>
+                <td class="py-1.5 text-right font-mono text-sm">{{ p.chunks ?? '-' }}</td>
+                <td class="py-1.5 text-right font-mono text-sm">{{ p.frames ?? '-' }}</td>
+              </tr>
+            </tbody>
+          </table>
+          <div class="text-xs text-gray-500 mb-3">已處理 {{ completedCount(selectedJob) }}/{{ selectedJob.processorList?.length || 0 }}</div>
+
+          <!-- ④ Post-Processing -->
+          <div v-if="selectedJob.postProcessing" class="mb-4">
+            <h3 class="text-sm font-semibold text-gray-300 mb-2">⚙️ Post-Processing</h3>
+            <table class="w-full text-sm">
+              <thead>
+                <tr class="text-gray-400 border-b border-gray-700">
+                  <th class="text-left py-2">Stage</th>
+                  <th class="text-left py-2 w-10">St</th>
+                  <th class="text-right py-2 w-16">已產出</th>
+                  <th class="text-left py-2 pl-4">依賴進度狀態</th>
+                </tr>
+              </thead>
+              <tbody>
+                <tr v-for="pp in selectedJob.postProcessing" :key="pp.stage" class="border-b border-gray-700/50 hover:bg-gray-700/30">
+                  <td class="py-1.5 text-sm">{{ pp.stage }}</td>
+                  <td class="py-1.5">{{ statusIcon(pp.status) }}</td>
+                  <td class="py-1.5 text-right font-mono text-xs text-gray-400">{{ pp.output || '-' }}</td>
+                  <td class="py-1.5 pl-4 font-mono text-xs text-gray-400">{{ pp.deps }}</td>
+                </tr>
+              </tbody>
+            </table>
+          </div>
+
+          <!-- ⑤ Resources -->
+          <div v-if="selectedJob.processorList.some(p => p.version)" class="mb-2">
+            <h3 class="text-sm font-semibold text-gray-300 mb-2">🔧 Resources</h3>
+            <div class="grid grid-cols-2 sm:grid-cols-3 md:grid-cols-4 gap-2">
+              <div v-for="p in selectedJob.processorList.filter(p => p.version)" :key="p.name" class="bg-gray-900/50 rounded p-2 text-xs">
+                <div class="text-gray-400">{{ p.name }}</div>
+                <div class="font-mono text-gray-300 truncate">{{ p.version }}</div>
+              </div>
+            </div>
+          </div>
+        </div>
+      </div>
+
+      <!-- 無匹配 -->
+      <div v-if="filteredJobs.length === 0" class="text-center py-12 text-gray-500">無符合條件的檔案記錄</div>
+    </div>
+  </div>
+</template>
+
+<script setup lang="ts">
+import { ref, computed, onMounted, onUnmounted } from 'vue'
+import { httpFetch } from '@/api/client'
+
+interface ProcessorInfo {  // One row of the Processors table; start/end/duration are pre-formatted strings.
+  name: string; status: string; start: string; end: string; duration: string
+  chunks: number; frames: number; version: string
+}
+interface PostProcessInfo { stage: string; status: string; output: string; deps: string }  // one row of the Post-Processing table
+interface TimelineSeg { label: string; left: number; width: number; color: string; duration: string }  // left/width are rendered as percentages
+interface JobInfo {  // A job plus everything loadJobs() derives for display.
+  id: number; uuid: string; status: string; file_name: string; createdAt: string
+  metadata: any  // probe response for the file; loadJobs() leaves it null when no probe was fetched
+  timeline: TimelineSeg[]
+  processorList: ProcessorInfo[]
+  postProcessing: PostProcessInfo[]
+}
+
+const baseURL = (() => { try { return JSON.parse(localStorage.getItem('portal_config') || '{}')?.api_base_url } catch { return undefined } })() || 'http://127.0.0.1:3003'  // a malformed or `null` stored config falls back to the default instead of throwing during setup
+const loading = ref(true)  // true until the first loadJobs() call settles
+const error = ref('')  // non-empty text replaces the page body with an error box
+const jobs = ref<JobInfo[]>([])
+const activeFilter = ref('all')  // one of the filterOptions keys
+const searchQuery = ref('')
+const selectedId = ref<number | null>(null)  // id of the job shown in the detail panel
+let refreshTimer: ReturnType<typeof setInterval> | null = null  // polling handle, kept only while some job is running
+
+const filterOptions = [  // status filter buttons; `key` is compared against job.status ('all' disables the filter)
+  { key: 'all', label: 'All' },
+  { key: 'running', label: '⏳ Running' },
+  { key: 'completed', label: '✅ Completed' },
+  { key: 'failed', label: '❌ Failed' },
+]
+
+const filteredJobs = computed(() => {
+  // Jobs narrowed by the active status filter, then by the case-insensitive search text.
+  const wanted = activeFilter.value
+  const needle = searchQuery.value ? searchQuery.value.toLowerCase() : ''
+  // With neither filter active, hand back the underlying list itself.
+  if (wanted === 'all' && !needle) return jobs.value
+  // A field matches only when it is non-empty and contains the needle.
+  const contains = (text: string) => Boolean(text) && text.toLowerCase().includes(needle)
+  return jobs.value.filter(job => {
+    if (wanted !== 'all' && job.status !== wanted) return false
+    if (!needle) return true
+    return contains(job.file_name) || contains(job.uuid)
+  })
+})
+
+const selectedJob = computed(() => {  // The job whose id equals selectedId, or null when none matches.
+  return jobs.value.find(j => j.id === selectedId.value) || null  // searches the unfiltered list
+})
+
+const procColors: Record<string, string> = {  // timeline segment colour per processor name
+  cut: '#3b82f6', face: '#10b981', ocr: '#f59e0b',
+  pose: '#8b5cf6', yolo: '#ef4444', asr: '#06b6d4', asrx: '#ec4899'
+}
+
+function statusIcon(st: string): string {  // Emoji for a processor/stage status.
+  return ({ completed: '✅', running: '⏳', pending: '⬜', failed: '❌', skipped: '⏭️' })[st] || '⬜'  // unknown statuses render like pending
+}
+function statusBadge(st: string): string {  // CSS classes for a job status badge.
+  return ({
+    completed: 'bg-green-700 text-green-200', running: 'bg-blue-700 text-blue-200',
+    failed: 'bg-red-700 text-red-200'
+  })[st] || 'bg-gray-600 text-gray-300'  // any other status gets the neutral grey badge
+}
+function completedCount(job: JobInfo): number {  // Number of the job's processors whose status is 'completed'.
+  return job.processorList?.filter(p => p.status === 'completed').length || 0  // 0 when the list is missing
+}
+function formatTime(iso: string): string {  // Local HH:MM for a timestamp string; '-' when empty.
+  if (!iso) return '-'
+  const d = new Date(iso)
+  return Number.isNaN(d.getTime()) ? iso.substring(11, 16) : d.toTimeString().substring(0, 5)  // toTimeString() never throws (an unparseable date gives "Invalid Date"), so validity is tested explicitly before falling back to slicing the raw text
+}
+function formatDuration(secs: number): string {  // "42s" or "3m 5s"; '-' for missing, NaN or non-positive input.
+  if (!secs || secs <= 0) return '-'
+  const total = Math.round(secs)  // round once up front so the seconds part can never read "60s"
+  return total < 60 ? total + 's' : Math.floor(total / 60) + 'm ' + (total % 60) + 's'
+}
+function formatDateTime(iso: string): string {  // zh-TW "MM/DD HH:MM"-style text for a timestamp string; '-' when empty.
+  if (!iso) return '-'
+  const d = new Date(iso)
+  return Number.isNaN(d.getTime()) ? iso.substring(5, 16) : d.toLocaleString('zh-TW', { month: '2-digit', day: '2-digit', hour: '2-digit', minute: '2-digit' })  // an unparseable date formats as "Invalid Date" rather than throwing, so it is detected explicitly and the raw text is sliced instead
+}
+
+async function loadJobs() {  // Fetch the job list, expand the last 10 jobs with probe + progress data, and manage the polling timer.
+  try {
+    const resp: any = await httpFetch(`${baseURL}/api/v1/jobs`)
+    const rawJobs = resp?.jobs || []
+    const result: JobInfo[] = []
+
+    for (const j of (Array.isArray(rawJobs) ? rawJobs : []).slice(-10)) {  // only the last 10 entries are expanded
+      const jobId = j.id
+      const uuid = j.uuid || ''
+      let processors: ProcessorInfo[] = []
+      let postProcessing: PostProcessInfo[] = []
+      let fileName = ''
+      let fileMeta: Record<string, any> | null = null
+      let timeline: TimelineSeg[] = []
+
+      if (uuid) {
+        try {
+          // File probe: kept as the job's metadata and as a first source for the file name
+          const probe: any = await httpFetch(`${baseURL}/api/v1/file/${uuid}/probe`)
+          fileMeta = probe || null
+          fileName = probe?.file_name || fileName
+
+          // Progress: per-processor state; its file name takes precedence when present
+          const prog: any = await httpFetch(`${baseURL}/api/v1/progress/${uuid}`)
+          fileName = prog?.file_name || fileName
+
+          const procMap: Record<string, any> = {}
+          for (const p of (prog?.processors || [])) procMap[p.name] = p
+
+          const procOrder = ['cut', 'face', 'ocr', 'pose', 'yolo', 'asr', 'asrx']  // fixed display order; unreported processors show as pending
+          const parsed: { name: string; start: number; end: number; status: string }[] = []
+
+          for (const name of procOrder) {
+            const p = procMap[name] || { status: 'pending' }
+            const startStr = p.started_at || ''
+            const endStr = p.completed_at || ''
+            const startMs = startStr ? new Date(startStr).getTime() : 0
+            const endMs = endStr ? new Date(endStr).getTime() : (startMs || 0)
+            const dur = (endMs && endMs >= startMs) ? (endMs - startMs) / 1000 : 0  // 0 (shown as '-') until an end time exists
+
+            processors.push({
+              name, status: p.status,
+              start: formatTime(startStr),
+              end: formatTime(endStr),
+              duration: formatDuration(dur),
+              chunks: p.chunks_produced ?? 0,
+              frames: p.frames_processed ?? 0,
+              version: p.version || ''
+            })
+            if (startMs && startStr) {  // only processors that have started appear on the timeline
+              parsed.push({ name, start: startMs, end: (endStr && endMs) ? endMs : (p.status === 'running' ? Date.now() : startMs), status: p.status })  // a running processor without an end time extends to "now" (endMs alone falls back to startMs, which made the old `|| Date.now()` unreachable)
+            }
+          }
+
+          // Build timeline: each segment is positioned as a percentage of the overall start..end span
+          if (parsed.length > 0) {
+            const minT = Math.min(...parsed.map(p => p.start))
+            const maxT = Math.max(...parsed.map(p => p.end))
+            const range = maxT - minT || 1  // avoid dividing by 0 when everything shares one instant
+            for (const p of parsed) {
+              timeline.push({
+                label: p.name,
+                left: ((p.start - minT) / range) * 100,
+                width: Math.max(((p.end - p.start) / range) * 100, 3),  // at least 3% so short segments stay visible
+                color: procColors[p.name] || '#6b7280',
+                duration: formatDuration((p.end - p.start) / 1000)
+              })
+            }
+          }
+
+          // Post-processing rows: statuses are derived client-side from the processor states
+          const allDone = processors.every(p => p.status === 'completed')
+          const S = (n: string) => statusIcon(procMap[n]?.status || 'pending')
+          postProcessing = [
+            { stage: 'Rule 1 chunks', status: allDone ? 'running' : 'pending', output: '-', deps: `ASR${S('asr')} + ASRX${S('asrx')}` },
+            { stage: 'face_trace', status: allDone ? 'running' : 'pending', output: '-', deps: `cut${S('cut')} face${S('face')} ocr${S('ocr')} pose${S('pose')} yolo${S('yolo')} asr${S('asr')} asrx${S('asrx')}` },
+            { stage: 'Qdrant face sync', status: 'pending', output: '-', deps: 'face_trace⬜' },
+            { stage: 'Qdrant voice', status: 'pending', output: '-', deps: `ASRX${S('asrx')} (inline)` },
+            { stage: 'ANE vectorize', status: 'pending', output: '-', deps: 'Rule 1 chunks⬜' },
+            { stage: '5W1H Agent', status: 'pending', output: '-', deps: 'Rule 1⬜ + Rule 3⬜' },
+          ]
+        } catch (e) { console.warn(`skip ${uuid}:`, e) }  // best effort: the job is still listed with whatever was gathered
+      }
+
+      result.push({
+        id: jobId, uuid, status: j.status || 'unknown', file_name: fileName,
+        createdAt: j.created_at ? formatDateTime(j.created_at) : '',
+        metadata: fileMeta, timeline, processorList: processors, postProcessing
+      })
+    }
+    jobs.value = result.reverse()  // reverse() works in place, so `result` itself is now in display order
+    if (result.length > 0 && selectedId.value === null) {
+      selectedId.value = result[0].id  // default to the first row shown, i.e. the last job in the response
+    }
+
+    // Poll every 15 s while any job is running; stop once none is
+    const hasRunning = result.some(j => j.status === 'running')
+    if (hasRunning && !refreshTimer) {
+      refreshTimer = setInterval(loadJobs, 15000)
+    } else if (!hasRunning && refreshTimer) {
+      clearInterval(refreshTimer)
+      refreshTimer = null
+    }
+  } catch (e: any) {
+    error.value = e?.message || '載入失敗'
+  } finally {
+    loading.value = false
+  }
+}
+
+onMounted(loadJobs)  // initial load; loadJobs() itself starts and stops the 15 s polling timer
+onUnmounted(() => { if (refreshTimer) clearInterval(refreshTimer) })  // stop polling when the view is torn down
+</script>
diff --git a/portal/src/views/TraceDetailView.vue b/portal/src/views/TraceDetailView.vue
new file mode 100644
index 0000000..4f5dfc6
--- /dev/null
+++ b/portal/src/views/TraceDetailView.vue
@@ -0,0 +1,106 @@
+<template>
+  <div class="space-y-6">
+    <div class="flex items-center space-x-4">
+      <button @click="$router.back()" class="text-gray-400 hover:text-white text-lg">← 返回</button>
+      <h2 class="text-2xl font-bold">Trace #{{ traceId }}</h2>
+      <span class="text-gray-400 text-sm">{{ fileUuid?.substring(0, 12) }}...</span>
+    </div>
+
+    <div v-if="loading" class="text-center py-12"><div class="animate-spin rounded-full h-10 w-10 border-b-2 border-blue-500 mx-auto"></div></div>
+
+    <div v-else-if="trace" class="grid gap-6">
+      <!-- Summary -->
+      <div class="bg-gray-800 rounded-lg p-6 border border-gray-700 grid grid-cols-2 md:grid-cols-4 gap-4">
+        <div><span class="text-xs text-gray-500">DETECTIONS</span><p class="text-white text-lg font-semibold">{{ trace.face_count }}</p></div>
+        <div><span class="text-xs text-gray-500">DURATION</span><p class="text-white text-lg font-semibold">{{ trace.duration_sec?.toFixed(1) }}s</p></div>
+        <div><span class="text-xs text-gray-500">CONFIDENCE</span><p class="text-white text-lg font-semibold">{{ formatPercent(trace.avg_confidence) }}</p></div>
+        <div><span class="text-xs text-gray-500">TIME</span><p class="text-white text-lg font-semibold">{{ trace.first_sec?.toFixed(0) }}s - {{ trace.last_sec?.toFixed(0) }}s</p></div>
+      </div>
+
+      <!-- Video -->
+      <div class="bg-gray-800 rounded-lg border border-gray-700 overflow-hidden">
+        <video controls autoplay class="w-full" @error="videoError = true">
+          <source :src="videoUrl" type="video/mp4" />
+        </video>
+        <div v-if="videoError" class="p-4 text-center text-gray-500">Video unavailable</div>
+      </div>
+
+      <!-- Recent Faces -->
+      <div class="bg-gray-800 rounded-lg p-6 border border-gray-700">
+        <h3 class="text-lg font-semibold mb-4 text-blue-400">Recent Detections</h3>
+        <div class="grid grid-cols-4 sm:grid-cols-6 md:grid-cols-8 gap-2">
+          <div v-for="f in recentFaces" :key="f.id" class="bg-gray-900 rounded overflow-hidden">
+            <img :src="thumbUrl(f)" class="w-full aspect-square object-cover" loading="lazy" @error="e => (e.target as HTMLElement).style.display='none'" />
+            <div class="p-1 text-[9px] text-gray-400 truncate">#{{ f.start_frame }}<br/>{{ formatPercent(f.confidence) }}</div>
+          </div>
+        </div>
+      </div>
+    </div>
+
+    <!-- Fallback: the request failed or the trace id was not in the response -->
+    <div v-else class="text-center py-12 text-gray-500">{{ loadError || 'Trace not found' }}</div>
+  </div>
+</template>
+
+<script setup lang="ts">
+// Detail page for a single face trace: shows the trace summary, its video clip and
+// thumbnails of the first 40 face detections returned for the trace.
+import { ref, computed, onMounted } from 'vue'
+import { useRoute } from 'vue-router'
+import { getCurrentConfig, httpFetch } from '@/api/client'
+
+const route = useRoute()
+// Route params are read once during setup.
+const fileUuid = route.params.file_uuid as string
+const traceId = route.params.trace_id as string
+const config = getCurrentConfig()
+
+const trace = ref<any>(null)
+const faces = ref<any[]>([])
+const loading = ref(true)
+const videoError = ref(false)
+// Message for the fallback panel; stays empty unless a request failed before the trace was found
+const loadError = ref('')
+
+const videoUrl = computed(() =>
+  `${config.api_base_url}/api/v1/file/${fileUuid}/trace/${traceId}/video?padding=1`
+)
+
+const recentFaces = computed(() => faces.value.slice(0, 40))
+
+// Thumbnail endpoint URL for one detection, built from its frame number and bounding box fields.
+function thumbUrl(f: any): string {
+  return `${config.api_base_url}/api/v1/file/${fileUuid}/thumbnail?frame=${f.start_frame}&x=${f.x}&y=${f.y}&w=${f.width}&h=${f.height}`
+}
+
+// Formats a fraction as a whole-number percentage (value * 100); returns '-' when the value is
+// missing or not a finite number, so the page never renders "NaN%".
+function formatPercent(value: unknown): string {
+  const ratio = value == null ? NaN : Number(value)
+  return Number.isFinite(ratio) ? `${(ratio * 100).toFixed(0)}%` : '-'
+}
+
+// Loads the trace summary, then its face detections. The summary is assigned before the second
+// request so it is still shown if only the faces request fails.
+async function loadData() {
+  try {
+    const traces = await httpFetch<any>(`${config.api_base_url}/api/v1/file/${fileUuid}/face_trace/sortby`, {
+      method: 'POST',
+      body: JSON.stringify({ limit: 500 })
+    })
+    // The trace is looked up among at most 500 returned traces; ids are compared as strings
+    trace.value = (traces.traces || []).find((t: any) => String(t.trace_id) === traceId) ?? null
+
+    const faceData = await httpFetch<any>(`${config.api_base_url}/api/v1/file/${fileUuid}/trace/${traceId}/faces?limit=50`)
+    faces.value = faceData.faces || []
+  } catch (e) {
+    console.error('Failed to load trace:', e)
+    // Only report a failure when there is no summary to show
+    if (!trace.value) loadError.value = 'Failed to load trace'
+  } finally {
+    loading.value = false
+  }
+}
+
+onMounted(() => loadData())
+</script>
diff --git a/portal/src/views/TraceVizView.vue b/portal/src/views/TraceVizView.vue
new file mode 100644
index 0000000..7e7af6b
--- /dev/null
+++ b/portal/src/views/TraceVizView.vue
@@ -0,0 +1,83 @@
+<template>
+  <div class="min-h-screen bg-gray-900 text-white p-4">
+    <div class="flex items-center justify-between mb-4">
+      <h2 class="text-xl font-bold text-blue-400">V5: 3D Space-Time Cube</h2>
+      <button @click="goBack" class="text-sm bg-gray-700 hover:bg-gray-600 px-3 py-1 rounded">&larr; 返回</button>
+    </div>
+    <div class="text-xs text-gray-500 mb-3 flex gap-4">
+      <span>X = 畫面水平位置（紅軸）</span>
+      <span>Y = 畫面垂直位置（綠軸）</span>
+      <span>Z = 深度 - bbox 面積（藍軸）</span>
+      <span>T = 時間 - 顏色漸層藍&rarr;紅</span>
+    </div>
+    <div class="h-[calc(100vh-140px)]">
+      <SpaceTimeCube
+        :file-uuid="fileUuid"
+        :traces="allTraces"
+        :frame-width="1920"
+        :frame-height="1080"
+      />
+    </div>
+  </div>
+</template>
+
+<script setup lang="ts">
+// Full-page 3D view: requests up to 200 face traces of one file (sort_by face_count)
+// and passes them to the SpaceTimeCube component.
+import { ref, onMounted } from 'vue'
+import { useRoute, useRouter } from 'vue-router'
+import { getCurrentConfig } from '@/api/client'
+import SpaceTimeCube from '@/components/SpaceTimeCube.vue'
+
+const route = useRoute()
+const router = useRouter()
+const fileUuid = route.params.file_uuid as string
+const allTraces = ref<any[]>([])
+
+// A query value may be a string, an array (repeated parameter) or absent; use the first string only.
+function firstQueryValue(value: unknown): string {
+  const first = Array.isArray(value) ? value[0] : value
+  return typeof first === 'string' ? first : ''
+}
+
+// Auto-configure from query params (for demo)
+// NOTE(review): any link carrying ?key=&base= overwrites the stored API key and base URL, and the
+// key stays in the URL/browser history -- confirm this is acceptable outside demos.
+const keyParam = firstQueryValue(route.query.key)
+const baseParam = firstQueryValue(route.query.base)
+if (keyParam && baseParam) {
+  let existing: Record<string, unknown> = {}
+  try {
+    const parsed = JSON.parse(localStorage.getItem('portal_config') || '{}')
+    if (parsed && typeof parsed === 'object' && !Array.isArray(parsed)) existing = parsed
+  } catch {
+    // Stored config is not valid JSON: start from an empty object instead of failing setup
+  }
+  existing.api_key = keyParam
+  existing.api_base_url = baseParam
+  localStorage.setItem('portal_config', JSON.stringify(existing))
+}
+
+const goBack = () => router.back()
+
+// Fetch the traces once the component is mounted; on failure the cube is left empty and the error logged.
+onMounted(async () => {
+  const config = getCurrentConfig()
+  try {
+    const resp = await fetch(`${config.api_base_url}/api/v1/file/${fileUuid}/face_trace/sortby`, {
+      method: 'POST',
+      headers: {
+        'Content-Type': 'application/json',
+        ...(config.api_key ? { 'X-API-Key': config.api_key } : {})
+      },
+      body: JSON.stringify({ sort_by: 'face_count', limit: 200, min_faces: 1 })
+    })
+    // fetch() resolves for HTTP error statuses too; surface them rather than parsing an error body
+    if (!resp.ok) throw new Error(`HTTP ${resp.status}`)
+    const data = await resp.json()
+    allTraces.value = data.traces || []
+  } catch (e) {
+    console.error('Failed to load traces:', e)
+  }
+})
+</script>
\ No newline at end of file
diff --git a/release/dev_upgrade_v1.0.3/UPGRADE.md b/release/dev_upgrade_v1.0.3/UPGRADE.md
new file mode 100644
index 0000000..cc0eb9a
--- /dev/null
+++ b/release/dev_upgrade_v1.0.3/UPGRADE.md
@@ -0,0 +1,15 @@
+# Dev Upgrade v1.0.3
+
+## Steps
+
+```bash
+# 1. Apply migration
+psql -U accusys -d momentry < schema/migration_v1.0.3.sql
+
+# 2. Replace binary
+cp bin/momentry_playground /Users/accusys/momentry_core_0.1/target/debug/
+
+# 3. Restart
+pkill momentry_playground
+DATABASE_SCHEMA=dev /Users/accusys/momentry_core_0.1/target/debug/momentry_playground server --port 3003
+```
diff --git a/release/dev_upgrade_v1.0.3/bin/momentry_playground b/release/dev_upgrade_v1.0.3/bin/momentry_playground
new file mode 100755
index 0000000..66a1e48
Binary files /dev/null and b/release/dev_upgrade_v1.0.3/bin/momentry_playground differ
diff --git a/release/dev_upgrade_v1.0.3/schema/migration_v1.0.3.sql b/release/dev_upgrade_v1.0.3/schema/migration_v1.0.3.sql
new file mode 100644
index 0000000..20b257e
--- /dev/null
+++ b/release/dev_upgrade_v1.0.3/schema/migration_v1.0.3.sql
@@ -0,0 +1,10 @@
+-- Migration: dev schema v1.0.3
+-- Date: 2026-05-11
+-- Auto-generated from current DB schema
+
+SET search_path TO dev;
+
+ALTER TABLE dev.face_detections ADD COLUMN IF NOT EXISTS timestamp_secs float8;
+
+-- Chunk index removals (already applied)
+-- chunk_vectors: standard columns
diff --git a/release/public_schema_v1.0.0.sql b/release/public_schema_v1.0.0.sql
new file mode 100644
index 0000000..5b15732
--- /dev/null
+++ b/release/public_schema_v1.0.0.sql
@@ -0,0 +1,4863 @@
+--
+-- PostgreSQL database dump
+--
+
+\restrict hRi4nBNv2E5FXxBTf47fTk0vxfJNiXtnegSYFeraY46zaCyMMlYNanEdl70C1E7
+
+-- Dumped from database version 18.1 (Homebrew)
+-- Dumped by pg_dump version 18.1 (Homebrew)
+
+SET statement_timeout = 0;
+SET lock_timeout = 0;
+SET idle_in_transaction_session_timeout = 0;
+SET transaction_timeout = 0;
+SET client_encoding = 'UTF8';
+SET standard_conforming_strings = on;
+SELECT pg_catalog.set_config('search_path', '', false);
+SET check_function_bodies = false;
+SET xmloption = content;
+SET client_min_messages = warning;
+SET row_security = off;
+
+--
+-- Name: public; Type: SCHEMA; Schema: -; Owner: pg_database_owner
+--
+
+CREATE SCHEMA public;
+
+
+ALTER SCHEMA public OWNER TO pg_database_owner;
+
+--
+-- Name: SCHEMA public; Type: COMMENT; Schema: -; Owner: pg_database_owner
+--
+
+COMMENT ON SCHEMA public IS 'standard public schema';
+
+
+--
+-- Name: auto_match_face_speaker(character varying, double precision); Type: FUNCTION; Schema: public; Owner: accusys
+--
+
+CREATE FUNCTION public.auto_match_face_speaker(p_video_uuid character varying, p_threshold double precision DEFAULT 0.5) RETURNS TABLE(face_id character varying, speaker_id character varying, confidence double precision, match_count bigint)
+    LANGUAGE plpgsql
+    AS $$
+BEGIN
+    RETURN QUERY
+    -- Pair each face detection of the video with the speaker segments whose [start, end] range contains its timestamp_secs; one output row per (face_id, speaker_id)
+    SELECT 
+        fd.face_id,
+        seg.speaker_id,
+        COUNT(*)::DOUBLE PRECISION / NULLIF(COUNT(DISTINCT seg.speaker_id), 0) AS confidence,  -- NOTE(review): rows are grouped by seg.speaker_id, so the divisor is always 1 and this equals COUNT(*) -- confirm the intended formula
+        COUNT(*) AS match_count
+    FROM face_detections fd
+    CROSS JOIN LATERAL (  -- segments are read from face_recognition_results.result_data for results that list this face_id in any frame
+        SELECT 
+            seg_data->>'speaker_id' AS speaker_id,
+            (seg_data->>'start')::DOUBLE PRECISION AS seg_start,
+            (seg_data->>'end')::DOUBLE PRECISION AS seg_end
+        FROM face_recognition_results frr,
+             jsonb_array_elements(frr.result_data->'frames') AS frame_data,
+             jsonb_array_elements(frame_data->'faces') AS face_data,
+             jsonb_array_elements(frr.result_data->'segments') AS seg_data  -- NOTE(review): cross product; every segment repeats once per frame entry matching the face, which multiplies COUNT(*) -- confirm
+        WHERE frr.video_uuid = p_video_uuid
+          AND face_data->>'face_id' = fd.face_id
+    ) seg
+    WHERE fd.video_uuid = p_video_uuid
+      AND fd.timestamp_secs >= seg.seg_start
+      AND fd.timestamp_secs <= seg.seg_end
+      AND fd.face_id IS NOT NULL
+      AND seg.speaker_id IS NOT NULL
+    GROUP BY fd.face_id, seg.speaker_id
+    HAVING COUNT(*)::DOUBLE PRECISION / NULLIF(COUNT(DISTINCT seg.speaker_id), 0) >= p_threshold  -- with a divisor of 1 this is COUNT(*) >= p_threshold
+    ORDER BY confidence DESC;
+END;
+$$;
+
+
+ALTER FUNCTION public.auto_match_face_speaker(p_video_uuid character varying, p_threshold double precision) OWNER TO accusys;
+
+--
+-- Name: FUNCTION auto_match_face_speaker(p_video_uuid character varying, p_threshold double precision); Type: COMMENT; Schema: public; Owner: accusys
+--
+
+COMMENT ON FUNCTION public.auto_match_face_speaker(p_video_uuid character varying, p_threshold double precision) IS 'Automatically matches face detections with speaker segments';
+
+
+--
+-- Name: find_or_create_face_identity(character varying, character varying, public.vector, jsonb, jsonb); Type: FUNCTION; Schema: public; Owner: accusys
+--
+
+CREATE FUNCTION public.find_or_create_face_identity(p_face_id character varying, p_name character varying DEFAULT NULL::character varying, p_embedding public.vector DEFAULT NULL::public.vector, p_attributes jsonb DEFAULT NULL::jsonb, p_metadata jsonb DEFAULT '{}'::jsonb) RETURNS integer
+    LANGUAGE plpgsql
+    AS $$
+DECLARE
+    v_id INTEGER;  -- id of the face_identities row that is found or created; this is the return value
+BEGIN
+    -- Try to find existing face identity
+    SELECT id INTO v_id
+    FROM face_identities
+    WHERE face_id = p_face_id;
+    
+    IF v_id IS NULL THEN  -- NOTE(review): lookup and insert are separate statements with no locking visible here; confirm a unique constraint on face_id covers concurrent callers
+        -- Create new face identity
+        INSERT INTO face_identities (face_id, name, embedding, attributes, metadata)
+        VALUES (p_face_id, p_name, p_embedding, p_attributes, p_metadata)
+        RETURNING id INTO v_id;
+    ELSE
+        -- Update existing face identity
+        UPDATE face_identities
+        SET 
+            name = COALESCE(p_name, name),  -- NULL arguments keep the stored value
+            embedding = COALESCE(p_embedding, embedding),
+            attributes = COALESCE(p_attributes, attributes),
+            metadata = COALESCE(p_metadata, metadata),  -- NOTE(review): p_metadata defaults to '{}' (not NULL), so omitting it replaces stored metadata with '{}' -- confirm intended
+            updated_at = CURRENT_TIMESTAMP
+        WHERE id = v_id;
+    END IF;
+    
+    RETURN v_id;
+END;
+$$;
+
+
+ALTER FUNCTION public.find_or_create_face_identity(p_face_id character varying, p_name character varying, p_embedding public.vector, p_attributes jsonb, p_metadata jsonb) OWNER TO accusys;
+
+--
+-- Name: FUNCTION find_or_create_face_identity(p_face_id character varying, p_name character varying, p_embedding public.vector, p_attributes jsonb, p_metadata jsonb); Type: COMMENT; Schema: public; Owner: accusys
+--
+
+COMMENT ON FUNCTION public.find_or_create_face_identity(p_face_id character varying, p_name character varying, p_embedding public.vector, p_attributes jsonb, p_metadata jsonb) IS 'Finds or creates a face identity record';
+
+
+--
+-- Name: find_persons_at_time(character varying, double precision, double precision); Type: FUNCTION; Schema: public; Owner: accusys
+--
+
+CREATE FUNCTION public.find_persons_at_time(p_video_uuid character varying, p_time double precision, p_tolerance double precision DEFAULT 0.0) RETURNS TABLE(person_id character varying, name character varying, confidence double precision, appearance_id integer)
+    LANGUAGE plpgsql
+    AS $$
+BEGIN
+    RETURN QUERY  -- one row per matching appearance, highest confidence first
+    SELECT 
+        pi.person_id,
+        pi.name,
+        pa.confidence,
+        pa.id AS appearance_id
+    FROM person_appearances pa
+    JOIN person_identities pi ON pa.person_id = pi.person_id
+    WHERE pa.video_uuid = p_video_uuid
+      AND pa.start_time <= p_time + p_tolerance  -- appearance interval, widened by p_tolerance on both sides, must contain p_time
+      AND pa.end_time >= p_time - p_tolerance
+    ORDER BY pa.confidence DESC;
+END;
+$$;
+
+
+ALTER FUNCTION public.find_persons_at_time(p_video_uuid character varying, p_time double precision, p_tolerance double precision) OWNER TO accusys;
+
+--
+-- Name: FUNCTION find_persons_at_time(p_video_uuid character varying, p_time double precision, p_tolerance double precision); Type: COMMENT; Schema: public; Owner: accusys
+--
+
+COMMENT ON FUNCTION public.find_persons_at_time(p_video_uuid character varying, p_time double precision, p_tolerance double precision) IS 'Finds persons appearing at a specific time in video';
+
+
+--
+-- Name: find_persons_in_range(character varying, double precision, double precision); Type: FUNCTION; Schema: public; Owner: accusys
+--
+
+CREATE FUNCTION public.find_persons_in_range(p_video_uuid character varying, p_start_time double precision, p_end_time double precision) RETURNS TABLE(person_id character varying, name character varying, overlap_duration double precision, confidence double precision)
+    LANGUAGE plpgsql
+    AS $$
+BEGIN
+    RETURN QUERY  -- appearances of the video that overlap (p_start_time, p_end_time), longest overlap first
+    SELECT 
+        pi.person_id,
+        pi.name,
+        LEAST(pa.end_time, p_end_time) - GREATEST(pa.start_time, p_start_time) AS overlap_duration,  -- length of the intersection of the appearance and the requested range
+        AVG(pa.confidence) AS confidence
+    FROM person_appearances pa
+    JOIN person_identities pi ON pa.person_id = pi.person_id
+    WHERE pa.video_uuid = p_video_uuid
+      AND pa.start_time < p_end_time  -- strict comparisons: intervals that only touch at an endpoint are excluded
+      AND pa.end_time > p_start_time
+    GROUP BY pi.person_id, pi.name, pa.end_time, pa.start_time  -- grouped per person AND per distinct interval, so a person can appear in several rows
+    ORDER BY overlap_duration DESC;
+END;
+$$;
+
+
+ALTER FUNCTION public.find_persons_in_range(p_video_uuid character varying, p_start_time double precision, p_end_time double precision) OWNER TO accusys;
+
+--
+-- Name: FUNCTION find_persons_in_range(p_video_uuid character varying, p_start_time double precision, p_end_time double precision); Type: COMMENT; Schema: public; Owner: accusys
+--
+
+COMMENT ON FUNCTION public.find_persons_in_range(p_video_uuid character varying, p_start_time double precision, p_end_time double precision) IS 'Finds persons appearing in a time range with overlap calculation';
+
+
+--
+-- Name: find_similar_faces(public.vector, double precision, integer); Type: FUNCTION; Schema: public; Owner: accusys
+--
+
+CREATE FUNCTION public.find_similar_faces(query_embedding public.vector, similarity_threshold double precision DEFAULT 0.6, limit_count integer DEFAULT 10) RETURNS TABLE(face_id character varying, name character varying, similarity double precision, attributes jsonb, metadata jsonb)
+    LANGUAGE plpgsql
+    AS $$
+BEGIN
+    RETURN QUERY  -- active face identities closest to query_embedding, at most limit_count rows
+    SELECT 
+        fi.face_id,
+        fi.name,
+        1 - (fi.embedding <=> query_embedding) AS similarity,  -- similarity is 1 minus the <=> distance (presumably pgvector cosine distance -- confirm)
+        fi.attributes,
+        fi.metadata
+    FROM face_identities fi
+    WHERE fi.is_active = TRUE
+      AND fi.embedding IS NOT NULL
+      AND 1 - (fi.embedding <=> query_embedding) >= similarity_threshold
+    ORDER BY fi.embedding <=> query_embedding  -- ascending distance, i.e. most similar first
+    LIMIT limit_count;
+END;
+$$;
+
+
+ALTER FUNCTION public.find_similar_faces(query_embedding public.vector, similarity_threshold double precision, limit_count integer) OWNER TO accusys;
+
+--
+-- Name: FUNCTION find_similar_faces(query_embedding public.vector, similarity_threshold double precision, limit_count integer); Type: COMMENT; Schema: public; Owner: accusys
+--
+
+COMMENT ON FUNCTION public.find_similar_faces(query_embedding public.vector, similarity_threshold double precision, limit_count integer) IS 'Finds similar faces based on embedding similarity';
+
+
+--
+-- Name: merge_person_identities(character varying, character varying[]); Type: FUNCTION; Schema: public; Owner: accusys
+--
+
+CREATE FUNCTION public.merge_person_identities(p_target_person_id character varying, p_source_person_ids character varying[]) RETURNS void
+    LANGUAGE plpgsql
+    AS $$
+BEGIN  -- NOTE(review): nothing here checks that p_target_person_id exists in person_identities -- confirm callers guarantee it
+    -- Update all appearances to point to target person
+    UPDATE person_appearances
+    SET person_id = p_target_person_id
+    WHERE person_id = ANY(p_source_person_ids);
+    
+    -- Delete source person identities
+    DELETE FROM person_identities
+    WHERE person_id = ANY(p_source_person_ids)
+      AND person_id != p_target_person_id;  -- keeps the target row even when it is also listed among the sources
+    
+    -- Update target person statistics
+    PERFORM update_person_appearance_stats(p_target_person_id);
+END;
+$$;
+
+
+ALTER FUNCTION public.merge_person_identities(p_target_person_id character varying, p_source_person_ids character varying[]) OWNER TO accusys;
+
+--
+-- Name: FUNCTION merge_person_identities(p_target_person_id character varying, p_source_person_ids character varying[]); Type: COMMENT; Schema: public; Owner: accusys
+--
+
+COMMENT ON FUNCTION public.merge_person_identities(p_target_person_id character varying, p_source_person_ids character varying[]) IS 'Merges multiple person identities into one';
+
+
+--
+-- Name: trigger_update_person_stats(); Type: FUNCTION; Schema: public; Owner: accusys
+--
+
+CREATE FUNCTION public.trigger_update_person_stats() RETURNS trigger
+    LANGUAGE plpgsql
+    AS $$
+BEGIN  -- Refreshes person statistics via update_person_appearance_stats for each person_id touched by the row change
+    IF TG_OP = 'INSERT' THEN
+        PERFORM update_person_appearance_stats(NEW.person_id);
+    ELSIF TG_OP = 'UPDATE' THEN
+        PERFORM update_person_appearance_stats(NEW.person_id);
+        IF NEW.person_id IS DISTINCT FROM OLD.person_id THEN  -- NULL-safe: "!=" yields NULL (branch skipped) when either side is NULL
+            PERFORM update_person_appearance_stats(OLD.person_id);
+        END IF;
+    ELSIF TG_OP = 'DELETE' THEN
+        PERFORM update_person_appearance_stats(OLD.person_id);
+    END IF;
+    -- NOTE(review): returning NULL presumably means this is attached as an AFTER trigger -- confirm against the CREATE TRIGGER statement
+    RETURN NULL;
+END;
+$$;
+
+
+ALTER FUNCTION public.trigger_update_person_stats() OWNER TO accusys;
+
+--
+-- Name: update_cluster_centroid(character varying); Type: FUNCTION; Schema: public; Owner: accusys
+--
+
+CREATE FUNCTION public.update_cluster_centroid(cluster_uuid character varying) RETURNS void
+    LANGUAGE plpgsql
+    AS $$
+DECLARE
+    new_centroid VECTOR(512);  -- NOTE(review): unqualified type name; resolution depends on the search_path in effect when the function runs -- confirm
+BEGIN
+    -- Calculate new centroid from all face embeddings in the cluster
+    SELECT AVG(embedding) INTO new_centroid  -- AVG over zero rows is NULL, so a cluster with no embeddings gets a NULL centroid
+    FROM face_detections
+    WHERE cluster_id = cluster_uuid
+      AND embedding IS NOT NULL;
+    
+    -- Update cluster centroid
+    UPDATE face_clusters
+    SET centroid = new_centroid,
+        size = (SELECT COUNT(*) FROM face_detections WHERE cluster_id = cluster_uuid)  -- size counts every detection in the cluster, including those without an embedding
+    WHERE cluster_id = cluster_uuid;
+END;
+$$;
+
+
+ALTER FUNCTION public.update_cluster_centroid(cluster_uuid character varying) OWNER TO accusys;
+
+--
+-- Name: FUNCTION update_cluster_centroid(cluster_uuid character varying); Type: COMMENT; Schema: public; Owner: accusys
+--
+
+COMMENT ON FUNCTION public.update_cluster_centroid(cluster_uuid character varying) IS 'Updates cluster centroid from member embeddings';
+
+
+--
+-- Name: update_person_appearance_stats(character varying); Type: FUNCTION; Schema: public; Owner: accusys
+--
+
+CREATE FUNCTION public.update_person_appearance_stats(p_person_id character varying) RETURNS void
+    LANGUAGE plpgsql
+    AS $$
+BEGIN  -- Recomputes the cached statistics columns of one person_identities row from its person_appearances rows
+    UPDATE person_identities
+    SET 
+        appearance_count = (
+            SELECT COUNT(*) 
+            FROM person_appearances 
+            WHERE person_id = p_person_id
+        ),
+        total_appearance_duration = (
+            SELECT COALESCE(SUM(duration), 0.0)  -- 0.0 instead of NULL when the person has no appearances
+            FROM person_appearances 
+            WHERE person_id = p_person_id
+        ),
+        first_appearance_time = (
+            SELECT MIN(start_time)  -- NULL when the person has no appearances
+            FROM person_appearances 
+            WHERE person_id = p_person_id
+        ),
+        last_appearance_time = (
+            SELECT MAX(end_time)  -- NULL when the person has no appearances
+            FROM person_appearances 
+            WHERE person_id = p_person_id
+        ),
+        updated_at = CURRENT_TIMESTAMP
+    WHERE person_id = p_person_id;
+END;
+$$;
+
+
+ALTER FUNCTION public.update_person_appearance_stats(p_person_id character varying) OWNER TO accusys;
+
+--
+-- Name: FUNCTION update_person_appearance_stats(p_person_id character varying); Type: COMMENT; Schema: public; Owner: accusys
+--
+
+COMMENT ON FUNCTION public.update_person_appearance_stats(p_person_id character varying) IS 'Updates person identity statistics from appearances';
+
+
+--
+-- Name: update_search_vector(); Type: FUNCTION; Schema: public; Owner: accusys
+--
+
+CREATE FUNCTION public.update_search_vector() RETURNS trigger
+    LANGUAGE plpgsql
+    AS $$
+            BEGIN  -- Trigger function: fills NEW.search_vector from NEW.text_content before the row is returned
+                NEW.search_vector := to_tsvector('english', COALESCE(NEW.text_content, ''));  -- NULL text is indexed as an empty string; the 'english' text search configuration is fixed
+                RETURN NEW;
+            END;
+            $$;
+
+
+ALTER FUNCTION public.update_search_vector() OWNER TO accusys;
+
+--
+-- Name: update_updated_at_column(); Type: FUNCTION; Schema: public; Owner: accusys
+--
+
+CREATE FUNCTION public.update_updated_at_column() RETURNS trigger
+    LANGUAGE plpgsql
+    AS $$
+BEGIN  -- Trigger function: stamps the row being written with the current transaction timestamp
+    NEW.updated_at = CURRENT_TIMESTAMP;
+    RETURN NEW;  -- returns the modified row so the new updated_at value is the one stored
+END;
+$$;
+
+
+ALTER FUNCTION public.update_updated_at_column() OWNER TO accusys;
+
+SET default_tablespace = '';
+
+SET default_table_access_method = heap;
+
+--
+-- Name: api_key_anomalies; Type: TABLE; Schema: public; Owner: accusys
+--
+
+CREATE TABLE public.api_key_anomalies (
+    id integer NOT NULL,
+    key_id character varying(32) NOT NULL,
+    anomaly_type character varying(30) NOT NULL,
+    severity character varying(10) NOT NULL,
+    ip_address character varying(45),
+    request_count integer,
+    error_count integer,
+    error_rate double precision,
+    unique_ips integer,
+    details jsonb,
+    resolved boolean DEFAULT false,
+    resolved_at timestamp without time zone,
+    resolved_by character varying(128),
+    created_at timestamp without time zone DEFAULT CURRENT_TIMESTAMP
+);
+
+
+ALTER TABLE public.api_key_anomalies OWNER TO accusys;
+
+--
+-- Name: api_key_anomalies_id_seq; Type: SEQUENCE; Schema: public; Owner: accusys
+--
+
+CREATE SEQUENCE public.api_key_anomalies_id_seq
+    AS integer
+    START WITH 1
+    INCREMENT BY 1
+    NO MINVALUE
+    NO MAXVALUE
+    CACHE 1;
+
+
+ALTER SEQUENCE public.api_key_anomalies_id_seq OWNER TO accusys;
+
+--
+-- Name: api_key_anomalies_id_seq; Type: SEQUENCE OWNED BY; Schema: public; Owner: accusys
+--
+
+ALTER SEQUENCE public.api_key_anomalies_id_seq OWNED BY public.api_key_anomalies.id;
+
+
+--
+-- Name: api_key_audit_log; Type: TABLE; Schema: public; Owner: accusys
+--
+
+CREATE TABLE public.api_key_audit_log (
+    id integer NOT NULL,
+    key_id character varying(32) NOT NULL,
+    action character varying(50) NOT NULL,
+    actor character varying(128),
+    ip_address character varying(45),
+    user_agent text,
+    request_path text,
+    response_code integer,
+    anomaly_type character varying(30),
+    details jsonb,
+    created_at timestamp without time zone DEFAULT CURRENT_TIMESTAMP
+);
+
+
+ALTER TABLE public.api_key_audit_log OWNER TO accusys;
+
+--
+-- Name: api_key_audit_log_id_seq; Type: SEQUENCE; Schema: public; Owner: accusys
+--
+
+CREATE SEQUENCE public.api_key_audit_log_id_seq
+    AS integer
+    START WITH 1
+    INCREMENT BY 1
+    NO MINVALUE
+    NO MAXVALUE
+    CACHE 1;
+
+
+ALTER SEQUENCE public.api_key_audit_log_id_seq OWNER TO accusys;
+
+--
+-- Name: api_key_audit_log_id_seq; Type: SEQUENCE OWNED BY; Schema: public; Owner: accusys
+--
+
+ALTER SEQUENCE public.api_key_audit_log_id_seq OWNED BY public.api_key_audit_log.id;
+
+
+--
+-- Name: api_keys; Type: TABLE; Schema: public; Owner: accusys
+--
+
+CREATE TABLE public.api_keys (
+    id integer NOT NULL,
+    key_id character varying(48) NOT NULL,
+    key_hash character varying(64) NOT NULL,
+    key_prefix character varying(8) NOT NULL,
+    name character varying(128) NOT NULL,
+    key_type character varying(20) DEFAULT 'user'::character varying NOT NULL,
+    user_id bigint,
+    service_name character varying(64),
+    permissions jsonb DEFAULT '["read", "write"]'::jsonb,
+    expires_at timestamp with time zone,
+    last_used_at timestamp with time zone,
+    last_used_ip character varying(45),
+    usage_count bigint DEFAULT 0,
+    status character varying(20) DEFAULT 'active'::character varying NOT NULL,
+    rotation_required boolean DEFAULT false,
+    rotation_reason text,
+    grace_period_end timestamp with time zone,
+    created_at timestamp with time zone DEFAULT CURRENT_TIMESTAMP,
+    updated_at timestamp with time zone DEFAULT CURRENT_TIMESTAMP
+);
+
+
+ALTER TABLE public.api_keys OWNER TO accusys;
+
+--
+-- Name: api_keys_id_seq; Type: SEQUENCE; Schema: public; Owner: accusys
+--
+
+CREATE SEQUENCE public.api_keys_id_seq
+    AS integer
+    START WITH 1
+    INCREMENT BY 1
+    NO MINVALUE
+    NO MAXVALUE
+    CACHE 1;
+
+
+ALTER SEQUENCE public.api_keys_id_seq OWNER TO accusys;
+
+--
+-- Name: api_keys_id_seq; Type: SEQUENCE OWNED BY; Schema: public; Owner: accusys
+--
+
+ALTER SEQUENCE public.api_keys_id_seq OWNED BY public.api_keys.id;
+
+
+--
+-- Name: backup_history; Type: TABLE; Schema: public; Owner: accusys
+--
+
+CREATE TABLE public.backup_history (
+    id integer NOT NULL,
+    service_name character varying(50) NOT NULL,
+    operation character varying(20),
+    backup_file character varying(500),
+    backup_tier character varying(20),
+    source_tier character varying(20),
+    dest_tier character varying(20),
+    file_count bigint,
+    size_bytes bigint,
+    duration_seconds integer,
+    status character varying(20),
+    error_message text,
+    executed_at timestamp without time zone DEFAULT now(),
+    CONSTRAINT backup_history_operation_check CHECK (((operation)::text = ANY ((ARRAY['backup'::character varying, 'restore'::character varying, 'tier_migration'::character varying, 'cleanup'::character varying, 'verify'::character varying])::text[]))),
+    CONSTRAINT backup_history_status_check CHECK (((status)::text = ANY ((ARRAY['success'::character varying, 'failed'::character varying, 'partial'::character varying])::text[])))
+);
+
+
+ALTER TABLE public.backup_history OWNER TO accusys;
+
+--
+-- Name: backup_history_id_seq; Type: SEQUENCE; Schema: public; Owner: accusys
+--
+
+CREATE SEQUENCE public.backup_history_id_seq
+    AS integer
+    START WITH 1
+    INCREMENT BY 1
+    NO MINVALUE
+    NO MAXVALUE
+    CACHE 1;
+
+
+ALTER SEQUENCE public.backup_history_id_seq OWNER TO accusys;
+
+--
+-- Name: backup_history_id_seq; Type: SEQUENCE OWNED BY; Schema: public; Owner: accusys
+--
+
+ALTER SEQUENCE public.backup_history_id_seq OWNED BY public.backup_history.id;
+
+
+--
+-- Name: backup_registry; Type: TABLE; Schema: public; Owner: accusys
+--
+
+CREATE TABLE public.backup_registry (
+    id integer NOT NULL,
+    service_name character varying(50) NOT NULL,
+    backup_file character varying(500) NOT NULL,
+    backup_size_bytes bigint,
+    backup_type character varying(20),
+    status character varying(20),
+    created_at timestamp without time zone DEFAULT now()
+);
+
+
+ALTER TABLE public.backup_registry OWNER TO accusys;
+
+--
+-- Name: backup_registry_id_seq; Type: SEQUENCE; Schema: public; Owner: accusys
+--
+
+CREATE SEQUENCE public.backup_registry_id_seq
+    AS integer
+    START WITH 1
+    INCREMENT BY 1
+    NO MINVALUE
+    NO MAXVALUE
+    CACHE 1;
+
+
+ALTER SEQUENCE public.backup_registry_id_seq OWNER TO accusys;
+
+--
+-- Name: backup_registry_id_seq; Type: SEQUENCE OWNED BY; Schema: public; Owner: accusys
+--
+
+ALTER SEQUENCE public.backup_registry_id_seq OWNED BY public.backup_registry.id;
+
+
+--
+-- Name: backup_storage_stats; Type: TABLE; Schema: public; Owner: accusys
+--
+
+CREATE TABLE public.backup_storage_stats (
+    id integer NOT NULL,
+    tier character varying(20),
+    file_count bigint,
+    total_size_bytes bigint,
+    record_time timestamp without time zone DEFAULT now(),
+    CONSTRAINT backup_storage_stats_tier_check CHECK (((tier)::text = ANY ((ARRAY['daily'::character varying, 'weekly'::character varying, 'monthly'::character varying, 'archive'::character varying, 'total'::character varying])::text[])))
+);
+
+
+ALTER TABLE public.backup_storage_stats OWNER TO accusys;
+
+--
+-- Name: backup_storage_stats_id_seq; Type: SEQUENCE; Schema: public; Owner: accusys
+--
+
+CREATE SEQUENCE public.backup_storage_stats_id_seq
+    AS integer
+    START WITH 1
+    INCREMENT BY 1
+    NO MINVALUE
+    NO MAXVALUE
+    CACHE 1;
+
+
+ALTER SEQUENCE public.backup_storage_stats_id_seq OWNER TO accusys;
+
+--
+-- Name: backup_storage_stats_id_seq; Type: SEQUENCE OWNED BY; Schema: public; Owner: accusys
+--
+
+ALTER SEQUENCE public.backup_storage_stats_id_seq OWNED BY public.backup_storage_stats.id;
+
+
+--
+-- Name: castings; Type: TABLE; Schema: public; Owner: accusys
+--
+
+CREATE TABLE public.castings (
+    id bigint NOT NULL,
+    character_id bigint,
+    talent_id bigint,
+    track_type character varying(32) DEFAULT 'original'::character varying,
+    role_type character varying(32) DEFAULT 'both'::character varying
+);
+
+
+ALTER TABLE public.castings OWNER TO accusys;
+
+--
+-- Name: TABLE castings; Type: COMMENT; Schema: public; Owner: accusys
+--
+
+COMMENT ON TABLE public.castings IS 'Talent 與 Character 的飾演關係';
+
+
+--
+-- Name: castings_id_seq; Type: SEQUENCE; Schema: public; Owner: accusys
+--
+
+CREATE SEQUENCE public.castings_id_seq
+    START WITH 1
+    INCREMENT BY 1
+    NO MINVALUE
+    NO MAXVALUE
+    CACHE 1;
+
+
+ALTER SEQUENCE public.castings_id_seq OWNER TO accusys;
+
+--
+-- Name: castings_id_seq; Type: SEQUENCE OWNED BY; Schema: public; Owner: accusys
+--
+
+ALTER SEQUENCE public.castings_id_seq OWNED BY public.castings.id;
+
+
+--
+-- Name: characters; Type: TABLE; Schema: public; Owner: accusys
+--
+
+CREATE TABLE public.characters (
+    id bigint NOT NULL,
+    video_uuid text NOT NULL,
+    name text NOT NULL,
+    language_track text DEFAULT 'original'::text,
+    is_voice_only boolean DEFAULT false,
+    metadata jsonb DEFAULT '{}'::jsonb
+);
+
+
+ALTER TABLE public.characters OWNER TO accusys;
+
+--
+-- Name: TABLE characters; Type: COMMENT; Schema: public; Owner: accusys
+--
+
+COMMENT ON TABLE public.characters IS '視頻中的劇中角色';
+
+
+--
+-- Name: characters_id_seq; Type: SEQUENCE; Schema: public; Owner: accusys
+--
+
+CREATE SEQUENCE public.characters_id_seq
+    START WITH 1
+    INCREMENT BY 1
+    NO MINVALUE
+    NO MAXVALUE
+    CACHE 1;
+
+
+ALTER SEQUENCE public.characters_id_seq OWNER TO accusys;
+
+--
+-- Name: characters_id_seq; Type: SEQUENCE OWNED BY; Schema: public; Owner: accusys
+--
+
+ALTER SEQUENCE public.characters_id_seq OWNED BY public.characters.id;
+
+
+--
+-- Name: child_chunks; Type: TABLE; Schema: public; Owner: accusys
+--
+
+-- Time-bounded text chunk with an optional 768-dimension embedding.
+-- NOTE(review): parent_id is a nullable integer with no foreign key declared in
+-- this statement — confirm which table it refers to.
+CREATE TABLE public.child_chunks (
+    id integer NOT NULL,
+    parent_id integer,
+    uuid text NOT NULL,
+    start_time double precision NOT NULL,
+    end_time double precision NOT NULL,
+    raw_text text,
+    -- public.vector is presumably the pgvector extension type — confirm.
+    raw_text_vector public.vector(768),
+    speaker_ids text[],
+    tags text[],
+    created_at timestamp with time zone DEFAULT now(),
+    face_ids text[] DEFAULT '{}'::text[],
+    -- Frame bounds have no default here (NULL when omitted); fps defaults to 24.0.
+    start_frame bigint,
+    end_frame bigint,
+    fps double precision DEFAULT 24.0
+);
+
+
+ALTER TABLE public.child_chunks OWNER TO accusys;
+
+--
+-- Name: child_chunks_id_seq; Type: SEQUENCE; Schema: public; Owner: accusys
+--
+
+CREATE SEQUENCE public.child_chunks_id_seq
+    AS integer
+    START WITH 1
+    INCREMENT BY 1
+    NO MINVALUE
+    NO MAXVALUE
+    CACHE 1;
+
+
+ALTER SEQUENCE public.child_chunks_id_seq OWNER TO accusys;
+
+--
+-- Name: child_chunks_id_seq; Type: SEQUENCE OWNED BY; Schema: public; Owner: accusys
+--
+
+ALTER SEQUENCE public.child_chunks_id_seq OWNED BY public.child_chunks.id;
+
+
+--
+-- Name: chunk_vectors; Type: TABLE; Schema: public; Owner: accusys
+--
+
+-- Per-chunk embedding record keyed by chunk_id / uuid / chunk_type.
+CREATE TABLE public.chunk_vectors (
+    id integer NOT NULL,
+    chunk_id character varying(64) NOT NULL,
+    uuid character varying(32) NOT NULL,
+    chunk_type character varying(32) NOT NULL,
+    start_time double precision,
+    end_time double precision,
+    -- NOTE(review): both a text `embedding` and a typed `embedding_vector` exist;
+    -- presumably the text column is an older serialized form — confirm which one
+    -- readers should use.
+    embedding text,
+    metadata jsonb,
+    created_at timestamp without time zone DEFAULT CURRENT_TIMESTAMP,
+    embedding_vector public.vector(768),
+    file_id integer
+);
+
+
+ALTER TABLE public.chunk_vectors OWNER TO accusys;
+
+--
+-- Name: chunk_vectors_id_seq; Type: SEQUENCE; Schema: public; Owner: accusys
+--
+
+CREATE SEQUENCE public.chunk_vectors_id_seq
+    AS integer
+    START WITH 1
+    INCREMENT BY 1
+    NO MINVALUE
+    NO MAXVALUE
+    CACHE 1;
+
+
+ALTER SEQUENCE public.chunk_vectors_id_seq OWNER TO accusys;
+
+--
+-- Name: chunk_vectors_id_seq; Type: SEQUENCE OWNED BY; Schema: public; Owner: accusys
+--
+
+ALTER SEQUENCE public.chunk_vectors_id_seq OWNED BY public.chunk_vectors.id;
+
+
+--
+-- Name: chunks; Type: TABLE; Schema: public; Owner: accusys
+--
+
+-- Main chunk table: one row per chunk of a media item, with its time range,
+-- frame range, JSON content and assorted denormalized id arrays.
+CREATE TABLE public.chunks (
+    id integer NOT NULL,
+    uuid character varying(32) NOT NULL,
+    chunk_id character varying(64) NOT NULL,
+    chunk_index integer NOT NULL,
+    chunk_type character varying(32) NOT NULL,
+    start_time double precision NOT NULL,
+    end_time double precision NOT NULL,
+    content jsonb NOT NULL,
+    vector_id character varying(64),
+    -- Timestamps here are WITHOUT time zone, whereas child_chunks.created_at is
+    -- WITH time zone — keep that in mind when comparing across the two tables.
+    created_at timestamp without time zone DEFAULT CURRENT_TIMESTAMP,
+    fps double precision DEFAULT 24.0,
+    -- Frame bounds default to 0 (not NULL), so 0 may mean "unset" — TODO confirm.
+    start_frame bigint DEFAULT 0,
+    end_frame bigint DEFAULT 0,
+    metadata jsonb,
+    updated_at timestamp without time zone DEFAULT now(),
+    file_id integer,
+    text_content text,
+    frame_count integer DEFAULT 0,
+    -- Related-chunk references use three different types: integer[] here,
+    -- varchar(64) for the parent, text[] for children.
+    pre_chunk_ids integer[],
+    parent_chunk_id character varying(64),
+    child_chunk_ids text[],
+    -- Full-text search document; how it is populated is not visible in this statement.
+    search_vector tsvector,
+    speaker_ids text[] DEFAULT '{}'::text[],
+    face_ids text[] DEFAULT '{}'::text[],
+    visual_stats jsonb DEFAULT '{}'::jsonb
+);
+
+
+ALTER TABLE public.chunks OWNER TO accusys;
+
+--
+-- Name: chunks_id_seq; Type: SEQUENCE; Schema: public; Owner: accusys
+--
+
+CREATE SEQUENCE public.chunks_id_seq
+    AS integer
+    START WITH 1
+    INCREMENT BY 1
+    NO MINVALUE
+    NO MAXVALUE
+    CACHE 1;
+
+
+ALTER SEQUENCE public.chunks_id_seq OWNER TO accusys;
+
+--
+-- Name: chunks_id_seq; Type: SEQUENCE OWNED BY; Schema: public; Owner: accusys
+--
+
+ALTER SEQUENCE public.chunks_id_seq OWNED BY public.chunks.id;
+
+
+--
+-- Name: face_clusters; Type: TABLE; Schema: public; Owner: accusys
+--
+
+CREATE TABLE public.face_clusters (
+    id integer NOT NULL,
+    cluster_id character varying(255) NOT NULL,
+    video_uuid character varying(255) NOT NULL,
+    centroid public.vector(512),
+    size integer DEFAULT 0 NOT NULL,
+    representative_face_id character varying(255),
+    metadata jsonb DEFAULT '{}'::jsonb,
+    created_at timestamp with time zone DEFAULT CURRENT_TIMESTAMP
+);
+
+
+ALTER TABLE public.face_clusters OWNER TO accusys;
+
+--
+-- Name: TABLE face_clusters; Type: COMMENT; Schema: public; Owner: accusys
+--
+
+COMMENT ON TABLE public.face_clusters IS 'Stores face clusters from video analysis';
+
+
+--
+-- Name: face_clusters_id_seq; Type: SEQUENCE; Schema: public; Owner: accusys
+--
+
+CREATE SEQUENCE public.face_clusters_id_seq
+    AS integer
+    START WITH 1
+    INCREMENT BY 1
+    NO MINVALUE
+    NO MAXVALUE
+    CACHE 1;
+
+
+ALTER SEQUENCE public.face_clusters_id_seq OWNER TO accusys;
+
+--
+-- Name: face_clusters_id_seq; Type: SEQUENCE OWNED BY; Schema: public; Owner: accusys
+--
+
+ALTER SEQUENCE public.face_clusters_id_seq OWNED BY public.face_clusters.id;
+
+
+--
+-- Name: face_detections; Type: TABLE; Schema: public; Owner: accusys
+--
+
+-- One row per detected face in a video frame (see the table COMMENT:
+-- "Stores individual face detections from videos").
+CREATE TABLE public.face_detections (
+    id integer NOT NULL,
+    video_uuid character varying(255) NOT NULL,
+    frame_number bigint NOT NULL,
+    timestamp_secs double precision NOT NULL,
+    face_id character varying(255),
+    -- Presumably the detection bounding box in pixels (top-left + size) — confirm.
+    x integer NOT NULL,
+    y integer NOT NULL,
+    width integer NOT NULL,
+    height integer NOT NULL,
+    confidence double precision NOT NULL,
+    -- 512-dimension vector, the same width as face_identities.embedding and
+    -- face_clusters.centroid.
+    embedding public.vector(512),
+    attributes jsonb,
+    -- Optional links; no foreign keys are declared in this statement.
+    identity_id integer,
+    identity_confidence double precision,
+    cluster_id character varying(255),
+    created_at timestamp with time zone DEFAULT CURRENT_TIMESTAMP
+);
+
+
+ALTER TABLE public.face_detections OWNER TO accusys;
+
+--
+-- Name: TABLE face_detections; Type: COMMENT; Schema: public; Owner: accusys
+--
+
+COMMENT ON TABLE public.face_detections IS 'Stores individual face detections from videos';
+
+
+--
+-- Name: face_detections_id_seq; Type: SEQUENCE; Schema: public; Owner: accusys
+--
+
+CREATE SEQUENCE public.face_detections_id_seq
+    AS integer
+    START WITH 1
+    INCREMENT BY 1
+    NO MINVALUE
+    NO MAXVALUE
+    CACHE 1;
+
+
+ALTER SEQUENCE public.face_detections_id_seq OWNER TO accusys;
+
+--
+-- Name: face_detections_id_seq; Type: SEQUENCE OWNED BY; Schema: public; Owner: accusys
+--
+
+ALTER SEQUENCE public.face_detections_id_seq OWNED BY public.face_detections.id;
+
+
+--
+-- Name: face_identities; Type: TABLE; Schema: public; Owner: accusys
+--
+
+CREATE TABLE public.face_identities (
+    id integer NOT NULL,
+    face_id character varying(255) NOT NULL,
+    name character varying(255),
+    embedding public.vector(512),
+    attributes jsonb,
+    metadata jsonb DEFAULT '{}'::jsonb,
+    created_at timestamp with time zone DEFAULT CURRENT_TIMESTAMP,
+    updated_at timestamp with time zone DEFAULT CURRENT_TIMESTAMP,
+    is_active boolean DEFAULT true
+);
+
+
+ALTER TABLE public.face_identities OWNER TO accusys;
+
+--
+-- Name: TABLE face_identities; Type: COMMENT; Schema: public; Owner: accusys
+--
+
+COMMENT ON TABLE public.face_identities IS 'Stores registered face identities with embeddings';
+
+
+--
+-- Name: face_identities_id_seq; Type: SEQUENCE; Schema: public; Owner: accusys
+--
+
+CREATE SEQUENCE public.face_identities_id_seq
+    AS integer
+    START WITH 1
+    INCREMENT BY 1
+    NO MINVALUE
+    NO MAXVALUE
+    CACHE 1;
+
+
+ALTER SEQUENCE public.face_identities_id_seq OWNER TO accusys;
+
+--
+-- Name: face_identities_id_seq; Type: SEQUENCE OWNED BY; Schema: public; Owner: accusys
+--
+
+ALTER SEQUENCE public.face_identities_id_seq OWNED BY public.face_identities.id;
+
+
+--
+-- Name: face_recognition_results; Type: TABLE; Schema: public; Owner: accusys
+--
+
+CREATE TABLE public.face_recognition_results (
+    id integer NOT NULL,
+    video_uuid character varying(255) NOT NULL,
+    frame_count bigint DEFAULT 0 NOT NULL,
+    fps double precision DEFAULT 0.0 NOT NULL,
+    total_faces integer DEFAULT 0 NOT NULL,
+    recognized_faces integer DEFAULT 0 NOT NULL,
+    clusters_count integer DEFAULT 0 NOT NULL,
+    result_data jsonb NOT NULL,
+    processing_time_secs double precision,
+    created_at timestamp with time zone DEFAULT CURRENT_TIMESTAMP,
+    updated_at timestamp with time zone DEFAULT CURRENT_TIMESTAMP
+);
+
+
+ALTER TABLE public.face_recognition_results OWNER TO accusys;
+
+--
+-- Name: TABLE face_recognition_results; Type: COMMENT; Schema: public; Owner: accusys
+--
+
+COMMENT ON TABLE public.face_recognition_results IS 'Stores face recognition processing results';
+
+
+--
+-- Name: face_recognition_results_id_seq; Type: SEQUENCE; Schema: public; Owner: accusys
+--
+
+CREATE SEQUENCE public.face_recognition_results_id_seq
+    AS integer
+    START WITH 1
+    INCREMENT BY 1
+    NO MINVALUE
+    NO MAXVALUE
+    CACHE 1;
+
+
+ALTER SEQUENCE public.face_recognition_results_id_seq OWNER TO accusys;
+
+--
+-- Name: face_recognition_results_id_seq; Type: SEQUENCE OWNED BY; Schema: public; Owner: accusys
+--
+
+ALTER SEQUENCE public.face_recognition_results_id_seq OWNED BY public.face_recognition_results.id;
+
+
+--
+-- Name: file_lifecycle; Type: TABLE; Schema: public; Owner: accusys
+--
+
+CREATE TABLE public.file_lifecycle (
+    id integer NOT NULL,
+    file_uuid uuid,
+    file_path text,
+    user_cluster character varying(50),
+    storage_tier character varying(20),
+    created_at timestamp without time zone,
+    last_accessed_at timestamp without time zone,
+    last_modified_at timestamp without time zone,
+    access_count integer DEFAULT 0,
+    current_status character varying(20) DEFAULT 'active'::character varying,
+    tier_migration_count integer DEFAULT 0,
+    migrated_at timestamp without time zone
+);
+
+
+ALTER TABLE public.file_lifecycle OWNER TO accusys;
+
+--
+-- Name: file_lifecycle_id_seq; Type: SEQUENCE; Schema: public; Owner: accusys
+--
+
+CREATE SEQUENCE public.file_lifecycle_id_seq
+    AS integer
+    START WITH 1
+    INCREMENT BY 1
+    NO MINVALUE
+    NO MAXVALUE
+    CACHE 1;
+
+
+ALTER SEQUENCE public.file_lifecycle_id_seq OWNER TO accusys;
+
+--
+-- Name: file_lifecycle_id_seq; Type: SEQUENCE OWNED BY; Schema: public; Owner: accusys
+--
+
+ALTER SEQUENCE public.file_lifecycle_id_seq OWNED BY public.file_lifecycle.id;
+
+
+--
+-- Name: file_registry; Type: TABLE; Schema: public; Owner: accusys
+--
+
+-- Registry of files, keyed by a server-generated UUID (no serial id or sequence
+-- is attached to this table, unlike its neighbours in the dump).
+CREATE TABLE public.file_registry (
+    file_uuid uuid DEFAULT gen_random_uuid() NOT NULL,
+    file_name character varying(255) NOT NULL,
+    file_path text NOT NULL,
+    -- varchar(64) hashes; presumably hex SHA-256 digests — confirm with the writer.
+    file_path_hash character varying(64) NOT NULL,
+    file_size bigint NOT NULL,
+    file_hash character varying(64),
+    mime_type character varying(100),
+    user_cluster character varying(50),
+    owner_id character varying(100),
+    storage_tier character varying(20) DEFAULT 'hot'::character varying,
+    storage_location character varying(500),
+    status character varying(20) DEFAULT 'active'::character varying,
+    is_registered boolean DEFAULT true,
+    created_at timestamp without time zone DEFAULT now(),
+    updated_at timestamp without time zone DEFAULT now(),
+    last_accessed_at timestamp without time zone,
+    access_count integer DEFAULT 0,
+    archived_at timestamp without time zone,
+    archive_location character varying(500),
+    retention_until timestamp without time zone,
+    -- The three CHECKs below whitelist values; since the columns are nullable,
+    -- NULL still passes each check.
+    CONSTRAINT file_registry_status_check CHECK (((status)::text = ANY ((ARRAY['active'::character varying, 'temporary'::character varying, 'archived'::character varying, 'deleted'::character varying])::text[]))),
+    CONSTRAINT file_registry_storage_tier_check CHECK (((storage_tier)::text = ANY ((ARRAY['hot'::character varying, 'warm'::character varying, 'cold'::character varying])::text[]))),
+    CONSTRAINT file_registry_user_cluster_check CHECK (((user_cluster)::text = ANY ((ARRAY['family'::character varying, 'work'::character varying, 'wordpress'::character varying, 'shared'::character varying, 'system'::character varying])::text[])))
+);
+
+
+ALTER TABLE public.file_registry OWNER TO accusys;
+
+--
+-- Name: frames; Type: TABLE; Schema: public; Owner: accusys
+--
+
+CREATE TABLE public.frames (
+    id integer NOT NULL,
+    file_id integer NOT NULL,
+    frame_number bigint NOT NULL,
+    "timestamp" double precision NOT NULL,
+    fps double precision DEFAULT 24.0 NOT NULL,
+    yolo_objects jsonb,
+    ocr_results jsonb,
+    face_results jsonb,
+    frame_path text,
+    created_at timestamp without time zone DEFAULT CURRENT_TIMESTAMP,
+    pose_results jsonb
+);
+
+
+ALTER TABLE public.frames OWNER TO accusys;
+
+--
+-- Name: frames_id_seq; Type: SEQUENCE; Schema: public; Owner: accusys
+--
+
+CREATE SEQUENCE public.frames_id_seq
+    AS integer
+    START WITH 1
+    INCREMENT BY 1
+    NO MINVALUE
+    NO MAXVALUE
+    CACHE 1;
+
+
+ALTER SEQUENCE public.frames_id_seq OWNER TO accusys;
+
+--
+-- Name: frames_id_seq; Type: SEQUENCE OWNED BY; Schema: public; Owner: accusys
+--
+
+ALTER SEQUENCE public.frames_id_seq OWNED BY public.frames.id;
+
+
+--
+-- Name: gitea_tokens; Type: TABLE; Schema: public; Owner: accusys
+--
+
+CREATE TABLE public.gitea_tokens (
+    id integer NOT NULL,
+    gitea_token_id bigint NOT NULL,
+    gitea_user character varying(128) NOT NULL,
+    token_name character varying(128) NOT NULL,
+    token_last_eight character varying(8) NOT NULL,
+    scopes jsonb DEFAULT '[]'::jsonb,
+    api_key_id character varying(48),
+    last_verified timestamp without time zone,
+    created_at timestamp without time zone DEFAULT CURRENT_TIMESTAMP
+);
+
+
+ALTER TABLE public.gitea_tokens OWNER TO accusys;
+
+--
+-- Name: gitea_tokens_id_seq; Type: SEQUENCE; Schema: public; Owner: accusys
+--
+
+CREATE SEQUENCE public.gitea_tokens_id_seq
+    AS integer
+    START WITH 1
+    INCREMENT BY 1
+    NO MINVALUE
+    NO MAXVALUE
+    CACHE 1;
+
+
+ALTER SEQUENCE public.gitea_tokens_id_seq OWNER TO accusys;
+
+--
+-- Name: gitea_tokens_id_seq; Type: SEQUENCE OWNED BY; Schema: public; Owner: accusys
+--
+
+ALTER SEQUENCE public.gitea_tokens_id_seq OWNED BY public.gitea_tokens.id;
+
+
+--
+-- Name: identities; Type: TABLE; Schema: public; Owner: accusys
+--
+
+-- Known identities (people, brands, objects, ...) with optional embeddings per
+-- modality. Column meanings below restate the COMMENT ON COLUMN statements that
+-- follow this table in the dump.
+CREATE TABLE public.identities (
+    id integer NOT NULL,
+    name character varying(255) NOT NULL,
+    metadata jsonb DEFAULT '{}'::jsonb,
+    -- Generated by default but nullable (no NOT NULL declared).
+    uuid uuid DEFAULT gen_random_uuid(),
+    identity_type character varying(30) DEFAULT 'people'::character varying,
+    -- source / status are documented as enumerations (manual, tmdb,
+    -- agent_suggested, ai_detection / pending, confirmed, skipped) but, unlike
+    -- identity_type, have no CHECK constraint in this statement.
+    source character varying(20) DEFAULT 'manual'::character varying,
+    status character varying(20) DEFAULT 'pending'::character varying,
+    -- ECAPA-TDNN voice embedding (192-dim).
+    voice_embedding public.vector(192),
+    -- CLIP ViT-L/14 embedding (768-dim) for logo/symbol/object identities.
+    identity_embedding public.vector(768),
+    reference_data jsonb DEFAULT '{}'::jsonb,
+    created_at timestamp with time zone DEFAULT now(),
+    updated_at timestamp with time zone DEFAULT now(),
+    -- TMDB person ID and profile image URL.
+    tmdb_id integer,
+    tmdb_profile text,
+    -- InsightFace ArcFace embedding (512-dim).
+    face_embedding public.vector(512),
+    CONSTRAINT identities_identity_type_check CHECK (((identity_type)::text = ANY ((ARRAY['people'::character varying, 'brand'::character varying, 'object'::character varying, 'concept'::character varying, 'logo'::character varying, 'symbol'::character varying, 'scene'::character varying, 'sound'::character varying, 'animal'::character varying, 'environmental'::character varying])::text[])))
+);
+
+
+ALTER TABLE public.identities OWNER TO accusys;
+
+--
+-- Name: COLUMN identities.identity_type; Type: COMMENT; Schema: public; Owner: accusys
+--
+
+COMMENT ON COLUMN public.identities.identity_type IS 'Identity type: people, brand, object, concept, logo, symbol, scene, sound, animal, environmental';
+
+
+--
+-- Name: COLUMN identities.source; Type: COMMENT; Schema: public; Owner: accusys
+--
+
+COMMENT ON COLUMN public.identities.source IS 'Identity source: manual, tmdb, agent_suggested, ai_detection';
+
+
+--
+-- Name: COLUMN identities.status; Type: COMMENT; Schema: public; Owner: accusys
+--
+
+COMMENT ON COLUMN public.identities.status IS 'Identity status: pending, confirmed, skipped';
+
+
+--
+-- Name: COLUMN identities.voice_embedding; Type: COMMENT; Schema: public; Owner: accusys
+--
+
+COMMENT ON COLUMN public.identities.voice_embedding IS 'ECAPA-TDNN 192-dim voice embedding';
+
+
+--
+-- Name: COLUMN identities.identity_embedding; Type: COMMENT; Schema: public; Owner: accusys
+--
+
+COMMENT ON COLUMN public.identities.identity_embedding IS 'CLIP ViT-L/14 768-dim embedding for logo/symbol/object identity';
+
+
+--
+-- Name: COLUMN identities.reference_data; Type: COMMENT; Schema: public; Owner: accusys
+--
+
+COMMENT ON COLUMN public.identities.reference_data IS 'JSONB: {face_embeddings[], voice_embeddings[], identity_embeddings[], sound_embeddings[], image_urls[]}';
+
+
+--
+-- Name: COLUMN identities.tmdb_id; Type: COMMENT; Schema: public; Owner: accusys
+--
+
+COMMENT ON COLUMN public.identities.tmdb_id IS 'TMDB person ID';
+
+
+--
+-- Name: COLUMN identities.tmdb_profile; Type: COMMENT; Schema: public; Owner: accusys
+--
+
+COMMENT ON COLUMN public.identities.tmdb_profile IS 'TMDB profile image URL';
+
+
+--
+-- Name: COLUMN identities.face_embedding; Type: COMMENT; Schema: public; Owner: accusys
+--
+
+COMMENT ON COLUMN public.identities.face_embedding IS 'InsightFace ArcFace 512-dim embedding';
+
+
+--
+-- Name: identities_id_seq; Type: SEQUENCE; Schema: public; Owner: accusys
+--
+
+CREATE SEQUENCE public.identities_id_seq
+    AS integer
+    START WITH 1
+    INCREMENT BY 1
+    NO MINVALUE
+    NO MAXVALUE
+    CACHE 1;
+
+
+ALTER SEQUENCE public.identities_id_seq OWNER TO accusys;
+
+--
+-- Name: identities_id_seq; Type: SEQUENCE OWNED BY; Schema: public; Owner: accusys
+--
+
+ALTER SEQUENCE public.identities_id_seq OWNED BY public.identities.id;
+
+
+--
+-- Name: identity_bindings; Type: TABLE; Schema: public; Owner: accusys
+--
+
+CREATE TABLE public.identity_bindings (
+    id integer NOT NULL,
+    identity_id integer,
+    uuid text NOT NULL,
+    binding_type character varying(32) NOT NULL,
+    binding_value character varying(64) NOT NULL
+);
+
+
+ALTER TABLE public.identity_bindings OWNER TO accusys;
+
+--
+-- Name: identity_bindings_id_seq; Type: SEQUENCE; Schema: public; Owner: accusys
+--
+
+CREATE SEQUENCE public.identity_bindings_id_seq
+    AS integer
+    START WITH 1
+    INCREMENT BY 1
+    NO MINVALUE
+    NO MAXVALUE
+    CACHE 1;
+
+
+ALTER SEQUENCE public.identity_bindings_id_seq OWNER TO accusys;
+
+--
+-- Name: identity_bindings_id_seq; Type: SEQUENCE OWNED BY; Schema: public; Owner: accusys
+--
+
+ALTER SEQUENCE public.identity_bindings_id_seq OWNED BY public.identity_bindings.id;
+
+
+--
+-- Name: merge_history; Type: TABLE; Schema: public; Owner: accusys
+--
+
+CREATE TABLE public.merge_history (
+    id integer NOT NULL,
+    merge_id uuid DEFAULT gen_random_uuid() NOT NULL,
+    target_person_id character varying(255) NOT NULL,
+    source_person_ids text[] NOT NULL,
+    original_target_stats jsonb NOT NULL,
+    original_source_stats jsonb NOT NULL,
+    merged_at timestamp with time zone DEFAULT CURRENT_TIMESTAMP,
+    merged_by character varying(255),
+    is_undone boolean DEFAULT false,
+    undone_at timestamp with time zone,
+    metadata jsonb DEFAULT '{}'::jsonb
+);
+
+
+ALTER TABLE public.merge_history OWNER TO accusys;
+
+--
+-- Name: TABLE merge_history; Type: COMMENT; Schema: public; Owner: accusys
+--
+
+COMMENT ON TABLE public.merge_history IS 'Tracks person merges for undo capability';
+
+
+--
+-- Name: merge_history_id_seq; Type: SEQUENCE; Schema: public; Owner: accusys
+--
+
+CREATE SEQUENCE public.merge_history_id_seq
+    AS integer
+    START WITH 1
+    INCREMENT BY 1
+    NO MINVALUE
+    NO MAXVALUE
+    CACHE 1;
+
+
+ALTER SEQUENCE public.merge_history_id_seq OWNER TO accusys;
+
+--
+-- Name: merge_history_id_seq; Type: SEQUENCE OWNED BY; Schema: public; Owner: accusys
+--
+
+ALTER SEQUENCE public.merge_history_id_seq OWNED BY public.merge_history.id;
+
+
+--
+-- Name: monitor_anomalies; Type: TABLE; Schema: public; Owner: accusys
+--
+
+CREATE TABLE public.monitor_anomalies (
+    id integer NOT NULL,
+    anomaly_type character varying(50),
+    severity character varying(20),
+    source_type character varying(20),
+    username character varying(100),
+    source_ip character varying(45),
+    description text,
+    details jsonb,
+    detected_at timestamp without time zone DEFAULT now(),
+    resolved boolean DEFAULT false,
+    resolved_at timestamp without time zone,
+    CONSTRAINT monitor_anomalies_anomaly_type_check CHECK (((anomaly_type)::text = ANY ((ARRAY['brute_force'::character varying, 'privilege_escalation'::character varying, 'unusual_access'::character varying, 'unusual_time'::character varying, 'excessive_queries'::character varying, 'idle_session'::character varying, 'schema_change'::character varying])::text[]))),
+    CONSTRAINT monitor_anomalies_severity_check CHECK (((severity)::text = ANY ((ARRAY['low'::character varying, 'medium'::character varying, 'high'::character varying, 'critical'::character varying])::text[])))
+);
+
+
+ALTER TABLE public.monitor_anomalies OWNER TO accusys;
+
+--
+-- Name: monitor_anomalies_id_seq; Type: SEQUENCE; Schema: public; Owner: accusys
+--
+
+CREATE SEQUENCE public.monitor_anomalies_id_seq
+    AS integer
+    START WITH 1
+    INCREMENT BY 1
+    NO MINVALUE
+    NO MAXVALUE
+    CACHE 1;
+
+
+ALTER SEQUENCE public.monitor_anomalies_id_seq OWNER TO accusys;
+
+--
+-- Name: monitor_anomalies_id_seq; Type: SEQUENCE OWNED BY; Schema: public; Owner: accusys
+--
+
+ALTER SEQUENCE public.monitor_anomalies_id_seq OWNED BY public.monitor_anomalies.id;
+
+
+--
+-- Name: monitor_config; Type: TABLE; Schema: public; Owner: accusys
+--
+
+CREATE TABLE public.monitor_config (
+    id integer NOT NULL,
+    config_key character varying(50) NOT NULL,
+    config_value text,
+    description character varying(255),
+    updated_at timestamp without time zone DEFAULT now()
+);
+
+
+ALTER TABLE public.monitor_config OWNER TO accusys;
+
+--
+-- Name: monitor_config_id_seq; Type: SEQUENCE; Schema: public; Owner: accusys
+--
+
+CREATE SEQUENCE public.monitor_config_id_seq
+    AS integer
+    START WITH 1
+    INCREMENT BY 1
+    NO MINVALUE
+    NO MAXVALUE
+    CACHE 1;
+
+
+ALTER SEQUENCE public.monitor_config_id_seq OWNER TO accusys;
+
+--
+-- Name: monitor_config_id_seq; Type: SEQUENCE OWNED BY; Schema: public; Owner: accusys
+--
+
+ALTER SEQUENCE public.monitor_config_id_seq OWNED BY public.monitor_config.id;
+
+
+--
+-- Name: monitor_databases; Type: TABLE; Schema: public; Owner: accusys
+--
+
+CREATE TABLE public.monitor_databases (
+    id integer NOT NULL,
+    db_type character varying(20) NOT NULL,
+    db_name character varying(50),
+    metric_name character varying(50) NOT NULL,
+    metric_value jsonb,
+    checked_at timestamp without time zone DEFAULT now(),
+    CONSTRAINT monitor_databases_db_type_check CHECK (((db_type)::text = ANY ((ARRAY['postgresql'::character varying, 'redis'::character varying, 'qdrant'::character varying, 'mariadb'::character varying, 'mongodb'::character varying])::text[])))
+);
+
+
+ALTER TABLE public.monitor_databases OWNER TO accusys;
+
+--
+-- Name: monitor_databases_id_seq; Type: SEQUENCE; Schema: public; Owner: accusys
+--
+
+CREATE SEQUENCE public.monitor_databases_id_seq
+    AS integer
+    START WITH 1
+    INCREMENT BY 1
+    NO MINVALUE
+    NO MAXVALUE
+    CACHE 1;
+
+
+ALTER SEQUENCE public.monitor_databases_id_seq OWNER TO accusys;
+
+--
+-- Name: monitor_databases_id_seq; Type: SEQUENCE OWNED BY; Schema: public; Owner: accusys
+--
+
+ALTER SEQUENCE public.monitor_databases_id_seq OWNED BY public.monitor_databases.id;
+
+
+--
+-- Name: monitor_external; Type: TABLE; Schema: public; Owner: accusys
+--
+
+CREATE TABLE public.monitor_external (
+    id integer NOT NULL,
+    target_name character varying(50) NOT NULL,
+    target_type character varying(20),
+    target_host character varying(255),
+    is_reachable boolean,
+    response_time_ms integer,
+    dns_resolved_ip character varying(45),
+    error_message text,
+    checked_at timestamp without time zone DEFAULT now(),
+    CONSTRAINT monitor_external_target_type_check CHECK (((target_type)::text = ANY ((ARRAY['ddns'::character varying, 'gateway'::character varying, 'internet'::character varying, 'api'::character varying])::text[])))
+);
+
+
+ALTER TABLE public.monitor_external OWNER TO accusys;
+
+--
+-- Name: monitor_external_id_seq; Type: SEQUENCE; Schema: public; Owner: accusys
+--
+
+CREATE SEQUENCE public.monitor_external_id_seq
+    AS integer
+    START WITH 1
+    INCREMENT BY 1
+    NO MINVALUE
+    NO MAXVALUE
+    CACHE 1;
+
+
+ALTER SEQUENCE public.monitor_external_id_seq OWNER TO accusys;
+
+--
+-- Name: monitor_external_id_seq; Type: SEQUENCE OWNED BY; Schema: public; Owner: accusys
+--
+
+ALTER SEQUENCE public.monitor_external_id_seq OWNED BY public.monitor_external.id;
+
+
+--
+-- Name: monitor_jobs; Type: TABLE; Schema: public; Owner: accusys
+--
+
+-- Processing-job tracker: one row per job with its status, progress counters
+-- and per-processor outcome arrays.
+CREATE TABLE public.monitor_jobs (
+    id integer NOT NULL,
+    -- NOTE(review): varchar(16) here, while chunks.uuid is varchar(32) — confirm
+    -- these hold the same identifier and that 16 characters is sufficient.
+    uuid character varying(16) NOT NULL,
+    video_path character varying(512),
+    status character varying(20) DEFAULT 'pending'::character varying NOT NULL,
+    current_processor character varying(20),
+    progress_total integer DEFAULT 0,
+    progress_current integer DEFAULT 0,
+    error_count integer DEFAULT 0,
+    last_error text,
+    started_at timestamp without time zone,
+    updated_at timestamp without time zone,
+    created_at timestamp without time zone DEFAULT CURRENT_TIMESTAMP,
+    -- Documented as a reference to videos.id; no foreign key is declared here.
+    video_id bigint,
+    -- Documented as a WordPress user ID.
+    user_id bigint,
+    -- Defaults to nine processors: asr, cut, yolo, ocr, face, pose, asrx,
+    -- caption, story. The completed/failed arrays start empty.
+    processors character varying(20)[] DEFAULT '{asr,cut,yolo,ocr,face,pose,asrx,caption,story}'::character varying[],
+    completed_processors character varying(20)[] DEFAULT '{}'::character varying[],
+    failed_processors character varying(20)[] DEFAULT '{}'::character varying[],
+    -- status is restricted to: pending, running, completed, failed, cancelled.
+    CONSTRAINT chk_monitor_jobs_status CHECK (((status)::text = ANY ((ARRAY['pending'::character varying, 'running'::character varying, 'completed'::character varying, 'failed'::character varying, 'cancelled'::character varying])::text[])))
+);
+
+
+ALTER TABLE public.monitor_jobs OWNER TO accusys;
+
+--
+-- Name: COLUMN monitor_jobs.video_id; Type: COMMENT; Schema: public; Owner: accusys
+--
+
+COMMENT ON COLUMN public.monitor_jobs.video_id IS 'Foreign key to videos.id';
+
+
+--
+-- Name: COLUMN monitor_jobs.user_id; Type: COMMENT; Schema: public; Owner: accusys
+--
+
+COMMENT ON COLUMN public.monitor_jobs.user_id IS 'WordPress user ID';
+
+
+--
+-- Name: COLUMN monitor_jobs.processors; Type: COMMENT; Schema: public; Owner: accusys
+--
+
+-- The list mirrors the column DEFAULT on monitor_jobs.processors, which also
+-- includes caption and story; keep the two in sync when processors change.
+COMMENT ON COLUMN public.monitor_jobs.processors IS 'Processors to run: asr, cut, yolo, ocr, face, pose, asrx, caption, story';
+
+
+--
+-- Name: COLUMN monitor_jobs.completed_processors; Type: COMMENT; Schema: public; Owner: accusys
+--
+
+COMMENT ON COLUMN public.monitor_jobs.completed_processors IS 'Successfully completed processors';
+
+
+--
+-- Name: COLUMN monitor_jobs.failed_processors; Type: COMMENT; Schema: public; Owner: accusys
+--
+
+COMMENT ON COLUMN public.monitor_jobs.failed_processors IS 'Failed processors';
+
+
+--
+-- Name: monitor_jobs_id_seq; Type: SEQUENCE; Schema: public; Owner: accusys
+--
+
+CREATE SEQUENCE public.monitor_jobs_id_seq
+    AS integer
+    START WITH 1
+    INCREMENT BY 1
+    NO MINVALUE
+    NO MAXVALUE
+    CACHE 1;
+
+
+ALTER SEQUENCE public.monitor_jobs_id_seq OWNER TO accusys;
+
+--
+-- Name: monitor_jobs_id_seq; Type: SEQUENCE OWNED BY; Schema: public; Owner: accusys
+--
+
+ALTER SEQUENCE public.monitor_jobs_id_seq OWNED BY public.monitor_jobs.id;
+
+
+--
+-- Name: monitor_logins; Type: TABLE; Schema: public; Owner: accusys
+--
+
+CREATE TABLE public.monitor_logins (
+    id integer NOT NULL,
+    user_type character varying(20),
+    username character varying(100),
+    source_ip character varying(45),
+    user_agent text,
+    login_method character varying(20),
+    success boolean,
+    failure_reason character varying(200),
+    login_at timestamp without time zone DEFAULT now(),
+    CONSTRAINT monitor_logins_user_type_check CHECK (((user_type)::text = ANY ((ARRAY['system'::character varying, 'wordpress'::character varying, 'n8n'::character varying, 'gitea'::character varying, 'sftpgo'::character varying, 'database'::character varying])::text[])))
+);
+
+
+ALTER TABLE public.monitor_logins OWNER TO accusys;
+
+--
+-- Name: monitor_logins_id_seq; Type: SEQUENCE; Schema: public; Owner: accusys
+--
+
+CREATE SEQUENCE public.monitor_logins_id_seq
+    AS integer
+    START WITH 1
+    INCREMENT BY 1
+    NO MINVALUE
+    NO MAXVALUE
+    CACHE 1;
+
+
+ALTER SEQUENCE public.monitor_logins_id_seq OWNER TO accusys;
+
+--
+-- Name: monitor_logins_id_seq; Type: SEQUENCE OWNED BY; Schema: public; Owner: accusys
+--
+
+ALTER SEQUENCE public.monitor_logins_id_seq OWNED BY public.monitor_logins.id;
+
+
+--
+-- Name: monitor_pg_schema_changes; Type: TABLE; Schema: public; Owner: accusys
+--
+
+CREATE TABLE public.monitor_pg_schema_changes (
+    id integer NOT NULL,
+    database_name character varying(50),
+    schema_name character varying(50),
+    table_name character varying(100),
+    change_type character varying(20),
+    column_name character varying(100),
+    old_value text,
+    new_value text,
+    detected_at timestamp without time zone DEFAULT now(),
+    CONSTRAINT monitor_pg_schema_changes_change_type_check CHECK (((change_type)::text = ANY ((ARRAY['table_created'::character varying, 'table_dropped'::character varying, 'column_added'::character varying, 'column_removed'::character varying, 'column_type_changed'::character varying])::text[])))
+);
+
+
+ALTER TABLE public.monitor_pg_schema_changes OWNER TO accusys;
+
+--
+-- Name: monitor_pg_schema_changes_id_seq; Type: SEQUENCE; Schema: public; Owner: accusys
+--
+
+CREATE SEQUENCE public.monitor_pg_schema_changes_id_seq
+    AS integer
+    START WITH 1
+    INCREMENT BY 1
+    NO MINVALUE
+    NO MAXVALUE
+    CACHE 1;
+
+
+ALTER SEQUENCE public.monitor_pg_schema_changes_id_seq OWNER TO accusys;
+
+--
+-- Name: monitor_pg_schema_changes_id_seq; Type: SEQUENCE OWNED BY; Schema: public; Owner: accusys
+--
+
+ALTER SEQUENCE public.monitor_pg_schema_changes_id_seq OWNED BY public.monitor_pg_schema_changes.id;
+
+
+--
+-- Name: monitor_pg_tables; Type: TABLE; Schema: public; Owner: accusys
+--
+
+CREATE TABLE public.monitor_pg_tables (
+    id integer NOT NULL,
+    database_name character varying(50),
+    schema_name character varying(50),
+    table_name character varying(100),
+    table_type character varying(20),
+    row_count bigint,
+    table_size_bytes bigint,
+    index_size_bytes bigint,
+    snapshot_at timestamp without time zone DEFAULT now()
+);
+
+
+ALTER TABLE public.monitor_pg_tables OWNER TO accusys;
+
+--
+-- Name: monitor_pg_tables_id_seq; Type: SEQUENCE; Schema: public; Owner: accusys
+--
+
+CREATE SEQUENCE public.monitor_pg_tables_id_seq
+    AS integer
+    START WITH 1
+    INCREMENT BY 1
+    NO MINVALUE
+    NO MAXVALUE
+    CACHE 1;
+
+
+ALTER SEQUENCE public.monitor_pg_tables_id_seq OWNER TO accusys;
+
+--
+-- Name: monitor_pg_tables_id_seq; Type: SEQUENCE OWNED BY; Schema: public; Owner: accusys
+--
+
+ALTER SEQUENCE public.monitor_pg_tables_id_seq OWNED BY public.monitor_pg_tables.id;
+
+
+--
+-- Name: monitor_portal_pages; Type: TABLE; Schema: public; Owner: accusys
+-- page_url is required; page_type, is_accessible, response_time_ms, http_status and error_message are nullable; checked_at defaults to now() (no time zone).
+
+CREATE TABLE public.monitor_portal_pages (
+    id integer NOT NULL,
+    page_url character varying(500) NOT NULL,
+    page_type character varying(20),
+    is_accessible boolean,
+    response_time_ms integer,
+    http_status integer,
+    error_message text,
+    checked_at timestamp without time zone DEFAULT now()
+);
+
+
+ALTER TABLE public.monitor_portal_pages OWNER TO accusys;
+
+--
+-- Name: monitor_portal_pages_id_seq; Type: SEQUENCE; Schema: public; Owner: accusys
+-- Integer sequence (start 1, increment 1, cache 1); owned by monitor_portal_pages.id via the OWNED BY statement below.
+
+CREATE SEQUENCE public.monitor_portal_pages_id_seq
+    AS integer
+    START WITH 1
+    INCREMENT BY 1
+    NO MINVALUE
+    NO MAXVALUE
+    CACHE 1;
+
+
+ALTER SEQUENCE public.monitor_portal_pages_id_seq OWNER TO accusys;
+
+--
+-- Name: monitor_portal_pages_id_seq; Type: SEQUENCE OWNED BY; Schema: public; Owner: accusys
+--
+
+ALTER SEQUENCE public.monitor_portal_pages_id_seq OWNED BY public.monitor_portal_pages.id;
+
+
+--
+-- Name: monitor_portal_users; Type: TABLE; Schema: public; Owner: accusys
+-- Columns user_id, username, email, role, is_active, last_login and created_at are nullable with no defaults; detected_at defaults to now(). Timestamps carry no time zone.
+
+CREATE TABLE public.monitor_portal_users (
+    id integer NOT NULL,
+    user_id bigint,
+    username character varying(100),
+    email character varying(255),
+    role character varying(50),
+    is_active boolean,
+    last_login timestamp without time zone,
+    created_at timestamp without time zone,
+    detected_at timestamp without time zone DEFAULT now()
+);
+
+
+ALTER TABLE public.monitor_portal_users OWNER TO accusys;
+
+--
+-- Name: monitor_portal_users_id_seq; Type: SEQUENCE; Schema: public; Owner: accusys
+-- Integer sequence (start 1, increment 1, cache 1); owned by monitor_portal_users.id via the OWNED BY statement below.
+
+CREATE SEQUENCE public.monitor_portal_users_id_seq
+    AS integer
+    START WITH 1
+    INCREMENT BY 1
+    NO MINVALUE
+    NO MAXVALUE
+    CACHE 1;
+
+
+ALTER SEQUENCE public.monitor_portal_users_id_seq OWNER TO accusys;
+
+--
+-- Name: monitor_portal_users_id_seq; Type: SEQUENCE OWNED BY; Schema: public; Owner: accusys
+--
+
+ALTER SEQUENCE public.monitor_portal_users_id_seq OWNED BY public.monitor_portal_users.id;
+
+
+--
+-- Name: monitor_qdrant_collections; Type: TABLE; Schema: public; Owner: accusys
+-- Holds collection_name, vectors_count, points_count, disk_size_bytes and status; snapshot_at defaults to now(). No CHECK restricts status in this statement.
+
+CREATE TABLE public.monitor_qdrant_collections (
+    id integer NOT NULL,
+    collection_name character varying(100),
+    vectors_count bigint,
+    points_count bigint,
+    disk_size_bytes bigint,
+    status character varying(20),
+    snapshot_at timestamp without time zone DEFAULT now()
+);
+
+
+ALTER TABLE public.monitor_qdrant_collections OWNER TO accusys;
+
+--
+-- Name: monitor_qdrant_collections_id_seq; Type: SEQUENCE; Schema: public; Owner: accusys
+-- Integer sequence (start 1, increment 1, cache 1); owned by monitor_qdrant_collections.id via the OWNED BY statement below.
+
+CREATE SEQUENCE public.monitor_qdrant_collections_id_seq
+    AS integer
+    START WITH 1
+    INCREMENT BY 1
+    NO MINVALUE
+    NO MAXVALUE
+    CACHE 1;
+
+
+ALTER SEQUENCE public.monitor_qdrant_collections_id_seq OWNER TO accusys;
+
+--
+-- Name: monitor_qdrant_collections_id_seq; Type: SEQUENCE OWNED BY; Schema: public; Owner: accusys
+--
+
+ALTER SEQUENCE public.monitor_qdrant_collections_id_seq OWNED BY public.monitor_qdrant_collections.id;
+
+
+--
+-- Name: monitor_resource_usage; Type: TABLE; Schema: public; Owner: accusys
+-- cpu_percent is numeric(5,2), so values above 999.99 are rejected; memory_mb is integer while the disk/network *_mb columns are bigint; recorded_at defaults to now().
+
+CREATE TABLE public.monitor_resource_usage (
+    id integer NOT NULL,
+    user_type character varying(20),
+    username character varying(100),
+    service_name character varying(50),
+    cpu_percent numeric(5,2),
+    memory_mb integer,
+    disk_io_read_mb bigint,
+    disk_io_write_mb bigint,
+    network_rx_mb bigint,
+    network_tx_mb bigint,
+    recorded_at timestamp without time zone DEFAULT now()
+);
+
+
+ALTER TABLE public.monitor_resource_usage OWNER TO accusys;
+
+--
+-- Name: monitor_resource_usage_id_seq; Type: SEQUENCE; Schema: public; Owner: accusys
+-- Integer sequence (start 1, increment 1, cache 1); owned by monitor_resource_usage.id via the OWNED BY statement below.
+
+CREATE SEQUENCE public.monitor_resource_usage_id_seq
+    AS integer
+    START WITH 1
+    INCREMENT BY 1
+    NO MINVALUE
+    NO MAXVALUE
+    CACHE 1;
+
+
+ALTER SEQUENCE public.monitor_resource_usage_id_seq OWNER TO accusys;
+
+--
+-- Name: monitor_resource_usage_id_seq; Type: SEQUENCE OWNED BY; Schema: public; Owner: accusys
+--
+
+ALTER SEQUENCE public.monitor_resource_usage_id_seq OWNED BY public.monitor_resource_usage.id;
+
+
+--
+-- Name: monitor_services; Type: TABLE; Schema: public; Owner: accusys
+-- service_name is required; status must be 'up', 'down', 'degraded' or 'unknown' (the column is nullable, so NULL also passes the CHECK); checked_at defaults to now().
+
+CREATE TABLE public.monitor_services (
+    id integer NOT NULL,
+    service_name character varying(50) NOT NULL,
+    service_type character varying(20),
+    port integer,
+    status character varying(20),
+    response_time_ms integer,
+    error_message text,
+    checked_at timestamp without time zone DEFAULT now(),
+    CONSTRAINT monitor_services_status_check CHECK (((status)::text = ANY ((ARRAY['up'::character varying, 'down'::character varying, 'degraded'::character varying, 'unknown'::character varying])::text[])))
+);
+
+
+ALTER TABLE public.monitor_services OWNER TO accusys;
+
+--
+-- Name: monitor_services_id_seq; Type: SEQUENCE; Schema: public; Owner: accusys
+-- Integer sequence (start 1, increment 1, cache 1); owned by monitor_services.id via the OWNED BY statement below.
+
+CREATE SEQUENCE public.monitor_services_id_seq
+    AS integer
+    START WITH 1
+    INCREMENT BY 1
+    NO MINVALUE
+    NO MAXVALUE
+    CACHE 1;
+
+
+ALTER SEQUENCE public.monitor_services_id_seq OWNER TO accusys;
+
+--
+-- Name: monitor_services_id_seq; Type: SEQUENCE OWNED BY; Schema: public; Owner: accusys
+--
+
+ALTER SEQUENCE public.monitor_services_id_seq OWNED BY public.monitor_services.id;
+
+
+--
+-- Name: monitor_sessions; Type: TABLE; Schema: public; Owner: accusys
+-- session_type is limited to ssh/web/db/sftp/rdp and status to active/disconnected/timeout (NULL passes both CHECKs); none of the timestamp columns has a default.
+
+CREATE TABLE public.monitor_sessions (
+    id integer NOT NULL,
+    session_type character varying(20),
+    service_name character varying(50),
+    username character varying(100),
+    source_ip character varying(45),
+    source_port integer,
+    connected_at timestamp without time zone,
+    last_activity_at timestamp without time zone,
+    disconnected_at timestamp without time zone,
+    bytes_sent bigint,
+    bytes_received bigint,
+    status character varying(20),
+    CONSTRAINT monitor_sessions_session_type_check CHECK (((session_type)::text = ANY ((ARRAY['ssh'::character varying, 'web'::character varying, 'db'::character varying, 'sftp'::character varying, 'rdp'::character varying])::text[]))),
+    CONSTRAINT monitor_sessions_status_check CHECK (((status)::text = ANY ((ARRAY['active'::character varying, 'disconnected'::character varying, 'timeout'::character varying])::text[])))
+);
+
+
+ALTER TABLE public.monitor_sessions OWNER TO accusys;
+
+--
+-- Name: monitor_sessions_id_seq; Type: SEQUENCE; Schema: public; Owner: accusys
+-- Integer sequence (start 1, increment 1, cache 1); owned by monitor_sessions.id via the OWNED BY statement below.
+
+CREATE SEQUENCE public.monitor_sessions_id_seq
+    AS integer
+    START WITH 1
+    INCREMENT BY 1
+    NO MINVALUE
+    NO MAXVALUE
+    CACHE 1;
+
+
+ALTER SEQUENCE public.monitor_sessions_id_seq OWNER TO accusys;
+
+--
+-- Name: monitor_sessions_id_seq; Type: SEQUENCE OWNED BY; Schema: public; Owner: accusys
+--
+
+ALTER SEQUENCE public.monitor_sessions_id_seq OWNED BY public.monitor_sessions.id;
+
+
+--
+-- Name: monitor_sudo_history; Type: TABLE; Schema: public; Owner: accusys
+-- Holds username, command, run_as, tty, source_ip and exit_code, all nullable; executed_at defaults to now(). Only id is NOT NULL.
+
+CREATE TABLE public.monitor_sudo_history (
+    id integer NOT NULL,
+    username character varying(100),
+    command text,
+    run_as character varying(100),
+    tty character varying(50),
+    source_ip character varying(45),
+    exit_code integer,
+    executed_at timestamp without time zone DEFAULT now()
+);
+
+
+ALTER TABLE public.monitor_sudo_history OWNER TO accusys;
+
+--
+-- Name: monitor_sudo_history_id_seq; Type: SEQUENCE; Schema: public; Owner: accusys
+-- Integer sequence (start 1, increment 1, cache 1); owned by monitor_sudo_history.id via the OWNED BY statement below.
+
+CREATE SEQUENCE public.monitor_sudo_history_id_seq
+    AS integer
+    START WITH 1
+    INCREMENT BY 1
+    NO MINVALUE
+    NO MAXVALUE
+    CACHE 1;
+
+
+ALTER SEQUENCE public.monitor_sudo_history_id_seq OWNER TO accusys;
+
+--
+-- Name: monitor_sudo_history_id_seq; Type: SEQUENCE OWNED BY; Schema: public; Owner: accusys
+--
+
+ALTER SEQUENCE public.monitor_sudo_history_id_seq OWNED BY public.monitor_sudo_history.id;
+
+
+--
+-- Name: monitor_workflows; Type: TABLE; Schema: public; Owner: accusys
+-- workflow_id is required; is_active/has_schedule/has_webhook default to false and the three *_count columns to 0; idle_days has no default. Read by view v_idle_workflows.
+
+CREATE TABLE public.monitor_workflows (
+    id integer NOT NULL,
+    workflow_id character varying(50) NOT NULL,
+    workflow_name character varying(255),
+    workflow_type character varying(50),
+    is_active boolean DEFAULT false,
+    last_executed_at timestamp without time zone,
+    execution_count integer DEFAULT 0,
+    success_count integer DEFAULT 0,
+    failure_count integer DEFAULT 0,
+    avg_duration_ms integer,
+    has_schedule boolean DEFAULT false,
+    has_webhook boolean DEFAULT false,
+    idle_days integer,
+    suggestion character varying(100),
+    checked_at timestamp without time zone DEFAULT now()
+);
+
+
+ALTER TABLE public.monitor_workflows OWNER TO accusys;
+
+--
+-- Name: monitor_workflows_id_seq; Type: SEQUENCE; Schema: public; Owner: accusys
+-- Integer sequence (start 1, increment 1, cache 1); owned by monitor_workflows.id via the OWNED BY statement below.
+
+CREATE SEQUENCE public.monitor_workflows_id_seq
+    AS integer
+    START WITH 1
+    INCREMENT BY 1
+    NO MINVALUE
+    NO MAXVALUE
+    CACHE 1;
+
+
+ALTER SEQUENCE public.monitor_workflows_id_seq OWNER TO accusys;
+
+--
+-- Name: monitor_workflows_id_seq; Type: SEQUENCE OWNED BY; Schema: public; Owner: accusys
+--
+
+ALTER SEQUENCE public.monitor_workflows_id_seq OWNED BY public.monitor_workflows.id;
+
+
+--
+-- Name: n8n_api_keys; Type: TABLE; Schema: public; Owner: accusys
+-- n8n_key_id, label and api_key_last_eight (at most 8 characters) are required; momentry_api_key_id is nullable with no foreign key in this statement; created_at defaults to CURRENT_TIMESTAMP.
+
+CREATE TABLE public.n8n_api_keys (
+    id integer NOT NULL,
+    n8n_key_id character varying(64) NOT NULL,
+    label character varying(100) NOT NULL,
+    api_key_last_eight character varying(8) NOT NULL,
+    momentry_api_key_id character varying(48),
+    expires_at timestamp with time zone,
+    last_verified timestamp with time zone,
+    created_at timestamp with time zone DEFAULT CURRENT_TIMESTAMP
+);
+
+
+ALTER TABLE public.n8n_api_keys OWNER TO accusys;
+
+--
+-- Name: n8n_api_keys_id_seq; Type: SEQUENCE; Schema: public; Owner: accusys
+-- Integer sequence (start 1, increment 1, cache 1); owned by n8n_api_keys.id via the OWNED BY statement below.
+
+CREATE SEQUENCE public.n8n_api_keys_id_seq
+    AS integer
+    START WITH 1
+    INCREMENT BY 1
+    NO MINVALUE
+    NO MAXVALUE
+    CACHE 1;
+
+
+ALTER SEQUENCE public.n8n_api_keys_id_seq OWNER TO accusys;
+
+--
+-- Name: n8n_api_keys_id_seq; Type: SEQUENCE OWNED BY; Schema: public; Owner: accusys
+--
+
+ALTER SEQUENCE public.n8n_api_keys_id_seq OWNED BY public.n8n_api_keys.id;
+
+
+--
+-- Name: node_process_tracking; Type: TABLE; Schema: public; Owner: accusys
+-- process_name is required; command is limited to 500 characters; is_managed defaults to false; checked_at defaults to now() while started_at has no default.
+
+CREATE TABLE public.node_process_tracking (
+    id integer NOT NULL,
+    process_name character varying(100) NOT NULL,
+    pid integer,
+    command character varying(500),
+    node_version character varying(20),
+    is_managed boolean DEFAULT false,
+    started_at timestamp without time zone,
+    checked_at timestamp without time zone DEFAULT now()
+);
+
+
+ALTER TABLE public.node_process_tracking OWNER TO accusys;
+
+--
+-- Name: node_process_tracking_id_seq; Type: SEQUENCE; Schema: public; Owner: accusys
+-- Integer sequence (start 1, increment 1, cache 1); owned by node_process_tracking.id via the OWNED BY statement below.
+
+CREATE SEQUENCE public.node_process_tracking_id_seq
+    AS integer
+    START WITH 1
+    INCREMENT BY 1
+    NO MINVALUE
+    NO MAXVALUE
+    CACHE 1;
+
+
+ALTER SEQUENCE public.node_process_tracking_id_seq OWNER TO accusys;
+
+--
+-- Name: node_process_tracking_id_seq; Type: SEQUENCE OWNED BY; Schema: public; Owner: accusys
+--
+
+ALTER SEQUENCE public.node_process_tracking_id_seq OWNED BY public.node_process_tracking.id;
+
+
+--
+-- Name: node_version_baseline; Type: TABLE; Schema: public; Owner: accusys
+-- runtime_name and required_version are required; current_version, process_name, process_path, is_compliant and locked_path are nullable without defaults; checked_at defaults to now().
+
+CREATE TABLE public.node_version_baseline (
+    id integer NOT NULL,
+    runtime_name character varying(50) NOT NULL,
+    required_version character varying(20) NOT NULL,
+    current_version character varying(20),
+    process_name character varying(100),
+    process_path text,
+    is_compliant boolean,
+    locked_path character varying(500),
+    checked_at timestamp without time zone DEFAULT now()
+);
+
+
+ALTER TABLE public.node_version_baseline OWNER TO accusys;
+
+--
+-- Name: node_version_baseline_id_seq; Type: SEQUENCE; Schema: public; Owner: accusys
+-- Integer sequence (start 1, increment 1, cache 1); owned by node_version_baseline.id via the OWNED BY statement below.
+
+CREATE SEQUENCE public.node_version_baseline_id_seq
+    AS integer
+    START WITH 1
+    INCREMENT BY 1
+    NO MINVALUE
+    NO MAXVALUE
+    CACHE 1;
+
+
+ALTER SEQUENCE public.node_version_baseline_id_seq OWNER TO accusys;
+
+--
+-- Name: node_version_baseline_id_seq; Type: SEQUENCE OWNED BY; Schema: public; Owner: accusys
+--
+
+ALTER SEQUENCE public.node_version_baseline_id_seq OWNED BY public.node_version_baseline.id;
+
+
+--
+-- Name: parent_chunks; Type: TABLE; Schema: public; Owner: accusys
+-- uuid, start_time and end_time are required; summary_vector is public.vector(768); rule_3_markers defaults to '{}' and fps to 24.0. NOTE(review): no CHECK orders start_time/end_time here - confirm.
+
+CREATE TABLE public.parent_chunks (
+    id integer NOT NULL,
+    uuid text NOT NULL,
+    scene_order integer,
+    start_time double precision NOT NULL,
+    end_time double precision NOT NULL,
+    summary_text text,
+    summary_vector public.vector(768),
+    metadata jsonb,
+    created_at timestamp with time zone DEFAULT now(),
+    rule_3_markers jsonb DEFAULT '{}'::jsonb,
+    start_frame bigint,
+    end_frame bigint,
+    fps double precision DEFAULT 24.0
+);
+
+
+ALTER TABLE public.parent_chunks OWNER TO accusys;
+
+--
+-- Name: parent_chunks_id_seq; Type: SEQUENCE; Schema: public; Owner: accusys
+-- Integer sequence (start 1, increment 1, cache 1); owned by parent_chunks.id via the OWNED BY statement below.
+
+CREATE SEQUENCE public.parent_chunks_id_seq
+    AS integer
+    START WITH 1
+    INCREMENT BY 1
+    NO MINVALUE
+    NO MAXVALUE
+    CACHE 1;
+
+
+ALTER SEQUENCE public.parent_chunks_id_seq OWNER TO accusys;
+
+--
+-- Name: parent_chunks_id_seq; Type: SEQUENCE OWNED BY; Schema: public; Owner: accusys
+--
+
+ALTER SEQUENCE public.parent_chunks_id_seq OWNED BY public.parent_chunks.id;
+
+
+--
+-- Name: parent_chunks_poc; Type: TABLE; Schema: public; Owner: accusys
+-- Declares the same columns as parent_chunks from id through created_at, without rule_3_markers, start_frame, end_frame and fps.
+
+CREATE TABLE public.parent_chunks_poc (
+    id integer NOT NULL,
+    uuid text NOT NULL,
+    scene_order integer,
+    start_time double precision NOT NULL,
+    end_time double precision NOT NULL,
+    summary_text text,
+    summary_vector public.vector(768),
+    metadata jsonb,
+    created_at timestamp with time zone DEFAULT now()
+);
+
+
+ALTER TABLE public.parent_chunks_poc OWNER TO accusys;
+
+--
+-- Name: parent_chunks_poc_id_seq; Type: SEQUENCE; Schema: public; Owner: accusys
+-- Integer sequence (start 1, increment 1, cache 1); owned by parent_chunks_poc.id via the OWNED BY statement below.
+
+CREATE SEQUENCE public.parent_chunks_poc_id_seq
+    AS integer
+    START WITH 1
+    INCREMENT BY 1
+    NO MINVALUE
+    NO MAXVALUE
+    CACHE 1;
+
+
+ALTER SEQUENCE public.parent_chunks_poc_id_seq OWNER TO accusys;
+
+--
+-- Name: parent_chunks_poc_id_seq; Type: SEQUENCE OWNED BY; Schema: public; Owner: accusys
+--
+
+ALTER SEQUENCE public.parent_chunks_poc_id_seq OWNED BY public.parent_chunks_poc.id;
+
+
+-- Appearance interval of a person in a video: start_time/end_time >= 0, end_time > start_time, duration > 0, confidence within [0.0, 1.0].
+-- Name: person_appearances; Type: TABLE; Schema: public; Owner: accusys
+-- valid_duration allows a 1e-6 tolerance: exact equality on double precision rejects consistent rows such as start 0.1, end 0.3, duration 0.2.
+
+CREATE TABLE public.person_appearances (
+    id integer NOT NULL,
+    person_id character varying(255) NOT NULL,
+    video_uuid character varying(255) NOT NULL,
+    start_time double precision NOT NULL,
+    end_time double precision NOT NULL,
+    duration double precision NOT NULL,
+    face_detection_id integer,
+    asrx_segment_start double precision,
+    asrx_segment_end double precision,
+    confidence double precision DEFAULT 0.0,
+    metadata jsonb DEFAULT '{}'::jsonb,
+    created_at timestamp with time zone DEFAULT CURRENT_TIMESTAMP,
+    CONSTRAINT person_appearances_confidence_check CHECK (((confidence >= (0.0)::double precision) AND (confidence <= (1.0)::double precision))),
+    CONSTRAINT person_appearances_duration_check CHECK ((duration > (0)::double precision)),
+    CONSTRAINT person_appearances_end_time_check CHECK ((end_time >= (0)::double precision)),
+    CONSTRAINT person_appearances_start_time_check CHECK ((start_time >= (0)::double precision)),
+    CONSTRAINT valid_appearance_time CHECK ((end_time > start_time)),
+    CONSTRAINT valid_duration CHECK ((abs(((end_time - start_time) - duration)) <= (0.000001)::double precision))
+);
+
+
+ALTER TABLE public.person_appearances OWNER TO accusys;
+
+--
+-- Name: TABLE person_appearances; Type: COMMENT; Schema: public; Owner: accusys
+-- Attaches the catalog description to the person_appearances table.
+
+COMMENT ON TABLE public.person_appearances IS 'Stores individual person appearance records with time ranges';
+
+
+--
+-- Name: person_appearances_id_seq; Type: SEQUENCE; Schema: public; Owner: accusys
+-- Integer sequence (start 1, increment 1, cache 1); owned by person_appearances.id via the OWNED BY statement below.
+
+CREATE SEQUENCE public.person_appearances_id_seq
+    AS integer
+    START WITH 1
+    INCREMENT BY 1
+    NO MINVALUE
+    NO MAXVALUE
+    CACHE 1;
+
+
+ALTER SEQUENCE public.person_appearances_id_seq OWNER TO accusys;
+
+--
+-- Name: person_appearances_id_seq; Type: SEQUENCE OWNED BY; Schema: public; Owner: accusys
+--
+
+ALTER SEQUENCE public.person_appearances_id_seq OWNED BY public.person_appearances.id;
+
+
+--
+-- Name: person_identities; Type: TABLE; Schema: public; Owner: accusys
+-- person_id and video_uuid are required; confidence is limited to [0.0, 1.0]; valid_time_range only bites when both appearance times are non-NULL. face_identity_id/speaker_id have no foreign key in this statement.
+
+CREATE TABLE public.person_identities (
+    id integer NOT NULL,
+    person_id character varying(255) NOT NULL,
+    face_identity_id integer,
+    speaker_id character varying(64),
+    video_uuid character varying(255) NOT NULL,
+    confidence double precision DEFAULT 0.0,
+    name character varying(255),
+    metadata jsonb DEFAULT '{}'::jsonb,
+    first_appearance_time double precision,
+    last_appearance_time double precision,
+    total_appearance_duration double precision DEFAULT 0.0,
+    appearance_count integer DEFAULT 0,
+    created_at timestamp with time zone DEFAULT CURRENT_TIMESTAMP,
+    updated_at timestamp with time zone DEFAULT CURRENT_TIMESTAMP,
+    is_confirmed boolean DEFAULT false,
+    aliases jsonb DEFAULT '[]'::jsonb,
+    original_name character varying(255),
+    character_name character varying(255),
+    age integer,
+    gender character varying(20),
+    CONSTRAINT person_identities_confidence_check CHECK (((confidence >= (0.0)::double precision) AND (confidence <= (1.0)::double precision))),
+    CONSTRAINT valid_time_range CHECK (((first_appearance_time IS NULL) OR (last_appearance_time IS NULL) OR (last_appearance_time >= first_appearance_time)))
+);
+
+
+ALTER TABLE public.person_identities OWNER TO accusys;
+
+--
+-- Name: TABLE person_identities; Type: COMMENT; Schema: public; Owner: accusys
+--
+
+COMMENT ON TABLE public.person_identities IS 'Stores person identity associations linking face and speaker identities';
+
+
+--
+-- Name: person_identities_id_seq; Type: SEQUENCE; Schema: public; Owner: accusys
+-- Integer sequence (start 1, increment 1, cache 1); owned by person_identities.id via the OWNED BY statement below.
+
+CREATE SEQUENCE public.person_identities_id_seq
+    AS integer
+    START WITH 1
+    INCREMENT BY 1
+    NO MINVALUE
+    NO MAXVALUE
+    CACHE 1;
+
+
+ALTER SEQUENCE public.person_identities_id_seq OWNER TO accusys;
+
+--
+-- Name: person_identities_id_seq; Type: SEQUENCE OWNED BY; Schema: public; Owner: accusys
+--
+
+ALTER SEQUENCE public.person_identities_id_seq OWNED BY public.person_identities.id;
+
+
+--
+-- Name: processor_results; Type: TABLE; Schema: public; Owner: accusys
+-- processor and status are CHECK-restricted (status defaults to 'pending'); duration_secs is a STORED generated column: epoch seconds of (completed_at - started_at), NULL unless both are set. job_id/video_id have no foreign key in this statement.
+
+CREATE TABLE public.processor_results (
+    id integer NOT NULL,
+    job_id integer,
+    video_id bigint,
+    processor character varying(20) NOT NULL,
+    status character varying(20) DEFAULT 'pending'::character varying NOT NULL,
+    output_path text,
+    started_at timestamp without time zone,
+    completed_at timestamp without time zone,
+    error_message text,
+    progress_total integer DEFAULT 0,
+    progress_current integer DEFAULT 0,
+    last_checkpoint jsonb,
+    created_at timestamp without time zone DEFAULT CURRENT_TIMESTAMP,
+    updated_at timestamp without time zone DEFAULT CURRENT_TIMESTAMP,
+    output_data jsonb,
+    duration_secs double precision GENERATED ALWAYS AS (
+CASE
+    WHEN ((completed_at IS NOT NULL) AND (started_at IS NOT NULL)) THEN EXTRACT(epoch FROM (completed_at - started_at))
+    ELSE NULL::numeric
+END) STORED,
+    processor_version character varying(50),
+    model_name character varying(100),
+    model_version character varying(50),
+    contract_version character varying(20),
+    CONSTRAINT chk_processor_results_processor CHECK (((processor)::text = ANY ((ARRAY['asr'::character varying, 'cut'::character varying, 'yolo'::character varying, 'ocr'::character varying, 'face'::character varying, 'pose'::character varying, 'asrx'::character varying])::text[]))),
+    CONSTRAINT chk_processor_results_status CHECK (((status)::text = ANY ((ARRAY['pending'::character varying, 'running'::character varying, 'completed'::character varying, 'failed'::character varying, 'skipped'::character varying])::text[])))
+);
+
+
+ALTER TABLE public.processor_results OWNER TO accusys;
+
+--
+-- Name: TABLE processor_results; Type: COMMENT; Schema: public; Owner: accusys
+--
+
+COMMENT ON TABLE public.processor_results IS 'Tracks individual processor execution status';
+
+
+--
+-- Name: COLUMN processor_results.status; Type: COMMENT; Schema: public; Owner: accusys
+-- The listed values match the chk_processor_results_status CHECK on the table.
+
+COMMENT ON COLUMN public.processor_results.status IS 'pending, running, completed, failed, skipped';
+
+
+--
+-- Name: COLUMN processor_results.output_data; Type: COMMENT; Schema: public; Owner: accusys
+--
+
+COMMENT ON COLUMN public.processor_results.output_data IS 'JSON output from processor execution';
+
+
+--
+-- Name: COLUMN processor_results.duration_secs; Type: COMMENT; Schema: public; Owner: accusys
+--
+
+COMMENT ON COLUMN public.processor_results.duration_secs IS 'Computed duration in seconds (completed - started) as double precision';
+
+
+--
+-- Name: processor_results_id_seq; Type: SEQUENCE; Schema: public; Owner: accusys
+-- Integer sequence (start 1, increment 1, cache 1); owned by processor_results.id via the OWNED BY statement below.
+
+CREATE SEQUENCE public.processor_results_id_seq
+    AS integer
+    START WITH 1
+    INCREMENT BY 1
+    NO MINVALUE
+    NO MAXVALUE
+    CACHE 1;
+
+
+ALTER SEQUENCE public.processor_results_id_seq OWNER TO accusys;
+
+--
+-- Name: processor_results_id_seq; Type: SEQUENCE OWNED BY; Schema: public; Owner: accusys
+--
+
+ALTER SEQUENCE public.processor_results_id_seq OWNED BY public.processor_results.id;
+
+
+--
+-- Name: python_script_tracking; Type: TABLE; Schema: public; Owner: accusys
+-- script_path is required; is_compliant defaults to false; last_run_at, exit_code and error_output are nullable without defaults; checked_at defaults to now().
+
+CREATE TABLE public.python_script_tracking (
+    id integer NOT NULL,
+    script_path text NOT NULL,
+    shebang_version character varying(20),
+    actual_version character varying(20),
+    is_compliant boolean DEFAULT false,
+    last_run_at timestamp without time zone,
+    exit_code integer,
+    error_output text,
+    checked_at timestamp without time zone DEFAULT now()
+);
+
+
+ALTER TABLE public.python_script_tracking OWNER TO accusys;
+
+--
+-- Name: python_script_tracking_id_seq; Type: SEQUENCE; Schema: public; Owner: accusys
+-- Integer sequence (start 1, increment 1, cache 1); owned by python_script_tracking.id via the OWNED BY statement below.
+
+CREATE SEQUENCE public.python_script_tracking_id_seq
+    AS integer
+    START WITH 1
+    INCREMENT BY 1
+    NO MINVALUE
+    NO MAXVALUE
+    CACHE 1;
+
+
+ALTER SEQUENCE public.python_script_tracking_id_seq OWNER TO accusys;
+
+--
+-- Name: python_script_tracking_id_seq; Type: SEQUENCE OWNED BY; Schema: public; Owner: accusys
+--
+
+ALTER SEQUENCE public.python_script_tracking_id_seq OWNED BY public.python_script_tracking.id;
+
+
+--
+-- Name: python_version_baseline; Type: TABLE; Schema: public; Owner: accusys
+-- runtime_name and required_version are required; is_compliant has no default here (python_script_tracking.is_compliant defaults to false); checked_at defaults to now().
+
+CREATE TABLE public.python_version_baseline (
+    id integer NOT NULL,
+    runtime_name character varying(50) NOT NULL,
+    required_version character varying(20) NOT NULL,
+    current_version character varying(20),
+    interpreter_path character varying(500),
+    is_compliant boolean,
+    checked_at timestamp without time zone DEFAULT now()
+);
+
+
+ALTER TABLE public.python_version_baseline OWNER TO accusys;
+
+--
+-- Name: python_version_baseline_id_seq; Type: SEQUENCE; Schema: public; Owner: accusys
+-- Integer sequence (start 1, increment 1, cache 1); owned by python_version_baseline.id via the OWNED BY statement below.
+
+CREATE SEQUENCE public.python_version_baseline_id_seq
+    AS integer
+    START WITH 1
+    INCREMENT BY 1
+    NO MINVALUE
+    NO MAXVALUE
+    CACHE 1;
+
+
+ALTER SEQUENCE public.python_version_baseline_id_seq OWNER TO accusys;
+
+--
+-- Name: python_version_baseline_id_seq; Type: SEQUENCE OWNED BY; Schema: public; Owner: accusys
+--
+
+ALTER SEQUENCE public.python_version_baseline_id_seq OWNED BY public.python_version_baseline.id;
+
+
+--
+-- Name: storage_access_logs; Type: TABLE; Schema: public; Owner: accusys
+-- access_type must be read, write, delete, download or move (NULL also passes the CHECK); access_method is unconstrained; access_time defaults to now().
+
+CREATE TABLE public.storage_access_logs (
+    id integer NOT NULL,
+    user_cluster character varying(50),
+    owner_id character varying(100),
+    file_path text,
+    access_type character varying(20),
+    access_time timestamp without time zone DEFAULT now(),
+    client_ip character varying(45),
+    access_method character varying(20),
+    CONSTRAINT storage_access_logs_access_type_check CHECK (((access_type)::text = ANY ((ARRAY['read'::character varying, 'write'::character varying, 'delete'::character varying, 'download'::character varying, 'move'::character varying])::text[])))
+);
+
+
+ALTER TABLE public.storage_access_logs OWNER TO accusys;
+
+--
+-- Name: storage_access_logs_id_seq; Type: SEQUENCE; Schema: public; Owner: accusys
+-- Integer sequence (start 1, increment 1, cache 1); owned by storage_access_logs.id via the OWNED BY statement below.
+
+CREATE SEQUENCE public.storage_access_logs_id_seq
+    AS integer
+    START WITH 1
+    INCREMENT BY 1
+    NO MINVALUE
+    NO MAXVALUE
+    CACHE 1;
+
+
+ALTER SEQUENCE public.storage_access_logs_id_seq OWNER TO accusys;
+
+--
+-- Name: storage_access_logs_id_seq; Type: SEQUENCE OWNED BY; Schema: public; Owner: accusys
+--
+
+ALTER SEQUENCE public.storage_access_logs_id_seq OWNED BY public.storage_access_logs.id;
+
+
+--
+-- Name: storage_usage_stats; Type: TABLE; Schema: public; Owner: accusys
+-- Holds file_count and total_size_bytes alongside user_cluster and storage_tier; record_time defaults to now(). Only id is NOT NULL.
+
+CREATE TABLE public.storage_usage_stats (
+    id integer NOT NULL,
+    user_cluster character varying(50),
+    storage_tier character varying(20),
+    file_count bigint,
+    total_size_bytes bigint,
+    record_time timestamp without time zone DEFAULT now()
+);
+
+
+ALTER TABLE public.storage_usage_stats OWNER TO accusys;
+
+--
+-- Name: storage_usage_stats_id_seq; Type: SEQUENCE; Schema: public; Owner: accusys
+-- Integer sequence (start 1, increment 1, cache 1); owned by storage_usage_stats.id via the OWNED BY statement below.
+
+CREATE SEQUENCE public.storage_usage_stats_id_seq
+    AS integer
+    START WITH 1
+    INCREMENT BY 1
+    NO MINVALUE
+    NO MAXVALUE
+    CACHE 1;
+
+
+ALTER SEQUENCE public.storage_usage_stats_id_seq OWNER TO accusys;
+
+--
+-- Name: storage_usage_stats_id_seq; Type: SEQUENCE OWNED BY; Schema: public; Owner: accusys
+--
+
+ALTER SEQUENCE public.storage_usage_stats_id_seq OWNED BY public.storage_usage_stats.id;
+
+
+--
+-- Name: v_idle_workflows; Type: VIEW; Schema: public; Owner: accusys
+-- Lists monitor_workflows rows with is_active = true and idle_days > 30, largest idle_days first; rows whose idle_days is NULL never match the comparison.
+
+CREATE VIEW public.v_idle_workflows AS
+ SELECT workflow_name,
+    idle_days,
+    suggestion,
+    last_executed_at
+   FROM public.monitor_workflows
+  WHERE ((idle_days > 30) AND (is_active = true))
+  ORDER BY idle_days DESC;
+
+
+ALTER VIEW public.v_idle_workflows OWNER TO accusys;
+
+--
+-- Name: v_recent_anomalies; Type: VIEW; Schema: public; Owner: accusys
+-- Lists monitor_anomalies rows whose detected_at falls within the 24 hours before now(), newest first.
+
+CREATE VIEW public.v_recent_anomalies AS
+ SELECT anomaly_type,
+    severity,
+    username,
+    source_ip,
+    description,
+    detected_at
+   FROM public.monitor_anomalies
+  WHERE (detected_at > (now() - '24:00:00'::interval))
+  ORDER BY detected_at DESC;
+
+
+ALTER VIEW public.v_recent_anomalies OWNER TO accusys;
+
+-- Aggregates monitor_services checks from the 24 hours before now(), one output row per (service_name, status) pair.
+-- Name: v_service_health; Type: VIEW; Schema: public; Owner: accusys
+-- NOTE(review): status is part of GROUP BY, so within each row up_count and down_count are either check_count or 0 - confirm this is intended.
+
+CREATE VIEW public.v_service_health AS
+ SELECT service_name,
+    status,
+    count(*) AS check_count,
+    count(*) FILTER (WHERE ((status)::text = 'up'::text)) AS up_count,
+    count(*) FILTER (WHERE ((status)::text = 'down'::text)) AS down_count,
+    avg(response_time_ms) AS avg_response_time,
+    max(checked_at) AS last_check
+   FROM public.monitor_services
+  WHERE (checked_at > (now() - '24:00:00'::interval))
+  GROUP BY service_name, status;
+
+
+ALTER VIEW public.v_service_health OWNER TO accusys;
+
+--
+-- Name: v_storage_overview; Type: VIEW; Schema: public; Owner: accusys
+-- Counts rows and sums file_size per (user_cluster, storage_tier) over file_registry rows whose status is 'active'.
+
+CREATE VIEW public.v_storage_overview AS
+ SELECT user_cluster,
+    storage_tier,
+    count(*) AS file_count,
+    sum(file_size) AS total_size
+   FROM public.file_registry
+  WHERE ((status)::text = 'active'::text)
+  GROUP BY user_cluster, storage_tier;
+
+
+ALTER VIEW public.v_storage_overview OWNER TO accusys;
+
+--
+-- Name: video_events; Type: TABLE; Schema: public; Owner: accusys
+-- uuid, start_time, end_time and event_type are required; confidence defaults to 0.0 with no range CHECK in this statement; created_at defaults to now().
+
+CREATE TABLE public.video_events (
+    id integer NOT NULL,
+    uuid text NOT NULL,
+    start_time double precision NOT NULL,
+    end_time double precision NOT NULL,
+    event_type text NOT NULL,
+    confidence double precision DEFAULT 0.0,
+    metadata jsonb,
+    created_at timestamp with time zone DEFAULT now()
+);
+
+
+ALTER TABLE public.video_events OWNER TO accusys;
+
+--
+-- Name: video_events_id_seq; Type: SEQUENCE; Schema: public; Owner: accusys
+-- Integer sequence (start 1, increment 1, cache 1); owned by video_events.id via the OWNED BY statement below.
+
+CREATE SEQUENCE public.video_events_id_seq
+    AS integer
+    START WITH 1
+    INCREMENT BY 1
+    NO MINVALUE
+    NO MAXVALUE
+    CACHE 1;
+
+
+ALTER SEQUENCE public.video_events_id_seq OWNER TO accusys;
+
+--
+-- Name: video_events_id_seq; Type: SEQUENCE OWNED BY; Schema: public; Owner: accusys
+--
+
+ALTER SEQUENCE public.video_events_id_seq OWNED BY public.video_events.id;
+
+
+--
+-- Name: video_identities; Type: TABLE; Schema: public; Owner: accusys
+-- uuid and name are required; metadata defaults to '{}'; created_at defaults to now().
+
+CREATE TABLE public.video_identities (
+    id integer NOT NULL,
+    uuid text NOT NULL,
+    name text NOT NULL,
+    metadata jsonb DEFAULT '{}'::jsonb,
+    created_at timestamp with time zone DEFAULT now()
+);
+
+
+ALTER TABLE public.video_identities OWNER TO accusys;
+
+--
+-- Name: video_identities_id_seq; Type: SEQUENCE; Schema: public; Owner: accusys
+-- Integer sequence (start 1, increment 1, cache 1); owned by video_identities.id via the OWNED BY statement below.
+
+CREATE SEQUENCE public.video_identities_id_seq
+    AS integer
+    START WITH 1
+    INCREMENT BY 1
+    NO MINVALUE
+    NO MAXVALUE
+    CACHE 1;
+
+
+ALTER SEQUENCE public.video_identities_id_seq OWNER TO accusys;
+
+--
+-- Name: video_identities_id_seq; Type: SEQUENCE OWNED BY; Schema: public; Owner: accusys
+--
+
+ALTER SEQUENCE public.video_identities_id_seq OWNED BY public.video_identities.id;
+
+
+-- file_uuid (at most 32 characters), file_path and file_name are required; status defaults to 'pending' and is CHECK-limited to pending/processing/completed/failed; the boolean flag columns default to false.
+-- Name: videos; Type: TABLE; Schema: public; Owner: accusys
+-- NOTE(review): registered_at (without time zone) and registration_time (with time zone) look redundant - confirm which one callers use.
+
+CREATE TABLE public.videos (
+    id integer NOT NULL,
+    file_uuid character varying(32) CONSTRAINT videos_uuid_not_null NOT NULL,
+    file_path text NOT NULL,
+    file_name text NOT NULL,
+    duration double precision,
+    width integer,
+    height integer,
+    fps double precision,
+    probe_json jsonb,
+    created_at timestamp with time zone DEFAULT CURRENT_TIMESTAMP,
+    updated_at timestamp with time zone DEFAULT CURRENT_TIMESTAMP,
+    fs_video boolean DEFAULT false,
+    fs_json boolean DEFAULT false,
+    psql_chunk boolean DEFAULT false,
+    pobject_chunk boolean DEFAULT false,
+    mobject_chunk boolean DEFAULT false,
+    pvector_chunk boolean DEFAULT false,
+    qvector_chunk boolean DEFAULT false,
+    status character varying(20) DEFAULT 'pending'::character varying,
+    user_id bigint,
+    job_id integer,
+    registered_at timestamp without time zone,
+    registration_time timestamp with time zone,
+    total_frames bigint DEFAULT 0,
+    processing_status jsonb DEFAULT '{}'::jsonb,
+    file_type character varying(20),
+    birth_registration jsonb DEFAULT '{}'::jsonb,
+    CONSTRAINT chk_videos_status CHECK (((status)::text = ANY ((ARRAY['pending'::character varying, 'processing'::character varying, 'completed'::character varying, 'failed'::character varying])::text[])))
+);
+
+
+ALTER TABLE public.videos OWNER TO accusys;
+
+--
+-- Name: COLUMN videos.status; Type: COMMENT; Schema: public; Owner: accusys
+-- The listed values match the chk_videos_status CHECK on the table.
+
+COMMENT ON COLUMN public.videos.status IS 'Video processing status: pending, processing, completed, failed';
+
+
+--
+-- Name: COLUMN videos.user_id; Type: COMMENT; Schema: public; Owner: accusys
+--
+
+COMMENT ON COLUMN public.videos.user_id IS 'WordPress user ID (for user association tracking)';
+
+
+--
+-- Name: COLUMN videos.job_id; Type: COMMENT; Schema: public; Owner: accusys
+-- The CREATE TABLE statement declares no foreign key for job_id; the link described here is by convention only.
+
+COMMENT ON COLUMN public.videos.job_id IS 'Associated monitor_jobs ID';
+
+
+--
+-- Name: COLUMN videos.processing_status; Type: COMMENT; Schema: public; Owner: accusys
+--
+
+COMMENT ON COLUMN public.videos.processing_status IS 'Processing progress JSON: {"active_processors": [...], "progress": {...}}';
+
+
+--
+-- Name: videos_id_seq; Type: SEQUENCE; Schema: public; Owner: accusys
+-- Integer sequence (start 1, increment 1, cache 1); owned by videos.id via the OWNED BY statement below.
+
+CREATE SEQUENCE public.videos_id_seq
+    AS integer
+    START WITH 1
+    INCREMENT BY 1
+    NO MINVALUE
+    NO MAXVALUE
+    CACHE 1;
+
+
+ALTER SEQUENCE public.videos_id_seq OWNER TO accusys;
+
+--
+-- Name: videos_id_seq; Type: SEQUENCE OWNED BY; Schema: public; Owner: accusys
+--
+
+ALTER SEQUENCE public.videos_id_seq OWNED BY public.videos.id;
+
+
+--
+-- Name: api_key_anomalies id; Type: DEFAULT; Schema: public; Owner: accusys
+-- Makes id default to the next value of api_key_anomalies_id_seq when an INSERT omits it.
+
+ALTER TABLE ONLY public.api_key_anomalies ALTER COLUMN id SET DEFAULT nextval('public.api_key_anomalies_id_seq'::regclass);
+
+
+--
+-- Name: api_key_audit_log id; Type: DEFAULT; Schema: public; Owner: accusys
+-- Makes id default to the next value of api_key_audit_log_id_seq when an INSERT omits it.
+
+ALTER TABLE ONLY public.api_key_audit_log ALTER COLUMN id SET DEFAULT nextval('public.api_key_audit_log_id_seq'::regclass);
+
+
+--
+-- Name: api_keys id; Type: DEFAULT; Schema: public; Owner: accusys
+-- Makes id default to the next value of api_keys_id_seq when an INSERT omits it.
+
+ALTER TABLE ONLY public.api_keys ALTER COLUMN id SET DEFAULT nextval('public.api_keys_id_seq'::regclass);
+
+
+--
+-- Name: backup_history id; Type: DEFAULT; Schema: public; Owner: accusys
+-- Makes id default to the next value of backup_history_id_seq when an INSERT omits it.
+
+ALTER TABLE ONLY public.backup_history ALTER COLUMN id SET DEFAULT nextval('public.backup_history_id_seq'::regclass);
+
+
+--
+-- Name: backup_registry id; Type: DEFAULT; Schema: public; Owner: accusys
+-- Makes id default to the next value of backup_registry_id_seq when an INSERT omits it.
+
+ALTER TABLE ONLY public.backup_registry ALTER COLUMN id SET DEFAULT nextval('public.backup_registry_id_seq'::regclass);
+
+
+--
+-- Name: backup_storage_stats id; Type: DEFAULT; Schema: public; Owner: accusys
+-- Makes id default to the next value of backup_storage_stats_id_seq when an INSERT omits it.
+
+ALTER TABLE ONLY public.backup_storage_stats ALTER COLUMN id SET DEFAULT nextval('public.backup_storage_stats_id_seq'::regclass);
+
+
+--
+-- Name: castings id; Type: DEFAULT; Schema: public; Owner: accusys
+-- Makes id default to the next value of castings_id_seq when an INSERT omits it.
+
+ALTER TABLE ONLY public.castings ALTER COLUMN id SET DEFAULT nextval('public.castings_id_seq'::regclass);
+
+
+--
+-- Name: characters id; Type: DEFAULT; Schema: public; Owner: accusys
+-- Makes id default to the next value of characters_id_seq when an INSERT omits it.
+
+ALTER TABLE ONLY public.characters ALTER COLUMN id SET DEFAULT nextval('public.characters_id_seq'::regclass);
+
+
+--
+-- Name: child_chunks id; Type: DEFAULT; Schema: public; Owner: accusys
+-- Makes id default to the next value of child_chunks_id_seq when an INSERT omits it.
+
+ALTER TABLE ONLY public.child_chunks ALTER COLUMN id SET DEFAULT nextval('public.child_chunks_id_seq'::regclass);
+
+
+--
+-- Name: chunk_vectors id; Type: DEFAULT; Schema: public; Owner: accusys
+-- Makes id default to the next value of chunk_vectors_id_seq when an INSERT omits it.
+
+ALTER TABLE ONLY public.chunk_vectors ALTER COLUMN id SET DEFAULT nextval('public.chunk_vectors_id_seq'::regclass);
+
+
+--
+-- Name: chunks id; Type: DEFAULT; Schema: public; Owner: accusys
+-- Makes id default to the next value of chunks_id_seq when an INSERT omits it.
+
+ALTER TABLE ONLY public.chunks ALTER COLUMN id SET DEFAULT nextval('public.chunks_id_seq'::regclass);
+
+
+--
+-- Name: face_clusters id; Type: DEFAULT; Schema: public; Owner: accusys
+--
+
+ALTER TABLE ONLY public.face_clusters ALTER COLUMN id SET DEFAULT nextval('public.face_clusters_id_seq'::regclass);
+
+
+--
+-- Name: face_detections id; Type: DEFAULT; Schema: public; Owner: accusys
+--
+
+ALTER TABLE ONLY public.face_detections ALTER COLUMN id SET DEFAULT nextval('public.face_detections_id_seq'::regclass);
+
+
+--
+-- Name: face_identities id; Type: DEFAULT; Schema: public; Owner: accusys
+--
+
+ALTER TABLE ONLY public.face_identities ALTER COLUMN id SET DEFAULT nextval('public.face_identities_id_seq'::regclass);
+
+
+--
+-- Name: face_recognition_results id; Type: DEFAULT; Schema: public; Owner: accusys
+--
+
+ALTER TABLE ONLY public.face_recognition_results ALTER COLUMN id SET DEFAULT nextval('public.face_recognition_results_id_seq'::regclass);
+
+
+--
+-- Name: file_lifecycle id; Type: DEFAULT; Schema: public; Owner: accusys
+--
+
+ALTER TABLE ONLY public.file_lifecycle ALTER COLUMN id SET DEFAULT nextval('public.file_lifecycle_id_seq'::regclass);
+
+
+--
+-- Name: frames id; Type: DEFAULT; Schema: public; Owner: accusys
+--
+
+ALTER TABLE ONLY public.frames ALTER COLUMN id SET DEFAULT nextval('public.frames_id_seq'::regclass);
+
+
+--
+-- Name: gitea_tokens id; Type: DEFAULT; Schema: public; Owner: accusys
+--
+
+ALTER TABLE ONLY public.gitea_tokens ALTER COLUMN id SET DEFAULT nextval('public.gitea_tokens_id_seq'::regclass);
+
+
+--
+-- Name: identities id; Type: DEFAULT; Schema: public; Owner: accusys
+--
+
+ALTER TABLE ONLY public.identities ALTER COLUMN id SET DEFAULT nextval('public.identities_id_seq'::regclass);
+
+
+--
+-- Name: identity_bindings id; Type: DEFAULT; Schema: public; Owner: accusys
+--
+
+ALTER TABLE ONLY public.identity_bindings ALTER COLUMN id SET DEFAULT nextval('public.identity_bindings_id_seq'::regclass);
+
+
+--
+-- Name: merge_history id; Type: DEFAULT; Schema: public; Owner: accusys
+--
+
+ALTER TABLE ONLY public.merge_history ALTER COLUMN id SET DEFAULT nextval('public.merge_history_id_seq'::regclass);
+
+
+--
+-- Name: monitor_anomalies id; Type: DEFAULT; Schema: public; Owner: accusys
+--
+
+ALTER TABLE ONLY public.monitor_anomalies ALTER COLUMN id SET DEFAULT nextval('public.monitor_anomalies_id_seq'::regclass);
+
+
+--
+-- Name: monitor_config id; Type: DEFAULT; Schema: public; Owner: accusys
+--
+
+ALTER TABLE ONLY public.monitor_config ALTER COLUMN id SET DEFAULT nextval('public.monitor_config_id_seq'::regclass);
+
+
+--
+-- Name: monitor_databases id; Type: DEFAULT; Schema: public; Owner: accusys
+--
+
+ALTER TABLE ONLY public.monitor_databases ALTER COLUMN id SET DEFAULT nextval('public.monitor_databases_id_seq'::regclass);
+
+
+--
+-- Name: monitor_external id; Type: DEFAULT; Schema: public; Owner: accusys
+--
+
+ALTER TABLE ONLY public.monitor_external ALTER COLUMN id SET DEFAULT nextval('public.monitor_external_id_seq'::regclass);
+
+
+--
+-- Name: monitor_jobs id; Type: DEFAULT; Schema: public; Owner: accusys
+--
+
+ALTER TABLE ONLY public.monitor_jobs ALTER COLUMN id SET DEFAULT nextval('public.monitor_jobs_id_seq'::regclass);
+
+
+--
+-- Name: monitor_logins id; Type: DEFAULT; Schema: public; Owner: accusys
+--
+
+ALTER TABLE ONLY public.monitor_logins ALTER COLUMN id SET DEFAULT nextval('public.monitor_logins_id_seq'::regclass);
+
+
+--
+-- Name: monitor_pg_schema_changes id; Type: DEFAULT; Schema: public; Owner: accusys
+--
+
+ALTER TABLE ONLY public.monitor_pg_schema_changes ALTER COLUMN id SET DEFAULT nextval('public.monitor_pg_schema_changes_id_seq'::regclass);
+
+
+--
+-- Name: monitor_pg_tables id; Type: DEFAULT; Schema: public; Owner: accusys
+--
+
+ALTER TABLE ONLY public.monitor_pg_tables ALTER COLUMN id SET DEFAULT nextval('public.monitor_pg_tables_id_seq'::regclass);
+
+
+--
+-- Name: monitor_portal_pages id; Type: DEFAULT; Schema: public; Owner: accusys
+--
+
+ALTER TABLE ONLY public.monitor_portal_pages ALTER COLUMN id SET DEFAULT nextval('public.monitor_portal_pages_id_seq'::regclass);
+
+
+--
+-- Name: monitor_portal_users id; Type: DEFAULT; Schema: public; Owner: accusys
+--
+
+ALTER TABLE ONLY public.monitor_portal_users ALTER COLUMN id SET DEFAULT nextval('public.monitor_portal_users_id_seq'::regclass);
+
+
+--
+-- Name: monitor_qdrant_collections id; Type: DEFAULT; Schema: public; Owner: accusys
+--
+
+ALTER TABLE ONLY public.monitor_qdrant_collections ALTER COLUMN id SET DEFAULT nextval('public.monitor_qdrant_collections_id_seq'::regclass);
+
+
+--
+-- Name: monitor_resource_usage id; Type: DEFAULT; Schema: public; Owner: accusys
+--
+
+ALTER TABLE ONLY public.monitor_resource_usage ALTER COLUMN id SET DEFAULT nextval('public.monitor_resource_usage_id_seq'::regclass);
+
+
+--
+-- Name: monitor_services id; Type: DEFAULT; Schema: public; Owner: accusys
+--
+
+ALTER TABLE ONLY public.monitor_services ALTER COLUMN id SET DEFAULT nextval('public.monitor_services_id_seq'::regclass);
+
+
+--
+-- Name: monitor_sessions id; Type: DEFAULT; Schema: public; Owner: accusys
+--
+
+ALTER TABLE ONLY public.monitor_sessions ALTER COLUMN id SET DEFAULT nextval('public.monitor_sessions_id_seq'::regclass);
+
+
+--
+-- Name: monitor_sudo_history id; Type: DEFAULT; Schema: public; Owner: accusys
+--
+
+ALTER TABLE ONLY public.monitor_sudo_history ALTER COLUMN id SET DEFAULT nextval('public.monitor_sudo_history_id_seq'::regclass);
+
+
+--
+-- Name: monitor_workflows id; Type: DEFAULT; Schema: public; Owner: accusys
+--
+
+ALTER TABLE ONLY public.monitor_workflows ALTER COLUMN id SET DEFAULT nextval('public.monitor_workflows_id_seq'::regclass);
+
+
+--
+-- Name: n8n_api_keys id; Type: DEFAULT; Schema: public; Owner: accusys
+--
+
+ALTER TABLE ONLY public.n8n_api_keys ALTER COLUMN id SET DEFAULT nextval('public.n8n_api_keys_id_seq'::regclass);
+
+
+--
+-- Name: node_process_tracking id; Type: DEFAULT; Schema: public; Owner: accusys
+--
+
+ALTER TABLE ONLY public.node_process_tracking ALTER COLUMN id SET DEFAULT nextval('public.node_process_tracking_id_seq'::regclass);
+
+
+--
+-- Name: node_version_baseline id; Type: DEFAULT; Schema: public; Owner: accusys
+--
+
+ALTER TABLE ONLY public.node_version_baseline ALTER COLUMN id SET DEFAULT nextval('public.node_version_baseline_id_seq'::regclass);
+
+
+--
+-- Name: parent_chunks id; Type: DEFAULT; Schema: public; Owner: accusys
+--
+
+ALTER TABLE ONLY public.parent_chunks ALTER COLUMN id SET DEFAULT nextval('public.parent_chunks_id_seq'::regclass);
+
+
+--
+-- Name: parent_chunks_poc id; Type: DEFAULT; Schema: public; Owner: accusys
+--
+
+ALTER TABLE ONLY public.parent_chunks_poc ALTER COLUMN id SET DEFAULT nextval('public.parent_chunks_poc_id_seq'::regclass);
+
+
+--
+-- Name: person_appearances id; Type: DEFAULT; Schema: public; Owner: accusys
+--
+
+ALTER TABLE ONLY public.person_appearances ALTER COLUMN id SET DEFAULT nextval('public.person_appearances_id_seq'::regclass);
+
+
+--
+-- Name: person_identities id; Type: DEFAULT; Schema: public; Owner: accusys
+--
+
+ALTER TABLE ONLY public.person_identities ALTER COLUMN id SET DEFAULT nextval('public.person_identities_id_seq'::regclass);
+
+
+--
+-- Name: processor_results id; Type: DEFAULT; Schema: public; Owner: accusys
+--
+
+ALTER TABLE ONLY public.processor_results ALTER COLUMN id SET DEFAULT nextval('public.processor_results_id_seq'::regclass);
+
+
+--
+-- Name: python_script_tracking id; Type: DEFAULT; Schema: public; Owner: accusys
+--
+
+ALTER TABLE ONLY public.python_script_tracking ALTER COLUMN id SET DEFAULT nextval('public.python_script_tracking_id_seq'::regclass);
+
+
+--
+-- Name: python_version_baseline id; Type: DEFAULT; Schema: public; Owner: accusys
+--
+
+ALTER TABLE ONLY public.python_version_baseline ALTER COLUMN id SET DEFAULT nextval('public.python_version_baseline_id_seq'::regclass);
+
+
+--
+-- Name: storage_access_logs id; Type: DEFAULT; Schema: public; Owner: accusys
+--
+
+ALTER TABLE ONLY public.storage_access_logs ALTER COLUMN id SET DEFAULT nextval('public.storage_access_logs_id_seq'::regclass);
+
+
+--
+-- Name: storage_usage_stats id; Type: DEFAULT; Schema: public; Owner: accusys
+--
+
+ALTER TABLE ONLY public.storage_usage_stats ALTER COLUMN id SET DEFAULT nextval('public.storage_usage_stats_id_seq'::regclass);
+
+
+--
+-- Name: video_events id; Type: DEFAULT; Schema: public; Owner: accusys
+--
+
+ALTER TABLE ONLY public.video_events ALTER COLUMN id SET DEFAULT nextval('public.video_events_id_seq'::regclass);
+
+
+--
+-- Name: video_identities id; Type: DEFAULT; Schema: public; Owner: accusys
+--
+
+ALTER TABLE ONLY public.video_identities ALTER COLUMN id SET DEFAULT nextval('public.video_identities_id_seq'::regclass);
+
+
+--
+-- Name: videos id; Type: DEFAULT; Schema: public; Owner: accusys
+--
+
+ALTER TABLE ONLY public.videos ALTER COLUMN id SET DEFAULT nextval('public.videos_id_seq'::regclass);
+
+
+--
+-- Name: api_key_anomalies api_key_anomalies_pkey; Type: CONSTRAINT; Schema: public; Owner: accusys
+--
+
+ALTER TABLE ONLY public.api_key_anomalies
+    ADD CONSTRAINT api_key_anomalies_pkey PRIMARY KEY (id);
+
+
+--
+-- Name: api_key_audit_log api_key_audit_log_pkey; Type: CONSTRAINT; Schema: public; Owner: accusys
+--
+
+ALTER TABLE ONLY public.api_key_audit_log
+    ADD CONSTRAINT api_key_audit_log_pkey PRIMARY KEY (id);
+
+
+--
+-- Name: api_keys api_keys_key_id_key; Type: CONSTRAINT; Schema: public; Owner: accusys
+--
+
+ALTER TABLE ONLY public.api_keys
+    ADD CONSTRAINT api_keys_key_id_key UNIQUE (key_id);
+
+
+--
+-- Name: api_keys api_keys_pkey; Type: CONSTRAINT; Schema: public; Owner: accusys
+--
+
+ALTER TABLE ONLY public.api_keys
+    ADD CONSTRAINT api_keys_pkey PRIMARY KEY (id);
+
+
+--
+-- Name: backup_history backup_history_pkey; Type: CONSTRAINT; Schema: public; Owner: accusys
+--
+
+ALTER TABLE ONLY public.backup_history
+    ADD CONSTRAINT backup_history_pkey PRIMARY KEY (id);
+
+
+--
+-- Name: backup_registry backup_registry_pkey; Type: CONSTRAINT; Schema: public; Owner: accusys
+--
+
+ALTER TABLE ONLY public.backup_registry
+    ADD CONSTRAINT backup_registry_pkey PRIMARY KEY (id);
+
+
+--
+-- Name: backup_storage_stats backup_storage_stats_pkey; Type: CONSTRAINT; Schema: public; Owner: accusys
+--
+
+ALTER TABLE ONLY public.backup_storage_stats
+    ADD CONSTRAINT backup_storage_stats_pkey PRIMARY KEY (id);
+
+
+--
+-- Name: castings castings_character_id_talent_id_track_type_key; Type: CONSTRAINT; Schema: public; Owner: accusys
+--
+
+ALTER TABLE ONLY public.castings
+    ADD CONSTRAINT castings_character_id_talent_id_track_type_key UNIQUE (character_id, talent_id, track_type);
+
+
+--
+-- Name: castings castings_pkey; Type: CONSTRAINT; Schema: public; Owner: accusys
+--
+
+ALTER TABLE ONLY public.castings
+    ADD CONSTRAINT castings_pkey PRIMARY KEY (id);
+
+
+--
+-- Name: characters characters_pkey; Type: CONSTRAINT; Schema: public; Owner: accusys
+--
+
+ALTER TABLE ONLY public.characters
+    ADD CONSTRAINT characters_pkey PRIMARY KEY (id);
+
+
+--
+-- Name: characters characters_video_uuid_name_language_track_key; Type: CONSTRAINT; Schema: public; Owner: accusys
+--
+
+ALTER TABLE ONLY public.characters
+    ADD CONSTRAINT characters_video_uuid_name_language_track_key UNIQUE (video_uuid, name, language_track);
+
+
+--
+-- Name: child_chunks child_chunks_pkey; Type: CONSTRAINT; Schema: public; Owner: accusys
+--
+
+ALTER TABLE ONLY public.child_chunks
+    ADD CONSTRAINT child_chunks_pkey PRIMARY KEY (id);
+
+
+--
+-- Name: chunk_vectors chunk_vectors_chunk_id_uuid_key; Type: CONSTRAINT; Schema: public; Owner: accusys
+--
+
+ALTER TABLE ONLY public.chunk_vectors
+    ADD CONSTRAINT chunk_vectors_chunk_id_uuid_key UNIQUE (chunk_id, uuid);
+
+
+--
+-- Name: chunk_vectors chunk_vectors_pkey; Type: CONSTRAINT; Schema: public; Owner: accusys
+--
+
+ALTER TABLE ONLY public.chunk_vectors
+    ADD CONSTRAINT chunk_vectors_pkey PRIMARY KEY (id);
+
+
+--
+-- Name: chunks chunks_pkey; Type: CONSTRAINT; Schema: public; Owner: accusys
+--
+
+ALTER TABLE ONLY public.chunks
+    ADD CONSTRAINT chunks_pkey PRIMARY KEY (id);
+
+
+--
+-- Name: chunks chunks_uuid_chunk_id_key; Type: CONSTRAINT; Schema: public; Owner: accusys
+--
+
+ALTER TABLE ONLY public.chunks
+    ADD CONSTRAINT chunks_uuid_chunk_id_key UNIQUE (uuid, chunk_id);
+
+
+--
+-- Name: face_clusters face_clusters_cluster_id_key; Type: CONSTRAINT; Schema: public; Owner: accusys
+--
+
+ALTER TABLE ONLY public.face_clusters
+    ADD CONSTRAINT face_clusters_cluster_id_key UNIQUE (cluster_id);
+
+
+--
+-- Name: face_clusters face_clusters_pkey; Type: CONSTRAINT; Schema: public; Owner: accusys
+--
+
+ALTER TABLE ONLY public.face_clusters
+    ADD CONSTRAINT face_clusters_pkey PRIMARY KEY (id);
+
+
+--
+-- Name: face_detections face_detections_pkey; Type: CONSTRAINT; Schema: public; Owner: accusys
+--
+
+ALTER TABLE ONLY public.face_detections
+    ADD CONSTRAINT face_detections_pkey PRIMARY KEY (id);
+
+
+--
+-- Name: face_identities face_identities_face_id_key; Type: CONSTRAINT; Schema: public; Owner: accusys
+--
+
+ALTER TABLE ONLY public.face_identities
+    ADD CONSTRAINT face_identities_face_id_key UNIQUE (face_id);
+
+
+--
+-- Name: face_identities face_identities_pkey; Type: CONSTRAINT; Schema: public; Owner: accusys
+--
+
+ALTER TABLE ONLY public.face_identities
+    ADD CONSTRAINT face_identities_pkey PRIMARY KEY (id);
+
+
+--
+-- Name: face_recognition_results face_recognition_results_pkey; Type: CONSTRAINT; Schema: public; Owner: accusys
+--
+
+ALTER TABLE ONLY public.face_recognition_results
+    ADD CONSTRAINT face_recognition_results_pkey PRIMARY KEY (id);
+
+
+--
+-- Name: face_recognition_results face_recognition_results_video_uuid_key; Type: CONSTRAINT; Schema: public; Owner: accusys
+--
+
+ALTER TABLE ONLY public.face_recognition_results
+    ADD CONSTRAINT face_recognition_results_video_uuid_key UNIQUE (video_uuid);
+
+
+--
+-- Name: file_lifecycle file_lifecycle_pkey; Type: CONSTRAINT; Schema: public; Owner: accusys
+--
+
+ALTER TABLE ONLY public.file_lifecycle
+    ADD CONSTRAINT file_lifecycle_pkey PRIMARY KEY (id);
+
+
+--
+-- Name: file_registry file_registry_file_path_hash_key; Type: CONSTRAINT; Schema: public; Owner: accusys
+--
+
+ALTER TABLE ONLY public.file_registry
+    ADD CONSTRAINT file_registry_file_path_hash_key UNIQUE (file_path_hash);
+
+
+--
+-- Name: file_registry file_registry_pkey; Type: CONSTRAINT; Schema: public; Owner: accusys
+--
+
+ALTER TABLE ONLY public.file_registry
+    ADD CONSTRAINT file_registry_pkey PRIMARY KEY (file_uuid);
+
+
+--
+-- Name: frames frames_file_id_frame_number_key; Type: CONSTRAINT; Schema: public; Owner: accusys
+--
+
+ALTER TABLE ONLY public.frames
+    ADD CONSTRAINT frames_file_id_frame_number_key UNIQUE (file_id, frame_number);
+
+
+--
+-- Name: frames frames_pkey; Type: CONSTRAINT; Schema: public; Owner: accusys
+--
+
+ALTER TABLE ONLY public.frames
+    ADD CONSTRAINT frames_pkey PRIMARY KEY (id);
+
+
+--
+-- Name: gitea_tokens gitea_tokens_gitea_user_token_name_key; Type: CONSTRAINT; Schema: public; Owner: accusys
+--
+
+ALTER TABLE ONLY public.gitea_tokens
+    ADD CONSTRAINT gitea_tokens_gitea_user_token_name_key UNIQUE (gitea_user, token_name);
+
+
+--
+-- Name: gitea_tokens gitea_tokens_pkey; Type: CONSTRAINT; Schema: public; Owner: accusys
+--
+
+ALTER TABLE ONLY public.gitea_tokens
+    ADD CONSTRAINT gitea_tokens_pkey PRIMARY KEY (id);
+
+
+--
+-- Name: identities identities_name_key; Type: CONSTRAINT; Schema: public; Owner: accusys
+--
+
+ALTER TABLE ONLY public.identities
+    ADD CONSTRAINT identities_name_key UNIQUE (name);
+
+
+--
+-- Name: identities identities_pkey; Type: CONSTRAINT; Schema: public; Owner: accusys
+--
+
+ALTER TABLE ONLY public.identities
+    ADD CONSTRAINT identities_pkey PRIMARY KEY (id);
+
+
+--
+-- Name: identity_bindings identity_bindings_pkey; Type: CONSTRAINT; Schema: public; Owner: accusys
+--
+
+ALTER TABLE ONLY public.identity_bindings
+    ADD CONSTRAINT identity_bindings_pkey PRIMARY KEY (id);
+
+
+--
+-- Name: identity_bindings identity_bindings_uuid_binding_type_binding_value_key; Type: CONSTRAINT; Schema: public; Owner: accusys
+--
+
+ALTER TABLE ONLY public.identity_bindings
+    ADD CONSTRAINT identity_bindings_uuid_binding_type_binding_value_key UNIQUE (uuid, binding_type, binding_value);
+
+
+--
+-- Name: merge_history merge_history_pkey; Type: CONSTRAINT; Schema: public; Owner: accusys
+--
+
+ALTER TABLE ONLY public.merge_history
+    ADD CONSTRAINT merge_history_pkey PRIMARY KEY (id);
+
+
+--
+-- Name: monitor_anomalies monitor_anomalies_pkey; Type: CONSTRAINT; Schema: public; Owner: accusys
+--
+
+ALTER TABLE ONLY public.monitor_anomalies
+    ADD CONSTRAINT monitor_anomalies_pkey PRIMARY KEY (id);
+
+
+--
+-- Name: monitor_config monitor_config_config_key_key; Type: CONSTRAINT; Schema: public; Owner: accusys
+--
+
+ALTER TABLE ONLY public.monitor_config
+    ADD CONSTRAINT monitor_config_config_key_key UNIQUE (config_key);
+
+
+--
+-- Name: monitor_config monitor_config_pkey; Type: CONSTRAINT; Schema: public; Owner: accusys
+--
+
+ALTER TABLE ONLY public.monitor_config
+    ADD CONSTRAINT monitor_config_pkey PRIMARY KEY (id);
+
+
+--
+-- Name: monitor_databases monitor_databases_pkey; Type: CONSTRAINT; Schema: public; Owner: accusys
+--
+
+ALTER TABLE ONLY public.monitor_databases
+    ADD CONSTRAINT monitor_databases_pkey PRIMARY KEY (id);
+
+
+--
+-- Name: monitor_external monitor_external_pkey; Type: CONSTRAINT; Schema: public; Owner: accusys
+--
+
+ALTER TABLE ONLY public.monitor_external
+    ADD CONSTRAINT monitor_external_pkey PRIMARY KEY (id);
+
+
+--
+-- Name: monitor_jobs monitor_jobs_pkey; Type: CONSTRAINT; Schema: public; Owner: accusys
+--
+
+ALTER TABLE ONLY public.monitor_jobs
+    ADD CONSTRAINT monitor_jobs_pkey PRIMARY KEY (id);
+
+
+--
+-- Name: monitor_logins monitor_logins_pkey; Type: CONSTRAINT; Schema: public; Owner: accusys
+--
+
+ALTER TABLE ONLY public.monitor_logins
+    ADD CONSTRAINT monitor_logins_pkey PRIMARY KEY (id);
+
+
+--
+-- Name: monitor_pg_schema_changes monitor_pg_schema_changes_pkey; Type: CONSTRAINT; Schema: public; Owner: accusys
+--
+
+ALTER TABLE ONLY public.monitor_pg_schema_changes
+    ADD CONSTRAINT monitor_pg_schema_changes_pkey PRIMARY KEY (id);
+
+
+--
+-- Name: monitor_pg_tables monitor_pg_tables_pkey; Type: CONSTRAINT; Schema: public; Owner: accusys
+--
+
+ALTER TABLE ONLY public.monitor_pg_tables
+    ADD CONSTRAINT monitor_pg_tables_pkey PRIMARY KEY (id);
+
+
+--
+-- Name: monitor_portal_pages monitor_portal_pages_pkey; Type: CONSTRAINT; Schema: public; Owner: accusys
+--
+
+ALTER TABLE ONLY public.monitor_portal_pages
+    ADD CONSTRAINT monitor_portal_pages_pkey PRIMARY KEY (id);
+
+
+--
+-- Name: monitor_portal_users monitor_portal_users_pkey; Type: CONSTRAINT; Schema: public; Owner: accusys
+--
+
+ALTER TABLE ONLY public.monitor_portal_users
+    ADD CONSTRAINT monitor_portal_users_pkey PRIMARY KEY (id);
+
+
+--
+-- Name: monitor_qdrant_collections monitor_qdrant_collections_pkey; Type: CONSTRAINT; Schema: public; Owner: accusys
+--
+
+ALTER TABLE ONLY public.monitor_qdrant_collections
+    ADD CONSTRAINT monitor_qdrant_collections_pkey PRIMARY KEY (id);
+
+
+--
+-- Name: monitor_resource_usage monitor_resource_usage_pkey; Type: CONSTRAINT; Schema: public; Owner: accusys
+--
+
+ALTER TABLE ONLY public.monitor_resource_usage
+    ADD CONSTRAINT monitor_resource_usage_pkey PRIMARY KEY (id);
+
+
+--
+-- Name: monitor_services monitor_services_pkey; Type: CONSTRAINT; Schema: public; Owner: accusys
+--
+
+ALTER TABLE ONLY public.monitor_services
+    ADD CONSTRAINT monitor_services_pkey PRIMARY KEY (id);
+
+
+--
+-- Name: monitor_sessions monitor_sessions_pkey; Type: CONSTRAINT; Schema: public; Owner: accusys
+--
+
+ALTER TABLE ONLY public.monitor_sessions
+    ADD CONSTRAINT monitor_sessions_pkey PRIMARY KEY (id);
+
+
+--
+-- Name: monitor_sudo_history monitor_sudo_history_pkey; Type: CONSTRAINT; Schema: public; Owner: accusys
+--
+
+ALTER TABLE ONLY public.monitor_sudo_history
+    ADD CONSTRAINT monitor_sudo_history_pkey PRIMARY KEY (id);
+
+
+--
+-- Name: monitor_workflows monitor_workflows_pkey; Type: CONSTRAINT; Schema: public; Owner: accusys
+--
+
+ALTER TABLE ONLY public.monitor_workflows
+    ADD CONSTRAINT monitor_workflows_pkey PRIMARY KEY (id);
+
+
+--
+-- Name: n8n_api_keys n8n_api_keys_n8n_key_id_key; Type: CONSTRAINT; Schema: public; Owner: accusys
+--
+
+ALTER TABLE ONLY public.n8n_api_keys
+    ADD CONSTRAINT n8n_api_keys_n8n_key_id_key UNIQUE (n8n_key_id);
+
+
+--
+-- Name: n8n_api_keys n8n_api_keys_pkey; Type: CONSTRAINT; Schema: public; Owner: accusys
+--
+
+ALTER TABLE ONLY public.n8n_api_keys
+    ADD CONSTRAINT n8n_api_keys_pkey PRIMARY KEY (id);
+
+
+--
+-- Name: node_process_tracking node_process_tracking_pkey; Type: CONSTRAINT; Schema: public; Owner: accusys
+--
+
+ALTER TABLE ONLY public.node_process_tracking
+    ADD CONSTRAINT node_process_tracking_pkey PRIMARY KEY (id);
+
+
+--
+-- Name: node_version_baseline node_version_baseline_pkey; Type: CONSTRAINT; Schema: public; Owner: accusys
+--
+
+ALTER TABLE ONLY public.node_version_baseline
+    ADD CONSTRAINT node_version_baseline_pkey PRIMARY KEY (id);
+
+
+--
+-- Name: parent_chunks parent_chunks_pkey; Type: CONSTRAINT; Schema: public; Owner: accusys
+--
+
+ALTER TABLE ONLY public.parent_chunks
+    ADD CONSTRAINT parent_chunks_pkey PRIMARY KEY (id);
+
+
+--
+-- Name: parent_chunks_poc parent_chunks_poc_pkey; Type: CONSTRAINT; Schema: public; Owner: accusys
+--
+
+ALTER TABLE ONLY public.parent_chunks_poc
+    ADD CONSTRAINT parent_chunks_poc_pkey PRIMARY KEY (id);
+
+
+--
+-- Name: person_appearances person_appearances_pkey; Type: CONSTRAINT; Schema: public; Owner: accusys
+--
+
+ALTER TABLE ONLY public.person_appearances
+    ADD CONSTRAINT person_appearances_pkey PRIMARY KEY (id);
+
+
+--
+-- Name: person_identities person_identities_person_id_key; Type: CONSTRAINT; Schema: public; Owner: accusys
+--
+
+ALTER TABLE ONLY public.person_identities
+    ADD CONSTRAINT person_identities_person_id_key UNIQUE (person_id);
+
+
+--
+-- Name: person_identities person_identities_pkey; Type: CONSTRAINT; Schema: public; Owner: accusys
+--
+
+ALTER TABLE ONLY public.person_identities
+    ADD CONSTRAINT person_identities_pkey PRIMARY KEY (id);
+
+
+--
+-- Name: processor_results processor_results_pkey; Type: CONSTRAINT; Schema: public; Owner: accusys
+--
+
+ALTER TABLE ONLY public.processor_results
+    ADD CONSTRAINT processor_results_pkey PRIMARY KEY (id);
+
+
+--
+-- Name: python_script_tracking python_script_tracking_pkey; Type: CONSTRAINT; Schema: public; Owner: accusys
+--
+
+ALTER TABLE ONLY public.python_script_tracking
+    ADD CONSTRAINT python_script_tracking_pkey PRIMARY KEY (id);
+
+
+--
+-- Name: python_version_baseline python_version_baseline_pkey; Type: CONSTRAINT; Schema: public; Owner: accusys
+--
+
+ALTER TABLE ONLY public.python_version_baseline
+    ADD CONSTRAINT python_version_baseline_pkey PRIMARY KEY (id);
+
+
+--
+-- Name: storage_access_logs storage_access_logs_pkey; Type: CONSTRAINT; Schema: public; Owner: accusys
+--
+
+ALTER TABLE ONLY public.storage_access_logs
+    ADD CONSTRAINT storage_access_logs_pkey PRIMARY KEY (id);
+
+
+--
+-- Name: storage_usage_stats storage_usage_stats_pkey; Type: CONSTRAINT; Schema: public; Owner: accusys
+--
+
+ALTER TABLE ONLY public.storage_usage_stats
+    ADD CONSTRAINT storage_usage_stats_pkey PRIMARY KEY (id);
+
+
+--
+-- Name: face_detections unique_detection_per_frame; Type: CONSTRAINT; Schema: public; Owner: accusys
+--
+
+ALTER TABLE ONLY public.face_detections
+    ADD CONSTRAINT unique_detection_per_frame UNIQUE (video_uuid, frame_number, x, y, width, height);
+
+
+--
+-- Name: processor_results unique_job_processor; Type: CONSTRAINT; Schema: public; Owner: accusys
+--
+
+ALTER TABLE ONLY public.processor_results
+    ADD CONSTRAINT unique_job_processor UNIQUE (job_id, processor);
+
+
+--
+-- Name: person_identities unique_person_identity; Type: CONSTRAINT; Schema: public; Owner: accusys
+-- NOTE(review): column nullability is not visible here. If face_identity_id or speaker_id can be NULL, rows with NULLs are treated as distinct and duplicates are not rejected (TODO confirm, consider NULLS NOT DISTINCT on PG15+).
+
+ALTER TABLE ONLY public.person_identities
+    ADD CONSTRAINT unique_person_identity UNIQUE (video_uuid, face_identity_id, speaker_id);
+
+
+--
+-- Name: video_events video_events_pkey; Type: CONSTRAINT; Schema: public; Owner: accusys
+--
+
+ALTER TABLE ONLY public.video_events
+    ADD CONSTRAINT video_events_pkey PRIMARY KEY (id);
+
+
+--
+-- Name: video_identities video_identities_pkey; Type: CONSTRAINT; Schema: public; Owner: accusys
+--
+
+ALTER TABLE ONLY public.video_identities
+    ADD CONSTRAINT video_identities_pkey PRIMARY KEY (id);
+
+
+--
+-- Name: videos videos_pkey; Type: CONSTRAINT; Schema: public; Owner: accusys
+--
+
+ALTER TABLE ONLY public.videos
+    ADD CONSTRAINT videos_pkey PRIMARY KEY (id);
+
+
+--
+-- Name: videos videos_uuid_key; Type: CONSTRAINT; Schema: public; Owner: accusys
+-- NOTE(review): the constraint is named videos_uuid_key but enforces uniqueness on column file_uuid. Presumably the column was renamed after the constraint was created (confirm before matching on the constraint name).
+
+ALTER TABLE ONLY public.videos
+    ADD CONSTRAINT videos_uuid_key UNIQUE (file_uuid);
+
+
+--
+-- Name: idx_anomalies_key_id; Type: INDEX; Schema: public; Owner: accusys
+--
+
+CREATE INDEX idx_anomalies_key_id ON public.api_key_anomalies USING btree (key_id);
+
+
+--
+-- Name: idx_anomalies_resolved; Type: INDEX; Schema: public; Owner: accusys
+--
+
+CREATE INDEX idx_anomalies_resolved ON public.api_key_anomalies USING btree (resolved);
+
+
+--
+-- Name: idx_api_keys_hash; Type: INDEX; Schema: public; Owner: accusys
+--
+
+CREATE INDEX idx_api_keys_hash ON public.api_keys USING btree (key_hash);
+
+
+--
+-- Name: idx_api_keys_key_id; Type: INDEX; Schema: public; Owner: accusys
+-- NOTE(review): api_keys_key_id_key (UNIQUE on key_id) is already backed by a unique btree index on this same column, so this index looks redundant (confirm before dropping).
+
+CREATE INDEX idx_api_keys_key_id ON public.api_keys USING btree (key_id);
+
+
+--
+-- Name: idx_api_keys_status; Type: INDEX; Schema: public; Owner: accusys
+--
+
+CREATE INDEX idx_api_keys_status ON public.api_keys USING btree (status);
+
+
+--
+-- Name: idx_api_keys_type; Type: INDEX; Schema: public; Owner: accusys
+--
+
+CREATE INDEX idx_api_keys_type ON public.api_keys USING btree (key_type);
+
+
+--
+-- Name: idx_audit_action; Type: INDEX; Schema: public; Owner: accusys
+--
+
+CREATE INDEX idx_audit_action ON public.api_key_audit_log USING btree (action);
+
+
+--
+-- Name: idx_audit_created_at; Type: INDEX; Schema: public; Owner: accusys
+--
+
+CREATE INDEX idx_audit_created_at ON public.api_key_audit_log USING btree (created_at);
+
+
+--
+-- Name: idx_audit_key_id; Type: INDEX; Schema: public; Owner: accusys
+--
+
+CREATE INDEX idx_audit_key_id ON public.api_key_audit_log USING btree (key_id);
+
+
+--
+-- Name: idx_backup_history_service; Type: INDEX; Schema: public; Owner: accusys
+--
+
+CREATE INDEX idx_backup_history_service ON public.backup_history USING btree (service_name);
+
+
+--
+-- Name: idx_backup_history_time; Type: INDEX; Schema: public; Owner: accusys
+--
+
+CREATE INDEX idx_backup_history_time ON public.backup_history USING btree (executed_at);
+
+
+--
+-- Name: idx_backup_registry_service; Type: INDEX; Schema: public; Owner: accusys
+--
+
+CREATE INDEX idx_backup_registry_service ON public.backup_registry USING btree (service_name);
+
+
+--
+-- Name: idx_backup_registry_time; Type: INDEX; Schema: public; Owner: accusys
+--
+
+CREATE INDEX idx_backup_registry_time ON public.backup_registry USING btree (created_at);
+
+
+--
+-- Name: idx_backup_storage_stats_tier; Type: INDEX; Schema: public; Owner: accusys
+--
+
+CREATE INDEX idx_backup_storage_stats_tier ON public.backup_storage_stats USING btree (tier);
+
+
+--
+-- Name: idx_backup_storage_stats_time; Type: INDEX; Schema: public; Owner: accusys
+--
+
+CREATE INDEX idx_backup_storage_stats_time ON public.backup_storage_stats USING btree (record_time);
+
+
+--
+-- Name: idx_bindings_identity; Type: INDEX; Schema: public; Owner: accusys
+--
+
+CREATE INDEX idx_bindings_identity ON public.identity_bindings USING btree (identity_id);
+
+
+--
+-- Name: idx_bindings_lookup; Type: INDEX; Schema: public; Owner: accusys
+-- NOTE(review): same column list as UNIQUE constraint identity_bindings_uuid_binding_type_binding_value_key, whose backing unique index already serves these lookups. This index looks redundant (confirm before dropping).
+
+CREATE INDEX idx_bindings_lookup ON public.identity_bindings USING btree (uuid, binding_type, binding_value);
+
+
+--
+-- Name: idx_child_parent; Type: INDEX; Schema: public; Owner: accusys
+--
+
+CREATE INDEX idx_child_parent ON public.child_chunks USING btree (parent_id);
+
+
+--
+-- Name: idx_chunk_vectors_chunk_id; Type: INDEX; Schema: public; Owner: accusys
+-- NOTE(review): chunk_id is the leading column of UNIQUE constraint chunk_vectors_chunk_id_uuid_key (chunk_id, uuid), whose index can already serve chunk_id lookups. Possibly redundant (verify with usage stats).
+
+CREATE INDEX idx_chunk_vectors_chunk_id ON public.chunk_vectors USING btree (chunk_id);
+
+
+--
+-- Name: idx_chunk_vectors_embedding_hnsw; Type: INDEX; Schema: public; Owner: accusys
+--
+
+CREATE INDEX idx_chunk_vectors_embedding_hnsw ON public.chunk_vectors USING hnsw (embedding_vector public.vector_cosine_ops);
+
+
+--
+-- Name: idx_chunk_vectors_file_id; Type: INDEX; Schema: public; Owner: accusys
+--
+
+CREATE INDEX idx_chunk_vectors_file_id ON public.chunk_vectors USING btree (file_id);
+
+
+--
+-- Name: idx_chunk_vectors_uuid; Type: INDEX; Schema: public; Owner: accusys
+--
+
+CREATE INDEX idx_chunk_vectors_uuid ON public.chunk_vectors USING btree (uuid);
+
+
+--
+-- Name: idx_chunks_content_gin; Type: INDEX; Schema: public; Owner: accusys
+--
+
+CREATE INDEX idx_chunks_content_gin ON public.chunks USING gin (content);
+
+
+--
+-- Name: idx_chunks_file_id; Type: INDEX; Schema: public; Owner: accusys
+--
+
+CREATE INDEX idx_chunks_file_id ON public.chunks USING btree (file_id);
+
+
+--
+-- Name: idx_chunks_search_vector; Type: INDEX; Schema: public; Owner: accusys
+--
+
+CREATE INDEX idx_chunks_search_vector ON public.chunks USING gin (search_vector);
+
+
+--
+-- Name: idx_chunks_time; Type: INDEX; Schema: public; Owner: accusys
+--
+
+CREATE INDEX idx_chunks_time ON public.chunks USING btree (start_time, end_time);
+
+
+--
+-- Name: idx_chunks_type; Type: INDEX; Schema: public; Owner: accusys
+--
+
+CREATE INDEX idx_chunks_type ON public.chunks USING btree (chunk_type);
+
+
+--
+-- Name: idx_chunks_uuid; Type: INDEX; Schema: public; Owner: accusys
+-- NOTE(review): uuid is the leading column of both chunks_uuid_chunk_id_key (uuid, chunk_id) and idx_chunks_uuid_type (uuid, chunk_type). This single-column index is possibly redundant (verify with usage stats).
+
+CREATE INDEX idx_chunks_uuid ON public.chunks USING btree (uuid);
+
+
+--
+-- Name: idx_chunks_uuid_type; Type: INDEX; Schema: public; Owner: accusys
+--
+
+CREATE INDEX idx_chunks_uuid_type ON public.chunks USING btree (uuid, chunk_type);
+
+
+--
+-- Name: idx_face_clusters_video_uuid; Type: INDEX; Schema: public; Owner: accusys
+--
+
+CREATE INDEX idx_face_clusters_video_uuid ON public.face_clusters USING btree (video_uuid);
+
+
+--
+-- Name: idx_face_detections_cluster; Type: INDEX; Schema: public; Owner: accusys
+--
+
+CREATE INDEX idx_face_detections_cluster ON public.face_detections USING btree (cluster_id);
+
+
+--
+-- Name: idx_face_detections_embedding; Type: INDEX; Schema: public; Owner: accusys
+--
+
+CREATE INDEX idx_face_detections_embedding ON public.face_detections USING ivfflat (embedding public.vector_cosine_ops) WITH (lists='100');
+
+
+--
+-- Name: idx_face_detections_face_id; Type: INDEX; Schema: public; Owner: accusys
+--
+
+CREATE INDEX idx_face_detections_face_id ON public.face_detections USING btree (face_id);
+
+
+--
+-- Name: idx_face_detections_frame; Type: INDEX; Schema: public; Owner: accusys
+--
+
+CREATE INDEX idx_face_detections_frame ON public.face_detections USING btree (video_uuid, frame_number);
+
+
+--
+-- Name: idx_face_detections_identity; Type: INDEX; Schema: public; Owner: accusys
+--
+
+CREATE INDEX idx_face_detections_identity ON public.face_detections USING btree (identity_id);
+
+
+--
+-- Name: idx_face_detections_video_uuid; Type: INDEX; Schema: public; Owner: accusys
+--
+
+CREATE INDEX idx_face_detections_video_uuid ON public.face_detections USING btree (video_uuid);
+
+
+--
+-- Name: idx_face_identities_embedding; Type: INDEX; Schema: public; Owner: accusys
+--
+
+CREATE INDEX idx_face_identities_embedding ON public.face_identities USING ivfflat (embedding public.vector_cosine_ops) WITH (lists='100');
+
+
+--
+-- Name: idx_face_recognition_results_created_at; Type: INDEX; Schema: public; Owner: accusys
+--
+
+CREATE INDEX idx_face_recognition_results_created_at ON public.face_recognition_results USING btree (created_at);
+
+
+--
+-- Name: idx_file_registry_cluster; Type: INDEX; Schema: public; Owner: accusys
+--
+
+CREATE INDEX idx_file_registry_cluster ON public.file_registry USING btree (user_cluster);
+
+
+--
+-- Name: idx_file_registry_status; Type: INDEX; Schema: public; Owner: accusys
+--
+
+CREATE INDEX idx_file_registry_status ON public.file_registry USING btree (status);
+
+
+--
+-- Name: idx_file_registry_tier; Type: INDEX; Schema: public; Owner: accusys
+--
+
+CREATE INDEX idx_file_registry_tier ON public.file_registry USING btree (storage_tier);
+
+
+--
+-- Name: idx_frames_face_gin; Type: INDEX; Schema: public; Owner: accusys
+--
+
+CREATE INDEX idx_frames_face_gin ON public.frames USING gin (face_results);
+
+
+--
+-- Name: idx_frames_file_id; Type: INDEX; Schema: public; Owner: accusys
+--
+
+CREATE INDEX idx_frames_file_id ON public.frames USING btree (file_id);
+
+
+--
+-- Name: idx_frames_frame; Type: INDEX; Schema: public; Owner: accusys
+--
+
+CREATE INDEX idx_frames_frame ON public.frames USING btree (file_id, frame_number);
+
+
+--
+-- Name: idx_frames_ocr_gin; Type: INDEX; Schema: public; Owner: accusys
+--
+
+CREATE INDEX idx_frames_ocr_gin ON public.frames USING gin (ocr_results);
+
+
+--
+-- Name: idx_frames_pose_gin; Type: INDEX; Schema: public; Owner: accusys
+--
+
+CREATE INDEX idx_frames_pose_gin ON public.frames USING gin (pose_results);
+
+
+--
+-- Name: idx_frames_timestamp; Type: INDEX; Schema: public; Owner: accusys
+--
+
+CREATE INDEX idx_frames_timestamp ON public.frames USING btree (file_id, "timestamp");
+
+
+--
+-- Name: idx_frames_yolo_gin; Type: INDEX; Schema: public; Owner: accusys
+--
+
+CREATE INDEX idx_frames_yolo_gin ON public.frames USING gin (yolo_objects);
+
+
+--
+-- Name: idx_gitea_tokens_key_id; Type: INDEX; Schema: public; Owner: accusys
+--
+
+CREATE INDEX idx_gitea_tokens_key_id ON public.gitea_tokens USING btree (api_key_id);
+
+
+--
+-- Name: idx_gitea_tokens_user; Type: INDEX; Schema: public; Owner: accusys
+--
+
+CREATE INDEX idx_gitea_tokens_user ON public.gitea_tokens USING btree (gitea_user);
+
+
+--
+-- Name: idx_identities_face_embedding; Type: INDEX; Schema: public; Owner: accusys
+--
+
+CREATE INDEX idx_identities_face_embedding ON public.identities USING ivfflat (face_embedding public.vector_cosine_ops) WITH (lists='100');
+
+
+--
+-- Name: idx_identities_identity_embedding; Type: INDEX; Schema: public; Owner: accusys
+--
+
+CREATE INDEX idx_identities_identity_embedding ON public.identities USING ivfflat (identity_embedding public.vector_cosine_ops) WITH (lists='100');
+
+
+--
+-- Name: idx_identities_reference_data; Type: INDEX; Schema: public; Owner: accusys
+--
+
+CREATE INDEX idx_identities_reference_data ON public.identities USING gin (reference_data);
+
+
+--
+-- Name: idx_identities_uuid; Type: INDEX; Schema: public; Owner: accusys
+--
+
+CREATE INDEX idx_identities_uuid ON public.identities USING btree (uuid);
+
+
+--
+-- Name: idx_identities_voice_embedding; Type: INDEX; Schema: public; Owner: accusys
+--
+
+CREATE INDEX idx_identities_voice_embedding ON public.identities USING ivfflat (voice_embedding public.vector_cosine_ops) WITH (lists='50');
+
+
+--
+-- Name: idx_monitor_anomalies_severity; Type: INDEX; Schema: public; Owner: accusys
+--
+
+CREATE INDEX idx_monitor_anomalies_severity ON public.monitor_anomalies USING btree (severity);
+
+
+--
+-- Name: idx_monitor_anomalies_time; Type: INDEX; Schema: public; Owner: accusys
+--
+
+CREATE INDEX idx_monitor_anomalies_time ON public.monitor_anomalies USING btree (detected_at);
+
+
+--
+-- Name: idx_monitor_anomalies_type; Type: INDEX; Schema: public; Owner: accusys
+--
+
+CREATE INDEX idx_monitor_anomalies_type ON public.monitor_anomalies USING btree (anomaly_type);
+
+
+--
+-- Name: idx_monitor_databases_time; Type: INDEX; Schema: public; Owner: accusys
+--
+
+CREATE INDEX idx_monitor_databases_time ON public.monitor_databases USING btree (checked_at);
+
+
+--
+-- Name: idx_monitor_databases_type; Type: INDEX; Schema: public; Owner: accusys
+--
+
+CREATE INDEX idx_monitor_databases_type ON public.monitor_databases USING btree (db_type);
+
+
+--
+-- Name: idx_monitor_external_name; Type: INDEX; Schema: public; Owner: accusys
+--
+
+CREATE INDEX idx_monitor_external_name ON public.monitor_external USING btree (target_name);
+
+
+--
+-- Name: idx_monitor_external_time; Type: INDEX; Schema: public; Owner: accusys
+--
+
+CREATE INDEX idx_monitor_external_time ON public.monitor_external USING btree (checked_at);
+
+
+--
+-- Name: idx_monitor_jobs_created_at; Type: INDEX; Schema: public; Owner: accusys
+--
+
+CREATE INDEX idx_monitor_jobs_created_at ON public.monitor_jobs USING btree (created_at);
+
+
+--
+-- Name: idx_monitor_jobs_processors; Type: INDEX; Schema: public; Owner: accusys
+--
+
+CREATE INDEX idx_monitor_jobs_processors ON public.monitor_jobs USING gin (processors);
+
+
+--
+-- Name: idx_monitor_jobs_status; Type: INDEX; Schema: public; Owner: accusys
+--
+
+CREATE INDEX idx_monitor_jobs_status ON public.monitor_jobs USING btree (status);
+
+
+--
+-- Name: idx_monitor_jobs_status_created; Type: INDEX; Schema: public; Owner: accusys
+--
+
+CREATE INDEX idx_monitor_jobs_status_created ON public.monitor_jobs USING btree (status, created_at);
+
+
+--
+-- Name: idx_monitor_jobs_uuid; Type: INDEX; Schema: public; Owner: accusys
+--
+
+CREATE INDEX idx_monitor_jobs_uuid ON public.monitor_jobs USING btree (uuid);
+
+
+--
+-- Name: idx_monitor_jobs_video_id; Type: INDEX; Schema: public; Owner: accusys
+--
+
+CREATE INDEX idx_monitor_jobs_video_id ON public.monitor_jobs USING btree (video_id);
+
+
+--
+-- Name: idx_monitor_logins_time; Type: INDEX; Schema: public; Owner: accusys
+--
+
+CREATE INDEX idx_monitor_logins_time ON public.monitor_logins USING btree (login_at);
+
+
+--
+-- Name: idx_monitor_logins_type; Type: INDEX; Schema: public; Owner: accusys
+--
+
+CREATE INDEX idx_monitor_logins_type ON public.monitor_logins USING btree (user_type);
+
+
+--
+-- Name: idx_monitor_portal_pages_url; Type: INDEX; Schema: public; Owner: accusys
+--
+
+CREATE INDEX idx_monitor_portal_pages_url ON public.monitor_portal_pages USING btree (page_url);
+
+
+--
+-- Name: idx_monitor_portal_users_username; Type: INDEX; Schema: public; Owner: accusys
+--
+
+CREATE INDEX idx_monitor_portal_users_username ON public.monitor_portal_users USING btree (username);
+
+
+--
+-- Name: idx_monitor_services_name; Type: INDEX; Schema: public; Owner: accusys
+--
+
+CREATE INDEX idx_monitor_services_name ON public.monitor_services USING btree (service_name);
+
+
+--
+-- Name: idx_monitor_services_time; Type: INDEX; Schema: public; Owner: accusys
+--
+
+CREATE INDEX idx_monitor_services_time ON public.monitor_services USING btree (checked_at);
+
+
+--
+-- Name: idx_monitor_sessions_type; Type: INDEX; Schema: public; Owner: accusys
+--
+
+CREATE INDEX idx_monitor_sessions_type ON public.monitor_sessions USING btree (session_type);
+
+
+--
+-- Name: idx_monitor_sessions_username; Type: INDEX; Schema: public; Owner: accusys
+--
+
+CREATE INDEX idx_monitor_sessions_username ON public.monitor_sessions USING btree (username);
+
+
+--
+-- Name: idx_monitor_workflows_active; Type: INDEX; Schema: public; Owner: accusys
+--
+
+CREATE INDEX idx_monitor_workflows_active ON public.monitor_workflows USING btree (is_active);
+
+
+--
+-- Name: idx_monitor_workflows_id; Type: INDEX; Schema: public; Owner: accusys
+--
+
+CREATE INDEX idx_monitor_workflows_id ON public.monitor_workflows USING btree (workflow_id);
+
+
+--
+-- Name: idx_monitor_workflows_idle; Type: INDEX; Schema: public; Owner: accusys
+--
+
+CREATE INDEX idx_monitor_workflows_idle ON public.monitor_workflows USING btree (idle_days);
+
+
+--
+-- Name: idx_n8n_api_keys_key_id; Type: INDEX; Schema: public; Owner: accusys
+--
+
+CREATE INDEX idx_n8n_api_keys_key_id ON public.n8n_api_keys USING btree (momentry_api_key_id);
+
+
+--
+-- Name: idx_n8n_api_keys_label; Type: INDEX; Schema: public; Owner: accusys
+--
+
+CREATE INDEX idx_n8n_api_keys_label ON public.n8n_api_keys USING btree (label);
+
+
+--
+-- Name: idx_node_process_name; Type: INDEX; Schema: public; Owner: accusys
+--
+
+CREATE INDEX idx_node_process_name ON public.node_process_tracking USING btree (process_name);
+
+
+--
+-- Name: idx_node_version_name; Type: INDEX; Schema: public; Owner: accusys
+--
+
+CREATE INDEX idx_node_version_name ON public.node_version_baseline USING btree (runtime_name);
+
+
+--
+-- Name: idx_person_appearances_face; Type: INDEX; Schema: public; Owner: accusys
+--
+
+CREATE INDEX idx_person_appearances_face ON public.person_appearances USING btree (face_detection_id) WHERE (face_detection_id IS NOT NULL);
+
+
+--
+-- Name: idx_person_appearances_person; Type: INDEX; Schema: public; Owner: accusys
+--
+
+CREATE INDEX idx_person_appearances_person ON public.person_appearances USING btree (person_id);
+
+
+--
+-- Name: idx_person_appearances_time; Type: INDEX; Schema: public; Owner: accusys
+--
+
+CREATE INDEX idx_person_appearances_time ON public.person_appearances USING btree (video_uuid, start_time, end_time);
+
+
+--
+-- Name: idx_person_appearances_video; Type: INDEX; Schema: public; Owner: accusys
+--
+
+CREATE INDEX idx_person_appearances_video ON public.person_appearances USING btree (video_uuid);
+
+
+--
+-- Name: idx_person_identities_confirmed; Type: INDEX; Schema: public; Owner: accusys
+--
+
+CREATE INDEX idx_person_identities_confirmed ON public.person_identities USING btree (is_confirmed) WHERE (is_confirmed = true);
+
+
+--
+-- Name: idx_person_identities_face; Type: INDEX; Schema: public; Owner: accusys
+--
+
+CREATE INDEX idx_person_identities_face ON public.person_identities USING btree (face_identity_id) WHERE (face_identity_id IS NOT NULL);
+
+
+--
+-- Name: idx_person_identities_name; Type: INDEX; Schema: public; Owner: accusys
+--
+
+CREATE INDEX idx_person_identities_name ON public.person_identities USING btree (name) WHERE (name IS NOT NULL);
+
+
+--
+-- Name: idx_person_identities_speaker; Type: INDEX; Schema: public; Owner: accusys
+--
+
+CREATE INDEX idx_person_identities_speaker ON public.person_identities USING btree (speaker_id) WHERE (speaker_id IS NOT NULL);
+
+
+--
+-- Name: idx_person_identities_video_uuid; Type: INDEX; Schema: public; Owner: accusys
+--
+
+CREATE INDEX idx_person_identities_video_uuid ON public.person_identities USING btree (video_uuid);
+
+
+--
+-- Name: idx_processor_results_job; Type: INDEX; Schema: public; Owner: accusys
+--
+
+CREATE INDEX idx_processor_results_job ON public.processor_results USING btree (job_id);
+
+
+--
+-- Name: idx_processor_results_output_data; Type: INDEX; Schema: public; Owner: accusys
+--
+
+CREATE INDEX idx_processor_results_output_data ON public.processor_results USING gin (output_data);
+
+
+--
+-- Name: idx_processor_results_status; Type: INDEX; Schema: public; Owner: accusys
+--
+
+CREATE INDEX idx_processor_results_status ON public.processor_results USING btree (status);
+
+
+--
+-- Name: idx_processor_results_video; Type: INDEX; Schema: public; Owner: accusys
+--
+
+CREATE INDEX idx_processor_results_video ON public.processor_results USING btree (video_id);
+
+
+--
+-- Name: idx_python_script_path; Type: INDEX; Schema: public; Owner: accusys
+--
+
+CREATE INDEX idx_python_script_path ON public.python_script_tracking USING btree (script_path);
+
+
+--
+-- Name: idx_python_version_name; Type: INDEX; Schema: public; Owner: accusys
+--
+
+CREATE INDEX idx_python_version_name ON public.python_version_baseline USING btree (runtime_name);
+
+
+--
+-- Name: idx_storage_usage_cluster; Type: INDEX; Schema: public; Owner: accusys
+--
+
+CREATE INDEX idx_storage_usage_cluster ON public.storage_usage_stats USING btree (user_cluster);
+
+
+--
+-- Name: idx_storage_usage_time; Type: INDEX; Schema: public; Owner: accusys
+--
+
+CREATE INDEX idx_storage_usage_time ON public.storage_usage_stats USING btree (record_time);
+
+
+--
+-- Name: idx_video_events_type; Type: INDEX; Schema: public; Owner: accusys
+--
+
+CREATE INDEX idx_video_events_type ON public.video_events USING btree (event_type);
+
+
+--
+-- Name: idx_video_events_uuid; Type: INDEX; Schema: public; Owner: accusys
+--
+
+CREATE INDEX idx_video_events_uuid ON public.video_events USING btree (uuid);
+
+
+--
+-- Name: idx_video_identities_uuid; Type: INDEX; Schema: public; Owner: accusys
+--
+
+CREATE INDEX idx_video_identities_uuid ON public.video_identities USING btree (uuid);
+
+
+--
+-- Name: idx_videos_file_uuid; Type: INDEX; Schema: public; Owner: accusys
+--
+
+CREATE INDEX idx_videos_file_uuid ON public.videos USING btree (file_uuid);
+
+
+--
+-- Name: idx_videos_job_id; Type: INDEX; Schema: public; Owner: accusys
+--
+
+CREATE INDEX idx_videos_job_id ON public.videos USING btree (job_id);
+
+
+--
+-- Name: idx_videos_status; Type: INDEX; Schema: public; Owner: accusys
+--
+
+CREATE INDEX idx_videos_status ON public.videos USING btree (status);
+
+
+--
+-- Name: idx_videos_user_id; Type: INDEX; Schema: public; Owner: accusys
+--
+
+CREATE INDEX idx_videos_user_id ON public.videos USING btree (user_id);
+
+
+--
+-- Name: idx_videos_uuid; Type: INDEX; Schema: public; Owner: accusys
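+-- NOTE(review): same definition as idx_videos_file_uuid (btree on videos.file_uuid); one of the two is redundant.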
+
+CREATE INDEX idx_videos_uuid ON public.videos USING btree (file_uuid);
+
+
+--
+-- Name: chunks chunks_search_vector_trigger; Type: TRIGGER; Schema: public; Owner: accusys
+--
+
+CREATE TRIGGER chunks_search_vector_trigger BEFORE INSERT OR UPDATE ON public.chunks FOR EACH ROW EXECUTE FUNCTION public.update_search_vector();
+
+
+--
+-- Name: person_appearances trigger_update_person_appearance_stats; Type: TRIGGER; Schema: public; Owner: accusys
+--
+
+CREATE TRIGGER trigger_update_person_appearance_stats AFTER INSERT OR DELETE OR UPDATE ON public.person_appearances FOR EACH ROW EXECUTE FUNCTION public.trigger_update_person_stats();
+
+
+--
+-- Name: face_identities update_face_identities_updated_at; Type: TRIGGER; Schema: public; Owner: accusys
+--
+
+CREATE TRIGGER update_face_identities_updated_at BEFORE UPDATE ON public.face_identities FOR EACH ROW EXECUTE FUNCTION public.update_updated_at_column();
+
+
+--
+-- Name: face_recognition_results update_face_recognition_results_updated_at; Type: TRIGGER; Schema: public; Owner: accusys
+--
+
+CREATE TRIGGER update_face_recognition_results_updated_at BEFORE UPDATE ON public.face_recognition_results FOR EACH ROW EXECUTE FUNCTION public.update_updated_at_column();
+
+
+--
+-- Name: monitor_jobs update_monitor_jobs_updated_at; Type: TRIGGER; Schema: public; Owner: accusys
+--
+
+CREATE TRIGGER update_monitor_jobs_updated_at BEFORE UPDATE ON public.monitor_jobs FOR EACH ROW EXECUTE FUNCTION public.update_updated_at_column();
+
+
+--
+-- Name: person_identities update_person_identities_updated_at; Type: TRIGGER; Schema: public; Owner: accusys
+--
+
+CREATE TRIGGER update_person_identities_updated_at BEFORE UPDATE ON public.person_identities FOR EACH ROW EXECUTE FUNCTION public.update_updated_at_column();
+
+
+--
+-- Name: processor_results update_processor_results_updated_at; Type: TRIGGER; Schema: public; Owner: accusys
+--
+
+CREATE TRIGGER update_processor_results_updated_at BEFORE UPDATE ON public.processor_results FOR EACH ROW EXECUTE FUNCTION public.update_updated_at_column();
+
+
+--
+-- Name: videos update_videos_updated_at; Type: TRIGGER; Schema: public; Owner: accusys
+--
+
+CREATE TRIGGER update_videos_updated_at BEFORE UPDATE ON public.videos FOR EACH ROW EXECUTE FUNCTION public.update_updated_at_column();
+
+
+--
+-- Name: castings castings_character_id_fkey; Type: FK CONSTRAINT; Schema: public; Owner: accusys
+--
+
+ALTER TABLE ONLY public.castings
+    ADD CONSTRAINT castings_character_id_fkey FOREIGN KEY (character_id) REFERENCES public.characters(id) ON DELETE CASCADE;
+
+
+--
+-- Name: child_chunks child_chunks_parent_id_fkey; Type: FK CONSTRAINT; Schema: public; Owner: accusys
+--
+
+ALTER TABLE ONLY public.child_chunks
+    ADD CONSTRAINT child_chunks_parent_id_fkey FOREIGN KEY (parent_id) REFERENCES public.parent_chunks(id) ON DELETE CASCADE;
+
+
+--
+-- Name: chunk_vectors chunk_vectors_file_id_fkey; Type: FK CONSTRAINT; Schema: public; Owner: accusys
+--
+
+ALTER TABLE ONLY public.chunk_vectors
+    ADD CONSTRAINT chunk_vectors_file_id_fkey FOREIGN KEY (file_id) REFERENCES public.videos(id);
+
+
+--
+-- Name: chunks chunks_file_id_fkey; Type: FK CONSTRAINT; Schema: public; Owner: accusys
+--
+
+ALTER TABLE ONLY public.chunks
+    ADD CONSTRAINT chunks_file_id_fkey FOREIGN KEY (file_id) REFERENCES public.videos(id);
+
+
+--
+-- Name: face_detections face_detections_identity_id_fkey; Type: FK CONSTRAINT; Schema: public; Owner: accusys
+--
+
+ALTER TABLE ONLY public.face_detections
+    ADD CONSTRAINT face_detections_identity_id_fkey FOREIGN KEY (identity_id) REFERENCES public.face_identities(id) ON DELETE SET NULL;
+
+
+--
+-- Name: file_lifecycle file_lifecycle_file_uuid_fkey; Type: FK CONSTRAINT; Schema: public; Owner: accusys
+--
+
+ALTER TABLE ONLY public.file_lifecycle
+    ADD CONSTRAINT file_lifecycle_file_uuid_fkey FOREIGN KEY (file_uuid) REFERENCES public.file_registry(file_uuid);
+
+
+--
+-- Name: monitor_jobs fk_monitor_jobs_video_id; Type: FK CONSTRAINT; Schema: public; Owner: accusys
+--
+
+ALTER TABLE ONLY public.monitor_jobs
+    ADD CONSTRAINT fk_monitor_jobs_video_id FOREIGN KEY (video_id) REFERENCES public.videos(id) ON DELETE CASCADE;
+
+
+--
+-- Name: videos fk_videos_job_id; Type: FK CONSTRAINT; Schema: public; Owner: accusys
+--
+
+ALTER TABLE ONLY public.videos
+    ADD CONSTRAINT fk_videos_job_id FOREIGN KEY (job_id) REFERENCES public.monitor_jobs(id) ON DELETE SET NULL;
+
+
+--
+-- Name: frames frames_file_id_fkey; Type: FK CONSTRAINT; Schema: public; Owner: accusys
+--
+
+ALTER TABLE ONLY public.frames
+    ADD CONSTRAINT frames_file_id_fkey FOREIGN KEY (file_id) REFERENCES public.videos(id);
+
+
+--
+-- Name: identity_bindings identity_bindings_identity_id_fkey; Type: FK CONSTRAINT; Schema: public; Owner: accusys
+--
+
+ALTER TABLE ONLY public.identity_bindings
+    ADD CONSTRAINT identity_bindings_identity_id_fkey FOREIGN KEY (identity_id) REFERENCES public.video_identities(id) ON DELETE CASCADE;
+
+
+--
+-- Name: person_appearances person_appearances_face_detection_id_fkey; Type: FK CONSTRAINT; Schema: public; Owner: accusys
+--
+
+ALTER TABLE ONLY public.person_appearances
+    ADD CONSTRAINT person_appearances_face_detection_id_fkey FOREIGN KEY (face_detection_id) REFERENCES public.face_detections(id) ON DELETE SET NULL;
+
+
+--
+-- Name: person_appearances person_appearances_person_id_fkey; Type: FK CONSTRAINT; Schema: public; Owner: accusys
+--
+
+ALTER TABLE ONLY public.person_appearances
+    ADD CONSTRAINT person_appearances_person_id_fkey FOREIGN KEY (person_id) REFERENCES public.person_identities(person_id) ON DELETE CASCADE;
+
+
+--
+-- Name: person_identities person_identities_face_identity_id_fkey; Type: FK CONSTRAINT; Schema: public; Owner: accusys
+--
+
+ALTER TABLE ONLY public.person_identities
+    ADD CONSTRAINT person_identities_face_identity_id_fkey FOREIGN KEY (face_identity_id) REFERENCES public.face_identities(id) ON DELETE SET NULL;
+
+
+--
+-- Name: processor_results processor_results_job_id_fkey; Type: FK CONSTRAINT; Schema: public; Owner: accusys
+--
+
+ALTER TABLE ONLY public.processor_results
+    ADD CONSTRAINT processor_results_job_id_fkey FOREIGN KEY (job_id) REFERENCES public.monitor_jobs(id) ON DELETE CASCADE;
+
+
+--
+-- Name: processor_results processor_results_video_id_fkey; Type: FK CONSTRAINT; Schema: public; Owner: accusys
+--
+
+ALTER TABLE ONLY public.processor_results
+    ADD CONSTRAINT processor_results_video_id_fkey FOREIGN KEY (video_id) REFERENCES public.videos(id) ON DELETE CASCADE;
+
+
+--
+-- PostgreSQL database dump complete
+--
+
+\unrestrict hRi4nBNv2E5FXxBTf47fTk0vxfJNiXtnegSYFeraY46zaCyMMlYNanEdl70C1E7
+
diff --git a/scripts/__pycache__/redis_publisher.cpython-311.pyc b/scripts/__pycache__/redis_publisher.cpython-311.pyc
deleted file mode 100644
index 5217280..0000000
Binary files a/scripts/__pycache__/redis_publisher.cpython-311.pyc and /dev/null differ
diff --git a/scripts/asrx_processor.py b/scripts/asrx_processor.py
index aaa2bc7..6511b33 100755
--- a/scripts/asrx_processor.py
+++ b/scripts/asrx_processor.py
@@ -1,124 +1,320 @@
 #!/opt/homebrew/bin/python3.11
 """
-ASRX Processor - Speaker Diarization
-Uses whisperx for speaker diarization (local model)
+ASRX Processor - Hybrid Pipeline Wrapper
+
+Pipeline:
+  1. ffprobe → select best audio track → ffmpeg → 16kHz mono WAV
+  2. SelfASRXFixed.process() (7-step hybrid speaker diarization)
+  3. Convert to Rust-expected format
 """
 
 import sys
 import json
 import argparse
 import os
+import subprocess
+import tempfile
+from pathlib import Path
 
 sys.path.insert(0, os.path.dirname(os.path.abspath(__file__)))
+sys.path.insert(
+    0, os.path.join(os.path.dirname(os.path.abspath(__file__)), "asrx_self")
+)
+
 from redis_publisher import RedisPublisher
 
 
-def process_asrx(video_path: str, output_path: str, uuid: str = ""):
-    """Process video for speaker diarization using whisperx"""
+def probe_audio_tracks(video_path: str) -> list:
+    """Return one dict per audio stream that ffprobe reports for ``video_path``.
+
+    Keys: index, codec, language ("und" if untagged), channels, sample_rate.
+    Best effort: any failure (missing binary, timeout, unparsable output) is
+    printed to stdout and an empty list is returned instead of raising.
+    """
+    # "-select_streams a" limits the JSON report to audio streams.
+    ffprobe_cmd = ["ffprobe", "-v", "quiet", "-print_format", "json",
+                   "-show_streams", "-select_streams", "a", video_path]
+    try:
+        proc = subprocess.run(ffprobe_cmd, capture_output=True, text=True, timeout=30)
+        return [{
+            "index": info.get("index"),
+            "codec": info.get("codec_name"),
+            "language": info.get("tags", {}).get("language", "und"),
+            "channels": info.get("channels", 0),
+            "sample_rate": info.get("sample_rate", "0"),
+        } for info in json.loads(proc.stdout).get("streams", [])]
+    except Exception as err:
+        print(f"[ASRX] ffprobe failed: {err}")
+        return []
 
+
+def select_best_track(tracks: list) -> int:
+    """Pick the position in ``tracks`` of the preferred audio track.
+
+    Order of preference: the first track tagged "eng"/"en", otherwise the
+    first track with the highest channel count; 0 for an empty list.
+    """
+    for pos, track in enumerate(tracks):
+        if track["language"] in ("eng", "en"):
+            return pos
+    # max() keeps the earliest maximum, matching a strict ">" scan.
+    return max(range(len(tracks)), key=lambda pos: tracks[pos]["channels"],
+               default=0)
+
+
+def extract_audio_to_wav(video_path: str, track_index: int, output_wav: str) -> bool:
+    """Extract one stream of ``video_path`` into a 16 kHz mono 16-bit WAV.
+
+    ``track_index`` is passed to ffmpeg as ``-map 0:<track_index>``.
+    Returns True if ffmpeg succeeds; any failure (non-zero exit, missing
+    binary, run longer than 300 s) is printed and reported as False.
+    """
+    resample_opts = ["-ar", "16000", "-ac", "1", "-sample_fmt", "s16"]
+    # "-y" lets ffmpeg overwrite output_wav without prompting.
+    ffmpeg_cmd = ["ffmpeg", "-y", "-v", "quiet", "-i", video_path,
+                  "-map", f"0:{track_index}", *resample_opts, output_wav]
+    try:
+        subprocess.run(ffmpeg_cmd, check=True, capture_output=True, timeout=300)
+    except Exception as err:
+        print(f"[ASRX] ffmpeg extraction failed: {err}")
+        return False
+    return True
+
+
+def _cleanup(tmp_dir):  # Remove a temp directory tree; falsy or missing paths are a no-op.
+    if tmp_dir and os.path.exists(tmp_dir):
+        import shutil  # imported only when there is something to delete
+        shutil.rmtree(tmp_dir, ignore_errors=True)  # ignore_errors: removal failures do not raise
+
+
+def _atomic_write(path: str, data: dict):
+    """Dump ``data`` as JSON to ``path`` through a ``.tmp`` file, then swap it in."""
+    with open(path + ".tmp", "w") as f:
+        json.dump(data, f, indent=2)
+    os.replace(path + ".tmp", path)  # unlike os.rename, overwrites on every platform
+
+
+def _shared_audio_setup(video_path):
+    """Extract the preferred audio track to a WAV inside a new temp directory.
+    Returns (tmp_dir, audio_path); audio_path is ``video_path`` itself when
+    extraction fails. tmp_dir exists either way and is the caller's to remove.
+    """
+    found = probe_audio_tracks(video_path)
+    stream_index = found[select_best_track(found)]["index"] if found else 0
+    work_dir = tempfile.mkdtemp(prefix="asrx_")
+    target = os.path.join(work_dir, "audio.wav")
+    if not extract_audio_to_wav(video_path, stream_index, target):
+        print("[ASRX] Audio extraction failed, falling back to original file",
+              file=sys.stderr)
+        target = video_path
+    return work_dir, target
+
+
+def _convert_result(result, output_path):
+    """Stage 3: reshape a SelfASRXFixed result into the Rust-expected format.
+
+    Frame numbers are seconds * fps truncated to int. fps is read from the
+    "fps" key of "<stem>.probe.json" beside ``output_path`` (stem = file name
+    up to its first "."); it stays 30.0 if that file is missing or unreadable.
+    """
+    fps = 30.0
+    out_dir, out_name = os.path.split(output_path)
+    probe_path = os.path.join(out_dir, f"{out_name.split('.')[0]}.probe.json")
+    if os.path.exists(probe_path):
+        try:
+            with open(probe_path) as probe_file:
+                probe_info = json.load(probe_file)
+            if "fps" in probe_info:
+                fps = float(probe_info["fps"])
+        except Exception:
+            pass  # unreadable or malformed probe file: keep the 30.0 default
+
+    def to_segment(seg):
+        begin, finish = seg["start"], seg["end"]
+        return {
+            "start_time": begin,
+            "end_time": finish,
+            "start_frame": int(begin * fps),
+            "end_frame": int(finish * fps),
+            "text": seg.get("text", ""),
+            "speaker_id": seg.get("speaker_id", seg.get("speaker", "")),
+            "language": seg.get("language", ""),
+            "lang_prob": seg.get("lang_prob", 0.0),
+            "quality": seg.get("quality", 0.0),
+        }
+
+    converted = {
+        "language": result.get("language"),
+        "segments": [to_segment(seg) for seg in result.get("segments", [])],
+        "n_speakers": result.get("n_speakers", 0),
+        "speaker_stats": result.get("speaker_stats", {}),
+    }
+    if "references" in result:
+        converted["references"] = result["references"]
+    return converted
+
+
+def process_asrx(video_path: str, output_path: str, uuid: str = "",
+                 file_uuid: str = "", resume: bool = False):
+    """主處理函數"""
     publisher = RedisPublisher(uuid) if uuid else None
     if publisher:
         publisher.info("asrx", "ASRX_START")
 
-    try:
-        import whisperx
-        import torch
-    except ImportError:
-        if publisher:
-            publisher.error("asrx", "whisperx not installed")
-        result = {"language": None, "segments": []}
-        if publisher:
-            publisher.complete("asrx", "0 segments")
-        with open(output_path, "w") as f:
-            json.dump(result, f, indent=2)
-        return result
+    checkpoint_path = output_path + ".stage1.json"
 
-    if publisher:
-        publisher.info("asrx", "ASRX_LOADING_MODEL")
+    # ── Phase 2: Resume from checkpoint (Steps 4-7 only) ──
+    if resume and os.path.exists(checkpoint_path):
+        print(f"[ASRX] Found checkpoint, resuming from Step 4...")
+        tmp_dir, audio_input = _shared_audio_setup(video_path)
+        try:
+            from asrx_self.main_fixed import SelfASRXFixed
+            asrx = SelfASRXFixed()
+
+            result = asrx.resume_from_checkpoint(
+                checkpoint_path, audio_input, output_path=output_path,
+            )
+
+            if "error" in result:
+                if publisher:
+                    publisher.error("asrx", result["error"])
+                output_result = {"language": None, "segments": []}
+                _atomic_write(output_path, output_result)
+                if publisher:
+                    publisher.complete("asrx", "0 segments")
+                _cleanup(tmp_dir)
+                return output_result
+
+            output_result = _convert_result(result, output_path)
+
+            if publisher:
+                publisher.info("asrx",
+                               f"ASRX_COMPLETE:{len(output_result['segments'])}")
+
+            _atomic_write(output_path, output_result)
+
+            if publisher:
+                publisher.complete(
+                    "asrx", f"{len(output_result['segments'])} segments")
+
+            print(f"[ASRX] Saved {len(output_result['segments'])} segments "
+                  f"to {output_path}", file=sys.stderr)
+
+            # 刪除 checkpoint（完成後清理）
+            try:
+                os.remove(checkpoint_path)
+                print(f"[ASRX] Removed checkpoint: {checkpoint_path}")
+            except Exception:
+                pass
+
+            _cleanup(tmp_dir)
+            return output_result
+        except Exception as e:
+            if publisher:
+                publisher.error("asrx", str(e))
+            import traceback
+            traceback.print_exc()
+            output_result = {"language": None, "segments": []}
+            _atomic_write(output_path, output_result)
+            if publisher:
+                publisher.complete("asrx", "0 segments")
+            _cleanup(tmp_dir)
+            return output_result
+
+    # ── Phase 1: Full 7-step pipeline ──
+    tmp_dir = None
 
     try:
-        # Fix for PyTorch 2.6+ compatibility
-        # Allow omegaconf types in torch.load
-        import omegaconf
+        # Stage 1: Audio Track Preprocessing
+        tmp_dir, audio_input = _shared_audio_setup(video_path)
 
-        torch.serialization.add_safe_globals(
-            [omegaconf.listconfig.ListConfig, omegaconf.dictconfig.DictConfig]
-        )
+        # Stage 2: SelfASRXFixed 7-step pipeline
+        from asrx_self.main_fixed import SelfASRXFixed
 
-        # Load model - using faster-whisper for better performance
-        # You can also use: "large-v3", "medium", "small", "base", "tiny"
-        model = whisperx.load_model("base", device="cpu", compute_type="int8")
+        if publisher:
+            publisher.info("asrx", "ASRX_LOADING_MODEL")
+
+        asrx = SelfASRXFixed()
 
         if publisher:
             publisher.info("asrx", "ASRX_TRANSCRIBING")
 
-        # Transcribe audio
-        result = model.transcribe(video_path, language="en")
-
-        # Align timestamps
-        model_a, metadata = whisperx.load_align_model(language_code=result["language"])
-        result = whisperx.align(
-            result["segments"], model_a, metadata, video_path, device="cpu"
+        result = asrx.process(
+            audio_input,
+            output_path=None,
+            file_uuid=file_uuid or None,
+            max_speakers=10,
+            quality_threshold=0.85,
+            checkpoint_path=checkpoint_path,
         )
 
-        # Diarization (speaker segmentation)
-        try:
-            from whisperx.diarize import DiarizationPipeline
-
-            # DiarizationPipeline parameters: model_name, token, device, cache_dir
-            diarize_model = DiarizationPipeline(
-                model_name="pyannote/speaker-diarization",
-                token=None,  # HuggingFace token (None for public models)
-                device="cpu",
-            )
-            diarize_segments = diarize_model(video_path)
-
-            # Assign speaker labels
-            result = whisperx.assign_word_speakers(diarize_segments, result)
-        except Exception as e:
+        if "error" in result:
             if publisher:
-                publisher.info("asrx", f"Diarization skipped: {e}")
+                publisher.error("asrx", result["error"])
+            output_result = {"language": None, "segments": []}
+            _atomic_write(output_path, output_result)
+            if publisher:
+                publisher.complete("asrx", "0 segments")
+            _cleanup(tmp_dir)
+            return output_result
 
-        # Build output
-        segments = []
-        for seg in result.get("segments", []):
-            text = seg.get("text", "").strip()
-            if text:
-                segments.append(
-                    {
-                        "start": seg.get("start", 0.0),
-                        "end": seg.get("end", 0.0),
-                        "text": text,
-                        "speaker_id": seg.get("speaker", None),
-                    }
-                )
-
-        output_result = {"language": result.get("language"), "segments": segments}
+        # Stage 3: Convert to Rust-expected format
+        output_result = _convert_result(result, output_path)
 
         if publisher:
-            publisher.complete("asrx", f"{len(segments)} segments")
+            publisher.info("asrx", f"ASRX_COMPLETE:{len(output_result['segments'])}")
 
-        with open(output_path, "w") as f:
-            json.dump(output_result, f, indent=2)
+        _atomic_write(output_path, output_result)
 
+        if publisher:
+            publisher.complete("asrx",
+                               f"{len(output_result['segments'])} segments")
+
+        print(f"[ASRX] Saved {len(output_result['segments'])} segments "
+              f"to {output_path}", file=sys.stderr)
+
+        _cleanup(tmp_dir)
         return output_result
 
     except Exception as e:
         if publisher:
-            publisher.error("asrx", f"Error: {e}")
-        result = {"language": None, "segments": []}
+            publisher.error("asrx", str(e))
+        import traceback
+        traceback.print_exc()
+
+        output_result = {"language": None, "segments": []}
+        _atomic_write(output_path, output_result)
         if publisher:
             publisher.complete("asrx", "0 segments")
-        with open(output_path, "w") as f:
-            json.dump(result, f, indent=2)
-        return result
+        # 如果 checkpoint 已存在（Step 3 完成後 crash），保留 WAV 給 resume
+        if not os.path.exists(checkpoint_path):
+            _cleanup(tmp_dir)
+        else:
+            print(f"[ASRX] Checkpoint saved, keeping temp dir for resume: {tmp_dir}")
+        return output_result
 
 
 if __name__ == "__main__":
-    parser = argparse.ArgumentParser(description="ASRX Speaker Diarization")
-    parser.add_argument("video_path", help="Path to video file")
-    parser.add_argument("output_path", help="Output JSON path")
-    parser.add_argument("--uuid", "-u", help="UUID for Redis progress", default="")
+    parser = argparse.ArgumentParser(description="ASRX Processor (Hybrid Pipeline)")
+    parser.add_argument("video_path", help="Path to video/audio file")
+    parser.add_argument("output_path", help="Path to output JSON file")
+    parser.add_argument("--uuid", help="UUID for Redis publishing", default="")
+    parser.add_argument("--file-uuid", help="File UUID for Qdrant storage", default="")
+    parser.add_argument("--resume", action="store_true",
+                        help="Resume from checkpoint (skip Steps 1-3)")
+
     args = parser.parse_args()
 
-    process_asrx(args.video_path, args.output_path, args.uuid)
+    if not args.resume and not Path(args.video_path).exists():
+        print(f"Error: Video file not found: {args.video_path}")
+        sys.exit(1)
+
+    result = process_asrx(args.video_path, args.output_path, args.uuid,
+                          args.file_uuid, resume=args.resume)
+
+    print("\n[Summary]")
+    print(f"  Total segments: {len(result.get('segments', []))}")
+    if "speaker_stats" in result:
+        print(f"  Detected speakers: {len(result['speaker_stats'])}")
+        for speaker, stats in result["speaker_stats"].items():
+            print(f"    {speaker}: {stats['count']} segments")
diff --git a/scripts/asrx_processor_contract_v1.py b/scripts/asrx_processor_contract_v1.py
deleted file mode 100644
index a06bcc3..0000000
--- a/scripts/asrx_processor_contract_v1.py
+++ /dev/null
@@ -1,584 +0,0 @@
-#!/opt/homebrew/bin/python3.11
-"""
-ASRX Processor - AI-Driven Processor Contract Version 1.0
-
-Compliant with AI-Driven Processor Contract v1.0
-Effective Date: 2025-03-27
-
-Features:
-1. Standardized command-line interface
-2. Redis progress reporting
-3. Signal handling (SIGTERM, SIGINT)
-4. Health check mode
-5. Resource monitoring
-6. Contract-compliant JSON output
-7. Unified configuration
-"""
-
-import sys
-import json
-import os
-import argparse
-import signal
-import time
-import subprocess
-import traceback
-from datetime import datetime
-from typing import Dict, Any
-
-# Redis Publisher for progress reporting
-try:
-    sys.path.insert(0, os.path.dirname(os.path.abspath(__file__)))
-    from redis_publisher import RedisPublisher
-
-    REDIS_AVAILABLE = True
-except ImportError:
-    REDIS_AVAILABLE = False
-    print(
-        "WARNING: RedisPublisher not available, progress reporting disabled",
-        file=sys.stderr,
-    )
-
-# Contract version
-CONTRACT_VERSION = "1.0"
-PROCESSOR_NAME = (
-    "/Users/accusys/momentry_core_0.1/scripts/asrx_processor_contract_v1.py"
-)
-PROCESSOR_VERSION = "1.0.0"
-MODEL_NAME = "pyannote"
-MODEL_VERSION = "3.1"
-
-# Unified configuration defaults
-DEFAULT_TIMEOUT = 7200  # 2 hours for speaker diarization
-DEFAULT_MODEL_SIZE = "base"
-DEFAULT_DEVICE = "cpu"
-DEFAULT_LANGUAGE = "auto"
-DEFAULT_BATCH_SIZE = 16
-DEFAULT_DIARIZATION = True
-DEFAULT_MIN_SPEAKERS = 1
-DEFAULT_MAX_SPEAKERS = 10
-
-
-# Signal handling with timeout support
-class SignalHandler:
-    """Handle system signals for graceful shutdown"""
-
-    def __init__(self):
-        self.should_exit = False
-        self.exit_code = 0
-        signal.signal(signal.SIGTERM, self.handle_signal)
-        signal.signal(signal.SIGINT, self.handle_signal)
-
-    def handle_signal(self, signum, frame):
-        """Handle termination signals"""
-        print(f"\n收到信号 {signum}，正在优雅关闭...")
-        self.should_exit = True
-        self.exit_code = 128 + signum
-
-    def should_stop(self):
-        """Check if should stop processing"""
-        return self.should_exit
-
-
-# Timeout manager
-class TimeoutManager:
-    """Manage processing timeouts"""
-
-    def __init__(self, timeout_seconds: int):
-        self.timeout_seconds = timeout_seconds
-        self.start_time = time.time()
-        self.timer = None
-
-    def check_timeout(self) -> bool:
-        """Check if timeout has been reached"""
-        elapsed = time.time() - self.start_time
-        return elapsed > self.timeout_seconds
-
-    def get_remaining_time(self) -> float:
-        """Get remaining time in seconds"""
-        elapsed = time.time() - self.start_time
-        return max(0, self.timeout_seconds - elapsed)
-
-    def format_remaining_time(self) -> str:
-        """Format remaining time as HH:MM:SS"""
-        remaining = self.get_remaining_time()
-        hours = int(remaining // 3600)
-        minutes = int((remaining % 3600) // 60)
-        seconds = int(remaining % 60)
-        return f"{hours:02d}:{minutes:02d}:{seconds:02d}"
-
-
-# Health check functions
-def check_environment() -> Dict[str, Any]:
-    """Check environment and dependencies"""
-    checks = []
-
-    # Check 1: whisperx for speaker diarization
-    try:
-        import whisperx
-
-        checks.append(
-            {
-                "name": "whisperx",
-                "status": "available",
-                "version": getattr(whisperx, "__version__", "unknown"),
-            }
-        )
-    except ImportError:
-        checks.append({"name": "whisperx", "status": "missing", "version": None})
-
-    # Check 2: FFmpeg/FFprobe
-    try:
-        ffprobe_result = subprocess.run(
-            ["ffprobe", "-version"],
-            capture_output=True,
-            text=True,
-            timeout=5,
-        )
-        if ffprobe_result.returncode == 0:
-            version_line = ffprobe_result.stdout.split("\n")[0]
-            checks.append(
-                {"name": "ffprobe", "status": "available", "version": version_line}
-            )
-        else:
-            checks.append({"name": "ffprobe", "status": "error", "version": None})
-    except (subprocess.TimeoutExpired, FileNotFoundError):
-        checks.append({"name": "ffprobe", "status": "missing", "version": None})
-
-    # Check 3: Redis (optional)
-    checks.append(
-        {
-            "name": "redis",
-            "status": "available" if REDIS_AVAILABLE else "optional",
-            "version": None,
-        }
-    )
-
-    # Check 4: Python version
-    checks.append(
-        {
-            "name": "python",
-            "status": "available",
-            "version": f"{sys.version_info.major}.{sys.version_info.minor}.{sys.version_info.micro}",
-        }
-    )
-
-    # Check 5: CUDA/GPU availability (optional)
-    try:
-        import torch
-
-        cuda_available = torch.cuda.is_available()
-        checks.append(
-            {
-                "name": "cuda",
-                "status": "available" if cuda_available else "optional",
-                "version": torch.version.cuda if cuda_available else None,
-            }
-        )
-    except ImportError:
-        checks.append({"name": "cuda", "status": "optional", "version": None})
-
-    return {
-        "timestamp": datetime.now().isoformat(),
-        "processor_name": PROCESSOR_NAME,
-        "processor_version": PROCESSOR_VERSION,
-        "contract_version": CONTRACT_VERSION,
-        "model_name": MODEL_NAME,
-        "model_version": MODEL_VERSION,
-        "checks": checks,
-    }
-
-
-def check_video_file(video_path: str) -> Dict[str, Any]:
-    """Check video file properties"""
-    try:
-        result = subprocess.run(
-            [
-                "ffprobe",
-                "-v",
-                "error",
-                "-select_streams",
-                "v:0",
-                "-show_entries",
-                "stream=codec_name,width,height,duration,r_frame_rate",
-                "-show_entries",
-                "format=duration,size",
-                "-of",
-                "json",
-                video_path,
-            ],
-            capture_output=True,
-            text=True,
-            timeout=10,
-        )
-
-        if result.returncode != 0:
-            return {
-                "valid": False,
-                "error": result.stderr[:200] if result.stderr else "Unknown error",
-            }
-
-        info = json.loads(result.stdout)
-
-        video_info = {}
-        if "streams" in info and len(info["streams"]) > 0:
-            stream = info["streams"][0]
-            video_info = {
-                "codec": stream.get("codec_name", "unknown"),
-                "width": int(stream.get("width", 0)),
-                "height": int(stream.get("height", 0)),
-                "duration": float(stream.get("duration", 0)),
-                "frame_rate": stream.get("r_frame_rate", "0/0"),
-            }
-
-        format_info = {}
-        if "format" in info:
-            format_info = {
-                "format_duration": float(info["format"].get("duration", 0)),
-                "file_size": int(info["format"].get("size", 0)),
-            }
-
-        return {
-            "valid": True,
-            "video_info": video_info,
-            "format_info": format_info,
-            "exists": os.path.exists(video_path),
-            "file_size": os.path.getsize(video_path)
-            if os.path.exists(video_path)
-            else 0,
-        }
-
-    except Exception as e:
-        return {"valid": False, "error": str(e)}
-
-
-# Main processing function
-def process_asrx(
-    video_path: str,
-    output_path: str,
-    uuid: str = "",
-    model_size: str = DEFAULT_MODEL_SIZE,
-    device: str = DEFAULT_DEVICE,
-    language: str = DEFAULT_LANGUAGE,
-    batch_size: int = DEFAULT_BATCH_SIZE,
-    diarization: bool = DEFAULT_DIARIZATION,
-    min_speakers: int = DEFAULT_MIN_SPEAKERS,
-    max_speakers: int = DEFAULT_MAX_SPEAKERS,
-    timeout: int = DEFAULT_TIMEOUT,
-) -> Dict[str, Any]:
-    """Process video for speaker diarization using whisperx"""
-
-    # Initialize
-    signal_handler = SignalHandler()
-    timeout_manager = TimeoutManager(timeout)
-    publisher = RedisPublisher(uuid) if REDIS_AVAILABLE and uuid else None
-
-    def publish(stage: str, message: str, data: Dict = None):
-        if publisher:
-            publisher.info(PROCESSOR_NAME, stage, message, data)
-
-    publish("ASRX_START", f"开始处理: {os.path.basename(video_path)}")
-
-    result = {
-        "processor_name": PROCESSOR_NAME,
-        "processor_version": PROCESSOR_VERSION,
-        "contract_version": CONTRACT_VERSION,
-        "model_name": MODEL_NAME,
-        "model_version": MODEL_VERSION,
-        "video_path": video_path,
-        "output_path": output_path,
-        "uuid": uuid,
-        "timestamp": datetime.now().isoformat(),
-        "parameters": {
-            "model_size": model_size,
-            "device": device,
-            "language": language,
-            "batch_size": batch_size,
-            "diarization": diarization,
-            "min_speakers": min_speakers,
-            "max_speakers": max_speakers,
-            "timeout": timeout,
-        },
-        "success": False,
-        "error": None,
-        "segments": [],
-        "speakers": [],
-        "processing_time": 0,
-        "resource_usage": {},
-    }
-
-    start_time = time.time()
-
-    try:
-        # Check timeout
-        if timeout_manager.check_timeout():
-            raise TimeoutError(f"超时 ({timeout} 秒)")
-
-        # Check if should exit
-        if signal_handler.should_stop():
-            raise KeyboardInterrupt("收到停止信号")
-
-        # Check video file
-        publish("ASRX_CHECK_VIDEO", "检查视频文件")
-        video_check = check_video_file(video_path)
-        if not video_check.get("valid", False):
-            raise ValueError(f"无效的视频文件: {video_check.get('error', '未知错误')}")
-
-        result["video_info"] = video_check.get("video_info", {})
-        result["format_info"] = video_check.get("format_info", {})
-
-        # Import whisperx
-        publish("ASRX_LOAD_MODEL", f"加载模型: {model_size}")
-        try:
-            import whisperx
-        except ImportError as e:
-            raise ImportError(f"whisperx 未安装: {e}")
-
-        # Load model
-        publish("ASRX_LOADING", f"加载 whisperx 模型 ({model_size}, {device})")
-        model = whisperx.load_model(
-            model_size,
-            device=device,
-            compute_type="int8" if device == "cpu" else "float16",
-        )
-
-        # Transcribe
-        publish("ASRX_TRANSCRIBING", "转录音频")
-        transcript = model.transcribe(
-            video_path,
-            language=language if language != "auto" else None,
-            batch_size=batch_size,
-        )
-
-        # Align timestamps
-        publish("ASRX_ALIGNING", "对齐时间戳")
-        model_a, metadata = whisperx.load_align_model(
-            language_code=transcript["language"]
-        )
-        transcript = whisperx.align(
-            transcript["segments"],
-            model_a,
-            metadata,
-            video_path,
-            device,
-            return_char_alignments=False,
-        )
-
-        # Speaker diarization
-        if diarization:
-            publish("ASRX_DIARIZATION", "说话人分离")
-            diarize_model = whisperx.DiarizationPipeline(
-                use_auth_token=None, device=device
-            )
-
-            # Add min/max speakers
-            diarize_segments = diarize_model(
-                video_path,
-                min_speakers=min_speakers,
-                max_speakers=max_speakers,
-            )
-
-            transcript = whisperx.assign_word_speakers(diarize_segments, transcript)
-
-            # Extract speaker information
-            speakers = {}
-            for segment in transcript["segments"]:
-                if "speaker" in segment:
-                    speaker_id = segment["speaker"]
-                    if speaker_id not in speakers:
-                        speakers[speaker_id] = {
-                            "id": speaker_id,
-                            "segment_count": 0,
-                            "total_words": 0,
-                            "total_duration": 0.0,
-                        }
-
-                    speakers[speaker_id]["segment_count"] += 1
-                    speakers[speaker_id]["total_words"] += len(
-                        segment.get("text", "").split()
-                    )
-                    speakers[speaker_id]["total_duration"] += segment.get(
-                        "end", 0
-                    ) - segment.get("start", 0)
-
-            result["speakers"] = list(speakers.values())
-
-        # Format segments
-        segments = []
-        for segment in transcript.get("segments", []):
-            segments.append(
-                {
-                    "start": segment.get("start", 0.0),
-                    "end": segment.get("end", 0.0),
-                    "text": segment.get("text", ""),
-                    "speaker": segment.get("speaker", None),
-                    "words": segment.get("words", []),
-                    "confidence": segment.get("confidence", 0.0),
-                }
-            )
-
-        result["segments"] = segments
-        result["language"] = transcript.get("language", "unknown")
-        result["success"] = True
-
-        publish("ASRX_COMPLETE", f"完成: {len(segments)} 个片段")
-
-    except TimeoutError as e:
-        result["error"] = f"处理超时: {e}"
-        publish("ASRX_TIMEOUT", f"超时: {e}")
-    except KeyboardInterrupt:
-        result["error"] = "处理被用户中断"
-        publish("ASRX_INTERRUPTED", "处理被中断")
-    except ImportError as e:
-        result["error"] = f"依赖缺失: {e}"
-        publish("ASRX_MISSING_DEPS", f"缺少依赖: {e}")
-    except Exception as e:
-        result["error"] = f"处理错误: {str(e)}"
-        publish("ASRX_ERROR", f"错误: {str(e)}")
-        traceback.print_exc()
-
-    # Calculate processing time
-    processing_time = time.time() - start_time
-    result["processing_time"] = processing_time
-
-    # Add resource usage
-    try:
-        import psutil
-
-        process = psutil.Process()
-        memory_info = process.memory_info()
-        result["resource_usage"] = {
-            "cpu_percent": process.cpu_percent(),
-            "memory_mb": memory_info.rss / (1024 * 1024),
-            "user_time": process.cpu_times().user,
-            "system_time": process.cpu_times().system,
-        }
-    except ImportError:
-        result["resource_usage"] = {"error": "psutil not available"}
-
-    # Save result
-    try:
-        with open(output_path, "w") as f:
-            json.dump(result, f, indent=2, ensure_ascii=False)
-        publish("ASRX_SAVED", f"结果保存到: {output_path}")
-    except Exception as e:
-        result["error"] = f"保存结果失败: {str(e)}"
-        publish("ASRX_SAVE_ERROR", f"保存失败: {str(e)}")
-
-    return result
-
-
-def main():
-    """Main entry point"""
-    parser = argparse.ArgumentParser(
-        description=f"{PROCESSOR_NAME.upper()} Processor v{PROCESSOR_VERSION} - Speaker Diarization"
-    )
-    parser.add_argument("video_path", help="Path to input video file")
-    parser.add_argument("output_path", help="Path to output JSON file")
-    parser.add_argument("--uuid", help="UUID for progress tracking", default="")
-    parser.add_argument(
-        "--model-size",
-        help=f"Model size (default: {DEFAULT_MODEL_SIZE})",
-        default=DEFAULT_MODEL_SIZE,
-        choices=["tiny", "base", "small", "medium", "large-v3"],
-    )
-    parser.add_argument(
-        "--device",
-        help=f"Device to use (default: {DEFAULT_DEVICE})",
-        default=DEFAULT_DEVICE,
-        choices=["cpu", "cuda"],
-    )
-    parser.add_argument(
-        "--language",
-        help=f"Language code or 'auto' (default: {DEFAULT_LANGUAGE})",
-        default=DEFAULT_LANGUAGE,
-    )
-    parser.add_argument(
-        "--batch-size",
-        help=f"Batch size for processing (default: {DEFAULT_BATCH_SIZE})",
-        type=int,
-        default=DEFAULT_BATCH_SIZE,
-    )
-    parser.add_argument(
-        "--no-diarization",
-        help="Disable speaker diarization",
-        action="store_true",
-    )
-    parser.add_argument(
-        "--min-speakers",
-        help=f"Minimum number of speakers (default: {DEFAULT_MIN_SPEAKERS})",
-        type=int,
-        default=DEFAULT_MIN_SPEAKERS,
-    )
-    parser.add_argument(
-        "--max-speakers",
-        help=f"Maximum number of speakers (default: {DEFAULT_MAX_SPEAKERS})",
-        type=int,
-        default=DEFAULT_MAX_SPEAKERS,
-    )
-    parser.add_argument(
-        "--timeout",
-        help=f"Timeout in seconds (default: {DEFAULT_TIMEOUT})",
-        type=int,
-        default=DEFAULT_TIMEOUT,
-    )
-    parser.add_argument(
-        "--health-check",
-        help="Run health check and exit",
-        action="store_true",
-    )
-    parser.add_argument(
-        "--check-video",
-        help="Check video file and exit",
-        action="store_true",
-    )
-
-    args = parser.parse_args()
-
-    # Health check mode
-    if args.health_check:
-        health = check_environment()
-        print(json.dumps(health, indent=2, ensure_ascii=False))
-        return (
-            0
-            if all(c["status"] in ["available", "optional"] for c in health["checks"])
-            else 1
-        )
-
-    # Video check mode
-    if args.check_video:
-        video_check = check_video_file(args.video_path)
-        print(json.dumps(video_check, indent=2, ensure_ascii=False))
-        return 0 if video_check.get("valid", False) else 1
-
-    # Normal processing mode
-    result = process_asrx(
-        video_path=args.video_path,
-        output_path=args.output_path,
-        uuid=args.uuid,
-        model_size=args.model_size,
-        device=args.device,
-        language=args.language,
-        batch_size=args.batch_size,
-        diarization=not args.no_diarization,
-        min_speakers=args.min_speakers,
-        max_speakers=args.max_speakers,
-        timeout=args.timeout,
-    )
-
-    # Print result summary
-    if result.get("success", False):
-        print(f"✅ {PROCESSOR_NAME.upper()} 处理成功")
-        print(f"   片段数: {len(result.get('segments', []))}")
-        print(f"   说话人数: {len(result.get('speakers', []))}")
-        print(f"   处理时间: {result.get('processing_time', 0):.1f} 秒")
-        print(f"   输出文件: {args.output_path}")
-        return 0
-    else:
-        print(f"❌ {PROCESSOR_NAME.upper()} 处理失败")
-        print(f"   错误: {result.get('error', '未知错误')}")
-        return 1
-
-
-if __name__ == "__main__":
-    sys.exit(main())
diff --git a/scripts/asrx_processor_custom.py b/scripts/asrx_processor_custom.py
deleted file mode 100644
index 33168e8..0000000
--- a/scripts/asrx_processor_custom.py
+++ /dev/null
@@ -1,328 +0,0 @@
-#!/opt/homebrew/bin/python3.11
-"""
-ASRX Processor - Custom Implementation Wrapper
-Uses SpeechBrain ECAPA-TDNN (no HuggingFace token required)
-
-Pipeline:
-  1. Preprocess: ffprobe audio tracks → select best track → extract WAV
-  2. Process: VAD (Silero) → Speaker embedding (ECAPA-TDNN) → Spectral clustering
-  3. Output: segments with speaker_id
-"""
-
-import sys
-import json
-import argparse
-import os
-import subprocess
-import tempfile
-from pathlib import Path
-
-sys.path.insert(0, os.path.dirname(os.path.abspath(__file__)))
-sys.path.insert(
-    0, os.path.join(os.path.dirname(os.path.abspath(__file__)), "asrx_self")
-)
-
-from redis_publisher import RedisPublisher
-
-
-def probe_audio_tracks(video_path: str) -> list:
-    """Use ffprobe to list all audio tracks in the video file."""
-    cmd = [
-        "ffprobe", "-v", "quiet", "-print_format", "json",
-        "-show_streams", "-select_streams", "a", video_path,
-    ]
-    try:
-        result = subprocess.run(cmd, capture_output=True, text=True, timeout=30)
-        data = json.loads(result.stdout)
-        tracks = []
-        for stream in data.get("streams", []):
-            track = {
-                "index": stream.get("index"),
-                "codec": stream.get("codec_name"),
-                "language": stream.get("tags", {}).get("language", "und"),
-                "channels": stream.get("channels", 0),
-                "sample_rate": stream.get("sample_rate", "0"),
-            }
-            tracks.append(track)
-        return tracks
-    except Exception as e:
-        print(f"[ASRX] ffprobe failed: {e}")
-        return []
-
-
-def select_best_track(tracks: list) -> int:
-    """Select the best audio track: English > first available > fallback to 0."""
-    if not tracks:
-        return 0
-
-    # Priority 1: English track
-    for i, t in enumerate(tracks):
-        if t["language"] == "eng" or t["language"] == "en":
-            print(f"[ASRX] Selected English track (index {t['index']})")
-            return i
-
-    # Priority 2: First track with the most channels
-    best = 0
-    for i, t in enumerate(tracks):
-        if t["channels"] > tracks[best]["channels"]:
-            best = i
-
-    print(f"[ASRX] Selected track {best} (lang={tracks[best]['language']}, ch={tracks[best]['channels']})")
-    return best
-
-
-def extract_audio_to_wav(video_path: str, track_index: int, output_wav: str) -> bool:
-    """Extract selected audio track to 16kHz mono WAV using ffmpeg."""
-    cmd = [
-        "ffmpeg", "-y", "-v", "quiet",
-        "-i", video_path,
-        "-map", f"0:{track_index}",
-        "-ar", "16000",
-        "-ac", "1",
-        "-sample_fmt", "s16",
-        output_wav,
-    ]
-    try:
-        subprocess.run(cmd, check=True, capture_output=True, timeout=300)
-        return True
-    except Exception as e:
-        print(f"[ASRX] ffmpeg extraction failed: {e}")
-        return False
-
-
-def _cleanup(tmp_dir):
-    """Clean up temporary directory."""
-    if tmp_dir and os.path.exists(tmp_dir):
-        import shutil
-        shutil.rmtree(tmp_dir, ignore_errors=True)
-
-
-def process_asrx_custom(video_path: str, output_path: str, uuid: str = ""):
-    """Process video for speaker diarization using custom implementation"""
-
-    publisher = RedisPublisher(uuid) if uuid else None
-    if publisher:
-        publisher.info("asrx", "ASRX_START")
-
-    tmp_dir = None
-
-    try:
-        # Ensure working directory is the scripts dir for model loading
-        script_dir = os.path.dirname(os.path.abspath(__file__))
-        os.chdir(script_dir)
-
-        # Debug: check ffmpeg availability
-        import shutil
-        ffmpeg_path = shutil.which("ffmpeg")
-        print(f"[ASRX] ffmpeg: {ffmpeg_path}", file=sys.stderr)
-        print(f"[ASRX] CWD: {os.getcwd()}", file=sys.stderr)
-
-        # ---- Stage 1: Audio Track Preprocessing ----
-        print("\n[ASRX] ===== Stage 1: Audio Track Analysis =====", file=sys.stderr)
-        print(f"[ASRX] Input: {video_path}", file=sys.stderr)
-
-        tracks = probe_audio_tracks(video_path)
-        if tracks:
-            print(f"[ASRX] Found {len(tracks)} audio track(s):", file=sys.stderr)
-            for t in tracks:
-                print(f"  Track {t['index']}: {t['codec']} {t['channels']}ch {t['sample_rate']}Hz lang={t['language']}", file=sys.stderr)
-        else:
-            print("[ASRX] No audio tracks found via ffprobe, using raw file", file=sys.stderr)
-
-        # Select best track
-        track_idx = select_best_track(tracks) if tracks else 0
-        actual_track_index = tracks[track_idx]["index"] if tracks else track_idx
-
-        # Extract audio to WAV
-        tmp_dir = tempfile.mkdtemp(prefix="asrx_")
-        wav_path = os.path.join(tmp_dir, "audio.wav")
-
-        if extract_audio_to_wav(video_path, actual_track_index, wav_path):
-            wav_size = os.path.getsize(wav_path)
-            print(f"[ASRX] Audio extracted: {wav_path} ({wav_size / 1024 / 1024:.1f}MB)", file=sys.stderr)
-            audio_input = wav_path
-        else:
-            print("[ASRX] Audio extraction failed, falling back to original file", file=sys.stderr)
-            audio_input = video_path
-
-        # ---- Stage 2: Load ASR segments for time alignment ----
-        # Try multiple paths to find ASR JSON
-        asr_segments = []
-        asr_fallback_reason = ""
-        asr_candidates = [
-            output_path.replace(".asrx.json", ".asr.json") if output_path else "",
-            os.path.join(os.path.dirname(output_path) if output_path else ".", os.path.basename(video_path).rsplit(".", 1)[0] + ".asr.json"),
-            os.path.join(os.path.dirname(output_path) if output_path else ".", "dd61fda85fee441fdd00ab5528213ff7.asr.json"),
-        ]
-        asr_path = ""
-        for candidate in asr_candidates:
-            if candidate and os.path.exists(candidate):
-                asr_path = candidate
-                break
-        if asr_path:
-            try:
-                with open(asr_path) as f:
-                    asr_data = json.load(f)
-                asr_segments = asr_data.get("segments", [])
-                print(f"[ASRX] Loaded {len(asr_segments)} ASR segments from {asr_path}", file=sys.stderr)
-                asr_fallback_reason = f"loaded_{len(asr_segments)}_segments"
-            except Exception as e:
-                asr_fallback_reason = f"load_error_{e}"
-                print(f"[ASRX] Failed to load ASR segments: {e}", file=sys.stderr)
-        else:
-            asr_fallback_reason = f"asr_json_not_found_tried_{len(asr_candidates)}_paths"
-            print(f"[ASRX] ASR output not found, tried {len(asr_candidates)} paths. First candidate: {asr_candidates[0]}", file=sys.stderr)
-
-        # ---- Stage 3: ASRX Processing ----
-        from asrx_self.main_fixed import SelfASRXFixed
-
-        if publisher:
-            publisher.info("asrx", "ASRX_LOADING_MODEL")
-
-        asrx = SelfASRXFixed()
-
-        if publisher:
-            publisher.info("asrx", "ASRX_TRANSCRIBING")
-
-        if asr_segments:
-            # Use ASR segment boundaries for speaker embedding extraction
-            print(f"[ASRX] Using {len(asr_segments)} ASR segments for diarization", file=sys.stderr)
-            result = asrx.process_with_segments(
-                audio_input,
-                asr_segments,
-                output_path=None,
-            )
-        else:
-            # Fallback: VAD-based diarization
-            result = asrx.process(
-                audio_input,
-                output_path=None,
-                min_speech_duration_ms=500,
-                max_speakers=10,
-            )
-
-        if "error" in result:
-            if publisher:
-                publisher.error("asrx", result["error"])
-
-            # Return empty result
-            output_result = {"language": None, "segments": []}
-
-            with open(output_path, "w") as f:
-                json.dump(output_result, f, indent=2)
-
-            if publisher:
-                publisher.complete("asrx", "0 segments")
-
-            _cleanup(tmp_dir)
-            return output_result
-
-        # Convert to Rust-expected format (start_frame/end_frame/speaker)
-        # Read fps from probe json ({file_uuid}.probe.json)
-        _debug = {"asr_fallback": asr_fallback_reason, "asr_path": asr_path}
-        fps = 30.0
-        output_dir = os.path.dirname(output_path) if output_path else "."
-        base_name = os.path.basename(output_path) if output_path else ""
-        # Extract uuid from {uuid}.{type}.json format
-        uuid_part = base_name.split(".")[0] if base_name else ""
-        probe_candidates = [
-            os.path.join(output_dir, f"{uuid_part}.probe.json"),
-        ]
-        for p in probe_candidates:
-            if os.path.exists(p):
-                try:
-                    with open(p) as pf:
-                        probe_data = json.load(pf)
-                        if "fps" in probe_data:
-                            fps = float(probe_data["fps"])
-                            print(f"[ASRX] FPS from probe: {fps}", file=sys.stderr)
-                        break
-                except:
-                    pass
-        output_result = {
-            "language": None,
-            "segments": [],
-        }
-
-        # Convert segments
-        for seg in result["segments"]:
-            start_sec = seg["start"]
-            end_sec = seg["end"]
-            output_result["segments"].append(
-                {
-                    "start_time": start_sec,
-                    "end_time": end_sec,
-                    "start_frame": int(start_sec * fps),
-                    "end_frame": int(end_sec * fps),
-                    "text": "",
-                    "speaker_id": seg["speaker"],
-                }
-            )
-
-        # Add speaker_stats as optional metadata
-        if "speaker_stats" in result:
-            output_result["speaker_stats"] = result["speaker_stats"]
-
-        # 傳遞 embeddings（每個 segment 對應的 192-D speaker embedding）
-        if "embeddings" in result:
-            output_result["embeddings"] = result["embeddings"]
-
-        if publisher:
-            publisher.info("asrx", f"ASRX_COMPLETE:{len(output_result['segments'])}")
-
-        # Save output
-        output_result["_debug"] = _debug
-        with open(output_path, "w") as f:
-            json.dump(output_result, f, indent=2)
-
-        if publisher:
-            publisher.complete("asrx", f"{len(output_result['segments'])} segments")
-
-        print(f"[ASRX-Custom] Saved {len(output_result['segments'])} segments to {output_path}", file=sys.stderr)
-
-        _cleanup(tmp_dir)
-        return output_result
-
-    except Exception as e:
-        if publisher:
-            publisher.error("asrx", str(e))
-
-        import traceback
-
-        traceback.print_exc()
-
-        # Return empty result on error
-        output_result = {"language": None, "segments": []}
-
-        with open(output_path, "w") as f:
-            json.dump(output_result, f, indent=2)
-
-        if publisher:
-            publisher.complete("asrx", "0 segments")
-
-        _cleanup(tmp_dir)
-        return output_result
-
-
-if __name__ == "__main__":
-    parser = argparse.ArgumentParser(
-        description="ASRX Processor (Custom Implementation)"
-    )
-    parser.add_argument("video_path", help="Path to video/audio file")
-    parser.add_argument("output_path", help="Path to output JSON file")
-    parser.add_argument("--uuid", help="UUID for Redis publishing", default="")
-
-    args = parser.parse_args()
-
-    if not Path(args.video_path).exists():
-        print(f"Error: Video file not found: {args.video_path}")
-        sys.exit(1)
-
-    result = process_asrx_custom(args.video_path, args.output_path, args.uuid)
-
-    print("\n[Summary]")
-    print(f"  Total segments: {len(result['segments'])}")
-    if "speaker_stats" in result:
-        print(f"  Detected speakers: {len(result['speaker_stats'])}")
-        for speaker, stats in result["speaker_stats"].items():
-            print(f"    {speaker}: {stats['count']} segments")
diff --git a/scripts/asrx_processor_simplified.py b/scripts/asrx_processor_simplified.py
deleted file mode 100755
index deace63..0000000
--- a/scripts/asrx_processor_simplified.py
+++ /dev/null
@@ -1,177 +0,0 @@
-#!/opt/homebrew/bin/python3.11
-"""
-ASRX 處理器 - 簡化版
-先做轉錄，說話人分離可選
-修復 PyTorch 2.6 兼容性問題
-"""
-
-# Fix for PyTorch 2.6+ compatibility - MUST be set before importing torch
-import os
-os.environ["TORCH_FORCE_WEIGHTS_ONLY_LOAD"] = "0"
-
-import sys
-import json
-import argparse
-import signal
-import subprocess
-
-sys.path.insert(0, os.path.dirname(os.path.abspath(__file__)))
-from redis_publisher import RedisPublisher
-
-
-def signal_handler(signum, frame):
-    print(f"ASRX: Received signal {signum}, exiting...")
-    sys.exit(1)
-
-
-def has_audio_stream(video_path):
-    """Check if video file has audio stream using ffprobe."""
-    try:
-        cmd = [
-            "ffprobe",
-            "-v",
-            "error",
-            "-select_streams",
-            "a",
-            "-show_entries",
-            "stream=codec_type",
-            "-of",
-            "csv=p=0",
-            video_path,
-        ]
-        result = subprocess.run(cmd, capture_output=True, text=True, check=True)
-        return bool(result.stdout.strip())
-    except subprocess.CalledProcessError:
-        return False
-    except FileNotFoundError:
-        print("WARNING: ffprobe not found, assuming audio exists")
-        return True
-
-
-def process_asrx(video_path: str, output_path: str, uuid: str = "", skip_diarization: bool = True):
-    """
-    Process video for speaker diarization using whisperx
-    
-    Args:
-        video_path: Path to video file
-        output_path: Path to output JSON
-        uuid: UUID for Redis progress
-        skip_diarization: Skip speaker diarization (only transcription)
-    """
-    
-    signal.signal(signal.SIGTERM, signal_handler)
-    signal.signal(signal.SIGINT, signal_handler)
-
-    publisher = RedisPublisher(uuid) if uuid else None
-    if publisher:
-        publisher.info("asrx", "ASRX_START")
-
-    try:
-        import whisperx
-        import torch
-    except ImportError as e:
-        if publisher:
-            publisher.error("asrx", f"Missing dependency: {e}")
-        result = {"language": None, "segments": []}
-        if publisher:
-            publisher.complete("asrx", "0 segments")
-        with open(output_path, "w") as f:
-            json.dump(result, f, indent=2)
-        sys.exit(1)
-
-    # Check for audio stream
-    if not has_audio_stream(video_path):
-        if publisher:
-            publisher.info("asrx", "No audio stream detected, skipping transcription")
-        output = {"language": "", "language_probability": 0.0, "segments": []}
-        with open(output_path, "w") as f:
-            json.dump(output, f, indent=2)
-        if publisher:
-            publisher.complete("asrx", "0 segments (no audio)")
-        sys.stderr.write("ASRX: No audio stream, skipping transcription\n")
-        sys.stderr.flush()
-        sys.exit(0)
-
-    if publisher:
-        publisher.info("asrx", "ASRX_LOADING_MODEL")
-
-    try:
-        # Load model
-        if publisher:
-            publisher.info("asrx", "Loading whisperx base model (this may take a while)...")
-        
-        model = whisperx.load_model("base", device="cpu", compute_type="int8")
-        
-        if publisher:
-            publisher.info("asrx", "ASRX_TRANSCRIBING")
-        
-        # Transcribe with language detection
-        result = model.transcribe(video_path)
-        
-        if publisher:
-            publisher.info("asrx", f"ASRX_LANGUAGE:{result.get('language', 'unknown')}")
-        
-        # Build output (without diarization for now)
-        segments = []
-        for seg in result.get("segments", []):
-            text = seg.get("text", "").strip()
-            if text:
-                segments.append(
-                    {
-                        "start": seg.get("start", 0.0),
-                        "end": seg.get("end", 0.0),
-                        "text": text,
-                        "speaker_id": None,  # Will be added when diarization is enabled
-                    }
-                )
-        
-        output_result = {
-            "language": result.get("language"),
-            "language_probability": result.get("language_probability", 0),
-            "segments": segments,
-            "diarization_enabled": not skip_diarization
-        }
-        
-        if publisher:
-            publisher.complete("asrx", f"{len(segments)} segments")
-        
-        with open(output_path, "w") as f:
-            json.dump(output_result, f, indent=2, ensure_ascii=False)
-        
-        sys.stderr.write(
-            f"ASRX: Transcription complete, {len(segments)} segments written to {output_path}\n"
-        )
-        sys.stderr.flush()
-        sys.exit(0)
-        
-    except Exception as e:
-        if publisher:
-            publisher.error("asrx", f"Error: {e}")
-        import traceback
-        traceback.print_exc()
-        result = {"language": None, "segments": [], "error": str(e)}
-        if publisher:
-            publisher.complete("asrx", "0 segments (error)")
-        with open(output_path, "w") as f:
-            json.dump(result, f, indent=2)
-        sys.exit(1)
-
-
-if __name__ == "__main__":
-    parser = argparse.ArgumentParser(description="ASRX Speaker Diarization (Simplified)")
-    parser.add_argument("video_path", help="Path to video file")
-    parser.add_argument("output_path", help="Output JSON path")
-    parser.add_argument("--uuid", "-u", help="UUID for Redis progress", default="")
-    parser.add_argument(
-        "--skip-diarization",
-        action="store_true",
-        help="Skip speaker diarization (only transcription)"
-    )
-    args = parser.parse_args()
-
-    process_asrx(
-        args.video_path,
-        args.output_path,
-        args.uuid,
-        args.skip_diarization
-    )
diff --git a/scripts/asrx_processor_v2.py b/scripts/asrx_processor_v2.py
deleted file mode 100755
index 61a4faf..0000000
--- a/scripts/asrx_processor_v2.py
+++ /dev/null
@@ -1,212 +0,0 @@
-#!/opt/homebrew/bin/python3.11
-"""
-ASRX 處理器 v2 - 說話人分離
-使用 whisperx 進行轉錄和說話人分離
-需要 PyTorch 2.5.0 + torchvision 0.20.0 + torchaudio 2.5.0
-"""
-
-# Fix for PyTorch 2.5 compatibility
-import os
-os.environ["TORCH_FORCE_WEIGHTS_ONLY_LOAD"] = "0"
-
-import sys
-import json
-import argparse
-import signal
-import subprocess
-
-sys.path.insert(0, os.path.dirname(os.path.abspath(__file__)))
-from redis_publisher import RedisPublisher
-
-
-def signal_handler(signum, frame):
-    print(f"ASRX: Received signal {signum}, exiting...")
-    sys.exit(1)
-
-
-def has_audio_stream(video_path):
-    """Check if video file has audio stream using ffprobe."""
-    try:
-        cmd = [
-            "ffprobe",
-            "-v",
-            "error",
-            "-select_streams",
-            "a",
-            "-show_entries",
-            "stream=codec_type",
-            "-of",
-            "csv=p=0",
-            video_path,
-        ]
-        result = subprocess.run(cmd, capture_output=True, text=True, check=True)
-        return bool(result.stdout.strip())
-    except subprocess.CalledProcessError:
-        return False
-    except FileNotFoundError:
-        print("WARNING: ffprobe not found, assuming audio exists")
-        return True
-
-
-def process_asrx(video_path: str, output_path: str, uuid: str = "", skip_diarization: bool = False):
-    """
-    Process video for speaker diarization using whisperx
-    
-    Args:
-        video_path: Path to video file
-        output_path: Path to output JSON
-        uuid: UUID for Redis progress
-        skip_diarization: Skip speaker diarization (only transcription)
-    """
-    
-    signal.signal(signal.SIGTERM, signal_handler)
-    signal.signal(signal.SIGINT, signal_handler)
-
-    publisher = RedisPublisher(uuid) if uuid else None
-    if publisher:
-        publisher.info("asrx", "ASRX_START")
-
-    # Check for audio stream
-    if not has_audio_stream(video_path):
-        if publisher:
-            publisher.info("asrx", "No audio stream detected, skipping transcription")
-        output = {"language": "", "language_probability": 0.0, "segments": []}
-        with open(output_path, "w") as f:
-            json.dump(output, f, indent=2)
-        if publisher:
-            publisher.complete("asrx", "0 segments (no audio)")
-        sys.stderr.write("ASRX: No audio stream, skipping transcription\n")
-        sys.stderr.flush()
-        sys.exit(0)
-
-    if publisher:
-        publisher.info("asrx", "ASRX_LOADING_MODEL")
-
-    try:
-        import whisperx
-        import torch
-    except ImportError as e:
-        if publisher:
-            publisher.error("asrx", f"Missing dependency: {e}")
-        result = {"language": None, "segments": [], "error": str(e)}
-        if publisher:
-            publisher.complete("asrx", "0 segments")
-        with open(output_path, "w") as f:
-            json.dump(result, f, indent=2)
-        sys.exit(1)
-
-    try:
-        # Load model
-        if publisher:
-            publisher.info("asrx", "Loading whisperx base model (this may take a while)...")
-        
-        model = whisperx.load_model("base", device="cpu", compute_type="int8")
-        
-        if publisher:
-            publisher.info("asrx", "ASRX_TRANSCRIBING")
-        
-        # Transcribe with language detection
-        result = model.transcribe(video_path)
-        
-        if publisher:
-            publisher.info("asrx", f"ASRX_LANGUAGE:{result.get('language', 'unknown')}")
-        
-        # Align timestamps
-        if publisher:
-            publisher.info("asrx", "ASRX_ALIGNING_TIMESTAMPS")
-        
-        model_a, metadata = whisperx.load_align_model(
-            language_code=result["language"],
-            device="cpu"
-        )
-        result = whisperx.align(
-            result["segments"],
-            model_a,
-            metadata,
-            video_path,
-            device="cpu"
-        )
-        
-        # Diarization (speaker segmentation)
-        if not skip_diarization:
-            if publisher:
-                publisher.info("asrx", "ASRX_DIARIZATION")
-            
-            try:
-                diarize_model = whisperx.DiarizationPipeline(use_auth_token=None)
-                diarize_segments = diarize_model(video_path)
-                
-                # Assign speaker labels
-                result = whisperx.assign_word_speakers(diarize_segments, result)
-                
-                if publisher:
-                    publisher.info("asrx", "Diarization completed")
-            except Exception as e:
-                if publisher:
-                    publisher.info("asrx", f"Diarization skipped: {e}")
-                sys.stderr.write(f"ASRX: Diarization failed: {e}\n")
-        
-        # Build output
-        segments = []
-        for seg in result.get("segments", []):
-            text = seg.get("text", "").strip()
-            if text:
-                segments.append(
-                    {
-                        "start": seg.get("start", 0.0),
-                        "end": seg.get("end", 0.0),
-                        "text": text,
-                        "speaker_id": seg.get("speaker", None),
-                    }
-                )
-        
-        output_result = {
-            "language": result.get("language"),
-            "language_probability": result.get("language_probability", 0),
-            "segments": segments,
-            "diarization_enabled": not skip_diarization
-        }
-        
-        if publisher:
-            publisher.complete("asrx", f"{len(segments)} segments")
-        
-        with open(output_path, "w") as f:
-            json.dump(output_result, f, indent=2, ensure_ascii=False)
-        
-        sys.stderr.write(
-            f"ASRX: Transcription complete, {len(segments)} segments written to {output_path}\n"
-        )
-        sys.stderr.flush()
-        sys.exit(0)
-        
-    except Exception as e:
-        if publisher:
-            publisher.error("asrx", f"Error: {e}")
-        import traceback
-        traceback.print_exc()
-        result = {"language": None, "segments": [], "error": str(e)}
-        if publisher:
-            publisher.complete("asrx", "0 segments (error)")
-        with open(output_path, "w") as f:
-            json.dump(result, f, indent=2)
-        sys.exit(1)
-
-
-if __name__ == "__main__":
-    parser = argparse.ArgumentParser(description="ASRX Speaker Diarization v2")
-    parser.add_argument("video_path", help="Path to video file")
-    parser.add_argument("output_path", help="Output JSON path")
-    parser.add_argument("--uuid", "-u", help="UUID for Redis progress", default="")
-    parser.add_argument(
-        "--skip-diarization",
-        action="store_true",
-        help="Skip speaker diarization (only transcription)"
-    )
-    args = parser.parse_args()
-
-    process_asrx(
-        args.video_path,
-        args.output_path,
-        args.uuid,
-        args.skip_diarization
-    )
diff --git a/scripts/asrx_processor_v2_noalign.py b/scripts/asrx_processor_v2_noalign.py
deleted file mode 100755
index 85c9664..0000000
--- a/scripts/asrx_processor_v2_noalign.py
+++ /dev/null
@@ -1,184 +0,0 @@
-#!/opt/homebrew/bin/python3.11
-"""
-ASRX 處理器 v2 - 快速版（跳過對齊）
-使用 whisperx 進行轉錄和說話人分離
-跳過時間戳對齊以避開 PyTorch 版本問題
-"""
-
-import os
-os.environ["TORCH_FORCE_WEIGHTS_ONLY_LOAD"] = "0"
-
-import sys
-import json
-import argparse
-import signal
-import subprocess
-
-sys.path.insert(0, os.path.dirname(os.path.abspath(__file__)))
-from redis_publisher import RedisPublisher
-
-
-def signal_handler(signum, frame):
-    print(f"ASRX: Received signal {signum}, exiting...")
-    sys.exit(1)
-
-
-def has_audio_stream(video_path):
-    """Check if video file has audio stream using ffprobe."""
-    try:
-        cmd = [
-            "ffprobe",
-            "-v",
-            "error",
-            "-select_streams",
-            "a",
-            "-show_entries",
-            "stream=codec_type",
-            "-of",
-            "csv=p=0",
-            video_path,
-        ]
-        result = subprocess.run(cmd, capture_output=True, text=True, check=True)
-        return bool(result.stdout.strip())
-    except subprocess.CalledProcessError:
-        return False
-    except FileNotFoundError:
-        print("WARNING: ffprobe not found, assuming audio exists")
-        return True
-
-
-def process_asrx(video_path: str, output_path: str, uuid: str = ""):
-    """
-    Process video for speaker diarization using whisperx (no alignment)
-    
-    Args:
-        video_path: Path to video file
-        output_path: Path to output JSON
-        uuid: UUID for Redis progress
-    """
-    
-    signal.signal(signal.SIGTERM, signal_handler)
-    signal.signal(signal.SIGINT, signal_handler)
-
-    publisher = RedisPublisher(uuid) if uuid else None
-    if publisher:
-        publisher.info("asrx", "ASRX_START")
-
-    # Check for audio stream
-    if not has_audio_stream(video_path):
-        if publisher:
-            publisher.info("asrx", "No audio stream detected")
-        output = {"language": "", "language_probability": 0.0, "segments": []}
-        with open(output_path, "w") as f:
-            json.dump(output, f, indent=2)
-        if publisher:
-            publisher.complete("asrx", "0 segments (no audio)")
-        sys.exit(0)
-
-    if publisher:
-        publisher.info("asrx", "ASRX_LOADING_MODEL")
-
-    try:
-        import whisperx
-        import torch
-    except ImportError as e:
-        if publisher:
-            publisher.error("asrx", f"Missing dependency: {e}")
-        result = {"language": None, "segments": [], "error": str(e)}
-        if publisher:
-            publisher.complete("asrx", "0 segments")
-        with open(output_path, "w") as f:
-            json.dump(result, f, indent=2)
-        sys.exit(1)
-
-    try:
-        # Load model
-        if publisher:
-            publisher.info("asrx", "Loading whisperx base model...")
-        
-        model = whisperx.load_model("base", device="cpu", compute_type="int8")
-        
-        if publisher:
-            publisher.info("asrx", "ASRX_TRANSCRIBING")
-        
-        # Transcribe with language detection
-        result = model.transcribe(video_path)
-        
-        if publisher:
-            publisher.info("asrx", f"ASRX_LANGUAGE:{result.get('language', 'unknown')}")
-        
-        # Skip alignment (requires PyTorch 2.6+)
-        # Go directly to diarization
-        if publisher:
-            publisher.info("asrx", "ASRX_DIARIZATION")
-        
-        try:
-            diarize_model = whisperx.DiarizationPipeline(use_auth_token=None)
-            diarize_segments = diarize_model(video_path)
-            
-            # Assign speaker labels
-            result = whisperx.assign_word_speakers(diarize_segments, result)
-            
-            if publisher:
-                publisher.info("asrx", "Diarization completed")
-        except Exception as e:
-            if publisher:
-                publisher.info("asrx", f"Diarization info: {e}")
-            sys.stderr.write(f"ASRX: Diarization note: {e}\n")
-        
-        # Build output
-        segments = []
-        for seg in result.get("segments", []):
-            text = seg.get("text", "").strip()
-            if text:
-                segments.append(
-                    {
-                        "start": seg.get("start", 0.0),
-                        "end": seg.get("end", 0.0),
-                        "text": text,
-                        "speaker_id": seg.get("speaker", None),
-                    }
-                )
-        
-        output_result = {
-            "language": result.get("language"),
-            "language_probability": result.get("language_probability", 0),
-            "segments": segments,
-            "diarization_enabled": True,
-            "alignment_enabled": False,
-            "note": "Alignment skipped due to PyTorch version compatibility"
-        }
-        
-        if publisher:
-            publisher.complete("asrx", f"{len(segments)} segments")
-        
-        with open(output_path, "w") as f:
-            json.dump(output_result, f, indent=2, ensure_ascii=False)
-        
-        sys.stderr.write(
-            f"ASRX: Transcription complete, {len(segments)} segments written to {output_path}\n"
-        )
-        sys.stderr.flush()
-        sys.exit(0)
-        
-    except Exception as e:
-        if publisher:
-            publisher.error("asrx", f"Error: {e}")
-        import traceback
-        traceback.print_exc()
-        result = {"language": None, "segments": [], "error": str(e)}
-        if publisher:
-            publisher.complete("asrx", "0 segments (error)")
-        with open(output_path, "w") as f:
-            json.dump(result, f, indent=2)
-        sys.exit(1)
-
-
-if __name__ == "__main__":
-    parser = argparse.ArgumentParser(description="ASRX Speaker Diarization v2 (No Alignment)")
-    parser.add_argument("video_path", help="Path to video file")
-    parser.add_argument("output_path", help="Output JSON path")
-    parser.add_argument("--uuid", "-u", help="UUID for Redis progress", default="")
-    args = parser.parse_args()
-
-    process_asrx(args.video_path, args.output_path, args.uuid)
diff --git a/scripts/asrx_processor_v2_transcribe.py b/scripts/asrx_processor_v2_transcribe.py
deleted file mode 100755
index a6e92d7..0000000
--- a/scripts/asrx_processor_v2_transcribe.py
+++ /dev/null
@@ -1,165 +0,0 @@
-#!/opt/homebrew/bin/python3.11
-"""
-ASRX 處理器 v2 - 轉錄版
-使用 whisperx 進行轉錄（不含說話人分離）
-說話人分離需要額外安裝 pyannote.audio 並配置 HuggingFace token
-"""
-
-import os
-os.environ["TORCH_FORCE_WEIGHTS_ONLY_LOAD"] = "0"
-
-import sys
-import json
-import argparse
-import signal
-import subprocess
-
-sys.path.insert(0, os.path.dirname(os.path.abspath(__file__)))
-from redis_publisher import RedisPublisher
-
-
-def signal_handler(signum, frame):
-    print(f"ASRX: Received signal {signum}, exiting...")
-    sys.exit(1)
-
-
-def has_audio_stream(video_path):
-    """Check if video file has audio stream using ffprobe."""
-    try:
-        cmd = [
-            "ffprobe",
-            "-v",
-            "error",
-            "-select_streams",
-            "a",
-            "-show_entries",
-            "stream=codec_type",
-            "-of",
-            "csv=p=0",
-            video_path,
-        ]
-        result = subprocess.run(cmd, capture_output=True, text=True, check=True)
-        return bool(result.stdout.strip())
-    except subprocess.CalledProcessError:
-        return False
-    except FileNotFoundError:
-        print("WARNING: ffprobe not found, assuming audio exists")
-        return True
-
-
-def process_asrx(video_path: str, output_path: str, uuid: str = ""):
-    """
-    Process video for transcription using whisperx
-    
-    Args:
-        video_path: Path to video file
-        output_path: Path to output JSON
-        uuid: UUID for Redis progress
-    """
-    
-    signal.signal(signal.SIGTERM, signal_handler)
-    signal.signal(signal.SIGINT, signal_handler)
-
-    publisher = RedisPublisher(uuid) if uuid else None
-    if publisher:
-        publisher.info("asrx", "ASRX_START")
-
-    # Check for audio stream
-    if not has_audio_stream(video_path):
-        if publisher:
-            publisher.info("asrx", "No audio stream detected")
-        output = {"language": "", "language_probability": 0.0, "segments": []}
-        with open(output_path, "w") as f:
-            json.dump(output, f, indent=2)
-        if publisher:
-            publisher.complete("asrx", "0 segments (no audio)")
-        sys.exit(0)
-
-    if publisher:
-        publisher.info("asrx", "ASRX_LOADING_MODEL")
-
-    try:
-        import whisperx
-        import torch
-    except ImportError as e:
-        if publisher:
-            publisher.error("asrx", f"Missing dependency: {e}")
-        result = {"language": None, "segments": [], "error": str(e)}
-        if publisher:
-            publisher.complete("asrx", "0 segments")
-        with open(output_path, "w") as f:
-            json.dump(result, f, indent=2)
-        sys.exit(1)
-
-    try:
-        # Load model
-        if publisher:
-            publisher.info("asrx", "Loading whisperx base model...")
-        
-        model = whisperx.load_model("base", device="cpu", compute_type="int8")
-        
-        if publisher:
-            publisher.info("asrx", "ASRX_TRANSCRIBING")
-        
-        # Transcribe with language detection
-        result = model.transcribe(video_path)
-        
-        if publisher:
-            publisher.info("asrx", f"ASRX_LANGUAGE:{result.get('language', 'unknown')}")
-        
-        # Build output (without alignment and diarization due to PyTorch version)
-        segments = []
-        for seg in result.get("segments", []):
-            text = seg.get("text", "").strip()
-            if text:
-                segments.append(
-                    {
-                        "start": seg.get("start", 0.0),
-                        "end": seg.get("end", 0.0),
-                        "text": text,
-                        "speaker_id": None,  # Requires pyannote.audio + HuggingFace token
-                    }
-                )
-        
-        output_result = {
-            "language": result.get("language"),
-            "language_probability": result.get("language_probability", 0),
-            "segments": segments,
-            "diarization_enabled": False,
-            "alignment_enabled": False,
-            "note": "PyTorch 2.5.0 compatibility - alignment and diarization require additional setup"
-        }
-        
-        if publisher:
-            publisher.complete("asrx", f"{len(segments)} segments")
-        
-        with open(output_path, "w") as f:
-            json.dump(output_result, f, indent=2, ensure_ascii=False)
-        
-        sys.stderr.write(
-            f"ASRX: Transcription complete, {len(segments)} segments written to {output_path}\n"
-        )
-        sys.stderr.flush()
-        sys.exit(0)
-        
-    except Exception as e:
-        if publisher:
-            publisher.error("asrx", f"Error: {e}")
-        import traceback
-        traceback.print_exc()
-        result = {"language": None, "segments": [], "error": str(e)}
-        if publisher:
-            publisher.complete("asrx", "0 segments (error)")
-        with open(output_path, "w") as f:
-            json.dump(result, f, indent=2)
-        sys.exit(1)
-
-
-if __name__ == "__main__":
-    parser = argparse.ArgumentParser(description="ASRX Transcription (PyTorch 2.5.0)")
-    parser.add_argument("video_path", help="Path to video file")
-    parser.add_argument("output_path", help="Output JSON path")
-    parser.add_argument("--uuid", "-u", help="UUID for Redis progress", default="")
-    args = parser.parse_args()
-
-    process_asrx(args.video_path, args.output_path, args.uuid)
diff --git a/scripts/asrx_self/integrate_face_asrx_speaker.py b/scripts/asrx_self/integrate_face_asrx_speaker.py
deleted file mode 100755
index bc4141a..0000000
--- a/scripts/asrx_self/integrate_face_asrx_speaker.py
+++ /dev/null
@@ -1,178 +0,0 @@
-#!/opt/homebrew/bin/python3.11
-"""
-整合 Face + ASRX 說話人分離（版本 3 - 修復 face_detected 檢查）
-"""
-
-import json
-import argparse
-from pathlib import Path
-from typing import Dict, List
-
-
-def load_json(path: str):
-    """載入 JSON 文件"""
-    with open(path, 'r', encoding='utf-8') as f:
-        return json.load(f)
-
-
-def match_face_with_speaker_v3(face_data: Dict, asrx_data: Dict, 
-                                time_threshold: float = 3.0) -> List[Dict]:
-    """
-    匹配人臉與說話人（版本 3 - 修復版）
-    
-    修復：Face 數據沒有 face_detected 欄位，改用 faces 列表是否為空判斷
-    """
-    face_frames = face_data.get('frames', [])
-    asrx_segments = asrx_data.get('segments', [])
-    
-    # 將 Face 幀按時間排序
-    face_frames_sorted = sorted(face_frames, key=lambda x: x.get('timestamp', 0))
-    
-    print(f"  Face frames: {len(face_frames_sorted)}")
-    print(f"  ASRX segments: {len(asrx_segments)}")
-    
-    # 匹配
-    integrated = []
-    
-    for i, seg in enumerate(asrx_segments):
-        start = seg['start']
-        end = seg['end']
-        speaker = seg['speaker']
-        mid_time = (start + end) / 2
-        
-        # 找到時間範圍內的人臉
-        faces_in_range = []
-        for frame in face_frames_sorted:
-            ts = frame.get('timestamp', 0)
-            
-            # 檢查是否在時間範圍內
-            if start - time_threshold <= ts <= end + time_threshold:
-                # 檢查是否有人臉（faces 列表不為空）
-                faces = frame.get('faces', [])
-                if faces and len(faces) > 0:
-                    faces_in_range.append({
-                        'timestamp': ts,
-                        'faces': faces,
-                        'distance_from_mid': abs(ts - mid_time)
-                    })
-        
-        # 選擇最接近片段中間的人臉
-        if faces_in_range:
-            faces_in_range.sort(key=lambda x: x['distance_from_mid'])
-            best_face = faces_in_range[0]
-        else:
-            best_face = None
-        
-        # 建立整合結果
-        integrated.append({
-            'start': start,
-            'end': end,
-            'duration': seg.get('duration', end - start),
-            'speaker': speaker,
-            'has_face': best_face is not None,
-            'face_timestamp': best_face['timestamp'] if best_face else None,
-            'face_location': best_face['faces'][0] if best_face and best_face['faces'] else None,
-            'face_count_in_range': len(faces_in_range)
-        })
-        
-        # 進度顯示
-        if (i + 1) % 200 == 0:
-            print(f"  Processed {i+1}/{len(asrx_segments)} segments...")
-    
-    return integrated
-
-
-def analyze_speaker_face(integrated: List[Dict]):
-    """分析說話人與人臉的對應"""
-    speaker_stats = {}
-    
-    for item in integrated:
-        speaker = item['speaker']
-        if speaker not in speaker_stats:
-            speaker_stats[speaker] = {
-                'total_segments': 0,
-                'with_face': 0,
-                'without_face': 0,
-                'total_duration': 0
-            }
-        
-        speaker_stats[speaker]['total_segments'] += 1
-        speaker_stats[speaker]['total_duration'] += item['duration']
-        
-        if item['has_face']:
-            speaker_stats[speaker]['with_face'] += 1
-        else:
-            speaker_stats[speaker]['without_face'] += 1
-    
-    return speaker_stats
-
-
-def main():
-    parser = argparse.ArgumentParser(description='整合 Face + ASRX 說話人')
-    parser.add_argument('face_json', help='Face 檢測結果 JSON')
-    parser.add_argument('asrx_json', help='ASRX 說話人分離 JSON')
-    parser.add_argument('-o', '--output', help='輸出整合結果 JSON')
-    parser.add_argument('--threshold', type=float, default=3.0,
-                        help='時間閾值（秒）')
-    parser.add_argument('--stats', action='store_true', help='只显示統計')
-    
-    args = parser.parse_args()
-    
-    # 載入數據
-    print(f"[Load] Face: {args.face_json}")
-    face_data = load_json(args.face_json)
-    
-    print(f"[Load] ASRX: {args.asrx_json}")
-    asrx_data = load_json(args.asrx_json)
-    
-    # 匹配
-    print(f"\n[Match] Matching faces with speakers (threshold={args.threshold}s)...")
-    integrated = match_face_with_speaker_v3(face_data, asrx_data, args.threshold)
-    
-    # 分析
-    print("\n[Analyze] Analyzing speaker-face correspondence...")
-    speaker_stats = analyze_speaker_face(integrated)
-    
-    # 顯示統計
-    print(f"\n{'='*70}")
-    print("說話人 - 人臉對應統計")
-    print(f"{'='*70}")
-    
-    total_segments = len(integrated)
-    total_with_face = sum(1 for item in integrated if item['has_face'])
-    
-    for speaker, stats in sorted(speaker_stats.items()):
-        with_face_pct = stats['with_face'] / stats['total_segments'] * 100 if stats['total_segments'] > 0 else 0
-        print(f"\n🔊 {speaker}:")
-        print(f"  總片段：{stats['total_segments']}")
-        print(f"  有人臉：{stats['with_face']} ({with_face_pct:.1f}%)")
-        print(f"  無人臉：{stats['without_face']}")
-        print(f"  總時長：{stats['total_duration']:.1f}s ({stats['total_duration']/60:.1f}分鐘)")
-    
-    print(f"\n{'='*70}")
-    print(f"總計：{total_segments} 片段，{total_with_face} 片段有人臉 ({total_with_face/total_segments*100:.1f}%)")
-    print(f"{'='*70}")
-    
-    # 保存結果
-    if args.output:
-        output_path = Path(args.output)
-        output_path.parent.mkdir(parents=True, exist_ok=True)
-        
-        result = {
-            'face_source': str(args.face_json),
-            'asrx_source': str(args.asrx_json),
-            'time_threshold': args.threshold,
-            'integrated_segments': integrated,
-            'speaker_stats': speaker_stats
-        }
-        
-        with open(output_path, 'w', encoding='utf-8') as f:
-            json.dump(result, f, indent=2, ensure_ascii=False)
-        
-        print(f"\n[Save] Results saved to: {output_path}")
-    
-    return integrated, speaker_stats
-
-
-if __name__ == "__main__":
-    main()
diff --git a/scripts/asrx_self/main.py b/scripts/asrx_self/main.py
deleted file mode 100644
index e26a419..0000000
--- a/scripts/asrx_self/main.py
+++ /dev/null
@@ -1,268 +0,0 @@
-#!/opt/homebrew/bin/python3.11
-"""
-Self-implemented ASRX - 自實作說話人分離系統
-基於聲紋嵌入 + 譜聚類
-
-技術架構:
-1. VAD (Silero VAD) - 語音活動檢測
-2. Speaker Encoder (ECAPA-TDNN) - 聲紋特徵提取
-3. Spectral Clustering - 譜聚類
-4. Post-processing - 後處理
-
-流程:
-音頻 → VAD → 語音片段 → 聲紋嵌入 → 相似度矩陣 → 譜聚類 → 說話人 ID
-"""
-
-import sys
-import json
-import time
-from pathlib import Path
-
-# 導入自定義模組
-from vad import load_vad_model, extract_speech_segments
-from speaker_encoder import (
-    load_speaker_encoder,
-    extract_speaker_embeddings_batch,
-    compute_similarity_matrix,
-    normalize_embeddings,
-)
-from speaker_cluster import spectral_clustering_speaker, smooth_speaker_labels
-
-
-class SelfASRX:
-    """
-    自實作說話人分離系統
-    """
-
-    def __init__(self):
-        """初始化模型"""
-        print("[SelfASRX] Initializing models...")
-
-        # 載入 VAD 模型
-        print("[SelfASRX] Loading VAD model (Silero)...")
-        self.vad_model, self.vad_utils = load_vad_model()
-
-        # 載入聲紋模型
-        print("[SelfASRX] Loading speaker encoder (ECAPA-TDNN)...")
-        self.speaker_encoder = load_speaker_encoder()
-
-        print("[SelfASRX] Models loaded successfully")
-
-    def process(
-        self,
-        audio_path,
-        output_path=None,
-        min_speech_duration_ms=500,
-        n_speakers=None,
-        smooth_window=5,
-    ):
-        """
-        處理音頻文件進行說話人分離
-
-        Args:
-            audio_path: 音頻文件路徑
-            output_path: 輸出 JSON 路徑（可選）
-            min_speech_duration_ms: 最小語音持續時間
-            n_speakers: 說話人數量（None=自動估計）
-            smooth_window: 平滑窗口大小
-
-        Returns:
-            result: 說話人分離結果
-        """
-        start_time = time.time()
-        print(f"\n[SelfASRX] Processing: {audio_path}")
-        print("=" * 60)
-
-        # 步驟 1: VAD - 語音活動檢測
-        print("\n[Step 1] Voice Activity Detection...")
-        step1_start = time.time()
-
-        speech_segments, wav, sample_rate = extract_speech_segments(
-            audio_path,
-            self.vad_model,
-            self.vad_utils,
-            min_speech_duration_ms=min_speech_duration_ms,
-        )
-
-        step1_time = time.time() - step1_start
-        print(f"  Speech segments: {len(speech_segments)}")
-        print(f"  Total duration: {len(wav) / sample_rate:.2f}s")
-        print(f"  VAD time: {step1_time:.2f}s")
-
-        if len(speech_segments) == 0:
-            print("[SelfASRX] No speech detected!")
-            return {"error": "No speech detected", "segments": []}
-
-        # 步驟 2: 聲紋特徵提取
-        print("\n[Step 2] Speaker embedding extraction...")
-        step2_start = time.time()
-
-        # 提取語音片段音頻
-        audio_segments = []
-        for start_sec, end_sec in speech_segments:
-            start_sample = int(start_sec * sample_rate)
-            end_sample = int(end_sec * sample_rate)
-            audio_segments.append(wav[start_sample:end_sample])
-
-        # 批量提取嵌入
-        embeddings = extract_speaker_embeddings_batch(
-            self.speaker_encoder, audio_segments, sample_rate
-        )
-
-        # 正規化
-        embeddings = normalize_embeddings(embeddings)
-
-        step2_time = time.time() - step2_start
-        print(f"  Embedding shape: {embeddings.shape}")
-        print(f"  Embedding time: {step2_time:.2f}s")
-
-        # 步驟 3: 計算相似度矩陣
-        print("\n[Step 3] Computing similarity matrix...")
-        step3_start = time.time()
-
-        similarity_matrix = compute_similarity_matrix(embeddings, method="cosine")
-
-        step3_time = time.time() - step3_start
-        print(f"  Similarity matrix shape: {similarity_matrix.shape}")
-        print(f"  Similarity time: {step3_time:.2f}s")
-
-        # 步驟 4: 譜聚類
-        print("\n[Step 4] Spectral clustering...")
-        step4_start = time.time()
-
-        speaker_labels, estimated_n_speakers = spectral_clustering_speaker(
-            similarity_matrix, n_speakers=n_speakers, auto_estimate=(n_speakers is None)
-        )
-
-        # 平滑標籤
-        if smooth_window > 1:
-            speaker_labels = smooth_speaker_labels(
-                speaker_labels, window_size=smooth_window
-            )
-
-        step4_time = time.time() - step4_start
-        print(f"  Estimated speakers: {estimated_n_speakers}")
-        print(f"  Clustering time: {step4_time:.2f}s")
-
-        # 步驟 5: 建立輸出結果
-        print("\n[Step 5] Building output...")
-
-        result = {
-            "audio_path": str(audio_path),
-            "total_duration": len(wav) / sample_rate,
-            "n_speech_segments": len(speech_segments),
-            "n_speakers": int(estimated_n_speakers),
-            "segments": [],
-        }
-
-        for i, ((start, end), label) in enumerate(zip(speech_segments, speaker_labels)):
-            result["segments"].append(
-                {
-                    "index": i,
-                    "start": round(start, 3),
-                    "end": round(end, 3),
-                    "duration": round(end - start, 3),
-                    "speaker": f"SPEAKER_{int(label)}",
-                }
-            )
-
-        # 統計每個說話人的總時長
-        speaker_stats = {}
-        for seg in result["segments"]:
-            speaker = seg["speaker"]
-            if speaker not in speaker_stats:
-                speaker_stats[speaker] = {"count": 0, "duration": 0}
-            speaker_stats[speaker]["count"] += 1
-            speaker_stats[speaker]["duration"] += seg["duration"]
-
-        result["speaker_stats"] = speaker_stats
-
-        total_time = time.time() - start_time
-        result["processing_time"] = round(total_time, 2)
-        result["realtime_factor"] = round(result["total_duration"] / total_time, 2)
-
-        print("\n[SelfASRX] Processing completed!")
-        print(f"  Total time: {total_time:.2f}s")
-        print(f"  Realtime factor: {result['realtime_factor']:.2f}x")
-        print(f"  Detected speakers: {estimated_n_speakers}")
-
-        # 保存結果
-        if output_path:
-            output_path = Path(output_path)
-            output_path.parent.mkdir(parents=True, exist_ok=True)
-
-            with open(output_path, "w", encoding="utf-8") as f:
-                json.dump(result, f, indent=2, ensure_ascii=False)
-
-            print(f"  Results saved to: {output_path}")
-
-        print("=" * 60)
-
-        return result
-
-
-def main():
-    """主函數"""
-    import argparse
-
-    parser = argparse.ArgumentParser(
-        description="Self-implemented ASRX - Speaker Diarization"
-    )
-    parser.add_argument("audio_path", help="Path to audio file")
-    parser.add_argument("-o", "--output", help="Output JSON path")
-    parser.add_argument(
-        "--min-speech-duration",
-        type=int,
-        default=500,
-        help="Minimum speech duration in ms (default: 500)",
-    )
-    parser.add_argument(
-        "--n-speakers",
-        type=int,
-        default=None,
-        help="Number of speakers (default: auto-estimate)",
-    )
-    parser.add_argument(
-        "--smooth-window",
-        type=int,
-        default=5,
-        help="Smoothing window size (default: 5)",
-    )
-
-    args = parser.parse_args()
-
-    # 檢查文件是否存在
-    if not Path(args.audio_path).exists():
-        print(f"Error: Audio file not found: {args.audio_path}")
-        sys.exit(1)
-
-    # 創建 ASRX 實例並處理
-    asrx = SelfASRX()
-    result = asrx.process(
-        args.audio_path,
-        args.output,
-        min_speech_duration_ms=args.min_speech_duration,
-        n_speakers=args.n_speakers,
-        smooth_window=args.smooth_window,
-    )
-
-    # 顯示結果摘要
-    if "error" not in result:
-        print("\n[Summary]")
-        print(f"  Audio duration: {result['total_duration']:.2f}s")
-        print(f"  Speech segments: {result['n_speech_segments']}")
-        print(f"  Detected speakers: {result['n_speakers']}")
-        print(f"  Processing time: {result['processing_time']:.2f}s")
-        print(f"  Realtime factor: {result['realtime_factor']:.2f}x")
-
-        print("\n[Speaker Statistics]")
-        for speaker, stats in result["speaker_stats"].items():
-            pct = stats["duration"] / result["total_duration"] * 100
-            print(
-                f"  {speaker}: {stats['count']} segments, "
-                + f"{stats['duration']:.2f}s ({pct:.1f}%)"
-            )
-
-
-if __name__ == "__main__":
-    main()
diff --git a/scripts/asrx_self/main_fixed.py b/scripts/asrx_self/main_fixed.py
index 34b498f..4def1a3 100755
--- a/scripts/asrx_self/main_fixed.py
+++ b/scripts/asrx_self/main_fixed.py
@@ -1,308 +1,728 @@
-#!/opt/homebrew/bin/python3.11
 """
-Self-implemented ASRX - Fixed Version
-使用魯棒的聚類算法
+SelfASRXFixed - 7 步 Hybrid Speaker Diarization Pipeline
+
+Pipeline:
+  1. whisper.transcribe(full_audio) → rough segments + text + language
+  2. VAD scan each rough segment → refined segments
+  3. whisper per refined segment → {text, language, lang_prob}
+  4. ECAPA-TDNN per refined segment → 192-dim embeddings
+  5. AgglomerativeClustering → speaker_labels
+  6. Store all embeddings in Qdrant (payload: file_uuid, speaker_id, text, ...)
+  7. High-quality embeddings → gender classify + store reference in Qdrant
 """
 
 import sys
 import json
 import time
+import os
 import numpy as np
 from pathlib import Path
+from urllib.request import Request, urlopen
+from urllib.error import URLError
 
-# 導入自定義模組
-from vad import load_vad_model, extract_speech_segments
-from speaker_encoder import (
-    load_speaker_encoder, 
-    extract_speaker_embeddings_batch,
-    normalize_embeddings
-)
-from speaker_cluster_fixed import robust_speaker_clustering
+
+def _load_audio(path):
+    """載入音頻文件，回傳 (wav_numpy, sample_rate)"""
+    import soundfile as sf
+    wav, sr = sf.read(path)
+    if len(wav.shape) > 1:
+        wav = np.mean(wav, axis=1)
+    return wav, sr
+
+
+def _load_whisper_model(size="small"):
+    from whisper_local import load_model
+    return load_model(size)
+
+
+def _load_vad():
+    from vad import load_vad_model
+    return load_vad_model()
+
+
+def _load_speaker_encoder():
+    from speaker_encoder import load_speaker_encoder
+    return load_speaker_encoder()
+
+
+def _load_gender_classifier():
+    try:
+        from speechbrain.inference.classifiers import EncoderClassifier
+        classifier = EncoderClassifier.from_hparams(
+            source="speechbrain/gender-recognition-ecapa",
+            run_opts={"device": "cpu"},
+        )
+        print("[Gender] Classifier loaded: speechbrain/gender-recognition-ecapa")
+        return classifier
+    except Exception as e:
+        print(f"[Gender] Classifier not available: {e}")
+        return None
+
+
+def _ensure_speaker_collection(qdrant_url, api_key, collection):
+    """確認 Qdrant speaker collection 存在，不存在則建立 (dim=192, cosine)"""
+    try:
+        url = f"{qdrant_url}/collections/{collection}"
+        req = Request(url, method="GET",
+                      headers={"api-key": api_key} if api_key else {})
+        try:
+            urlopen(req)
+            return True
+        except URLError as e:
+            if getattr(e, "code", None) == 404:
+                body = json.dumps({
+                    "vectors": {
+                        "size": 192,
+                        "distance": "Cosine"
+                    }
+                }).encode()
+                req = Request(url, data=body, method="PUT",
+                              headers={"Content-Type": "application/json",
+                                       **({"api-key": api_key} if api_key else {})})
+                urlopen(req)
+                print(f"[Qdrant] Created collection: {collection} (dim=192)")
+                return True
+            raise
+    except Exception as e:
+        print(f"[Qdrant] Cannot access Qdrant: {e}")
+        return False
+
+
+def _qdrant_upsert(qdrant_url, api_key, collection, points):
+    """批量寫入 Qdrant points"""
+    try:
+        url = f"{qdrant_url}/collections/{collection}/points?wait=true"
+        body = json.dumps({"points": points}).encode()
+        headers = {"Content-Type": "application/json"}
+        if api_key:
+            headers["api-key"] = api_key
+        req = Request(url, data=body, headers=headers, method="PUT")
+        urlopen(req)
+        return True
+    except Exception as e:
+        print(f"[Qdrant] Upsert failed: {e}")
+        return False
+
+
+def _hash_point_id(file_uuid, label):
+    """產生一致的 point ID"""
+    s = f"{file_uuid}_{label}"
+    return hash(s) & 0x7FFFFFFFFFFFFFFF
+
+
+def _save_checkpoint(path: str, data: dict):
+    """原子寫入 checkpoint（先 .tmp 再 rename）"""
+    tmp = path + ".tmp"
+    Path(tmp).parent.mkdir(parents=True, exist_ok=True)
+    with open(tmp, "w", encoding="utf-8") as f:
+        json.dump(data, f, indent=2, ensure_ascii=False)
+    os.replace(tmp, path)
+
+
+def compute_embedding_quality(embeddings, labels):
+    """每個 embedding 到所屬 cluster centroid 的餘弦相似度"""
+    from sklearn.metrics.pairwise import cosine_similarity
+    unique_labels = set(labels)
+    centroids = {}
+    for label in unique_labels:
+        mask = labels == label
+        centroid = np.mean(embeddings[mask], axis=0)
+        norm = np.linalg.norm(centroid)
+        if norm > 0:
+            centroid = centroid / norm
+        centroids[label] = centroid
+    qualities = []
+    for emb, label in zip(embeddings, labels):
+        sim = cosine_similarity([emb], [centroids[label]])[0][0]
+        qualities.append(sim)
+    return np.array(qualities)
 
 
 class SelfASRXFixed:
-    """自實作說話人分離系統（修復版）"""
-    
+    """7 步 Hybrid Speaker Diarization Pipeline"""
+
     def __init__(self):
-        print("[SelfASRX-Fixed] Initializing models...")
-        
-        # 載入 VAD 模型
-        print("[SelfASRX-Fixed] Loading VAD model (Silero)...")
-        self.vad_model, self.vad_utils = load_vad_model()
-        
-        # 載入聲紋模型
-        print("[SelfASRX-Fixed] Loading speaker encoder (ECAPA-TDNN)...")
-        self.speaker_encoder = load_speaker_encoder()
-        
-        print("[SelfASRX-Fixed] Models loaded successfully")
-    
-    def process(self, audio_path, output_path=None, 
-                min_speech_duration_ms=500,
-                n_speakers=None,
-                max_speakers=10):
-        """處理音頻文件"""
-        start_time = time.time()
-        print(f"\n[SelfASRX-Fixed] Processing: {audio_path}")
-        print("=" * 60)
-        
-        # 步驟 1: VAD
-        print("\n[Step 1] Voice Activity Detection...")
-        step1_start = time.time()
-        
-        speech_segments, wav, sample_rate = extract_speech_segments(
-            audio_path, self.vad_model, self.vad_utils,
-            min_speech_duration_ms=min_speech_duration_ms
-        )
-        
-        step1_time = time.time() - step1_start
-        print(f"  Speech segments: {len(speech_segments)}")
-        print(f"  Total duration: {len(wav)/sample_rate:.2f}s")
-        print(f"  VAD time: {step1_time:.2f}s")
-        
-        if len(speech_segments) == 0:
-            print("[SelfASRX-Fixed] No speech detected!")
-            return {"error": "No speech detected", "segments": []}
-        
-        # 步驟 2: 聲紋特徵提取
-        print("\n[Step 2] Speaker embedding extraction...")
-        step2_start = time.time()
-        
-        # 提取語音片段音頻
-        audio_segments = []
-        for start_sec, end_sec in speech_segments:
-            start_sample = int(start_sec * sample_rate)
-            end_sample = int(end_sec * sample_rate)
-            audio_segments.append(wav[start_sample:end_sample])
-        
-        # 批量提取嵌入
-        embeddings = extract_speaker_embeddings_batch(
-            self.speaker_encoder, audio_segments, sample_rate
-        )
-        
-        # 正規化
-        embeddings = normalize_embeddings(embeddings)
-        
-        step2_time = time.time() - step2_start
-        print(f"  Embedding shape: {embeddings.shape}")
-        print(f"  Embedding time: {step2_time:.2f}s")
-        
-        # 步驟 3: 魯棒聚類
-        print("\n[Step 3] Robust speaker clustering...")
-        step3_start = time.time()
-        
-        speaker_labels, estimated_n_speakers = robust_speaker_clustering(
-            embeddings,
-            n_speakers=n_speakers,
-            max_speakers=max_speakers
-        )
-        
-        step3_time = time.time() - step3_start
-        print(f"  Clustering time: {step3_time:.2f}s")
-        
-        # 步驟 4: 建立輸出
-        print("\n[Step 4] Building output...")
-        
-        result = {
-            "audio_path": str(audio_path),
-            "total_duration": len(wav) / sample_rate,
-            "n_speech_segments": len(speech_segments),
-            "n_speakers": int(estimated_n_speakers),
-            "segments": []
-        }
-        
-        for i, ((start, end), label) in enumerate(zip(speech_segments, speaker_labels)):
-            result["segments"].append({
-                "index": i,
-                "start": round(start, 3),
-                "end": round(end, 3),
-                "duration": round(end - start, 3),
-                "speaker": f"SPEAKER_{int(label)}"
-            })
-        
-        # 統計每個說話人的總時長
-        speaker_stats = {}
-        for seg in result["segments"]:
-            speaker = seg["speaker"]
-            if speaker not in speaker_stats:
-                speaker_stats[speaker] = {"count": 0, "duration": 0}
-            speaker_stats[speaker]["count"] += 1
-            speaker_stats[speaker]["duration"] += seg["duration"]
-        
-        result["speaker_stats"] = speaker_stats
-        
-        total_time = time.time() - start_time
-        result["processing_time"] = round(total_time, 2)
-        result["realtime_factor"] = round(result["total_duration"] / total_time, 2)
-        
-        print("\n[SelfASRX-Fixed] Processing completed!")
-        print(f"  Total time: {total_time:.2f}s")
-        print(f"  Realtime factor: {result['realtime_factor']:.2f}x")
-        print(f"  Detected speakers: {estimated_n_speakers}")
-        
-        # 保存結果
-        if output_path:
-            output_path = Path(output_path)
-            output_path.parent.mkdir(parents=True, exist_ok=True)
-            
-            with open(output_path, 'w', encoding='utf-8') as f:
-                json.dump(result, f, indent=2, ensure_ascii=False)
-            
-            print(f"  Results saved to: {output_path}")
-        
-        print("=" * 60)
-        
-        return result
+        print("[SelfASRX] Initializing models...")
 
+        print("[SelfASRX] Loading whisper model...")
+        self.whisper = _load_whisper_model("small")
+
+        print("[SelfASRX] Loading VAD model (Silero)...")
+        self.vad_model, self.vad_utils = _load_vad()
+
+        print("[SelfASRX] Loading speaker encoder (ECAPA-TDNN)...")
+        self.speaker_encoder = _load_speaker_encoder()
+
+        print("[SelfASRX] Loading gender classifier...")
+        self.gender_classifier = _load_gender_classifier()
+
+        # Qdrant 設定
+        self.qdrant_url = os.environ.get("QDRANT_URL", "http://localhost:6333")
+        self.qdrant_api_key = os.environ.get("QDRANT_API_KEY", "")
+        schema = os.environ.get("DATABASE_SCHEMA", "public")
+        self.qdrant_collection = os.environ.get(
+            "QDRANT_SPEAKER_COLLECTION",
+            f"momentry_{schema}_speaker"
+        )
+        self._qdrant_ok = False
+
+        print("[SelfASRX] Models loaded successfully")
+
+    def process(self, audio_path, output_path=None, file_uuid=None,
+                max_speakers=10, quality_threshold=0.85,
+                checkpoint_path=None):
+        """7 步 speaker diarization pipeline
 
-    def process_with_segments(self, audio_path, asr_segments, output_path=None):
-        """
-        使用 ASR segment 邊界進行 speaker diarization，取代 VAD 步驟。
-        
         Args:
-            audio_path: 音頻文件路徑（WAV）
-            asr_segments: ASR segment 列表，每個包含 start/end（秒）
-            output_path: 輸出 JSON 路徑（可選）
+            audio_path: 音頻文件路徑 (WAV 16kHz mono)
+            output_path: 輸出 JSON 路徑 (可選)
+            file_uuid: 檔案 UUID (用於 Qdrant 儲存)
+            max_speakers: 最大說話人數
+            quality_threshold: 高品質聲紋門檻 (0-1)
+            checkpoint_path: Step 3 完成後儲存 checkpoint 路徑
+
+        Returns:
+            dict: segments, speaker_stats, n_speakers, total_duration, references
         """
         start_time = time.time()
-        print(f"\n[SelfASRX-Fixed] Processing with {len(asr_segments)} ASR segments: {audio_path}")
+        print(f"\n[SelfASRX] Processing: {audio_path}")
         print("=" * 60)
 
-        # 載入完整音頻
-        import soundfile as sf
-        wav, sample_rate = sf.read(audio_path)
-        if len(wav.shape) > 1:
-            wav = np.mean(wav, axis=1)  # 轉 mono
-        print(f"  Audio loaded: {len(wav)/sample_rate:.2f}s, {sample_rate}Hz")
+        # 載入音頻
+        wav, sample_rate = _load_audio(audio_path)
+        total_duration = len(wav) / sample_rate
+        print(f"  Audio: {total_duration:.2f}s, {sample_rate}Hz")
 
-        # 使用 ASR segments 取代 VAD (audio处理用time)
-        speech_segments = [(s["start_time"], s["end_time"]) for s in asr_segments]
-        print(f"  Speech segments from ASR: {len(speech_segments)}")
+        # ── Step 1: whisper 粗略定位 (faster-whisper) ──
+        print("\n[Step 1] Initial whisper transcription...")
+        t1 = time.time()
+        seg_gen, info = self.whisper.transcribe(audio_path)
+        rough_segments = []
+        for seg in seg_gen:
+            rough_segments.append({"start": seg.start, "end": seg.end, "text": seg.text})
+        language = info.language if info else None
+        print(f"  Rough segments: {len(rough_segments)}")
+        print(f"  Language: {language}")
+        print(f"  Step 1 time: {time.time() - t1:.2f}s")
 
-        if len(speech_segments) == 0:
-            print("[SelfASRX-Fixed] No ASR segments provided!")
-            return {"error": "No ASR segments", "segments": []}
+        if not rough_segments:
+            print("[SelfASRX] No speech detected by whisper!")
+            return {"error": "No speech detected", "segments": []}
 
-        # 提取語音片段
-        audio_segments = []
-        for start_sec, end_sec in speech_segments:
-            start_sample = int(start_sec * sample_rate)
-            end_sample = int(end_sec * sample_rate)
-            if start_sample >= len(wav):
+        # ── Step 2: VAD scan 每個 rough segment 細切 ──
+        print("\n[Step 2] VAD scan for refined segmentation...")
+        t2 = time.time()
+        refined_segments = []
+        for seg in rough_segments:
+            s = seg["start"]
+            e = seg["end"]
+            sub = self._vad_scan_segment(wav, sample_rate, s, e)
+            if sub:
+                refined_segments.extend(sub)
+            else:
+                refined_segments.append((s, e))
+        print(f"  Refined segments: {len(refined_segments)}")
+        print(f"  Step 2 time: {time.time() - t2:.2f}s")
+
+        if not refined_segments:
+            return {"error": "No segments after VAD scan", "segments": []}
+
+        # ── Step 3: whisper per refined segment ──
+        print("\n[Step 3] Per-segment transcription...")
+        t3 = time.time()
+        CHECKPOINT_INTERVAL = 50
+
+        segment_texts = []
+        resume_from = 0
+
+        # 載入既有 partial checkpoint（中斷續接）
+        if checkpoint_path and os.path.exists(checkpoint_path):
+            try:
+                with open(checkpoint_path, "r") as f:
+                    cp = json.load(f)
+                if cp.get("checkpoint_version") == 2 and not cp.get("step3_completed"):
+                    saved = cp.get("segment_texts", [])
+                    if saved:
+                        resume_from = len(saved)
+                        segment_texts = saved
+                        print(f"[Step 3] Resuming from #{resume_from}/{len(refined_segments)}")
+            except Exception:
+                pass
+
+        for i, (start_sec, end_sec) in enumerate(refined_segments):
+            if i < resume_from:
                 continue
-            audio_segments.append(wav[start_sample:min(end_sample, len(wav))])
+            seg_text = self._transcribe_segment(wav, sample_rate, start_sec, end_sec)
+            segment_texts.append(seg_text)
 
-        print(f"  Audio segments extracted: {len(audio_segments)}")
+            if checkpoint_path and (i + 1) % CHECKPOINT_INTERVAL == 0:
+                _save_checkpoint(checkpoint_path, {
+                    "checkpoint_version": 2,
+                    "step3_completed": False,
+                    "step3_progress": i + 1,
+                    "language": language,
+                    "total_duration": total_duration,
+                    "refined_segments": [[s, e] for s, e in refined_segments],
+                    "segment_texts": [{
+                        "text": st["text"],
+                        "language": st["language"],
+                        "lang_prob": st["lang_prob"],
+                    } for st in segment_texts],
+                    "file_uuid": file_uuid,
+                    "max_speakers": max_speakers,
+                    "quality_threshold": quality_threshold,
+                })
+                print(f"[Checkpoint] Step 3: {i+1}/{len(refined_segments)}")
 
-        # 批量提取聲紋嵌入
-        print("\n[Step 2] Speaker embedding extraction...")
-        step2_start = time.time()
+        print(f"  Step 3 time: {time.time() - t3:.2f}s")
+
+        # ── Save final checkpoint after Step 3 ──
+        if checkpoint_path:
+            _save_checkpoint(checkpoint_path, {
+                "checkpoint_version": 2,
+                "step3_completed": True,
+                "language": language,
+                "total_duration": total_duration,
+                "refined_segments": [[s, e] for s, e in refined_segments],
+                "segment_texts": [{
+                    "text": st["text"],
+                    "language": st["language"],
+                    "lang_prob": st["lang_prob"],
+                } for st in segment_texts],
+                "file_uuid": file_uuid,
+                "max_speakers": max_speakers,
+                "quality_threshold": quality_threshold,
+            })
+            print(f"[Checkpoint] Step 3 complete, saved to {checkpoint_path}")
+
+        # ── Step 4: ECAPA-TDNN per refined segment ──
+        print("\n[Step 4] Speaker embedding extraction...")
+        t4 = time.time()
+        audio_segments = []
+        for start_sec, end_sec in refined_segments:
+            s = int(start_sec * sample_rate)
+            e = int(end_sec * sample_rate)
+            audio_segments.append(wav[s:min(e, len(wav))])
+
+        from speaker_encoder import extract_speaker_embeddings_batch, normalize_embeddings
         embeddings = extract_speaker_embeddings_batch(
             self.speaker_encoder, audio_segments, sample_rate
         )
         embeddings = normalize_embeddings(embeddings)
-        step2_time = time.time() - step2_start
-        print(f"  Embedding shape: {embeddings.shape}")
-        print(f"  Embedding time: {step2_time:.2f}s")
+        print(f"  Embeddings: {embeddings.shape}")
+        print(f"  Step 4 time: {time.time() - t4:.2f}s")
 
-        # 聚類
-        print("\n[Step 3] Robust speaker clustering...")
-        step3_start = time.time()
+        # ── Step 5: AgglomerativeClustering ──
+        print("\n[Step 5] Speaker clustering...")
+        t5 = time.time()
+        from speaker_cluster_fixed import robust_speaker_clustering
         speaker_labels, estimated_n_speakers = robust_speaker_clustering(
-            embeddings, n_speakers=None, max_speakers=10
+            embeddings, n_speakers=None, max_speakers=max_speakers
         )
-        step3_time = time.time() - step3_start
-        print(f"  Clustering time: {step3_time:.2f}s")
+        print(f"  Speakers: {estimated_n_speakers}")
+        print(f"  Step 5 time: {time.time() - t5:.2f}s")
 
-        # 建立輸出
-        result = {
-            "audio_path": str(audio_path),
-            "total_duration": len(wav) / sample_rate,
-            "n_speech_segments": len(speech_segments),
-            "n_speakers": int(estimated_n_speakers),
-            "segments": []
-        }
+        # 品質計算
+        qualities = compute_embedding_quality(embeddings, speaker_labels)
 
-        for i, ((start, end), label) in enumerate(zip(speech_segments, speaker_labels)):
-            result["segments"].append({
-                "index": i,
-                "start": round(start, 3),
-                "end": round(end, 3),
-                "duration": round(end - start, 3),
-                "speaker": f"SPEAKER_{int(label)}"
-            })
-
-        # 加入 embeddings（每個 segment 對應的 192-D speaker embedding）
-        result["embeddings"] = []
-        for emb in embeddings:
-            result["embeddings"].append(emb.tolist())
+        # 建立輸出 segments
+        segments = []
+        for i, ((start_sec, end_sec), label) in enumerate(
+                zip(refined_segments, speaker_labels)):
+            seg = {
+                "start": round(start_sec, 3),
+                "end": round(end_sec, 3),
+                "start_frame": int(start_sec * 30),
+                "end_frame": int(end_sec * 30),
+                "text": segment_texts[i]["text"],
+                "language": segment_texts[i]["language"],
+                "lang_prob": segment_texts[i]["lang_prob"],
+                "speaker": f"SPEAKER_{int(label)}",
+                "speaker_id": f"SPEAKER_{int(label)}",
+                "quality": float(qualities[i]),
+            }
+            segments.append(seg)
 
         # 統計
         speaker_stats = {}
-        for seg in result["segments"]:
-            speaker = seg["speaker"]
-            if speaker not in speaker_stats:
-                speaker_stats[speaker] = {"count": 0, "duration": 0}
-            speaker_stats[speaker]["count"] += 1
-            speaker_stats[speaker]["duration"] += seg["duration"]
-        result["speaker_stats"] = speaker_stats
+        for seg in segments:
+            spk = seg["speaker_id"]
+            dur = seg["end"] - seg["start"]
+            if spk not in speaker_stats:
+                speaker_stats[spk] = {"count": 0, "duration": 0}
+            speaker_stats[spk]["count"] += 1
+            speaker_stats[spk]["duration"] += dur
+
+        result = {
+            "language": language or "",
+            "segments": segments,
+            "n_speakers": int(estimated_n_speakers),
+            "speaker_stats": speaker_stats,
+            "total_duration": total_duration,
+            "n_segments": len(segments),
+        }
+
+        # ── Step 6: Store embeddings in Qdrant ──
+        if file_uuid:
+            print("\n[Step 6] Storing embeddings in Qdrant...")
+            t6 = time.time()
+            self._store_speaker_embeddings(segments, embeddings, speaker_labels,
+                                           file_uuid)
+            print(f"  Step 6 time: {time.time() - t6:.2f}s")
+
+        # ── Step 7: High-quality classification ──
+        if file_uuid:
+            print("\n[Step 7] Classifying high-quality embeddings...")
+            t7 = time.time()
+            references = self._classify_high_quality_speakers(
+                segments, embeddings, speaker_labels, file_uuid,
+                wav, sample_rate, quality_threshold
+            )
+            if references:
+                result["references"] = references
+            print(f"  Step 7 time: {time.time() - t7:.2f}s")
 
         total_time = time.time() - start_time
         result["processing_time"] = round(total_time, 2)
-        result["realtime_factor"] = round(result["total_duration"] / total_time, 2)
-
-        print("\n[SelfASRX-Fixed] Processing completed!")
-        print(f"  Total time: {total_time:.2f}s")
-        print(f"  Realtime factor: {result['realtime_factor']:.2f}x")
-        print(f"  Detected speakers: {estimated_n_speakers}")
+        if total_duration > 0:
+            result["realtime_factor"] = round(total_duration / total_time, 2)
 
+        # 保存輸出
         if output_path:
-            import json
-            with open(output_path, 'w', encoding='utf-8') as f:
+            Path(output_path).parent.mkdir(parents=True, exist_ok=True)
+            with open(output_path, "w", encoding="utf-8") as f:
                 json.dump(result, f, indent=2, ensure_ascii=False)
-            print(f"  Results saved to: {output_path}")
+            print(f"\n[SelfASRX] Saved to: {output_path}")
+
+        print(f"\n[SelfASRX] Done! {len(segments)} segments, "
+              f"{estimated_n_speakers} speakers, "
+              f"{total_time:.2f}s")
 
-        print("=" * 60)
         return result
 
+    def resume_from_checkpoint(self, checkpoint_path, audio_path,
+                               output_path=None):
+        """Load the Step 1-3 results from a checkpoint and run Steps 4-7 on them."""
+        print(f"\n[SelfASRX] Resuming from checkpoint: {checkpoint_path}")
+        print("=" * 60)
+
+        with open(checkpoint_path, "r", encoding="utf-8") as f:
+            cp = json.load(f)
+
+        if not cp.get("step3_completed"):  # partial checkpoints are rejected, not resumed
+            error_msg = f"Checkpoint step3 not completed (progress: {cp.get('step3_progress', '?')})"
+            print(f"[SelfASRX] {error_msg}")
+            return {"error": error_msg, "segments": []}
+
+        wav, sample_rate = _load_audio(audio_path)
+        refined_segments = [tuple(s) for s in cp["refined_segments"]]  # JSON lists -> (start, end)
+        segment_texts = cp["segment_texts"]  # indexed in step with refined_segments below
+        language = cp.get("language", "")
+        total_duration = cp.get("total_duration", 0)
+        file_uuid = cp.get("file_uuid")  # falsy -> Steps 6 and 7 are skipped
+        max_speakers = cp.get("max_speakers", 10)
+        quality_threshold = cp.get("quality_threshold", 0.85)
+
+        print(f"  Loaded checkpoint: {len(refined_segments)} segments, "
+              f"language={language}, duration={total_duration:.2f}s")
+
+        start_time = time.time()
+
+        # ── Step 4: ECAPA-TDNN per refined segment ──
+        print("\n[Step 4] Speaker embedding extraction...")
+        t4 = time.time()
+        audio_segments = []
+        for start_sec, end_sec in refined_segments:
+            s = int(start_sec * sample_rate)
+            e = int(end_sec * sample_rate)
+            audio_segments.append(wav[s:min(e, len(wav))])  # clamp the end to the audio length
+
+        from speaker_encoder import extract_speaker_embeddings_batch, normalize_embeddings
+        embeddings = extract_speaker_embeddings_batch(
+            self.speaker_encoder, audio_segments, sample_rate
+        )
+        embeddings = normalize_embeddings(embeddings)
+        print(f"  Embeddings: {embeddings.shape}")
+        print(f"  Step 4 time: {time.time() - t4:.2f}s")
+
+        # ── Step 5: AgglomerativeClustering ──
+        print("\n[Step 5] Speaker clustering...")
+        t5 = time.time()
+        from speaker_cluster_fixed import robust_speaker_clustering
+        speaker_labels, estimated_n_speakers = robust_speaker_clustering(
+            embeddings, n_speakers=None, max_speakers=max_speakers
+        )
+        print(f"  Speakers: {estimated_n_speakers}")
+        print(f"  Step 5 time: {time.time() - t5:.2f}s")
+
+        # Per-segment quality score from compute_embedding_quality
+        qualities = compute_embedding_quality(embeddings, speaker_labels)
+
+        # Build the output segments
+        segments = []
+        for i, ((start_sec, end_sec), label) in enumerate(
+                zip(refined_segments, speaker_labels)):
+            seg = {
+                "start": round(start_sec, 3),
+                "end": round(end_sec, 3),
+                "start_frame": int(start_sec * 30),  # NOTE(review): 30 looks like an assumed fps - confirm
+                "end_frame": int(end_sec * 30),
+                "text": segment_texts[i]["text"],
+                "language": segment_texts[i]["language"],
+                "lang_prob": segment_texts[i]["lang_prob"],
+                "speaker": f"SPEAKER_{int(label)}",
+                "speaker_id": f"SPEAKER_{int(label)}",
+                "quality": float(qualities[i]),
+            }
+            segments.append(seg)
+
+        # Per-speaker statistics: segment count and summed (rounded) duration
+        speaker_stats = {}
+        for seg in segments:
+            spk = seg["speaker_id"]
+            dur = seg["end"] - seg["start"]
+            if spk not in speaker_stats:
+                speaker_stats[spk] = {"count": 0, "duration": 0}
+            speaker_stats[spk]["count"] += 1
+            speaker_stats[spk]["duration"] += dur
+
+        result = {
+            "language": language or "",
+            "segments": segments,
+            "n_speakers": int(estimated_n_speakers),
+            "speaker_stats": speaker_stats,
+            "total_duration": total_duration,
+            "n_segments": len(segments),
+        }
+
+        # ── Step 6: Store embeddings in Qdrant ──
+        if file_uuid:
+            print("\n[Step 6] Storing embeddings in Qdrant...")
+            t6 = time.time()
+            self._store_speaker_embeddings(segments, embeddings, speaker_labels,
+                                           file_uuid)
+            print(f"  Step 6 time: {time.time() - t6:.2f}s")
+
+        # ── Step 7: High-quality classification ──
+        if file_uuid:
+            print("\n[Step 7] Classifying high-quality embeddings...")
+            t7 = time.time()
+            references = self._classify_high_quality_speakers(
+                segments, embeddings, speaker_labels, file_uuid,
+                wav, sample_rate, quality_threshold
+            )
+            if references:
+                result["references"] = references
+            print(f"  Step 7 time: {time.time() - t7:.2f}s")
+
+        total_time = time.time() - start_time  # covers Steps 4-7 only, not the checkpointed steps
+        result["processing_time"] = round(total_time, 2)
+        if total_duration > 0:
+            result["realtime_factor"] = round(total_duration / total_time, 2)
+
+        # Write the result as JSON, creating the parent directory when missing
+        if output_path:
+            Path(output_path).parent.mkdir(parents=True, exist_ok=True)
+            with open(output_path, "w", encoding="utf-8") as f:
+                json.dump(result, f, indent=2, ensure_ascii=False)
+            print(f"\n[SelfASRX] Saved to: {output_path}")
+
+        print(f"\n[SelfASRX] Done! {len(segments)} segments, "
+              f"{estimated_n_speakers} speakers, "
+              f"{total_time:.2f}s")
+
+        return result
+
+    # ── Internal helpers ──
+
+    def _vad_scan_segment(self, wav, sample_rate, start_sec, end_sec):
+        """Refine one segment with VAD by delegating to vad.scan_within_segment."""
+        from vad import scan_within_segment
+        vad_handles = (self.vad_model, self.vad_utils)
+        return scan_within_segment(
+            wav, sample_rate, start_sec, end_sec, *vad_handles
+        )
+
+    def _transcribe_segment(self, wav, sample_rate, start_sec, end_sec):
+        """Transcribe one segment by delegating to whisper_local.transcribe_segment."""
+        from whisper_local import transcribe_segment as _transcribe
+        return _transcribe(wav, sample_rate, start_sec, end_sec, self.whisper)
+
+    def _store_speaker_embeddings(self, segments, embeddings, labels, file_uuid):
+        """Step 6: upsert every segment embedding into Qdrant; False if unavailable."""
+        if not self._ensure_qdrant():
+            return False  # keep the return type a bool on every path
+
+        points = []
+        for i, (seg, emb, _label) in enumerate(
+                zip(segments, embeddings, labels)):
+            point_id = _hash_point_id(file_uuid, f"{i}")
+            points.append({
+                "id": point_id,
+                "vector": emb.tolist(),
+                "payload": {
+                    "type": "speaker_embedding",
+                    "file_uuid": file_uuid,
+                    "speaker_id": seg["speaker_id"],
+                    "text": seg["text"],
+                    "language": seg["language"],
+                    "start_time": seg["start"],
+                    "end_time": seg["end"],
+                }
+            })
+
+        ok = _qdrant_upsert(self.qdrant_url, self.qdrant_api_key,
+                            self.qdrant_collection, points)
+        if ok:
+            print(f"  Stored {len(points)} speaker embeddings to Qdrant")
+        return ok
+
+    def _classify_high_quality_speakers(self, segments, embeddings, labels,
+                                        file_uuid, wav, sample_rate,
+                                        threshold=0.85):
+        """Step 7: keep high-quality embeddings, classify gender, upsert one Qdrant reference per speaker."""
+        qualities = compute_embedding_quality(embeddings, labels)
+        high_mask = qualities >= threshold
+
+        if not np.any(high_mask):
+            print("  No high-quality embeddings found")
+            return []
+
+        unique_labels = set(labels)
+        references = []
+        for label in unique_labels:
+            mask = (labels == label) & high_mask  # this speaker's high-quality segments only
+            if not np.any(mask):
+                continue
+            high_indices = [i for i in range(len(segments)) if mask[i]]
+            high_segs = [segments[i] for i in high_indices]
+
+            # Index (into segments) of this speaker's highest-quality segment
+            best_idx = high_indices[int(np.argmax(qualities[mask]))]
+            best_seg = segments[best_idx]
+
+            centroid = np.mean(embeddings[mask], axis=0)
+            norm = np.linalg.norm(centroid)
+            if norm > 0:
+                centroid = centroid / norm
+
+            avg_quality = float(np.mean(qualities[mask]))
+            speaker_id = f"SPEAKER_{int(label)}"
+            text_samples = [s["text"] for s in high_segs[:5] if s["text"]]
+            total_dur = sum(s["end"] - s["start"] for s in high_segs)
+
+            ref_id = _hash_point_id(file_uuid, f"ref_{label}")
+            ref_payload = {
+                "type": "speaker_reference",
+                "file_uuid": file_uuid,
+                "speaker_id": speaker_id,
+                "n_segments": int(np.sum(mask)),
+                "avg_quality": avg_quality,
+                "total_duration": round(total_dur, 2),
+                "language": best_seg.get("language", ""),
+                "text_samples": text_samples,
+            }
+
+            # Gender classification on the audio of the best segment
+            if self.gender_classifier is not None:
+                try:
+                    import torch
+                    s = int(best_seg["start"] * sample_rate)
+                    e = int(best_seg["end"] * sample_rate)
+                    seg_wav = wav[s:min(e, len(wav))]
+                    seg_tensor = torch.from_numpy(seg_wav).float().unsqueeze(0)
+                    # The SpeechBrain gender classifier is fed the waveform tensor directly
+                    out = self.gender_classifier.classify_batch(seg_tensor)
+                    probs = torch.softmax(out[0], dim=-1).squeeze().cpu().detach().numpy()
+                    if len(probs) >= 2:
+                        idx = int(np.argmax(probs))
+                        ref_payload["gender"] = "male" if idx == 0 else "female"  # NOTE(review): assumes class 0 is male - confirm
+                        ref_payload["gender_conf"] = float(probs[idx])
+                    else:
+                        ref_payload["gender"] = "unknown"
+                        ref_payload["gender_conf"] = 0.0
+                except Exception as e:
+                    print(f"[Gender] Classify error: {e}")
+                    ref_payload["gender"] = "unknown"
+                    ref_payload["gender_conf"] = 0.0
+            else:
+                ref_payload["gender"] = "unknown"
+                ref_payload["gender_conf"] = 0.0
+
+            _qdrant_upsert(self.qdrant_url, self.qdrant_api_key,  # NOTE(review): result is ignored here
+                           self.qdrant_collection, [{
+                               "id": ref_id,
+                               "vector": centroid.tolist(),
+                               "payload": ref_payload,
+                           }])
+
+            references.append({
+                "speaker_id": speaker_id,
+                "n_segments": int(np.sum(mask)),
+                "avg_quality": avg_quality,
+                "gender": ref_payload["gender"],
+            })
+
+            print(f"  Ref: {speaker_id}, gender={ref_payload['gender']}"
+                  f" ({ref_payload['gender_conf']:.2f}), q={avg_quality:.3f}")
+
+        return references
+
+    def _ensure_qdrant(self):
+        """Report whether the Qdrant collection is usable, re-probing until a check succeeds."""
+        if self._qdrant_ok:
+            return self._qdrant_ok
+        self._qdrant_ok = _ensure_speaker_collection(
+            self.qdrant_url, self.qdrant_api_key, self.qdrant_collection
+        )
+        return self._qdrant_ok
+
 
 def main():
     import argparse
-    
-    parser = argparse.ArgumentParser(description="Self-implemented ASRX (Fixed)")
-    parser.add_argument("audio_path", help="Path to audio file")
+    parser = argparse.ArgumentParser(description="SelfASRX - Hybrid Speaker Diarization")
+    parser.add_argument("audio_path", help="Path to audio file (WAV)")
     parser.add_argument("-o", "--output", help="Output JSON path")
-    parser.add_argument("--min-speech-duration", type=int, default=500)
-    parser.add_argument("--n-speakers", type=int, default=None)
+    parser.add_argument("--file-uuid", help="File UUID for Qdrant storage")
     parser.add_argument("--max-speakers", type=int, default=10)
-    
+    parser.add_argument("--quality-threshold", type=float, default=0.85)
+    parser.add_argument("--resume", help="Checkpoint path to resume from")
+    parser.add_argument("--checkpoint", help="Save checkpoint path after Step 3")
     args = parser.parse_args()
-    
-    if not Path(args.audio_path).exists():
-        print(f"Error: Audio file not found: {args.audio_path}")
-        sys.exit(1)
-    
+
     asrx = SelfASRXFixed()
-    result = asrx.process(
-        args.audio_path,
-        args.output,
-        min_speech_duration_ms=args.min_speech_duration,
-        n_speakers=args.n_speakers,
-        max_speakers=args.max_speakers
-    )
-    
+
+    # Both modes read the audio file: resuming still loads it for Steps 4-7.
+    if not Path(args.audio_path).exists():
+        print(f"Error: Audio file not found: {args.audio_path}")
+        sys.exit(1)
+    if args.resume:
+        if not Path(args.resume).exists():
+            print(f"Error: Checkpoint not found: {args.resume}")
+            sys.exit(1)
+        result = asrx.resume_from_checkpoint(
+            args.resume, args.audio_path,
+            output_path=args.output,
+        )
+    else:
+        result = asrx.process(
+            args.audio_path,
+            output_path=args.output,
+            file_uuid=args.file_uuid,
+            max_speakers=args.max_speakers,
+            quality_threshold=args.quality_threshold,
+            checkpoint_path=args.checkpoint,
+        )
+
     if "error" not in result:
         print("\n[Summary]")
-        print(f"  Audio duration: {result['total_duration']:.2f}s")
-        print(f"  Speech segments: {result['n_speech_segments']}")
-        print(f"  Detected speakers: {result['n_speakers']}")
-        print(f"  Processing time: {result['processing_time']:.2f}s")
-        print(f"  Realtime factor: {result['realtime_factor']:.2f}x")
-        
-        print("\n[Speaker Statistics]")
-        for speaker, stats in result['speaker_stats'].items():
-            pct = stats['duration'] / result['total_duration'] * 100
-            print(f"  {speaker}: {stats['count']} segments, " +
-                  f"{stats['duration']:.2f}s ({pct:.1f}%)")
+        print(f"  Duration: {result['total_duration']:.2f}s")
+        print(f"  Segments: {result['n_segments']}")
+        print(f"  Speakers: {result['n_speakers']}")
+        if "references" in result:
+            for ref in result["references"]:
+                print(f"  {ref['speaker_id']}: gender={ref['gender']}, "
+                      f"quality={ref['avg_quality']:.3f}")
 
 
 if __name__ == "__main__":
diff --git a/scripts/asrx_self/speaker_audio_player.py b/scripts/asrx_self/speaker_audio_player.py
deleted file mode 100644
index 7f26275..0000000
--- a/scripts/asrx_self/speaker_audio_player.py
+++ /dev/null
@@ -1,280 +0,0 @@
-#!/opt/homebrew/bin/python3.11
-"""
-Speaker Audio Player - 說話人語音播放器
-從 ASRX 結果中提取並播放每個說話人的語音片段
-"""
-
-import json
-import argparse
-import subprocess
-import tempfile
-import os
-from pathlib import Path
-from typing import List, Dict
-
-
-def load_asrx_result(result_path: str) -> Dict:
-    """載入 ASRX 結果"""
-    with open(result_path, "r", encoding="utf-8") as f:
-        return json.load(f)
-
-
-def extract_audio_segment(
-    audio_path: str, start_sec: float, end_sec: float, output_path: str
-) -> bool:
-    """
-    使用 ffmpeg 提取音頻片段
-
-    Args:
-        audio_path: 原始音頻路徑
-        start_sec: 開始時間（秒）
-        end_sec: 結束時間（秒）
-        output_path: 輸出路徑
-
-    Returns:
-        bool: 是否成功
-    """
-    duration = end_sec - start_sec
-
-    cmd = [
-        "ffmpeg",
-        "-y",
-        "-i",
-        audio_path,
-        "-ss",
-        str(start_sec),
-        "-t",
-        str(duration),
-        "-acodec",
-        "pcm_s16le",
-        "-ar",
-        "16000",
-        "-ac",
-        "1",
-        output_path,
-    ]
-
-    try:
-        result = subprocess.run(cmd, capture_output=True, text=True)
-        return result.returncode == 0
-    except Exception as e:
-        print(f"Error extracting audio: {e}")
-        return False
-
-
-def play_audio(audio_path: str) -> bool:
-    """
-    播放音頻文件
-
-    使用 macOS 的 afplay 或 Linux 的 aplay
-    """
-    try:
-        # 嘗試使用 afplay (macOS)
-        if os.path.exists("/usr/bin/afplay"):
-            subprocess.run(["afplay", audio_path], check=True)
-        # 嘗試使用 aplay (Linux)
-        elif os.path.exists("/usr/bin/aplay"):
-            subprocess.run(["aplay", audio_path], check=True)
-        else:
-            print(
-                "No audio player found. Please install afplay (macOS) or aplay (Linux)"
-            )
-            return False
-        return True
-    except Exception as e:
-        print(f"Error playing audio: {e}")
-        return False
-
-
-def group_segments_by_speaker(segments: List[Dict]) -> Dict[str, List[Dict]]:
-    """將語音片段按說話人分組"""
-    speaker_segments = {}
-
-    for seg in segments:
-        speaker = seg["speaker"]
-        if speaker not in speaker_segments:
-            speaker_segments[speaker] = []
-        speaker_segments[speaker].append(seg)
-
-    # 按開始時間排序
-    for speaker in speaker_segments:
-        speaker_segments[speaker].sort(key=lambda x: x["start"])
-
-    return speaker_segments
-
-
-def play_speaker_segments(
-    audio_path: str,
-    result_path: str,
-    speaker_id: str = None,
-    limit: int = None,
-    temp_dir: str = None,
-):
-    """
-    播放指定說話人的語音片段
-
-    Args:
-        audio_path: 原始音頻路徑
-        result_path: ASRX 結果 JSON 路徑
-        speaker_id: 說話人 ID（None=播放所有）
-        limit: 最多播放幾個片段（None=全部）
-        temp_dir: 臨時目錄
-    """
-    # 載入結果
-    print(f"[Load] Loading ASRX result: {result_path}")
-    result = load_asrx_result(result_path)
-
-    segments = result.get("segments", [])
-    total_duration = result.get("total_duration", 0)
-
-    print(f"[Info] Total segments: {len(segments)}")
-    print(f"[Info] Total duration: {total_duration / 60:.1f} minutes")
-
-    # 分組
-    speaker_segments = group_segments_by_speaker(segments)
-
-    # 選擇說話人
-    if speaker_id:
-        speakers_to_play = [speaker_id]
-    else:
-        speakers_to_play = sorted(speaker_segments.keys())
-
-    # 創建臨時目錄
-    if temp_dir is None:
-        temp_dir = tempfile.mkdtemp(prefix="speaker_audio_")
-
-    print(f"\n[Info] Temp directory: {temp_dir}")
-    print(f"[Info] Speakers to play: {speakers_to_play}")
-    print("=" * 60)
-
-    # 播放每個說話人的片段
-    for speaker in speakers_to_play:
-        if speaker not in speaker_segments:
-            print(f"\n[Warning] Speaker {speaker} not found!")
-            continue
-
-        segs = speaker_segments[speaker]
-        if limit:
-            segs = segs[:limit]
-
-        print(f"\n▶️  {speaker} ({len(segs)} segments)")
-        print("-" * 60)
-
-        for i, seg in enumerate(segs, 1):
-            start = seg["start"]
-            end = seg["end"]
-            duration = seg["duration"]
-
-            # 提取音頻
-            temp_audio = os.path.join(temp_dir, f"{speaker}_{i:03d}.wav")
-
-            print(
-                f"  [{i:3d}] {start:7.2f}s - {end:7.2f}s ({duration:5.2f}s) ... ",
-                end="",
-                flush=True,
-            )
-
-            if extract_audio_segment(audio_path, start, end, temp_audio):
-                print("✅", end="", flush=True)
-
-                # 播放
-                if play_audio(temp_audio):
-                    print(" ▶️  Played")
-                else:
-                    print(" ❌ Play failed")
-            else:
-                print(" ❌ Extract failed")
-
-        print()
-
-
-def show_speaker_stats(result_path: str):
-    """顯示說話人統計資訊"""
-    result = load_asrx_result(result_path)
-
-    segments = result.get("segments", [])
-    speaker_segments = group_segments_by_speaker(segments)
-
-    print("\n" + "=" * 60)
-    print("說話人統計")
-    print("=" * 60)
-
-    # 按時長排序
-    speaker_stats = []
-    for speaker, segs in speaker_segments.items():
-        total_duration = sum(seg["duration"] for seg in segs)
-        speaker_stats.append((speaker, len(segs), total_duration))
-
-    speaker_stats.sort(key=lambda x: x[2], reverse=True)
-
-    total_duration = result.get("total_duration", 0)
-
-    for speaker, count, duration in speaker_stats:
-        pct = duration / total_duration * 100 if total_duration > 0 else 0
-        print(f"{speaker:12} {count:4} segments  {duration:8.1f}s  ({pct:5.1f}%)")
-
-    print("=" * 60)
-
-
-def main():
-    parser = argparse.ArgumentParser(
-        description="Speaker Audio Player - 播放說話人語音片段",
-        formatter_class=argparse.RawDescriptionHelpFormatter,
-        epilog="""
-Examples:
-  # 顯示說話人統計
-  python3 speaker_audio_player.py --stats result.json
-  
-  # 播放所有說話人的前 3 個片段
-  python3 speaker_audio_player.py audio.wav result.json --limit 3
-  
-  # 播放特定說話人的所有片段
-  python3 speaker_audio_player.py audio.wav result.json --speaker SPEAKER_0
-  
-  # 播放 SPEAKER_1 的前 5 個片段
-  python3 speaker_audio_player.py audio.wav result.json --speaker SPEAKER_1 --limit 5
-        """,
-    )
-
-    parser.add_argument("audio_path", nargs="?", help="原始音頻文件路徑")
-    parser.add_argument("result_path", help="ASRX 結果 JSON 路徑")
-    parser.add_argument("--stats", action="store_true", help="只显示說話人統計")
-    parser.add_argument("--speaker", type=str, help="指定說話人 ID（如 SPEAKER_0）")
-    parser.add_argument(
-        "--limit",
-        type=int,
-        default=None,
-        help="每個說話人最多播放幾個片段（None=全部）",
-    )
-    parser.add_argument("--temp-dir", type=str, default=None, help="臨時目錄路徑")
-
-    args = parser.parse_args()
-
-    if args.stats:
-        show_speaker_stats(args.result_path)
-        return
-
-    if not args.audio_path:
-        print("Error: audio_path is required unless --stats is specified")
-        parser.print_help()
-        return
-
-    if not Path(args.audio_path).exists():
-        print(f"Error: Audio file not found: {args.audio_path}")
-        return
-
-    if not Path(args.result_path).exists():
-        print(f"Error: Result file not found: {args.result_path}")
-        return
-
-    play_speaker_segments(
-        args.audio_path,
-        args.result_path,
-        speaker_id=args.speaker,
-        limit=args.limit,
-        temp_dir=args.temp_dir,
-    )
-
-
-if __name__ == "__main__":
-    main()
diff --git a/scripts/asrx_self/speaker_classifier.py b/scripts/asrx_self/speaker_classifier.py
new file mode 100644
index 0000000..f22f20d
--- /dev/null
+++ b/scripts/asrx_self/speaker_classifier.py
@@ -0,0 +1,65 @@
+"""
+Speaker Classifier - 聲紋品質評估與性別分類
+
+提供品質計算與性別分類功能，作為 main_fixed.py 的輔助模組。
+"""
+
+import numpy as np
+
+
+def compute_embedding_quality(embeddings, labels):
+    """Cosine similarity between each embedding and its own cluster centroid.
+
+    Args:
+        embeddings: [n_segments, dim] speaker-embedding matrix.
+        labels: [n_segments] cluster labels (NumPy array or plain sequence).
+
+    Returns:
+        qualities: [n_segments] cosine scores in [-1, 1]; higher means the
+            segment lies closer to its centroid. All-zero vectors score 0.
+    """
+    embeddings = np.asarray(embeddings, dtype=float)
+    labels = np.asarray(labels)  # a plain list would make `labels == x` a scalar
+    qualities = np.zeros(len(labels), dtype=float)
+    if len(labels) == 0:
+        return qualities
+
+    # Row-normalise once; zero rows stay zero instead of dividing by zero.
+    row_norms = np.linalg.norm(embeddings, axis=1, keepdims=True)
+    unit = np.divide(embeddings, row_norms, out=np.zeros_like(embeddings),
+                     where=row_norms > 0)
+    for label in np.unique(labels):
+        mask = labels == label
+        centroid = embeddings[mask].mean(axis=0)
+        norm = np.linalg.norm(centroid)
+        if norm > 0:
+            qualities[mask] = unit[mask] @ (centroid / norm)
+    return qualities
+
+
+def classify_gender(audio_wav, sample_rate, classifier):
+    """Classify speaker gender from one audio segment (best effort).
+
+    Args:
+        audio_wav: audio waveform (numpy array)
+        sample_rate: sampling rate (not used by the current implementation)
+        classifier: SpeechBrain EncoderClassifier (gender-recognition-ecapa)
+
+    Returns:
+        dict: {"gender": "male"|"female"|"unknown", "confidence": float}
+    """
+    default = {"gender": "unknown", "confidence": 0.0}
+    if classifier is None or len(audio_wav) == 0:
+        return default
+    try:
+        import torch
+        seg_tensor = torch.from_numpy(audio_wav).float().unsqueeze(0)
+        out = classifier.classify_batch(seg_tensor)
+        probs = torch.softmax(out[0], dim=-1).squeeze().cpu().detach().numpy()
+        if len(probs) >= 2:
+            idx = int(np.argmax(probs))
+            label = "male" if idx == 0 else "female"
+            return {"gender": label, "confidence": float(probs[idx])}
+    except Exception as e:
+        print(f"[Gender] Classify error: {e}")  # log it, then fall back to the default
+    return default
diff --git a/scripts/asrx_self/speaker_cluster.py b/scripts/asrx_self/speaker_cluster.py
deleted file mode 100644
index 6c60a9a..0000000
--- a/scripts/asrx_self/speaker_cluster.py
+++ /dev/null
@@ -1,310 +0,0 @@
-#!/opt/homebrew/bin/python3.11
-"""
-Speaker Clustering - 說話人聚類
-使用譜聚類算法將聲紋嵌入分組
-
-技術來源:
-- 譜聚類：Shi & Malik (2000), IEEE TPAMI
-- 論文：https://ieeexplore.ieee.org/document/868688
-- 應用於說話人分離：Wooters & Huijbregts (2008), ICASSP
-"""
-
-import numpy as np
-from sklearn.cluster import SpectralClustering, AgglomerativeClustering
-from sklearn.metrics.pairwise import cosine_similarity
-
-
-def estimate_n_speakers_eigengap(similarity_matrix, max_speakers=10):
-    """
-    使用特徵值間隙方法估計說話人數量
-
-    技術來源:
-    - 特徵值間隙理論：Lu et al. (2010)
-    - 原理：相似度矩陣的特徵值分佈中，最大間隙對應最佳聚類數
-
-    Args:
-        similarity_matrix: 相似度矩陣 [n, n]
-        max_speakers: 最大說話人數
-
-    Returns:
-        n_speakers: 估計的說話人數量
-    """
-    # 計算特徵值
-    eigenvalues = np.linalg.eigvalsh(similarity_matrix)
-
-    # 降序排列
-    eigenvalues = np.sort(eigenvalues)[::-1]
-
-    # 只考慮前 max_speakers 個特徵值
-    eigenvalues = eigenvalues[:max_speakers]
-
-    # 計算間隙
-    gaps = np.diff(eigenvalues)
-
-    # 找到最大間隙的位置
-    if len(gaps) > 0:
-        n_speakers = np.argmax(np.abs(gaps)) + 1
-    else:
-        n_speakers = 1
-
-    # 限制範圍
-    n_speakers = max(2, min(n_speakers, max_speakers))
-
-    return n_speakers
-
-
-def estimate_n_speakers_silhouette(embeddings, max_speakers=10):
-    """
-    使用輪廓係數估計說話人數量
-
-    Args:
-        embeddings: 嵌入矩陣 [n, d]
-        max_speakers: 最大說話人數
-
-    Returns:
-        n_speakers: 估計的說話人數量
-    """
-    from sklearn.metrics import silhouette_score
-
-    best_score = -1
-    best_n = 2
-
-    for n in range(2, min(max_speakers + 1, len(embeddings))):
-        clustering = AgglomerativeClustering(n_clusters=n)
-        labels = clustering.fit_predict(embeddings)
-
-        if len(np.unique(labels)) > 1:
-            score = silhouette_score(embeddings, labels)
-            if score > best_score:
-                best_score = score
-                best_n = n
-
-    return best_n
-
-
-def spectral_clustering_speaker(
-    similarity_matrix, n_speakers=None, auto_estimate=True, max_speakers=10
-):
-    """
-    使用譜聚類進行說話人分離
-
-    Args:
-        similarity_matrix: 相似度矩陣 [n, n]
-        n_speakers: 說話人數量（可選，如果為 None 則自動估計）
-        auto_estimate: 是否自動估計說話人數量
-        max_speakers: 最大說話人數
-
-    Returns:
-        speaker_labels: 說話人標籤 [n,]
-        n_speakers: 使用的說話人數量
-    """
-    n_segments = len(similarity_matrix)
-
-    # 清洗相似度矩陣
-    similarity_matrix = np.nan_to_num(
-        similarity_matrix, nan=0.5, posinf=1.0, neginf=-1.0
-    )
-
-    # 確保對角線為 1
-    np.fill_diagonal(similarity_matrix, 1.0)
-
-    # 確保值在 [-1, 1] 範圍
-    similarity_matrix = np.clip(similarity_matrix, -1.0, 1.0)
-
-    # 自動估計說話人數量
-    if n_speakers is None and auto_estimate:
-        n_speakers = estimate_n_speakers_eigengap(
-            similarity_matrix, max_speakers=max_speakers
-        )
-        print(f"[Clustering] Estimated n_speakers: {n_speakers}")
-
-    if n_speakers is None:
-        n_speakers = 2  # 預設值
-
-    # 確保 n_speakers 不超過樣本數
-    n_speakers = min(n_speakers, n_segments)
-
-    print(f"[Clustering] Running spectral clustering with {n_speakers} clusters...")
-
-    # 譜聚類
-    try:
-        clustering = SpectralClustering(
-            n_clusters=int(n_speakers),
-            affinity="precomputed",
-            assign_labels="kmeans",
-            random_state=42,
-            n_init=10,
-        )
-
-        speaker_labels = clustering.fit_predict(similarity_matrix)
-
-        print("[Clustering] Spectral clustering completed")
-        print(f"[Clustering] n_speakers: {n_speakers}")
-        print(f"[Clustering] n_segments: {n_segments}")
-
-        return speaker_labels, n_speakers
-
-    except Exception as e:
-        print(f"[Clustering] Spectral clustering failed: {e}")
-        print("[Clustering] Using fallback: 2 speakers")
-        # 簡單分配：前一半是 SPEAKER_0，後一半是 SPEAKER_1
-        speaker_labels = np.array(
-            [0] * (n_segments // 2) + [1] * (n_segments - n_segments // 2)
-        )
-        return speaker_labels, 2
-
-
-def agglomerative_clustering_speaker(
-    embeddings, n_speakers=None, threshold=0.5, max_speakers=10
-):
-    """
-    使用層次聚類進行說話人分離
-
-    Args:
-        embeddings: 嵌入矩陣 [n, d]
-        n_speakers: 說話人數量（可選）
-        threshold: 距離閾值（用於自動決定聚類數）
-        max_speakers: 最大說話人數
-
-    Returns:
-        speaker_labels: 說話人標籤 [n,]
-        n_speakers: 使用的說話人數量
-    """
-    n_segments = len(embeddings)
-
-    if n_speakers is None:
-        # 使用距離閾值自動決定
-        from sklearn.metrics.pairwise import cosine_distances
-
-        distances = cosine_distances(embeddings)
-
-        # 計算平均最近鄰距離
-        avg_distances = []
-        for i in range(min(100, n_segments)):
-            dists = distances[i]
-            dists = np.sort(dists)
-            if len(dists) > 1:
-                avg_distances.append(dists[1])  # 最近鄰（排除自己）
-
-        if avg_distances:
-            avg_dist = np.mean(avg_distances)
-            # 根據平均距離估計聚類數
-            n_speakers = max(2, int(avg_dist / threshold))
-            n_speakers = min(n_speakers, max_speakers)
-        else:
-            n_speakers = 2
-
-    n_speakers = min(n_speakers, n_segments)
-
-    # 層次聚類
-    clustering = AgglomerativeClustering(
-        n_clusters=n_speakers, metric="cosine", linkage="average"
-    )
-
-    speaker_labels = clustering.fit_predict(embeddings)
-
-    print("[Clustering] Agglomerative clustering completed")
-    print(f"[Clustering] n_speakers: {n_speakers}")
-
-    return speaker_labels, n_speakers
-
-
-def smooth_speaker_labels(speaker_labels, window_size=5):
-    """
-    平滑說話人標籤（去除噪聲）
-
-    Args:
-        speaker_labels: 原始說話人標籤
-        window_size: 平滑窗口大小
-
-    Returns:
-        smoothed_labels: 平滑後的標籤
-    """
-    from scipy import stats
-
-    smoothed = np.copy(speaker_labels)
-    half_window = window_size // 2
-
-    for i in range(len(speaker_labels)):
-        start = max(0, i - half_window)
-        end = min(len(speaker_labels), i + half_window + 1)
-
-        window_labels = speaker_labels[start:end]
-        mode_result = stats.mode(window_labels, keepdims=True)
-        smoothed[i] = mode_result.mode[0]
-
-    return smoothed
-
-
-def compute_diarization_purity(speaker_labels, ground_truth_labels=None):
-    """
-    計算說話人分離純度（如果有 ground truth）
-
-    Args:
-        speaker_labels: 預測的說話人標籤
-        ground_truth_labels: 真實的說話人標籤（可選）
-
-    Returns:
-        purity: 純度分數（0-1）
-    """
-    if ground_truth_labels is None:
-        # 沒有 ground truth，使用聚類純度近似
-
-        # 使用餘弦相似度作為距離
-        purity = 0.5  # 預設值
-    else:
-        # 計算純度
-        from sklearn.metrics import adjusted_rand_score
-
-        purity = adjusted_rand_score(ground_truth_labels, speaker_labels)
-
-    return purity
-
-
-if __name__ == "__main__":
-    # 測試聚類算法
-    print("[Test] Testing speaker clustering algorithms")
-
-    # 生成模擬數據
-    np.random.seed(42)
-    n_speakers = 3
-    n_segments_per_speaker = 20
-
-    # 生成 3 個說話人的嵌入
-    embeddings = []
-    for i in range(n_speakers):
-        # 每個說話人有不同的中心
-        center = np.random.randn(192) * 2 + i * 3
-        # 添加噪聲
-        for _ in range(n_segments_per_speaker):
-            emb = center + np.random.randn(192) * 0.5
-            embeddings.append(emb)
-
-    embeddings = np.array(embeddings)
-    print(f"[Test] Generated {len(embeddings)} embeddings for {n_speakers} speakers")
-
-    # 計算相似度矩陣
-    similarity = cosine_similarity(embeddings)
-    print(f"[Test] Similarity matrix shape: {similarity.shape}")
-
-    # 估計說話人數量
-    estimated_n = estimate_n_speakers_eigengap(similarity, max_speakers=10)
-    print(f"[Test] Estimated n_speakers (eigengap): {estimated_n}")
-
-    estimated_n_silhouette = estimate_n_speakers_silhouette(embeddings, max_speakers=10)
-    print(f"[Test] Estimated n_speakers (silhouette): {estimated_n_silhouette}")
-
-    # 譜聚類
-    labels, n_clusters = spectral_clustering_speaker(
-        similarity, n_speakers=None, auto_estimate=True
-    )
-
-    print("\n[Test] Clustering results:")
-    print(f"  True n_speakers: {n_speakers}")
-    print(f"  Estimated n_speakers: {n_clusters}")
-    print(f"  Unique labels: {np.unique(labels)}")
-
-    # 計算每個聚類的大小
-    for label in np.unique(labels):
-        count = np.sum(labels == label)
-        print(f"  Cluster {label}: {count} segments")
diff --git a/scripts/asrx_self/speaker_player_gui.py b/scripts/asrx_self/speaker_player_gui.py
deleted file mode 100644
index fe21d1f..0000000
--- a/scripts/asrx_self/speaker_player_gui.py
+++ /dev/null
@@ -1,431 +0,0 @@
-#!/opt/homebrew/bin/python3.11
-"""
-Speaker Player GUI - 說話人語音播放器（圖形界面）
-使用 tkinter 顯示播放進度和 Speaker ID
-"""
-
-import json
-import subprocess
-import tempfile
-import os
-import threading
-import time
-from pathlib import Path
-
-try:
-    import tkinter as tk
-    from tkinter import ttk, filedialog, messagebox
-
-    HAS_TKINTER = True
-except ImportError:
-    HAS_TKINTER = False
-
-
-class SpeakerPlayerGUI:
-    """說話人語音播放器 GUI"""
-
-    def __init__(self, root):
-        self.root = root
-        self.root.title("🎬 Speaker Audio Player - Face Integration")
-        self.root.geometry("1100x800")
-
-        # 數據
-        self.audio_path = None
-        self.result_path = None
-        self.face_path = None
-        self.result_data = None
-        self.face_data = None
-        self.integrated_data = None
-        self.speaker_segments = {}
-        self.speakers = []
-        self.current_speaker_idx = 0
-        self.is_playing = False
-        self.stop_flag = False
-
-        # 創建界面
-        self.create_widgets()
-
-    def create_widgets(self):
-        """創建界面組件"""
-        # 頂部：文件選擇
-        top_frame = ttk.Frame(self.root, padding="10")
-        top_frame.pack(fill=tk.X)
-
-        ttk.Label(top_frame, text="📁 Audio:").pack(side=tk.LEFT)
-        self.audio_label = ttk.Label(top_frame, text="未選擇", width=50)
-        self.audio_label.pack(side=tk.LEFT, padx=5)
-        ttk.Button(top_frame, text="選擇音頻", command=self.select_audio).pack(
-            side=tk.LEFT, padx=5
-        )
-
-        ttk.Label(top_frame, text="  📊 Result:").pack(side=tk.LEFT, padx=(20, 0))
-        self.result_label = ttk.Label(top_frame, text="未選擇", width=50)
-        self.result_label.pack(side=tk.LEFT, padx=5)
-        ttk.Button(top_frame, text="選擇結果", command=self.select_result).pack(
-            side=tk.LEFT, padx=5
-        )
-
-        # 中間：說話人列表和片段列表
-        mid_frame = ttk.Frame(self.root, padding="10")
-        mid_frame.pack(fill=tk.BOTH, expand=True)
-
-        # 左側：說話人列表
-        left_frame = ttk.LabelFrame(mid_frame, text="📢 說話人列表", padding="10")
-        left_frame.pack(side=tk.LEFT, fill=tk.BOTH, expand=False)
-
-        self.speaker_listbox = tk.Listbox(
-            left_frame, width=35, height=20, font=("Arial", 11)
-        )
-        self.speaker_listbox.pack(fill=tk.BOTH, expand=True)
-        self.speaker_listbox.bind("<<ListboxSelect>>", self.on_speaker_select)
-
-        # 右側：片段列表
-        right_frame = ttk.LabelFrame(mid_frame, text="🎵 語音片段", padding="10")
-        right_frame.pack(side=tk.LEFT, fill=tk.BOTH, expand=True, padx=10)
-
-        # 片段列表（带滚动条）
-        list_frame = ttk.Frame(right_frame)
-        list_frame.pack(fill=tk.BOTH, expand=True)
-
-        scrollbar = ttk.Scrollbar(list_frame)
-        scrollbar.pack(side=tk.RIGHT, fill=tk.Y)
-
-        self.segment_listbox = tk.Listbox(
-            list_frame,
-            width=50,
-            height=20,
-            font=("Courier", 10),
-            yscrollcommand=scrollbar.set,
-        )
-        self.segment_listbox.pack(fill=tk.BOTH, expand=True)
-        scrollbar.config(command=self.segment_listbox.yview)
-
-        self.segment_listbox.bind("<Double-Button-1>", self.on_segment_double_click)
-
-        # 底部：播放控制和進度
-        bottom_frame = ttk.Frame(self.root, padding="10")
-        bottom_frame.pack(fill=tk.X)
-
-        # 播放控制
-        control_frame = ttk.Frame(bottom_frame)
-        control_frame.pack(fill=tk.X)
-
-        self.play_button = ttk.Button(
-            control_frame, text="▶️ 播放所選", command=self.play_selected, width=15
-        )
-        self.play_button.pack(side=tk.LEFT, padx=5)
-
-        self.stop_button = ttk.Button(
-            control_frame, text="⏹️ 停止", command=self.stop_playing, width=10
-        )
-        self.stop_button.pack(side=tk.LEFT, padx=5)
-        self.stop_button.config(state=tk.DISABLED)
-
-        self.play_all_button = ttk.Button(
-            control_frame, text="▶️▶️ 播放全部", command=self.play_all, width=15
-        )
-        self.play_all_button.pack(side=tk.LEFT, padx=5)
-
-        # 進度條
-        progress_frame = ttk.Frame(bottom_frame)
-        progress_frame.pack(fill=tk.X, pady=(10, 0))
-
-        ttk.Label(progress_frame, text="⏱️ 進度:").pack(side=tk.LEFT)
-        self.progress_bar = ttk.Progressbar(progress_frame, mode="determinate")
-        self.progress_bar.pack(side=tk.LEFT, fill=tk.X, expand=True, padx=10)
-
-        self.progress_label = ttk.Label(progress_frame, text="0:00 / 0:00", width=20)
-        self.progress_label.pack(side=tk.LEFT)
-
-        # 狀態欄
-        self.status_label = ttk.Label(
-            bottom_frame, text="就緒", relief=tk.SUNKEN, anchor=tk.W
-        )
-        self.status_label.pack(fill=tk.X, pady=(10, 0))
-
-    def select_audio(self):
-        """選擇音頻文件"""
-        filename = filedialog.askopenfilename(
-            title="選擇音頻文件",
-            filetypes=[("WAV files", "*.wav"), ("All files", "*.*")],
-        )
-        if filename:
-            self.audio_path = filename
-            self.audio_label.config(text=Path(filename).name)
-            self.check_ready()
-
-    def select_result(self):
-        """選擇結果文件"""
-        filename = filedialog.askopenfilename(
-            title="選擇 ASRX 結果文件",
-            filetypes=[("JSON files", "*.json"), ("All files", "*.*")],
-        )
-        if filename:
-            self.result_path = filename
-            self.result_label.config(text=Path(filename).name)
-            self.load_result()
-            self.check_ready()
-
-    def load_result(self):
-        """載入 ASRX 結果"""
-        try:
-            with open(self.result_path, "r", encoding="utf-8") as f:
-                self.result_data = json.load(f)
-
-            # 分組
-            self.speaker_segments = {}
-            for seg in self.result_data.get("segments", []):
-                speaker = seg["speaker"]
-                if speaker not in self.speaker_segments:
-                    self.speaker_segments[speaker] = []
-                self.speaker_segments[speaker].append(seg)
-
-            # 排序
-            for speaker in self.speaker_segments:
-                self.speaker_segments[speaker].sort(key=lambda x: x["start"])
-
-            # 說話人列表（按時長排序）
-            self.speakers = sorted(
-                self.speaker_segments.keys(),
-                key=lambda s: sum(seg["duration"] for seg in self.speaker_segments[s]),
-                reverse=True,
-            )
-
-            # 更新列表框
-            self.speaker_listbox.delete(0, tk.END)
-            for speaker in self.speakers:
-                segs = self.speaker_segments[speaker]
-                total_dur = sum(seg["duration"] for seg in segs)
-                total_dur_min = total_dur / 60
-                self.speaker_listbox.insert(
-                    tk.END,
-                    f"🔊 {speaker:12} | {len(segs):4d}段 | {total_dur_min:5.1f}分鐘",
-                )
-
-            self.status_label.config(
-                text=f"載入成功：{len(self.speakers)} 個說話人，{len(self.result_data.get('segments', []))} 個片段"
-            )
-
-        except Exception as e:
-            messagebox.showerror("錯誤", f"載入結果文件失敗：{e}")
-            self.result_path = None
-            self.result_label.config(text="載入失敗")
-
-    def check_ready(self):
-        """檢查是否就緒"""
-        if self.audio_path and self.result_path:
-            self.status_label.config(text="✅ 就緒 - 請選擇說話人並播放")
-            self.play_button.config(state=tk.NORMAL)
-            self.play_all_button.config(state=tk.NORMAL)
-        else:
-            self.status_label.config(text="⚠️ 請選擇音頻和結果文件")
-            self.play_button.config(state=tk.DISABLED)
-            self.play_all_button.config(state=tk.DISABLED)
-
-    def on_speaker_select(self, event):
-        """說話人選擇事件"""
-        selection = self.speaker_listbox.curselection()
-        if not selection:
-            return
-
-        self.current_speaker_idx = selection[0]
-        speaker = self.speakers[self.current_speaker_idx]
-
-        # 更新片段列表
-        self.segment_listbox.delete(0, tk.END)
-        for i, seg in enumerate(self.speaker_segments[speaker], 1):
-            start = seg["start"]
-            end = seg["end"]
-            duration = seg["duration"]
-            self.segment_listbox.insert(
-                tk.END,
-                f"[{i:4d}] {speaker:12} | {start:7.2f}s - {end:7.2f}s ({duration:5.2f}s)",
-            )
-
-        self.status_label.config(
-            text=f"選擇：{speaker} - {len(self.speaker_segments[speaker])} 個片段"
-        )
-
-    def on_segment_double_click(self, event):
-        """片段雙擊事件"""
-        self.play_selected()
-
-    def extract_and_play(self, start_sec: float, end_sec: float) -> bool:
-        """提取並播放音頻"""
-        duration = end_sec - start_sec
-        temp_file = tempfile.NamedTemporaryFile(suffix=".wav", delete=False)
-        temp_path = temp_file.name
-        temp_file.close()
-
-        try:
-            # 提取
-            cmd = [
-                "ffmpeg",
-                "-y",
-                "-loglevel",
-                "quiet",
-                "-i",
-                self.audio_path,
-                "-ss",
-                str(start_sec),
-                "-t",
-                str(duration),
-                "-acodec",
-                "pcm_s16le",
-                "-ar",
-                "16000",
-                "-ac",
-                "1",
-                temp_path,
-            ]
-
-            result = subprocess.run(cmd, capture_output=True)
-            if result.returncode != 0:
-                return False
-
-            # 播放
-            if os.path.exists("/usr/bin/afplay"):
-                subprocess.run(["afplay", temp_path], capture_output=True)
-            elif os.path.exists("/usr/bin/aplay"):
-                subprocess.run(["aplay", temp_path], capture_output=True)
-            else:
-                return False
-
-            return True
-        finally:
-            if os.path.exists(temp_path):
-                os.unlink(temp_path)
-
-    def play_segment(self, speaker: str, seg: dict, seg_idx: int, total: int):
-        """播放單個片段"""
-        if self.stop_flag:
-            return False
-
-        start = seg["start"]
-        end = seg["end"]
-        duration = seg["duration"]
-
-        # 更新 UI
-        self.root.after(
-            0,
-            lambda: self.status_label.config(
-                text=f"▶️  {speaker} [{seg_idx}/{total}] {start:.2f}s - {end:.2f}s"
-            ),
-        )
-
-        # 更新進度
-        progress = (seg_idx / total) * 100
-        self.root.after(0, lambda: self.progress_bar.config(value=progress))
-        self.root.after(
-            0, lambda: self.progress_label.config(text=f"{seg_idx}:{total}")
-        )
-
-        # 播放
-        if self.extract_and_play(start, end):
-            return True
-        else:
-            self.root.after(
-                0,
-                lambda: messagebox.showwarning(
-                    "警告", f"播放失敗：{speaker} [{seg_idx}]"
-                ),
-            )
-            return True
-
-    def play_selected(self):
-        """播放所選片段"""
-        selection = self.segment_listbox.curselection()
-        if not selection:
-            # 如果沒選擇，播放第一個
-            if self.speakers:
-                speaker = self.speakers[self.current_speaker_idx]
-                segs = self.speaker_segments[speaker]
-                if segs:
-                    self.play_all()
-            return
-
-        # 播放所選
-        seg_idx = selection[0]
-        speaker = self.speakers[self.current_speaker_idx]
-        seg = self.speaker_segments[speaker][seg_idx]
-
-        self.is_playing = True
-        self.stop_flag = False
-        self.play_button.config(state=tk.DISABLED)
-        self.stop_button.config(state=tk.NORMAL)
-
-        # 在後台線程播放
-        def play_thread():
-            success = self.play_segment(speaker, seg, seg_idx + 1, 1)
-            self.root.after(0, lambda: self.on_play_done())
-
-        thread = threading.Thread(target=play_thread, daemon=True)
-        thread.start()
-
-    def play_all(self):
-        """播放所選說話人的所有片段"""
-        if not self.speakers:
-            return
-
-        speaker = self.speakers[self.current_speaker_idx]
-        segs = self.speaker_segments[speaker]
-
-        if not segs:
-            return
-
-        self.is_playing = True
-        self.stop_flag = False
-        self.play_button.config(state=tk.DISABLED)
-        self.play_all_button.config(state=tk.DISABLED)
-        self.stop_button.config(state=tk.NORMAL)
-
-        # 在後台線程播放
-        def play_thread():
-            for i, seg in enumerate(segs, 1):
-                if self.stop_flag:
-                    break
-                self.play_segment(speaker, seg, i, len(segs))
-                time.sleep(0.3)  # 片段間隔
-
-            self.root.after(0, lambda: self.on_play_done())
-
-        thread = threading.Thread(target=play_thread, daemon=True)
-        thread.start()
-
-    def stop_playing(self):
-        """停止播放"""
-        self.stop_flag = True
-        self.is_playing = False
-        self.on_play_done()
-
-    def on_play_done(self):
-        """播放完成"""
-        self.is_playing = False
-        self.stop_flag = False
-        self.play_button.config(state=tk.NORMAL)
-        self.play_all_button.config(state=tk.NORMAL)
-        self.stop_button.config(state=tk.DISABLED)
-        self.progress_bar.config(value=0)
-        self.progress_label.config(text="0:00 / 0:00")
-
-        if self.stop_flag:
-            self.status_label.config(text="⏹️ 已停止")
-        else:
-            self.status_label.config(text="✅ 播放完成")
-
-
-def main():
-    """主函數"""
-    if not HAS_TKINTER:
-        print("❌ tkinter 未安裝")
-        print("請使用以下命令安裝:")
-        print("  brew install python-tk@3.9")
-        return
-
-    root = tk.Tk()
-    app = SpeakerPlayerGUI(root)
-    root.mainloop()
-
-
-if __name__ == "__main__":
-    main()
diff --git a/scripts/asrx_self/speaker_player_gui_face.py b/scripts/asrx_self/speaker_player_gui_face.py
deleted file mode 100644
index 22c1f51..0000000
--- a/scripts/asrx_self/speaker_player_gui_face.py
+++ /dev/null
@@ -1,522 +0,0 @@
-#!/opt/homebrew/bin/python3.11
-"""
-Speaker Player GUI - 說話人語音播放器（Face 整合版）
-使用 tkinter 顯示播放進度、Speaker ID 和人臉信息
-"""
-
-import json
-import subprocess
-import tempfile
-import os
-import threading
-import time
-from pathlib import Path
-
-try:
-    import tkinter as tk
-    from tkinter import ttk, filedialog, messagebox
-
-    HAS_TKINTER = True
-except ImportError:
-    HAS_TKINTER = False
-
-
-class SpeakerPlayerGUI:
-    """說話人語音播放器 GUI（Face 整合版）"""
-
-    def __init__(self, root):
-        self.root = root
-        self.root.title("🎬 Speaker Player - Face Integration")
-        self.root.geometry("1200x800")
-
-        # 數據
-        self.audio_path = None
-        self.result_path = None
-        self.face_path = None
-        self.result_data = None
-        self.face_data = None
-        self.integrated_data = None
-        self.speaker_segments = {}
-        self.speakers = []
-        self.current_speaker_idx = 0
-        self.is_playing = False
-        self.stop_flag = False
-
-        # 創建界面
-        self.create_widgets()
-
-    def create_widgets(self):
-        """創建界面組件"""
-        # 頂部：文件選擇
-        top_frame = ttk.Frame(self.root, padding="10")
-        top_frame.pack(fill=tk.X)
-
-        # 第一行：音頻和 ASRX 結果
-        row1_frame = ttk.Frame(top_frame)
-        row1_frame.pack(fill=tk.X)
-
-        ttk.Label(row1_frame, text="📁 Audio:").pack(side=tk.LEFT)
-        self.audio_label = ttk.Label(row1_frame, text="未選擇", width=50)
-        self.audio_label.pack(side=tk.LEFT, padx=5)
-        ttk.Button(row1_frame, text="選擇音頻", command=self.select_audio).pack(
-            side=tk.LEFT, padx=5
-        )
-
-        ttk.Label(row1_frame, text="  📊 ASRX:").pack(side=tk.LEFT, padx=(20, 0))
-        self.result_label = ttk.Label(row1_frame, text="未選擇", width=50)
-        self.result_label.pack(side=tk.LEFT, padx=5)
-        ttk.Button(row1_frame, text="選擇結果", command=self.select_result).pack(
-            side=tk.LEFT, padx=5
-        )
-
-        # 第二行：Face 結果
-        row2_frame = ttk.Frame(top_frame)
-        row2_frame.pack(fill=tk.X, pady=(5, 0))
-
-        ttk.Label(row2_frame, text="👤 Face:").pack(side=tk.LEFT)
-        self.face_label = ttk.Label(row2_frame, text="未選擇 (可選)", width=50)
-        self.face_label.pack(side=tk.LEFT, padx=5)
-        ttk.Button(row2_frame, text="選擇 Face", command=self.select_face).pack(
-            side=tk.LEFT, padx=5
-        )
-        self.integrate_button = ttk.Button(
-            row2_frame,
-            text="🔗 整合 Face",
-            command=self.integrate_face,
-            state=tk.DISABLED,
-        )
-        self.integrate_button.pack(side=tk.LEFT, padx=5)
-
-        # 中間：說話人列表和片段列表
-        mid_frame = ttk.Frame(self.root, padding="10")
-        mid_frame.pack(fill=tk.BOTH, expand=True)
-
-        # 左側：說話人列表（帶 Face 統計）
-        left_frame = ttk.LabelFrame(mid_frame, text="📢 說話人列表", padding="10")
-        left_frame.pack(side=tk.LEFT, fill=tk.BOTH, expand=False)
-
-        self.speaker_listbox = tk.Listbox(
-            left_frame, width=45, height=20, font=("Arial", 11)
-        )
-        self.speaker_listbox.pack(fill=tk.BOTH, expand=True)
-        self.speaker_listbox.bind("<<ListboxSelect>>", self.on_speaker_select)
-
-        # 右側：片段列表（帶 Face 信息）
-        right_frame = ttk.LabelFrame(
-            mid_frame, text="🎵 語音片段 + 👥 人臉", padding="10"
-        )
-        right_frame.pack(side=tk.LEFT, fill=tk.BOTH, expand=True, padx=10)
-
-        # 片段列表（带滚动条）
-        list_frame = ttk.Frame(right_frame)
-        list_frame.pack(fill=tk.BOTH, expand=True)
-
-        scrollbar = ttk.Scrollbar(list_frame)
-        scrollbar.pack(side=tk.RIGHT, fill=tk.Y)
-
-        self.segment_listbox = tk.Listbox(
-            list_frame,
-            width=65,
-            height=20,
-            font=("Courier", 9),
-            yscrollcommand=scrollbar.set,
-        )
-        self.segment_listbox.pack(fill=tk.BOTH, expand=True)
-        scrollbar.config(command=self.segment_listbox.yview)
-
-        self.segment_listbox.bind("<Double-Button-1>", self.on_segment_double_click)
-
-        # 底部：播放控制和進度
-        bottom_frame = ttk.Frame(self.root, padding="10")
-        bottom_frame.pack(fill=tk.X)
-
-        # 播放控制
-        control_frame = ttk.Frame(bottom_frame)
-        control_frame.pack(fill=tk.X)
-
-        self.play_button = ttk.Button(
-            control_frame, text="▶️ 播放所選", command=self.play_selected, width=15
-        )
-        self.play_button.pack(side=tk.LEFT, padx=5)
-        self.play_button.config(state=tk.DISABLED)
-
-        self.stop_button = ttk.Button(
-            control_frame, text="⏹️ 停止", command=self.stop_playing, width=10
-        )
-        self.stop_button.pack(side=tk.LEFT, padx=5)
-        self.stop_button.config(state=tk.DISABLED)
-
-        self.play_all_button = ttk.Button(
-            control_frame, text="▶️▶️ 播放全部", command=self.play_all, width=15
-        )
-        self.play_all_button.pack(side=tk.LEFT, padx=5)
-        self.play_all_button.config(state=tk.DISABLED)
-
-        # 進度條
-        progress_frame = ttk.Frame(bottom_frame)
-        progress_frame.pack(fill=tk.X, pady=(10, 0))
-
-        ttk.Label(progress_frame, text="⏱️ 進度:").pack(side=tk.LEFT)
-        self.progress_bar = ttk.Progressbar(progress_frame, mode="determinate")
-        self.progress_bar.pack(side=tk.LEFT, fill=tk.X, expand=True, padx=10)
-
-        self.progress_label = ttk.Label(progress_frame, text="0:00 / 0:00", width=20)
-        self.progress_label.pack(side=tk.LEFT)
-
-        # 狀態欄
-        self.status_label = ttk.Label(
-            bottom_frame, text="就緒", relief=tk.SUNKEN, anchor=tk.W
-        )
-        self.status_label.pack(fill=tk.X, pady=(10, 0))
-
-    def select_audio(self):
-        """選擇音頻文件"""
-        filename = filedialog.askopenfilename(
-            title="選擇音頻文件",
-            filetypes=[("WAV files", "*.wav"), ("All files", "*.*")],
-        )
-        if filename:
-            self.audio_path = filename
-            self.audio_label.config(text=Path(filename).name)
-            self.check_ready()
-
-    def select_result(self):
-        """選擇 ASRX 結果文件"""
-        filename = filedialog.askopenfilename(
-            title="選擇 ASRX 結果文件",
-            filetypes=[("JSON files", "*.json"), ("All files", "*.*")],
-        )
-        if filename:
-            self.result_path = filename
-            self.result_label.config(text=Path(filename).name)
-            self.load_result()
-            self.check_ready()
-
-    def select_face(self):
-        """選擇 Face 結果文件"""
-        filename = filedialog.askopenfilename(
-            title="選擇 Face 檢測結果",
-            filetypes=[("JSON files", "*.json"), ("All files", "*.*")],
-        )
-        if filename:
-            self.face_path = filename
-            self.face_label.config(text=Path(filename).name)
-            self.integrate_button.config(state=tk.NORMAL)
-            self.status_label.config(text="✅ Face 已選擇 - 請點擊整合")
-
-    def integrate_face(self):
-        """整合 Face 與 ASRX"""
-        if not self.face_path or not self.result_path:
-            messagebox.showwarning("警告", "請先選擇 Face 和 ASRX 文件")
-            return
-
-        self.status_label.config(text="🔄 整合中...")
-        self.root.update()
-
-        try:
-            # 載入 Face 數據
-            with open(self.face_path, "r", encoding="utf-8") as f:
-                self.face_data = json.load(f)
-
-            # 重新載入 ASRX 數據並整合
-            self.load_result(integrate_with_face=True)
-
-            self.status_label.config(text="✅ Face 整合完成")
-            self.integrate_button.config(state=tk.DISABLED)
-
-        except Exception as e:
-            messagebox.showerror("錯誤", f"整合失敗：{e}")
-            self.status_label.config(text="❌ 整合失敗")
-
-    def load_result(self, integrate_with_face=False):
-        """載入 ASRX 結果"""
-        try:
-            with open(self.result_path, "r", encoding="utf-8") as f:
-                self.result_data = json.load(f)
-
-            # 分組
-            self.speaker_segments = {}
-            for seg in self.result_data.get("segments", []):
-                speaker = seg["speaker"]
-                if speaker not in self.speaker_segments:
-                    self.speaker_segments[speaker] = []
-                self.speaker_segments[speaker].append(seg)
-
-            # 排序
-            for speaker in self.speaker_segments:
-                self.speaker_segments[speaker].sort(key=lambda x: x["start"])
-
-            # 說話人列表（按時長排序）
-            self.speakers = sorted(
-                self.speaker_segments.keys(),
-                key=lambda s: sum(seg["duration"] for seg in self.speaker_segments[s]),
-                reverse=True,
-            )
-
-            # 更新列表框
-            self.speaker_listbox.delete(0, tk.END)
-            for speaker in self.speakers:
-                segs = self.speaker_segments[speaker]
-                total_dur = sum(seg["duration"] for seg in segs)
-                total_dur_min = total_dur / 60
-
-                # 如果有 Face 數據，計算有人臉的片段數
-                face_info = ""
-                if integrate_with_face and self.integrated_data:
-                    speaker_integrated = [
-                        item
-                        for item in self.integrated_data
-                        if item["speaker"] == speaker
-                    ]
-                    with_face = sum(
-                        1 for item in speaker_integrated if item.get("has_face", False)
-                    )
-                    face_info = f" | 👥 {with_face}/{len(segs)}"
-
-                self.speaker_listbox.insert(
-                    tk.END,
-                    f"🔊 {speaker:12} | {len(segs):4d}段 | {total_dur_min:5.1f}分鐘{face_info}",
-                )
-
-            total_segments = len(self.result_data.get("segments", []))
-            self.status_label.config(
-                text=f"載入成功：{len(self.speakers)} 個說話人，{total_segments} 個片段"
-            )
-
-        except Exception as e:
-            messagebox.showerror("錯誤", f"載入結果文件失敗：{e}")
-            self.result_path = None
-            self.result_label.config(text="載入失敗")
-
-    def check_ready(self):
-        """檢查是否就緒"""
-        if self.audio_path and self.result_path:
-            self.status_label.config(text="✅ 就緒 - 請選擇說話人並播放")
-            self.play_button.config(state=tk.NORMAL)
-            self.play_all_button.config(state=tk.NORMAL)
-        else:
-            self.status_label.config(text="⚠️ 請選擇音頻和結果文件")
-            self.play_button.config(state=tk.DISABLED)
-            self.play_all_button.config(state=tk.DISABLED)
-
-    def on_speaker_select(self, event):
-        """說話人選擇事件"""
-        selection = self.speaker_listbox.curselection()
-        if not selection:
-            return
-
-        self.current_speaker_idx = selection[0]
-        speaker = self.speakers[self.current_speaker_idx]
-
-        # 更新片段列表
-        self.segment_listbox.delete(0, tk.END)
-        for i, seg in enumerate(self.speaker_segments[speaker], 1):
-            start = seg["start"]
-            end = seg["end"]
-            duration = seg["duration"]
-
-            # 如果有整合 Face 數據
-            face_info = ""
-            if self.integrated_data:
-                matching = [
-                    item
-                    for item in self.integrated_data
-                    if abs(item["start"] - start) < 0.1 and item["speaker"] == speaker
-                ]
-                if matching and matching[0].get("has_face", False):
-                    face_info = " 👥✅"
-                elif matching:
-                    face_info = " 👥❌"
-
-            self.segment_listbox.insert(
-                tk.END,
-                f"[{i:4d}] {speaker:12} | {start:7.2f}s - {end:7.2f}s ({duration:5.2f}s){face_info}",
-            )
-
-        self.status_label.config(
-            text=f"選擇：{speaker} - {len(self.speaker_segments[speaker])} 個片段"
-        )
-
-    def on_segment_double_click(self, event):
-        """片段雙擊事件"""
-        self.play_selected()
-
-    def extract_and_play(self, start_sec: float, end_sec: float) -> bool:
-        """提取並播放音頻"""
-        duration = end_sec - start_sec
-        temp_file = tempfile.NamedTemporaryFile(suffix=".wav", delete=False)
-        temp_path = temp_file.name
-        temp_file.close()
-
-        try:
-            # 提取
-            cmd = [
-                "ffmpeg",
-                "-y",
-                "-loglevel",
-                "quiet",
-                "-i",
-                self.audio_path,
-                "-ss",
-                str(start_sec),
-                "-t",
-                str(duration),
-                "-acodec",
-                "pcm_s16le",
-                "-ar",
-                "16000",
-                "-ac",
-                "1",
-                temp_path,
-            ]
-
-            result = subprocess.run(cmd, capture_output=True)
-            if result.returncode != 0:
-                return False
-
-            # 播放
-            if os.path.exists("/usr/bin/afplay"):
-                subprocess.run(["afplay", temp_path], capture_output=True)
-            elif os.path.exists("/usr/bin/aplay"):
-                subprocess.run(["aplay", temp_path], capture_output=True)
-            else:
-                return False
-
-            return True
-        finally:
-            if os.path.exists(temp_path):
-                os.unlink(temp_path)
-
-    def play_segment(self, speaker: str, seg: dict, seg_idx: int, total: int):
-        """播放單個片段"""
-        if self.stop_flag:
-            return False
-
-        start = seg["start"]
-        end = seg["end"]
-        duration = seg["duration"]
-
-        # 更新 UI
-        self.root.after(
-            0,
-            lambda: self.status_label.config(
-                text=f"▶️  {speaker} [{seg_idx}/{total}] {start:.2f}s - {end:.2f}s"
-            ),
-        )
-
-        # 更新進度
-        progress = (seg_idx / total) * 100
-        self.root.after(0, lambda: self.progress_bar.config(value=progress))
-        self.root.after(
-            0, lambda: self.progress_label.config(text=f"{seg_idx}:{total}")
-        )
-
-        # 播放
-        if self.extract_and_play(start, end):
-            return True
-        else:
-            self.root.after(
-                0,
-                lambda: messagebox.showwarning(
-                    "警告", f"播放失敗：{speaker} [{seg_idx}]"
-                ),
-            )
-            return True
-
-    def play_selected(self):
-        """播放所選片段"""
-        selection = self.segment_listbox.curselection()
-        if not selection:
-            # 如果沒選擇，播放第一個
-            if self.speakers:
-                speaker = self.speakers[self.current_speaker_idx]
-                segs = self.speaker_segments[speaker]
-                if segs:
-                    self.play_all()
-            return
-
-        # 播放所選
-        seg_idx = selection[0]
-        speaker = self.speakers[self.current_speaker_idx]
-        seg = self.speaker_segments[speaker][seg_idx]
-
-        self.is_playing = True
-        self.stop_flag = False
-        self.play_button.config(state=tk.DISABLED)
-        self.stop_button.config(state=tk.NORMAL)
-
-        # 在後台線程播放
-        def play_thread():
-            success = self.play_segment(speaker, seg, seg_idx + 1, 1)
-            self.root.after(0, lambda: self.on_play_done())
-
-        thread = threading.Thread(target=play_thread, daemon=True)
-        thread.start()
-
-    def play_all(self):
-        """播放所選說話人的所有片段"""
-        if not self.speakers:
-            return
-
-        speaker = self.speakers[self.current_speaker_idx]
-        segs = self.speaker_segments[speaker]
-
-        if not segs:
-            return
-
-        self.is_playing = True
-        self.stop_flag = False
-        self.play_button.config(state=tk.DISABLED)
-        self.play_all_button.config(state=tk.DISABLED)
-        self.stop_button.config(state=tk.NORMAL)
-
-        # 在後台線程播放
-        def play_thread():
-            for i, seg in enumerate(segs, 1):
-                if self.stop_flag:
-                    break
-                self.play_segment(speaker, seg, i, len(segs))
-                time.sleep(0.3)  # 片段間隔
-
-            self.root.after(0, lambda: self.on_play_done())
-
-        thread = threading.Thread(target=play_thread, daemon=True)
-        thread.start()
-
-    def stop_playing(self):
-        """停止播放"""
-        self.stop_flag = True
-        self.is_playing = False
-        self.on_play_done()
-
-    def on_play_done(self):
-        """播放完成"""
-        self.is_playing = False
-        self.stop_flag = False
-        self.play_button.config(state=tk.NORMAL)
-        self.play_all_button.config(state=tk.NORMAL)
-        self.stop_button.config(state=tk.DISABLED)
-        self.progress_bar.config(value=0)
-        self.progress_label.config(text="0:00 / 0:00")
-
-        if self.stop_flag:
-            self.status_label.config(text="⏹️ 已停止")
-        else:
-            self.status_label.config(text="✅ 播放完成")
-
-
-def main():
-    """主函數"""
-    if not HAS_TKINTER:
-        print("❌ tkinter 未安裝")
-        print("請使用以下命令安裝:")
-        print("  brew install python-tk@3.9")
-        return
-
-    root = tk.Tk()
-    app = SpeakerPlayerGUI(root)
-    root.mainloop()
-
-
-if __name__ == "__main__":
-    main()
diff --git a/scripts/asrx_self/speaker_player_interactive.py b/scripts/asrx_self/speaker_player_interactive.py
deleted file mode 100644
index e844c89..0000000
--- a/scripts/asrx_self/speaker_player_interactive.py
+++ /dev/null
@@ -1,267 +0,0 @@
-#!/opt/homebrew/bin/python3.11
-"""
-Interactive Speaker Audio Player - 交互式說話人語音播放器
-可以選擇播放哪個說話人的哪些片段
-"""
-
-import json
-import subprocess
-import tempfile
-import os
-from pathlib import Path
-from typing import List, Dict
-
-
-def load_asrx_result(result_path: str) -> Dict:
-    """載入 ASRX 結果"""
-    with open(result_path, "r", encoding="utf-8") as f:
-        return json.load(f)
-
-
-def extract_and_play(audio_path: str, start_sec: float, end_sec: float) -> bool:
-    """提取並播放音頻片段"""
-    duration = end_sec - start_sec
-    temp_file = tempfile.NamedTemporaryFile(suffix=".wav", delete=False)
-    temp_path = temp_file.name
-    temp_file.close()
-
-    try:
-        # 提取
-        cmd = [
-            "ffmpeg",
-            "-y",
-            "-loglevel",
-            "quiet",
-            "-i",
-            audio_path,
-            "-ss",
-            str(start_sec),
-            "-t",
-            str(duration),
-            "-acodec",
-            "pcm_s16le",
-            "-ar",
-            "16000",
-            "-ac",
-            "1",
-            temp_path,
-        ]
-
-        result = subprocess.run(cmd, capture_output=True)
-        if result.returncode != 0:
-            return False
-
-        # 播放
-        if os.path.exists("/usr/bin/afplay"):
-            subprocess.run(["afplay", temp_path], capture_output=True)
-        elif os.path.exists("/usr/bin/aplay"):
-            subprocess.run(["aplay", temp_path], capture_output=True)
-        else:
-            print("  ⚠️  No audio player found")
-            return False
-
-        return True
-    finally:
-        if os.path.exists(temp_path):
-            os.unlink(temp_path)
-
-
-def show_menu(speaker_segments: Dict[str, List[Dict]], speaker_id: str):
-    """顯示選單"""
-    segs = speaker_segments[speaker_id]
-    total_duration = sum(seg["duration"] for seg in segs)
-
-    print(f"\n{'=' * 70}")
-    print(f"🔊 {speaker_id}")
-    print(f"{'=' * 70}")
-    print(f"  Segments: {len(segs)}")
-    print(
-        f"  Total duration: {total_duration / 60:.1f} minutes ({total_duration:.1f}s)"
-    )
-    print(f"{'=' * 70}")
-
-    # 顯示前 20 個片段
-    for i, seg in enumerate(segs[:20], 1):
-        start = seg["start"]
-        end = seg["end"]
-        duration = seg["duration"]
-        print(
-            f"  [{i:3d}] {speaker_id:12} | {start:7.2f}s - {end:7.2f}s  ({duration:5.2f}s)"
-        )
-
-    if len(segs) > 20:
-        print(f"  ... and {len(segs) - 20} more segments")
-
-    print(f"\n{'=' * 70}")
-    print("Commands:")
-    print(f"  [1-{min(20, len(segs))}]  Play specific segment")
-    print("  all      Play all segments (may take a while)")
-    print("  first N  Play first N segments")
-    print("  next     Next speaker")
-    print("  prev     Previous speaker")
-    print("  list     List all speakers")
-    print("  quit     Exit")
-    print(f"{'=' * 70}")
-
-
-def interactive_player(audio_path: str, result_path: str):
-    """交互式播放器"""
-    # 載入結果
-    result = load_asrx_result(result_path)
-    segments = result.get("segments", [])
-    total_duration = result.get("total_duration", 0)
-
-    # 分組
-    speaker_segments = {}
-    for seg in segments:
-        speaker = seg["speaker"]
-        if speaker not in speaker_segments:
-            speaker_segments[speaker] = []
-        speaker_segments[speaker].append(seg)
-
-    # 排序
-    for speaker in speaker_segments:
-        speaker_segments[speaker].sort(key=lambda x: x["start"])
-
-    # 說話人列表
-    speakers = sorted(
-        speaker_segments.keys(),
-        key=lambda s: sum(seg["duration"] for seg in speaker_segments[s]),
-        reverse=True,
-    )
-
-    current_speaker_idx = 0
-
-    print("\n🎬 Speaker Audio Player")
-    print(f"📁 Audio: {audio_path}")
-    print(f"📊 Speakers: {len(speakers)}")
-    print(f"{'=' * 70}")
-
-    while True:
-        current_speaker = speakers[current_speaker_idx]
-        show_menu(speaker_segments, current_speaker)
-
-        try:
-            cmd = input(f"\n▶️  {current_speaker} > ").strip().lower()
-        except (EOFError, KeyboardInterrupt):
-            print("\n\nExiting...")
-            break
-
-        if not cmd:
-            continue
-
-        # 播放特定片段
-        if cmd.isdigit():
-            idx = int(cmd) - 1
-            if 0 <= idx < len(speaker_segments[current_speaker]):
-                seg = speaker_segments[current_speaker][idx]
-                print(f"\n  🔊 {current_speaker} - Segment {idx + 1}")
-                print(
-                    f"  ⏱️  {seg['start']:.2f}s - {seg['end']:.2f}s ({seg['duration']:.2f}s)"
-                )
-                print("  ▶️  Playing...", end="", flush=True)
-                if extract_and_play(audio_path, seg["start"], seg["end"]):
-                    print(" ✅ Done")
-                else:
-                    print(" ❌ Failed")
-            else:
-                print(
-                    f"  Invalid segment number (1-{len(speaker_segments[current_speaker])})"
-                )
-
-        # 播放所有
-        elif cmd == "all":
-            print(
-                f"\n  🔊 {current_speaker} - Playing all {len(speaker_segments[current_speaker])} segments..."
-            )
-            print("=" * 70)
-            for i, seg in enumerate(speaker_segments[current_speaker], 1):
-                print(
-                    f"  [{i:3d}/{len(speaker_segments[current_speaker])}] {current_speaker} | "
-                    + f"{seg['start']:7.2f}s - {seg['end']:7.2f}s ({seg['duration']:5.2f}s)",
-                    end="",
-                    flush=True,
-                )
-                if extract_and_play(audio_path, seg["start"], seg["end"]):
-                    print(" ✅")
-                else:
-                    print(" ❌")
-            print("=" * 70)
-
-        # 播放前 N 個
-        elif cmd.startswith("first "):
-            try:
-                n = int(cmd.split()[1])
-                print(f"\n  🔊 {current_speaker} - Playing first {n} segments...")
-                print("=" * 70)
-                for i, seg in enumerate(speaker_segments[current_speaker][:n], 1):
-                    print(
-                        f"  [{i:3d}/{n}] {current_speaker} | "
-                        + f"{seg['start']:7.2f}s - {seg['end']:7.2f}s ({seg['duration']:5.2f}s)",
-                        end="",
-                        flush=True,
-                    )
-                    if extract_and_play(audio_path, seg["start"], seg["end"]):
-                        print(" ✅")
-                    else:
-                        print(" ❌")
-                print("=" * 70)
-            except (IndexError, ValueError):
-                print("  Usage: first N")
-
-        # 下一個說話人
-        elif cmd == "next":
-            current_speaker_idx = (current_speaker_idx + 1) % len(speakers)
-
-        # 上一個說話人
-        elif cmd == "prev":
-            current_speaker_idx = (current_speaker_idx - 1) % len(speakers)
-
-        # 列出所有說話人
-        elif cmd == "list":
-            print(f"\n{'=' * 70}")
-            print("📢 All speakers:")
-            print(f"{'=' * 70}")
-            for i, speaker in enumerate(speakers, 1):
-                segs = speaker_segments[speaker]
-                total_dur = sum(seg["duration"] for seg in segs)
-                pct = total_dur / total_duration * 100 if total_duration > 0 else 0
-                print(
-                    f"  {i:2d}. 🔊 {speaker:12} | {len(segs):4d} segments, "
-                    + f"{total_dur:7.1f}s ({pct:5.1f}%)"
-                )
-            print(f"{'=' * 70}")
-            print(f"  Current: 🔊 {speakers[current_speaker_idx]}")
-            print(f"{'=' * 70}")
-
-        # 退出
-        elif cmd == "quit" or cmd == "exit" or cmd == "q":
-            print("\nExiting...")
-            break
-
-        else:
-            print(f"  Unknown command: {cmd}")
-
-
-def main():
-    import argparse
-
-    parser = argparse.ArgumentParser(description="Interactive Speaker Audio Player")
-    parser.add_argument("audio_path", help="原始音頻文件路徑")
-    parser.add_argument("result_path", help="ASRX 結果 JSON 路徑")
-
-    args = parser.parse_args()
-
-    if not Path(args.audio_path).exists():
-        print(f"Error: Audio file not found: {args.audio_path}")
-        return
-
-    if not Path(args.result_path).exists():
-        print(f"Error: Result file not found: {args.result_path}")
-        return
-
-    interactive_player(args.audio_path, args.result_path)
-
-
-if __name__ == "__main__":
-    main()
diff --git a/scripts/asrx_self/test_gui_face_player.py b/scripts/asrx_self/test_gui_face_player.py
deleted file mode 100755
index 08dd112..0000000
--- a/scripts/asrx_self/test_gui_face_player.py
+++ /dev/null
@@ -1,164 +0,0 @@
-#!/opt/homebrew/bin/python3.11
-"""
-GUI Face Player 自動化測試腳本
-測試所有功能並生成測試報告
-"""
-
-import json
-import subprocess
-from pathlib import Path
-
-
-def check_file_exists(path, description):
-    """檢查文件是否存在"""
-    exists = Path(path).exists()
-    status = "✅" if exists else "❌"
-    size = Path(path).stat().st_size / 1024 / 1024 if exists else 0
-    print(f"{status} {description}: {path} ({size:.1f} MB)")
-    return exists
-
-
-def check_process_running(pattern):
-    """檢查進程是否運行"""
-    result = subprocess.run(['pgrep', '-f', pattern], capture_output=True, text=True)
-    running = result.returncode == 0
-    status = "✅" if running else "❌"
-    print(f"{status} 進程：{pattern} ({'運行中' if running else '未運行'})")
-    return running
-
-
-def test_json_structure(path, required_keys, description):
-    """測試 JSON 文件結構"""
-    try:
-        with open(path, 'r', encoding='utf-8') as f:
-            data = json.load(f)
-        
-        missing_keys = [key for key in required_keys if key not in data]
-        if missing_keys:
-            print(f"❌ {description}: 缺少鍵 {missing_keys}")
-            return False
-        else:
-            print(f"✅ {description}: 結構正確")
-            return True
-    except Exception as e:
-        print(f"❌ {description}: {e}")
-        return False
-
-
-def test_integration_script():
-    """測試整合腳本"""
-    print("\n" + "="*70)
-    print("測試整合腳本")
-    print("="*70)
-    
-    cmd = [
-        'python3',
-        'integrate_face_asrx_speaker.py',
-        '/tmp/face_long.json',
-        '/tmp/asrx_charade_optimized.json',
-        '--threshold', '3.0',
-        '--stats'
-    ]
-    
-    result = subprocess.run(cmd, capture_output=True, text=True, timeout=120)
-    
-    # 檢查輸出
-    if '99.8%' in result.stdout:
-        print("✅ 整合腳本：匹配率正確 (99.8%)")
-        return True
-    else:
-        print("❌ 整合腳本：匹配率異常")
-        print(result.stdout)
-        return False
-
-
-def test_gui_startup():
-    """測試 GUI 啟動"""
-    print("\n" + "="*70)
-    print("測試 GUI 啟動")
-    print("="*70)
-    
-    # 檢查進程
-    running = check_process_running('speaker_player_gui_face')
-    
-    if running:
-        print("✅ GUI 進程：正常運行")
-        return True
-    else:
-        print("❌ GUI 進程：未運行")
-        return False
-
-
-def main():
-    """主測試函數"""
-    print("="*70)
-    print("GUI Face Player 自動化測試")
-    print("="*70)
-    
-    # 測試文件
-    print("\n" + "="*70)
-    print("測試文件")
-    print("="*70)
-    
-    files_ok = True
-    files_ok &= check_file_exists('/tmp/charade_audio.wav', '音頻文件')
-    files_ok &= check_file_exists('/tmp/asrx_charade_optimized.json', 'ASRX 結果')
-    files_ok &= check_file_exists('/tmp/face_long.json', 'Face 結果')
-    files_ok &= check_file_exists('/tmp/charade_integrated.json', '整合結果')
-    
-    # 測試 JSON 結構
-    print("\n" + "="*70)
-    print("測試 JSON 結構")
-    print("="*70)
-    
-    json_ok = True
-    json_ok &= test_json_structure(
-        '/tmp/asrx_charade_optimized.json',
-        ['segments', 'n_speakers'],
-        'ASRX 結果'
-    )
-    json_ok &= test_json_structure(
-        '/tmp/face_long.json',
-        ['frames', 'frame_count'],
-        'Face 結果'
-    )
-    json_ok &= test_json_structure(
-        '/tmp/charade_integrated.json',
-        ['integrated_segments', 'speaker_stats'],
-        '整合結果'
-    )
-    
-    # 測試整合腳本
-    integration_ok = test_integration_script()
-    
-    # 測試 GUI
-    gui_ok = test_gui_startup()
-    
-    # 總結
-    print("\n" + "="*70)
-    print("測試總結")
-    print("="*70)
-    
-    all_ok = files_ok and json_ok and integration_ok and gui_ok
-    
-    if all_ok:
-        print("✅ 所有測試通過！")
-    else:
-        print("❌ 部分測試失敗")
-        if not files_ok:
-            print("  - 文件測試失敗")
-        if not json_ok:
-            print("  - JSON 結構測試失敗")
-        if not integration_ok:
-            print("  - 整合腳本測試失敗")
-        if not gui_ok:
-            print("  - GUI 啟動測試失敗")
-    
-    print("\n" + "="*70)
-    
-    return all_ok
-
-
-if __name__ == "__main__":
-    success = main()
-    exit(0 if success else 1)
diff --git a/scripts/asrx_self/test_long_movie.py b/scripts/asrx_self/test_long_movie.py
deleted file mode 100755
index 1b5ee60..0000000
--- a/scripts/asrx_self/test_long_movie.py
+++ /dev/null
@@ -1,240 +0,0 @@
-#!/opt/homebrew/bin/python3.11
-"""
-長影片（Charade 1963，114 分鐘）完整測試腳本
-"""
-
-import json
-import subprocess
-from pathlib import Path
-from datetime import datetime
-
-
-def print_header(title):
-    """打印標題"""
-    print("\n" + "="*70)
-    print(f" {title}")
-    print("="*70)
-
-
-def test_data_files():
-    """測試數據文件"""
-    print_header("1. 數據文件測試")
-    
-    files = {
-        '音頻文件': '/tmp/charade_audio.wav',
-        'ASRX 結果': '/tmp/asrx_charade_optimized.json',
-        'Face 結果': '/tmp/face_long.json',
-        '整合結果': '/tmp/charade_integrated.json'
-    }
-    
-    all_ok = True
-    for name, path in files.items():
-        exists = Path(path).exists()
-        size = Path(path).stat().st_size / 1024 / 1024 if exists else 0
-        status = "✅" if exists else "❌"
-        print(f"{status} {name}: {size:.1f} MB")
-        all_ok = all_ok and exists
-    
-    return all_ok
-
-
-def test_asrx_results():
-    """測試 ASRX 結果"""
-    print_header("2. ASRX 結果測試")
-    
-    with open('/tmp/asrx_charade_optimized.json', 'r', encoding='utf-8') as f:
-        data = json.load(f)
-    
-    total_duration = data.get('total_duration', 0)
-    n_speakers = data.get('n_speakers', 0)
-    n_segments = data.get('n_speech_segments', 0)
-    
-    print(f"📊 影片時長：{total_duration/60:.1f} 分鐘 ({total_duration:.1f}秒)")
-    print(f" 說話人數量：{n_speakers}")
-    print(f"📊 語音片段：{n_segments}")
-    
-    # 說話人統計
-    print("\n📢 說話人分佈:")
-    speaker_stats = data.get('speaker_stats', {})
-    for speaker, stats in sorted(speaker_stats.items(), key=lambda x: x[1]['duration'], reverse=True):
-        duration = stats.get('duration', 0)
-        count = stats.get('count', 0)
-        pct = duration / total_duration * 100 if total_duration > 0 else 0
-        print(f"   {speaker}: {count} 片段，{duration/60:.1f}分鐘 ({pct:.1f}%)")
-    
-    return n_speakers >= 2 and n_segments > 100
-
-
-def test_face_results():
-    """測試 Face 結果"""
-    print_header("3. Face 結果測試")
-    
-    with open('/tmp/face_long.json', 'r', encoding='utf-8') as f:
-        data = json.load(f)
-    
-    total_frames = data.get('frame_count', 0)
-    detected_frames = data.get('frames', [])
-    fps = data.get('fps', 0)
-    
-    print(f"📊 總數：{total_frames:,}")
-    print(f"📊 檢測到人臉：{len(detected_frames):,}")
-    print(f"📊 FPS: {fps:.2f}")
-    print(f"📊 檢測率：{len(detected_frames)/total_frames*100:.2f}%")
-    
-    return len(detected_frames) > 0
-
-
-def test_integration():
-    """測試整合結果"""
-    print_header("4. Face + ASRX 整合測試")
-    
-    with open('/tmp/charade_integrated.json', 'r', encoding='utf-8') as f:
-        data = json.load(f)
-    
-    segments = data.get('integrated_segments', [])
-    total = len(segments)
-    with_face = sum(1 for seg in segments if seg.get('has_face', False))
-    match_rate = with_face / total * 100 if total > 0 else 0
-    
-    print(f"📊 總片段：{total}")
-    print(f"📊 有人臉：{with_face}")
-    print(f"📊 匹配率：{match_rate:.2f}%")
-    
-    # 說話人匹配統計
-    print("\n📢 說話人匹配詳情:")
-    speaker_stats = data.get('speaker_stats', {})
-    for speaker, stats in sorted(speaker_stats.items()):
-        total_seg = stats.get('total_segments', 0)
-        with_face_seg = stats.get('with_face', 0)
-        rate = with_face_seg / total_seg * 100 if total_seg > 0 else 0
-        status = "✅" if rate >= 99 else "⚠️" if rate >= 50 else "❌"
-        print(f"   {status} {speaker}: {with_face_seg}/{total_seg} ({rate:.1f}%)")
-    
-    return match_rate >= 95
-
-
-def test_gui_process():
-    """測試 GUI 進程"""
-    print_header("5. GUI 進程測試")
-    
-    result = subprocess.run(['pgrep', '-f', 'speaker_player_gui_face'], 
-                          capture_output=True, text=True)
-    running = result.returncode == 0
-    
-    if running:
-        pid = result.stdout.strip()
-        print(f"✅ GUI 進程運行中 (PID: {pid})")
-        
-        # 檢查進程資源使用
-        ps_result = subprocess.run(['ps', 'aux'], capture_output=True, text=True)
-        for line in ps_result.stdout.split('\n'):
-            if 'speaker_player_gui_face' in line and 'grep' not in line:
-                parts = line.split()
-                if len(parts) >= 8:
-                    cpu = parts[2]
-                    mem = parts[3]
-                    print(f"   CPU: {cpu}%, 記憶體：{mem}%")
-    else:
-        print("❌ GUI 進程未運行")
-    
-    return running
-
-
-def test_playback():
-    """測試播放功能（模擬）"""
-    print_header("6. 播放功能測試")
-    
-    # 測試 ffmpeg 是否可用
-    result = subprocess.run(['which', 'ffmpeg'], capture_output=True, text=True)
-    ffmpeg_ok = result.returncode == 0
-    print(f"{'✅' if ffmpeg_ok else '❌'} ffmpeg: {'可用' if ffmpeg_ok else '不可用'}")
-    
-    # 測試 afplay 是否可用
-    result = subprocess.run(['which', 'afplay'], capture_output=True, text=True)
-    afplay_ok = result.returncode == 0
-    print(f"{'✅' if afplay_ok else '❌'} afplay: {'可用' if afplay_ok else '不可用'}")
-    
-    # 測試音頻提取（第一個片段）
-    with open('/tmp/asrx_charade_optimized.json', 'r', encoding='utf-8') as f:
-        asrx_data = json.load(f)
-    
-    first_seg = asrx_data['segments'][0]
-    start = first_seg['start']
-    end = first_seg['end']
-    duration = end - start
-    
-    print("\n🎵 測試提取第一個片段:")
-    print(f"   時間：{start:.2f}s - {end:.2f}s ({duration:.2f}s)")
-    
-    # 實際提取測試
-    temp_file = '/tmp/test_segment.wav'
-    cmd = [
-        'ffmpeg', '-y', '-loglevel', 'quiet',
-        '-i', '/tmp/charade_audio.wav',
-        '-ss', str(start),
-        '-t', str(duration),
-        temp_file
-    ]
-    
-    result = subprocess.run(cmd, capture_output=True)
-    extract_ok = result.returncode == 0 and Path(temp_file).exists()
-    
-    print(f"{'✅' if extract_ok else '❌'} 音頻提取: {'成功' if extract_ok else '失敗'}")
-    
-    if extract_ok:
-        size = Path(temp_file).stat().st_size / 1024
-        print(f"   文件大小：{size:.1f} KB")
-        Path(temp_file).unlink()  # 清理
-    
-    return ffmpeg_ok and afplay_ok and extract_ok
-
-
-def generate_report():
-    """生成測試報告"""
-    print_header("測試報告")
-    
-    tests = [
-        ("數據文件", test_data_files()),
-        ("ASRX 結果", test_asrx_results()),
-        ("Face 結果", test_face_results()),
-        ("整合結果", test_integration()),
-        ("GUI 進程", test_gui_process()),
-        ("播放功能", test_playback())
-    ]
-    
-    passed = sum(1 for _, result in tests if result)
-    total = len(tests)
-    
-    print("\n" + "="*70)
-    print(f" 測試總結：{passed}/{total} 通過")
-    print("="*70)
-    
-    for name, result in tests:
-        status = "✅" if result else "❌"
-        print(f"{status} {name}")
-    
-    if passed == total:
-        print("\n🎉 所有測試通過！")
-    else:
-        print(f"\n⚠️ {total - passed} 個測試失敗")
-    
-    # 保存報告
-    report_path = '/tmp/long_movie_test_report.md'
-    with open(report_path, 'w', encoding='utf-8') as f:
-        f.write("# 長影片測試報告\n\n")
-        f.write(f"**測試時間**: {datetime.now().isoformat()}\n")
-        f.write("**測試影片**: Charade 1963 (114.7 分鐘)\n\n")
-        f.write("## 結果\n\n")
-        f.write(f"**通過**: {passed}/{total}\n\n")
-        for name, result in tests:
-            status = "✅" if result else "❌"
-            f.write(f"- {status} {name}\n")
-    
-    print(f"\n📄 報告已保存：{report_path}")
-    
-    return passed == total
-
-
-if __name__ == "__main__":
-    success = generate_report()
-    exit(0 if success else 1)
diff --git a/scripts/asrx_self/vad.py b/scripts/asrx_self/vad.py
index b900709..4527c73 100644
--- a/scripts/asrx_self/vad.py
+++ b/scripts/asrx_self/vad.py
@@ -126,6 +126,52 @@ def extract_speech_audio(audio_path, model, utils, output_dir=None):
     return speech_audios, speech_segments
 
 
+def scan_within_segment(wav, sample_rate, start_sec, end_sec, model, utils,
+                        min_speech_duration_ms=500, min_silence_duration_ms=300):
+    """
+    在一個時間範圍內執行 VAD 掃描，切出子片段。
+
+    用途: whisper 給出的粗略時間段內，利用句間停頓細切。
+
+    Args:
+        wav: 完整音頻波形 (numpy array)
+        sample_rate: 採樣率
+        start_sec: 掃描起始時間 (秒)
+        end_sec: 掃描結束時間 (秒)
+        model: VAD 模型
+        utils: VAD 工具函數
+        min_speech_duration_ms: 最小語音持續時間
+        min_silence_duration_ms: 最小靜音持續時間
+
+    Returns:
+        sub_segments: [(start_sec, end_sec), ...] 子片段列表 (原始時間軸)
+    """
+    get_speech_timestamps, _, _, _, _ = utils
+
+    # 提取該時間範圍內的音頻
+    start_sample = int(start_sec * sample_rate)
+    end_sample = int(end_sec * sample_rate)
+    segment_wav = wav[start_sample:end_sample]
+
+    # 在子音頻上執行 VAD
+    speech_ts = get_speech_timestamps(
+        segment_wav,
+        model,
+        sampling_rate=sample_rate,
+        min_speech_duration_ms=min_speech_duration_ms,
+        min_silence_duration_ms=min_silence_duration_ms,
+        return_seconds=True,
+    )
+
+    # 轉換回原始時間軸
+    sub_segments = [
+        (ts["start"] + start_sec, ts["end"] + start_sec)
+        for ts in speech_ts
+    ]
+
+    return sub_segments
+
+
 if __name__ == "__main__":
     # 測試 VAD
     import sys
diff --git a/scripts/asrx_self/whisper_local.py b/scripts/asrx_self/whisper_local.py
new file mode 100644
index 0000000..7029731
--- /dev/null
+++ b/scripts/asrx_self/whisper_local.py
@@ -0,0 +1,35 @@
+"""
+Whisper Local - uses faster-whisper for per-segment transcription
+"""
+
+import numpy as np
+
+
+def load_model(size="small"):
+    from faster_whisper import WhisperModel
+    return WhisperModel(size, device="cpu", compute_type="int8")
+
+
+def transcribe_segment(wav, sample_rate, start_sec, end_sec, model):
+    start_sample = int(start_sec * sample_rate)
+    end_sample = int(end_sec * sample_rate)
+    if start_sample >= len(wav):
+        return {"text": "", "language": "", "lang_prob": 0.0, "segments": []}
+    segment_wav = wav[start_sample:min(end_sample, len(wav))]
+
+    segments_generator, info = model.transcribe(segment_wav, language=None)
+
+    text = ""
+    lang_prob = info.language_probability if info else 0.0
+    language = info.language if info else ""
+
+    segs = list(segments_generator)
+    for seg in segs:
+        text += seg.text + " "
+
+    return {
+        "text": text.strip(),
+        "language": language,
+        "lang_prob": lang_prob,
+        "segments": segs,
+    }
diff --git a/scripts/checksums.sha256 b/scripts/checksums.sha256
index e0068a5..6ec1fe9 100644
--- a/scripts/checksums.sha256
+++ b/scripts/checksums.sha256
@@ -1,346 +1,293 @@
-2bfe6a1c1263f35916d4a28981814515fc40cb473f7bbc801f84842904c888f6  ./add_yolo_to_chunks.py
-f61f7126698018b346c8bafc45501708c17e3b45d9db54be5f0109afeee63176  ./age_benchmark.py
-8efb13239db2a25a728abbdebd92affe685b69402a277cceb0d76e62ed9451ac  ./analyze_asr_lip.py
-432b3e3b30578e71ef973aca758bd1964102cbbb19530620df8ac02df00eefb8  ./analyze_video_faces.py
-732609ef1882e14dc7ed60488697f6ae7e2607ec90b240a86ea9e585f052b9be  ./apply_asr_corrections.py
-790bd25424e93ca5a0743ea1a740a9a70f6ae6f8a9ca411012eb1e9b03907eb4  ./asr_benchmark_runner.py
-18744dc3bebdce0d89ea7076b5e43febd35ad3c84064bb52adde4d128d50bc9f  ./asr_face_stats.py
-1577d055328a73561f9ccfaf0c54727532e3dddcd1bf0f33e3c38081415cced8  ./asr_model_benchmark.py
-fcbb81639f53e9e08bee436853c84d918c0eeac09d985b34634d5ddc00055b61  ./asr_processor_base.py
-25948a204e45ce844d43606b7e45c9532321d48df44887d261fc886748276b10  ./asr_processor_contract_v1.py
-e9209cf028a11bdc45514124826374e58458ee06b054cfedffe8013d751735ea  ./asr_processor_contract_v2.py
-407dd0ec772027e0df27af0b66ea8130cb390595ccdeca4350e7bdc210acee6c  ./asr_processor_debug.py
-dcee1b80071b47c974bcffe3d27ec2f2269f4b8de7e7409ceaec7e6f271d31aa  ./asr_processor_legacy_v2.py
-10728a05a6ff2d56a70bb831abb51e05b03309e45bc5fa068c5a0702a4c73769  ./asr_processor_legacy.py
-9106bfe07de9cfc920f4f4d2f821dc024df612f4c2a8f5f75d35f012d26440f0  ./asr_processor_simplified.py
-7eabdcf7320302ee65c67e801f3ac7ca5801abc76165faa182348d30a8113e9f  ./asr_processor_small_multilingual.py
-2714f7be88f286635ea8465daf8fa969e6b27d2b2d1f73ac5e98f5e496139cad  ./asr_processor_small.py
-1089ff10b9b0a9f528cac79580aec25e33f8eeea485ac44b6aaf8c7c0cab5b42  ./asr_processor_v2.py
-e9e622d737990bea8ecc139fa310a7cb4b0ca0309d6783f8105e74f864dfb850  ./asr_processor.py
-5431b57d4369a841d51a6d6c5e1fb5e6c2932cb97cb4601f5e1b41ffe9f7ecaf  ./asr_side_by_side_comparison.py
-6c11efc3d40e559bfbeadcbf4f51eb353b744cc4f765bd8abc472a701e3f33cb  ./asrx_processor_contract_v1.py
-93501463af84d6541405057da3783d40492aec5e536b4210dcaffe460cdb5503  ./asrx_processor_custom.py
-6adfbee842d134b9d180e2d1104694ed5cdc1fa4febcd0c502801b8f87b3ce66  ./asrx_processor_simplified.py
-60fc3465f9c461583f8d0b888e85b3a6e04e1f252a1e1c21d036b52e1ce4b43c  ./asrx_processor_v2_noalign.py
-82d65b71bd86874e484870c40214d3fbd9343c39d5d635896fb4d257d13a410f  ./asrx_processor_v2_transcribe.py
-5a0c9905a2e10c847aa74f108e4054de4704bbafb2004589db15bf33833ea3c7  ./asrx_processor_v2.py
-b16b00cf9e5de96abc512022af9bb81196405b10988f5a39dfd3a9b6471f1155  ./asrx_processor.py
-d570fbe89bf84c50f180e8f3ec26c30092e07e3fa4883fb83a644670c13b8588  ./asrx_self/__init__.py
-3b7a788e5fe2fa1a7518bf2a639ccd09b304b264b952c88a3e6612aba30faef5  ./asrx_self/integrate_face_asrx_speaker.py
-1fe4b9ac1d04c2f2ef5361d8325cf9333e434b126be6a53a4c0d40a04f32a34d  ./asrx_self/main_fixed.py
-e4a2894bd4207f6d034c86e1d232001e2e0f9e65856c89d84d8a038473a5e50b  ./asrx_self/main.py
-46f61075b403729e4ff9bf0b05367b5319acf5d8c696a0517033699dcba36276  ./asrx_self/speaker_audio_player.py
-2a072521662906e5ca84ec54cb1963930a1c795f8d64906b66e889c0f442198b  ./asrx_self/speaker_cluster_fixed.py
-db4ddc98d563bf4a8c34fcd1fe40edd34fab63fa8c293644a8a40ae87be521dd  ./asrx_self/speaker_cluster.py
-a50d0ae549b733532f940332e4656a4dcf0623703240eb74832524eedf54f888  ./asrx_self/speaker_encoder.py
-42f325168e1f6edd514eb00321f18ce581f7b61d18c50798271c3da8410cb248  ./asrx_self/speaker_player_gui_face.py
-54a847a8862e2f7400c4d8425f4bebaeb230fd50932933734819fbb6729bb560  ./asrx_self/speaker_player_gui.py
-43508b714f2f1aa8bacdb9c4f52152f3fd14f6c2e2529460e5b24b29846c8c37  ./asrx_self/speaker_player_interactive.py
-e25e789552fef129bd6f536140ec4deead8e242091ab60ab679b544ff9d43307  ./asrx_self/test_gui_face_player.py
-788014df1faf7cfa09fbce16781f8bf9da1acef75e8891592b3b4d51b91e93f2  ./asrx_self/test_long_movie.py
-8bac63ea24cd06b9d398c2650ac396e10db64e33f0686a01bd460e17286e7574  ./asrx_self/vad.py
-f11b67ada6167540d2f95cb2af93d0e3a0de55bce659745baa37c4aa4805212e  ./audio_taxonomy_processor_v2.py
-ded810b81cda24e31e82de14ba9846770ee2b18d84d52b9d570de5877e9e2513  ./audio_taxonomy_processor.py
-f7c53be5a031a8bff15c3165543586529932d81c4312521654d132b1f0ed6bc3  ./auto_identify_persons.py
-5497a6f1f7ae267c796a398a9f020ea485aa45f980f2eca932b904ad61ce9b40  ./backfill_demographics.py
-39a479ca4f8986f3255b0bcd0d9162a1f2ae339bb4dcf081f931ff9b304797a1  ./backfill_frame_data.py
-308c8e3f3d45ee273504f9f415eaf6c025f06aaf1cca33156a66431ed6e64f43  ./build_semantic_index_poc.py
-4eb37768edd252d94f0d751f219c317e905bc093f414b2a6350efb8294131138  ./build_semantic_index.py
-debbd058957d09c2397f3f4c028edaa0a658002921dcca95eae2a20070ba95fb  ./caption_processor_contract_v1.py
-7236cdb5deaeada266cc246ee11380248bb9f2255888c25a152b2f6ab1f981cc  ./caption_processor.py
-e73cbb688dade5c5b6fc4276f0c78b377903ff83f3830b63d8bcdacd8da8aecf  ./check_all_stamps.py
-7ecdbd4b1f94be8ebab9935ea210a868330e7030b6e19c73229c579c1189fd5c  ./check_architecture_all.py
-7179ed1a87241904af29542f9018398f8afd9b9dd89af7bb11909310ab7b49e0  ./check_architecture_docs.py
-7e6bd7d14582e494baf8b28354bbded3f79b43f0bd271ab33874da55b9086311  ./check_code_document_consistency.py
-5ffca7c55edafad755e84499981553fcb48ce6056ca7b04130acafb9e6a9b1c3  ./check_frame_112_36.py
-f49c7b0cfa53b657f69b2ad97a6e18393741cc2151b32c9d7dde2e078b75953f  ./check_frame_91_59.py
-d2cb7475262ee711a4b06e53559f0927242be4a924a56e7fe212225f318f4193  ./chinese_vector_test.py
-ecde3d3df773916f62de4e34f8d8693feaedf112a3ef9955e22417c8421722bd  ./chunk_statistics.py
-2588ecf27c13020d894e46ba70a76de89f09556b475f555dae59db36da0b90a0  ./clean_sentence_text.py
-98ab1129032f42fddc020f9b3492d1fc133851d1af33ddeb57e2385d88425af4  ./clip_logo_integration.py
-bf6f74c09b8f8c7f25c5fffb9c36f16a8afb483a7b65903cfc75e2ea641bdf49  ./compare_asr_content.py
-1f2caadcded724aa04a929018a35ace53dd79d172f5ee2720308fbd4581b0c6c  ./compare_asr_models.py
-1ed8a9530f40e304b556ff76c7cac40468c86a0cd32ff2a8bc7bf2a69669121d  ./compare_models_gun_test.py
-6bf790fe75a7a2a5220052ca14c31e90a97eabc4558cd5e9059280913862a81e  ./compare_search.py
-875e7a598982c8ad7222a51b7b147e91cd5e1a930f41214b3942107cb932fc5c  ./compare_segmentation.py
-e432b6f2364d5a9aaf207a1de0dca3fb14ab8d118c53ee34306abfe6fd211ba8  ./comprehensive_search_test.py
-43df85cf860ac28e083de35b511bb2a7b91ed48f596757f52f19487768987500  ./coreml_embed_server.py
-9149ccc8de5adfec69c6f3f2ec502ae7d5e7844518a228ba587af2e08cb38805  ./crop_opencv_stamp.py
-fc36ecbb1455d959456945266e193b601a29c4210b4938a3f0d4a9aaf44b5cee  ./crop_real_stamps.py
-34a694624ce94d916b06a847bc4d41e7665985b85e55a626a4bc3a4370c21acf  ./crop_stamp_112_36.py
-27099dc9c8ee52a6949ce18c505089afef1720fe70858b90d0801972c3b43fff  ./crop_stamp_closeup.py
-01b5a3b091ebcffc0c1e2637b7af8192ba597239fa80d152738e3b8cfdf8174d  ./crop_stamp.py
-71b2a362b5395c6e4d70e62766820db92d94eaf140d98eecb2880bcd98d55be9  ./crop_top_candidates.py
-60f18c5fa03ffbc80c209337cd1c8b6acd0b8471e600119340aa8cdfeef14f5b  ./cut_benchmark_runner.py
-deba86a1645ca5b1acf413dd9edfad77b93ff213897d739a32de1ba629bfce52  ./cut_processor_contract_v1.py
-01024f947f0326c124293a30e4f2cdb859f21cfb2d4c07f9c1030e2934f7bc44  ./cut_processor.py
-ff092ad2373b57321f87d1dd123fff8a99c8207057591e8526e56cb1424d47c6  ./dashboard.py
-f184bf3e546db0253ffb71895e8d42aeb06588c71c4914c2fe656f42ef463c9a  ./debug_face_registration.py
-a9acce1ebd6ea821a8dc5009b8fc40586a98d31c23e93c97fd844bdadbda4ed2  ./deep_analysis_112_36.py
-7767ee7455a956d14d286ad558c4c312c2ad3ccee1c73adc1bc8f761c96ad72a  ./demo_dashboard.py
-425290c12161c5cfcb0c505a737ba3951656b39e425e792919d4812e15b9b8e3  ./demo_face_learning.py
-d7e3e27e6a65b1fa62530ee954c227dbb4f97593c5a5dcc48b39e5ebae4656e5  ./dense_scan_traces.py
-df79b7fc7a03a8e754de5123a23bb33b1d5c23d832adc1886fb846ca517dd24d  ./detect_language.py
-f6f8047e24ebbec81ef27dd38f4242e63385f8ebe5be471cae156b8aa5fc4477  ./detect_objects_keyframes.py
-e61d2ef5043bda3674a0050d83ba3bc6a70c47f54e456124a736b4328f0c0638  ./detect_stamp_shapes.py
-f23a382113e9c7de2ec3b24e95160daef48f9336ae6d4ec9ee7a18f4bf529f6d  ./download_places365_classes.py
-a747e5e17960b972549714786bb9e28ea578e10e6c80788e298a0149c970bcc5  ./embed_faces.py
-f1a2b3820e1a763eba6d8d905a5bb87f5a9b4a2f005e709e313bb7505ba7ddaa  ./embeddinggemma_server.py
-43c540c02c1be992e7d44ab4fc76a759815db3ed5f25bcbb594328b50ed7c73b  ./export_file_package.py
-19d23e4604d5532928412afe4d5d39ff49194ab4a046825286ae1be154326a1f  ./export_file.py
-5f10bab1dcb0b5fad233a74069f9e2f89043e7c848c9c38ae7e2806e6940c75d  ./export_identities.py
-2a1d0a1b853fd2c28f9a404871d33912f93521358576833be0999271bae02bcb  ./export_person_thumbnails.py
-a81bf1d6af78c052e638f5d5677b4edb512d0de5441025d86fd970d3e7993922  ./export_sqlite.py
-8b5cc0ff437fb4dd0df28b7b20a78469cdca3621e2eeb4b6d46ad2391acb0596  ./extract_female_faces.py
-bdecbaf0496bf536dce2ef4897f7090749820d15dcca03492d4d736ab0f8c6c5  ./face_benchmark_runner.py
-22319a38bd684fb235fec681ddc60f45821e4bb2181f2b31fdf945f7ad9a1b85  ./face_clustering_processor.py
-5adce4e444743331fa592e13d71e52f26554eadb9744d350a7654a449a8fb8a3  ./face_count_comparison.py
-3574454c74eaf11021f9052f77d93044cca4ae0285d0f2630b4016c2ec0df783  ./face_cross_validate.py
-4f09b3b66b14a5eefb14fcf915a1ad1e9147010f6ae7671731566679b1cae461  ./face_embedding_extractor.py
-87f1b69affbac03fbd87331a99cd7c4faba6c72d359ffcfebb62d6ad8f70445b  ./face_landmark_qc.py
-28776dfcc6ac40e9481c25467438745fed60fecdfd4fc19f9f4c7396397591a7  ./face_mediapipe_test.py
-f4d1b4334a49357b74b80e390ad5a3d16263e51cbe5cab661af92bd2e9721f02  ./face_processor_contract_v1.py
-802015c73dfce0866f2a0bc94c645aa35ba30a6de78244af23090bb1f1828c6e  ./face_processor_mps.py
-96ffdbde3f4d87e9942f9e1f4c93cbd999dc404b43e00d4cdcbb22de3c0f16b7  ./face_processor_optimized.py
-17e7d0bd142bddfead94b1dd959c1f41c0dad7063ffc677dff1a99d62aab6cf8  ./face_processor_v1.py
-d6ddad29a5e53b43b887554072d7965f0535e47fb62dad1a8b87e44fa1be6015  ./face_processor.py
-8edab61189ad1a8fa60c203077e814e82d46c5bae67054fa2ab1958e199c05f9  ./face_recognition_processor.py
-9ea19f357b3fcec6c8b3875c538e53cb46e407ab188cd544963e0123e535fa03  ./face_registration.py
-72648816de611fd9b84d2b98c177b8b4f24374024b69184e8151c06cf44d633b  ./face_statistics_report.py
-499f197a06f50839ebd5350af380fa56506ce08f073ba40c0e863b8e02b34133  ./fast_face_clustering_processor.py
-0191781635b98d0675969fb87733af19525d7b5c148723346c5378c08a00fe33  ./fast_stamp_search.py
-00e7e8ed06f6a0f2c46c84a47d7e7f5d366acee941d546a52c4b1b7885c71e08  ./filter_stamp_colors.py
-5341fd648cffafc77568070313b06417636943d50ff3b4380a61381260acaafa  ./final_face_validation.py
-213793ab719f4ef42ec9b22f351dd86d4739211c17be486a46b76ba7e64fd8f1  ./find_blue_stamp_opencv.py
-e1490317c0f56b895f73cfbb6f57c8e3ea5c65304bfdd7663f103f6b564e148c  ./find_kids_pose.py
-08d4cba0650f6a22fc134d07fd15fe8784c8472c3ba687b587e31e0b980e2b1c  ./find_kids_refined.py
-aecec0784ce5d0e98176c15798f05d4f67ab6a686f9ffafba71fbd82157027f8  ./find_magnifying_glass.py
-620db08dd84f00af0c6d744dac54c68360548dd5b2cc26b12ddcefd936239b2e  ./find_pink_stamp.py
-1f4555b3578f4dc6bc08aa37e34eda1d91ea25d8134439771678d1a57bfdaeb9  ./find_realistic_stamp_opencv.py
-277aa3b48eec2e739de3bb95ef501ffbd24104aa2a1bdef28c844ef44fd75013  ./find_small_stamp_opencv.py
-fc73bbc9605938db495bd33ea74955e454e9384130531a16d42f25dbd9b515d8  ./find_stamp_in_hands.py
-c6ed0f12e78c12df977ddca5d699f58edb174b47199f584e7a24dbdc3b7d02b1  ./find_stamp_in_magnifier_scene.py
-ecf12e346619c27a985452e9f84ee262c2da25de9df0ff6e0b293279ccba559b  ./find_stamp_opencv.py
-4ff93cbcc781a5cff023f78006f1aebbe2d954405ae7d00a473fef6b41b2ebee  ./fix_asr_text.py
-4090cb892115843a909aa41426c0f39c5a53d8d88a5db69499ec8bafcb780d77  ./florence2_scan_stamps.py
-e90e4447db3328b64a2062ca13ed41f6a045220d8fb640542dff5b790d3c4d3b  ./gdino_comparison_test.py
-7071a9999057c347e2275381f1f0c58e19aa8581d70a572d3170ed14a295a48d  ./gdino_frame_api.py
-891410310b415ff68a0f7ee0aa39e84eef7f2c75887487bdb88b8f4718d40e94  ./generate_asr1.py
-24efe7db016387b40bd9caae449f0445a3d47eb878c00399803bb6e78e6dd5fc  ./generate_benchmark_summary.py
-dc956a78a3ed26686f45dd6d6d9cb42c023751fcd9b8789585450b6df63670a1  ./generate_chunk_summaries.py
-8a0922d75fdc7c5994ebfb31881d765db4b105cbcddfcaa4b4c49d11950b8df4  ./generate_chunk_visual_stats.py
-4860bfd00cc6c1c842c2f8e17e725eebca191d81067af3cb5a28661b45d74bd3  ./generate_parent_chunks_gemma4.py
-e9fca223a8329ff6bdcb8552fecedb2d8b4607c6516c373c3023f29edfd42e06  ./generate_sentence_summaries.py
-cbae7c3e85457274e8c284005196c39dc97f9d9200ed6b0e4ea266e48a381d3a  ./generate_synonyms_llamacpp.py
-57512cd7a5ec2f52813717fd3d81dec1aaa69dc9c91a9edbca847e7012b1c86f  ./generate_synonyms_ollama.py
-dc495cb8127858fa03a5f8b8bb4a772c5934ada1abecf97459bf71de80417672  ./gun_detector_scan.py
-1a7cfb72723b3b94e3f4fe368477ba693ac3d20ac7af7351962bc548c700b451  ./head_shoulder_bench.py
-b2fe8e4d8d7d1057ba928fc5e190f4a06cb60e83e2a02c5d7c423791596c11b8  ./head_shoulder_quick.py
-ba5e67a97cb465e6a1a942c2f7342406031759ffcea2b897ae963bee4bc551c4  ./hybrid_stamp_search.py
-f5847b6c8ed4c7c51290df9032d5a192317b5f03b5ff418ead1181a6e1b655f2  ./identity_agent.py
-61bea1980af5861a02d6e9b47ac5ad0bd04a4fd633af477d2179b7361ae58c01  ./identity_bind.py
-046aa90eb4a4b830910912362a9865d1e6170f5bc176fae42be630f967f9d3ff  ./import_file_package.py
-7cc260d4411ab13559803686f8b645afa07738d652d9459830aecac268597fa7  ./import_file.py
-071e3a5141d04cb9e6bd31489a835c778608785896b18ea7fa65e8db9f1547e5  ./insert_chunks.py
-d3d53f44daa7f1526488677b141e90fbf4aa5625369b96a3ca275b802414802f  ./integrate_face_asrx.py
-4cb6a93ef8006cb69e8bdb1bc72899ee9bab1bf7eceaafe9896923bb7023bbd5  ./integrate_rule3_markers.py
-75aa3e4bffc9f9cb8b9254db19095c93c3efb43d465fb5dcca8c7b9b730f5c59  ./integrated_body_action_decoder.py
-f4dd2e21fb6b668bdf0c51cc56e214188b46937b96a2b4a10d13783e171d0472  ./language_router.py
-bef426641645fcf7dcc68c87e3325a6edf3f70925febaf1df84f7c6ff87681e5  ./lip_analyzer.py
-7f98b0cc8379b3759cc7e805dd56f736cc518093e83f43b2e5ecf559a19b95f0  ./lip_processor_cv.py
-a1473eeba17fce25e4678234fe4e8793a132514e0566b03b36a0bec04eb93acb  ./lip_processor_media.py
-0df61396756ee22d35356776c189b354458661916c8baf85bcef97c9f8b62ec8  ./lip_processor_mp.py
-3202aeca29e651ef1a54f47681c6b3b2d0680555fe3c6d318a932bb12b49e58c  ./lip_processor_simple.py
-fed15bafb5e09715cc03962f465b2ff618bf05ebeafdf932643690c9635c9840  ./lip_processor.py
-1773054e8d563b493865880d0d8bda105e3eb6fb536a25817517237b3bb76afe  ./magnifying_glass_analyze.py
-7d4d048c452bf273f4a6d96da13eb7bab6aa60ca9dd51de5ca0fb0a01e587b13  ./magnifying_glass_extract.py
-8528bbf89d2770fa5a23f461274038898be251fb6e48c5d3adece5aab3bf976d  ./magnifying_glass_owl.py
-cb645f5e29ee5a36b2f97812039abfdaed7328386bcd25ad7b742af6a6b16399  ./map_speakers_v2.py
-a90bd3fb729a05010c29a213134c60cc0bdd17769e27a7d3f1250919b7bf1613  ./match_face_identity.py
-2d864dc831c2fd0142b19b8ad2cda169c2a05facd9662d31861d29bb710c4979  ./match_face_with_pose_filtering.py
-889d4853707896885ed96ab945d4266acb213f4b122e2ba7c4563eb0e3e9e865  ./match_identities_to_tmdb.py
-b34ec373bcf65139e08e41967f58a2fc8ebb67a59c361074d3590cd16541415a  ./match_speakers_to_chunks.py
-fe6260a94d01d8b43d0d3b59eb820cfd7b4711c907343a1261c69f9010ae990d  ./mediapipe_holistic_processor.py
-bb36844b4d13bba8edc1b7f0703f02081b62bea795535b8cd8dcbfdb4281f402  ./migrate_asr_to_children.py
-819312cbfce6e68a0d8d731e02d283946f79de6044f207991ddf9a28ac853d79  ./migrate_face_results.py
-c418f6e50054fa7eae1d0d879e28997b98f57437acec48b53ecb09f332728867  ./migrate_to_4188.py
-6f60aa899e06f05e575cb5b461ea517481119cc32644566245d74c96eccde722  ./multi_stage_stamp_search.py
-b24e2289c00f803c8339f59c34d44ed6c53a3c19dafc13e72c4b260d6bb312a6  ./music_segmentation_processor.py
-da2546f84d0dbd711c8800ae4e32e59d9c38de9e62e1b423c4518fa1fda1dbea  ./natural_language_top10.py
-78c3d1a9302dbfacdf9b3655dab07348957fd9dbb4af94aae83eefecd5343a33  ./natural_language_vector_detailed.py
-e924f04d68c9a8211ad373da811aa6671d2c5654281c1634dbf8b1e5e5b51533  ./natural_language_vector_test.py
-df6ac92367b1afb50c0af958e362d87555fe569f608a8d213e0a593e2a43cde8  ./object_search_agent.py
-fd39b779a0337f521940f3f7b159931f1f207f200eefd610183781fdcf3dfafd  ./object_search.py
-42d2952fc78b57302b0d12bc3d45790a2c2c46d4ffa3c713a82686134bd63f13  ./ocr_benchmark_runner.py
-7b3ccb5c4ddd4c62c5ad04d0e3aafaecc2c1441012b6a98613cdcf055e2e50e8  ./ocr_processor_contract_v1.py
-271023eec42d6be4a1ce6ae2ce3f29e825210a57e6bb37554a6f7fdf54616f9a  ./ocr_processor_mps.py
-2e73c41285e52ef013594fcd4d20df9f5781bfc26bcf62e54dd2c04ec44200c3  ./ocr_processor.py
-62196108cb3337b5f9a873d70d2981ac8f49152369afbcc8a12b3a13de579e80  ./opencv_stamp_search.py
-b2e8d552c272fd173c77693e9453a85fe16dfc12f7c2cd304d299c6188c14077  ./paligemma_vs_gdino.py
-1534d5b7617dbae77f7a37a2c33a89b90f965247a6828f00b73ea6b720f6f4fc  ./parent_chunk_5w1h.py
-5208c738d4b615282813d351daf09872ce516121bb604caa64968ef5e52c53d3  ./pipeline_checklist.py
-8f80c3a2be5c330e2d1853d9250a171c75db84598dbf3304280c42237ed4fb1f  ./pipeline_status.py
-94db44c0f49115a677d117d4901a1b7991c1517905300eaa495dd62b8ac1c79c  ./pose_processor_contract_v1.py
-167dee5e42c6bd46674bcffcfd92f368fc0b48a1f42c459c806853b281bc6482  ./pose_processor_mps.py
-a6ef3a785ef5c6dc47fa38dbed80d76bc7d4bf48cbaf0f7edb3d26df98d7262c  ./pose_processor.py
-45e6798dc5900f2f7c8776a2d260c122aae5068a075256b8a5c02e8d0be6c131  ./probe_file.py
-139a68b5915680ec697d4bb5420adbd20b89637de2c16a15d68aca4fc22da02b  ./qa/executor.py
-4a59b36c29e1ee6e2b169db3b0201d2f7088c6ccbfdf642a3b522aeb182bbeea  ./qa/judges/facenet.py
-0dcea0258ae3309cdec93dc4dd534d1a42511c327d528a117c8e3085f5b30386  ./qa/judges/gdino.py
-7c9392436477662bc1b49d719f0c78f96e8e7e180fd281d4c59c36fd241a3e6a  ./qa/judges/gemma4.py
-84c6f793538981bdafdc08bb9bd5f12401b442441fae54936f610a758d18e972  ./qa/judges/maskformer.py
-2f9b5dd3373fdec77a84f117ab620230e208f96d015c960275ab60a0656575b6  ./qa/judges/paligemma.py
-52dedc276f6f9806710f1ef510aabd88032afe4abad364f5963fd2bd5b6cf14d  ./qa/judges/yolo.py
-c4e4424aad1847d822e9cf7dc98a1b2e903735a61e8ec056c6a9be75f79486bd  ./qa/pipeline.py
-96f5ab509622118db307641082a19daff6b9a36bcc66451c35ed2abee4fe4249  ./qa/query_generator.py
-00b1716423a184856bbe44d4132fd6d84ca13f3ae018964caa6f3389c1ab98a5  ./qa/scorer.py
-01c7b3c30c1531224f9605f0ee633285fe8489ab2d0a3c9c6a41f2b2b60d6626  ./quick_stamp_search.py
-e3143673a2bff6139e05c82446fd8770c4b7e59a854a42c3b29662f5ac75efe2  ./rebuild_parents.py
-4aa98981632d4f8a11039c510e86aa296ae1cd4b399fc871ed664ac11e445bd9  ./rebuild_story_content.py
-205cfc47b603b5ab94d97dae8c25486b342b7c2858afe6d6dae27615ca0b2aeb  ./redis_publisher.py
-750f778946b56bc57c47d9d2295332bb0f8cec2c1aa03c6b882d39ef4432673d  ./refine_search.py
-0f8a6a6866a5797e964d3b17e2b7ef146fe7a798f09fcea982fcda6f629b4d06  ./regenerate_parent_5w1h.py
-3ee192b623f290136b36bd63abd018aad6e6639a9543970c3415734628b33bd6  ./register_sample_faces.py
-334782f0f66d0ad3818a51adf6343186a2de65467378ab68a81ade806e496af9  ./release_manager.py
-9a44cdd155953778b52ac0cfb118504c56eb6b1141984365ffbb717e28f3e65b  ./release_pack.py
-3906b48f3a7764d19605def2bf8ef84a54a6afe64c9291a7cc0881a91472a826  ./render_face_heatmap.py
-44e432c31a35211a37dd26695772b7e250487ac42ba4f16a56f843277c2fabbf  ./render_offline_report.py
-3fac1e6a4125042185a2ce82771f695c562b3137c7aa58a912bada00ad8ecf78  ./rescan_single_frame_traces.py
-9c3212cb455c2a6230be918448560fee00c153a8956ffd04fcb62974d5e1abff  ./resume_framework.py
-7c95ec08daf4f980bd53233503b7a4fa01afc08660e8fe8cd031ea3613ead8f7  ./save_events_to_db.py
-24795e1531fe05e33d515104e4fb2f9567b46d802ef1b5a38f11268cf105be76  ./scan_charade_stamps.py
-cad2da5073577f851c5cb2abdbd7cab05b39caa0d1179ccc89c378a7df2736c8  ./scan_full_video_stamps.py
-03ae71470331fe5b7f8e394f7f789eee08cad4ed5ec9196b46ab2c9dbefa7fec  ./scan_handheld_objects.py
-d3935ba498786cf260d9d5370ca60d3af7bc4fd438f6be33ce23cfd0b7bab593  ./scan_keyframes_opencv.py
-12c9b35212f587f5adb37584bf3c3844804d2bc642ebfc5d82b86b44f46d2472  ./scan_keyframes.py
-f386130ac203308c904ba7efea09ce0ca0d640d36762b113bf0cfedc24d7f885  ./scene_classifier.py
-482edae04e5467a68c77729760db53d3653e8d7654fa49e5ec9a36f1f8f22616  ./search_blue_stamp.py
-e3786422932138272d1096ad4c800594e62c9640952a286a9158372a1e5443e3  ./search_envelope.py
-2df1e259c2e52d10d79b20856cb94ffff5a9bfdbe47cee587b1148b2f1c16101  ./search_objects_in_hands.py
-9fd49be8ab16f94fd82efc5ae035c029372a7ddeb7fd779b557f1917cdc14592  ./search_vase.py
-7a6d8e7c435368f6218db972c04a7be16d7d6680d8d4374f82c05b7162716b9d  ./select_face_reference_vectors_v2.py
-2bcf7c1b3c407b51a134a5ee4982713f0ea387cfd6df01ed75554c94603971a6  ./select_face_reference_vectors_v3.py
-d52098fcf1f9f7ba14f31a9a90bc5b3bc933e1a5e5697e3d09eff389c153cb18  ./select_face_reference_vectors.py
-a02cb37639275d86ae0b4504d21f50963b45aaf94630c59472ba30d07722e50c  ./simple_api_test.py
-02516ab1616c1756c4f8041f48ff12811cc5d672c53b34850b84ce682fefdff1  ./simple_face_stats.py
-b024d9bfe244d0d058daae0acd314b9344d6f0912e4f3b02dbc618f9fe3e4949  ./simple_test.py
-af8703506769f3cdb89ff7849b071c2421307717850596dd86d2fe0b053e7809  ./smart_stamp_v2.py
-5e5f86d47ea2b75bcaa8662689f73af1963645149c0da688dc43482616aa4e76  ./sound_event_detector.py
-bab7697e4b4b05e93babc116e0c5b13cbaf1f4d419a65acd5dc1de5bdfc510dc  ./speaker_assign.py
-381ff240ce806ead7d6463ee40c5b830035eb6252180b4b0901b3c8313fa4bbd  ./speaker_bind_lip.py
-5eede29fa0966974c1943792d7fcca2dd9179d4f23570cf1a3964dc97bc9ac1e  ./specific_stamp_search.py
-d5363d832272bdb3c1d6f6d93eee7b7894893b9164a3f5ad5fa08a4a0eaeeb47  ./split_asr_segments.py
-8e1269f173f2c72de78857c2d83d3111b62ec89bd79f4fb00c3f57390986ae4f  ./step3_asr_fine.py
-7592df8be5dc58376b33960bfa7fc0003c51114b70ebc01f1589f39ee9568d3b  ./store_traced_faces.py
-7ac32c1e2146a19e6654ab3e4bbbfd42e1a6540fb8717d40d55c61e9f5d1bf71  ./story_embed.py
-74cc24b328a075f48b1f44a465611157f44eadc8f5dabf6d95cd5cc5f80dd9dc  ./story_pipeline_full.py
-97628f0f1270825dabafdf0a69f10ef12c4ffe2be4ac12941315f06bfb084e7c  ./story_processor_contract_v1.py
-1b1f42fc4bbff26551f26f4ac1e8a995dfe3ff98b940a29c9e130410965d0fa0  ./story_processor.py
-cdbc7ef88551e2b3a3771eac5be5e0360989e71fa009ac28c97e548507e08a5e  ./sync_face_speaker_to_chunks.py
-8b08e9a33f5917aad10e070d6aa48805f5e7c23f905ba8fff3b8697b2109d962  ./sync_to_mongodb.py
-f64cc6dcb72f54d3e97aa981b40591aef4804ca769e1f14628d901b98bc6aeac  ./terminology_manager.py
-455546b9bb3a2c2c877c7720229b254e75b28eea33b3715d1731c02ca85294ae  ./test_api_correct_usage.py
-b03dc1bbb091672e7da2b131850b17badac896b4fbba92fe9bce76c232c99be4  ./test_api_with_key_id.py
-7d295c77d5bcd4c72c5673370af48cc89bbccf9292c3b82aad3a230d242547a9  ./test_args.py
-f474ec88e6634decbf178da497443fa709096b174bb4a4320a07256f516b1044  ./test_asr_large_model.py
-aa952524dd86f346740ffe555075b74adf2e60bb822bb04a943a51b1fd262445  ./test_birth_uuid.py
-db87badad7948527325a528400d67a4eeef76abf8d13f5c4254c812e944e4e0c  ./test_end_to_end.py
-e191c98a82f7e089f7dccfc4c536244da2bf14339f982a3afef05d33332c3755  ./test_face_api_final.py
-1b97c9aae2e1744aa7aefb192eaef86c64e6134efc8f08ffa9a274bff16a58d3  ./test_face_api_with_correct_key.py
-f7e4078f31b1ca8494c18878219cf2f90c301f19fc851b9e7084657b71a5e150  ./test_face_api.py
-9eafc49f8fa42b4cd58109e9b725b3aec3b06943ec426919b1788838ccf1ed92  ./test_face_db_fix.py
-38bce82b167e0c97b257cc6b955fdc2e9ded581ce2d39eb0fd2c60249275394b  ./test_face_direct.py
-24e82bf0af82407e6c04361e9a671770cbfb0b05d92df589bd0d5a0118bb5a98  ./test_face_learning.py
-8dcdb144c4253fbb466f220359b42c2a9579193865e320a56e682e384c2ae176  ./test_face_recognition_integration.py
-b921e3256fdea176d4391116d1ead472c4f3ca8aac6999140367818818c35ec3  ./test_face_registration_api.py
-9af6c6ff0c766b3de92185c3602f2b8b62b815bf88dcb0e3251c2676e61e0a48  ./test_face_tracker.py
-4f70eadb6a8b80eb8febe32b17b77e58d1a4823cc5d598e5ea45555342d2d4cb  ./test_florence2_direct.py
-0588be0acea540950d737943073f71e769b6301374eaa4ff7fdb96a80145c4e0  ./test_florence2_pipeline.py
-694c15193616157ddae4bdb0a45feada2a8f8490f01d290a28aa77a4b24eabb2  ./test_florence2_stamps.py
-2c281f698616a83e9eeccd610555d9f9ab657b2deac65ae9e3dbfba0b450d9b0  ./test_identity_db.py
-7a73e8314ea7e91ca9dad3867a83b9c1101fdab09bdc0fdac0f798d0a7a204f3  ./test_llm_capabilities.py
-68300f87b96a474f06a3071a833e6b3ae48d1db5fb8a7e5a3ec1834fd878d808  ./test_multilingual.py
-c17cdd0f4ffb7a151a634add08d13cc576ba7a848bb20f54fb97d0c1d9d81cc0  ./test_object_search.py
-d07bd363a2878259fbf4ffcba40e367f7f1bf4171b5a5dfdda97f7a53b450d0e  ./test_ollama_feasibility.py
-8421003b1f66cbd21c6fe5d3aff0a526897753e959b23905ca8f502f644f66a5  ./test_owl_vit_debug.py
-6f9e8b7947229ea4aa0a62b59bda5fcec05bd74f6c00dc4a7b06d932bd1b730f  ./test_owl_vit_stamps.py
-da91a7c97466ce7f03cde13aa9bf6e691b3e482d2cac74519a2e1a61a2abb05a  ./test_parent_chunk_generation.py
-19d9f2492d3b04b7dafa008f106767d3107dd36b0c8e4601765dca30131027cd  ./test_places365_scene.py
-de44553023067362e8b2223f03e1bff55fcbd2f11ddf3d01060dc02c4675a744  ./test_probe_file.py
-c0e987ba06a61cc0426ffbca8af1eb51a97bd79acab59b70453cfbb18eaee093  ./test_processor_performance.py
-7b4b55e23dff35ba107b3da5b0560d03b1b41dfdea1d3a59eac777b4be4d4033  ./test_pyannote_audio.py
-5cb8b42033ffba41f25e7ef74ef04cf352c0c277a9971e9eaef53fd673902712  ./test_pyannote_multilingual.py
-8580e689ae148754e03d958419e108241040a012584ba49e8a90db114a9f8c13  ./test_scene_api.py
-1194d450070b1f42e045d98e532f41205bb3e52fc48ba26e7c9b72a188fe1b2c  ./test_segment_count.py
-147bfffeac9561cfa407207b04a825862ac623ba97deecf5ed7c6257432dc62c  ./test_speechbrain.py
-22e4b865bc769329c1146c2f914395044a9bc84cd2a13acf68fb374a57fe1e3e  ./test_v2_detailed.py
-a616570a2a080b5b19f4bf783877147e714a014103b274143dd37984a946ca08  ./test_v2_model.py
-7b83611f6b3028500c91c62197f774c0769e299136eca8dc4b612a7b5743e3d6  ./test_v2_with_text.py
-1dd983c78074a61ceec26d7e3623d40772ca55fd6ee63ba368afe756c66ae091  ./test_with_real_image.py
-1b738cc0d69d33e967cbb775def0a7f58dc02f1911404af56a5825bd60a5b75b  ./text_semantic_analysis.py
-a4221417ae00add76881c6c715ee4257c263e2dfd0a846a8887738682dfe8cda  ./thumbnail_extractor.py
-0d188a738a0df79ead10065d9f17c366fe159c862bd4bafa2860d0e6ba2640c3  ./tkg_builder.py
-8b97f0fdfc0899460bf23d420dba0a51a34737c74ebad0519856909d198662bf  ./tmdb_cast_fetcher.py
-4858909a0beaf8397becf4103be17fcc350841217afcdc1d917c48c512a9041b  ./tmdb_embed_extractor.py
-54d8321dfe0f8caa669e4a9d1b48dc772a5b25817eab95b552944140c91f457d  ./tmdb_identity_integration.py
-2a84aa2dcfb83ac385d2c394f884926f306c81798e4277a26dbd1f3c5506be46  ./trace_face_aggregator.py
-61d3b4b362722ce24326a204f1b72cc7b1dcc20cf3264a4f526d4ea343a8d33d  ./transcribe.py
-ede9a184fd51ef4c87eb3e2541f09b91739a49986cb588591a7c6fbb33433020  ./unified_synonym_processor.py
-a408f294c3a71eb6a0eea80b9b586f73dedcefe286c62233f713a7428a9979be  ./update_all_demographics.py
-e6520bb10ae6835ceade487ceb5e3fa549ca6f06de35b2c785d649921ef443f4  ./update_fine_speakers.py
-a2191daff2ad228725b6a66f0e472ec659a6b4fa8f2cbbd74d1bf9c35cca63eb  ./update_person_demographics.py
-60060753cfd2a6d1241e55bf40a0c74f1df15739656d0349e22e8543036b2424  ./update_speaker_assignments.py
-fdc61009c351263e0018801b32ad90ffd8919af611a2a0580546be7fd62c99c4  ./update_terminology.py
-0d337c821b36eb7761c0e439b63b8192ff54a542c539d1279efa6854f0b0cdc2  ./utils/body_action_decoder.py
-3b384a8d88f6147d1953b14bd6b55672f4f161885e29bc241a466d4cfbd50e99  ./utils/face_trace_visualizer.py
-52a7b79ade15f213841c70416565d3c5e46c145c9a72724ce545143c6e0bdea8  ./utils/face_tracker.py
-ecd902a4a6f1084d8396af0b4d88079105c84fa6170e3a394720a6452ff3aa3b  ./utils/pose_action_decoder.py
-29dd3e0f802c0347cd9d9465123915b4604c990d7250048b7ae388af03cf5f36  ./utils/pose_analyzer.py
-bc6184153096e5cd8d89d02fa3279c6587f60a49c6b3366b4d82cee722bbf352  ./utils/pose_transition_analyzer.py
-d0ec8f4a67c1a1eb1356ad6e9b2f466575691bd336621cdbbfd31dd10159f2dc  ./utils/test_mediapipe.py
-4840c11964a59eabad26b97fe01033ccaf7903e2d24edd5e1035f6dd5fc995ea  ./vectorize_4188.py
-078979114c5f248d2bfd43aa8df55235fa03ab812f26998b984cd485a3d2cda8  ./vectorize_chunk_summaries.py
-ff98864f1b11795cc3bb64f30ccb6f8609771ddc7a5df2c003ba7c2233d16fc2  ./vectorize_chunks.py
-5880c128400e6e36c8eb7dffd009dbbc99dd13f8575b0037bdc854e25ddc41fb  ./video_comparison_statistics.py
-0a1501ffdc027236cdf88706b3d61229e2998ab268fd57fb60e399ccb734b6a1  ./vision_agent.py
-eac8f90fbbb655614abcefc4b887e346bf94db5f015d33d37bc9514fb030489d  ./visual_chunk_processor.py
-c165dfc5fc981dc731b25ef414184ee58e56b73b148d41a32fdce985c701efd5  ./visualize_stamp.py
-6c65a82fdd1d585e20bee4fcb2d1bdec2e6220bda71d6ef9cd00d6a3cf74c4d7  ./voice_embedding_extractor.py
-2b3a7b357db4ddd07ca30bf200c6600724e33441d8def0a4d9a39673e2cfb1c0  ./weather_sound_detector.py
-206b61ebf3c91d7ce3f1488247b52aca6e955042d8aa979c59723e3ff10dd36a  ./yolo_benchmark_runner.py
-e8cb0963c90fbd1c2aa91141f80340edd3c9560d69780dd825d107c6ed14fa64  ./yolo_count_comparison.py
-dad775ecdca0144bd14b7abaa7ec8fb213e8b9428e39906abce541e93db496b6  ./yolo_processor_contract_v1.py
-74ff880e664ec514223a4f220b682fbc87089f8c0851c93ac68c97269b8a59b6  ./yolo_processor_mps.py
-8af0a6db683b6626e07820b302135ac5960d38e3d4b3d187c640b23ce8a14f72  ./yolo_processor.py
-e13cf22b9aeae96c7e28b4512dd2137743a25eb59027da446966c1aaaaf4ce71  ./zero_shot_combined_test.py
-f4aaf017ff588999f06cd9ba1787517e06c6d6e6228a15a54d8aa4f54fde5eb3  ./zero_shot_gun_test.py
-0a285b8ec33d7999e9d4ae8d43ce768c9f06ee1929e13a6809e98bdabe6357ce  ./zero_shot_objects_test.py
-5711c6d18acba76511a3f088d4d0f095b47c978a6c6ae3e086e2b7cbee7b9e55  ./backup_all.sh
-c8860e3d55b99745265998abaae63efe28c83d7c1bfd91b30dfba54d146793d3  ./check_config.sh
-6321793085bfb33b751b2848dddc41f13d9ead9763f6e581f9dcfceea9090f8b  ./demo_identity_full_cycle.sh
-77382d8671059ff99fd5ca3db42590de47ecf4e1555eea950bd3a7016b1547b0  ./deploy_package.sh
-09bda12152917b969259ff3ca0bcda63f615bdf4873dbb8bb7f7ce5eec742a9f  ./final_validation.sh
-491e609bb43526b0c41d3dd060a3813bbeb3defc70fc88fe36f9fbbd2280e720  ./install_mongodb.sh
-09e21960f0d7fdd00ff1d30334b753a8216ad17fc3644c9dbb129b4446ecc12c  ./package_delivery.sh
-0c2fe9288f9b51ad34aadf87093c1e1a423483ad7a972861ace811250e30204c  ./package_file.sh
-c233bb7b854dfd68e75808640fdea379af6952095a93cc8884d7e8b7ecbb4539  ./package_release.sh
-02e85ba83e8d3da68bf9320ff25506714ce460736b8824309027a5ec375ea86b  ./package_system.sh
-7557f1999bde53ef397b78208713e8df8817171dfbc053d6bed130b57a229517  ./release_preflight_check.sh
-091087dad7f38e8a0d98458b64fdeb0ac5770534f7dfebdbdf3b80d945ff39df  ./security_check.sh
-25711049adabfd179d4e19c2a4c4bd675ed9da8e8913ed1bdaac7519f6cde7ac  ./setup_fresh_mac.sh
-f6dae232edd5d2d111468be125609feb0dbd8db1895846f3d1c48f0e411e3a16  ./setup/01_postgresql.sh
-8a405e2372ddb5958f7bfac15d330a2f189ffe2583ae37bba4c953ac45412c80  ./setup/check_momentry.sh
-72dc22172a201a060a20f21b89af38c80ecb6399f594ecca81cafa8a918c764f  ./setup/install_momentry.sh
-5eccd14e8e4b3c91159b17756892dd03a7d26cb7bbc1961d783188ed10411770  ./setup/upgrade_momentry.sh
-e48ab4673f71370dc7d4ce5c32d159bf9438e9e1dd7c9edd9c6053156fbdaa99  ./start_momentry.sh
-ffe7e91a24fbfa826eb816f66cdb315097fe841a7b67a476865aec1ad7a4dda0  ./swift_processors/.build/checkouts/swift-argument-parser/Scripts/environment.sh
-b2ee4f8a445a7e83f7b99ae5d4139fd525d9e3e58a360bfef054d441aa21d901  ./swift_processors/.build/checkouts/swift-argument-parser/Scripts/format.sh
-9461213a77531fb3a5742fda0c9024304abe47988bb33852da55e96ae01a382a  ./test_api_validation.sh
-7cb98fb67007abe03bb57ef58a5e7499ae389693b33a14e015c9ef6061d6b0f5  ./test_face_recognition.sh
-46bf67f794dbcd2c191f1933f1c05a1eef0ad3f5bb2e1d64e11e5f23a44ffc10  ./test_identity_agent.sh
-7763d5bfbd83ede94e31eb8e44dd0d422fe2d1221b9e112d73fc637f29fdb7ea  ./test_multilingual.sh
-8a730fedf9252b7ed352b8447773c9c256f064fd64ca20efa05f9021766b09e5  ./test_search_modes_v2.sh
-fbca5ba0783153c4e21c174b0cbf75b582514f6ef0f92750a82d3178bc170f48  ./test_search_modes.sh
-f8c1647cdb4db8adef1829e41fbecd97f6b3b2e62927f195cd8e68127876069d  ./troubleshoot.sh
-992296b5218f3ef97ce53325be12f71848f3c3aeb3ee81d764bfe4bd61e1de05  ./verify_package.sh
-b6f95fa070cc0258bc5d005f10d13025ba8b08d3ee1598bcdad405ff1d3332ed  ./tmdb_agent.py
+2bfe6a1c1263f35916d4a28981814515fc40cb473f7bbc801f84842904c888f6  add_yolo_to_chunks.py
+f61f7126698018b346c8bafc45501708c17e3b45d9db54be5f0109afeee63176  age_benchmark.py
+8efb13239db2a25a728abbdebd92affe685b69402a277cceb0d76e62ed9451ac  analyze_asr_lip.py
+432b3e3b30578e71ef973aca758bd1964102cbbb19530620df8ac02df00eefb8  analyze_video_faces.py
+732609ef1882e14dc7ed60488697f6ae7e2607ec90b240a86ea9e585f052b9be  apply_asr_corrections.py
+790bd25424e93ca5a0743ea1a740a9a70f6ae6f8a9ca411012eb1e9b03907eb4  asr_benchmark_runner.py
+18744dc3bebdce0d89ea7076b5e43febd35ad3c84064bb52adde4d128d50bc9f  asr_face_stats.py
+1577d055328a73561f9ccfaf0c54727532e3dddcd1bf0f33e3c38081415cced8  asr_model_benchmark.py
+fcbb81639f53e9e08bee436853c84d918c0eeac09d985b34634d5ddc00055b61  asr_processor_base.py
+25948a204e45ce844d43606b7e45c9532321d48df44887d261fc886748276b10  asr_processor_contract_v1.py
+e9209cf028a11bdc45514124826374e58458ee06b054cfedffe8013d751735ea  asr_processor_contract_v2.py
+407dd0ec772027e0df27af0b66ea8130cb390595ccdeca4350e7bdc210acee6c  asr_processor_debug.py
+dcee1b80071b47c974bcffe3d27ec2f2269f4b8de7e7409ceaec7e6f271d31aa  asr_processor_legacy_v2.py
+10728a05a6ff2d56a70bb831abb51e05b03309e45bc5fa068c5a0702a4c73769  asr_processor_legacy.py
+9106bfe07de9cfc920f4f4d2f821dc024df612f4c2a8f5f75d35f012d26440f0  asr_processor_simplified.py
+7eabdcf7320302ee65c67e801f3ac7ca5801abc76165faa182348d30a8113e9f  asr_processor_small_multilingual.py
+2714f7be88f286635ea8465daf8fa969e6b27d2b2d1f73ac5e98f5e496139cad  asr_processor_small.py
+1089ff10b9b0a9f528cac79580aec25e33f8eeea485ac44b6aaf8c7c0cab5b42  asr_processor_v2.py
+b9e826f23f080ae67f5961ad750ec2a6834cd18335955c3b3175b8cd06ebd6d3  asr_processor.py
+5431b57d4369a841d51a6d6c5e1fb5e6c2932cb97cb4601f5e1b41ffe9f7ecaf  asr_side_by_side_comparison.py
+6c11efc3d40e559bfbeadcbf4f51eb353b744cc4f765bd8abc472a701e3f33cb  asrx_processor_contract_v1.py
+93501463af84d6541405057da3783d40492aec5e536b4210dcaffe460cdb5503  asrx_processor_custom.py
+6adfbee842d134b9d180e2d1104694ed5cdc1fa4febcd0c502801b8f87b3ce66  asrx_processor_simplified.py
+60fc3465f9c461583f8d0b888e85b3a6e04e1f252a1e1c21d036b52e1ce4b43c  asrx_processor_v2_noalign.py
+82d65b71bd86874e484870c40214d3fbd9343c39d5d635896fb4d257d13a410f  asrx_processor_v2_transcribe.py
+5a0c9905a2e10c847aa74f108e4054de4704bbafb2004589db15bf33833ea3c7  asrx_processor_v2.py
+b16b00cf9e5de96abc512022af9bb81196405b10988f5a39dfd3a9b6471f1155  asrx_processor.py
+f11b67ada6167540d2f95cb2af93d0e3a0de55bce659745baa37c4aa4805212e  audio_taxonomy_processor_v2.py
+ded810b81cda24e31e82de14ba9846770ee2b18d84d52b9d570de5877e9e2513  audio_taxonomy_processor.py
+f7c53be5a031a8bff15c3165543586529932d81c4312521654d132b1f0ed6bc3  auto_identify_persons.py
+5497a6f1f7ae267c796a398a9f020ea485aa45f980f2eca932b904ad61ce9b40  backfill_demographics.py
+39a479ca4f8986f3255b0bcd0d9162a1f2ae339bb4dcf081f931ff9b304797a1  backfill_frame_data.py
+77a98d9b7cb97eceae4c0fcf2c353933e0fb36ee7406b57d59b1e216b1a44601  build_docs.py
+308c8e3f3d45ee273504f9f415eaf6c025f06aaf1cca33156a66431ed6e64f43  build_semantic_index_poc.py
+4eb37768edd252d94f0d751f219c317e905bc093f414b2a6350efb8294131138  build_semantic_index.py
+debbd058957d09c2397f3f4c028edaa0a658002921dcca95eae2a20070ba95fb  caption_processor_contract_v1.py
+7236cdb5deaeada266cc246ee11380248bb9f2255888c25a152b2f6ab1f981cc  caption_processor.py
+e73cbb688dade5c5b6fc4276f0c78b377903ff83f3830b63d8bcdacd8da8aecf  check_all_stamps.py
+7ecdbd4b1f94be8ebab9935ea210a868330e7030b6e19c73229c579c1189fd5c  check_architecture_all.py
+7179ed1a87241904af29542f9018398f8afd9b9dd89af7bb11909310ab7b49e0  check_architecture_docs.py
+7e6bd7d14582e494baf8b28354bbded3f79b43f0bd271ab33874da55b9086311  check_code_document_consistency.py
+5ffca7c55edafad755e84499981553fcb48ce6056ca7b04130acafb9e6a9b1c3  check_frame_112_36.py
+f49c7b0cfa53b657f69b2ad97a6e18393741cc2151b32c9d7dde2e078b75953f  check_frame_91_59.py
+d2cb7475262ee711a4b06e53559f0927242be4a924a56e7fe212225f318f4193  chinese_vector_test.py
+ecde3d3df773916f62de4e34f8d8693feaedf112a3ef9955e22417c8421722bd  chunk_statistics.py
+2588ecf27c13020d894e46ba70a76de89f09556b475f555dae59db36da0b90a0  clean_sentence_text.py
+98ab1129032f42fddc020f9b3492d1fc133851d1af33ddeb57e2385d88425af4  clip_logo_integration.py
+bf6f74c09b8f8c7f25c5fffb9c36f16a8afb483a7b65903cfc75e2ea641bdf49  compare_asr_content.py
+1f2caadcded724aa04a929018a35ace53dd79d172f5ee2720308fbd4581b0c6c  compare_asr_models.py
+1ed8a9530f40e304b556ff76c7cac40468c86a0cd32ff2a8bc7bf2a69669121d  compare_models_gun_test.py
+6bf790fe75a7a2a5220052ca14c31e90a97eabc4558cd5e9059280913862a81e  compare_search.py
+875e7a598982c8ad7222a51b7b147e91cd5e1a930f41214b3942107cb932fc5c  compare_segmentation.py
+e432b6f2364d5a9aaf207a1de0dca3fb14ab8d118c53ee34306abfe6fd211ba8  comprehensive_search_test.py
+43df85cf860ac28e083de35b511bb2a7b91ed48f596757f52f19487768987500  coreml_embed_server.py
+9149ccc8de5adfec69c6f3f2ec502ae7d5e7844518a228ba587af2e08cb38805  crop_opencv_stamp.py
+fc36ecbb1455d959456945266e193b601a29c4210b4938a3f0d4a9aaf44b5cee  crop_real_stamps.py
+34a694624ce94d916b06a847bc4d41e7665985b85e55a626a4bc3a4370c21acf  crop_stamp_112_36.py
+27099dc9c8ee52a6949ce18c505089afef1720fe70858b90d0801972c3b43fff  crop_stamp_closeup.py
+01b5a3b091ebcffc0c1e2637b7af8192ba597239fa80d152738e3b8cfdf8174d  crop_stamp.py
+71b2a362b5395c6e4d70e62766820db92d94eaf140d98eecb2880bcd98d55be9  crop_top_candidates.py
+60f18c5fa03ffbc80c209337cd1c8b6acd0b8471e600119340aa8cdfeef14f5b  cut_benchmark_runner.py
+deba86a1645ca5b1acf413dd9edfad77b93ff213897d739a32de1ba629bfce52  cut_processor_contract_v1.py
+01024f947f0326c124293a30e4f2cdb859f21cfb2d4c07f9c1030e2934f7bc44  cut_processor.py
+ff092ad2373b57321f87d1dd123fff8a99c8207057591e8526e56cb1424d47c6  dashboard.py
+f184bf3e546db0253ffb71895e8d42aeb06588c71c4914c2fe656f42ef463c9a  debug_face_registration.py
+a9acce1ebd6ea821a8dc5009b8fc40586a98d31c23e93c97fd844bdadbda4ed2  deep_analysis_112_36.py
+7767ee7455a956d14d286ad558c4c312c2ad3ccee1c73adc1bc8f761c96ad72a  demo_dashboard.py
+425290c12161c5cfcb0c505a737ba3951656b39e425e792919d4812e15b9b8e3  demo_face_learning.py
+d7e3e27e6a65b1fa62530ee954c227dbb4f97593c5a5dcc48b39e5ebae4656e5  dense_scan_traces.py
+df79b7fc7a03a8e754de5123a23bb33b1d5c23d832adc1886fb846ca517dd24d  detect_language.py
+f6f8047e24ebbec81ef27dd38f4242e63385f8ebe5be471cae156b8aa5fc4477  detect_objects_keyframes.py
+e61d2ef5043bda3674a0050d83ba3bc6a70c47f54e456124a736b4328f0c0638  detect_stamp_shapes.py
+f23a382113e9c7de2ec3b24e95160daef48f9336ae6d4ec9ee7a18f4bf529f6d  download_places365_classes.py
+a747e5e17960b972549714786bb9e28ea578e10e6c80788e298a0149c970bcc5  embed_faces.py
+f1a2b3820e1a763eba6d8d905a5bb87f5a9b4a2f005e709e313bb7505ba7ddaa  embeddinggemma_server.py
+43c540c02c1be992e7d44ab4fc76a759815db3ed5f25bcbb594328b50ed7c73b  export_file_package.py
+19d23e4604d5532928412afe4d5d39ff49194ab4a046825286ae1be154326a1f  export_file.py
+5f10bab1dcb0b5fad233a74069f9e2f89043e7c848c9c38ae7e2806e6940c75d  export_identities.py
+2a1d0a1b853fd2c28f9a404871d33912f93521358576833be0999271bae02bcb  export_person_thumbnails.py
+a81bf1d6af78c052e638f5d5677b4edb512d0de5441025d86fd970d3e7993922  export_sqlite.py
+2fe8c0131dde21382cae1483825d489fd467c2491a0cb91d5c1881df2e402e9f  extract_face_embedding.py
+8b5cc0ff437fb4dd0df28b7b20a78469cdca3621e2eeb4b6d46ad2391acb0596  extract_female_faces.py
+bdecbaf0496bf536dce2ef4897f7090749820d15dcca03492d4d736ab0f8c6c5  face_benchmark_runner.py
+22319a38bd684fb235fec681ddc60f45821e4bb2181f2b31fdf945f7ad9a1b85  face_clustering_processor.py
+5adce4e444743331fa592e13d71e52f26554eadb9744d350a7654a449a8fb8a3  face_count_comparison.py
+3574454c74eaf11021f9052f77d93044cca4ae0285d0f2630b4016c2ec0df783  face_cross_validate.py
+4f09b3b66b14a5eefb14fcf915a1ad1e9147010f6ae7671731566679b1cae461  face_embedding_extractor.py
+d05c65221cbe787e4e29a4de1966edb9e89fed47e9e89c9d065e1d5cb46cf178  face_landmark_qc.py
+28776dfcc6ac40e9481c25467438745fed60fecdfd4fc19f9f4c7396397591a7  face_mediapipe_test.py
+f4d1b4334a49357b74b80e390ad5a3d16263e51cbe5cab661af92bd2e9721f02  face_processor_contract_v1.py
+802015c73dfce0866f2a0bc94c645aa35ba30a6de78244af23090bb1f1828c6e  face_processor_mps.py
+96ffdbde3f4d87e9942f9e1f4c93cbd999dc404b43e00d4cdcbb22de3c0f16b7  face_processor_optimized.py
+4c3915a7465f524e706940c9813614ec4920cd6f8647602ef32e88fdbbaf8fc0  face_processor_v1.py
+d6ddad29a5e53b43b887554072d7965f0535e47fb62dad1a8b87e44fa1be6015  face_processor.py
+8edab61189ad1a8fa60c203077e814e82d46c5bae67054fa2ab1958e199c05f9  face_recognition_processor.py
+9ea19f357b3fcec6c8b3875c538e53cb46e407ab188cd544963e0123e535fa03  face_registration.py
+72648816de611fd9b84d2b98c177b8b4f24374024b69184e8151c06cf44d633b  face_statistics_report.py
+499f197a06f50839ebd5350af380fa56506ce08f073ba40c0e863b8e02b34133  fast_face_clustering_processor.py
+0191781635b98d0675969fb87733af19525d7b5c148723346c5378c08a00fe33  fast_stamp_search.py
+00e7e8ed06f6a0f2c46c84a47d7e7f5d366acee941d546a52c4b1b7885c71e08  filter_stamp_colors.py
+5341fd648cffafc77568070313b06417636943d50ff3b4380a61381260acaafa  final_face_validation.py
+213793ab719f4ef42ec9b22f351dd86d4739211c17be486a46b76ba7e64fd8f1  find_blue_stamp_opencv.py
+e1490317c0f56b895f73cfbb6f57c8e3ea5c65304bfdd7663f103f6b564e148c  find_kids_pose.py
+08d4cba0650f6a22fc134d07fd15fe8784c8472c3ba687b587e31e0b980e2b1c  find_kids_refined.py
+aecec0784ce5d0e98176c15798f05d4f67ab6a686f9ffafba71fbd82157027f8  find_magnifying_glass.py
+620db08dd84f00af0c6d744dac54c68360548dd5b2cc26b12ddcefd936239b2e  find_pink_stamp.py
+1f4555b3578f4dc6bc08aa37e34eda1d91ea25d8134439771678d1a57bfdaeb9  find_realistic_stamp_opencv.py
+277aa3b48eec2e739de3bb95ef501ffbd24104aa2a1bdef28c844ef44fd75013  find_small_stamp_opencv.py
+fc73bbc9605938db495bd33ea74955e454e9384130531a16d42f25dbd9b515d8  find_stamp_in_hands.py
+c6ed0f12e78c12df977ddca5d699f58edb174b47199f584e7a24dbdc3b7d02b1  find_stamp_in_magnifier_scene.py
+ecf12e346619c27a985452e9f84ee262c2da25de9df0ff6e0b293279ccba559b  find_stamp_opencv.py
+4ff93cbcc781a5cff023f78006f1aebbe2d954405ae7d00a473fef6b41b2ebee  fix_asr_text.py
+4090cb892115843a909aa41426c0f39c5a53d8d88a5db69499ec8bafcb780d77  florence2_scan_stamps.py
+e90e4447db3328b64a2062ca13ed41f6a045220d8fb640542dff5b790d3c4d3b  gdino_comparison_test.py
+7071a9999057c347e2275381f1f0c58e19aa8581d70a572d3170ed14a295a48d  gdino_frame_api.py
+891410310b415ff68a0f7ee0aa39e84eef7f2c75887487bdb88b8f4718d40e94  generate_asr1.py
+24efe7db016387b40bd9caae449f0445a3d47eb878c00399803bb6e78e6dd5fc  generate_benchmark_summary.py
+dc956a78a3ed26686f45dd6d6d9cb42c023751fcd9b8789585450b6df63670a1  generate_chunk_summaries.py
+8a0922d75fdc7c5994ebfb31881d765db4b105cbcddfcaa4b4c49d11950b8df4  generate_chunk_visual_stats.py
+4860bfd00cc6c1c842c2f8e17e725eebca191d81067af3cb5a28661b45d74bd3  generate_parent_chunks_gemma4.py
+e9fca223a8329ff6bdcb8552fecedb2d8b4607c6516c373c3023f29edfd42e06  generate_sentence_summaries.py
+cbae7c3e85457274e8c284005196c39dc97f9d9200ed6b0e4ea266e48a381d3a  generate_synonyms_llamacpp.py
+57512cd7a5ec2f52813717fd3d81dec1aaa69dc9c91a9edbca847e7012b1c86f  generate_synonyms_ollama.py
+dc495cb8127858fa03a5f8b8bb4a772c5934ada1abecf97459bf71de80417672  gun_detector_scan.py
+1a7cfb72723b3b94e3f4fe368477ba693ac3d20ac7af7351962bc548c700b451  head_shoulder_bench.py
+b2fe8e4d8d7d1057ba928fc5e190f4a06cb60e83e2a02c5d7c423791596c11b8  head_shoulder_quick.py
+ba5e67a97cb465e6a1a942c2f7342406031759ffcea2b897ae963bee4bc551c4  hybrid_stamp_search.py
+f5847b6c8ed4c7c51290df9032d5a192317b5f03b5ff418ead1181a6e1b655f2  identity_agent.py
+12237fa6cc5f0d2dcdd05f26fd50c0a7bfd541d1c922a1640d131fa0c4d6f4fc  identity_bind.py
+046aa90eb4a4b830910912362a9865d1e6170f5bc176fae42be630f967f9d3ff  import_file_package.py
+7cc260d4411ab13559803686f8b645afa07738d652d9459830aecac268597fa7  import_file.py
+071e3a5141d04cb9e6bd31489a835c778608785896b18ea7fa65e8db9f1547e5  insert_chunks.py
+d3d53f44daa7f1526488677b141e90fbf4aa5625369b96a3ca275b802414802f  integrate_face_asrx.py
+4cb6a93ef8006cb69e8bdb1bc72899ee9bab1bf7eceaafe9896923bb7023bbd5  integrate_rule3_markers.py
+75aa3e4bffc9f9cb8b9254db19095c93c3efb43d465fb5dcca8c7b9b730f5c59  integrated_body_action_decoder.py
+f4dd2e21fb6b668bdf0c51cc56e214188b46937b96a2b4a10d13783e171d0472  language_router.py
+bef426641645fcf7dcc68c87e3325a6edf3f70925febaf1df84f7c6ff87681e5  lip_analyzer.py
+7f98b0cc8379b3759cc7e805dd56f736cc518093e83f43b2e5ecf559a19b95f0  lip_processor_cv.py
+a1473eeba17fce25e4678234fe4e8793a132514e0566b03b36a0bec04eb93acb  lip_processor_media.py
+0df61396756ee22d35356776c189b354458661916c8baf85bcef97c9f8b62ec8  lip_processor_mp.py
+3202aeca29e651ef1a54f47681c6b3b2d0680555fe3c6d318a932bb12b49e58c  lip_processor_simple.py
+fed15bafb5e09715cc03962f465b2ff618bf05ebeafdf932643690c9635c9840  lip_processor.py
+b9532949bd145c0411876bdf3a8cbf1540b4233f7585465ce6389928e1bfd908  llm_metadata_enhancer.py
+1773054e8d563b493865880d0d8bda105e3eb6fb536a25817517237b3bb76afe  magnifying_glass_analyze.py
+7d4d048c452bf273f4a6d96da13eb7bab6aa60ca9dd51de5ca0fb0a01e587b13  magnifying_glass_extract.py
+8528bbf89d2770fa5a23f461274038898be251fb6e48c5d3adece5aab3bf976d  magnifying_glass_owl.py
+cb645f5e29ee5a36b2f97812039abfdaed7328386bcd25ad7b742af6a6b16399  map_speakers_v2.py
+a90bd3fb729a05010c29a213134c60cc0bdd17769e27a7d3f1250919b7bf1613  match_face_identity.py
+2d864dc831c2fd0142b19b8ad2cda169c2a05facd9662d31861d29bb710c4979  match_face_with_pose_filtering.py
+889d4853707896885ed96ab945d4266acb213f4b122e2ba7c4563eb0e3e9e865  match_identities_to_tmdb.py
+b34ec373bcf65139e08e41967f58a2fc8ebb67a59c361074d3590cd16541415a  match_speakers_to_chunks.py
+fe6260a94d01d8b43d0d3b59eb820cfd7b4711c907343a1261c69f9010ae990d  mediapipe_holistic_processor.py
+bb36844b4d13bba8edc1b7f0703f02081b62bea795535b8cd8dcbfdb4281f402  migrate_asr_to_children.py
+819312cbfce6e68a0d8d731e02d283946f79de6044f207991ddf9a28ac853d79  migrate_face_results.py
+c3d062aab67b5177ac7bf2c3ad2f0e578e12c9893e377f68339a17cc2783316c  migrate_identity_files.py
+c418f6e50054fa7eae1d0d879e28997b98f57437acec48b53ecb09f332728867  migrate_to_4188.py
+6f60aa899e06f05e575cb5b461ea517481119cc32644566245d74c96eccde722  multi_stage_stamp_search.py
+b24e2289c00f803c8339f59c34d44ed6c53a3c19dafc13e72c4b260d6bb312a6  music_segmentation_processor.py
+da2546f84d0dbd711c8800ae4e32e59d9c38de9e62e1b423c4518fa1fda1dbea  natural_language_top10.py
+78c3d1a9302dbfacdf9b3655dab07348957fd9dbb4af94aae83eefecd5343a33  natural_language_vector_detailed.py
+e924f04d68c9a8211ad373da811aa6671d2c5654281c1634dbf8b1e5e5b51533  natural_language_vector_test.py
+df6ac92367b1afb50c0af958e362d87555fe569f608a8d213e0a593e2a43cde8  object_search_agent.py
+fd39b779a0337f521940f3f7b159931f1f207f200eefd610183781fdcf3dfafd  object_search.py
+42d2952fc78b57302b0d12bc3d45790a2c2c46d4ffa3c713a82686134bd63f13  ocr_benchmark_runner.py
+7b3ccb5c4ddd4c62c5ad04d0e3aafaecc2c1441012b6a98613cdcf055e2e50e8  ocr_processor_contract_v1.py
+271023eec42d6be4a1ce6ae2ce3f29e825210a57e6bb37554a6f7fdf54616f9a  ocr_processor_mps.py
+2e73c41285e52ef013594fcd4d20df9f5781bfc26bcf62e54dd2c04ec44200c3  ocr_processor.py
+62196108cb3337b5f9a873d70d2981ac8f49152369afbcc8a12b3a13de579e80  opencv_stamp_search.py
+b2e8d552c272fd173c77693e9453a85fe16dfc12f7c2cd304d299c6188c14077  paligemma_vs_gdino.py
+1534d5b7617dbae77f7a37a2c33a89b90f965247a6828f00b73ea6b720f6f4fc  parent_chunk_5w1h.py
+5208c738d4b615282813d351daf09872ce516121bb604caa64968ef5e52c53d3  pipeline_checklist.py
+8f80c3a2be5c330e2d1853d9250a171c75db84598dbf3304280c42237ed4fb1f  pipeline_status.py
+94db44c0f49115a677d117d4901a1b7991c1517905300eaa495dd62b8ac1c79c  pose_processor_contract_v1.py
+167dee5e42c6bd46674bcffcfd92f368fc0b48a1f42c459c806853b281bc6482  pose_processor_mps.py
+a6ef3a785ef5c6dc47fa38dbed80d76bc7d4bf48cbaf0f7edb3d26df98d7262c  pose_processor.py
+45e6798dc5900f2f7c8776a2d260c122aae5068a075256b8a5c02e8d0be6c131  probe_file.py
+01c7b3c30c1531224f9605f0ee633285fe8489ab2d0a3c9c6a41f2b2b60d6626  quick_stamp_search.py
+e3143673a2bff6139e05c82446fd8770c4b7e59a854a42c3b29662f5ac75efe2  rebuild_parents.py
+4aa98981632d4f8a11039c510e86aa296ae1cd4b399fc871ed664ac11e445bd9  rebuild_story_content.py
+090137a5872edfed1b89c97b537d13ad8aafda9a705ebb4c54f30352503e5e3a  redis_publisher.py
+750f778946b56bc57c47d9d2295332bb0f8cec2c1aa03c6b882d39ef4432673d  refine_search.py
+0f8a6a6866a5797e964d3b17e2b7ef146fe7a798f09fcea982fcda6f629b4d06  regenerate_parent_5w1h.py
+3ee192b623f290136b36bd63abd018aad6e6639a9543970c3415734628b33bd6  register_sample_faces.py
+334782f0f66d0ad3818a51adf6343186a2de65467378ab68a81ade806e496af9  release_manager.py
+9a44cdd155953778b52ac0cfb118504c56eb6b1141984365ffbb717e28f3e65b  release_pack.py
+3906b48f3a7764d19605def2bf8ef84a54a6afe64c9291a7cc0881a91472a826  render_face_heatmap.py
+44e432c31a35211a37dd26695772b7e250487ac42ba4f16a56f843277c2fabbf  render_offline_report.py
+3fac1e6a4125042185a2ce82771f695c562b3137c7aa58a912bada00ad8ecf78  rescan_single_frame_traces.py
+9c3212cb455c2a6230be918448560fee00c153a8956ffd04fcb62974d5e1abff  resume_framework.py
+7c95ec08daf4f980bd53233503b7a4fa01afc08660e8fe8cd031ea3613ead8f7  save_events_to_db.py
+24795e1531fe05e33d515104e4fb2f9567b46d802ef1b5a38f11268cf105be76  scan_charade_stamps.py
+cad2da5073577f851c5cb2abdbd7cab05b39caa0d1179ccc89c378a7df2736c8  scan_full_video_stamps.py
+03ae71470331fe5b7f8e394f7f789eee08cad4ed5ec9196b46ab2c9dbefa7fec  scan_handheld_objects.py
+d3935ba498786cf260d9d5370ca60d3af7bc4fd438f6be33ce23cfd0b7bab593  scan_keyframes_opencv.py
+12c9b35212f587f5adb37584bf3c3844804d2bc642ebfc5d82b86b44f46d2472  scan_keyframes.py
+f386130ac203308c904ba7efea09ce0ca0d640d36762b113bf0cfedc24d7f885  scene_classifier.py
+482edae04e5467a68c77729760db53d3653e8d7654fa49e5ec9a36f1f8f22616  search_blue_stamp.py
+e3786422932138272d1096ad4c800594e62c9640952a286a9158372a1e5443e3  search_envelope.py
+2df1e259c2e52d10d79b20856cb94ffff5a9bfdbe47cee587b1148b2f1c16101  search_objects_in_hands.py
+9fd49be8ab16f94fd82efc5ae035c029372a7ddeb7fd779b557f1917cdc14592  search_vase.py
+7a6d8e7c435368f6218db972c04a7be16d7d6680d8d4374f82c05b7162716b9d  select_face_reference_vectors_v2.py
+2bcf7c1b3c407b51a134a5ee4982713f0ea387cfd6df01ed75554c94603971a6  select_face_reference_vectors_v3.py
+d52098fcf1f9f7ba14f31a9a90bc5b3bc933e1a5e5697e3d09eff389c153cb18  select_face_reference_vectors.py
+a02cb37639275d86ae0b4504d21f50963b45aaf94630c59472ba30d07722e50c  simple_api_test.py
+02516ab1616c1756c4f8041f48ff12811cc5d672c53b34850b84ce682fefdff1  simple_face_stats.py
+b024d9bfe244d0d058daae0acd314b9344d6f0912e4f3b02dbc618f9fe3e4949  simple_test.py
+af8703506769f3cdb89ff7849b071c2421307717850596dd86d2fe0b053e7809  smart_stamp_v2.py
+5e5f86d47ea2b75bcaa8662689f73af1963645149c0da688dc43482616aa4e76  sound_event_detector.py
+bab7697e4b4b05e93babc116e0c5b13cbaf1f4d419a65acd5dc1de5bdfc510dc  speaker_assign.py
+381ff240ce806ead7d6463ee40c5b830035eb6252180b4b0901b3c8313fa4bbd  speaker_bind_lip.py
+5eede29fa0966974c1943792d7fcca2dd9179d4f23570cf1a3964dc97bc9ac1e  specific_stamp_search.py
+d5363d832272bdb3c1d6f6d93eee7b7894893b9164a3f5ad5fa08a4a0eaeeb47  split_asr_segments.py
+8e1269f173f2c72de78857c2d83d3111b62ec89bd79f4fb00c3f57390986ae4f  step3_asr_fine.py
+7592df8be5dc58376b33960bfa7fc0003c51114b70ebc01f1589f39ee9568d3b  store_traced_faces.py
+7ac32c1e2146a19e6654ab3e4bbbfd42e1a6540fb8717d40d55c61e9f5d1bf71  story_embed.py
+74cc24b328a075f48b1f44a465611157f44eadc8f5dabf6d95cd5cc5f80dd9dc  story_pipeline_full.py
+97628f0f1270825dabafdf0a69f10ef12c4ffe2be4ac12941315f06bfb084e7c  story_processor_contract_v1.py
+1b1f42fc4bbff26551f26f4ac1e8a995dfe3ff98b940a29c9e130410965d0fa0  story_processor.py
+cdbc7ef88551e2b3a3771eac5be5e0360989e71fa009ac28c97e548507e08a5e  sync_face_speaker_to_chunks.py
+8b08e9a33f5917aad10e070d6aa48805f5e7c23f905ba8fff3b8697b2109d962  sync_to_mongodb.py
+869b6c56fe16cbf8973826782a17503f02b5cd757ec025b944da693d38bdb4cb  sync_users_from_sftpgo.py
+f64cc6dcb72f54d3e97aa981b40591aef4804ca769e1f14628d901b98bc6aeac  terminology_manager.py
+455546b9bb3a2c2c877c7720229b254e75b28eea33b3715d1731c02ca85294ae  test_api_correct_usage.py
+b03dc1bbb091672e7da2b131850b17badac896b4fbba92fe9bce76c232c99be4  test_api_with_key_id.py
+7d295c77d5bcd4c72c5673370af48cc89bbccf9292c3b82aad3a230d242547a9  test_args.py
+f474ec88e6634decbf178da497443fa709096b174bb4a4320a07256f516b1044  test_asr_large_model.py
+aa952524dd86f346740ffe555075b74adf2e60bb822bb04a943a51b1fd262445  test_birth_uuid.py
+db87badad7948527325a528400d67a4eeef76abf8d13f5c4254c812e944e4e0c  test_end_to_end.py
+e191c98a82f7e089f7dccfc4c536244da2bf14339f982a3afef05d33332c3755  test_face_api_final.py
+1b97c9aae2e1744aa7aefb192eaef86c64e6134efc8f08ffa9a274bff16a58d3  test_face_api_with_correct_key.py
+f7e4078f31b1ca8494c18878219cf2f90c301f19fc851b9e7084657b71a5e150  test_face_api.py
+9eafc49f8fa42b4cd58109e9b725b3aec3b06943ec426919b1788838ccf1ed92  test_face_db_fix.py
+38bce82b167e0c97b257cc6b955fdc2e9ded581ce2d39eb0fd2c60249275394b  test_face_direct.py
+24e82bf0af82407e6c04361e9a671770cbfb0b05d92df589bd0d5a0118bb5a98  test_face_learning.py
+8dcdb144c4253fbb466f220359b42c2a9579193865e320a56e682e384c2ae176  test_face_recognition_integration.py
+b921e3256fdea176d4391116d1ead472c4f3ca8aac6999140367818818c35ec3  test_face_registration_api.py
+9af6c6ff0c766b3de92185c3602f2b8b62b815bf88dcb0e3251c2676e61e0a48  test_face_tracker.py
+4f70eadb6a8b80eb8febe32b17b77e58d1a4823cc5d598e5ea45555342d2d4cb  test_florence2_direct.py
+0588be0acea540950d737943073f71e769b6301374eaa4ff7fdb96a80145c4e0  test_florence2_pipeline.py
+694c15193616157ddae4bdb0a45feada2a8f8490f01d290a28aa77a4b24eabb2  test_florence2_stamps.py
+2c281f698616a83e9eeccd610555d9f9ab657b2deac65ae9e3dbfba0b450d9b0  test_identity_db.py
+7a73e8314ea7e91ca9dad3867a83b9c1101fdab09bdc0fdac0f798d0a7a204f3  test_llm_capabilities.py
+68300f87b96a474f06a3071a833e6b3ae48d1db5fb8a7e5a3ec1834fd878d808  test_multilingual.py
+c17cdd0f4ffb7a151a634add08d13cc576ba7a848bb20f54fb97d0c1d9d81cc0  test_object_search.py
+d07bd363a2878259fbf4ffcba40e367f7f1bf4171b5a5dfdda97f7a53b450d0e  test_ollama_feasibility.py
+8421003b1f66cbd21c6fe5d3aff0a526897753e959b23905ca8f502f644f66a5  test_owl_vit_debug.py
+6f9e8b7947229ea4aa0a62b59bda5fcec05bd74f6c00dc4a7b06d932bd1b730f  test_owl_vit_stamps.py
+da91a7c97466ce7f03cde13aa9bf6e691b3e482d2cac74519a2e1a61a2abb05a  test_parent_chunk_generation.py
+19d9f2492d3b04b7dafa008f106767d3107dd36b0c8e4601765dca30131027cd  test_places365_scene.py
+de44553023067362e8b2223f03e1bff55fcbd2f11ddf3d01060dc02c4675a744  test_probe_file.py
+c0e987ba06a61cc0426ffbca8af1eb51a97bd79acab59b70453cfbb18eaee093  test_processor_performance.py
+7b4b55e23dff35ba107b3da5b0560d03b1b41dfdea1d3a59eac777b4be4d4033  test_pyannote_audio.py
+5cb8b42033ffba41f25e7ef74ef04cf352c0c277a9971e9eaef53fd673902712  test_pyannote_multilingual.py
+8580e689ae148754e03d958419e108241040a012584ba49e8a90db114a9f8c13  test_scene_api.py
+1194d450070b1f42e045d98e532f41205bb3e52fc48ba26e7c9b72a188fe1b2c  test_segment_count.py
+147bfffeac9561cfa407207b04a825862ac623ba97deecf5ed7c6257432dc62c  test_speechbrain.py
+22e4b865bc769329c1146c2f914395044a9bc84cd2a13acf68fb374a57fe1e3e  test_v2_detailed.py
+a616570a2a080b5b19f4bf783877147e714a014103b274143dd37984a946ca08  test_v2_model.py
+7b83611f6b3028500c91c62197f774c0769e299136eca8dc4b612a7b5743e3d6  test_v2_with_text.py
+1dd983c78074a61ceec26d7e3623d40772ca55fd6ee63ba368afe756c66ae091  test_with_real_image.py
+1b738cc0d69d33e967cbb775def0a7f58dc02f1911404af56a5825bd60a5b75b  text_semantic_analysis.py
+a4221417ae00add76881c6c715ee4257c263e2dfd0a846a8887738682dfe8cda  thumbnail_extractor.py
+0d188a738a0df79ead10065d9f17c366fe159c862bd4bafa2860d0e6ba2640c3  tkg_builder.py
+a084d3b5840e920d552515febffa22b34943b9efa8b73adab9cd193372e71592  tmdb_agent.py
+8b97f0fdfc0899460bf23d420dba0a51a34737c74ebad0519856909d198662bf  tmdb_cast_fetcher.py
+4858909a0beaf8397becf4103be17fcc350841217afcdc1d917c48c512a9041b  tmdb_embed_extractor.py
+54d8321dfe0f8caa669e4a9d1b48dc772a5b25817eab95b552944140c91f457d  tmdb_identity_integration.py
+2a84aa2dcfb83ac385d2c394f884926f306c81798e4277a26dbd1f3c5506be46  trace_face_aggregator.py
+61d3b4b362722ce24326a204f1b72cc7b1dcc20cf3264a4f526d4ea343a8d33d  transcribe.py
+ede9a184fd51ef4c87eb3e2541f09b91739a49986cb588591a7c6fbb33433020  unified_synonym_processor.py
+a408f294c3a71eb6a0eea80b9b586f73dedcefe286c62233f713a7428a9979be  update_all_demographics.py
+e6520bb10ae6835ceade487ceb5e3fa549ca6f06de35b2c785d649921ef443f4  update_fine_speakers.py
+a2191daff2ad228725b6a66f0e472ec659a6b4fa8f2cbbd74d1bf9c35cca63eb  update_person_demographics.py
+1a7dddd1db467990ee1c685d61b971babfa30c3ae3a754b5df8f3b4c320f3ed1  update_qdrant_uuid.py
+60060753cfd2a6d1241e55bf40a0c74f1df15739656d0349e22e8543036b2424  update_speaker_assignments.py
+fdc61009c351263e0018801b32ad90ffd8919af611a2a0580546be7fd62c99c4  update_terminology.py
+4840c11964a59eabad26b97fe01033ccaf7903e2d24edd5e1035f6dd5fc995ea  vectorize_4188.py
+078979114c5f248d2bfd43aa8df55235fa03ab812f26998b984cd485a3d2cda8  vectorize_chunk_summaries.py
+ff98864f1b11795cc3bb64f30ccb6f8609771ddc7a5df2c003ba7c2233d16fc2  vectorize_chunks.py
+5880c128400e6e36c8eb7dffd009dbbc99dd13f8575b0037bdc854e25ddc41fb  video_comparison_statistics.py
+0a1501ffdc027236cdf88706b3d61229e2998ab268fd57fb60e399ccb734b6a1  vision_agent.py
+eac8f90fbbb655614abcefc4b887e346bf94db5f015d33d37bc9514fb030489d  visual_chunk_processor.py
+c165dfc5fc981dc731b25ef414184ee58e56b73b148d41a32fdce985c701efd5  visualize_stamp.py
+6c65a82fdd1d585e20bee4fcb2d1bdec2e6220bda71d6ef9cd00d6a3cf74c4d7  voice_embedding_extractor.py
+2b3a7b357db4ddd07ca30bf200c6600724e33441d8def0a4d9a39673e2cfb1c0  weather_sound_detector.py
+206b61ebf3c91d7ce3f1488247b52aca6e955042d8aa979c59723e3ff10dd36a  yolo_benchmark_runner.py
+e8cb0963c90fbd1c2aa91141f80340edd3c9560d69780dd825d107c6ed14fa64  yolo_count_comparison.py
+dad775ecdca0144bd14b7abaa7ec8fb213e8b9428e39906abce541e93db496b6  yolo_processor_contract_v1.py
+74ff880e664ec514223a4f220b682fbc87089f8c0851c93ac68c97269b8a59b6  yolo_processor_mps.py
+8af0a6db683b6626e07820b302135ac5960d38e3d4b3d187c640b23ce8a14f72  yolo_processor.py
+e13cf22b9aeae96c7e28b4512dd2137743a25eb59027da446966c1aaaaf4ce71  zero_shot_combined_test.py
+f4aaf017ff588999f06cd9ba1787517e06c6d6e6228a15a54d8aa4f54fde5eb3  zero_shot_gun_test.py
+0a285b8ec33d7999e9d4ae8d43ce768c9f06ee1929e13a6809e98bdabe6357ce  zero_shot_objects_test.py
diff --git a/scripts/embed_faces_only.py b/scripts/embed_faces_only.py
new file mode 100644
index 0000000..fcbedd7
--- /dev/null
+++ b/scripts/embed_faces_only.py
@@ -0,0 +1,185 @@
+#!/opt/homebrew/bin/python3.11
+"""Embed faces from existing detections JSON using CoreML FaceNet."""
+import json, os, sys, time
+import cv2
+import numpy as np
+from pathlib import Path
+
+sys.path.insert(0, os.path.dirname(os.path.abspath(__file__)))
+import coremltools as ct
+
+FACENET_PATH = os.path.join(os.path.dirname(os.path.abspath(__file__)), "..", "models", "facenet512.mlpackage")
+
+def classify_pose(roll: float, yaw: float) -> str:
+    """Bucket a head pose into a coarse label from its roll and yaw.
+
+    Returns "frontal" when both |yaw| and |roll| are below 15,
+    "profile_right" / "profile_left" when |yaw| exceeds 30 (the sign of yaw
+    picks the side), and "three_quarter" otherwise. The thresholds are in the
+    detector's angle unit (presumably degrees - confirm against the producer).
+    """
+    abs_yaw, abs_roll = abs(yaw), abs(roll)
+    if abs_yaw < 15 and abs_roll < 15:
+        return "frontal"
+    elif abs_yaw > 30:
+        return "profile_right" if yaw > 0 else "profile_left"
+    return "three_quarter"
+
+def extract_embedding(coreml_model, face_img):
+    """Run one face crop through the CoreML model and return its embedding.
+
+    The crop is resized to 160x160, rescaled with x / 127.5 - 1 (so 8-bit
+    pixel values land in [-1, 1]), reordered from HWC to CHW and given a
+    leading batch axis before being passed to the model as "input". The first
+    output whose name starts with "var_" is flattened into a plain list.
+
+    NOTE(review): this script feeds crops decoded by cv2.VideoCapture, which
+    decodes to BGR by default; confirm the model was exported for that order.
+    """
+    resized = cv2.resize(face_img, (160, 160))
+    normalized = (resized.astype(np.float32) / 127.5) - 1.0
+    normalized = np.transpose(normalized, (2, 0, 1))
+    input_array = np.expand_dims(normalized, axis=0)
+    result = coreml_model.predict({"input": input_array})
+    emb_key = [k for k in result.keys() if k.startswith("var_")][0]
+    return result[emb_key].flatten().tolist()
+
+def _embed_frame_faces(video, coreml_model, frame_info, width, height):
+    """Embed every usable face of one entry from the detections "frames" list.
+
+    The video frame is decoded lazily and at most once per entry, no matter
+    how many faces the entry holds. Faces whose width or height is 10 or less,
+    whose box falls outside the frame, or whose frame cannot be read are
+    skipped.
+
+    Returns (faces, seen): the output records for the embedded faces and the
+    number of detections examined, skipped ones included.
+    """
+    frame_num = frame_info["frame"]
+    faces, seen = [], 0
+    frame, frame_loaded = None, False
+    for face in frame_info.get("faces", []):
+        seen += 1
+        # Box fields live under "bbox" when present, else on the face itself.
+        bb = face.get("bbox", face)
+        x, y, w, h = bb["x"], bb["y"], bb["width"], bb["height"]
+        if w <= 10 or h <= 10:
+            continue
+
+        if not frame_loaded:
+            # Seeking and decoding is the expensive step; do it once per frame
+            # instead of once per face.
+            video.set(cv2.CAP_PROP_POS_FRAMES, frame_num)
+            ret, frame = video.read()
+            frame_loaded = True
+            if not ret:
+                frame = None
+        if frame is None:
+            continue
+
+        # Clamp the box to the frame before cropping.
+        x1, y1 = max(0, x), max(0, y)
+        x2, y2 = min(width, x + w), min(height, y + h)
+        if x2 <= x1 or y2 <= y1:
+            continue
+        face_img = frame[y1:y2, x1:x2]
+        if face_img.size == 0:
+            continue
+
+        emb = extract_embedding(coreml_model, face_img)
+        pose_info = face.get("pose", {})
+        roll, yaw = pose_info.get("roll", 0), pose_info.get("yaw", 0)
+        faces.append({
+            "x": x, "y": y, "width": w, "height": h,
+            "confidence": face.get("confidence", 0.5),
+            "embedding": emb,
+            "pose_angle": {
+                "angle": classify_pose(roll, yaw),
+                "roll": roll,
+                "yaw": yaw,
+                "pitch": pose_info.get("pitch", 0),
+            },
+            "landmarks": face.get("landmarks", []),
+        })
+    return faces, seen
+
+def main():
+    """CLI entry point: embed the faces listed in a detections JSON.
+
+    Reads detections_json, crops each listed face out of --video, embeds it
+    with the CoreML FaceNet model and writes the per-frame results plus video
+    metadata to output_json. Exits with an error if the video cannot be opened.
+    """
+    import argparse
+    parser = argparse.ArgumentParser(description="Embed faces only")
+    parser.add_argument("detections_json")
+    parser.add_argument("output_json")
+    parser.add_argument("--video", required=True)
+    args = parser.parse_args()
+
+    print(f"[EMBED] Loading detections: {args.detections_json}")
+    with open(args.detections_json) as f:
+        detection_data = json.load(f)
+
+    print(f"[EMBED] Loading CoreML FaceNet: {FACENET_PATH}")
+    coreml_model = ct.models.MLModel(FACENET_PATH)
+
+    print(f"[EMBED] Opening video: {args.video}")
+    video = cv2.VideoCapture(args.video)
+    if not video.isOpened():
+        # Otherwise every read fails silently and an empty result would still
+        # be written with status "completed".
+        sys.exit(f"[EMBED] Cannot open video: {args.video}")
+    fps = video.get(cv2.CAP_PROP_FPS)
+    total_frames = int(video.get(cv2.CAP_PROP_FRAME_COUNT))
+    width = int(video.get(cv2.CAP_PROP_FRAME_WIDTH))
+    height = int(video.get(cv2.CAP_PROP_FRAME_HEIGHT))
+
+    face_data = {
+        "metadata": {
+            "video_path": os.path.abspath(args.video),
+            "fps": fps, "width": width, "height": height,
+            "sample_interval": detection_data.get("sample_interval", 3),
+            "detection_method": "apple_vision",
+            "embedding_method": "coreml_facenet",
+            "total_frames": total_frames,
+        },
+        "frames": {}
+    }
+
+    frames = detection_data.get("frames", [])
+    t0 = time.time()
+    embed_count, total_face_count = 0, 0
+    batch_size = max(1, len(frames) // 20)
+
+    try:
+        for idx, frame_info in enumerate(frames):
+            faces, seen = _embed_frame_faces(
+                video, coreml_model, frame_info, width, height)
+            total_face_count += seen
+            embed_count += len(faces)
+            face_data["frames"][str(frame_info["frame"])] = faces
+
+            # Report progress once per batch (about 1/20 of the entries).
+            if (idx + 1) % batch_size == 0:
+                pct = (idx + 1) / len(frames) * 100
+                elapsed = time.time() - t0
+                eta = (elapsed / (idx + 1)) * (len(frames) - idx - 1) if idx > 0 else 0
+                print(f"[EMBED] {pct:.0f}% | {idx+1}/{len(frames)} frames | "
+                      f"{embed_count} embeddings | {elapsed:.0f}s elapsed | "
+                      f"{eta:.0f}s ETA", flush=True)
+    finally:
+        # Release the capture even if embedding one of the frames raised.
+        video.release()
+
+    face_data["metadata"]["status"] = "completed"
+
+    print(f"[EMBED] Writing output: {args.output_json}")
+    with open(args.output_json, "w") as f:
+        json.dump(face_data, f, indent=2)
+
+    elapsed = time.time() - t0
+    print(f"[EMBED] Done: {len(frames)} frames, {embed_count}/{total_face_count} embeddings, {elapsed:.0f}s")
+
+if __name__ == "__main__":
+    main()
diff --git a/scripts/extract_embeddings_from_face_json.py b/scripts/extract_embeddings_from_face_json.py
new file mode 100644
index 0000000..d80fe6d
--- /dev/null
+++ b/scripts/extract_embeddings_from_face_json.py
@@ -0,0 +1,121 @@
+#!/opt/homebrew/bin/python3.11
+"""
+Extract embeddings from existing face.json using CoreML FaceNet.
+
+Usage: python3 scripts/extract_embeddings_from_face_json.py <face_json_path> <video_path> <output_path>
+"""
+import sys
+import os
+import json
+import cv2
+import numpy as np
+import coremltools as ct
+
+SCRIPT_DIR = os.path.dirname(os.path.abspath(__file__))
+FACENET_PATH = os.path.join(SCRIPT_DIR, "..", "models", "facenet512.mlpackage")
+
+
+def extract_embeddings(face_json_path: str, video_path: str, output_path: str):
+    """Add CoreML FaceNet embeddings to the faces listed in a face.json file.
+
+    Every frame referenced by the JSON is read from the video; each face box
+    is cropped, resized to 160x160, converted from BGR to RGB and passed to
+    the model.  The resulting vector is stored on the face as
+    ``face['embedding']`` and the updated document, with
+    ``metadata.total_embeddings`` set, is written to ``output_path``.
+
+    Args:
+        face_json_path: Path of the face.json to read.
+        video_path: Video the detections refer to.
+        output_path: Destination of the updated JSON.
+
+    Returns:
+        None.  When there are no frames, the model is missing or the video
+        cannot be opened, a message is printed and nothing is written.
+    """
+    with open(face_json_path, 'r') as f:
+        face_data = json.load(f)
+
+    frames = face_data.get('frames', [])
+    if not frames:
+        print("No frames in face.json")
+        return
+
+    # Accept both layouts: a list of {"frame": n, "faces": [...]} entries, or
+    # a dict keyed by frame number whose values are either such an entry or a
+    # bare list of faces.
+    if isinstance(frames, dict):
+        frame_items = []
+        for key, value in frames.items():
+            faces = value.get('faces') if isinstance(value, dict) else value
+            frame_items.append((int(key), faces or []))
+    else:
+        frame_items = [
+            (entry.get('frame', 0), entry.get('faces') or []) for entry in frames
+        ]
+
+    # Load CoreML FaceNet
+    facenet = os.path.normpath(FACENET_PATH)
+    if not os.path.exists(facenet):
+        print(f"FaceNet model not found: {facenet}")
+        return
+
+    coreml_model = ct.models.MLModel(facenet)
+    print(f"[EMB] CoreML FaceNet loaded: {facenet}")
+
+    # Open video
+    video = cv2.VideoCapture(video_path)
+    if not video.isOpened():
+        print(f"Cannot open video: {video_path}")
+        return
+
+    embed_count = 0
+    processed_frames = 0
+
+    try:
+        fps = video.get(cv2.CAP_PROP_FPS)
+        total_frames = int(video.get(cv2.CAP_PROP_FRAME_COUNT))
+        print(f"[EMB] Video: {fps} fps, {total_frames} frames")
+
+        for frame_num, faces in frame_items:
+            # Seek to frame
+            video.set(cv2.CAP_PROP_POS_FRAMES, frame_num)
+            ret, img = video.read()
+            if not ret:
+                continue
+
+            processed_frames += 1
+            img_h, img_w = img.shape[:2]
+
+            for face in faces:
+                # Slicing needs integers, and a negative start index would
+                # wrap around to the far side of the image, so the box is
+                # converted to ints and clamped to the frame.
+                x = int(face.get('x', 0))
+                y = int(face.get('y', 0))
+                w = int(face.get('width', 0))
+                h = int(face.get('height', 0))
+
+                if w <= 0 or h <= 0:
+                    continue
+
+                x1, y1 = max(x, 0), max(y, 0)
+                x2, y2 = min(x + w, img_w), min(y + h, img_h)
+                if x2 <= x1 or y2 <= y1:
+                    continue
+
+                crop = img[y1:y2, x1:x2]
+                if crop.size == 0:
+                    continue
+
+                # Resize to 160x160 (FaceNet input size) and convert to RGB
+                crop_resized = cv2.resize(crop, (160, 160))
+                crop_rgb = cv2.cvtColor(crop_resized, cv2.COLOR_BGR2RGB)
+
+                # CoreML embedding; a failure on one face is logged and skipped
+                try:
+                    input_dict = {'image': crop_rgb}
+                    output = coreml_model.predict(input_dict)
+                    emb = output.get('output', output.get('embeddings', None))
+
+                    if emb is not None:
+                        if isinstance(emb, np.ndarray):
+                            emb = emb.flatten().tolist()
+                        elif isinstance(emb, dict):
+                            emb = list(emb.values())[0]
+                            if isinstance(emb, np.ndarray):
+                                emb = emb.flatten().tolist()
+
+                        face['embedding'] = emb
+                        embed_count += 1
+                except Exception as e:
+                    print(f"[EMB] Frame {frame_num} embedding failed: {e}")
+
+            if processed_frames % 1000 == 0:
+                print(f"[EMB] Processed {processed_frames} frames, {embed_count} embeddings")
+    finally:
+        # Release the capture even if reading or prediction raised.
+        video.release()
+
+    # Save updated face.json; create the metadata section if the input had none
+    face_data.setdefault('metadata', {})['total_embeddings'] = embed_count
+
+    with open(output_path, 'w') as f:
+        json.dump(face_data, f)
+
+    print(f"[EMB] Done: {processed_frames} frames, {embed_count} embeddings")
+
+
+if __name__ == "__main__":
+    # CLI entry point: three positional arguments are required
+    # (<face_json> <video> <output>); otherwise print usage and exit with 1.
+    if len(sys.argv) < 4:
+        print("Usage: python3 extract_embeddings_from_face_json.py <face_json> <video> <output>")
+        sys.exit(1)
+
+    extract_embeddings(sys.argv[1], sys.argv[2], sys.argv[3])
\ No newline at end of file
diff --git a/scripts/extract_face_crops.py b/scripts/extract_face_crops.py
new file mode 100644
index 0000000..6262860
--- /dev/null
+++ b/scripts/extract_face_crops.py
@@ -0,0 +1,397 @@
+#!/usr/bin/env python3
+"""
+extract_face_crops.py - 批量提取 face crops
+
+Usage:
+    python3 scripts/extract_face_crops.py --uuid <file_uuid>
+    python3 scripts/extract_face_crops.py --uuid <file_uuid> --video <video_path>
+
+儲存位置: {OUTPUT_DIR}/.faces/{file_uuid}/{trace_id}/{frame}.jpg
+
+條件:
+    - trace_id != None and trace_id != 0
+    - landmarks.left_eye or landmarks.right_eye
+
+品檢:
+    - file_size > 500 bytes
+    - mean_brightness > 5
+    - std_deviation > 10
+
+Retry: 最多 3 次
+"""
+
+import argparse
+import json
+import subprocess
+import os
+import sys
+from pathlib import Path
+from datetime import datetime
+from typing import Dict, List, Optional, Tuple, Set
+from concurrent.futures import ThreadPoolExecutor, as_completed
+import threading
+
+# Constants
+MAX_RETRIES = 3
+MIN_FILE_SIZE = 500
+MIN_BRIGHTNESS = 5
+MIN_STD_DEV = 10
+FFMPEG_TIMEOUT = 30
+MAX_WORKERS = 8  # Parallel threads for ffmpeg
+
+
+class FaceCropExtractor:
+    def __init__(self, output_dir: str):
+        """Prepare the output directories and zeroed counters.
+
+        Args:
+            output_dir: Base directory; crops are stored under
+                ``<output_dir>/.faces``, which is created here if missing.
+        """
+        self.output_dir = Path(output_dir)
+        self.faces_dir = self.output_dir / ".faces"
+        self.faces_dir.mkdir(parents=True, exist_ok=True)
+        # Counters reported by print_stats() and embedded in the summary file.
+        self.stats = {"total_faces": 0, "qualified": 0, "successful": 0, "failed": 0, "skipped": 0, "low_confidence": 0, "too_small": 0}
+        # NOTE(review): no method visible in this class acquires this lock.
+        self.stats_lock = threading.Lock()
+    
+    def process_video(self, uuid: str, video_path: str) -> dict:
+        """Extract one JPEG crop per qualifying face of a single video.
+
+        Reads ``<output_dir>/<uuid>.face.json`` and, when present,
+        ``<uuid>.face_traced.json`` (source of trace ids).  Faces are filtered
+        by confidence, size and presence of eye landmarks; the survivors are
+        cropped through extract_face() on a thread pool and a
+        ``_summary.json`` is written.
+
+        Traced faces are stored as ``<trace_id>/<frame>.jpg``.  Faces without
+        a trace id go to ``unbound/<frame>_<x>_<y>.jpg`` so that several
+        unbound faces of the same frame do not overwrite each other.
+
+        Args:
+            uuid: File UUID used to locate the JSON inputs and name the output folder.
+            video_path: Path of the source video.
+
+        Returns:
+            ``{"successful": [...], "failed": [...]}``, or ``{"error": ...}``
+            when face.json or the video is missing.
+        """
+        face_json = self.output_dir / f"{uuid}.face.json"
+        traced_json = self.output_dir / f"{uuid}.face_traced.json"
+
+        if not face_json.exists():
+            print(f"[ERROR] face.json not found: {uuid}")
+            return {"error": "face.json not found"}
+
+        if not os.path.exists(video_path):
+            print(f"[ERROR] Video not found: {video_path}")
+            return {"error": "video not found"}
+
+        # Load face.json (landmarks)
+        print(f"[LOAD] Reading {face_json}")
+        with open(face_json) as f:
+            face_data = json.load(f)
+
+        # Load face_traced.json if exists (trace_id)
+        traced_data = {}
+        if traced_json.exists():
+            print(f"[LOAD] Reading {traced_json}")
+            with open(traced_json) as f:
+                traced_data = json.load(f)
+
+        # Build lookup: (frame, x, y) -> trace_id from traced_data
+        trace_lookup: Dict[Tuple[int, int, int], int] = {}
+        frames = traced_data.get("frames", {})
+        if isinstance(frames, dict):
+            for fnum, frm in frames.items():
+                faces = frm.get("faces", [])
+                if faces is None:
+                    continue
+                for face in faces:
+                    if face is None:
+                        continue
+                    trace_id = face.get("trace_id")
+                    if trace_id and trace_id != 0:
+                        x = face.get("x", 0)
+                        y = face.get("y", 0)
+                        key = (int(fnum), x, y)
+                        trace_lookup[key] = trace_id
+
+        # Create output directory
+        uuid_dir = self.faces_dir / uuid
+        uuid_dir.mkdir(parents=True, exist_ok=True)
+
+        results = {"successful": [], "failed": []}
+        processed: Set[tuple] = set()  # (trace_id, frame) or ("unbound", frame, x, y)
+        trace_counts: Dict[int, int] = {}  # trace_id -> count
+
+        # face.json frames may be a dict keyed by frame number or a list of entries
+        frames = face_data.get("frames", {})
+        if isinstance(frames, dict):
+            frame_items = frames.items()
+        elif isinstance(frames, list):
+            frame_items = [(frm.get("frame"), frm) for frm in frames]
+        else:
+            frame_items = []
+
+        # Quality thresholds: detection confidence and minimum box side in pixels
+        min_confidence = 0.6
+        min_size = 20
+
+        # Collect extraction tasks
+        tasks = []
+        for fnum, frm in frame_items:
+            if fnum is None:
+                continue
+
+            faces = frm.get("faces", [])
+            if faces is None:
+                continue
+
+            for face in faces:
+                if face is None:
+                    continue
+
+                self.stats["total_faces"] += 1
+
+                # The box is either nested under "bbox" or stored on the face itself
+                bb = face.get("bbox", face)
+                x = bb.get("x", 0) if isinstance(bb, dict) else 0
+                y = bb.get("y", 0) if isinstance(bb, dict) else 0
+                w = bb.get("width", 0) if isinstance(bb, dict) else 0
+                h = bb.get("height", 0) if isinstance(bb, dict) else 0
+                confidence = face.get("confidence", 0.0)
+
+                if confidence < min_confidence:
+                    self.stats["low_confidence"] += 1
+                    continue
+                if w < min_size or h < min_size:
+                    self.stats["too_small"] += 1
+                    continue
+
+                # Check: has eyes (dict with an eye entry, or a list of >= 2 points)
+                lm = face.get("landmarks")
+                has_eyes = False
+                if lm:
+                    if isinstance(lm, dict):
+                        has_eyes = lm.get("left_eye") or lm.get("right_eye")
+                    elif isinstance(lm, list) and len(lm) >= 2:
+                        has_eyes = True
+
+                if not has_eyes:
+                    self.stats["skipped"] += 1
+                    continue
+
+                self.stats["qualified"] += 1
+
+                # Trace id comes from the traced file when available, else from the face
+                key = (int(fnum), x, y)
+                trace_id = trace_lookup.get(key) or face.get("trace_id")
+
+                if trace_id and trace_id != 0:
+                    output_dir = uuid_dir / str(trace_id)
+                    crop_key = (trace_id, int(fnum))
+                    file_name = f"{fnum}.jpg"
+                else:
+                    # No trace_id -> unbound directory.  The position is part
+                    # of the file name: the dedup key is per (frame, x, y), so
+                    # the file must be too, or concurrent ffmpeg jobs would
+                    # write the same path.
+                    output_dir = uuid_dir / "unbound"
+                    crop_key = ("unbound", int(fnum), x, y)
+                    file_name = f"{fnum}_{x}_{y}.jpg"
+
+                if crop_key in processed:
+                    continue
+                processed.add(crop_key)
+
+                output_dir.mkdir(parents=True, exist_ok=True)
+                output_path = output_dir / file_name
+
+                tasks.append({
+                    "trace_id": trace_id or "unbound",
+                    "frame": int(fnum),
+                    "x": x, "y": y, "w": w, "h": h,
+                    "output_path": output_path
+                })
+
+        # Parallel extraction; counters are only updated here, in the calling thread
+        print(f"[EXTRACT] Processing {len(tasks)} faces with {MAX_WORKERS} threads...")
+
+        with ThreadPoolExecutor(max_workers=MAX_WORKERS) as executor:
+            futures = {
+                executor.submit(
+                    self.extract_face, video_path, t["frame"],
+                    t["x"], t["y"], t["w"], t["h"], t["output_path"]
+                ): t for t in tasks
+            }
+
+            for i, future in enumerate(as_completed(futures)):
+                t = futures[future]
+                result = future.result()
+
+                if result["success"]:
+                    self.stats["successful"] += 1
+                    results["successful"].append({
+                        "trace_id": t["trace_id"],
+                        "frame": t["frame"],
+                        "path": str(t["output_path"])
+                    })
+                    trace_counts[t["trace_id"]] = trace_counts.get(t["trace_id"], 0) + 1
+                else:
+                    self.stats["failed"] += 1
+                    results["failed"].append({
+                        "trace_id": t["trace_id"],
+                        "frame": t["frame"],
+                        "bbox": {"x": t["x"], "y": t["y"], "w": t["w"], "h": t["h"]},
+                        "reason": result.get("reason", "unknown")
+                    })
+
+                # Progress every 1000
+                if (i + 1) % 1000 == 0:
+                    print(f"  Progress: {i+1}/{len(tasks)} ({self.stats['successful']} OK, {self.stats['failed']} fail)")
+
+        # Write summary
+        self.write_summary(uuid, trace_counts, results)
+
+        return results
+    
+    def extract_face(self, video_path: str, frame: int, x: int, y: int,
+                     w: int, h: int, output_path: Path,
+                     fps: float = 24.0) -> dict:
+        """Crop one face from one video frame with ffmpeg, retrying on failure.
+
+        The frame number is converted to a timestamp (``frame / fps``) and
+        passed to ffmpeg with ``-ss`` for fast seeking; the crop is written as
+        a JPEG to ``output_path`` and then validated with check_quality().
+        Up to MAX_RETRIES attempts are made.
+
+        Args:
+            video_path: Source video.
+            frame: Frame number of the face.
+            x, y, w, h: Crop rectangle in pixels.
+            output_path: Destination JPEG path.
+            fps: Frame rate used to convert ``frame`` to seconds.  Defaults to
+                24.0, the value that used to be hard-coded here.
+
+        Returns:
+            ``{"success": True, "path": ...}`` on success, otherwise
+            ``{"success": False, "reason": ...}``.
+        """
+        if fps <= 0:
+            return {"success": False, "reason": "invalid_fps"}
+
+        for attempt in range(MAX_RETRIES):
+            last_attempt = attempt == MAX_RETRIES - 1
+            try:
+                ts = frame / fps
+                cmd = [
+                    "ffmpeg", "-y", "-ss", f"{ts:.3f}",
+                    "-i", video_path,
+                    "-vf", f"crop={w}:{h}:{x}:{y}",
+                    "-frames:v", "1",
+                    "-q:v", "2",  # high-quality JPEG
+                    str(output_path)
+                ]
+
+                proc = subprocess.run(
+                    cmd, stdout=subprocess.DEVNULL, stderr=subprocess.DEVNULL,
+                    timeout=FFMPEG_TIMEOUT
+                )
+
+                if proc.returncode != 0:
+                    if last_attempt:
+                        return {"success": False, "reason": "ffmpeg_failed"}
+                    continue
+
+                # Quality check
+                quality = self.check_quality(output_path)
+                if quality["ok"]:
+                    return {"success": True, "path": str(output_path)}
+
+                # Never leave a rejected crop on disk, including after the
+                # final attempt, so the output folder only holds good crops.
+                if output_path.exists():
+                    output_path.unlink()
+
+                if last_attempt:
+                    return {"success": False, "reason": quality.get("reason", "quality_failed")}
+
+            except subprocess.TimeoutExpired:
+                if last_attempt:
+                    return {"success": False, "reason": "timeout"}
+            except Exception as e:
+                return {"success": False, "reason": str(e)}
+
+        return {"success": False, "reason": "max_retries"}
+    
+    def check_quality(self, path: Path) -> dict:
+        """Check that an extracted crop is a usable image.
+
+        A crop is rejected when the file is missing, smaller than
+        MIN_FILE_SIZE bytes, darker than MIN_BRIGHTNESS on average, or has a
+        pixel standard deviation below MIN_STD_DEV.
+
+        Args:
+            path: Path of the JPEG to inspect.
+
+        Returns:
+            ``{"ok": True}`` or ``{"ok": False, "reason": ...}``.  When PIL or
+            numpy cannot be imported only the existence and size checks apply.
+        """
+        if not path.exists():
+            return {"ok": False, "reason": "file_not_exist"}
+
+        file_size = path.stat().st_size
+        if file_size < MIN_FILE_SIZE:
+            return {"ok": False, "reason": f"empty_file ({file_size}B)"}
+
+        try:
+            from PIL import Image
+            import numpy as np
+
+            # The context manager closes the file handle; this method runs
+            # once per crop, so unclosed handles would pile up.
+            with Image.open(path) as img:
+                arr = np.array(img.convert('RGB'))
+
+            mean_brightness = arr.mean()
+            if mean_brightness < MIN_BRIGHTNESS:
+                return {"ok": False, "reason": f"black_frame (mean={mean_brightness:.1f})"}
+
+            std_dev = arr.std()
+            if std_dev < MIN_STD_DEV:
+                return {"ok": False, "reason": f"low_contrast (std={std_dev:.1f})"}
+
+            return {"ok": True}
+
+        except ImportError:
+            # PIL not available, skip advanced quality check
+            return {"ok": True}
+        except Exception as e:
+            return {"ok": False, "reason": str(e)}
+    
+    def write_summary(self, uuid: str, trace_counts: Dict[int, int], results: dict):
+        """Write ``_summary.json`` for one processed video.
+
+        Args:
+            uuid: File UUID; the summary goes to ``<faces_dir>/<uuid>/_summary.json``.
+            trace_counts: Number of successful crops per trace id.
+            results: Dict with a ``"failed"`` list, as built by process_video().
+        """
+        summary_path = self.faces_dir / uuid / "_summary.json"
+
+        summary = {
+            "file_uuid": uuid,
+            "timestamp": datetime.now().isoformat(),
+            "stats": self.stats,
+            "trace_counts": trace_counts,
+            "total_traces": len(trace_counts),
+            "failed_count": len(results["failed"]),
+            "failed_faces": results["failed"] if results["failed"] else None
+        }
+
+        # ensure_ascii=False emits non-ASCII text verbatim, so the file must be
+        # opened as UTF-8 rather than with the locale's default encoding.
+        with open(summary_path, "w", encoding="utf-8") as f:
+            json.dump(summary, f, indent=2, ensure_ascii=False)
+
+        print(f"\n[SUMMARY] Written to {summary_path}")
+    
+    def print_stats(self):
+        """Print the accumulated counters as a short report on stdout."""
+        report = [
+            ("Total faces scanned", "total_faces"),
+            ("Filtered (low confidence < 0.6)", "low_confidence"),
+            ("Filtered (too small < 20px)", "too_small"),
+            ("Qualified (trace_id + eyes)", "qualified"),
+            ("Successfully extracted", "successful"),
+            ("Failed", "failed"),
+            ("Skipped (no trace/eyes)", "skipped"),
+        ]
+        print("\n=== Statistics ===")
+        for label, counter in report:
+            print(f"{label}: {self.stats[counter]}")
+
+
+def main():
+    """Command-line entry point: parse arguments, resolve the video, run the extraction."""
+    cli = argparse.ArgumentParser(
+        description="Extract face crops from videos",
+        formatter_class=argparse.RawDescriptionHelpFormatter,
+        epilog=__doc__,
+    )
+    cli.add_argument("--uuid", type=str, required=True,
+                     help="File UUID to process")
+    cli.add_argument("--video", type=str,
+                     help="Video file path (optional, will check DB if not provided)")
+    cli.add_argument("--output-dir", type=str,
+                     default="/Users/accusys/momentry/output_dev",
+                     help="Output directory (default: output_dev)")
+    opts = cli.parse_args()
+
+    # Without --video the path is looked up in the database; give up if that fails too.
+    video_path = opts.video or query_video_path_from_db(opts.uuid)
+    if not video_path:
+        print(f"[ERROR] Video path not found for UUID: {opts.uuid}")
+        sys.exit(1)
+
+    for banner_line in (
+        "=== Face Crop Extraction ===",
+        f"UUID: {opts.uuid}",
+        f"Video: {video_path}",
+        f"Output: {opts.output_dir}/.faces/{opts.uuid}/",
+    ):
+        print(banner_line)
+    print()
+
+    extractor = FaceCropExtractor(opts.output_dir)
+    extractor.process_video(opts.uuid, video_path)
+    extractor.print_stats()
+
+
+def query_video_path_from_db(uuid: str) -> Optional[str]:
+    """Look up a video's file path in PostgreSQL by file UUID, using psql.
+
+    Args:
+        uuid: Value matched against ``public.videos.file_uuid``.
+
+    Returns:
+        The ``file_path`` of the first matching row, or None when psql is not
+        installed at the expected location, the query fails or times out, or
+        no row matches.
+    """
+    psql_path = "/opt/homebrew/Cellar/libpq/18.3/bin/psql"
+
+    if not os.path.exists(psql_path):
+        return None
+
+    # The UUID is handed to psql as a variable and quoted by psql itself
+    # (:'file_uuid'), so it is never spliced into the SQL text.  The query is
+    # sent on stdin because psql does not interpolate variables in -c strings.
+    cmd = [
+        psql_path, "-X", "-q", "-U", "accusys", "-d", "momentry", "-t", "-A",
+        "-v", f"file_uuid={uuid}",
+    ]
+    sql = "SELECT file_path FROM public.videos WHERE file_uuid = :'file_uuid' LIMIT 1;\n"
+
+    try:
+        proc = subprocess.run(cmd, input=sql, capture_output=True, text=True, timeout=5)
+    except Exception:
+        return None
+
+    if proc.returncode != 0:
+        return None
+
+    path = proc.stdout.strip()
+    return path if path else None
+
+
+if __name__ == "__main__":
+    main()
\ No newline at end of file
diff --git a/scripts/extract_video_embeddings.py b/scripts/extract_video_embeddings.py
new file mode 100644
index 0000000..5a2f39b
--- /dev/null
+++ b/scripts/extract_video_embeddings.py
@@ -0,0 +1,174 @@
+#!/opt/homebrew/bin/python3.11
+"""
+Extract face embeddings for a video file using InsightFace + CoreML FaceNet.
+Updates face_detections.embedding in PostgreSQL.
+
+Usage: python3 scripts/extract_video_embeddings.py --file-uuid <uuid> --video-path <path>
+"""
+
+import argparse
+import json
+import os
+import sys
+import io
+import warnings
+import cv2
+import numpy as np
+import psycopg2
+from psycopg2.extras import execute_values
+
+warnings.filterwarnings("ignore")
+
+DATABASE_URL = os.getenv("DATABASE_URL", "postgres://accusys@localhost:5432/momentry")
+MODELS_DIR = os.path.join(os.path.dirname(os.path.abspath(__file__)), "..", "models")
+FACENET_PATH = os.path.join(MODELS_DIR, "facenet512.mlpackage")
+
+
+def get_schema():
+    """Pick the database schema from the environment.
+
+    Returns:
+        ``"dev"`` when DATABASE_URL contains ``search_path=dev`` or the
+        DATABASE_SCHEMA environment variable equals ``dev``; otherwise
+        ``"public"``.
+    """
+    db_url = os.getenv("DATABASE_URL", "")
+    # Compare the variable's value; testing `"DATABASE_SCHEMA=dev" in os.environ`
+    # looks for a variable literally named "DATABASE_SCHEMA=dev" and never matches.
+    if "search_path=dev" in db_url or os.environ.get("DATABASE_SCHEMA") == "dev":
+        return "dev"
+    return "public"
+
+
+def extract_video_embeddings(file_uuid: str, video_path: str, schema: str = "dev"):
+    """Fill in missing face embeddings for one video using InsightFace.
+
+    Rows of ``<schema>.face_detections`` for ``file_uuid`` whose ``embedding``
+    is NULL are loaded.  InsightFace is run on every referenced frame, each
+    stored box is matched to the detection with the highest IoU (which must
+    exceed 0.3), and that detection's embedding is written back to the row.
+
+    Args:
+        file_uuid: Video file UUID used to select rows.
+        video_path: Path of the video to read frames from.
+        schema: Database schema holding ``face_detections``.
+
+    Returns:
+        None.  Progress and results are printed.
+    """
+    # Suppress InsightFace verbose output while the models load
+    old_stdout = sys.stdout
+    sys.stdout = io.StringIO()
+    try:
+        from insightface.app import FaceAnalysis
+
+        app = FaceAnalysis(name="buffalo_l", providers=["CPUExecutionProvider"])
+        app.prepare(ctx_id=0, det_thresh=0.5)
+        # The CoreML FaceNet model is no longer loaded here: nothing below used
+        # it, and a missing model file would abort the run for no reason.
+    finally:
+        sys.stdout = old_stdout
+
+    cap = cv2.VideoCapture(video_path)
+    conn = None
+    cur = None
+    try:
+        if not cap.isOpened():
+            print(f"[EMBED] Cannot open video: {video_path}")
+            return
+
+        fps = cap.get(cv2.CAP_PROP_FPS)
+        total_frames = int(cap.get(cv2.CAP_PROP_FRAME_COUNT))
+        print(f"[EMBED] Video: {total_frames} frames, {fps} fps")
+
+        # Get face detections from DB (without embeddings)
+        conn = psycopg2.connect(DATABASE_URL)
+        cur = conn.cursor()
+
+        cur.execute(f"""
+            SELECT id, frame_number, x, y, width, height 
+            FROM {schema}.face_detections 
+            WHERE file_uuid = %s AND embedding IS NULL
+            ORDER BY frame_number
+        """, (file_uuid,))
+
+        face_records = cur.fetchall()
+        print(f"[EMBED] Faces without embedding: {len(face_records)}")
+
+        if len(face_records) == 0:
+            print("[EMBED] All faces have embeddings")
+            return
+
+        # Build frame -> faces mapping
+        frame_faces = {}
+        for face_id, frame_num, x, y, w, h in face_records:
+            frame_faces.setdefault(frame_num, []).append((face_id, x, y, w, h))
+
+        # Extract embeddings
+        batch_updates = []
+        processed_frames = 0
+
+        for frame_num in sorted(frame_faces.keys()):
+            cap.set(cv2.CAP_PROP_POS_FRAMES, frame_num)
+            ret, frame = cap.read()
+
+            if not ret:
+                continue
+
+            # Detect faces in this frame
+            faces = app.get(frame)
+
+            for face_id, x, y, w, h in frame_faces[frame_num]:
+                # Find the detection that overlaps the stored box the most
+                best_face = None
+                best_iou = 0
+
+                for det_face in faces:
+                    fx1, fy1, fx2, fy2 = det_face.bbox
+                    fw, fh = fx2 - fx1, fy2 - fy1
+
+                    # Intersection over union of stored box and detection
+                    xi1, yi1 = max(x, fx1), max(y, fy1)
+                    xi2, yi2 = min(x + w, fx2), min(y + h, fy2)
+                    inter_w, inter_h = max(0, xi2 - xi1), max(0, yi2 - yi1)
+                    inter = inter_w * inter_h
+                    union = w * h + fw * fh - inter
+
+                    iou = inter / union if union > 0 else 0
+
+                    if iou > best_iou:
+                        best_iou = iou
+                        best_face = det_face
+
+                # Explicit None test: do not rely on the truthiness of the detection object
+                if best_face is not None and best_iou > 0.3:
+                    embedding = best_face.embedding
+
+                    if embedding is not None and len(embedding) > 0:
+                        batch_updates.append((embedding.tolist(), face_id))
+
+            processed_frames += 1
+            if processed_frames % 100 == 0:
+                print(f"[EMBED] Progress: {processed_frames} frames, {len(batch_updates)} embeddings")
+
+        # Update embeddings in DB
+        if batch_updates:
+            print(f"[EMBED] Updating {len(batch_updates)} embeddings...")
+
+            for emb, face_id in batch_updates:
+                cur.execute(f"""
+                    UPDATE {schema}.face_detections
+                    SET embedding = %s
+                    WHERE id = %s
+                """, (emb, face_id))
+
+            conn.commit()
+
+            # Verify
+            cur.execute(f"""
+                SELECT COUNT(embedding) FROM {schema}.face_detections 
+                WHERE file_uuid = %s
+            """, (file_uuid,))
+            embed_count = cur.fetchone()[0]
+
+            print(f"[EMBED] Done: {embed_count} faces with embeddings")
+    finally:
+        # Release the capture and the connection on every exit path,
+        # including exceptions raised while reading frames or querying.
+        cap.release()
+        if cur is not None:
+            cur.close()
+        if conn is not None:
+            conn.close()
+
+
+def main():
+    """Parse --file-uuid, --video-path and --schema, then run the extraction."""
+    parser = argparse.ArgumentParser(description="Extract face embeddings from video")
+    parser.add_argument("--file-uuid", required=True, help="Video file UUID")
+    parser.add_argument("--video-path", required=True, help="Video file path")
+    # The schema default is computed by get_schema() when the parser is built.
+    parser.add_argument("--schema", default=get_schema(), help="Database schema")
+    args = parser.parse_args()
+
+    extract_video_embeddings(args.file_uuid, args.video_path, args.schema)
+
+
+if __name__ == "__main__":
+    main()
\ No newline at end of file
diff --git a/scripts/insert_face_detections.py b/scripts/insert_face_detections.py
new file mode 100644
index 0000000..3c1f6d1
--- /dev/null
+++ b/scripts/insert_face_detections.py
@@ -0,0 +1,64 @@
+#!/opt/homebrew/bin/python3.11
+"""Insert face detections from traced JSON into DB."""
+import json, os, sys
+import psycopg2
+import psycopg2.extras
+
+DB_URL = os.environ.get("DATABASE_URL", "postgresql://accusys@localhost:5432/momentry")
+
+def insert_faces(file_uuid, traced_json_path, schema):
+    """Insert every face of a traced face JSON into ``<schema>.face_detections``.
+
+    Each row is inserted inside its own savepoint, so a failing row is skipped
+    without discarding the rows inserted before it.  Rows that conflict with
+    existing ones are ignored (``ON CONFLICT DO NOTHING``).
+
+    Args:
+        file_uuid: UUID stored in the ``file_uuid`` column of every row.
+        traced_json_path: JSON file with a ``frames`` dict keyed by frame
+            number (each value holding a ``faces`` list) and optional
+            ``metadata.fps``.
+        schema: Database schema holding ``face_detections``.
+    """
+    conn = psycopg2.connect(DB_URL)
+    cur = conn.cursor()
+
+    try:
+        with open(traced_json_path) as f:
+            data = json.load(f)
+
+        frames = data.get("frames", {})
+        metadata = data.get("metadata", {})
+        # A missing, null or zero fps would break the timestamp division below.
+        fps = metadata.get("fps") or 24.0
+
+        total = 0
+        for frame_num_str, frame_data in sorted(frames.items(), key=lambda x: int(x[0])):
+            frame_num = int(frame_num_str)
+            ts = frame_num / fps
+            faces = frame_data.get("faces", [])
+
+            for face in faces:
+                x = int(face.get("x", 0))
+                y = int(face.get("y", 0))
+                w = int(face.get("width", 0))
+                h = int(face.get("height", 0))
+                confidence = face.get("confidence", 0.0)
+                trace_id = face.get("trace_id")
+                embedding = face.get("embedding")
+
+                # A plain conn.rollback() here would undo every earlier insert
+                # of this run; the savepoint limits the rollback to this row.
+                cur.execute("SAVEPOINT face_row")
+                try:
+                    cur.execute(
+                        f"""
+                        INSERT INTO {schema}.face_detections
+                            (file_uuid, frame_number, timestamp_secs, x, y, width, height, confidence, trace_id, embedding)
+                        VALUES (%s, %s, %s, %s, %s, %s, %s, %s, %s, %s)
+                        ON CONFLICT DO NOTHING
+                        """,
+                        (file_uuid, frame_num, ts, x, y, w, h, confidence, trace_id, embedding),
+                    )
+                    inserted = cur.rowcount
+                    cur.execute("RELEASE SAVEPOINT face_row")
+                except Exception as e:
+                    print(f"[INSERT] Error at frame {frame_num}: {e}")
+                    cur.execute("ROLLBACK TO SAVEPOINT face_row")
+                    continue
+
+                if inserted > 0:
+                    total += 1
+
+        conn.commit()
+    finally:
+        # Close the cursor and connection even when loading or inserting raised.
+        cur.close()
+        conn.close()
+
+    print(f"[INSERT] Inserted {total} face detections into {schema}.face_detections")
+
+if __name__ == "__main__":
+    # CLI entry point: --file-uuid and --face-json are required,
+    # --schema defaults to "public".
+    import argparse
+    parser = argparse.ArgumentParser(description="Insert face detections")
+    parser.add_argument("--file-uuid", required=True)
+    parser.add_argument("--face-json", required=True)
+    parser.add_argument("--schema", default="public")
+    args = parser.parse_args()
+
+    insert_faces(args.file_uuid, args.face_json, args.schema)
diff --git a/scripts/match_faces_to_tmdb.py b/scripts/match_faces_to_tmdb.py
new file mode 100644
index 0000000..890ffbc
--- /dev/null
+++ b/scripts/match_faces_to_tmdb.py
@@ -0,0 +1,201 @@
+#!/opt/homebrew/bin/python3.11
+"""
+Match face_detections against TMDb identities via face embedding similarity.
+Port of match_faces_against_tmdb from src/core/tmdb/face_agent.rs
+
+Usage: python3 scripts/match_faces_to_tmdb.py <file_uuid> [--schema dev]
+"""
+
+import sys
+import psycopg2
+import psycopg2.extras
+import numpy as np
+from collections import defaultdict
+
+DATABASE_URL = "postgres://accusys@localhost:5432/momentry"
+THRESHOLD = 0.50
+QC_MIN_FACES = 4  # Minimum faces per trace for QC
+
+
+def cosine_similarity(a, b):
+    """Return the cosine similarity of two vectors, or 0.0 if either has zero norm."""
+    vec_a = np.array(a, dtype=np.float64)
+    vec_b = np.array(b, dtype=np.float64)
+    norm_a = np.linalg.norm(vec_a)
+    norm_b = np.linalg.norm(vec_b)
+    if norm_a != 0 and norm_b != 0:
+        return np.dot(vec_a, vec_b) / (norm_a * norm_b)
+    # A zero vector has no direction, so it is treated as dissimilar to everything.
+    return 0.0
+
+
+def match_faces_to_tmdb(file_uuid: str, schema: str = "dev"):
+    """Bind face traces of one video to TMDb identities by embedding similarity.
+
+    Steps: load TMDb identities that have a face embedding, load the video's
+    face detections that have both a trace id and an embedding, score every
+    trace against every identity with cosine similarity, drop weak or
+    conflicting matches, and set ``identity_id`` on the detections of the
+    surviving traces.
+
+    Args:
+        file_uuid: Video file UUID whose detections are matched.
+        schema: Database schema holding ``identities`` and ``face_detections``.
+
+    Returns:
+        Number of ``face_detections`` rows updated (0 when there is nothing
+        to match).
+    """
+    conn = psycopg2.connect(DATABASE_URL)
+    cur = conn.cursor(cursor_factory=psycopg2.extras.RealDictCursor)
+
+    # Step 1: Load TMDb identities with face embeddings
+    cur.execute(f"""
+        SELECT id, name, tmdb_id, face_embedding::real[] as embedding
+        FROM {schema}.identities
+        WHERE source = 'tmdb' AND face_embedding IS NOT NULL
+    """)
+    tmdb_identities = []
+    for row in cur.fetchall():
+        emb = row["embedding"]
+        if emb and len(emb) > 0:
+            tmdb_identities.append({
+                "id": row["id"],
+                "name": row["name"],
+                "tmdb_id": row["tmdb_id"],
+                "embedding": emb,
+            })
+
+    print(f"[TMDB-MATCH] Loaded {len(tmdb_identities)} TMDb identities")
+
+    if not tmdb_identities:
+        print("[TMDB-MATCH] No TMDb identities with embeddings")
+        cur.close()
+        conn.close()
+        return 0
+
+    # Step 2: Load face_detections with trace_id and embedding
+    cur.execute(f"""
+        SELECT id, trace_id, frame_number, embedding::real[] as embedding, confidence
+        FROM {schema}.face_detections
+        WHERE file_uuid = %s AND trace_id IS NOT NULL AND embedding IS NOT NULL
+        ORDER BY trace_id, frame_number
+    """, (file_uuid,))
+
+    fd_rows = cur.fetchall()
+    if not fd_rows:
+        print(f"[TMDB-MATCH] No face detections for {file_uuid}")
+        cur.close()
+        conn.close()
+        return 0
+
+    # Group by trace_id
+    trace_faces = defaultdict(list)
+    for row in fd_rows:
+        trace_id = row["trace_id"]
+        emb = row["embedding"]
+        if emb:
+            trace_faces[trace_id].append({
+                "id": row["id"],
+                "embedding": emb,
+                "frame": row["frame_number"],
+                "confidence": row["confidence"],
+            })
+
+    # Dedup near-identical embeddings within trace (sim > 0.99).
+    # Faces are ordered by their first embedding component and each face is
+    # compared only with the last one kept, so this catches duplicates that end
+    # up adjacent in that ordering.  Dropped faces are also excluded from the
+    # QC count (step 4) and from the identity update (step 6).
+    for tid, faces in trace_faces.items():
+        faces.sort(key=lambda x: x["embedding"][0])
+        unique = []
+        for f in faces:
+            if not unique or cosine_similarity(f["embedding"], unique[-1]["embedding"]) <= 0.99:
+                unique.append(f)
+        trace_faces[tid] = unique
+
+    total_traces = len(trace_faces)
+    # Counts all loaded rows, i.e. before the dedup above.
+    total_faces = len(fd_rows)
+    print(f"[TMDB-MATCH] {total_traces} traces with {total_faces} faces")
+
+    # Step 3: Single-pass matching (one round only for performance)
+    matched = {}  # trace_id → (identity_id, name, score)
+
+    # Build reference pool from TMDb seeds only
+    reference_pool = []
+    for tmdb in tmdb_identities:
+        reference_pool.append({
+            "embedding": tmdb["embedding"],
+            "identity_id": tmdb["id"],
+            "name": tmdb["name"],
+        })
+
+    print(f"[TMDB-MATCH] Matching {total_traces} traces against {len(reference_pool)} TMDb identities (threshold={THRESHOLD})")
+
+    # Match each trace against TMDb seeds: collect, per identity, the
+    # similarities of all faces of the trace that reach THRESHOLD
+    for tid, faces in trace_faces.items():
+        trace_scores = defaultdict(list)
+        for f in faces:
+            for ref in reference_pool:
+                sim = cosine_similarity(f["embedding"], ref["embedding"])
+                if sim >= THRESHOLD:
+                    trace_scores[ref["identity_id"]].append((sim, ref["name"]))
+
+        if not trace_scores:
+            continue
+
+        # Select the identity with the highest mean similarity; only scores
+        # at or above THRESHOLD enter the mean
+        best_identity = None
+        best_score = 0
+        best_name = None
+
+        for identity_id, scores in trace_scores.items():
+            avg_sim = np.mean([s[0] for s in scores])
+            if avg_sim > best_score:
+                best_score = avg_sim
+                best_identity = identity_id
+                best_name = scores[0][1]
+
+        # NOTE(review): truthiness test; an identity id of 0 would be skipped.
+        if best_identity:
+            matched[tid] = (best_identity, best_name, best_score)
+
+    # Step 4: Quality Control - minimum faces per trace
+    qc_removed = 0
+    for tid, faces in trace_faces.items():
+        if tid in matched and len(faces) < QC_MIN_FACES:
+            del matched[tid]
+            qc_removed += 1
+
+    # Step 5: Temporal collision check. Count, per frame, how many matched
+    # faces claim each identity; the counts are computed once, before any
+    # trace is removed below.
+    frame_identity_count = defaultdict(lambda: defaultdict(int))
+    for tid, faces in trace_faces.items():
+        if tid in matched:
+            identity_id = matched[tid][0]
+            for f in faces:
+                frame_identity_count[f["frame"]][identity_id] += 1
+
+    for frame, identity_counts in frame_identity_count.items():
+        for identity_id, count in identity_counts.items():
+            if count > 1:
+                # Same identity more than once in one frame: keep the trace
+                # whose face has the highest confidence, unmatch the rest
+                conflicting = []
+                for tid, faces in trace_faces.items():
+                    if tid in matched and matched[tid][0] == identity_id:
+                        for f in faces:
+                            if f["frame"] == frame:
+                                conflicting.append((tid, f["confidence"]))
+
+                conflicting.sort(key=lambda x: x[1], reverse=True)
+                for tid, _ in conflicting[1:]:
+                    if tid in matched:
+                        del matched[tid]
+                        qc_removed += 1
+
+    if qc_removed > 0:
+        print(f"[TMDB-MATCH] QC removed {qc_removed} traces")
+
+    # Step 6: Update face_detections.identity_id (rows already bound are left alone)
+    bindings_created = 0
+    for tid, (identity_id, name, score) in matched.items():
+        for f in trace_faces[tid]:
+            cur.execute(f"""
+                UPDATE {schema}.face_detections
+                SET identity_id = %s
+                WHERE id = %s AND identity_id IS NULL
+            """, (identity_id, f["id"]))
+            bindings_created += cur.rowcount
+
+    conn.commit()
+    cur.close()
+    conn.close()
+
+    print(f"[TMDB-MATCH] {bindings_created} bindings created, {len(matched)} traces matched")
+    return bindings_created
+
+
+if __name__ == "__main__":
+    # CLI entry point: positional file_uuid, optional --schema (default "dev").
+    import argparse
+    parser = argparse.ArgumentParser()
+    parser.add_argument("file_uuid", help="Video file UUID")
+    parser.add_argument("--schema", default="dev", help="Database schema")
+    args = parser.parse_args()
+
+    match_faces_to_tmdb(args.file_uuid, args.schema)
\ No newline at end of file
diff --git a/scripts/ocr_processor.py b/scripts/ocr_processor.py
index 04a1091..bcf5de7 100755
--- a/scripts/ocr_processor.py
+++ b/scripts/ocr_processor.py
@@ -84,18 +84,31 @@ def process_ocr(
 
 
 def _fallback(video_path, output_path, uuid, sample_interval):
-    """Fallback to original PaddleOCR implementation"""
-    import importlib
+    """Run OCR through the MPS implementation in ocr_processor_mps.py.
+
+    Returns whatever that module's process_video_ocr() returns, or an empty
+    result dict when the fallback script cannot be loaded. `uuid` is kept for
+    signature compatibility and is not forwarded to the MPS implementation.
+    """
+    # `import importlib` alone does not guarantee the `util` submodule is loaded.
+    import importlib.util
+    fallback_path = os.path.join(os.path.dirname(__file__), "ocr_processor_mps.py")
     spec = importlib.util.spec_from_file_location(
-        "paddle_ocr",
-        os.path.join(os.path.dirname(__file__), "ocr_paddle.py")
+        "ocr_mps",
+        fallback_path
     )
-    if spec is None:
+    # spec_from_file_location() does not verify that the file exists, so a
+    # missing script must be detected here to reach the empty-result path.
+    if spec is None or spec.loader is None or not os.path.isfile(fallback_path):
         print("[OCR] No fallback available, returning empty result", file=sys.stderr)
         return {"frame_count": 0, "fps": 0, "frames": []}
-    paddle = importlib.util.module_from_spec(spec)
-    spec.loader.exec_module(paddle)
-    return paddle.process_ocr(video_path, output_path, uuid, sample_interval=sample_interval)
+    ocr_mps = importlib.util.module_from_spec(spec)
+    spec.loader.exec_module(ocr_mps)
+    return ocr_mps.process_video_ocr(
+        video_path=video_path,
+        output_path=output_path,
+        sample_interval=sample_interval
+    )
 
 
 if __name__ == "__main__":
diff --git a/scripts/qdrant_sync_collection.py b/scripts/qdrant_sync_collection.py
new file mode 100644
index 0000000..8f634ea
--- /dev/null
+++ b/scripts/qdrant_sync_collection.py
@@ -0,0 +1,98 @@
+#!/usr/bin/env python3
+"""Sync all vectors from one Qdrant collection to another on the same instance.
+
+Connection settings can be overridden with the QDRANT_URL and QDRANT_API_KEY
+environment variables; the literals below are only fallback defaults.
+"""
+import json
+import os
+import sys
+import time
+import urllib.request
+import urllib.error
+
+QDRANT_URL = os.getenv("QDRANT_URL", "http://localhost:6333")
+# NOTE(review): a credential should not live in source control; prefer setting
+# QDRANT_API_KEY in the environment and rotating this fallback key.
+API_KEY = os.getenv("QDRANT_API_KEY", "Test3200Test3200Test3200")
+SOURCE = "momentry_dev_rule1_v2"
+TARGET = "momentry_rule1"
+BATCH_SIZE = 500
+SLEEP = 0.05
+HTTP_TIMEOUT = 60  # seconds; keeps a stalled request from hanging the sync
+
+
+def qdrant(method, path, body=None):
+    """Send a JSON request to Qdrant and return the decoded JSON response.
+
+    HTTP error responses are printed and the HTTPError is re-raised.
+    """
+    url = f"{QDRANT_URL}{path}"
+    # Test against None so an empty-but-present body is still serialized.
+    data = json.dumps(body).encode() if body is not None else None
+    req = urllib.request.Request(url, data=data, method=method)
+    req.add_header("Content-Type", "application/json")
+    req.add_header("Api-Key", API_KEY)
+    try:
+        with urllib.request.urlopen(req, timeout=HTTP_TIMEOUT) as resp:
+            return json.loads(resp.read())
+    except urllib.error.HTTPError as e:
+        print(f"  HTTP {e.code}: {e.read().decode()}")
+        raise
+
+
+def scroll_batch(offset=None):
+    """Fetch one page of SOURCE points; return (points, next_page_offset)."""
+    body = {"limit": BATCH_SIZE, "with_payload": True, "with_vector": True}
+    if offset is not None:
+        body["offset"] = offset
+    result = qdrant("POST", f"/collections/{SOURCE}/points/scroll", body)
+    page = result.get("result", {})
+    return page.get("points", []), page.get("next_page_offset")
+
+
+def upsert_batch(points):
+    """Write the given points into TARGET; return True when Qdrant reports ok."""
+    result = qdrant("PUT", f"/collections/{TARGET}/points", {"points": points})
+    return result.get("status") == "ok" or result.get("result", {}).get("status") == "ok"
+
+
+def main():
+    """Copy every point from SOURCE to TARGET; return a process exit code."""
+    offset = None
+    total = 0
+    batch_num = 0
+    failed = False
+    t0 = time.time()
+
+    while True:
+        points, offset = scroll_batch(offset)
+        if not points:
+            break
+
+        if not upsert_batch(points):
+            print(f"  FAILED batch {batch_num} ({len(points)} pts)")
+            failed = True
+            break
+
+        total += len(points)
+        batch_num += 1
+        if batch_num % 10 == 0:
+            elapsed = time.time() - t0
+            print(f"  Synced {total} points ({elapsed:.1f}s)")
+
+        if offset is None:
+            break
+        time.sleep(SLEEP)
+
+    elapsed = time.time() - t0
+    if failed:
+        # A failed upsert must not be reported as a completed sync.
+        print(f"Aborted after {total} points ({elapsed:.1f}s)")
+        return 1
+    print(f"Done: {total} points synced in {elapsed:.1f}s")
+    return 0
+
+
+if __name__ == "__main__":
+    sys.exit(main())
diff --git a/scripts/start_momentry.sh b/scripts/start_momentry.sh
index 9f19fd8..8a12d67 100755
--- a/scripts/start_momentry.sh
+++ b/scripts/start_momentry.sh
@@ -4,6 +4,24 @@ SCRIPT_DIR="$(cd "$(dirname "$0")" && pwd)"
 PROJECT_DIR="$(dirname "$SCRIPT_DIR")"
 ENV_FILE="${PROJECT_DIR}/.env.development"
 
+# Load .env.development into this shell; a missing or unreadable file is ignored
+source "$ENV_FILE" 2>/dev/null || true
+
+# Paths and credentials: a MOMENTRY_* value set above wins, otherwise the default after ":-" is used
+LOG_DIR="${MOMENTRY_LOG_DIR:-/Users/accusys/momentry/logs}"
+PG_BIN_DIR="${MOMENTRY_PG_BIN_DIR:-/Users/accusys/pgsql/18.3/bin}"
+PG_DATA_DIR="${MOMENTRY_PG_DATA_DIR:-/Users/accusys/pgsql/data}"
+QDRANT_BIN="${MOMENTRY_QDRANT_BIN:-/Users/accusys/.cargo/bin/qdrant}"
+QDRANT_STORAGE_DIR="${MOMENTRY_QDRANT_STORAGE_DIR:-/Users/accusys/momentry/qdrant_storage}"
+LLAMACPP_BIN="${MOMENTRY_LLAMACPP_BIN:-/Users/accusys/llama/bin/llama-server}"
+A4B_MODEL="${MOMENTRY_LLM_A4B_MODEL_PATH:-/Users/accusys/models/google_gemma-4-26B-A4B-it-Q5_K_M.gguf}"
+A4B_MMPROJ="${MOMENTRY_LLM_A4B_MMPROJ_PATH:-/Users/accusys/models/gemma-4-26B-A4B-it.mmproj-f16.gguf}"
+E4B_MODEL="${MOMENTRY_LLM_E4B_MODEL_PATH:-/Users/accusys/models/gemma-4-E4B-it-Q4_K_M.gguf}"
+E4B_MMPROJ="${MOMENTRY_LLM_E4B_MMPROJ_PATH:-/Users/accusys/models/mmproj-gemma-4-E4B-it-BF16.gguf}"
+OLLAMA_BIN="${MOMENTRY_OLLAMA_BIN:-/Users/accusys/bin/ollama}"
+PLAYGROUND_BIN="${MOMENTRY_PLAYGROUND_BIN:-target/debug/momentry_playground}"
+API_KEY="${MOMENTRY_API_KEY:-muser_68600856036340bcafc01930eb4bd839_1774418104_97221b69}"  # NOTE(review): the default embeds an API key in source; confirm it is a dev-only key
+
 # Colors
 GREEN='\033[0;32m'
 YELLOW='\033[1;33m'
@@ -17,27 +35,23 @@ check() {
     if [ $? -eq 0 ]; then echo -e "  ${GREEN}✅${NC} $1"; else echo -e "  ${RED}❌${NC} $1"; FAILURES+=("$1"); fi
 }
 
-echo -e "${CYAN}====================================${NC}"
+echo -e "${CYAN}========================================${NC}"
 echo -e "${CYAN}  Momentry Core - Startup Sequence${NC}"
-echo -e "${CYAN}====================================${NC}"
+echo -e "${CYAN}========================================${NC}"
 echo ""
 
-LOG_DIR="/Users/accusys/momentry/logs"
-
 # ── 1. PostgreSQL ──
-echo -e "${YELLOW}[1/8] PostgreSQL${NC}"
-PG_DATA="/Users/accusys/pgsql/data"
-PG_BIN="/Users/accusys/pgsql/18.3/bin"
-if $PG_BIN/pg_isready -q 2>/dev/null; then
+echo -e "${YELLOW}[1/10] PostgreSQL${NC}"
+if "$PG_BIN_DIR/pg_isready" -q 2>/dev/null; then
     echo -e "  ${GREEN}✅${NC} already running"
 else
-    $PG_BIN/pg_ctl -D "$PG_DATA" -l "$LOG_DIR/pg.log" start 2>/dev/null
+    "$PG_BIN_DIR/pg_ctl" -D "$PG_DATA_DIR" -l "$LOG_DIR/pg.log" start 2>/dev/null
     sleep 2
-    $PG_BIN/pg_isready -q 2>/dev/null; check "started"
+    "$PG_BIN_DIR/pg_isready" -q 2>/dev/null; check "started"
 fi
 
 # ── 2. Redis ──
-echo -e "${YELLOW}[2/8] Redis${NC}"
+echo -e "${YELLOW}[2/10] Redis${NC}"
 if redis-cli ping 2>/dev/null | grep -q PONG; then
     echo -e "  ${GREEN}✅${NC} already running"
 else
@@ -46,14 +60,22 @@ else
     redis-cli ping 2>/dev/null | grep -q PONG; check "started"
 fi
 
-# ── 3. Qdrant ──
-echo -e "${YELLOW}[3/8] Qdrant${NC}"
-QDRANT_BIN="/Users/accusys/momentry_resources/bin/qdrant"
-QDRANT_STORAGE="/Users/accusys/momentry/qdrant_storage"
+# ── 3. MongoDB (manual-start data dir overridable via MOMENTRY_MONGO_DATA_DIR) ──
+echo -e "${YELLOW}[3/10] MongoDB${NC}"
+if pgrep -q mongod 2>/dev/null; then
+    echo -e "  ${GREEN}✅${NC} already running"
+else
+    brew services start mongodb-community 2>/dev/null || mongod --dbpath "${MOMENTRY_MONGO_DATA_DIR:-/opt/homebrew/var/mongodb}" --logpath "$LOG_DIR/mongodb.log" --fork 2>/dev/null
+    sleep 2
+    pgrep -q mongod 2>/dev/null; check "started"
+fi
+
+# ── 4. Qdrant ──
+echo -e "${YELLOW}[4/10] Qdrant${NC}"
 if curl -s -o /dev/null -w "%{http_code}" --connect-timeout 3 http://localhost:6333/healthz 2>/dev/null | grep -q 200; then
     echo -e "  ${GREEN}✅${NC} already running"
 else
-    mkdir -p "$QDRANT_STORAGE"
+    mkdir -p "$QDRANT_STORAGE_DIR"
     "$QDRANT_BIN" > "$LOG_DIR/qdrant.log" 2>&1 &
     for i in $(seq 1 15); do
         sleep 2
@@ -64,9 +86,8 @@ else
     curl -s -o /dev/null -w "%{http_code}" --connect-timeout 3 http://localhost:6333/healthz 2>/dev/null | grep -q 200; check "started"
 fi
 
-# ── 4. Qdrant Collection ──
-echo -e "${YELLOW}[4/8] Qdrant Collection${NC}"
-source "$ENV_FILE" 2>/dev/null || true
+# ── 5. Qdrant Collection ──
+echo -e "${YELLOW}[5/10] Qdrant Collection${NC}"
 COLLECTION="${QDRANT_COLLECTION:-momentry_dev_rule1_v2}"
 EXISTS=$(curl -s "http://localhost:6333/collections/$COLLECTION" 2>/dev/null | python3 -c "import sys,json; d=json.load(sys.stdin); print(d.get('result',{}).get('status','not_found'))" 2>/dev/null)
 if [ "$EXISTS" = "not_found" ]; then
@@ -78,15 +99,19 @@ fi
 curl -s "http://localhost:6333/collections/$COLLECTION" 2>/dev/null | python3 -c "import sys,json; d=json.load(sys.stdin); s=d.get('result',{}).get('status','not_found'); assert s in ('green','ok'), f'unexpected status: {s}'" 2>/dev/null
 check "collection '$COLLECTION' ready"
 
-# ── 5. LLM (Gemma4 / llama.cpp) ──
-echo -e "${YELLOW}[5/8] LLM Server (Gemma4)${NC}"
+# ── 6a. LLM Chat (A4B, port 8082): start llama-server unless /health already answers 200 ──
+echo -e "${YELLOW}[6a/10] LLM Chat - A4B (port 8082)${NC}"
 if curl -s -o /dev/null -w "%{http_code}" --connect-timeout 5 http://localhost:8082/health 2>/dev/null | grep -q 200; then
     echo -e "  ${GREEN}✅${NC} already running"
 else
-    LLM_BIN="/Users/accusys/momentry_resources/llama/bin/llama-server"
-    LLM_MODEL="/Users/accusys/momentry/models/llm/google_gemma-4-26B-A4B-it-Q5_K_M.gguf"
-    "$LLM_BIN" -m "$LLM_MODEL" --host 0.0.0.0 --port 8082 -ngl 99 -c 16384 --temp 0.1 --mlock --reasoning off > "$LOG_DIR/llama_server.log" 2>&1 &
-    echo -e "  ${YELLOW}⏳ loading model (~30s)...${NC}"
+    LLAMA_ARGS_A4B=(
+        -m "$A4B_MODEL"
+        --mmproj "$A4B_MMPROJ"
+        --host 0.0.0.0 --port 8082  # NOTE(review): 0.0.0.0 listens on every interface; confirm this is intended
+        -ngl 99 -c 16384 --temp 0.1 --mlock --reasoning off
+    )
+    "$LLAMACPP_BIN" "${LLAMA_ARGS_A4B[@]}" > "$LOG_DIR/llama_a4b.log" 2>&1 &  # runs in the background; output goes to llama_a4b.log
+    echo -e "  ${YELLOW}⏳ loading A4B model (~30s)...${NC}"
     for i in $(seq 1 30); do
         sleep 2
         if curl -s -o /dev/null -w "%{http_code}" --connect-timeout 2 http://localhost:8082/health 2>/dev/null | grep -q 200; then
@@ -96,8 +121,30 @@ else
     curl -s -o /dev/null -w "%{http_code}" --connect-timeout 3 http://localhost:8082/health 2>/dev/null | grep -q 200; check "started"
 fi
 
-# ── 6. Embedding Server ──
-echo -e "${YELLOW}[6/8] EmbeddingGemma${NC}"
+# ── 6b. LLM Vision (E4B, port 8083): start a second llama-server unless /health already answers 200 ──
+echo -e "${YELLOW}[6b/10] LLM Vision - E4B (port 8083)${NC}"
+if curl -s -o /dev/null -w "%{http_code}" --connect-timeout 5 http://localhost:8083/health 2>/dev/null | grep -q 200; then
+    echo -e "  ${GREEN}✅${NC} already running"
+else
+    LLAMA_ARGS_E4B=(
+        -m "$E4B_MODEL"
+        --mmproj "$E4B_MMPROJ"
+        --host 0.0.0.0 --port 8083  # NOTE(review): 0.0.0.0 listens on every interface; confirm this is intended
+        -ngl 99 -c 16384 --temp 0.1 --mlock  # NOTE(review): no "--reasoning off" here, unlike the A4B server; confirm this is intended
+    )
+    "$LLAMACPP_BIN" "${LLAMA_ARGS_E4B[@]}" > "$LOG_DIR/llama_e4b.log" 2>&1 &  # runs in the background; output goes to llama_e4b.log
+    echo -e "  ${YELLOW}⏳ loading E4B model (~30s)...${NC}"
+    for i in $(seq 1 30); do  # poll /health every 2 seconds, at most 30 times
+        sleep 2
+        if curl -s -o /dev/null -w "%{http_code}" --connect-timeout 2 http://localhost:8083/health 2>/dev/null | grep -q 200; then
+            break
+        fi
+    done
+    curl -s -o /dev/null -w "%{http_code}" --connect-timeout 3 http://localhost:8083/health 2>/dev/null | grep -q 200; check "started"  # final probe feeds check()
+fi
+
+# ── 7. Embedding Server ──
+echo -e "${YELLOW}[7/10] EmbeddingGemma${NC}"
 if curl -s -o /dev/null -w "%{http_code}" --connect-timeout 5 http://localhost:11436/health 2>/dev/null | grep -q 200; then
     echo -e "  ${GREEN}✅${NC} already running"
 else
@@ -112,23 +159,22 @@ else
     curl -s -o /dev/null -w "%{http_code}" --connect-timeout 5 http://localhost:11436/health 2>/dev/null | grep -q 200; check "started"
 fi
 
-# ── 7. Playground Server ──
-echo -e "${YELLOW}[7/8] Playground API Server${NC}"
-if curl -s -o /dev/null -w "%{http_code}" -H "X-API-Key: muser_68600856036340bcafc01930eb4bd839_1774418104_97221b69" --connect-timeout 5 http://127.0.0.1:3003/api/v1/agents/5w1h/status 2>/dev/null | grep -q 200; then
+# ── 8. Playground Server (binary path is quoted so a path containing spaces is not word-split) ──
+echo -e "${YELLOW}[8/10] Playground API Server${NC}"
+if curl -s -o /dev/null -w "%{http_code}" -H "X-API-Key: $API_KEY" --connect-timeout 5 http://127.0.0.1:3003/api/v1/agents/5w1h/status 2>/dev/null | grep -q 200; then
     echo -e "  ${GREEN}✅${NC} already running"
 else
     cd "$PROJECT_DIR"
-    target/debug/momentry_playground server > "$LOG_DIR/playground.log" 2>&1 &
+    "$PLAYGROUND_BIN" server > "$LOG_DIR/playground.log" 2>&1 &
     sleep 4
-    curl -s -o /dev/null -w "%{http_code}" -H "X-API-Key: muser_68600856036340bcafc01930eb4bd839_1774418104_97221b69" --connect-timeout 5 http://127.0.0.1:3003/api/v1/agents/5w1h/status 2>/dev/null | grep -q 200; check "started"
+    curl -s -o /dev/null -w "%{http_code}" -H "X-API-Key: $API_KEY" --connect-timeout 5 http://127.0.0.1:3003/api/v1/agents/5w1h/status 2>/dev/null | grep -q 200; check "started"
 fi
 
-# ── 8. Ollama (Gemma4 E4B) ──
-echo -e "${YELLOW}[8/8] Ollama (Gemma4 E4B)${NC}"
+# ── 9. Ollama ──
+echo -e "${YELLOW}[9/10] Ollama${NC}"
 if curl -s -o /dev/null -w "%{http_code}" --connect-timeout 5 http://localhost:11434/api/tags 2>/dev/null | grep -q 200; then
     echo -e "  ${GREEN}✅${NC} already running"
 else
-    OLLAMA_BIN="/Users/accusys/momentry_resources/bin/ollama"
     if [ ! -f "$OLLAMA_BIN" ]; then
         echo -e "  ${YELLOW}⚠ ollama binary not found, skipping${NC}"
     else
@@ -138,6 +184,16 @@ else
     fi
 fi
 
+# ── 10. SFTPGo (binary and config dir overridable via MOMENTRY_SFTPGO_BIN / MOMENTRY_SFTPGO_CONFIG_DIR) ──
+echo -e "${YELLOW}[10/10] SFTPGo${NC}"
+if curl -s -o /dev/null -w "%{http_code}" --connect-timeout 5 http://localhost:8080/api/v1/version 2>/dev/null | grep -q 200; then
+    echo -e "  ${GREEN}✅${NC} already running"
+else
+    "${MOMENTRY_SFTPGO_BIN:-/Users/accusys/bin/sftpgo}" serve -c "${MOMENTRY_SFTPGO_CONFIG_DIR:-/Users/accusys/momentry/etc/sftpgo}" > "$LOG_DIR/sftpgo.log" 2>&1 &
+    sleep 3
+    curl -s -o /dev/null -w "%{http_code}" --connect-timeout 5 http://localhost:8080/api/v1/version 2>/dev/null | grep -q 200; check "started"
+fi
+
 echo ""
 if [ ${#FAILURES[@]} -eq 0 ]; then
     echo -e "${GREEN}====================================${NC}"
@@ -151,10 +207,13 @@ else
 fi
 echo ""
 echo "  Playground:   http://127.0.0.1:3003"
-echo "  LLM:          http://127.0.0.1:8082"
+echo "  LLM Chat:     http://127.0.0.1:8082"
+echo "  LLM Vision:   http://127.0.0.1:8083"
 echo "  Embedding:    http://127.0.0.1:11436"
 echo "  Ollama:       http://localhost:11434"
 echo "  Qdrant:       http://localhost:6333"
 echo "  PostgreSQL:   localhost:5432"
 echo "  Redis:        localhost:6379"
+echo "  MongoDB:      localhost:27017"
+echo "  SFTPGo:       http://localhost:8080 (SFTP: port 2022)"
 echo ""
diff --git a/scripts/store_traced_faces.py b/scripts/store_traced_faces.py
index 26127ed..a0c45eb 100644
--- a/scripts/store_traced_faces.py
+++ b/scripts/store_traced_faces.py
@@ -319,12 +319,13 @@ def store_traced_faces(file_uuid: str, traced_json_path: str, schema: str = SCHE
                 cur.execute(
                     f"""
                     UPDATE {schema}.face_detections
-                    SET trace_id = %s
+                    SET trace_id = %s, embedding = %s
                     WHERE file_uuid = %s AND frame_number = %s
                       AND x = %s AND y = %s AND width = %s AND height = %s
                     """,
                     (
                         trace_id,
+                        embed_vec,
                         file_uuid, frame_num, x, y, w, h,
                     ),
                 )
diff --git a/scripts/swift_processors/swift_face.swift b/scripts/swift_processors/swift_face.swift
index ecb850d..06710d1 100644
--- a/scripts/swift_processors/swift_face.swift
+++ b/scripts/swift_processors/swift_face.swift
@@ -126,12 +126,24 @@ struct SwiftFace: ParsableCommand {
                 let imgH = CGFloat(cgImage.height)
 
                 // Process landmark observations FIRST (each has bbox + landmarks, self-consistent)
+                // Quality filtering
+                let MIN_CONFIDENCE = 0.6
+                let MIN_SIZE = 20
+                
                 for lmObs in landmarkObservations {
+                    // Confidence filter
+                    let lmConf = Double(lmObs.confidence)
+                    if lmConf < MIN_CONFIDENCE { continue }
+                    
                     let bb = lmObs.boundingBox
-                    let faceX = Int(bb.origin.x * imgW)
-                    let faceY = Int((1.0 - bb.origin.y - bb.size.height) * imgH)
                     let faceW = Int(bb.size.width * imgW)
                     let faceH = Int(bb.size.height * imgH)
+                    
+                    // Size filter
+                    if faceW < MIN_SIZE || faceH < MIN_SIZE { continue }
+                    
+                    let faceX = Int(bb.origin.x * imgW)
+                    let faceY = Int((1.0 - bb.origin.y - bb.size.height) * imgH)
 
                     var faceData: [String: Any] = [
                         "bbox": ["x": max(0, faceX), "y": max(0, faceY),
@@ -203,11 +215,21 @@ struct SwiftFace: ParsableCommand {
                         }
                     }
                     if matched { continue }
+                    
+                    // Quality filtering for unmatched face rects
+                    let MIN_CONFIDENCE = 0.6
+                    let MIN_SIZE = 20
+                    
+                    let faceConf = Double(faceObs.faceCaptureQuality ?? faceObs.confidence)
+                    if faceConf < MIN_CONFIDENCE { continue }
+                    
+                    let faceW = Int(fBB.size.width * imgW)
+                    let faceH = Int(fBB.size.height * imgH)
+                    if faceW < MIN_SIZE || faceH < MIN_SIZE { continue }
+                    
                     // Unmatched face rect: output without landmarks
                     let faceX = Int(fBB.origin.x * imgW)
                     let faceY = Int((1.0 - fBB.origin.y - fBB.size.height) * imgH)
-                    let faceW = Int(fBB.size.width * imgW)
-                    let faceH = Int(fBB.size.height * imgH)
 
                     var faceData: [String: Any] = [
                         "bbox": ["x": max(0, faceX), "y": max(0, faceY),
diff --git a/scripts/update_embeddings.py b/scripts/update_embeddings.py
new file mode 100644
index 0000000..13da7c9
--- /dev/null
+++ b/scripts/update_embeddings.py
@@ -0,0 +1,123 @@
+#!/opt/homebrew/bin/python3.11
+"""Update face_detections embeddings from face_traced.json"""
+
+import json
+import psycopg2
+import sys
+import os
+
+from psycopg2 import sql
+
+DATABASE_URL = os.getenv("DATABASE_URL", "postgres://accusys@localhost:5432/momentry")
+
+# Queued face rows that trigger a flush and commit.
+BATCH_SIZE = 1000
+
+
+def _flush_batch(cur, query, batch):
+    """Run the UPDATE for each queued row; return (rows_updated, rows_failed).
+
+    Every row gets its own savepoint: a failing row is reported and rolled
+    back without aborting the transaction for the rows around it.
+    """
+    updated = 0
+    failed = 0
+    for row in batch:
+        cur.execute("SAVEPOINT face_row")
+        try:
+            cur.execute(query, row)
+            updated += cur.rowcount
+        except psycopg2.Error as e:
+            cur.execute("ROLLBACK TO SAVEPOINT face_row")
+            failed += 1
+            print(f"[UPDATE] frame {row[3]} failed: {e}", file=sys.stderr)
+        cur.execute("RELEASE SAVEPOINT face_row")
+    return updated, failed
+
+
+def update_embeddings(file_uuid: str, traced_json_path: str, schema: str = "dev"):
+    """Update embeddings in face_detections from face_traced.json
+
+    Only rows whose embedding is still NULL are touched. Returns the number of
+    rows updated.
+    """
+    with open(traced_json_path, 'r') as f:
+        data = json.load(f)
+
+    # Quote the schema as an identifier rather than splicing it into the SQL text.
+    query = sql.SQL(
+        """
+        UPDATE {schema}.face_detections
+        SET embedding = %s::real[], trace_id = %s
+        WHERE file_uuid = %s AND frame_number = %s
+          AND x = %s AND y = %s AND width = %s AND height = %s
+          AND embedding IS NULL
+        """
+    ).format(schema=sql.Identifier(schema))
+
+    updated = 0
+    failed = 0
+    batch = []
+
+    conn = psycopg2.connect(DATABASE_URL)
+    try:
+        with conn.cursor() as cur:
+            for frame_key, frame_data in data.get('frames', {}).items():
+                frame_num = int(frame_key)
+
+                for face in frame_data.get('faces', []):
+                    embedding = face.get('embedding')
+                    if not embedding:
+                        continue
+
+                    batch.append((
+                        # A Python list is adapted to ARRAY[...]; the string
+                        # "[1,2,3]" is not a valid real[] literal.
+                        list(embedding),
+                        face.get('trace_id'),
+                        file_uuid,
+                        frame_num,
+                        face.get('x', 0),
+                        face.get('y', 0),
+                        face.get('width', 0),
+                        face.get('height', 0),
+                    ))
+
+                # Flush once enough faces are queued (checked after each frame).
+                if len(batch) >= BATCH_SIZE:
+                    done, bad = _flush_batch(cur, query, batch)
+                    updated += done
+                    failed += bad
+                    conn.commit()
+                    batch = []
+                    print(f"[UPDATE] Processed {updated} so far...", file=sys.stderr)
+
+            # Final batch
+            done, bad = _flush_batch(cur, query, batch)
+            updated += done
+            failed += bad
+            conn.commit()
+    finally:
+        conn.close()
+
+    if failed:
+        print(f"[UPDATE] {failed} rows failed", file=sys.stderr)
+    print(f"[UPDATE] Total updated: {updated}")
+    return updated
+
+
+if __name__ == "__main__":
+    import argparse
+    parser = argparse.ArgumentParser()
+    parser.add_argument("--file-uuid", required=True)
+    parser.add_argument("--traced-json", help="Path to face_traced.json")
+    parser.add_argument("--schema", default="dev")
+    args = parser.parse_args()
+
+    traced_json = args.traced_json or f"/Users/accusys/momentry/output_dev/{args.file_uuid}.face_traced.json"
+
+    if not os.path.exists(traced_json):
+        print(f"File not found: {traced_json}", file=sys.stderr)
+        sys.exit(1)
+
+    update_embeddings(args.file_uuid, traced_json, args.schema)
\ No newline at end of file
diff --git a/scripts/verify_charade_pipeline.py b/scripts/verify_charade_pipeline.py
new file mode 100644
index 0000000..afa6edd
--- /dev/null
+++ b/scripts/verify_charade_pipeline.py
@@ -0,0 +1,179 @@
+#!/opt/homebrew/bin/python3.11
+"""
+Verify Charade pipeline completion.
+Usage: python3 scripts/verify_charade_pipeline.py <file_uuid>
+"""
+
+import os
+import sys
+import psycopg2
+from psycopg2 import sql
+
+DATABASE_URL = os.getenv("DATABASE_URL", "postgres://accusys@localhost:5432/momentry")
+OUTPUT_DIR = "/Users/accusys/momentry/output_dev"
+# UUID checked when the script is started without an argument.
+DEFAULT_FILE_UUID = "c3c635e3641da80dde10cc555ffcdda5"
+
+
+def check_file_outputs(file_uuid):
+    """Check all expected output files exist.
+
+    Returns one dict per expected file: its suffix, whether it exists, and its
+    size in bytes (0 when missing).
+    """
+    expected_files = [
+        "cut.json",
+        "yolo.json",
+        "face.json",
+        "face_traced.json",
+        "pose.json",
+        "asrx.json",
+        "visual_chunk.json",
+        "scene.json",
+        "scene_meta.json",
+        "story_llm.json",
+        "story_story.json",
+        "tmdb.json",
+    ]
+
+    results = []
+    for ext in expected_files:
+        path = f"{OUTPUT_DIR}/{file_uuid}.{ext}"
+        try:
+            # os.path.getsize is portable; `stat -f%z` is BSD/macOS-only syntax.
+            size = os.path.getsize(path)
+        except OSError:
+            results.append({"file": ext, "exists": False, "size": 0})
+        else:
+            results.append({"file": ext, "exists": True, "size": size})
+
+    return results
+
+
+def _run_checks(file_uuid, schema, checks, empty_value=None, multi_row=()):
+    """Run each (name, SQL template) check and collect the outcomes.
+
+    Templates take the schema through `{schema}` and the file UUID through a
+    single `%s`, so neither value is spliced into the SQL text. Checks named in
+    `multi_row` return all rows; the others return the first row, unwrapped
+    when it has one column, or `empty_value` when no row comes back.
+    """
+    results = []
+    conn = psycopg2.connect(DATABASE_URL)
+    # Autocommit: a failing check must not abort the transaction for later ones.
+    conn.autocommit = True
+    try:
+        with conn.cursor() as cur:
+            for name, template in checks:
+                query = sql.SQL(template).format(schema=sql.Identifier(schema))
+                try:
+                    cur.execute(query, (file_uuid,))
+                    if name in multi_row:
+                        value = cur.fetchall()
+                    else:
+                        row = cur.fetchone()
+                        if row is None:
+                            value = empty_value
+                        elif len(row) == 1:
+                            value = row[0]
+                        else:
+                            # Keep every selected column, not just the first.
+                            value = row
+                    results.append({"check": name, "value": value})
+                except Exception as e:
+                    results.append({"check": name, "error": str(e)})
+    finally:
+        conn.close()
+    return results
+
+
+def check_db_records(file_uuid, schema="dev"):
+    """Check database records"""
+    checks = [
+        ("videos", "SELECT status FROM {schema}.videos WHERE file_uuid = %s"),
+        ("monitor_jobs", "SELECT status, completed_processors FROM {schema}.monitor_jobs WHERE uuid = %s"),
+        ("pre_chunks", "SELECT COUNT(*) FROM {schema}.pre_chunks WHERE file_uuid = %s"),
+        ("face_detections_total", "SELECT COUNT(*) FROM {schema}.face_detections WHERE file_uuid = %s"),
+        ("face_detections_embedding", "SELECT COUNT(embedding) FROM {schema}.face_detections WHERE file_uuid = %s"),
+        ("face_detections_trace", "SELECT COUNT(trace_id) FROM {schema}.face_detections WHERE file_uuid = %s"),
+        ("face_detections_identity", "SELECT COUNT(identity_id) FROM {schema}.face_detections WHERE file_uuid = %s"),
+        ("chunks_total", "SELECT COUNT(*) FROM {schema}.chunk WHERE file_uuid = %s"),
+        ("chunks_embedding", "SELECT COUNT(embedding) FROM {schema}.chunk WHERE file_uuid = %s"),
+    ]
+    return _run_checks(file_uuid, schema, checks)
+
+
+def check_identity_bindings(file_uuid, schema="dev"):
+    """Check identity bindings"""
+    checks = [
+        ("audrey_faces", """
+            SELECT COUNT(*) FROM {schema}.face_detections fd
+            JOIN {schema}.identities i ON fd.identity_id = i.id
+            WHERE fd.file_uuid = %s AND i.name = 'Audrey Hepburn'
+        """),
+        ("cary_faces", """
+            SELECT COUNT(*) FROM {schema}.face_detections fd
+            JOIN {schema}.identities i ON fd.identity_id = i.id
+            WHERE fd.file_uuid = %s AND i.name = 'Cary Grant'
+        """),
+        ("top_identities", """
+            SELECT i.name, COUNT(*) as count
+            FROM {schema}.face_detections fd
+            JOIN {schema}.identities i ON fd.identity_id = i.id
+            WHERE fd.file_uuid = %s AND fd.identity_id IS NOT NULL
+            GROUP BY i.name
+            ORDER BY count DESC
+            LIMIT 10
+        """),
+    ]
+    return _run_checks(file_uuid, schema, checks, empty_value=0, multi_row=("top_identities",))
+
+
+def print_report(file_uuid, file_outputs, db_records, identity_bindings):
+    """Print verification report"""
+    print(f"\n{'='*60}")
+    print("Charade Pipeline Verification Report")
+    print(f"File UUID: {file_uuid}")
+    print(f"{'='*60}\n")
+
+    print("## File Outputs")
+    for f in file_outputs:
+        status = "✅" if f["exists"] and f["size"] > 0 else "❌"
+        size_kb = f["size"] / 1024
+        print(f"  {status} {f['file']}: {size_kb:.1f} KB")
+
+    print("\n## Database Records")
+    for r in db_records:
+        value = r.get("value", r.get("error", "N/A"))
+        if isinstance(value, (list, tuple)):
+            value = ", ".join(str(v) for v in value)
+        print(f"  {r['check']}: {value}")
+
+    print("\n## Identity Bindings")
+    for r in identity_bindings:
+        value = r.get("value", r.get("error", "N/A"))
+        if isinstance(value, list):
+            print(f"  {r['check']}:")
+            for row in value:
+                print(f"    - {row[0]}: {row[1]} faces")
+        else:
+            print(f"  {r['check']}: {value}")
+
+    print(f"\n{'='*60}\n")
+
+
+def main():
+    """Verify the UUID given on the command line, or the default one."""
+    file_uuid = sys.argv[1] if len(sys.argv) > 1 else DEFAULT_FILE_UUID
+
+    print("Verifying pipeline...")
+
+    file_outputs = check_file_outputs(file_uuid)
+    db_records = check_db_records(file_uuid)
+    identity_bindings = check_identity_bindings(file_uuid)
+
+    print_report(file_uuid, file_outputs, db_records, identity_bindings)
+
+
+if __name__ == "__main__":
+    main()
\ No newline at end of file
diff --git a/scripts/visual_chunk_processor.py b/scripts/visual_chunk_processor.py
deleted file mode 100644
index 1a60750..0000000
--- a/scripts/visual_chunk_processor.py
+++ /dev/null
@@ -1,445 +0,0 @@
-#!/usr/bin/env python3
-"""
-視覺分片處理器 (Phase 2.2)
-
-從 YOLO 結果生成視覺分片，支持多種分片策略：
-1. 固定幀數分片
-2. 基於物件相似度分片
-3. 基於場景變化分片
-"""
-
-import json
-import sys
-import os
-import argparse
-from pathlib import Path
-from typing import Dict, List, Any, Optional
-import numpy as np
-from datetime import datetime
-
-# 添加父目錄到路徑以導入其他模組
-sys.path.insert(0, str(Path(__file__).parent.parent))
-from scripts.yolo_processor_contract_v1 import YOLOProcessor
-
-
-class VisualChunkProcessor:
-    """視覺分片處理器"""
-
-    def __init__(self, video_path: str, yolo_result_path: Optional[str] = None):
-        self.video_path = video_path
-        self.yolo_result_path = yolo_result_path
-        self.yolo_result = None
-
-    def load_yolo_result(self):
-        """加載 YOLO 結果"""
-        if self.yolo_result_path and os.path.exists(self.yolo_result_path):
-            with open(self.yolo_result_path, "r", encoding="utf-8") as f:
-                self.yolo_result = json.load(f)
-        else:
-            # 如果沒有提供 YOLO 結果路徑，則運行 YOLO 檢測
-            print(f"[VisualChunk] Running YOLO detection for: {self.video_path}")
-            yolo_processor = YOLOProcessor(self.video_path)
-            yolo_result = yolo_processor.process()
-            self.yolo_result = yolo_processor.to_json_dict()
-
-    def create_fixed_frame_chunks(
-        self, frames_per_chunk: int = 30
-    ) -> List[Dict[str, Any]]:
-        """創建固定幀數分片
-
-        Args:
-            frames_per_chunk: 每個分片的幀數
-
-        Returns:
-            視覺分片列表
-        """
-        if not self.yolo_result:
-            self.load_yolo_result()
-
-        frames = self.yolo_result.get("frames", {})
-        if not frames:
-            return []
-
-        # 將幀字典轉換為排序後的列表
-        frame_list = []
-        for frame_key, frame_data in frames.items():
-            frame_list.append(
-                {
-                    "frame_number": int(frame_key),
-                    "timestamp": frame_data.get("time_seconds", 0),
-                    "objects": frame_data.get("detections", []),
-                }
-            )
-
-        # 按幀號排序
-        frame_list.sort(key=lambda x: x["frame_number"])
-
-        chunks = []
-        total_frames = len(frame_list)
-
-        for start_idx in range(0, total_frames, frames_per_chunk):
-            end_idx = min(start_idx + frames_per_chunk, total_frames)
-            chunk_frames = frame_list[start_idx:end_idx]
-
-            if not chunk_frames:
-                continue
-
-            # 計算分片統計
-            chunk_stats = self._calculate_chunk_stats(chunk_frames)
-
-            chunk = {
-                "start_frame": chunk_frames[0]["frame_number"],
-                "end_frame": chunk_frames[-1]["frame_number"] + 1,  # exclusive
-                "frame_count": len(chunk_frames),
-                "keyframe_objects": self._extract_keyframe_objects(chunk_frames),
-                "dominant_objects": chunk_stats["dominant_objects"],
-                "metadata": {
-                    "object_count": chunk_stats["total_objects"],
-                    "unique_classes": chunk_stats["unique_classes"],
-                    "max_confidence": chunk_stats["max_confidence"],
-                    "avg_confidence": chunk_stats["avg_confidence"],
-                    "spatial_density": chunk_stats["spatial_density"],
-                },
-            }
-
-            chunks.append(chunk)
-
-        return chunks
-
-    def create_similarity_based_chunks(
-        self, similarity_threshold: float = 0.5, min_frames_per_chunk: int = 10
-    ) -> List[Dict[str, Any]]:
-        """基於物件相似度創建分片
-
-        Args:
-            similarity_threshold: 相似度閾值 (0-1)
-            min_frames_per_chunk: 最小幀數
-
-        Returns:
-            視覺分片列表
-        """
-        if not self.yolo_result:
-            self.load_yolo_result()
-
-        frames = self.yolo_result.get("frames", {})
-        if not frames:
-            return []
-
-        # 將幀字典轉換為排序後的列表
-        frame_list = []
-        for frame_key, frame_data in frames.items():
-            frame_list.append(
-                {
-                    "frame_number": int(frame_key),
-                    "timestamp": frame_data.get("time_seconds", 0),
-                    "objects": frame_data.get("detections", []),
-                }
-            )
-
-        # 按幀號排序
-        frame_list.sort(key=lambda x: x["frame_number"])
-
-        chunks = []
-        current_chunk_frames = []
-        current_start_frame = 0
-
-        for i, frame in enumerate(frame_list):
-            if not current_chunk_frames:
-                current_chunk_frames.append(frame)
-                current_start_frame = frame["frame_number"]
-                continue
-
-            # 計算相似度
-            last_frame = current_chunk_frames[-1]
-            similarity = self._calculate_frame_similarity(last_frame, frame)
-
-            if similarity >= similarity_threshold:
-                # 相似度高，加入當前分片
-                current_chunk_frames.append(frame)
-            else:
-                # 相似度低，創建新分片
-                if len(current_chunk_frames) >= min_frames_per_chunk:
-                    chunk = self._create_chunk_from_frames(
-                        current_chunk_frames,
-                        current_start_frame,
-                        frame_list[i - 1]["frame_number"] + 1,
-                    )
-                    chunks.append(chunk)
-
-                # 開始新的分片
-                current_chunk_frames = [frame]
-                current_start_frame = frame["frame_number"]
-
-        # 處理最後一個分片
-        if len(current_chunk_frames) >= min_frames_per_chunk:
-            chunk = self._create_chunk_from_frames(
-                current_chunk_frames,
-                current_start_frame,
-                current_chunk_frames[-1]["frame_number"] + 1,
-            )
-            chunks.append(chunk)
-
-        return chunks
-
-    def _calculate_frame_similarity(self, frame1: Dict, frame2: Dict) -> float:
-        """計算兩個幀之間的相似度（基於物件類別）"""
-        objects1 = frame1.get("objects", [])
-        objects2 = frame2.get("objects", [])
-
-        if not objects1 and not objects2:
-            return 1.0
-
-        if not objects1 or not objects2:
-            return 0.0
-
-        # 提取物件類別
-        classes1 = set(
-            obj.get("class_name", "") for obj in objects1 if obj.get("class_name")
-        )
-        classes2 = set(
-            obj.get("class_name", "") for obj in objects2 if obj.get("class_name")
-        )
-
-        # 計算 Jaccard 相似度
-        intersection = classes1.intersection(classes2)
-        union = classes1.union(classes2)
-
-        if not union:
-            return 0.0
-
-        return len(intersection) / len(union)
-
-    def _calculate_chunk_stats(self, frames: List[Dict]) -> Dict[str, Any]:
-        """計算分片統計信息"""
-        all_objects = []
-        for frame in frames:
-            all_objects.extend(frame.get("objects", []))
-
-        # 總物件數
-        total_objects = len(all_objects)
-
-        # 唯一類別
-        unique_classes = list(
-            set(
-                obj.get("class_name", "")
-                for obj in all_objects
-                if obj.get("class_name")
-            )
-        )
-
-        # 信心值統計
-        confidences = [obj.get("confidence", 0) for obj in all_objects]
-        max_confidence = max(confidences) if confidences else 0
-        avg_confidence = np.mean(confidences) if confidences else 0
-
-        # 空間密度（每幀平均物件數）
-        spatial_density = total_objects / len(frames) if frames else 0
-
-        # 主要物件（出現在大多數幀中的物件）
-        object_counts = {}
-        for frame in frames:
-            frame_classes = set(
-                obj.get("class_name", "")
-                for obj in frame.get("objects", [])
-                if obj.get("class_name")
-            )
-            for class_name in frame_classes:
-                object_counts[class_name] = object_counts.get(class_name, 0) + 1
-
-        dominant_objects = [
-            class_name
-            for class_name, count in object_counts.items()
-            if count / len(frames) > 0.5
-        ]
-        dominant_objects.sort()
-
-        return {
-            "total_objects": total_objects,
-            "unique_classes": unique_classes,
-            "max_confidence": float(max_confidence),
-            "avg_confidence": float(avg_confidence),
-            "spatial_density": float(spatial_density),
-            "dominant_objects": dominant_objects,
-        }
-
-    def _extract_keyframe_objects(self, frames: List[Dict]) -> List[Dict[str, Any]]:
-        """提取關鍵幀物件"""
-        keyframe_objects = []
-
-        # 簡化：每5幀取一個關鍵幀
-        for i in range(0, len(frames), 5):
-            if i < len(frames):
-                frame = frames[i]
-                objects = []
-
-                for obj in frame.get("objects", []):
-                    objects.append(
-                        {
-                            "class_name": obj.get("class_name", ""),
-                            "class_id": obj.get("class_id", 0),
-                            "confidence": float(obj.get("confidence", 0)),
-                            "bbox": {
-                                "x": obj.get("x1", 0),
-                                "y": obj.get("y1", 0),
-                                "width": obj.get("width", 0),
-                                "height": obj.get("height", 0),
-                            }
-                            if "x1" in obj
-                            else None,
-                            "occurrence": 1,
-                        }
-                    )
-
-                keyframe_objects.append(
-                    {
-                        "timestamp": float(frame.get("timestamp", 0)),
-                        "frame_number": frame.get("frame_number", 0),
-                        "objects": objects,
-                    }
-                )
-
-        return keyframe_objects
-
-    def _create_chunk_from_frames(
-        self, frames: List[Dict], start_frame: int, end_frame: int
-    ) -> Dict[str, Any]:
-        """從幀列表創建分片"""
-        chunk_stats = self._calculate_chunk_stats(frames)
-
-        return {
-            "start_frame": start_frame,
-            "end_frame": end_frame,  # exclusive
-            "frame_count": len(frames),
-            "keyframe_objects": self._extract_keyframe_objects(frames),
-            "dominant_objects": chunk_stats["dominant_objects"],
-            "object_relationships": [],  # 可選：後期添加關係檢測
-            "scene_description": None,  # 可選：後期添加 LLM 生成的場景描述
-            "metadata": {
-                "object_count": chunk_stats["total_objects"],
-                "unique_classes": chunk_stats["unique_classes"],
-                "max_confidence": chunk_stats["max_confidence"],
-                "avg_confidence": chunk_stats["avg_confidence"],
-                "spatial_density": chunk_stats["spatial_density"],
-            },
-        }
-
-    def process(self, strategy: str = "fixed", **kwargs) -> Dict[str, Any]:
-        """處理視覺分片生成
-
-        Args:
-            strategy: 分片策略 ("fixed" 或 "similarity")
-            **kwargs: 策略參數
-
-        Returns:
-            處理結果
-        """
-        if not self.yolo_result:
-            self.load_yolo_result()
-
-        start_time = datetime.now()
-
-        if strategy == "fixed":
-            frames_per_chunk = kwargs.get("frames_per_chunk", 30)
-            chunks = self.create_fixed_frame_chunks(frames_per_chunk)
-        elif strategy == "similarity":
-            similarity_threshold = kwargs.get("similarity_threshold", 0.5)
-            min_frames = kwargs.get("min_frames_per_chunk", 10)
-            chunks = self.create_similarity_based_chunks(
-                similarity_threshold, min_frames
-            )
-        else:
-            raise ValueError(f"Unknown strategy: {strategy}")
-
-        # 計算總統計
-        total_frames = sum(chunk["frame_count"] for chunk in chunks)
-        total_objects = sum(chunk["metadata"]["object_count"] for chunk in chunks)
-
-        # 收集所有唯一類別
-        all_unique_classes = set()
-        for chunk in chunks:
-            all_unique_classes.update(chunk["metadata"]["unique_classes"])
-
-        processing_time = (datetime.now() - start_time).total_seconds()
-
-        result = {
-            "metadata": {
-                "video_path": self.video_path,
-                "processing_time": processing_time,
-                "strategy": strategy,
-                "parameters": kwargs,
-                "processed_at": datetime.now().isoformat(),
-            },
-            "chunk_count": len(chunks),
-            "total_frames": total_frames,
-            "total_objects": total_objects,
-            "unique_classes": len(all_unique_classes),
-            "chunks": chunks,
-        }
-
-        return result
-
-
-def main():
-    parser = argparse.ArgumentParser(description="視覺分片處理器")
-    parser.add_argument("video_path", help="視頻文件路徑")
-    parser.add_argument("output_path", help="輸出文件路徑")
-    parser.add_argument("--yolo-result", help="YOLO 結果文件路徑（可選）")
-    parser.add_argument("--uuid", help="檔案 UUID（由 executor 傳入）")
-    parser.add_argument(
-        "--strategy", choices=["fixed", "similarity"], default="fixed", help="分片策略"
-    )
-    parser.add_argument(
-        "--frames-per-chunk", type=int, default=30, help="固定幀數策略：每個分片的幀數"
-    )
-    parser.add_argument(
-        "--similarity-threshold", type=float, default=0.5, help="相似度策略：相似度閾值"
-    )
-    parser.add_argument(
-        "--min-frames-per-chunk", type=int, default=10, help="相似度策略：最小幀數"
-    )
-
-    args = parser.parse_args()
-
-    print(f"[VisualChunk] Starting processing: {args.video_path}")
-    print(f"[VisualChunk] Strategy: {args.strategy}")
-
-    try:
-        processor = VisualChunkProcessor(args.video_path, args.yolo_result)
-
-        if args.strategy == "fixed":
-            result = processor.process(
-                strategy="fixed", frames_per_chunk=args.frames_per_chunk
-            )
-        else:
-            result = processor.process(
-                strategy="similarity",
-                similarity_threshold=args.similarity_threshold,
-                min_frames_per_chunk=args.min_frames_per_chunk,
-            )
-
-        # 保存結果
-        with open(args.output_path, "w", encoding="utf-8") as f:
-            json.dump(result, f, ensure_ascii=False, indent=2)
-
-        print("[VisualChunk] Processing completed")
-        print(f"[VisualChunk] Generated {result['chunk_count']} visual chunks")
-        print(f"[VisualChunk] Total frames: {result['total_frames']}")
-        print(f"[VisualChunk] Total objects: {result['total_objects']}")
-        print(f"[VisualChunk] Unique classes: {result['unique_classes']}")
-        print(f"[VisualChunk] Result saved to: {args.output_path}")
-    except Exception as e:
-        print(f"[VisualChunk] Error: {e}", file=sys.stderr)
-        result = {
-            "chunk_count": 0,
-            "total_frames": 0,
-            "total_objects": 0,
-            "unique_classes": 0,
-            "chunks": [],
-        }
-        with open(args.output_path, "w", encoding="utf-8") as f:
-            json.dump(result, f, ensure_ascii=False, indent=2)
-        print(f"[VisualChunk] Fallback: empty result saved to {args.output_path}")
-
-
-if __name__ == "__main__":
-    main()
diff --git a/scripts/wrapper_embedding.sh b/scripts/wrapper_embedding.sh
new file mode 100755
index 0000000..8cc9adb
--- /dev/null
+++ b/scripts/wrapper_embedding.sh
@@ -0,0 +1,21 @@
+#!/bin/bash
+set -e
+# Wrapper: load the project env files, then exec the embedding server on port 11436.
+SCRIPT_DIR="$(cd "$(dirname "$0")" && pwd)"
+PROJECT_DIR="$(cd "$SCRIPT_DIR/.." && pwd)"
+
+# Source environment (silently). Plain KEY=VALUE assignments stay shell-local unless
+# allexport (set -a) is on, so enable it while sourcing so the exec'd server inherits them.
+set -a; source "$PROJECT_DIR/.env" 2>/dev/null || true
+source "$PROJECT_DIR/.env.development" 2>/dev/null || true; set +a
+
+# Ensure PATH is set
+export PATH="/opt/homebrew/bin:/usr/local/bin:/usr/bin:/bin:/usr/sbin:/sbin:$PATH"
+
+# Find python: prefer MOMENTRY_PYTHON_PATH, then the project venv, then Homebrew's python3.11
+PYTHON="${MOMENTRY_PYTHON_PATH:-$PROJECT_DIR/venv/bin/python}"
+if [ ! -x "$PYTHON" ]; then
+    PYTHON="/opt/homebrew/bin/python3.11"
+fi
+EMBED_SCRIPT="$PROJECT_DIR/scripts/embeddinggemma_server.py"
+exec "$PYTHON" "$EMBED_SCRIPT" --port 11436
\ No newline at end of file
diff --git a/scripts/wrapper_playground.sh b/scripts/wrapper_playground.sh
new file mode 100755
index 0000000..d3b042d
--- /dev/null
+++ b/scripts/wrapper_playground.sh
@@ -0,0 +1,14 @@
+#!/bin/bash
+set -e
+# Wrapper: load the project env files, then exec the debug playground server on 0.0.0.0.
+SCRIPT_DIR="$(cd "$(dirname "$0")" && pwd)"
+PROJECT_DIR="$(cd "$SCRIPT_DIR/.." && pwd)"
+
+# Source environment (silently). Plain KEY=VALUE assignments stay shell-local unless
+# allexport (set -a) is on, so enable it while sourcing so the exec'd binary inherits them.
+set -a; source "$PROJECT_DIR/.env" 2>/dev/null || true
+source "$PROJECT_DIR/.env.development" 2>/dev/null || true; set +a
+
+# Ensure PATH is set
+export PATH="/opt/homebrew/bin:/usr/local/bin:/usr/bin:/bin:/usr/sbin:/sbin:$PATH"
+exec "$PROJECT_DIR/target/debug/momentry_playground" server --host 0.0.0.0
\ No newline at end of file
diff --git a/scripts/wrapper_production.sh b/scripts/wrapper_production.sh
new file mode 100755
index 0000000..a6f17e6
--- /dev/null
+++ b/scripts/wrapper_production.sh
@@ -0,0 +1,13 @@
+#!/bin/bash
+set -e
+# Wrapper: load .env, then exec the release server on 0.0.0.0.
+SCRIPT_DIR="$(cd "$(dirname "$0")" && pwd)"
+PROJECT_DIR="$(cd "$SCRIPT_DIR/.." && pwd)"
+
+# Source environment (silently) with allexport on: assignments written without `export`
+# would otherwise stay shell-local and never reach the exec'd binary.
+set -a; source "$PROJECT_DIR/.env" 2>/dev/null || true; set +a
+
+# Ensure PATH is set
+export PATH="/opt/homebrew/bin:/usr/local/bin:/usr/bin:/bin:/usr/sbin:/sbin:$PATH"
+exec "$PROJECT_DIR/target/release/momentry" server --host 0.0.0.0
\ No newline at end of file
diff --git a/src/api/agent_search.rs b/src/api/agent_search.rs
index e33d536..b0fbdd7 100644
--- a/src/api/agent_search.rs
+++ b/src/api/agent_search.rs
@@ -1,10 +1,4 @@
-use axum::{
-    extract::State,
-    http::StatusCode,
-    response::Json,
-    routing::post,
-    Router,
-};
+use axum::{extract::State, http::StatusCode, response::Json, routing::post, Router};
 use once_cell::sync::Lazy;
 use serde::{Deserialize, Serialize};
 use std::collections::HashMap;
@@ -13,7 +7,10 @@ use std::time::Instant;
 
 use crate::api::types::AppState;
 use crate::core::db::schema;
-use crate::core::llm::function_calling::{self, ChatMessage, LlmResponse, ToolCall, ToolDef};
+use crate::core::llm::function_calling::{
+    self, call_llm_vision, ChatMessage, LlmResponse, ToolCall, ToolDef,
+};
+use base64::{engine::general_purpose::STANDARD as BASE64, Engine};
 
 // ── Conversation Manager ─────────────────────────────────────────
 
@@ -43,11 +40,14 @@ fn get_or_create_conv(conv_id: Option<&str>) -> (String, Vec<ChatMessage>) {
         }
     }
     let id = uuid::Uuid::new_v4().to_string().replace('-', "")[..16].to_string();
-    map.insert(id.clone(), Conversation {
-        messages: Vec::new(),
-        created_at: Instant::now(),
-        last_active: Instant::now(),
-    });
+    map.insert(
+        id.clone(),
+        Conversation {
+            messages: Vec::new(),
+            created_at: Instant::now(),
+            last_active: Instant::now(),
+        },
+    );
     (id, Vec::new())
 }
 
@@ -85,8 +85,13 @@ const SYSTEM_PROMPT: &str = r#"你是 Momentry 影片分析助手。回答用戶
 ## 工具使用規則
 1. 先確認用戶在問哪部影片 — 使用 find_file 或 list_files
 2. 人物問題優先使用 tkg_query
-3. 語意/內容問題使用 smart_search 或 universal_search
-4. 可以同時呼叫多個工具
+3. 人物台詞/發言問題使用 identities_search（輸入人名→回傳台詞片段）
+4. 人物對話互動（誰跟誰說話）使用 tkg_query 的 speaker_interaction
+5. 人物台詞內容使用 tkg_query 的 speaker_dialogue
+6. 用文字反查人物使用 identity_text（輸入關鍵字→找出誰說/提到這段話）
+7. 語意/內容問題使用 smart_search 或 universal_search
+8. 畫面分析使用 analyze_frame — 可以分析影片中的任何畫面內容（場景、人物表情、動作、物件等）
+9. 可以同時呼叫多個工具
 
 ## 引導規則
 - 如果用戶沒說片名 → 用 find_file 搜尋，如果名稱不明確就反問
@@ -120,16 +125,16 @@ fn make_tools(pool: &sqlx::PgPool) -> Vec<ToolDef> {
         ),
         function_calling::make_tool(
             "tkg_query",
-            "查詢影片的人物互動、配對、同框資料。query_type 包括：top_identities（人物排名）、first_cooccurrence（第一次同框）、identity_details（人物詳細）、mutual_gaze（互看）、interaction_network（互動網絡）、identity_traces（出場片段）、file_info（影片資訊）。",
+            "查詢影片的人物互動、配對、同框、台詞資料。query_type 包括：top_identities（人物排名）、first_cooccurrence（第一次同框）、identity_details（人物詳細）、mutual_gaze（互看）、interaction_network（互動網絡）、identity_traces（出場片段）、file_info（影片資訊）、speaker_dialogue（人物台詞）、speaker_interaction（兩人對話互動）。",
             serde_json::json!({
                 "file_uuid": {"type": "string", "description": "影片 UUID"},
                 "query_type": {
                     "type": "string",
-                    "enum": ["top_identities", "first_cooccurrence", "identity_details", "mutual_gaze", "interaction_network", "identity_traces", "file_info"],
+                    "enum": ["top_identities", "first_cooccurrence", "identity_details", "mutual_gaze", "interaction_network", "identity_traces", "file_info", "speaker_dialogue", "speaker_interaction"],
                     "description": "查詢類型"
                 },
-                "identity_name": {"type": "string", "description": "人物名稱（配合 identity_details / identity_traces）"},
-                "identity_b": {"type": "string", "description": "第二人物名稱（配合 first_cooccurrence / mutual_gaze）"},
+                "identity_name": {"type": "string", "description": "人物名稱（配合 identity_details / identity_traces / speaker_dialogue / speaker_interaction）"},
+                "identity_b": {"type": "string", "description": "第二人物名稱（配合 first_cooccurrence / mutual_gaze / speaker_interaction）"},
                 "limit": {"type": "integer", "default": 5}
             }),
             vec!["file_uuid", "query_type"],
@@ -144,6 +149,26 @@ fn make_tools(pool: &sqlx::PgPool) -> Vec<ToolDef> {
             }),
             vec!["query"],
         ),
+        function_calling::make_tool(
+            "identity_text",
+            "搜尋文字關鍵字，找出有提及該內容的影片人物。適合回答「誰說了OOO」、「誰跟OOO有關」。不是查詢人物的台詞，而是用文字反查人物。",
+            serde_json::json!({
+                "q": {"type": "string", "description": "搜尋關鍵字（台詞片段、主題等）"},
+                "file_uuid": {"type": "string", "description": "限制搜尋範圍（可選）"},
+                "limit": {"type": "integer", "default": 10}
+            }),
+            vec!["q"],
+        ),
+        function_calling::make_tool(
+            "identities_search",
+            "查詢特定人物的台詞/發言內容。輸入人物名稱，回傳該人物在影片中說過的話。適合回答「某某人說了什麼」、「某某人的台詞」。",
+            serde_json::json!({
+                "q": {"type": "string", "description": "人物名稱關鍵字（姓名、角色名、別名）"},
+                "file_uuid": {"type": "string", "description": "限制搜尋範圍（可選）"},
+                "limit": {"type": "integer", "default": 10}
+            }),
+            vec!["q"],
+        ),
         function_calling::make_tool(
             "get_identity_detail",
             "查詢單一身份的詳細資料（名字、角色、TMDb 資訊）。",
@@ -168,6 +193,16 @@ fn make_tools(pool: &sqlx::PgPool) -> Vec<ToolDef> {
             }),
             vec!["file_uuid"],
         ),
+        function_calling::make_tool(
+            "analyze_frame",
+            "分析影片中指定畫面的視覺內容（場景、人物表情、動作、物件等）。若不指定 frame_number，會使用代表性畫面。問題會傳給視覺 LLM 分析。",
+            serde_json::json!({
+                "file_uuid": {"type": "string", "description": "影片 UUID"},
+                "question": {"type": "string", "description": "關於畫面的問題，例如「這個場景發生什麼事？」"},
+                "frame_number": {"type": "integer", "description": "指定的 frame 編號（可選）"}
+            }),
+            vec!["file_uuid"],
+        ),
     ]
 }
 
@@ -193,9 +228,10 @@ async fn exec_find_file(pool: &sqlx::PgPool, args: &serde_json::Value) -> Result
     if rows.is_empty() {
         return Ok(serde_json::json!({"found": false, "message": "No files match the query. Try different keywords."}).to_string());
     }
-    let files: Vec<serde_json::Value> = rows.into_iter().map(|(u, n, hd)| {
-        serde_json::json!({"file_uuid": u, "file_name": n, "has_data": hd})
-    }).collect();
+    let files: Vec<serde_json::Value> = rows
+        .into_iter()
+        .map(|(u, n, hd)| serde_json::json!({"file_uuid": u, "file_name": n, "has_data": hd}))
+        .collect();
     Ok(serde_json::json!({"found": true, "files": files}).to_string())
 }
 
@@ -214,15 +250,19 @@ async fn exec_list_files(pool: &sqlx::PgPool, args: &serde_json::Value) -> Resul
     .await
     .map_err(|e| e.to_string())?;
 
-    let files: Vec<serde_json::Value> = rows.into_iter().map(|(u, n, hd)| {
-        serde_json::json!({"file_uuid": u, "file_name": n, "has_data": hd})
-    }).collect();
+    let files: Vec<serde_json::Value> = rows
+        .into_iter()
+        .map(|(u, n, hd)| serde_json::json!({"file_uuid": u, "file_name": n, "has_data": hd}))
+        .collect();
     Ok(serde_json::json!({"files": files}).to_string())
 }
 
 async fn exec_tkg_query(pool: &sqlx::PgPool, args: &serde_json::Value) -> Result<String, String> {
     let file_uuid = args.get("file_uuid").and_then(|v| v.as_str()).unwrap_or("");
-    let query_type = args.get("query_type").and_then(|v| v.as_str()).unwrap_or("");
+    let query_type = args
+        .get("query_type")
+        .and_then(|v| v.as_str())
+        .unwrap_or("");
     let identity_name = args.get("identity_name").and_then(|v| v.as_str());
     let identity_b = args.get("identity_b").and_then(|v| v.as_str());
     let limit = args.get("limit").and_then(|v| v.as_i64()).unwrap_or(5);
@@ -242,9 +282,11 @@ async fn exec_tkg_query(pool: &sqlx::PgPool, args: &serde_json::Value) -> Result
                  GROUP BY i.uuid, i.name ORDER BY face_count DESC LIMIT $2",
                 fd_table, id_table
             ))
-            .bind(file_uuid).bind(limit)
+            .bind(file_uuid)
+            .bind(limit)
             .fetch_all(pool)
-            .await.map_err(|e| e.to_string())?;
+            .await
+            .map_err(|e| e.to_string())?;
             Ok(serde_json::json!({"identities": rows}).to_string())
         }
         "first_cooccurrence" => {
@@ -325,8 +367,9 @@ async fn exec_tkg_query(pool: &sqlx::PgPool, args: &serde_json::Value) -> Result
         }
         "identity_traces" => {
             let name = identity_name.unwrap_or("");
-            let rows: Vec<(i32, i64, i32, i32)> = sqlx::query_as(&format!(
-                "SELECT fd.trace_id, COUNT(*)::bigint, MIN(fd.frame_number)::int, MAX(fd.frame_number)::int \
+            // MIN/MAX frame_number should be bigint (i64), not int
+            let rows: Vec<(i32, i64, i64, i64)> = sqlx::query_as(&format!(
+                "SELECT fd.trace_id, COUNT(*)::bigint, MIN(fd.frame_number)::bigint, MAX(fd.frame_number)::bigint \
                  FROM {} fd JOIN {} i ON i.id = fd.identity_id \
                  WHERE fd.file_uuid = $1 AND i.name ILIKE $2 \
                  GROUP BY fd.trace_id ORDER BY COUNT(*) DESC LIMIT $3",
@@ -344,14 +387,133 @@ async fn exec_tkg_query(pool: &sqlx::PgPool, args: &serde_json::Value) -> Result
             ))
             .bind(file_uuid)
             .fetch_optional(pool)
-            .await.map_err(|e| e.to_string())?;
+            .await
+            .map_err(|e| e.to_string())?;
             Ok(serde_json::json!({"file_info": row.map(|(n, d, w, h, f)| serde_json::json!({"file_name": n, "duration_sec": d, "width": w, "height": h, "fps": f}))}).to_string())
         }
-        _ => Ok(serde_json::json!({"error": format!("Unknown query_type: {}", query_type)}).to_string()),
+        "speaker_dialogue" => {
+            let name = identity_name.unwrap_or("");
+            let rows: Vec<(String, Option<String>)> = sqlx::query_as(&format!(
+                "SELECT DISTINCT sn.external_id, sn.properties->>'full_text' AS full_text \
+                 FROM {} i \
+                 JOIN {} fd ON fd.identity_id = i.id AND ($2::text IS NULL OR fd.file_uuid = $2) \
+                 JOIN {} fn ON fn.file_uuid = fd.file_uuid \
+                     AND fn.node_type = 'face_trace' \
+                     AND fn.external_id = CONCAT('trace_', fd.trace_id) \
+                 JOIN {} e ON e.source_node_id = fn.id \
+                     AND e.edge_type = 'SPEAKS_AS' \
+                     AND ($2::text IS NULL OR e.file_uuid = $2) \
+                 JOIN {} sn ON sn.id = e.target_node_id \
+                 WHERE i.name ILIKE $1 \
+                 LIMIT $3",
+                id_table, fd_table, nodes, edges, nodes
+            ))
+            .bind(name)
+            .bind(file_uuid)
+            .bind(limit)
+            .fetch_all(pool)
+            .await
+            .map_err(|e| e.to_string())?;
+
+            Ok(
+                serde_json::json!({"speakers": rows.iter().map(|(sid, text)| {
+                serde_json::json!({"speaker_id": sid, "dialogue": text})
+            }).collect::<Vec<_>>()})
+                .to_string(),
+            )
+        }
+        "speaker_interaction" => {
+            let name_a = identity_name.unwrap_or("");
+            let name_b = identity_b.unwrap_or("");
+            if name_a.is_empty() || name_b.is_empty() {
+                return Ok(
+                    serde_json::json!({"error": "identity_name and identity_b are required"})
+                        .to_string(),
+                );
+            }
+
+            // Speaker nodes linked to either identity (face trace -> SPEAKS_AS edge -> speaker node).
+            // full_text / segments are JSON lookups that can be NULL, so both decode as Option.
+            let mut rows: Vec<(String, Option<String>, Option<serde_json::Value>)> = sqlx::query_as(&format!(
+                "SELECT sn.external_id, sn.properties->>'full_text' AS full_text, sn.properties->'segments' AS segments \
+                 FROM {} i \
+                 JOIN {} fd ON fd.identity_id = i.id AND ($3::text IS NULL OR fd.file_uuid = $3) \
+                 JOIN {} fn ON fn.file_uuid = fd.file_uuid \
+                     AND fn.node_type = 'face_trace' \
+                     AND fn.external_id = CONCAT('trace_', fd.trace_id) \
+                 JOIN {} e ON e.source_node_id = fn.id \
+                     AND e.edge_type = 'SPEAKS_AS' \
+                     AND ($3::text IS NULL OR e.file_uuid = $3) \
+                 JOIN {} sn ON sn.id = e.target_node_id \
+                 WHERE (i.name ILIKE $1 OR i.name ILIKE $2) \
+                 ORDER BY sn.external_id",
+                id_table, fd_table, nodes, edges, nodes
+            ))
+            .bind(name_a)
+            .bind(name_b)
+            .bind(file_uuid)
+            .fetch_all(pool)
+            .await
+            .map_err(|e| e.to_string())?;
+            // The join emits one row per matching face-detection row, so a speaker node can repeat;
+            // rows are ordered by external_id, so dropping adjacent repeats keeps one row per id.
+            rows.dedup_by(|a, b| a.0 == b.0);
+
+            let mut interactions = Vec::new();
+            for (i, (sid_a, _, segs_a)) in rows.iter().enumerate() {
+                for (sid_b, _, segs_b) in &rows[i + 1..] {
+                    let a_list = segs_a.as_ref().and_then(|v| v.as_array());
+                    let b_list = segs_b.as_ref().and_then(|v| v.as_array());
+                    if let (Some(a_list), Some(b_list)) = (a_list, b_list) {
+                        for sa in a_list {
+                            let sa_start = sa.get("start").and_then(|v| v.as_f64()).unwrap_or(0.0);
+                            let sa_end = sa.get("end").and_then(|v| v.as_f64()).unwrap_or(0.0);
+                            let sa_text = sa.get("text").and_then(|v| v.as_str()).unwrap_or("");
+                            if sa_text.is_empty() {
+                                continue;
+                            }
+                            for sb in b_list {
+                                let sb_start =
+                                    sb.get("start").and_then(|v| v.as_f64()).unwrap_or(0.0);
+                                let sb_end = sb.get("end").and_then(|v| v.as_f64()).unwrap_or(0.0);
+                                let sb_text = sb.get("text").and_then(|v| v.as_str()).unwrap_or("");
+                                if sb_text.is_empty() {
+                                    continue;
+                                }
+                                // Two segments interact when their [start, end) ranges intersect.
+                                let overlap_start = sa_start.max(sb_start);
+                                let overlap_end = sa_end.min(sb_end);
+                                if overlap_start < overlap_end {
+                                    interactions.push(serde_json::json!({
+                                        "speaker_a": sid_a,
+                                        "speaker_b": sid_b,
+                                        "time_range_s": [overlap_start, overlap_end],
+                                        "dialogue_a": sa_text,
+                                        "dialogue_b": sb_text,
+                                    }));
+                                }
+                            }
+                        }
+                    }
+                }
+            }
+            // Earliest overlap first, then cap at the requested limit; total_cmp cannot panic.
+            let start_of = |v: &serde_json::Value| v["time_range_s"][0].as_f64().unwrap_or(0.0);
+            interactions.sort_by(|a, b| start_of(a).total_cmp(&start_of(b)));
+            interactions.truncate(limit as usize);
+            // NOTE(review): the *_text fields are just the first two rows in external_id order — confirm intent.
+            Ok(serde_json::json!({"interactions": interactions, "speaker_a_text": rows.first().and_then(|r| r.1.clone()), "speaker_b_text": rows.get(1).and_then(|r| r.1.clone())}).to_string())
+        }
+        _ => Ok(
+            serde_json::json!({"error": format!("Unknown query_type: {}", query_type)}).to_string(),
+        ),
     }
 }
 
-async fn exec_smart_search(_pool: &sqlx::PgPool, args: &serde_json::Value) -> Result<String, String> {
+async fn exec_smart_search(
+    _pool: &sqlx::PgPool,
+    args: &serde_json::Value,
+) -> Result<String, String> {
     let query = args.get("query").and_then(|v| v.as_str()).unwrap_or("");
     let file_uuid = args.get("file_uuid").and_then(|v| v.as_str());
     let limit = args.get("limit").and_then(|v| v.as_i64()).unwrap_or(5);
@@ -359,7 +521,8 @@ async fn exec_smart_search(_pool: &sqlx::PgPool, args: &serde_json::Value) -> Re
     let chunk_table = schema::table_name("chunk");
     let mut sql = format!(
         "SELECT chunk_id, text_content, start_frame, end_frame, chunk_type \
-         FROM {} WHERE text_content ILIKE $1", chunk_table
+         FROM {} WHERE text_content ILIKE $1",
+        chunk_table
     );
     if file_uuid.is_some() {
         sql.push_str(" AND file_uuid = $2");
@@ -369,21 +532,147 @@ async fn exec_smart_search(_pool: &sqlx::PgPool, args: &serde_json::Value) -> Re
     if let Some(fuid) = file_uuid {
         let like = format!("%{}%", query);
         let rows: Vec<(String, Option<String>, i64, i64, String)> = sqlx::query_as(&sql)
-            .bind(&like).bind(fuid)
+            .bind(&like)
+            .bind(fuid)
             .fetch_all(_pool)
-            .await.map_err(|e| e.to_string())?;
+            .await
+            .map_err(|e| e.to_string())?;
         Ok(serde_json::json!({"results": rows}).to_string())
     } else {
         let like = format!("%{}%", query);
         let rows: Vec<(String, Option<String>, i64, i64, String)> = sqlx::query_as(&sql)
             .bind(&like)
             .fetch_all(_pool)
-            .await.map_err(|e| e.to_string())?;
+            .await
+            .map_err(|e| e.to_string())?;
         Ok(serde_json::json!({"results": rows}).to_string())
     }
 }
 
-async fn exec_get_identity_detail(pool: &sqlx::PgPool, args: &serde_json::Value) -> Result<String, String> {
+/// Agent tool `identity_text`: returns chunks whose text contains `q`, each paired with the
+/// identities whose face detections fall inside the chunk's frame range. `q` is matched
+/// literally (LIKE metacharacters are escaped) and `limit` is clamped to 1..=50.
+async fn exec_identity_text(
+    pool: &sqlx::PgPool,
+    args: &serde_json::Value,
+) -> Result<String, String> {
+    let q = args.get("q").and_then(|v| v.as_str()).unwrap_or("");
+    let file_uuid = args.get("file_uuid").and_then(|v| v.as_str());
+    let limit = args
+        .get("limit")
+        .and_then(|v| v.as_i64())
+        .unwrap_or(10)
+        .clamp(1, 50);
+
+    let chunk_table = schema::table_name("chunk");
+    let fd_table = schema::table_name("face_detections");
+    let id_table = schema::table_name("identities");
+    // Backslash is LIKE's default escape character; doubling `%` does not make it literal.
+    let escaped_q = q
+        .replace('\\', "\\\\")
+        .replace('%', "\\%")
+        .replace('_', "\\_");
+    let like_q = format!("%{}%", escaped_q);
+
+    // A chunk can join to many detections of one identity; DISTINCT returns each pairing once.
+    let sql = format!(
+        "SELECT DISTINCT c.chunk_id, c.start_time, c.end_time, c.text_content, \
+                i.name AS identity_name, fd.trace_id, i.source AS identity_source \
+         FROM {} c \
+         JOIN {} fd ON fd.file_uuid = c.file_uuid \
+             AND fd.frame_number BETWEEN c.start_frame AND c.end_frame \
+             AND fd.identity_id IS NOT NULL \
+         JOIN {} i ON i.id = fd.identity_id \
+         WHERE ($1::text IS NULL OR c.file_uuid = $1) \
+           AND (LOWER(c.text_content) LIKE LOWER($2) OR LOWER(c.content::text) LIKE LOWER($2)) \
+         ORDER BY c.start_time \
+         LIMIT $3",
+        chunk_table, fd_table, id_table
+    );
+
+    // `source` is read as Option in `exec_get_identity_detail`, so a NULL must decode here too.
+    type TextRow = (String, f64, f64, Option<String>, String, Option<i32>, Option<String>);
+    let rows: Vec<TextRow> = sqlx::query_as(&sql)
+        .bind(file_uuid)
+        .bind(&like_q)
+        .bind(limit)
+        .fetch_all(pool)
+        .await
+        .map_err(|e| e.to_string())?;
+
+    let results: Vec<serde_json::Value> = rows
+        .iter()
+        .map(|(chunk_id, st, et, txt, name, tid, src)| {
+            serde_json::json!({
+                "chunk_id": chunk_id, "start_time": st, "end_time": et,
+                "text": txt, "identity_name": name,
+                "trace_id": tid, "source": src
+            })
+        })
+        .collect();
+    Ok(serde_json::json!({"results": results}).to_string())
+}
+
+/// Agent tool `identities_search`: finds identities whose name or alias contains `q` and lists
+/// the chunks in which their faces were detected. `q` is LIKE-escaped; `limit` is 1..=50.
+async fn exec_identities_search(
+    pool: &sqlx::PgPool,
+    args: &serde_json::Value,
+) -> Result<String, String> {
+    let q = args.get("q").and_then(|v| v.as_str()).unwrap_or("");
+    let file_uuid = args.get("file_uuid").and_then(|v| v.as_str());
+    let limit = args
+        .get("limit")
+        .and_then(|v| v.as_i64())
+        .unwrap_or(10)
+        .clamp(1, 50);
+
+    let id_table = schema::table_name("identities");
+    let fd_table = schema::table_name("face_detections");
+    let chunk_table = schema::table_name("chunk");
+    let escaped_q = q
+        .replace('\\', "\\\\")
+        .replace('%', "\\%")
+        .replace('_', "\\_");
+    let like_q = format!("%{}%", escaped_q);
+
+    let sql = format!(
+        "SELECT DISTINCT ON (i.name, c.chunk_id) \
+                i.name, c.chunk_id, c.start_time, c.end_time, c.text_content, fd.trace_id \
+         FROM {} i JOIN {} fd ON fd.identity_id = i.id \
+         JOIN {} c ON c.file_uuid = fd.file_uuid \
+             AND c.start_time <= fd.frame_number / COALESCE(c.fps, 25.0) \
+             AND c.end_time >= fd.frame_number / COALESCE(c.fps, 25.0) \
+         WHERE (i.name ILIKE $1 \
+             OR EXISTS (SELECT 1 FROM jsonb_array_elements(i.metadata->'aliases') AS a WHERE a->>'name' ILIKE $1)) \
+           AND ($2::text IS NULL OR fd.file_uuid = $2) \
+         ORDER BY i.name, c.chunk_id, c.start_time LIMIT $3",
+        id_table, fd_table, chunk_table
+    );
+
+    let rows: Vec<(String, String, f64, f64, Option<String>, Option<i32>)> = sqlx::query_as(&sql)
+        .bind(&like_q)
+        .bind(file_uuid)
+        .bind(limit)
+        .fetch_all(pool)
+        .await
+        .map_err(|e| e.to_string())?;
+
+    Ok(
+        serde_json::json!({"results": rows.iter().map(|(name, chunk_id, st, et, txt, tid)| {
+            serde_json::json!({
+                "identity_name": name, "chunk_id": chunk_id, "start_time": st,
+                "end_time": et, "text": txt, "trace_id": tid,
+            })
+        }).collect::<Vec<_>>()})
+        .to_string(),
+    )
+}
+
+async fn exec_get_identity_detail(
+    pool: &sqlx::PgPool,
+    args: &serde_json::Value,
+) -> Result<String, String> {
     let name = args.get("name").and_then(|v| v.as_str()).unwrap_or("");
     let id_table = schema::table_name("identities");
     let row: Option<(String, String, Option<String>, Option<i32>, Option<String>)> = sqlx::query_as(&format!(
@@ -396,7 +685,10 @@ async fn exec_get_identity_detail(pool: &sqlx::PgPool, args: &serde_json::Value)
     Ok(serde_json::json!({"identity": row.map(|(u, n, s, t, c)| serde_json::json!({"uuid": u, "name": n, "source": s, "tmdb_id": t, "character": c}))}).to_string())
 }
 
-async fn exec_get_file_info(pool: &sqlx::PgPool, args: &serde_json::Value) -> Result<String, String> {
+async fn exec_get_file_info(
+    pool: &sqlx::PgPool,
+    args: &serde_json::Value,
+) -> Result<String, String> {
     let file_uuid = args.get("file_uuid").and_then(|v| v.as_str()).unwrap_or("");
     let videos = schema::table_name("videos");
     let row: Option<(String, f64, i32, i32, f64)> = sqlx::query_as(&format!(
@@ -405,11 +697,15 @@ async fn exec_get_file_info(pool: &sqlx::PgPool, args: &serde_json::Value) -> Re
     ))
     .bind(file_uuid)
     .fetch_optional(pool)
-    .await.map_err(|e| e.to_string())?;
+    .await
+    .map_err(|e| e.to_string())?;
     Ok(serde_json::json!({"file_info": row.map(|(n, d, w, h, f)| serde_json::json!({"file_name": n, "duration_sec": d, "width": w, "height": h, "fps": f}))}).to_string())
 }
 
-async fn exec_get_representative_frame(pool: &sqlx::PgPool, args: &serde_json::Value) -> Result<String, String> {
+async fn exec_get_representative_frame(
+    pool: &sqlx::PgPool,
+    args: &serde_json::Value,
+) -> Result<String, String> {
     let file_uuid = args.get("file_uuid").and_then(|v| v.as_str()).unwrap_or("");
     match crate::core::processor::tkg::query_auto_representative_frame(pool, file_uuid).await {
         Ok(r) => Ok(serde_json::json!({
@@ -417,24 +713,131 @@ async fn exec_get_representative_frame(pool: &sqlx::PgPool, args: &serde_json::V
             "face_quality": r.face_quality,
             "main_identities": r.main_identities,
             "traces": r.traces,
-        }).to_string()),
+        })
+        .to_string()),
         Err(e) => Ok(serde_json::json!({"error": e.to_string()}).to_string()),
     }
 }
 
+/// Agent tool `analyze_frame`: extracts one video frame with ffmpeg and asks the vision LLM
+/// `question` about it. Frame choice: `frame_number` arg, else the auto representative frame,
+/// else the video midpoint. A missing `file_uuid` or ffmpeg failure yields `{"error": ..}`.
+async fn exec_analyze_frame(
+    pool: &sqlx::PgPool,
+    args: &serde_json::Value,
+) -> Result<String, String> {
+    let file_uuid = args.get("file_uuid").and_then(|v| v.as_str()).unwrap_or("");
+    let question = args
+        .get("question")
+        .and_then(|v| v.as_str())
+        .unwrap_or("請描述這個畫面中的內容");
+
+    if file_uuid.is_empty() {
+        return Ok(serde_json::json!({"error": "file_uuid is required"}).to_string());
+    }
+
+    let videos = schema::table_name("videos");
+    let (video_path, fps): (String, f64) = sqlx::query_as(&format!(
+        "SELECT file_path, COALESCE(fps, 25.0) FROM {} WHERE file_uuid = $1",
+        videos
+    ))
+    .bind(file_uuid)
+    .fetch_optional(pool)
+    .await
+    .map_err(|e| e.to_string())?
+    .ok_or_else(|| "Video not found".to_string())?;
+    // COALESCE only covers NULL; a stored fps of 0 would turn the division below into inf/NaN.
+    let fps = if fps > 0.0 { fps } else { 25.0 };
+
+    let frame_number = match args.get("frame_number").and_then(|v| v.as_i64()) {
+        // A negative frame would become a negative `-ss` seek position.
+        Some(f) => f.max(0),
+        None => {
+            match crate::core::processor::tkg::query_auto_representative_frame(pool, file_uuid)
+                .await
+            {
+                Ok(r) => r.frame_number,
+                Err(_) => {
+                    let duration: f64 = sqlx::query_scalar(&format!(
+                        "SELECT COALESCE(duration, 0) FROM {} WHERE file_uuid = $1",
+                        videos
+                    ))
+                    .bind(file_uuid)
+                    .fetch_optional(pool)
+                    .await
+                    .map_err(|e| e.to_string())?
+                    .unwrap_or(0.0);
+                    if duration > 0.0 {
+                        ((duration / 2.0) * fps) as i64
+                    } else {
+                        0
+                    }
+                }
+            }
+        }
+    };
+
+    let timestamp_secs = frame_number as f64 / fps;
+
+    let ffmpeg_path = std::env::var("MOMENTRY_FFMPEG").unwrap_or_else(|_| {
+        let full = "/opt/homebrew/opt/ffmpeg-full/bin/ffmpeg";
+        if std::path::Path::new(full).exists() {
+            full.to_string()
+        } else {
+            "ffmpeg".to_string()
+        }
+    });
+
+    let seek = format!("{:.3}", timestamp_secs);
+    let output = tokio::process::Command::new(&ffmpeg_path)
+        .args(["-ss", &seek, "-i", &video_path, "-vframes", "1"])
+        .args(["-f", "image2pipe", "-vcodec", "mjpeg", "-"])
+        .output()
+        .await
+        .map_err(|e| format!("ffmpeg execution error: {}", e))?;
+
+    if !output.status.success() {
+        let stderr = String::from_utf8_lossy(&output.stderr);
+        return Ok(serde_json::json!({"error": format!("ffmpeg failed: {}", stderr)}).to_string());
+    }
+    // ffmpeg can exit 0 without emitting a frame (e.g. seek past the end); skip the LLM call.
+    if output.stdout.is_empty() {
+        return Ok(serde_json::json!({"error": "ffmpeg produced no frame"}).to_string());
+    }
+
+    let base64_img = BASE64.encode(&output.stdout);
+
+    let system_prompt =
+        "你是一個專業的影片畫面分析助手。請根據提供的畫面以及用戶的問題，詳細描述畫面中的內容，包括場景、人物、動作、表情、物件等。請用繁體中文回答。";
+    let vision_result = call_llm_vision(system_prompt, question, vec![base64_img], 1024, 120)
+        .await
+        .map_err(|e| e.to_string())?;
+
+    Ok(serde_json::json!({
+        "frame_number": frame_number,
+        "timestamp_secs": timestamp_secs,
+        "analysis": vision_result,
+    })
+    .to_string())
+}
+
 // ── Tool Router ───────────────────────────────────────────────────
 
 async fn execute_tool(pool: &sqlx::PgPool, tool_call: &ToolCall) -> (String, String, String) {
     let name = tool_call.function.name.clone();
-    let args: serde_json::Value = serde_json::from_str(&tool_call.function.arguments).unwrap_or_default();
+    let args: serde_json::Value =
+        serde_json::from_str(&tool_call.function.arguments).unwrap_or_default();
     let result = match name.as_str() {
         "find_file" => exec_find_file(pool, &args).await,
         "list_files" => exec_list_files(pool, &args).await,
         "tkg_query" => exec_tkg_query(pool, &args).await,
         "smart_search" => exec_smart_search(pool, &args).await,
+        "identity_text" => exec_identity_text(pool, &args).await,
+        "identities_search" => exec_identities_search(pool, &args).await,
         "get_identity_detail" => exec_get_identity_detail(pool, &args).await,
         "get_file_info" => exec_get_file_info(pool, &args).await,
         "get_representative_frame" => exec_get_representative_frame(pool, &args).await,
+        "analyze_frame" => exec_analyze_frame(pool, &args).await,
         _ => Err(format!("Unknown tool: {}", name)),
     };
     let content = match result {
@@ -476,7 +879,11 @@ async fn run_tool_loop(
                 for call in &calls {
                     let (tool_call_id, name, content) = execute_tool(pool, call).await;
                     sources.push(serde_json::json!({"tool": name, "result": content}));
-                    messages.push(function_calling::make_tool_result(&tool_call_id, &name, &content));
+                    messages.push(function_calling::make_tool_result(
+                        &tool_call_id,
+                        &name,
+                        &content,
+                    ));
                 }
             }
             Err(e) => {
@@ -484,7 +891,10 @@ async fn run_tool_loop(
             }
         }
     }
-    ("已達到最大查詢次數，請縮小問題範圍後重新詢問。".to_string(), sources)
+    (
+        "已達到最大查詢次數，請縮小問題範圍後重新詢問。".to_string(),
+        sources,
+    )
 }
 
 // ── Handler ───────────────────────────────────────────────────────
@@ -495,13 +905,8 @@ async fn agent_search(
 ) -> Result<Json<AgentSearchResponse>, (StatusCode, Json<serde_json::Value>)> {
     let (conv_id, history) = get_or_create_conv(req.conversation_id.as_deref());
 
-    let (answer, sources) = run_tool_loop(
-        state.db.pool(),
-        SYSTEM_PROMPT,
-        &req.query,
-        history,
-    )
-    .await;
+    let (answer, sources) =
+        run_tool_loop(state.db.pool(), SYSTEM_PROMPT, &req.query, history).await;
 
     // Save updated messages for conversation continuation
     let new_msgs = function_calling::build_conversation(SYSTEM_PROMPT, &req.query, vec![]);
@@ -509,7 +914,11 @@ async fn agent_search(
 
     let needs_input = answer.contains('？') || answer.contains('?');
     let suggestions = if needs_input {
-        Some(vec!["演員名".to_string(), "電影片名".to_string(), "年份".to_string()])
+        Some(vec![
+            "演員名".to_string(),
+            "電影片名".to_string(),
+            "年份".to_string(),
+        ])
     } else {
         None
     };
@@ -526,6 +935,5 @@ async fn agent_search(
 // ── Routes ─────────────────────────────────────────────────────────
 
 pub fn agent_search_routes() -> Router<AppState> {
-    Router::new()
-        .route("/api/v1/agents/search", post(agent_search))
+    Router::new().route("/api/v1/agents/search", post(agent_search))
 }
diff --git a/src/api/docs.rs b/src/api/docs.rs
index 1f52c6b..bbf55ca 100644
--- a/src/api/docs.rs
+++ b/src/api/docs.rs
@@ -8,8 +8,7 @@ async fn doc_redirect() -> axum::response::Redirect {
 
 async fn wasm_doc_handler() -> Result<impl axum::response::IntoResponse, (StatusCode, &'static str)>
 {
-    let path =
-        std::path::Path::new("/Users/accusys/momentry_core/docs_v1.0/doc_wasm/index.html");
+    let path = std::path::Path::new("/Users/accusys/momentry_core/docs_v1.0/doc_wasm/index.html");
     match tokio::fs::read_to_string(path).await {
         Ok(html) => Ok(([("content-type", "text/html; charset=utf-8")], html)),
         Err(_) => Err((StatusCode::NOT_FOUND, "Doc not found")),
diff --git a/src/api/files.rs b/src/api/files.rs
index 5793f52..4c9a9a6 100644
--- a/src/api/files.rs
+++ b/src/api/files.rs
@@ -12,7 +12,7 @@ use std::collections::HashMap;
 use super::types::AppState;
 use crate::core::config;
 use crate::core::db::schema;
-use crate::core::db::{Database, PostgresDb};
+use crate::core::db::{Database, PostgresDb, QdrantDb, RedisClient};
 use crate::core::storage::content_hash;
 use crate::FileManager;
 
@@ -767,17 +767,7 @@ async fn register_file(
             if let Some(ref vp) = video_path {
                 if let Ok(job) = auto_state.db.create_monitor_job(&auto_uuid, Some(vp)).await {
                     tracing::info!("[AUTO-PIPELINE] Job {} created for {}", job.id, auto_uuid);
-                    let all_procs: Vec<&str> = vec![
-                        "asr",
-                        "cut",
-                        "yolo",
-                        "ocr",
-                        "face",
-                        "pose",
-                        "asrx",
-                        "visual_chunk",
-                        "5w1h",
-                    ];
+                    let all_procs: Vec<&str> = vec!["cut", "yolo", "ocr", "face", "pose", "asrx"];
                     let total = sqlx::query_scalar::<_, i64>(&format!(
                         "SELECT COALESCE(total_frames, 0) FROM {} WHERE file_uuid = $1",
                         schema::table_name("videos")
@@ -986,6 +976,10 @@ struct UnregisterResponse {
     deleted_face_detections: u64,
     deleted_processor_results: u64,
     deleted_chunks: u64,
+    deleted_tkg_nodes: u64,
+    deleted_qdrant_vectors: Option<u64>,
+    deleted_redis_keys: Option<u64>,
+    deleted_output_files: u64,
 }
 
 #[derive(Debug, Deserialize)]
@@ -994,18 +988,30 @@ struct UnregisterRequest {
     file_path: Option<String>,
 }
 
-fn delete_output_files(uuid: &str) {
-    let output_dir = config::OUTPUT_DIR.to_string();
-    if let Ok(entries) = std::fs::read_dir(&output_dir) {
-        for entry in entries.flatten() {
-            let path = entry.path();
-            if let Some(name) = path.file_name().and_then(|n| n.to_str()) {
-                if name.starts_with(uuid) {
-                    let _ = std::fs::remove_file(&path);
+/// Deletes `<uuid>*.json` outputs and returns how many were removed; empty `uuid` matches none.
+fn delete_output_files(uuid: &str) -> u64 {
+    let mut deleted_count = 0u64;
+    let output_dirs = [
+        config::OUTPUT_DIR.to_string(),
+        "/Users/accusys/momentry/output_dev".to_string(),
+        "/Users/accusys/momentry/output".to_string(),
+    ];
+    for output_dir in &output_dirs {
+        if let Ok(entries) = std::fs::read_dir(output_dir) {
+            for entry in entries.flatten() {
+                let path = entry.path();
+                if let Some(name) = path.file_name().and_then(|n| n.to_str()) {
+                    if !uuid.is_empty() && name.starts_with(uuid) && name.ends_with(".json") {
+                        if std::fs::remove_file(&path).is_ok() {
+                            deleted_count += 1;
+                            tracing::info!("[UNREGISTER] Deleted output file: {}", name);
+                        }
+                    }
                 }
             }
         }
     }
+    deleted_count
 }
 
 async fn unregister(
@@ -1024,65 +1030,54 @@ async fn unregister(
     let processor_table = schema::table_name("processor_results");
     let chunks_table = schema::table_name("chunk");
     let parent_chunks_table = schema::table_name("parent_chunks");
-
-    let deleted_faces: i64 =
-        sqlx::query(&format!("DELETE FROM {} WHERE file_uuid = $1", face_table))
-            .bind(&uuid)
-            .execute(state.db.pool())
-            .await
-            .map_err(|e| {
-                tracing::error!("[unregister] Failed to delete faces: {}", e);
-                StatusCode::INTERNAL_SERVER_ERROR
-            })?
-            .rows_affected() as i64;
-
-    let deleted_processors: i64 = sqlx::query(&format!(
-        "DELETE FROM {} WHERE file_uuid = $1",
-        processor_table
-    ))
-    .bind(&uuid)
-    .execute(state.db.pool())
-    .await
-    .map_err(|e| {
-        tracing::error!("[unregister] Failed to delete processors: {}", e);
-        StatusCode::INTERNAL_SERVER_ERROR
-    })?
-    .rows_affected() as i64;
-
-    let deleted_parent_chunks: i64 = sqlx::query(&format!(
-        "DELETE FROM {} WHERE uuid = $1",
-        parent_chunks_table
-    ))
-    .bind(&uuid)
-    .execute(state.db.pool())
-    .await
-    .map_err(|e| {
-        tracing::error!("[unregister] Failed to delete parent chunks: {}", e);
-        StatusCode::INTERNAL_SERVER_ERROR
-    })?
-    .rows_affected() as i64;
-
-    let deleted_chunks: i64 = sqlx::query(&format!("DELETE FROM {} WHERE file_uuid = $1", chunks_table))
-        .bind(&uuid)
-        .execute(state.db.pool())
-        .await
-        .map_err(|e| {
-            tracing::error!("[unregister] Failed to delete chunks: {}", e);
-            StatusCode::INTERNAL_SERVER_ERROR
-        })?
-        .rows_affected() as i64;
-
-    // Delete pre_chunks
     let pre_chunks_table = schema::table_name("pre_chunks");
-    let deleted_pre_chunks: i64 = sqlx::query(&format!(
-        "DELETE FROM {} WHERE file_uuid = $1",
-        pre_chunks_table
+    let tkg_nodes_table = schema::table_name("tkg_nodes");
+    let cuts_table = schema::table_name("cuts");
+    let strangers_table = schema::table_name("strangers");
+    let chunk_vectors_table = schema::table_name("chunk_vectors");
+    let monitor_jobs_table = schema::table_name("monitor_jobs");
+    let frames_table = schema::table_name("frames");
+
+    let mut tx = state.db.pool().begin().await.map_err(|e| {
+        tracing::error!("[unregister] Failed to start transaction: {}", e);
+        StatusCode::INTERNAL_SERVER_ERROR
+    })?;
+
+    macro_rules! delete_safe {
+        ($table:expr, $where:expr, $bind:expr, $label:expr) => {{
+            sqlx::query(&format!("DELETE FROM {} WHERE {}", $table, $where))
+                .bind($bind)
+                .execute(&mut *tx)
+                .await
+                .map_err(|e| {
+                    tracing::error!("[unregister] Failed to delete {}: {}", $label, e);
+                    StatusCode::INTERNAL_SERVER_ERROR
+                })?
+                .rows_affected() as i64
+        }};
+    }
+
+    let deleted_faces = delete_safe!(face_table, "file_uuid = $1", &uuid, "faces");
+    let deleted_processors = delete_safe!(processor_table, "file_uuid = $1", &uuid, "processors");
+    let deleted_parent_chunks =
+        delete_safe!(parent_chunks_table, "uuid = $1", &uuid, "parent chunks");
+    let deleted_chunks = delete_safe!(chunks_table, "file_uuid = $1", &uuid, "chunks");
+    let deleted_pre_chunks = delete_safe!(pre_chunks_table, "file_uuid = $1", &uuid, "pre_chunks");
+    let deleted_tkg_nodes = delete_safe!(tkg_nodes_table, "file_uuid = $1", &uuid, "TKG nodes");
+    let deleted_cuts = delete_safe!(cuts_table, "file_uuid = $1", &uuid, "cuts");
+    let deleted_strangers = delete_safe!(strangers_table, "file_uuid = $1", &uuid, "strangers");
+    let deleted_chunk_vectors =
+        delete_safe!(chunk_vectors_table, "uuid = $1", &uuid, "chunk vectors");
+    let deleted_monitor_jobs = delete_safe!(monitor_jobs_table, "uuid = $1", &uuid, "monitor jobs");
+    let deleted_frames: i64 = sqlx::query(&format!(
+        "DELETE FROM {} WHERE file_id = (SELECT id FROM {} WHERE file_uuid = $1)",
+        frames_table, videos_table
     ))
     .bind(&uuid)
-    .execute(state.db.pool())
+    .execute(&mut *tx)
     .await
     .map_err(|e| {
-        tracing::error!("[unregister] Failed to delete pre_chunks: {}", e);
+        tracing::error!("[unregister] Failed to delete frames: {}", e);
         StatusCode::INTERNAL_SERVER_ERROR
     })?
     .rows_affected() as i64;
@@ -1092,14 +1087,59 @@ async fn unregister(
         videos_table
     ))
     .bind(&uuid)
-    .execute(state.db.pool())
+    .execute(&mut *tx)
     .await
     .map_err(|e| {
         tracing::error!("[unregister] Failed: {}", e);
         StatusCode::INTERNAL_SERVER_ERROR
     })?;
 
-    delete_output_files(&uuid);
+    tx.commit().await.map_err(|e| {
+        tracing::error!("[unregister] Failed to commit transaction: {}", e);
+        StatusCode::INTERNAL_SERVER_ERROR
+    })?;
+
+    tracing::info!(
+        "[UNREGISTER] Deleted: {} faces, {} processors, {} parent_chunks, {} chunks, {} pre_chunks, {} tkg_nodes, {} cuts, {} strangers, {} chunk_vectors, {} monitor_jobs, {} frames",
+        deleted_faces, deleted_processors, deleted_parent_chunks, deleted_chunks,
+        deleted_pre_chunks, deleted_tkg_nodes, deleted_cuts, deleted_strangers,
+        deleted_chunk_vectors, deleted_monitor_jobs, deleted_frames
+    );
+
+    let deleted_output_files = delete_output_files(&uuid);
+
+    let deleted_qdrant_vectors = {
+        let qdrant = QdrantDb::new();
+        match qdrant.delete_by_uuid(&uuid).await {
+            Ok(_) => {
+                tracing::info!("[UNREGISTER] Deleted Qdrant vectors for {}", uuid);
+                Some(1)
+            }
+            Err(e) => {
+                tracing::warn!("[UNREGISTER] Failed to delete Qdrant vectors: {}", e);
+                None
+            }
+        }
+    };
+
+    let deleted_redis_keys = {
+        match RedisClient::new() {
+            Ok(redis) => match redis.delete_worker_job(&uuid).await {
+                Ok(_) => {
+                    tracing::info!("[UNREGISTER] Deleted Redis keys for {}", uuid);
+                    Some(1)
+                }
+                Err(e) => {
+                    tracing::warn!("[UNREGISTER] Failed to delete Redis keys: {}", e);
+                    None
+                }
+            },
+            Err(e) => {
+                tracing::warn!("[UNREGISTER] Failed to create Redis client: {}", e);
+                None
+            }
+        }
+    };
 
     Ok(Json(UnregisterResponse {
         success: true,
@@ -1107,7 +1147,11 @@ async fn unregister(
         file_uuid: uuid,
         deleted_face_detections: deleted_faces as u64,
         deleted_processor_results: deleted_processors as u64,
-        deleted_chunks: (deleted_chunks + deleted_parent_chunks) as u64,
+        deleted_chunks: (deleted_chunks + deleted_parent_chunks + deleted_pre_chunks) as u64,
+        deleted_tkg_nodes: deleted_tkg_nodes as u64,
+        deleted_qdrant_vectors,
+        deleted_redis_keys,
+        deleted_output_files,
     }))
 }
 
diff --git a/src/api/five_w1h_agent_api.rs b/src/api/five_w1h_agent_api.rs
index 759a8f9..705b717 100644
--- a/src/api/five_w1h_agent_api.rs
+++ b/src/api/five_w1h_agent_api.rs
@@ -471,7 +471,7 @@ async fn store_parent_summary(
         "sentence_count": sentences.len(),
     });
     sqlx::query(&format!(
-        r#"UPDATE {} SET summary_text = $1, metadata = metadata || $2::jsonb
+        r#"UPDATE {} SET summary_text = $1, metadata = jsonb_deep_merge(COALESCE(metadata, '{{}}'::jsonb), $2::jsonb)
            WHERE chunk_id = $3 AND file_uuid = $4"#,
         table
     ))
@@ -743,7 +743,7 @@ pub async fn run_5w1h_agent(db: &PostgresDb, file_uuid: &str) -> anyhow::Result<
 
     // Auto-vectorize sentences with EmbeddingGemma (768D)
     tracing::info!("[5W1H] Starting vectorize for sentence chunks...");
-    let embedder = Embedder::new("embeddinggemma-300M-Q8_0.gguf".to_string());
+    let embedder = Embedder::new("embeddinggemma-300m".to_string());
     let qdrant = QdrantDb::new();
     qdrant.init_collection(768).await?;
 
diff --git a/src/api/health.rs b/src/api/health.rs
index 4737133..ee9339c 100644
--- a/src/api/health.rs
+++ b/src/api/health.rs
@@ -388,10 +388,18 @@ async fn health_detailed(State(state): State<AppState>) -> Json<DetailedHealthRe
             let directory_exists = identities_root.is_dir();
             let files_count = crate::core::identity::storage::count_identity_files();
             let index_ok = crate::core::identity::storage::read_index().is_ok();
-            let db_count: i64 = sqlx::query_scalar("SELECT COUNT(*) FROM identities")
+            let id_cnt: i64 = sqlx::query_scalar("SELECT COUNT(*) FROM identities")
                 .fetch_one(state.db.pool())
                 .await
                 .unwrap_or(0);
+            let st_cnt: i64 = sqlx::query_scalar(&format!(
+                "SELECT COUNT(*) FROM {} WHERE file_uuid IS NOT NULL",
+                crate::core::db::schema::table_name("strangers")
+            ))
+            .fetch_one(state.db.pool())
+            .await
+            .unwrap_or(0);
+            let db_count = id_cnt + st_cnt;
             IdentityHealth {
                 directory_exists,
                 files_count,
diff --git a/src/api/identities.rs b/src/api/identities.rs
index 2477761..01b4989 100644
--- a/src/api/identities.rs
+++ b/src/api/identities.rs
@@ -220,8 +220,8 @@ async fn list_identities(
     .await
     .unwrap_or(0);
     let auto_identities: i64 = sqlx::query_scalar(&format!(
-        "SELECT COUNT(*) FROM {} WHERE source = 'auto'",
-        identities_table
+        "SELECT COUNT(*) FROM {} WHERE file_uuid IS NOT NULL",
+        crate::core::db::schema::table_name("strangers")
     ))
     .fetch_one(db.pool())
     .await
@@ -258,7 +258,7 @@ pub struct FaceCandidate {
     pub id: i32,
     pub face_id: Option<String>,
     pub file_uuid: String,
-    pub frame_number: i32,
+    pub frame_number: i64,
     pub confidence: f32,
     pub bbox: Option<serde_json::Value>,
     pub attributes: Option<serde_json::Value>,
@@ -352,7 +352,7 @@ async fn list_face_candidates(
 
     let rows = if let Some(file_uuid) = &query.file_uuid {
         let sql = format!(
-            "SELECT id, face_id, file_uuid, frame_number::int, confidence::float4, 
+            "SELECT id, face_id, file_uuid, frame_number::bigint, confidence::float4, 
                     jsonb_build_object('x', x, 'y', y, 'width', width, 'height', height) as bbox,
                     NULL::jsonb as attributes 
              FROM {} 
@@ -367,7 +367,7 @@ async fn list_face_candidates(
                 i32,
                 Option<String>,
                 String,
-                i32,
+                i64,
                 f32,
                 Option<serde_json::Value>,
                 Option<serde_json::Value>,
@@ -390,7 +390,7 @@ async fn list_face_candidates(
         }
     } else {
         let sql = format!(
-            "SELECT id, face_id, file_uuid, frame_number::int, confidence::float4, 
+            "SELECT id, face_id, file_uuid, frame_number::bigint, confidence::float4, 
                     jsonb_build_object('x', x, 'y', y, 'width', width, 'height', height) as bbox,
                     NULL::jsonb as attributes 
              FROM {} 
@@ -405,7 +405,7 @@ async fn list_face_candidates(
                 i32,
                 Option<String>,
                 String,
-                i32,
+                i64,
                 f32,
                 Option<serde_json::Value>,
                 Option<serde_json::Value>,
diff --git a/src/api/identity_agent_api.rs b/src/api/identity_agent_api.rs
index 56123e9..89787ca 100644
--- a/src/api/identity_agent_api.rs
+++ b/src/api/identity_agent_api.rs
@@ -640,8 +640,9 @@ async fn match_faces_iterative(pool: &sqlx::PgPool, file_uuid: &str) -> anyhow::
     );
 
     // Step 2: 載入所有 face_detections（含 frame_number），按 trace_id 分組
+    // frame_number is BIGINT (i64) in database
     let fd_table = schema::table_name("face_detections");
-    let fd_rows = sqlx::query_as::<_, (i32, i32, Vec<f32>)>(&format!(
+    let fd_rows = sqlx::query_as::<_, (i32, i64, Vec<f32>)>(&format!(
         "SELECT trace_id, frame_number, embedding FROM {} \
          WHERE file_uuid=$1 AND trace_id IS NOT NULL AND embedding IS NOT NULL \
          ORDER BY trace_id, frame_number",
@@ -658,7 +659,7 @@ async fn match_faces_iterative(pool: &sqlx::PgPool, file_uuid: &str) -> anyhow::
 
     // 分組：trace_id → (frame_number, embedding)
     use std::collections::HashMap;
-    let mut trace_faces_raw: HashMap<i32, Vec<(i32, Vec<f32>)>> = HashMap::new();
+    let mut trace_faces_raw: HashMap<i32, Vec<(i64, Vec<f32>)>> = HashMap::new();
     for (tid, frame, emb) in &fd_rows {
         trace_faces_raw
             .entry(*tid)
@@ -723,6 +724,7 @@ async fn match_faces_iterative(pool: &sqlx::PgPool, file_uuid: &str) -> anyhow::
 
     // Step 5: 寫入 DB — Round 1 結果先存
     let identities_table = schema::table_name("identities");
+    let strangers_table = schema::table_name("strangers");
     let fd_table = schema::table_name("face_detections");
     let mut updated = 0usize;
     for (tid, name) in &matched {
@@ -805,13 +807,28 @@ async fn match_faces_iterative(pool: &sqlx::PgPool, file_uuid: &str) -> anyhow::
         }
     }
 
-    // Step 6: 未匹配的 trace 設 stranger_id = trace_id
-    // trace_id 在同一個 file 內是 sequential integer，直接複用為 stranger_id
+    // Step 6: for unmatched traces, set stranger_id = strangers.id (FK)
+    // First: ensure strangers records exist
+    let _ = sqlx::query(&format!(
+        "INSERT INTO {} (file_uuid, trace_id) \
+         SELECT $1, fd.trace_id FROM {} fd \
+         WHERE fd.file_uuid = $1 AND fd.trace_id IS NOT NULL \
+           AND fd.identity_id IS NULL \
+         ON CONFLICT (file_uuid, trace_id) DO NOTHING",
+        strangers_table, fd_table
+    ))
+    .bind(file_uuid)
+    .execute(pool)
+    .await?;
+
+    // Then: update face_detections.stranger_id = strangers.id
     let stranger_update = sqlx::query(&format!(
-        "UPDATE {} SET stranger_id = trace_id \
-             WHERE file_uuid = $1 AND trace_id IS NOT NULL AND identity_id IS NULL \
-               AND (stranger_id IS NULL OR stranger_id != trace_id)",
-        fd_table
+        "UPDATE {} fd SET stranger_id = s.id \
+         FROM {} s \
+         WHERE s.file_uuid = fd.file_uuid AND s.trace_id = fd.trace_id \
+           AND fd.file_uuid = $1 AND fd.identity_id IS NULL \
+           AND fd.trace_id IS NOT NULL AND fd.stranger_id IS NULL",
+        fd_table, strangers_table
     ))
     .bind(file_uuid)
     .execute(pool)
@@ -971,16 +988,30 @@ pub async fn bind_speakers(pool: &sqlx::PgPool, file_uuid: &str) -> anyhow::Resu
 
             let ib_table = schema::table_name("identity_bindings");
             let _ = sqlx::query(
-                &format!("INSERT INTO {} (identity_id, identity_type, identity_value, confidence, metadata) \
-                 VALUES ($1, 'speaker', $2, $3, $4::jsonb) \
-                 ON CONFLICT (identity_id, identity_type, identity_value) DO UPDATE SET confidence = EXCLUDED.confidence, metadata = EXCLUDED.metadata", ib_table)
+                &format!("INSERT INTO {} (identity_id, identity_type, identity_value, file_uuid, confidence, metadata) \
+                 VALUES ($1, 'speaker', $2, $3, $4, $5::jsonb) \
+                 ON CONFLICT (identity_id, identity_type, identity_value, file_uuid) \
+                 DO UPDATE SET confidence = EXCLUDED.confidence, metadata = EXCLUDED.metadata", ib_table)
             )
             .bind(identity_id)
             .bind(&best_speaker)
+            .bind(file_uuid)
             .bind(overlap_ratio)
             .bind(&metadata)
             .execute(pool).await;
 
+            // Also update speaker_detections with the identity_id
+            let sd_table = schema::table_name("speaker_detections");
+            let _ = sqlx::query(
+                &format!("UPDATE {} SET identity_id = $1, confidence = $2 \
+                 WHERE file_uuid = $3 AND speaker_id = $4 AND identity_id IS NULL", sd_table)
+            )
+            .bind(identity_id)
+            .bind(overlap_ratio)
+            .bind(file_uuid)
+            .bind(&best_speaker)
+            .execute(pool).await;
+
             bindings += 1;
         }
     }
@@ -1028,31 +1059,31 @@ pub async fn run_identity_agent(db: &PostgresDb, file_uuid: &str) -> anyhow::Res
         let speakers = extract_speakers_from_asrx_data(&asrx_data);
         let identities = analyze_person_speaker_overlap(&persons, &speakers);
 
-        for (idx, id_result) in identities.iter().enumerate() {
-            let identity_name = format!("stranger_{}", idx);
+        let _ = identities.len();
+        if !identities.is_empty() {
             let metadata = serde_json::json!({
                 "source": "identity_agent",
-                "trace_ids": id_result.person_ids,
-                "speaker_ids": id_result.speaker_ids,
-                "confidence": id_result.confidence,
+                "speaker_ids": identities[0].speaker_ids,
+                "confidence": identities[0].confidence,
                 "evidence": {
-                    "speaker_overlap": id_result.evidence.speaker_overlap,
-                    "frame_ratio": id_result.evidence.frame_ratio,
+                    "speaker_overlap": identities[0].evidence.speaker_overlap,
+                    "frame_ratio": identities[0].evidence.frame_ratio,
                 },
-                "reasoning": id_result.reasoning,
+                "reasoning": identities[0].reasoning,
             });
-            let _ = sqlx::query(
-                &format!("INSERT INTO {} (name, identity_type, source, metadata, status) VALUES ($1, 'people', 'auto', $2::jsonb, 'pending') ON CONFLICT DO NOTHING", schema::table_name("identities"))
-            )
-            .bind(&identity_name)
+            let _ = sqlx::query(&format!(
+                "INSERT INTO {} (file_uuid, trace_id, metadata) \
+                     VALUES ($1, NULL, $2::jsonb) ON CONFLICT DO NOTHING",
+                schema::table_name("strangers")
+            ))
+            .bind(file_uuid)
             .bind(&metadata)
             .execute(pool)
             .await;
         }
-        let _created = identities.len();
         tracing::info!(
-            "[IdentityAgent] Created {} auto identities from face_clustered for {}",
-            _created,
+            "[IdentityAgent] Analyzed {} face clusters from face_clustered for {}",
+            identities.len(),
             file_uuid
         );
     } else {
diff --git a/src/api/identity_api.rs b/src/api/identity_api.rs
index fb5df94..a768137 100644
--- a/src/api/identity_api.rs
+++ b/src/api/identity_api.rs
@@ -1,5 +1,5 @@
 use axum::{
-    extract::{Multipart, Path, Query, State},
+    extract::{Extension, Multipart, Path, Query, State},
     http::StatusCode,
     response::{Html, Json},
     routing::{get, patch, post},
@@ -36,6 +36,7 @@ pub fn identity_routes() -> Router<crate::api::types::AppState> {
             "/api/v1/identity/:identity_uuid/faces",
             get(get_identity_faces),
         )
+        .route("/api/v1/file/:file_uuid/faces", get(get_file_faces))
         .route("/api/v1/resource/register", post(register_resource))
         .route("/api/v1/resource/heartbeat", post(heartbeat_resource))
         .route("/api/v1/resources", get(list_resources))
@@ -55,15 +56,23 @@ pub fn identity_routes() -> Router<crate::api::types::AppState> {
         // Experiment: identity text search (non-polluting, separate endpoint)
         .route("/api/v1/search/identity_text", get(search_identity_text))
         .route("/api/v1/identities/search", get(search_identities_by_text))
+        // Undo/Redo/History
+        .route("/api/v1/identity/:identity_uuid/undo", post(undo_identity))
+        .route("/api/v1/identity/:identity_uuid/redo", post(redo_identity))
+        .route(
+            "/api/v1/identity/:identity_uuid/history",
+            get(get_identity_history),
+        )
 }
 
 // --- Files Endpoints ---
 
 #[derive(Debug, Deserialize)]
 pub struct FilesQuery {
-    page: Option<usize>,
-    page_size: Option<usize>,
-    uuid: Option<String>, // Add uuid filter
+    pub page: Option<usize>, // requested page; e.g. get_identity_files falls back to 1 when absent
+    pub page_size: Option<usize>, // rows per page; each handler picks its own default (20 or 50)
+    pub status: Option<String>, // NOTE(review): consumer not visible here; presumably a status filter, confirm
+    pub file_uuid: Option<String>, // when set, list_files looks up only that file via get_video_by_uuid
 }
 
 async fn list_files(
@@ -74,10 +83,10 @@ async fn list_files(
     let page_size = params.page_size.unwrap_or(20);
 
     // If UUID is provided, fetch that specific file and return it as a list item
-    if let Some(ref uuid) = params.uuid {
+    if let Some(ref file_uuid) = params.file_uuid {
         let video = state
             .db
-            .get_video_by_uuid(uuid)
+            .get_video_by_uuid(file_uuid)
             .await
             .map_err(|e| (StatusCode::INTERNAL_SERVER_ERROR, e.to_string()))?;
 
@@ -387,6 +396,7 @@ async fn get_identity_status(
 pub struct IdentityFilesResponse {
     pub success: bool,
     pub identity_uuid: String,
+    pub name: String,
     pub total: i64,
     pub page: usize,
     pub page_size: usize,
@@ -395,26 +405,87 @@ pub struct IdentityFilesResponse {
 
 async fn delete_identity(
     State(state): State<crate::api::types::AppState>,
+    Extension(auth): Extension<crate::api::middleware::UserAuth>,
     Path(identity_uuid): Path<String>,
 ) -> Result<StatusCode, StatusCode> {
     let table = crate::core::db::schema::table_name("face_detections");
     let id_table = crate::core::db::schema::table_name("identities");
+    let history_table = crate::core::db::schema::table_name("identity_history");
 
-    // Get identity_id from identity_uuid
-    let row: Option<(i32,)> = sqlx::query_as(&format!(
-        "SELECT id FROM {} WHERE replace(uuid::text, '-', '') = $1",
+    let uuid_clean = identity_uuid.replace('-', "");
+
+    // Get identity_id + full snapshot before deletion
+    let row: Option<(i32, serde_json::Value)> = sqlx::query_as(&format!(
+        "SELECT id, jsonb_build_object('id', id, 'uuid', uuid::text, 'name', name, 'identity_type', identity_type, 'source', source, 'status', status, 'metadata', metadata, 'tmdb_id', tmdb_id, 'tmdb_profile', tmdb_profile) FROM {} WHERE replace(uuid::text, '-', '') = $1",
         id_table
     ))
-    .bind(&identity_uuid)
+    .bind(&uuid_clean)
     .fetch_optional(state.db.pool())
     .await
     .map_err(|_| StatusCode::INTERNAL_SERVER_ERROR)?;
 
-    let (identity_id,) = row.ok_or(StatusCode::NOT_FOUND)?;
+    let (identity_id, identity_snapshot) = row.ok_or(StatusCode::NOT_FOUND)?;
+
+    // Delete identity file from disk
+    let _ = crate::core::identity::storage::delete_identity_file(&uuid_clean);
+
+    // Capture unbound faces before unbinding
+    let unbound_faces: Vec<(String, Option<String>, Option<i32>)> = sqlx::query_as(&format!(
+        "SELECT file_uuid, face_id, trace_id FROM {} WHERE identity_id = $1",
+        table
+    ))
+    .bind(identity_id)
+    .fetch_all(state.db.pool())
+    .await
+    .map_err(|_| StatusCode::INTERNAL_SERVER_ERROR)?;
+
+    let face_list: Vec<serde_json::Value> = unbound_faces
+        .into_iter()
+        .map(|(fu, fid, tid)| {
+            serde_json::json!({
+                "file_uuid": fu,
+                "face_id": fid,
+                "trace_id": tid
+            })
+        })
+        .collect();
+
+    // Clear delete redo stack (if identity was previously restored via undo)
+    let _ = sqlx::query(&format!(
+        "DELETE FROM {} WHERE identity_id = $1 AND operation = 'delete' AND is_undone = true",
+        history_table
+    ))
+    .bind(identity_id)
+    .execute(state.db.pool())
+    .await;
+
+    // Insert delete history record
+    let uid = auth.user_id.to_string();
+    let usrc = match auth.source {
+        crate::api::middleware::AuthSource::Jwt => "jwt",
+        crate::api::middleware::AuthSource::Session => "session",
+        crate::api::middleware::AuthSource::ApiKey => "api_key",
+    };
+    let before_snapshot = serde_json::json!({
+        "identity": identity_snapshot,
+        "unbound_faces": face_list,
+    });
+    let after_snapshot = serde_json::json!({});
+    let _ = sqlx::query(&format!(
+        "INSERT INTO {} (identity_id, operation, before_snapshot, after_snapshot, is_undone, user_id, user_source) VALUES ($1, 'delete', $2, $3, false, $4, $5)",
+        history_table
+    ))
+    .bind(identity_id)
+    .bind(before_snapshot)
+    .bind(after_snapshot)
+    .bind(&uid)
+    .bind(usrc)
+    .execute(state.db.pool())
+    .await;
 
     // Unbind all faces
     sqlx::query(&format!(
-        "UPDATE {} SET identity_id = NULL, identity_confidence = NULL WHERE identity_id = $1",
+        "UPDATE {} SET identity_id = NULL WHERE identity_id = $1",
         table
     ))
     .bind(identity_id)
@@ -451,6 +522,19 @@ async fn get_identity_files(
     Query(params): Query<FilesQuery>,
 ) -> Result<Json<IdentityFilesResponse>, (StatusCode, String)> {
     let uuid = identity_uuid.replace('-', "");
+    let id_table = crate::core::db::schema::table_name("identities");
+
+    let identity: Option<(i32, String)> = sqlx::query_as(&format!(
+        "SELECT id, name FROM {} WHERE REPLACE(uuid::text, '-', '') = $1",
+        id_table
+    ))
+    .bind(&uuid)
+    .fetch_optional(state.db.pool())
+    .await
+    .map_err(|e| (StatusCode::INTERNAL_SERVER_ERROR, e.to_string()))?;
+
+    let (identity_id, name) =
+        identity.ok_or((StatusCode::NOT_FOUND, "Identity not found".to_string()))?;
 
     let page = params.page.unwrap_or(1);
     let page_size = params.page_size.unwrap_or(20);
@@ -477,14 +561,11 @@ async fn get_identity_files(
         })
         .collect();
 
-    let total = match sqlx::query_scalar::<_, i64>(
-        &format!(
-            "SELECT COUNT(DISTINCT fd.file_uuid) FROM {} fd WHERE fd.identity_id = (SELECT id FROM {} WHERE REPLACE(uuid::text, '-', '') = $1)",
-            crate::core::db::schema::table_name("face_detections"),
-            crate::core::db::schema::table_name("identities"),
-        )
-    )
-    .bind(&uuid)
+    let total = match sqlx::query_scalar::<_, i64>(&format!(
+        "SELECT COUNT(DISTINCT fd.file_uuid) FROM {} fd WHERE fd.identity_id = $1",
+        crate::core::db::schema::table_name("face_detections"),
+    ))
+    .bind(identity_id)
     .fetch_one(state.db.pool())
     .await
     {
@@ -495,6 +576,7 @@ async fn get_identity_files(
     Ok(Json(IdentityFilesResponse {
         success: true,
         identity_uuid: uuid.to_string().replace('-', ""),
+        name,
         total,
         page,
         page_size,
@@ -506,6 +588,7 @@ async fn get_identity_files(
 pub struct IdentityFacesResponse {
     pub success: bool,
     pub identity_uuid: String,
+    pub name: String,
     pub total: i64,
     pub page: usize,
     pub page_size: usize,
@@ -537,6 +620,19 @@ async fn get_identity_faces(
     Query(params): Query<FilesQuery>,
 ) -> Result<Json<IdentityFacesResponse>, (StatusCode, String)> {
     let uuid = identity_uuid.replace('-', "");
+    let id_table = crate::core::db::schema::table_name("identities");
+
+    let identity: Option<(i32, String)> = sqlx::query_as(&format!(
+        "SELECT id, name FROM {} WHERE REPLACE(uuid::text, '-', '') = $1",
+        id_table
+    ))
+    .bind(&uuid)
+    .fetch_optional(state.db.pool())
+    .await
+    .map_err(|e| (StatusCode::INTERNAL_SERVER_ERROR, e.to_string()))?;
+
+    let (identity_id, name) =
+        identity.ok_or((StatusCode::NOT_FOUND, "Identity not found".to_string()))?;
 
     let page = params.page.unwrap_or(1);
     let page_size = params.page_size.unwrap_or(50);
@@ -566,14 +662,11 @@ async fn get_identity_faces(
         })
         .collect();
 
-    let total = match sqlx::query_scalar::<_, i64>(
-        &format!(
-            "SELECT COUNT(*) FROM {} fd WHERE fd.identity_id = (SELECT id FROM {} WHERE REPLACE(uuid::text, '-', '') = $1)",
-            crate::core::db::schema::table_name("face_detections"),
-            crate::core::db::schema::table_name("identities"),
-        )
-    )
-    .bind(&uuid)
+    let total = match sqlx::query_scalar::<_, i64>(&format!(
+        "SELECT COUNT(*) FROM {} fd WHERE fd.identity_id = $1",
+        crate::core::db::schema::table_name("face_detections"),
+    ))
+    .bind(identity_id)
     .fetch_one(state.db.pool())
     .await
     {
@@ -584,6 +677,215 @@ async fn get_identity_faces(
     Ok(Json(IdentityFacesResponse {
         success: true,
         identity_uuid: uuid.to_string().replace('-', ""),
+        name,
+        total,
+        page,
+        page_size,
+        data,
+    }))
+}
+
+// --- File Faces Endpoint ---
+
+#[derive(Debug, Serialize)]
+pub struct FileFacesResponse { // JSON body returned by get_file_faces
+    pub success: bool, // set to true on the success path
+    pub file_uuid: String, // file UUID echoed back from the request path
+    pub total: i64, // COUNT(*) of face rows matching the filters, across all pages
+    pub page: usize, // page number used for this response
+    pub page_size: usize, // LIMIT applied to this page
+    pub data: Vec<FileFaceItem>, // face rows of the requested page
+}
+
+#[derive(Debug, Serialize)]
+pub struct FileFaceItem { // one face_detections row as exposed by get_file_faces
+    pub id: i64, // fd.id cast to bigint
+    pub file_uuid: String, // fd.file_uuid
+    pub frame_number: i64, // fd.frame_number cast to bigint
+    pub timestamp_secs: Option<f64>, // frame_number / video fps; None when fps is 0 or NULL
+    pub face_id: Option<String>, // fd.face_id, may be NULL
+    pub trace_id: Option<i32>, // fd.trace_id, may be NULL
+    pub bbox: BBox, // built from fd.x, fd.y, fd.width, fd.height (cast to float8)
+    pub confidence: f64, // fd.confidence cast to float8
+    pub binding: FaceBinding, // what this face is currently attached to, if anything
+}
+
+#[derive(Debug, Serialize)]
+#[serde(untagged)] // variants serialize as their bare fields, without a variant name
+pub enum FaceBinding { // get_file_faces picks the first variant below whose condition holds
+    Identity { // identity_id is set and the joined identities row supplied uuid and name
+        identity_id: i32,
+        identity_uuid: String,
+        identity_name: String,
+    },
+    Stranger { // not an Identity, and stranger_id is set
+        stranger_id: i32,
+        metadata: serde_json::Value, // strangers.metadata, or JSON null when it is NULL
+    },
+    Dangling { // identity_id is set but the identities join returned no uuid/name
+        old_identity_id: i32,
+    },
+    Unbound, // neither identity_id nor stranger_id is set; serializes as null
+}
+
+#[derive(Debug, Deserialize)]
+pub struct FileFacesQuery { // query-string parameters accepted by get_file_faces
+    page: Option<usize>, // page number; defaults to 1
+    page_size: Option<usize>, // rows per page; defaults to 50
+    binding: Option<String>, // "identity" | "stranger" | "dangling" | "unbound"; other values add no filter
+    trace_id: Option<i32>, // exact match on fd.trace_id
+    min_confidence: Option<f64>, // keeps rows with fd.confidence >= this value
+    start_frame: Option<i64>, // inclusive lower bound on fd.frame_number
+    end_frame: Option<i64>, // inclusive upper bound on fd.frame_number
+}
+
+/// Lists the face detections of one file, paginated, with each row's binding state.
+///
+/// Optional query filters are ANDed together. `page` is 1-based; a value of 0 is
+/// treated as 1. Database failures map to a 500 carrying the error text.
+async fn get_file_faces(
+    State(state): State<crate::api::types::AppState>,
+    Path(file_uuid): Path<String>,
+    Query(params): Query<FileFacesQuery>,
+) -> Result<Json<FileFacesResponse>, (StatusCode, String)> {
+    // `page` is unsigned: clamp to 1 so `page - 1` cannot underflow on `?page=0`.
+    let page = params.page.unwrap_or(1).max(1);
+    let page_size = params.page_size.unwrap_or(50);
+    let offset = ((page - 1) as i64).saturating_mul(page_size as i64);
+
+    let fd_table = crate::core::db::schema::table_name("face_detections");
+    let id_table = crate::core::db::schema::table_name("identities");
+    let st_table = crate::core::db::schema::table_name("strangers");
+    let video_table = crate::core::db::schema::table_name("videos");
+
+    // Build WHERE clauses; the path-supplied file UUID is bound as `$1`, never inlined.
+    let mut where_clauses = vec!["fd.file_uuid = $1".to_string()];
+
+    if let Some(ref binding) = params.binding {
+        match binding.as_str() {
+            "identity" => {
+                where_clauses.push(format!("fd.identity_id IN (SELECT id FROM {})", id_table));
+            }
+            "stranger" => {
+                where_clauses.push("fd.stranger_id IS NOT NULL".to_string());
+            }
+            "dangling" => {
+                where_clauses.push(format!(
+                    "fd.identity_id IS NOT NULL AND NOT EXISTS (SELECT 1 FROM {} WHERE id = fd.identity_id)",
+                    id_table
+                ));
+            }
+            "unbound" => {
+                where_clauses.push("fd.identity_id IS NULL AND fd.stranger_id IS NULL".to_string());
+            }
+            _ => {}
+        }
+    }
+
+    if let Some(tid) = params.trace_id {
+        where_clauses.push(format!("fd.trace_id = {}", tid));
+    }
+    if let Some(mc) = params.min_confidence {
+        where_clauses.push(format!("fd.confidence >= {}", mc));
+    }
+    if let Some(sf) = params.start_frame {
+        where_clauses.push(format!("fd.frame_number >= {}", sf));
+    }
+    if let Some(ef) = params.end_frame {
+        where_clauses.push(format!("fd.frame_number <= {}", ef));
+    }
+
+    let where_sql = where_clauses.join(" AND ");
+
+    let select_sql = format!(
+        "SELECT fd.id::bigint as id, fd.file_uuid, \
+         fd.frame_number::bigint as frame_number, \
+         (fd.frame_number::float8 / NULLIF(v.fps, 0)) as timestamp_secs, \
+         fd.face_id, fd.trace_id, \
+         fd.x::float8 as x, fd.y::float8 as y, \
+         fd.width::float8 as width, fd.height::float8 as height, \
+         fd.confidence::float8 as confidence, \
+         fd.identity_id, fd.stranger_id, \
+         i.uuid::text as identity_uuid, i.name as identity_name, \
+         s.metadata as stranger_metadata \
+         FROM {} fd \
+         JOIN {} v ON v.file_uuid = fd.file_uuid \
+         LEFT JOIN {} i ON i.id = fd.identity_id \
+         LEFT JOIN {} s ON s.id = fd.stranger_id \
+         WHERE {} \
+         ORDER BY fd.frame_number, fd.trace_id \
+         LIMIT {} OFFSET {}",
+        fd_table, video_table, id_table, st_table, where_sql, page_size as i64, offset
+    );
+
+    let count_sql = format!("SELECT COUNT(*) FROM {} fd WHERE {}", fd_table, where_sql);
+
+    use sqlx::Row;
+    let rows = sqlx::query(&select_sql)
+        .bind(&file_uuid)
+        .fetch_all(state.db.pool())
+        .await
+        .map_err(|e| (StatusCode::INTERNAL_SERVER_ERROR, e.to_string()))?;
+
+    let total: i64 = sqlx::query_scalar(&count_sql)
+        .bind(&file_uuid)
+        .fetch_one(state.db.pool())
+        .await
+        .map_err(|e| (StatusCode::INTERNAL_SERVER_ERROR, e.to_string()))?;
+
+    let data: Vec<FileFaceItem> = rows
+        .into_iter()
+        .map(|r| {
+            let identity_id: Option<i32> = r.get("identity_id");
+            let identity_uuid: Option<String> = r.get("identity_uuid");
+            let identity_name: Option<String> = r.get("identity_name");
+            let stranger_id: Option<i32> = r.get("stranger_id");
+
+            let binding = if let (Some(iid), Some(iuuid), Some(iname)) =
+                (identity_id, identity_uuid, identity_name)
+            {
+                FaceBinding::Identity {
+                    identity_id: iid,
+                    identity_uuid: iuuid,
+                    identity_name: iname,
+                }
+            } else if let Some(sid) = stranger_id {
+                FaceBinding::Stranger {
+                    stranger_id: sid,
+                    metadata: r
+                        .get::<Option<serde_json::Value>, _>("stranger_metadata")
+                        .unwrap_or(serde_json::Value::Null),
+                }
+            } else if let Some(iid) = identity_id {
+                FaceBinding::Dangling {
+                    old_identity_id: iid,
+                }
+            } else {
+                FaceBinding::Unbound
+            };
+
+            FileFaceItem {
+                id: r.get("id"),
+                file_uuid: r.get("file_uuid"),
+                frame_number: r.get("frame_number"),
+                timestamp_secs: r.get("timestamp_secs"),
+                face_id: r.get("face_id"),
+                trace_id: r.get("trace_id"),
+                bbox: BBox {
+                    x: r.get("x"),
+                    y: r.get("y"),
+                    width: r.get("width"),
+                    height: r.get("height"),
+                },
+                confidence: r.get("confidence"),
+                binding,
+            }
+        })
+        .collect();
+
+    Ok(Json(FileFacesResponse {
+        success: true,
+        file_uuid,
         total,
         page,
         page_size,
@@ -595,6 +897,7 @@ async fn get_identity_faces(
 pub struct IdentityChunksResponse {
     pub success: bool,
     pub identity_uuid: String,
+    pub name: String,
     pub total: i64,
     pub page: usize,
     pub page_size: usize,
@@ -621,6 +924,19 @@ async fn get_identity_chunks(
     Query(params): Query<FilesQuery>,
 ) -> Result<Json<IdentityChunksResponse>, (StatusCode, String)> {
     let uuid = identity_uuid.replace('-', "");
+    let id_table = crate::core::db::schema::table_name("identities");
+
+    let identity: Option<(i32, String)> = sqlx::query_as(&format!(
+        "SELECT id, name FROM {} WHERE REPLACE(uuid::text, '-', '') = $1",
+        id_table
+    ))
+    .bind(&uuid)
+    .fetch_optional(state.db.pool())
+    .await
+    .map_err(|e| (StatusCode::INTERNAL_SERVER_ERROR, e.to_string()))?;
+
+    let (_identity_id, name) =
+        identity.ok_or((StatusCode::NOT_FOUND, "Identity not found".to_string()))?;
 
     let page = params.page.unwrap_or(1);
     let page_size = params.page_size.unwrap_or(20);
@@ -651,6 +967,7 @@ async fn get_identity_chunks(
     Ok(Json(IdentityChunksResponse {
         success: true,
         identity_uuid: uuid.to_string().replace('-', ""),
+        name,
         total: data.len() as i64,
         page,
         page_size,
@@ -1001,15 +1318,17 @@ async fn get_identity_json(
         return Err(StatusCode::NOT_FOUND);
     }
 
-    // 3. Read the newly generated file
-    let p = crate::core::identity::storage::identity_file_path(&clean);
-    if p.exists() {
-        let data = std::fs::read(&p).map_err(|_| StatusCode::NOT_FOUND)?;
-        return Ok((
-            StatusCode::OK,
-            [("content-type".to_string(), "application/json".to_string())],
-            data,
-        ));
+    // 3. Read the newly generated file (try all UUID variants)
+    for u in [&clean, &identity_uuid, &with_hyphens] {
+        let p = crate::core::identity::storage::identity_file_path(u);
+        if p.exists() {
+            let data = std::fs::read(&p).map_err(|_| StatusCode::NOT_FOUND)?;
+            return Ok((
+                StatusCode::OK,
+                [("content-type".to_string(), "application/json".to_string())],
+                data,
+            ));
+        }
     }
 
     Err(StatusCode::NOT_FOUND)
@@ -1020,7 +1339,8 @@ async fn get_identity_json(
 
 #[derive(Debug, Deserialize)]
 struct IdentityTextQuery {
-    uuid: String,
+    #[serde(default)]
+    file_uuid: Option<String>,
     q: String,
     limit: Option<i64>,
     page: Option<usize>,
@@ -1062,6 +1382,7 @@ async fn search_identity_text(
     let like_q = format!("%{}%", params.q.replace('%', "%%"));
     let limit = params.limit.unwrap_or(50).min(100);
 
+    let sd_table = schema::table_name("speaker_detections");
     let query = format!(
         r#"SELECT c.file_uuid, c.chunk_id, c.start_time, c.end_time, c.text_content,
                   fd.identity_id, i.name AS identity_name, i.source AS identity_source,
@@ -1071,10 +1392,22 @@ async fn search_identity_text(
                AND fd.frame_number BETWEEN c.start_frame AND c.end_frame
                AND fd.identity_id IS NOT NULL
            LEFT JOIN {} i ON i.id = fd.identity_id
-           WHERE c.file_uuid = $1 AND LOWER(c.text_content) LIKE LOWER($2)
-           ORDER BY c.start_time
+           WHERE ($1::text IS NULL OR c.file_uuid = $1) AND (LOWER(c.text_content) LIKE LOWER($2) OR LOWER(c.content::text) LIKE LOWER($2))
+
+           UNION ALL
+
+           SELECT sd.file_uuid, COALESCE(c.chunk_id, sd.chunk_id),
+                  sd.start_time, sd.end_time, sd.text_content,
+                  sd.identity_id, i.name AS identity_name, i.source AS identity_source,
+                  NULL::int AS trace_id
+           FROM {} sd
+           JOIN {} i ON i.id = sd.identity_id
+           LEFT JOIN {} c ON c.chunk_id = sd.chunk_id
+           WHERE ($1::text IS NULL OR sd.file_uuid = $1) AND (LOWER(sd.text_content) LIKE LOWER($2) OR LOWER($2) = '%%')
+
+           ORDER BY 3
            LIMIT $3"#,
-        chunk_table, fd_table, id_table
+        chunk_table, fd_table, id_table, sd_table, id_table, chunk_table
     );
 
     let rows = sqlx::query_as::<
@@ -1091,7 +1424,7 @@ async fn search_identity_text(
             Option<i32>,
         ),
     >(&query)
-    .bind(&params.uuid)
+    .bind(&params.file_uuid)
     .bind(&like_q)
     .bind(limit)
     .fetch_all(state.db.pool())
@@ -1134,7 +1467,9 @@ async fn search_identity_text(
 #[derive(Debug, Deserialize)]
 struct IdentitySearchQuery {
     q: String,
-    uuid: Option<String>,
+    file_uuid: Option<String>,
+    page: Option<i64>,
+    page_size: Option<i64>,
     limit: Option<i64>,
 }
 
@@ -1147,13 +1482,19 @@ struct IdentitySearchHit {
     file_uuid: String,
     trace_id: Option<i32>,
     chunk_id: String,
+    start_frame: i64,
+    end_frame: i64,
+    fps: f64,
     start_time: f64,
+    end_time: f64,
     text_content: Option<String>,
 }
 
 #[derive(Debug, Serialize)]
 struct IdentitySearchResponse {
     success: bool,
+    page: i64,
+    page_size: i64,
     total: i64,
     results: Vec<IdentitySearchHit>,
 }
@@ -1168,72 +1509,100 @@ async fn search_identities_by_text(
     let fd_table = schema::table_name("face_detections");
     let chunk_table = schema::table_name("chunk");
     let like_q = format!("%{}%", params.q.replace('%', "%%"));
-    let limit = params.limit.unwrap_or(50).min(100);
+    let page = params.page.unwrap_or(1).max(1);
+    let page_size = params.page_size
+        .or(params.limit)
+        .unwrap_or(20)
+        .min(100)
+        .max(1);
+    let offset = (page - 1) * page_size;
 
+    let sd_table = schema::table_name("speaker_detections");
+    let ib_table = schema::table_name("identity_bindings");
     let query = format!(
-        r#"SELECT i.id::int, i.name, i.source, i.tmdb_id,
+        r#"WITH matched AS (
+           SELECT i.id::int, i.name, i.source, i.tmdb_id,
                   fd.file_uuid, fd.trace_id,
-                  c.chunk_id, c.start_time, c.text_content
+                  c.chunk_id, c.start_frame, c.end_frame, c.fps,
+                  c.start_time, c.end_time, c.text_content
            FROM {} i
-            JOIN {} fd ON fd.identity_id = i.id
-           JOIN {} c ON c.file_uuid = fd.file_uuid
-               AND c.start_time <= fd.frame_number / COALESCE(c.fps, 25.0)
-               AND c.end_time >= fd.frame_number / COALESCE(c.fps, 25.0)
+            JOIN {} ib ON ib.identity_id = i.id AND ib.identity_type = 'trace'
+            JOIN {} fd ON fd.trace_id = ib.identity_value::int
+            JOIN {} c ON c.file_uuid = fd.file_uuid
+                AND c.start_time <= fd.frame_number / COALESCE(c.fps, 25.0)
+                AND c.end_time >= fd.frame_number / COALESCE(c.fps, 25.0)
+              WHERE (i.name ILIKE $1
+                 OR EXISTS (
+                     SELECT 1 FROM jsonb_array_elements(i.metadata->'aliases') AS a
+                     WHERE a->>'name' ILIKE $1
+                 ))
+                AND ($2::text IS NULL OR fd.file_uuid = $2)
+
+             UNION ALL
+
+            SELECT i.id::int, i.name, i.source, i.tmdb_id,
+                   sd.file_uuid, NULL::int AS trace_id,
+                   COALESCE(c.chunk_id, sd.chunk_id) as chunk_id,
+                   c.start_frame, c.end_frame, c.fps,
+                   sd.start_time, sd.end_time, sd.text_content
+            FROM {} i
+            JOIN {} sd ON sd.identity_id = i.id
+            LEFT JOIN {} c ON c.chunk_id = sd.chunk_id
             WHERE (i.name ILIKE $1
-               OR EXISTS (
-                   SELECT 1 FROM jsonb_array_elements(i.metadata->'aliases') AS a
-                   WHERE a->>'name' ILIKE $1
-               ))
-              AND ($2::text IS NULL OR fd.file_uuid = $2)
-           ORDER BY i.name, c.start_time
-           LIMIT $3"#,
-        id_table, fd_table, chunk_table
+                OR EXISTS (
+                    SELECT 1 FROM jsonb_array_elements(i.metadata->'aliases') AS a
+                    WHERE a->>'name' ILIKE $1
+                ))
+               AND ($2::text IS NULL OR sd.file_uuid = $2)
+),
+deduped AS (
+    SELECT DISTINCT ON (name, chunk_id) *
+    FROM matched
+    ORDER BY name, chunk_id, start_time
+)
+SELECT *, COUNT(*) OVER() AS total_count
+FROM deduped
+ORDER BY name, start_time
+LIMIT $3 OFFSET $4"#,
+        id_table, ib_table, fd_table, chunk_table, id_table, sd_table, chunk_table
     );
 
-    let rows = sqlx::query_as::<
-        _,
-        (
-            i32,
-            String,
-            Option<String>,
-            Option<i32>,
-            String,
-            Option<i32>,
-            String,
-            f64,
-            Option<String>,
-        ),
-    >(&query)
-    .bind(&like_q)
-    .bind(&params.uuid)
-    .bind(limit)
-    .fetch_all(state.db.pool())
-    .await
-    .map_err(|e| {
-        tracing::error!("[identities/search] Query failed: {}", e);
-        StatusCode::INTERNAL_SERVER_ERROR
-    })?;
+    let rows = sqlx::query(&query)
+        .bind(&like_q)
+        .bind(&params.file_uuid)
+        .bind(page_size)
+        .bind(offset)
+        .fetch_all(state.db.pool())
+        .await
+        .map_err(|e| {
+            tracing::error!("[identities/search] Query failed: {}", e);
+            StatusCode::INTERNAL_SERVER_ERROR
+        })?;
 
+    let total = rows.first().map(|r| r.get::<i64, _>(13)).unwrap_or(0);
     let results: Vec<IdentitySearchHit> = rows
         .into_iter()
-        .map(
-            |(iid, name, src, tid, fu, trace_id, cid, st, txt)| IdentitySearchHit {
-                identity_id: iid,
-                name,
-                source: src,
-                tmdb_id: tid,
-                file_uuid: fu,
-                trace_id,
-                chunk_id: cid,
-                start_time: st,
-                text_content: txt,
-            },
-        )
+        .map(|r| IdentitySearchHit {
+            identity_id: r.get(0),
+            name: r.get(1),
+            source: r.get(2),
+            tmdb_id: r.get(3),
+            file_uuid: r.get(4),
+            trace_id: r.get(5),
+            chunk_id: r.get(6),
+            start_frame: r.get(7),
+            end_frame: r.get(8),
+            fps: r.get(9),
+            start_time: r.get(10),
+            end_time: r.get(11),
+            text_content: r.get(12),
+        })
         .collect();
 
-    let total = results.len() as i64;
     Ok(Json(IdentitySearchResponse {
         success: true,
+        page,
+        page_size,
         total,
         results,
     }))
@@ -1258,6 +1627,7 @@ struct UpdateIdentityResponse {
 
 async fn update_identity(
     State(state): State<crate::api::types::AppState>,
+    Extension(auth): Extension<crate::api::middleware::UserAuth>,
     Path(identity_uuid): Path<String>,
     Json(req): Json<UpdateIdentityRequest>,
 ) -> Result<Json<UpdateIdentityResponse>, (StatusCode, Json<serde_json::Value>)> {
@@ -1272,11 +1642,31 @@ async fn update_identity(
     })?;
 
     let table = crate::core::db::schema::table_name("identities");
-    let existing: Option<(i32, String)> = sqlx::query_as(&format!(
-        "SELECT id, name FROM {} WHERE uuid = $1::uuid",
+    let history_table = crate::core::db::schema::table_name("identity_history");
+
+    // Get before snapshot (current state)
+    let before_snapshot: Option<serde_json::Value> = sqlx::query_scalar(&format!(
+        "SELECT jsonb_build_object('id', id, 'uuid', uuid::text, 'name', name, 'identity_type', identity_type, 'source', source, 'status', status, 'metadata', metadata, 'tmdb_id', tmdb_id, 'tmdb_profile', tmdb_profile) FROM {} WHERE REPLACE(uuid::text, '-', '') = $1",
         table
     ))
-    .bind(uuid_parsed)
+    .bind(&uuid_clean)
+    .fetch_optional(state.db.pool())
+    .await
+    .map_err(|e| {
+        (
+            StatusCode::INTERNAL_SERVER_ERROR,
+            Json(serde_json::json!({
+                "success": false, "error": format!("DB error: {}", e)
+            })),
+        )
+    })?;
+
+    // Use text-based UUID comparison to avoid UUID type encoding issues
+    let existing: Option<(i32, String)> = sqlx::query_as(&format!(
+        "SELECT id, name FROM {} WHERE REPLACE(uuid::text, '-', '') = $1",
+        table
+    ))
+    .bind(&uuid_clean)
     .fetch_optional(state.db.pool())
     .await
     .map_err(|e| {
@@ -1305,7 +1695,18 @@ async fn update_identity(
         updated_fields.push("name".to_string());
     }
     if let Some(ref metadata) = req.metadata {
-        set_clauses.push(format!("metadata = ${}::jsonb", set_clauses.len() + 1));
+        if !metadata.is_object() {
+            return Err((
+                StatusCode::BAD_REQUEST,
+                Json(serde_json::json!({
+                    "success": false, "error": "metadata must be a JSON object"
+                })),
+            ));
+        }
+        set_clauses.push(format!(
+            "metadata = jsonb_deep_merge(COALESCE(metadata, '{{}}'::jsonb), ${}::jsonb)",
+            set_clauses.len() + 1
+        ));
         updated_fields.push("metadata".to_string());
     }
     if let Some(ref status) = req.status {
@@ -1326,10 +1727,27 @@ async fn update_identity(
         ));
     }
 
+    // Clear redo stack (only PATCH operations, not bind)
+    sqlx::query(&format!(
+        "DELETE FROM {} WHERE identity_id = $1 AND is_undone = true AND operation = 'update'",
+        history_table
+    ))
+    .bind(identity_id)
+    .execute(state.db.pool())
+    .await
+    .map_err(|e| {
+        (
+            StatusCode::INTERNAL_SERVER_ERROR,
+            Json(serde_json::json!({
+                "success": false, "error": format!("Failed to clear redo stack: {}", e)
+            })),
+        )
+    })?;
+
     let set_sql = set_clauses.join(", ");
     let uuid_param = set_clauses.len() + 1;
     let update_sql = format!(
-        "UPDATE {} SET {} WHERE uuid = ${}::uuid",
+        "UPDATE {} SET {} WHERE REPLACE(uuid::text, '-', '') = ${}",
         table, set_sql, uuid_param
     );
 
@@ -1348,7 +1766,7 @@ async fn update_identity(
         query = query.bind(identity_type);
     }
 
-    query = query.bind(uuid_parsed);
+    query = query.bind(&uuid_clean);
 
     query.execute(state.db.pool()).await.map_err(|e| {
         (
@@ -1359,6 +1777,87 @@ async fn update_identity(
         )
     })?;
 
+    // Get after snapshot
+    let after_snapshot: Option<serde_json::Value> = sqlx::query_scalar(&format!(
+        "SELECT jsonb_build_object('id', id, 'uuid', uuid::text, 'name', name, 'identity_type', identity_type, 'source', source, 'status', status, 'metadata', metadata, 'tmdb_id', tmdb_id, 'tmdb_profile', tmdb_profile) FROM {} WHERE REPLACE(uuid::text, '-', '') = $1",
+        table
+    ))
+    .bind(&uuid_clean)
+    .fetch_optional(state.db.pool())
+    .await
+    .map_err(|e| {
+        (
+            StatusCode::INTERNAL_SERVER_ERROR,
+            Json(serde_json::json!({
+                "success": false, "error": format!("Failed to get after snapshot: {}", e)
+            })),
+        )
+    })?;
+
+    // Insert history record with user tracking
+    let uid = auth.user_id.to_string();
+    let usrc = match auth.source {
+        crate::api::middleware::AuthSource::Jwt => "jwt",
+        crate::api::middleware::AuthSource::Session => "session",
+        crate::api::middleware::AuthSource::ApiKey => "api_key",
+    };
+    sqlx::query(&format!(
+        "INSERT INTO {} (identity_id, operation, before_snapshot, after_snapshot, is_undone, user_id, user_source) VALUES ($1, 'update', $2, $3, false, $4, $5)",
+        history_table
+    ))
+    .bind(identity_id)
+    .bind(before_snapshot)
+    .bind(after_snapshot)
+    .bind(&uid)
+    .bind(usrc)
+    .execute(state.db.pool())
+    .await
+    .map_err(|e| {
+        (
+            StatusCode::INTERNAL_SERVER_ERROR,
+            Json(serde_json::json!({
+                "success": false, "error": format!("Failed to insert history: {}", e)
+            })),
+        )
+    })?;
+
+    // Cleanup: keep max 256 history records per identity
+    let count: i64 = sqlx::query_scalar(&format!(
+        "SELECT COUNT(*) FROM {} WHERE identity_id = $1",
+        history_table
+    ))
+    .bind(identity_id)
+    .fetch_one(state.db.pool())
+    .await
+    .map_err(|e| {
+        (
+            StatusCode::INTERNAL_SERVER_ERROR,
+            Json(serde_json::json!({
+                "success": false, "error": format!("Failed to count history: {}", e)
+            })),
+        )
+    })?;
+
+    if count > 256 {
+        let delete_count = count - 256;
+        sqlx::query(&format!(
+            "DELETE FROM {} WHERE identity_id = $1 AND id IN (SELECT id FROM {} WHERE identity_id = $1 ORDER BY created_at ASC LIMIT $2)",
+            history_table, history_table
+        ))
+        .bind(identity_id)
+        .bind(delete_count)
+        .execute(state.db.pool())
+        .await
+        .map_err(|e| {
+            (
+                StatusCode::INTERNAL_SERVER_ERROR,
+                Json(serde_json::json!({
+                    "success": false, "error": format!("Failed to cleanup history: {}", e)
+                })),
+            )
+        })?;
+    }
+
     // Sync identity.json to disk
     let _ =
         crate::core::identity::storage::save_identity_file_by_pool(state.db.pool(), &uuid_clean)
@@ -1376,3 +1875,633 @@ async fn update_identity(
         updated_fields,
     }))
 }
+
+// ── Undo/Redo APIs ────────────────────────────────────────────────
+
+#[derive(Debug, Deserialize)]
+struct UndoRequest {
+    steps: Option<usize>, // how many updates to undo; undo_identity treats None or 0 as 1
+}
+
+#[derive(Debug, Serialize)]
+struct UndoResponse {
+    success: bool, // set to true on every success path of undo_identity
+    identity_uuid: String, // identity UUID from the request path with '-' removed
+    undone_count: usize, // history rows marked undone (1 when a delete was reverted)
+    current_state: serde_json::Value, // identity row as JSON, re-read after the undo
+}
+
+/// Undoes the most recent `steps` (default 1) `update` operations on an identity, or
+/// recreates the identity from its latest `delete` snapshot when its row no longer exists.
+/// Responds 400 when nothing can be undone and 500 on database or snapshot errors.
+async fn undo_identity(
+    State(state): State<crate::api::types::AppState>,
+    Extension(_auth): Extension<crate::api::middleware::UserAuth>,
+    Path(identity_uuid): Path<String>,
+    Json(req): Json<UndoRequest>,
+) -> Result<Json<UndoResponse>, (StatusCode, Json<serde_json::Value>)> {
+    let uuid_clean = identity_uuid.replace('-', "");
+    let steps = req.steps.unwrap_or(1).max(1);
+
+    let table = crate::core::db::schema::table_name("identities");
+    let history_table = crate::core::db::schema::table_name("identity_history");
+    let face_table = crate::core::db::schema::table_name("face_detections");
+
+    // Look the identity up by its dash-less UUID text
+    let identity_row: Option<(i32,)> = sqlx::query_as(&format!(
+        "SELECT id FROM {} WHERE REPLACE(uuid::text, '-', '') = $1",
+        table
+    ))
+    .bind(&uuid_clean)
+    .fetch_optional(state.db.pool())
+    .await
+    .map_err(|e| {
+        (
+            StatusCode::INTERNAL_SERVER_ERROR,
+            Json(serde_json::json!({
+                "success": false, "error": format!("DB error: {}", e)
+            })),
+        )
+    })?;
+
+    let (identity_id,) = match identity_row {
+        Some(row) => row,
+        None => {
+            // Identity might have been deleted — check for delete history
+            let delete_record: Option<(i64, serde_json::Value)> = sqlx::query_as(&format!(
+                "SELECT id, before_snapshot FROM {} WHERE operation = 'delete' AND is_undone = false AND REPLACE(before_snapshot->'identity'->>'uuid', '-', '') = $1 ORDER BY created_at DESC LIMIT 1",
+                history_table
+            ))
+            .bind(&uuid_clean)
+            .fetch_optional(state.db.pool())
+            .await
+            .map_err(|e| {
+                (
+                    StatusCode::INTERNAL_SERVER_ERROR,
+                    Json(serde_json::json!({
+                        "success": false, "error": format!("Failed to check delete history: {}", e)
+                    })),
+                )
+            })?;
+
+            let (history_id, snapshot) = delete_record.ok_or_else(|| {
+                (
+                    StatusCode::BAD_REQUEST,
+                    Json(serde_json::json!({
+                        "success": false, "error": "No undo operations available"
+                    })),
+                )
+            })?;
+
+            // Recreate identity from snapshot
+            let identity_obj = snapshot.get("identity").ok_or_else(|| {
+                (
+                    StatusCode::INTERNAL_SERVER_ERROR,
+                    Json(serde_json::json!({
+                        "success": false, "error": "Missing identity snapshot"
+                    })),
+                )
+            })?;
+
+            let new_id: i32 = sqlx::query_scalar(&format!(
+                "INSERT INTO {} (uuid, name, identity_type, source, status, metadata, tmdb_id, tmdb_profile) VALUES ($1::uuid, $2, $3, $4, $5, $6::jsonb, $7, $8) RETURNING id",
+                table
+            ))
+            .bind(identity_obj.get("uuid").and_then(|v| v.as_str()).unwrap_or(""))
+            .bind(identity_obj.get("name").and_then(|v| v.as_str()).unwrap_or(""))
+            .bind(identity_obj.get("identity_type").and_then(|v| v.as_str()))
+            .bind(identity_obj.get("source").and_then(|v| v.as_str()))
+            .bind(identity_obj.get("status").and_then(|v| v.as_str()))
+            .bind(identity_obj.get("metadata").cloned().unwrap_or(serde_json::json!({})))
+            .bind(identity_obj.get("tmdb_id").and_then(|v| v.as_i64()))
+            .bind(identity_obj.get("tmdb_profile").and_then(|v| v.as_str()))
+            .fetch_one(state.db.pool())
+            .await
+            .map_err(|e| {
+                (
+                    StatusCode::INTERNAL_SERVER_ERROR,
+                    Json(serde_json::json!({
+                        "success": false, "error": format!("Failed to recreate identity: {}", e)
+                    })),
+                )
+            })?;
+
+            // Re-bind faces (best effort: per-face failures are ignored)
+            if let Some(faces) = snapshot.get("unbound_faces").and_then(|v| v.as_array()) {
+                for face in faces {
+                    let file_uuid = face.get("file_uuid").and_then(|v| v.as_str());
+                    let face_id = face.get("face_id").and_then(|v| v.as_str());
+                    if let (Some(fu), Some(fid)) = (file_uuid, face_id) {
+                        let _ = sqlx::query(&format!(
+                            "UPDATE {} SET identity_id = $1 WHERE file_uuid = $2 AND face_id = $3",
+                            face_table
+                        ))
+                        .bind(new_id)
+                        .bind(fu)
+                        .bind(fid)
+                        .execute(state.db.pool())
+                        .await;
+                    }
+                }
+            }
+
+            // Mark delete history as undone
+            let _ = sqlx::query(&format!(
+                "UPDATE {} SET is_undone = true, undone_at = NOW() WHERE id = $1",
+                history_table
+            ))
+            .bind(history_id)
+            .execute(state.db.pool())
+            .await;
+
+            // Sync identity.json
+            let _ = crate::core::identity::storage::save_identity_file_by_pool(
+                state.db.pool(),
+                &uuid_clean,
+            )
+            .await;
+
+            // Update index
+            let new_name = identity_obj
+                .get("name")
+                .and_then(|v| v.as_str())
+                .unwrap_or("");
+            let _ = crate::core::identity::storage::update_index(&uuid_clean, new_name);
+
+            // Get current state
+            let current_state: serde_json::Value = sqlx::query_scalar(&format!(
+                "SELECT jsonb_build_object('id', id, 'uuid', uuid::text, 'name', name, 'identity_type', identity_type, 'source', source, 'status', status, 'metadata', metadata, 'tmdb_id', tmdb_id, 'tmdb_profile', tmdb_profile) FROM {} WHERE id = $1",
+                table
+            ))
+            .bind(new_id)
+            .fetch_one(state.db.pool())
+            .await
+            .map_err(|e| {
+                (
+                    StatusCode::INTERNAL_SERVER_ERROR,
+                    Json(serde_json::json!({
+                        "success": false, "error": format!("Failed to get current state: {}", e)
+                    })),
+                )
+            })?;
+
+            return Ok(Json(UndoResponse {
+                success: true,
+                identity_uuid: uuid_clean,
+                undone_count: 1,
+                current_state,
+            }));
+        }
+    };
+
+    // ── Normal PATCH undo flow (identity exists) ──
+    // Get recent N history records (is_undone=false, only 'update')
+    let history_records: Vec<(i64, serde_json::Value)> = sqlx::query_as(&format!(
+        "SELECT id, before_snapshot FROM {} WHERE identity_id = $1 AND is_undone = false AND operation = 'update' ORDER BY created_at DESC LIMIT $2",
+        history_table
+    ))
+    .bind(identity_id)
+    .bind(steps as i64)
+    .fetch_all(state.db.pool())
+    .await
+    .map_err(|e| {
+        (
+            StatusCode::INTERNAL_SERVER_ERROR,
+            Json(serde_json::json!({
+                "success": false, "error": format!("Failed to get history: {}", e)
+            })),
+        )
+    })?;
+
+    if history_records.is_empty() {
+        return Err((
+            StatusCode::BAD_REQUEST,
+            Json(serde_json::json!({
+                "success": false, "error": "No undo operations available"
+            })),
+        ));
+    }
+
+    // Rows are newest-first; the last row's before_snapshot predates every undone update.
+    let (_, last_before) = history_records.last().expect("history_records is non-empty");
+    let before = last_before.as_object().expect("before_snapshot must be a JSON object");
+
+    sqlx::query(&format!(
+        "UPDATE {} SET name = $1, identity_type = $2, source = $3, status = $4, metadata = $5, tmdb_id = $6, tmdb_profile = $7 WHERE id = $8",
+        table
+    ))
+    .bind(before.get("name").and_then(|v| v.as_str()).unwrap_or(""))
+    .bind(before.get("identity_type").and_then(|v| v.as_str()))
+    .bind(before.get("source").and_then(|v| v.as_str()))
+    .bind(before.get("status").and_then(|v| v.as_str()))
+    .bind(before.get("metadata").cloned().unwrap_or(serde_json::json!({})))
+    .bind(before.get("tmdb_id").and_then(|v| v.as_i64()))
+    .bind(before.get("tmdb_profile").and_then(|v| v.as_str()))
+    .bind(identity_id)
+    .execute(state.db.pool())
+    .await
+    .map_err(|e| {
+        (
+            StatusCode::INTERNAL_SERVER_ERROR,
+            Json(serde_json::json!({
+                "success": false, "error": format!("Failed to restore identity: {}", e)
+            })),
+        )
+    })?;
+
+    // Mark history records as undone
+    for (history_id, _) in &history_records {
+        sqlx::query(&format!(
+            "UPDATE {} SET is_undone = true, undone_at = NOW() WHERE id = $1",
+            history_table
+        ))
+        .bind(*history_id)
+        .execute(state.db.pool())
+        .await
+        .map_err(|e| {
+            (
+                StatusCode::INTERNAL_SERVER_ERROR,
+                Json(serde_json::json!({
+                    "success": false, "error": format!("Failed to mark history as undone: {}", e)
+                })),
+            )
+        })?;
+    }
+
+    // Sync identity.json
+    let _ =
+        crate::core::identity::storage::save_identity_file_by_pool(state.db.pool(), &uuid_clean)
+            .await;
+
+    // Update index if name changed
+    let new_name = before.get("name").and_then(|v| v.as_str()).unwrap_or("");
+    let _ = crate::core::identity::storage::update_index(&uuid_clean, new_name);
+
+    // Get current state
+    let current_state: serde_json::Value = sqlx::query_scalar(&format!(
+        "SELECT jsonb_build_object('id', id, 'uuid', uuid::text, 'name', name, 'identity_type', identity_type, 'source', source, 'status', status, 'metadata', metadata, 'tmdb_id', tmdb_id, 'tmdb_profile', tmdb_profile) FROM {} WHERE id = $1",
+        table
+    ))
+    .bind(identity_id)
+    .fetch_one(state.db.pool())
+    .await
+    .map_err(|e| {
+        (
+            StatusCode::INTERNAL_SERVER_ERROR,
+            Json(serde_json::json!({
+                "success": false, "error": format!("Failed to get current state: {}", e)
+            })),
+        )
+    })?;
+
+    Ok(Json(UndoResponse {
+        success: true,
+        identity_uuid: uuid_clean,
+        undone_count: history_records.len(),
+        current_state,
+    }))
+}
+
+#[derive(Debug, Deserialize)]
+struct RedoRequest {
+    steps: Option<usize>, // how many updates to redo; redo_identity treats None or 0 as 1
+}
+
+#[derive(Debug, Serialize)]
+struct RedoResponse {
+    success: bool, // set to true on every success path of redo_identity
+    identity_uuid: String, // identity UUID from the request path with '-' removed
+    redone_count: usize, // history rows re-applied (1 when a delete was redone)
+    current_state: serde_json::Value, // identity row as JSON, or {"deleted": true} after a delete redo
+}
+
+/// Re-applies previously undone `update` operations on an identity, oldest first, for up
+/// to `steps` records (default 1). If an undone `delete` record exists for the identity,
+/// the identity is deleted again instead. Responds 400 when nothing can be redone.
+async fn redo_identity(
+    State(state): State<crate::api::types::AppState>,
+    Extension(_auth): Extension<crate::api::middleware::UserAuth>,
+    Path(identity_uuid): Path<String>,
+    Json(req): Json<RedoRequest>,
+) -> Result<Json<RedoResponse>, (StatusCode, Json<serde_json::Value>)> {
+    let uuid_clean = identity_uuid.replace('-', "");
+    let steps = req.steps.unwrap_or(1).max(1);
+    let table = crate::core::db::schema::table_name("identities");
+    let history_table = crate::core::db::schema::table_name("identity_history");
+    let face_table = crate::core::db::schema::table_name("face_detections");
+
+    // Get identity_id
+    let identity_id: i32 = sqlx::query_scalar(&format!(
+        "SELECT id FROM {} WHERE REPLACE(uuid::text, '-', '') = $1",
+        table
+    ))
+    .bind(&uuid_clean)
+    .fetch_one(state.db.pool())
+    .await
+    .map_err(|e| {
+        (
+            StatusCode::INTERNAL_SERVER_ERROR,
+            Json(serde_json::json!({
+                "success": false, "error": format!("Identity not found: {}", e)
+            })),
+        )
+    })?;
+
+    // Check for delete redo first (identity was previously restored via undo)
+    let delete_record: Option<(i64,)> = sqlx::query_as(&format!(
+        "SELECT id FROM {} WHERE identity_id = $1 AND operation = 'delete' AND is_undone = true ORDER BY created_at DESC LIMIT 1",
+        history_table
+    ))
+    .bind(identity_id)
+    .fetch_optional(state.db.pool())
+    .await
+    .map_err(|e| {
+        (
+            StatusCode::INTERNAL_SERVER_ERROR,
+            Json(serde_json::json!({
+                "success": false, "error": format!("Failed to check delete redo: {}", e)
+            })),
+        )
+    })?;
+
+    if let Some((delete_history_id,)) = delete_record {
+        // ── Delete redo: re-delete the identity ──
+        let _ = crate::core::identity::storage::delete_identity_file(&uuid_clean);
+
+        // Unbind all faces
+        let _ = sqlx::query(&format!(
+            "UPDATE {} SET identity_id = NULL WHERE identity_id = $1",
+            face_table
+        ))
+        .bind(identity_id)
+        .execute(state.db.pool())
+        .await;
+
+        // Delete identity
+        sqlx::query(&format!("DELETE FROM {} WHERE id = $1", table))
+            .bind(identity_id)
+            .execute(state.db.pool())
+            .await
+            .map_err(|e| {
+                (
+                    StatusCode::INTERNAL_SERVER_ERROR,
+                    Json(serde_json::json!({
+                        "success": false, "error": format!("Failed to delete identity: {}", e)
+                    })),
+                )
+            })?;
+
+        // Mark delete history as no longer undone
+        let _ = sqlx::query(&format!(
+            "UPDATE {} SET is_undone = false, undone_at = NULL WHERE id = $1",
+            history_table
+        ))
+        .bind(delete_history_id)
+        .execute(state.db.pool())
+        .await;
+
+        return Ok(Json(RedoResponse {
+            success: true,
+            identity_uuid: uuid_clean,
+            redone_count: 1,
+            current_state: serde_json::json!({"deleted": true}),
+        }));
+    }
+
+    // ── Normal PATCH redo flow ──
+    // Oldest N undone 'update' records: redo must replay in the order they were applied
+    let history_records: Vec<(i64, serde_json::Value)> = sqlx::query_as(&format!(
+        "SELECT id, after_snapshot FROM {} WHERE identity_id = $1 AND is_undone = true AND operation = 'update' ORDER BY created_at ASC LIMIT $2",
+        history_table
+    ))
+    .bind(identity_id)
+    .bind(steps as i64)
+    .fetch_all(state.db.pool())
+    .await
+    .map_err(|e| {
+        (
+            StatusCode::INTERNAL_SERVER_ERROR,
+            Json(serde_json::json!({
+                "success": false, "error": format!("Failed to get history: {}", e)
+            })),
+        )
+    })?;
+
+    if history_records.is_empty() {
+        return Err((
+            StatusCode::BAD_REQUEST,
+            Json(serde_json::json!({
+                "success": false, "error": "No redo operations available"
+            })),
+        ));
+    }
+
+    // Rows are oldest-first; the last after_snapshot is the state once all are replayed.
+    let (_, last_after) = history_records.last().expect("history_records is non-empty");
+    let after = last_after.as_object().expect("after_snapshot must be a JSON object");
+
+    sqlx::query(&format!(
+        "UPDATE {} SET name = $1, identity_type = $2, source = $3, status = $4, metadata = $5, tmdb_id = $6, tmdb_profile = $7 WHERE id = $8",
+        table
+    ))
+    .bind(after.get("name").and_then(|v| v.as_str()).unwrap_or(""))
+    .bind(after.get("identity_type").and_then(|v| v.as_str()))
+    .bind(after.get("source").and_then(|v| v.as_str()))
+    .bind(after.get("status").and_then(|v| v.as_str()))
+    .bind(after.get("metadata").cloned().unwrap_or(serde_json::json!({})))
+    .bind(after.get("tmdb_id").and_then(|v| v.as_i64()))
+    .bind(after.get("tmdb_profile").and_then(|v| v.as_str()))
+    .bind(identity_id)
+    .execute(state.db.pool())
+    .await
+    .map_err(|e| {
+        (
+            StatusCode::INTERNAL_SERVER_ERROR,
+            Json(serde_json::json!({
+                "success": false, "error": format!("Failed to restore identity: {}", e)
+            })),
+        )
+    })?;
+
+    // Mark history records as not undone
+    for (history_id, _) in &history_records {
+        sqlx::query(&format!(
+            "UPDATE {} SET is_undone = false, undone_at = NULL WHERE id = $1",
+            history_table
+        ))
+        .bind(*history_id)
+        .execute(state.db.pool())
+        .await
+        .map_err(|e| {
+            (
+                StatusCode::INTERNAL_SERVER_ERROR,
+                Json(serde_json::json!({
+                    "success": false, "error": format!("Failed to mark history as redone: {}", e)
+                })),
+            )
+        })?;
+    }
+
+    // Sync identity.json
+    let _ =
+        crate::core::identity::storage::save_identity_file_by_pool(state.db.pool(), &uuid_clean)
+            .await;
+
+    // Update index if name changed
+    let new_name = after.get("name").and_then(|v| v.as_str()).unwrap_or("");
+    let _ = crate::core::identity::storage::update_index(&uuid_clean, new_name);
+
+    // Get current state
+    let current_state: serde_json::Value = sqlx::query_scalar(&format!(
+        "SELECT jsonb_build_object('id', id, 'uuid', uuid::text, 'name', name, 'identity_type', identity_type, 'source', source, 'status', status, 'metadata', metadata, 'tmdb_id', tmdb_id, 'tmdb_profile', tmdb_profile) FROM {} WHERE id = $1",
+        table
+    ))
+    .bind(identity_id)
+    .fetch_one(state.db.pool())
+    .await
+    .map_err(|e| {
+        (
+            StatusCode::INTERNAL_SERVER_ERROR,
+            Json(serde_json::json!({
+                "success": false, "error": format!("Failed to get current state: {}", e)
+            })),
+        )
+    })?;
+
+    Ok(Json(RedoResponse {
+        success: true,
+        identity_uuid: uuid_clean,
+        redone_count: history_records.len(),
+        current_state,
+    }))
+}
+
+#[derive(Debug, Deserialize)]
+struct HistoryQuery {
+    limit: Option<usize>, // page size; get_identity_history defaults to 20 and bounds it to 1..=100
+    page: Option<usize>, // 1-based page number; None or 0 is treated as 1
+}
+
+#[derive(Debug, Serialize)]
+struct HistoryResponse {
+    success: bool, // set to true when get_identity_history succeeds
+    identity_uuid: String, // identity UUID from the request path with '-' removed
+    total: i64, // undo_stack_count + redo_stack_count
+    undo_stack_count: i64, // history rows for the identity with is_undone = false
+    redo_stack_count: i64, // history rows for the identity with is_undone = true
+    results: Vec<HistoryItem>, // requested page of history rows, newest first
+}
+
+#[derive(Debug, Serialize)]
+struct HistoryItem {
+    history_id: i64, // `id` column of the history row
+    operation: String, // `operation` column, e.g. 'update' or 'delete'
+    is_undone: bool, // `is_undone` column: true while the operation is undone
+    created_at: Option<chrono::DateTime<chrono::Utc>>, // `created_at` column (nullable here)
+    undone_at: Option<chrono::DateTime<chrono::Utc>>, // `undone_at` column; reset to NULL on redo
+}
+
+/// Returns one page of an identity's history (newest first) plus undo/redo stack sizes.
+/// `limit` defaults to 20 (bounded to 1..=100); `page` is 1-based and defaults to 1.
+async fn get_identity_history(
+    State(state): State<crate::api::types::AppState>,
+    Path(identity_uuid): Path<String>,
+    Query(params): Query<HistoryQuery>,
+) -> Result<Json<HistoryResponse>, (StatusCode, Json<serde_json::Value>)> {
+    let uuid_clean = identity_uuid.replace('-', "");
+    let limit = params.limit.unwrap_or(20).clamp(1, 100);
+    let page = params.page.unwrap_or(1).max(1);
+    let offset = i64::try_from((page - 1).saturating_mul(limit)).unwrap_or(i64::MAX);
+
+    let table = crate::core::db::schema::table_name("identities");
+    let history_table = crate::core::db::schema::table_name("identity_history");
+
+    // Get identity_id
+    let identity_id: i32 = sqlx::query_scalar(&format!(
+        "SELECT id FROM {} WHERE REPLACE(uuid::text, '-', '') = $1",
+        table
+    ))
+    .bind(&uuid_clean)
+    .fetch_one(state.db.pool())
+    .await
+    .map_err(|e| {
+        (
+            StatusCode::INTERNAL_SERVER_ERROR,
+            Json(serde_json::json!({
+                "success": false, "error": format!("Identity not found: {}", e)
+            })),
+        )
+    })?;
+
+    // Get counts
+    let undo_stack_count: i64 = sqlx::query_scalar(&format!(
+        "SELECT COUNT(*) FROM {} WHERE identity_id = $1 AND is_undone = false",
+        history_table
+    ))
+    .bind(identity_id)
+    .fetch_one(state.db.pool())
+    .await
+    .map_err(|e| {
+        (
+            StatusCode::INTERNAL_SERVER_ERROR,
+            Json(serde_json::json!({
+                "success": false, "error": format!("Failed to count undo stack: {}", e)
+            })),
+        )
+    })?;
+
+    let redo_stack_count: i64 = sqlx::query_scalar(&format!(
+        "SELECT COUNT(*) FROM {} WHERE identity_id = $1 AND is_undone = true",
+        history_table
+    ))
+    .bind(identity_id)
+    .fetch_one(state.db.pool())
+    .await
+    .map_err(|e| {
+        (
+            StatusCode::INTERNAL_SERVER_ERROR,
+            Json(serde_json::json!({
+                "success": false, "error": format!("Failed to count redo stack: {}", e)
+            })),
+        )
+    })?;
+
+    // Get history records
+    let rows = sqlx::query(&format!(
+        "SELECT id, operation, is_undone, created_at, undone_at FROM {} WHERE identity_id = $1 ORDER BY created_at DESC LIMIT $2 OFFSET $3",
+        history_table
+    ))
+    .bind(identity_id)
+    .bind(limit as i64)
+    .bind(offset)
+    .fetch_all(state.db.pool())
+    .await
+    .map_err(|e| {
+        (
+            StatusCode::INTERNAL_SERVER_ERROR,
+            Json(serde_json::json!({
+                "success": false, "error": format!("Failed to get history: {}", e)
+            })),
+        )
+    })?;
+
+    let results: Vec<HistoryItem> = rows
+        .into_iter()
+        .map(|r| HistoryItem {
+            history_id: r.get::<i64, _>("id"),
+            operation: r.get::<String, _>("operation"),
+            is_undone: r.get::<bool, _>("is_undone"),
+            created_at: r.get::<Option<chrono::DateTime<chrono::Utc>>, _>("created_at"),
+            undone_at: r.get::<Option<chrono::DateTime<chrono::Utc>>, _>("undone_at"),
+        })
+        .collect();
+
+    Ok(Json(HistoryResponse {
+        success: true,
+        identity_uuid: uuid_clean,
+        total: undo_stack_count + redo_stack_count,
+        undo_stack_count,
+        redo_stack_count,
+        results,
+    }))
+}
diff --git a/src/api/identity_binding.rs b/src/api/identity_binding.rs
index c4afd22..09e7878 100644
--- a/src/api/identity_binding.rs
+++ b/src/api/identity_binding.rs
@@ -1,11 +1,12 @@
 use axum::{
-    extract::{Path, Query, State},
+    extract::{Extension, Path, Query, State},
     http::StatusCode,
     response::Json,
     routing::{get, post},
     Router,
 };
 use serde::{Deserialize, Serialize};
+use sqlx::Row;
 
 use crate::core::db::{Database, PostgresDb};
 use crate::core::person_identity::{
@@ -61,28 +62,22 @@ pub async fn list_identities(
 
 /// V4.0 直接綁定：face_detections.identity_id = identities.id
 pub async fn bind_identity(
+    State(state): State<crate::api::types::AppState>,
+    Extension(auth): Extension<crate::api::middleware::UserAuth>,
     Path(identity_uuid): Path<String>,
     Json(req): Json<BindIdentityRequest>,
 ) -> Result<Json<ApiResponse<serde_json::Value>>, (StatusCode, Json<serde_json::Value>)> {
     let table = crate::core::db::schema::table_name("face_detections");
     let id_table = crate::core::db::schema::table_name("identities");
+    let history_table = crate::core::db::schema::table_name("identity_history");
 
-    let db = sqlx::PgPool::connect(&crate::core::config::DATABASE_URL)
-        .await
-        .map_err(|e| {
-            (
-                StatusCode::INTERNAL_SERVER_ERROR,
-                Json(serde_json::json!({"error": e.to_string()})),
-            )
-        })?;
-
-    // Get identity_id from identity_uuid
+    let uuid_clean = identity_uuid.replace('-', "");
     let identity_row: Option<(i32, String)> = sqlx::query_as(&format!(
-        "SELECT id, name FROM {} WHERE uuid = $1::uuid",
+        "SELECT id, name FROM {} WHERE REPLACE(uuid::text, '-', '') = $1",
         id_table
     ))
-    .bind(&identity_uuid)
-    .fetch_optional(&db)
+    .bind(&uuid_clean)
+    .fetch_optional(state.db.pool())
     .await
     .map_err(|e| {
         (
@@ -98,15 +93,32 @@ pub async fn bind_identity(
         )
     })?;
 
+    // Capture old identity_id before bind
+    let old_identity_id: Option<i32> = sqlx::query_scalar(&format!(
+        "SELECT identity_id FROM {} WHERE file_uuid = $1 AND face_id = $2",
+        table
+    ))
+    .bind(&req.file_uuid)
+    .bind(&req.face_id)
+    .fetch_optional(state.db.pool())
+    .await
+    .map_err(|e| {
+        (
+            StatusCode::INTERNAL_SERVER_ERROR,
+            Json(serde_json::json!({"error": e.to_string()})),
+        )
+    })?
+    .flatten();
+
     // Direct UPDATE face_detections.identity_id
     let result = sqlx::query(&format!(
-        "UPDATE {} SET identity_id = $1, stranger_id = NULL WHERE file_uuid = $2 AND face_id = $3",
+        "UPDATE {} SET identity_id = $1 WHERE file_uuid = $2 AND face_id = $3",
         table
     ))
     .bind(identity_id)
     .bind(&req.file_uuid)
     .bind(&req.face_id)
-    .execute(&db)
+    .execute(state.db.pool())
     .await
     .map_err(|e| {
         (
@@ -115,10 +127,44 @@ pub async fn bind_identity(
         )
     })?;
 
-    let uuid_clean = identity_uuid.replace('-', "");
+    // Clear bind redo stack
+    let _ = sqlx::query(&format!(
+        "DELETE FROM {} WHERE identity_id = $1 AND is_undone = true AND operation IN ('bind','unbind','bind_trace')",
+        history_table
+    ))
+    .bind(identity_id)
+    .execute(state.db.pool())
+    .await;
+
+    // Insert history record
+    let uid = auth.user_id.to_string();
+    let usrc = match auth.source {
+        crate::api::middleware::AuthSource::Jwt => "jwt",
+        crate::api::middleware::AuthSource::Session => "session",
+        crate::api::middleware::AuthSource::ApiKey => "api_key",
+    };
+    let before = serde_json::json!({
+        "file_uuid": req.file_uuid, "face_id": req.face_id, "identity_id_before": old_identity_id
+    });
+    let after = serde_json::json!({
+        "file_uuid": req.file_uuid, "face_id": req.face_id, "identity_id_after": identity_id
+    });
+    let _ = sqlx::query(&format!(
+        "INSERT INTO {} (identity_id, operation, before_snapshot, after_snapshot, is_undone, user_id, user_source) VALUES ($1, 'bind', $2, $3, false, $4, $5)",
+        history_table
+    ))
+    .bind(identity_id)
+    .bind(before)
+    .bind(after)
+    .bind(&uid)
+    .bind(usrc)
+    .execute(state.db.pool())
+    .await;
+
     // Sync identity JSON file
     if let Err(e) =
-        crate::core::identity::storage::save_identity_file_by_pool(&db, &uuid_clean).await
+        crate::core::identity::storage::save_identity_file_by_pool(state.db.pool(), &uuid_clean)
+            .await
     {
         tracing::warn!(
             "[bind] Failed to sync identity file for {}: {}",
@@ -139,35 +185,30 @@ pub async fn bind_identity(
 
 /// V4.0 直接解綁：SET face_detections.identity_id = NULL
 pub async fn unbind_identity(
+    State(state): State<crate::api::types::AppState>,
+    Extension(auth): Extension<crate::api::middleware::UserAuth>,
     Json(req): Json<UnbindIdentityRequest>,
 ) -> Result<Json<ApiResponse<serde_json::Value>>, (StatusCode, Json<serde_json::Value>)> {
     let table = crate::core::db::schema::table_name("face_detections");
     let id_table = crate::core::db::schema::table_name("identities");
+    let history_table = crate::core::db::schema::table_name("identity_history");
 
-    let db = sqlx::PgPool::connect(&crate::core::config::DATABASE_URL)
-        .await
-        .map_err(|e| {
-            (
-                StatusCode::INTERNAL_SERVER_ERROR,
-                Json(serde_json::json!({"error": e.to_string()})),
-            )
-        })?;
-
-    // Find the identity_id before unbinding to sync it later
-    let identity_id: Option<i64> = sqlx::query_scalar(&format!(
-        "SELECT identity_id FROM {} WHERE file_uuid = $1 AND face_id = $2 AND identity_id IS NOT NULL",
+    // Capture old identity_id before unbind
+    let old_identity_id: Option<i32> = sqlx::query_scalar(&format!(
+        "SELECT identity_id FROM {} WHERE file_uuid = $1 AND face_id = $2",
         table
     ))
     .bind(&req.file_uuid)
     .bind(&req.face_id)
-    .fetch_optional(&db)
+    .fetch_optional(state.db.pool())
     .await
     .map_err(|e| {
         (
             StatusCode::INTERNAL_SERVER_ERROR,
             Json(serde_json::json!({"error": e.to_string()})),
         )
-    })?;
+    })?
+    .flatten();
 
     let result = sqlx::query(&format!(
         "UPDATE {} SET identity_id = NULL WHERE file_uuid = $1 AND face_id = $2",
@@ -175,7 +216,7 @@ pub async fn unbind_identity(
     ))
     .bind(&req.file_uuid)
     .bind(&req.face_id)
-    .execute(&db)
+    .execute(state.db.pool())
     .await
     .map_err(|e| {
         (
@@ -184,21 +225,58 @@ pub async fn unbind_identity(
         )
     })?;
 
-    // Sync the identity JSON if we found an identity
-    if let Some(id) = identity_id {
+    // Record history if there was a binding
+    if let Some(identity_id) = old_identity_id {
+        // Clear bind redo stack
+        let _ = sqlx::query(&format!(
+            "DELETE FROM {} WHERE identity_id = $1 AND is_undone = true AND operation IN ('bind','unbind','bind_trace')",
+            history_table
+        ))
+        .bind(identity_id)
+        .execute(state.db.pool())
+        .await;
+
+        // Insert history record
+        let uid = auth.user_id.to_string();
+        let usrc = match auth.source {
+            crate::api::middleware::AuthSource::Jwt => "jwt",
+            crate::api::middleware::AuthSource::Session => "session",
+            crate::api::middleware::AuthSource::ApiKey => "api_key",
+        };
+        let before = serde_json::json!({
+            "file_uuid": req.file_uuid, "face_id": req.face_id, "identity_id_before": old_identity_id
+        });
+        let after = serde_json::json!({
+            "file_uuid": req.file_uuid, "face_id": req.face_id, "identity_id_after": null
+        });
+        let _ = sqlx::query(&format!(
+            "INSERT INTO {} (identity_id, operation, before_snapshot, after_snapshot, is_undone, user_id, user_source) VALUES ($1, 'unbind', $2, $3, false, $4, $5)",
+            history_table
+        ))
+        .bind(identity_id)
+        .bind(before)
+        .bind(after)
+        .bind(&uid)
+        .bind(usrc)
+        .execute(state.db.pool())
+        .await;
+
+        // Sync the identity JSON
         let uuid: Option<String> = sqlx::query_scalar(&format!(
             "SELECT uuid::text FROM {} WHERE id = $1",
             id_table
         ))
-        .bind(id)
-        .fetch_optional(&db)
+        .bind(identity_id)
+        .fetch_optional(state.db.pool())
         .await
         .ok()
         .flatten();
         if let Some(identity_uuid) = uuid {
-            if let Err(e) =
-                crate::core::identity::storage::save_identity_file_by_pool(&db, &identity_uuid)
-                    .await
+            if let Err(e) = crate::core::identity::storage::save_identity_file_by_pool(
+                state.db.pool(),
+                &identity_uuid,
+            )
+            .await
             {
                 tracing::warn!(
                     "[unbind] Failed to sync identity file for {}: {}",
@@ -216,8 +294,58 @@ pub async fn unbind_identity(
     }))
 }
 
-/// V4.0 合併：將 identity A 合併入 identity B，A 被刪除
+/// Recursively copies into `into` every key of `from` that `into` lacks, pushing the dotted
+/// path of each inserted key onto `added` (`prefix` is the path of the enclosing object).
+/// Existing values in `into` are never overwritten; when both sides hold an object under the
+/// same key the merge descends into it. Keys named `aliases` are skipped at every depth.
+fn deep_merge_metadata_fields(
+    from: &serde_json::Map<String, serde_json::Value>,
+    into: &mut serde_json::Map<String, serde_json::Value>,
+    added: &mut Vec<String>,
+    prefix: &str,
+) {
+    for (key, value) in from.iter().filter(|(k, _)| k.as_str() != "aliases") {
+        let path = if prefix.is_empty() {
+            key.clone()
+        } else {
+            format!("{}.{}", prefix, key)
+        };
+        if let Some(existing) = into.get_mut(key) {
+            if let (Some(dst), Some(src)) = (existing.as_object_mut(), value.as_object()) {
+                deep_merge_metadata_fields(src, dst, added, &path);
+            }
+        } else {
+            into.insert(key.clone(), value.clone());
+            added.push(path);
+        }
+    }
+}
+
+/// Deletes the value addressed by `parts` (a sequence of object keys) from `value`.
+///
+/// While unwinding, a child that is an empty JSON object after the nested removal is
+/// pruned from its parent as well; `value` itself is never removed.
+///
+/// Does nothing when `parts` is empty, when a key along the path is missing, or when the
+/// value that would have to be indexed by a key is not a JSON object.
+fn remove_nested_meta_field(value: &mut serde_json::Value, parts: &[&str]) {
+    if let (Some((head, rest)), Some(obj)) = (parts.split_first(), value.as_object_mut()) {
+        // The last segment is removed unconditionally; an intermediate segment is removed
+        // only if recursing into it left an empty object behind.
+        let prune = rest.is_empty()
+            || obj.get_mut(*head).map_or(false, |child| {
+                remove_nested_meta_field(child, rest);
+                child.as_object().map_or(false, |m| m.is_empty())
+            });
+        if prune {
+            obj.remove(*head);
+        }
+    }
+}
+
+/// V4.0 合併：將 identity A 合併入 identity B，A 被刪除或標記為 merged
 pub async fn merge_identities(
+    Extension(auth): Extension<crate::api::middleware::UserAuth>,
     Path(identity_uuid): Path<String>,
     Json(req): Json<MergeIdentitiesRequest>,
 ) -> Result<Json<ApiResponse<serde_json::Value>>, (StatusCode, Json<serde_json::Value>)> {
@@ -233,12 +361,25 @@ pub async fn merge_identities(
             )
         })?;
 
-    // Get IDs for both identities
-    let from_row: Option<(i32, String)> = sqlx::query_as(&format!(
-        "SELECT id, name FROM {} WHERE uuid = $1::uuid",
+    let uuid_clean = identity_uuid.replace('-', "");
+    let into_uuid_clean = req.into_uuid.replace('-', "");
+
+    // Get full source identity snapshot
+    let source_row: Option<(
+        i32,
+        String,
+        Option<String>,
+        Option<String>,
+        String,
+        Option<i32>,
+        Option<String>,
+        Option<serde_json::Value>,
+        Option<chrono::NaiveDateTime>,
+    )> = sqlx::query_as(&format!(
+        "SELECT id, name, identity_type, source, status, tmdb_id, tmdb_profile, metadata, created_at FROM {} WHERE REPLACE(uuid::text, '-', '') = $1",
         id_table
     ))
-    .bind(&identity_uuid)
+    .bind(&uuid_clean)
     .fetch_optional(&db)
     .await
     .map_err(|e| {
@@ -247,16 +388,28 @@ pub async fn merge_identities(
             Json(serde_json::json!({"error": e.to_string()})),
         )
     })?;
-    let (from_id, from_name) = from_row.ok_or((
+
+    let (
+        from_id,
+        from_name,
+        from_type,
+        from_source,
+        from_status,
+        from_tmdb_id,
+        from_tmdb_profile,
+        from_metadata,
+        from_created_at,
+    ) = source_row.ok_or((
         StatusCode::NOT_FOUND,
         Json(serde_json::json!({"error": "Source identity not found"})),
     ))?;
 
-    let into_row: Option<(i32, String)> = sqlx::query_as(&format!(
-        "SELECT id, name FROM {} WHERE uuid = $1::uuid",
+    // Get full target identity snapshot
+    let target_row: Option<(i32, String, Option<serde_json::Value>)> = sqlx::query_as(&format!(
+        "SELECT id, name, metadata FROM {} WHERE REPLACE(uuid::text, '-', '') = $1",
         id_table
     ))
-    .bind(&req.into_uuid)
+    .bind(&into_uuid_clean)
     .fetch_optional(&db)
     .await
     .map_err(|e| {
@@ -265,11 +418,45 @@ pub async fn merge_identities(
             Json(serde_json::json!({"error": e.to_string()})),
         )
     })?;
-    let (into_id, into_name) = into_row.ok_or((
+
+    let (into_id, into_name, into_metadata) = target_row.ok_or((
         StatusCode::NOT_FOUND,
         Json(serde_json::json!({"error": "Target identity not found"})),
     ))?;
 
+    // Get face_ids that will be transferred
+    let face_ids: Vec<(Option<String>, Option<i32>)> = sqlx::query_as(&format!(
+        "SELECT face_id, trace_id FROM {} WHERE identity_id = $1",
+        face_table
+    ))
+    .bind(from_id)
+    .fetch_all(&db)
+    .await
+    .map_err(|e| {
+        (
+            StatusCode::INTERNAL_SERVER_ERROR,
+            Json(serde_json::json!({"error": e.to_string()})),
+        )
+    })?;
+
+    let face_id_list: Vec<String> = face_ids.iter().filter_map(|(f, _)| f.clone()).collect();
+    let trace_id_list: Vec<i32> = face_ids.iter().filter_map(|(_, t)| *t).collect();
+    let faces_count = face_id_list.len() as i64;
+
+    // Get file_uuid for these faces
+    let file_uuid: Option<String> = sqlx::query_scalar(&format!(
+        "SELECT file_uuid FROM {} WHERE identity_id = $1 LIMIT 1",
+        face_table
+    ))
+    .bind(from_id)
+    .fetch_optional(&db)
+    .await
+    .ok()
+    .flatten();
+
+    // Capture target metadata BEFORE merge
+    let into_meta_before = into_metadata.clone().unwrap_or(serde_json::json!({}));
+
     // Transfer all face bindings from source → target
     let updated = sqlx::query(&format!(
         "UPDATE {} SET identity_id = $1, stranger_id = NULL WHERE identity_id = $2",
@@ -286,6 +473,89 @@ pub async fn merge_identities(
         )
     })?;
 
+    // Merge text: source name → target aliases, source aliases → target aliases, source metadata → target metadata
+    let from_meta = from_metadata.clone();
+    let into_meta = into_metadata.clone();
+
+    let mut merged_meta = into_meta.clone().unwrap_or(serde_json::json!({}));
+    let from_meta_obj = from_meta
+        .as_ref()
+        .and_then(|m| m.as_object())
+        .cloned()
+        .unwrap_or_default();
+    let into_meta_obj = into_meta
+        .as_ref()
+        .and_then(|m| m.as_object())
+        .cloned()
+        .unwrap_or_default();
+
+    // Track aliases added for undo
+    let mut aliases_added: Vec<crate::core::db::AliasEntry> = Vec::new();
+    let mut metadata_fields_added: Vec<String> = Vec::new();
+
+    // Merge aliases
+    let mut aliases = into_meta_obj
+        .get("aliases")
+        .and_then(|a| a.as_array())
+        .cloned()
+        .unwrap_or_default();
+
+    // Add source name as alias (if not already present)
+    let from_name_str = from_name.clone();
+    if !aliases
+        .iter()
+        .any(|a| a.get("name").and_then(|n| n.as_str()) == Some(&from_name_str))
+    {
+        aliases.push(serde_json::json!({"name": from_name_str, "locale": "en", "source": "merge"}));
+        aliases_added.push(crate::core::db::AliasEntry {
+            name: from_name_str,
+            locale: "en".to_string(),
+            source: Some("merge".to_string()),
+        });
+    }
+
+    // Add source aliases (if not already present)
+    if let Some(from_aliases) = from_meta_obj.get("aliases").and_then(|a| a.as_array()) {
+        for fa in from_aliases {
+            let fa_name = fa.get("name").and_then(|n| n.as_str()).unwrap_or("");
+            let fa_locale = fa.get("locale").and_then(|l| l.as_str()).unwrap_or("en");
+            if !aliases
+                .iter()
+                .any(|a| a.get("name").and_then(|n| n.as_str()) == Some(fa_name))
+            {
+                aliases.push(fa.clone());
+                aliases_added.push(crate::core::db::AliasEntry {
+                    name: fa_name.to_string(),
+                    locale: fa_locale.to_string(),
+                    source: None,
+                });
+            }
+        }
+    }
+
+    merged_meta["aliases"] = serde_json::Value::Array(aliases);
+
+    // Deep-merge other metadata fields (recursive for nested objects)
+    if let Some(ref mut merged_map) = merged_meta.as_object_mut() {
+        deep_merge_metadata_fields(&from_meta_obj, merged_map, &mut metadata_fields_added, "");
+    }
+
+    // Update target metadata
+    sqlx::query(&format!(
+        "UPDATE {} SET metadata = $1 WHERE id = $2",
+        id_table
+    ))
+    .bind(&merged_meta)
+    .bind(into_id)
+    .execute(&db)
+    .await
+    .map_err(|e| {
+        (
+            StatusCode::INTERNAL_SERVER_ERROR,
+            Json(serde_json::json!({"error": e.to_string()})),
+        )
+    })?;
+
     let keep = req.keep_history.unwrap_or(true);
 
     if keep {
@@ -312,7 +582,6 @@ pub async fn merge_identities(
     }
 
     // Sync target identity JSON
-    let into_uuid_clean = req.into_uuid.replace('-', "");
     if let Err(e) =
         crate::core::identity::storage::save_identity_file_by_pool(&db, &into_uuid_clean).await
     {
@@ -325,8 +594,72 @@ pub async fn merge_identities(
 
     // Delete source identity JSON if not keeping history
     if !keep {
-        let from_uuid_clean = identity_uuid.replace('-', "");
-        let _ = crate::core::identity::storage::delete_identity_file(&from_uuid_clean);
+        let _ = crate::core::identity::storage::delete_identity_file(&uuid_clean);
+    }
+
+    // Generate merge_id and store to MongoDB
+    let merge_id = crate::core::db::IdentityMergeHistoryStore::generate_merge_id();
+    let now = chrono::Utc::now();
+    let undo_deadline = now + chrono::Duration::hours(24);
+
+    // Create MongoDB history record
+    let merge_history = crate::core::db::IdentityMergeHistory {
+        id: None,
+        merge_id: merge_id.clone(),
+        source_identity: crate::core::db::IdentitySnapshot {
+            id: from_id as i64,
+            uuid: uuid_clean.clone(),
+            name: from_name.clone(),
+            identity_type: from_type,
+            source: from_source,
+            status: from_status,
+            tmdb_id: from_tmdb_id.map(|id| id as i64),
+            tmdb_profile: from_tmdb_profile,
+            metadata: from_metadata.unwrap_or(serde_json::json!({})),
+            created_at: from_created_at
+                .map(|dt| chrono::DateTime::from_naive_utc_and_offset(dt, chrono::Utc)),
+            face_count: faces_count,
+        },
+        target_identity: crate::core::db::TargetIdentitySnapshot {
+            id: into_id as i64,
+            uuid: into_uuid_clean.clone(),
+            name: into_name.clone(),
+            metadata_before: into_meta_before,
+            metadata_after: Some(merged_meta.clone()),
+        },
+        aliases_added_to_target: aliases_added.clone(),
+        metadata_fields_added: metadata_fields_added.clone(),
+        faces_transferred: crate::core::db::FacesTransferred {
+            file_uuid: file_uuid.unwrap_or_default(),
+            face_ids: face_id_list,
+            trace_ids: trace_id_list,
+            count: faces_count,
+        },
+        merge_params: crate::core::db::MergeParams {
+            keep_history: keep,
+            cleared_stranger_id: true,
+            performed_by_user: Some(auth.user_id.to_string()),
+        },
+        merged_at: now,
+        undo_deadline,
+        undone: false,
+        undone_at: None,
+        undone_by: None,
+        undone_snapshot: None,
+        undo_expired: false,
+    };
+
+    // Store to MongoDB (non-blocking, warn on failure)
+    let mongo_store = crate::core::db::IdentityMergeHistoryStore::init().await;
+    if let Ok(store) = mongo_store {
+        if let Err(e) = store.store_merge_history(&merge_history).await {
+            tracing::warn!("[merge] Failed to store merge history in MongoDB: {}", e);
+        }
+    } else {
+        tracing::warn!(
+            "[merge] Failed to init MongoDB store: {:?}",
+            mongo_store.err()
+        );
     }
 
     Ok(Json(ApiResponse {
@@ -342,7 +675,12 @@ pub async fn merge_identities(
                 "source deleted"
             }
         ),
-        data: Some(serde_json::json!({"faces_transferred": updated.rows_affected()})),
+        data: Some(serde_json::json!({
+            "merge_id": merge_id,
+            "faces_transferred": updated.rows_affected(),
+            "aliases_added": aliases_added.len(),
+            "metadata_fields_added": metadata_fields_added.len()
+        })),
     }))
 }
 
@@ -390,27 +728,22 @@ pub struct TracesQuery {
 }
 
 pub async fn bind_identity_trace(
+    State(state): State<crate::api::types::AppState>,
+    Extension(auth): Extension<crate::api::middleware::UserAuth>,
     Path(identity_uuid): Path<String>,
     Json(req): Json<BindIdentityTraceRequest>,
 ) -> Result<Json<ApiResponse<serde_json::Value>>, (StatusCode, Json<serde_json::Value>)> {
     let fd_table = crate::core::db::schema::table_name("face_detections");
     let id_table = crate::core::db::schema::table_name("identities");
+    let history_table = crate::core::db::schema::table_name("identity_history");
 
-    let db = sqlx::PgPool::connect(&crate::core::config::DATABASE_URL)
-        .await
-        .map_err(|e| {
-            (
-                StatusCode::INTERNAL_SERVER_ERROR,
-                Json(serde_json::json!({"error": e.to_string()})),
-            )
-        })?;
-
+    let uuid_clean = identity_uuid.replace('-', "");
     let identity_row: Option<(i32, String)> = sqlx::query_as(&format!(
-        "SELECT id, name FROM {} WHERE uuid = $1::uuid",
+        "SELECT id, name FROM {} WHERE REPLACE(uuid::text, '-', '') = $1",
         id_table
     ))
-    .bind(&identity_uuid)
-    .fetch_optional(&db)
+    .bind(&uuid_clean)
+    .fetch_optional(state.db.pool())
     .await
     .map_err(|e| {
         (
@@ -426,14 +759,31 @@ pub async fn bind_identity_trace(
         )
     })?;
 
+    // Capture old identity_id before bind trace (use first face in trace as reference)
+    let old_identity_id: Option<i32> = sqlx::query_scalar(&format!(
+        "SELECT identity_id FROM {} WHERE file_uuid = $1 AND trace_id = $2 LIMIT 1",
+        fd_table
+    ))
+    .bind(&req.file_uuid)
+    .bind(req.trace_id)
+    .fetch_optional(state.db.pool())
+    .await
+    .map_err(|e| {
+        (
+            StatusCode::INTERNAL_SERVER_ERROR,
+            Json(serde_json::json!({"error": format!("DB error: {}", e)})),
+        )
+    })?
+    .flatten();
+
     let result = sqlx::query(&format!(
-        "UPDATE {} SET identity_id = $1, stranger_id = NULL WHERE file_uuid = $2 AND trace_id = $3",
+        "UPDATE {} SET identity_id = $1 WHERE file_uuid = $2 AND trace_id = $3",
         fd_table
     ))
     .bind(identity_id)
     .bind(&req.file_uuid)
     .bind(req.trace_id)
-    .execute(&db)
+    .execute(state.db.pool())
     .await
     .map_err(|e| {
         (
@@ -442,9 +792,43 @@ pub async fn bind_identity_trace(
         )
     })?;
 
-    let uuid_clean = identity_uuid.replace('-', "");
+    // Clear bind redo stack
+    let _ = sqlx::query(&format!(
+        "DELETE FROM {} WHERE identity_id = $1 AND is_undone = true AND operation IN ('bind','unbind','bind_trace')",
+        history_table
+    ))
+    .bind(identity_id)
+    .execute(state.db.pool())
+    .await;
+
+    // Insert history record
+    let uid = auth.user_id.to_string();
+    let usrc = match auth.source {
+        crate::api::middleware::AuthSource::Jwt => "jwt",
+        crate::api::middleware::AuthSource::Session => "session",
+        crate::api::middleware::AuthSource::ApiKey => "api_key",
+    };
+    let before = serde_json::json!({
+        "file_uuid": req.file_uuid, "trace_id": req.trace_id, "identity_id_before": old_identity_id
+    });
+    let after = serde_json::json!({
+        "file_uuid": req.file_uuid, "trace_id": req.trace_id, "identity_id_after": identity_id
+    });
+    let _ = sqlx::query(&format!(
+        "INSERT INTO {} (identity_id, operation, before_snapshot, after_snapshot, is_undone, user_id, user_source) VALUES ($1, 'bind_trace', $2, $3, false, $4, $5)",
+        history_table
+    ))
+    .bind(identity_id)
+    .bind(before)
+    .bind(after)
+    .bind(&uid)
+    .bind(usrc)
+    .execute(state.db.pool())
+    .await;
+
     if let Err(e) =
-        crate::core::identity::storage::save_identity_file_by_pool(&db, &uuid_clean).await
+        crate::core::identity::storage::save_identity_file_by_pool(state.db.pool(), &uuid_clean)
+            .await
     {
         tracing::warn!(
             "[bind/trace] Failed to sync identity file for {}: {}",
@@ -476,11 +860,12 @@ pub async fn get_identity_traces(
     let offset = ((page - 1) as i64) * (page_size as i64);
 
     // Get identity name
+    let uuid_clean = identity_uuid.replace('-', "");
     let identity: Option<(i32, String)> = sqlx::query_as(&format!(
-        "SELECT id, name FROM {} WHERE uuid = $1::uuid",
+        "SELECT id, name FROM {} WHERE REPLACE(uuid::text, '-', '') = $1",
         id_table
     ))
-    .bind(&identity_uuid)
+    .bind(&uuid_clean)
     .fetch_optional(state.db.pool())
     .await
     .map_err(|e| (StatusCode::INTERNAL_SERVER_ERROR, e.to_string()))?;
@@ -560,6 +945,870 @@ pub async fn get_identity_traces(
     }))
 }
 
+/// Undo a merge operation before its `undo_deadline` (set to 24 hours after the merge).
+///
+/// Restores or re-creates the source identity, moves the transferred faces back, strips the
+/// merged-in aliases and metadata fields from the target and marks the record as undone.
+/// Fails with 404 for an unknown `merge_id` and 400 if already undone or past the deadline.
+pub async fn undo_merge(
+    Extension(auth): Extension<crate::api::middleware::UserAuth>,
+    Path(merge_id): Path<String>,
+) -> Result<Json<ApiResponse<serde_json::Value>>, (StatusCode, Json<serde_json::Value>)> {
+    let face_table = crate::core::db::schema::table_name("face_detections");
+    let id_table = crate::core::db::schema::table_name("identities");
+
+    // Get merge history from MongoDB
+    let mongo_store = crate::core::db::IdentityMergeHistoryStore::init()
+        .await
+        .map_err(|e| {
+            (
+                StatusCode::INTERNAL_SERVER_ERROR,
+                Json(serde_json::json!({"error": format!("MongoDB init failed: {}", e)})),
+            )
+        })?;
+
+    let history = mongo_store
+        .get_merge_history(&merge_id)
+        .await
+        .map_err(|e| {
+            (
+                StatusCode::INTERNAL_SERVER_ERROR,
+                Json(serde_json::json!({"error": format!("MongoDB query failed: {}", e)})),
+            )
+        })?;
+
+    let history = history.ok_or((
+        StatusCode::NOT_FOUND,
+        Json(serde_json::json!({"error": "Merge record not found"})),
+    ))?;
+
+    // Check if already undone
+    if history.undone {
+        return Err((
+            StatusCode::BAD_REQUEST,
+            Json(serde_json::json!({"error": "Merge already undone"})),
+        ));
+    }
+
+    // Reject the request once the deadline stored on the merge record has passed
+    let now = chrono::Utc::now();
+    let now_naive = now.naive_utc();
+    if now > history.undo_deadline {
+        return Err((
+            StatusCode::BAD_REQUEST,
+            Json(serde_json::json!({
+                "error": "Undo deadline expired",
+                "merged_at": history.merged_at.to_rfc3339(),
+                "undo_deadline": history.undo_deadline.to_rfc3339()
+            })),
+        ));
+    }
+
+    // Connect to PostgreSQL. NOTE(review): the updates below run without a transaction.
+    let db = sqlx::PgPool::connect(&crate::core::config::DATABASE_URL)
+        .await
+        .map_err(|e| {
+            (
+                StatusCode::INTERNAL_SERVER_ERROR,
+                Json(serde_json::json!({"error": e.to_string()})),
+            )
+        })?;
+
+    // Restore source identity (or recreate if keep_history=false)
+    let mut source_id = history.source_identity.id;
+    let source_uuid = history.source_identity.uuid.clone();
+
+    if history.merge_params.keep_history {
+        // Source identity still exists: reset status to 'confirmed' and restore its metadata
+        sqlx::query(&format!(
+            "UPDATE {} SET status = 'confirmed', metadata = $1 WHERE id = $2",
+            id_table
+        ))
+        .bind(&history.source_identity.metadata)
+        .bind(source_id as i32)
+        .execute(&db)
+        .await
+        .map_err(|e| {
+            (
+                StatusCode::INTERNAL_SERVER_ERROR,
+                Json(serde_json::json!({"error": e.to_string()})),
+            )
+        })?;
+    } else {
+        // Source row was deleted by the merge: re-insert it from the snapshot (new row id)
+        let source_uuid_parsed = uuid::Uuid::parse_str(&source_uuid).map_err(|e| {
+            (
+                StatusCode::INTERNAL_SERVER_ERROR,
+                Json(serde_json::json!({"error": format!("Invalid UUID format: {}", e)})),
+            )
+        })?;
+        let new_id: i32 = sqlx::query_scalar(&format!(
+            "INSERT INTO {} (uuid, name, identity_type, source, status, tmdb_id, tmdb_profile, metadata, created_at) VALUES ($1, $2, $3, $4, $5, $6, $7, $8, $9) RETURNING id",
+            id_table
+        ))
+        .bind(source_uuid_parsed)
+        .bind(&history.source_identity.name)
+        .bind(&history.source_identity.identity_type)
+        .bind(&history.source_identity.source)
+        .bind("confirmed")
+        .bind(history.source_identity.tmdb_id.map(|id| id as i32))
+        .bind(&history.source_identity.tmdb_profile)
+        .bind(&history.source_identity.metadata)
+        .bind(history.source_identity.created_at.map(|dt| dt.naive_utc()).unwrap_or(now_naive))
+        .fetch_one(&db)
+        .await
+        .map_err(|e| {
+            (
+                StatusCode::INTERNAL_SERVER_ERROR,
+                Json(serde_json::json!({"error": format!("Failed to recreate source identity: {}", e)})),
+            )
+        })?;
+
+        source_id = new_id as i64;
+    }
+
+    // Restore faces to source identity. Only faces still bound to the merge target are moved:
+    // bind/unbind address a face by `file_uuid` + `face_id`, so `face_id` alone may not be
+    // unique and an unscoped update could pull faces away from unrelated identities.
+    let faces_reverted = sqlx::query(&format!(
+        "UPDATE {} SET identity_id = $1 WHERE face_id = ANY($2) AND identity_id = $3",
+        face_table
+    ))
+    .bind(source_id as i32)
+    .bind(&history.faces_transferred.face_ids)
+    .bind(history.target_identity.id as i32)
+    .execute(&db)
+    .await
+    .map_err(|e| {
+        (
+            StatusCode::INTERNAL_SERVER_ERROR,
+            Json(serde_json::json!({"error": e.to_string()})),
+        )
+    })?;
+
+    // Restore target metadata (precise removal, starting from the target's current metadata)
+    let target_meta: Option<serde_json::Value> =
+        sqlx::query_scalar(&format!("SELECT metadata FROM {} WHERE id = $1", id_table))
+            .bind(history.target_identity.id as i32)
+            .fetch_optional(&db)
+            .await
+            .map_err(|e| {
+                (
+                    StatusCode::INTERNAL_SERVER_ERROR,
+                    Json(serde_json::json!({"error": e.to_string()})),
+                )
+            })?;
+
+    let mut restored_meta = target_meta.unwrap_or(serde_json::json!({}));
+
+    // Remove exactly the aliases this merge added to the target, matched by name: the merge
+    // only added names the target did not already have. Entries copied from the source's own
+    // aliases are recorded with `source: None`, so filtering on `source == "merge"` would
+    // miss them and would also delete aliases left behind by other merges.
+    let aliases_to_remove = &history.aliases_added_to_target;
+    if let Some(aliases) = restored_meta
+        .get_mut("aliases")
+        .and_then(|a| a.as_array_mut())
+    {
+        aliases.retain(|alias| {
+            let alias_name = alias.get("name").and_then(|n| n.as_str());
+            !aliases_to_remove.iter().any(|r| Some(r.name.as_str()) == alias_name)
+        });
+    }
+
+    // Remove metadata fields that were added from source (handles nested paths)
+    for field in &history.metadata_fields_added {
+        let parts: Vec<&str> = field.split('.').collect();
+        remove_nested_meta_field(&mut restored_meta, &parts);
+    }
+
+    // Update target metadata
+    sqlx::query(&format!(
+        "UPDATE {} SET metadata = $1 WHERE id = $2",
+        id_table
+    ))
+    .bind(&restored_meta)
+    .bind(history.target_identity.id as i32)
+    .execute(&db)
+    .await
+    .map_err(|e| {
+        (
+            StatusCode::INTERNAL_SERVER_ERROR,
+            Json(serde_json::json!({"error": e.to_string()})),
+        )
+    })?;
+
+    // Sync identity JSON files (best effort: a failure is logged, not returned)
+    let source_uuid_clean = source_uuid.replace('-', "");
+    if let Err(e) =
+        crate::core::identity::storage::save_identity_file_by_pool(&db, &source_uuid_clean).await
+    {
+        tracing::warn!("[undo] Failed to sync source identity file: {}", e);
+    }
+
+    let target_uuid_clean = history.target_identity.uuid.replace('-', "");
+    if let Err(e) =
+        crate::core::identity::storage::save_identity_file_by_pool(&db, &target_uuid_clean).await
+    {
+        tracing::warn!("[undo] Failed to sync target identity file: {}", e);
+    }
+
+    // Mark as undone in MongoDB with snapshot for potential redo
+    let undone_snapshot = crate::core::db::UndoneSnapshot {
+        source_identity_id: source_id,
+        source_uuid: source_uuid.clone(),
+        source_name: history.source_identity.name.clone(),
+        target_metadata_at_undo: restored_meta.clone(),
+    };
+    mongo_store
+        .mark_as_undone(&merge_id, Some(&auth.user_id.to_string()), undone_snapshot)
+        .await
+        .map_err(|e| {
+            (
+                StatusCode::INTERNAL_SERVER_ERROR,
+                Json(serde_json::json!({"error": format!("Failed to mark as undone: {}", e)})),
+            )
+        })?;
+
+    Ok(Json(ApiResponse {
+        success: true,
+        message: format!(
+            "Undo merge completed: '{}' restored, {} faces reverted",
+            history.source_identity.name,
+            faces_reverted.rows_affected()
+        ),
+        data: Some(serde_json::json!({
+            "source_identity_restored": {
+                "uuid": source_uuid,
+                "name": history.source_identity.name,
+                "status": "confirmed"
+            },
+            "faces_reverted": faces_reverted.rows_affected(),
+            "aliases_removed_from_target": history.aliases_added_to_target.len(),
+            "metadata_fields_removed_from_target": history.metadata_fields_added.len()
+        })),
+    }))
+}
+
+/// Query-string parameters accepted by `get_merge_history`.
+///
+/// The four filter fields are moved unchanged into `crate::core::db::MergeHistoryQuery`;
+/// `page` and `page_size` are passed to the store's `query_merge_history` for pagination.
+#[derive(Debug, Deserialize)]
+pub struct MergeHistoryQueryParams {
+    /// Passed through as `MergeHistoryQuery::source_uuid` (presumably filters by source identity).
+    pub source_uuid: Option<String>,
+    /// Passed through as `MergeHistoryQuery::target_uuid` (presumably filters by target identity).
+    pub target_uuid: Option<String>,
+    /// Passed through as `MergeHistoryQuery::merge_id` (presumably selects one merge record).
+    pub merge_id: Option<String>,
+    /// Passed through as `MergeHistoryQuery::undone` (presumably filters on the undone flag).
+    pub undone: Option<bool>,
+    /// Page number; the handler falls back to 1 when it is absent.
+    pub page: Option<u32>,
+    /// Page size; the handler falls back to 20 when it is absent.
+    pub page_size: Option<u32>,
+}
+
+/// JSON body returned by `get_merge_history` on success.
+#[derive(Debug, Serialize)]
+pub struct MergeHistoryResponse {
+    /// Set to `true` by the handler; failures are reported through a separate error body.
+    pub success: bool,
+    /// Total count returned by the store's `query_merge_history` next to the result page.
+    pub total: u64,
+    /// Page number that was used for the query.
+    pub page: u32,
+    /// Page size that was used for the query.
+    pub page_size: u32,
+    /// Merge-history entries returned for this page.
+    pub results: Vec<crate::core::db::MergeHistoryEntry>,
+}
+
+/// Lists merge-history records from the merge history store
+/// (`GET /api/v1/identity/merge/history`).
+///
+/// Filters (`source_uuid`, `target_uuid`, `merge_id`, `undone`) are forwarded unchanged to
+/// the store. Pagination is sanitized before it reaches the store: `page` defaults to 1
+/// and is never below 1, `page_size` defaults to 20 and is clamped to `1..=100`.
+/// The sanitized values are echoed back in the response.
+///
+/// # Errors
+/// Returns `500` with a JSON `{"error": ...}` body when the store cannot be initialised
+/// or the query fails.
+pub async fn get_merge_history(
+    Query(params): Query<MergeHistoryQueryParams>,
+) -> Result<Json<MergeHistoryResponse>, (StatusCode, Json<serde_json::Value>)> {
+    // Ceiling for `page_size`; the same ceiling `bind_history` applies to its `limit`.
+    const MAX_PAGE_SIZE: u32 = 100;
+
+    // Caller-supplied pagination is untrusted: page 0 and zero/huge page sizes must not
+    // be handed to the store as-is.
+    let page = params.page.unwrap_or(1).max(1);
+    let page_size = params.page_size.unwrap_or(20).clamp(1, MAX_PAGE_SIZE);
+
+    let mongo_store = crate::core::db::IdentityMergeHistoryStore::init()
+        .await
+        .map_err(|e| {
+            (
+                StatusCode::INTERNAL_SERVER_ERROR,
+                Json(serde_json::json!({"error": format!("MongoDB init failed: {}", e)})),
+            )
+        })?;
+
+    let query = crate::core::db::MergeHistoryQuery {
+        source_uuid: params.source_uuid,
+        target_uuid: params.target_uuid,
+        merge_id: params.merge_id,
+        undone: params.undone,
+    };
+
+    let (results, total) = mongo_store
+        .query_merge_history(query, page, page_size)
+        .await
+        .map_err(|e| {
+            (
+                StatusCode::INTERNAL_SERVER_ERROR,
+                Json(serde_json::json!({"error": format!("MongoDB query failed: {}", e)})),
+            )
+        })?;
+
+    Ok(Json(MergeHistoryResponse {
+        success: true,
+        total,
+        page,
+        page_size,
+        results,
+    }))
+}
+
+/// Re-applies a merge that was previously undone
+/// (`POST /api/v1/identity/merge/:merge_id/redo`).
+///
+/// Steps:
+/// 1. Load the merge record and check that it is currently undone, still inside
+///    `undo_deadline`, and carries an `undone_snapshot`.
+/// 2. Rebuild the target metadata from the snapshot taken at undo time, re-adding the
+///    aliases and metadata fields recorded on the merge. This happens before any
+///    database write, so an unusable snapshot is rejected without side effects.
+/// 3. Move the source identity's faces to the target, store the metadata, then mark the
+///    source identity `merged` (when `keep_history` is set) or delete it.
+/// 4. Refresh both identity JSON files (best effort, failures are only logged) and mark
+///    the record as redone in the history store.
+///
+/// # Errors
+/// * `404` - no merge record with this id.
+/// * `400` - the merge is not undone, or the deadline has passed.
+/// * `500` - missing or malformed snapshot, or any MongoDB / PostgreSQL failure.
+///
+/// NOTE(review): the PostgreSQL statements are not wrapped in a transaction, so a failure
+/// part-way through leaves a partially applied redo. A fresh pool is also opened on every
+/// call instead of reusing a shared one - confirm whether that is intended.
+pub async fn redo_merge(
+    Extension(auth): Extension<crate::api::middleware::UserAuth>,
+    Path(merge_id): Path<String>,
+) -> Result<Json<ApiResponse<serde_json::Value>>, (StatusCode, Json<serde_json::Value>)> {
+    let face_table = crate::core::db::schema::table_name("face_detections");
+    let id_table = crate::core::db::schema::table_name("identities");
+
+    // Every PostgreSQL failure in this handler is reported with the same shape.
+    let db_err = |e: sqlx::Error| {
+        (
+            StatusCode::INTERNAL_SERVER_ERROR,
+            Json(serde_json::json!({"error": e.to_string()})),
+        )
+    };
+
+    let mongo_store = crate::core::db::IdentityMergeHistoryStore::init()
+        .await
+        .map_err(|e| {
+            (
+                StatusCode::INTERNAL_SERVER_ERROR,
+                Json(serde_json::json!({"error": format!("MongoDB init failed: {}", e)})),
+            )
+        })?;
+
+    let history = mongo_store
+        .get_merge_history(&merge_id)
+        .await
+        .map_err(|e| {
+            (
+                StatusCode::INTERNAL_SERVER_ERROR,
+                Json(serde_json::json!({"error": format!("MongoDB query failed: {}", e)})),
+            )
+        })?
+        .ok_or((
+            StatusCode::NOT_FOUND,
+            Json(serde_json::json!({"error": "Merge record not found"})),
+        ))?;
+
+    if !history.undone {
+        return Err((
+            StatusCode::BAD_REQUEST,
+            Json(serde_json::json!({"error": "Merge is not undone, nothing to redo"})),
+        ));
+    }
+
+    // Redo shares the undo deadline stored on the merge record.
+    if chrono::Utc::now() > history.undo_deadline {
+        return Err((
+            StatusCode::BAD_REQUEST,
+            Json(serde_json::json!({
+                "error": "Redo deadline expired",
+                "undo_deadline": history.undo_deadline.to_rfc3339()
+            })),
+        ));
+    }
+
+    let snapshot = history.undone_snapshot.as_ref().ok_or((
+        StatusCode::INTERNAL_SERVER_ERROR,
+        Json(serde_json::json!({"error": "Undone snapshot not found, cannot redo"})),
+    ))?;
+
+    // Build target metadata: start from undone_snapshot (clean state after undo).
+    // A null snapshot is treated as an empty object; any other non-object value is
+    // rejected here instead of panicking after faces have already been moved.
+    let mut target_meta = snapshot.target_metadata_at_undo.clone();
+    if target_meta.is_null() {
+        target_meta = serde_json::json!({});
+    }
+    let meta_obj = target_meta.as_object_mut().ok_or_else(|| {
+        (
+            StatusCode::INTERNAL_SERVER_ERROR,
+            Json(serde_json::json!({
+                "error": "Undone snapshot metadata is not a JSON object, cannot redo"
+            })),
+        )
+    })?;
+
+    // Add aliases from source, skipping any (name, locale) pair already present.
+    let mut new_aliases = meta_obj
+        .get("aliases")
+        .and_then(|a| a.as_array())
+        .cloned()
+        .unwrap_or_default();
+    for alias_added in &history.aliases_added_to_target {
+        let already_exists = new_aliases.iter().any(|a| {
+            a.get("name").and_then(|n| n.as_str()) == Some(&alias_added.name)
+                && a.get("locale").and_then(|l| l.as_str()) == Some(&alias_added.locale)
+        });
+        if !already_exists {
+            new_aliases.push(serde_json::json!({
+                "name": alias_added.name,
+                "locale": alias_added.locale,
+                "source": "merge"
+            }));
+        }
+    }
+    meta_obj.insert("aliases".into(), serde_json::Value::Array(new_aliases));
+
+    // Add metadata fields from source.
+    // NOTE(review): undo_merge appears to treat these names as dotted paths
+    // (`field.split('.')`), while this lookup is top-level only - confirm whether nested
+    // fields need to be restored here as well.
+    let source_meta = &history.source_identity.metadata;
+    for field in &history.metadata_fields_added {
+        if let Some(value) = source_meta.get(field) {
+            meta_obj.insert(field.clone(), value.clone());
+        }
+    }
+
+    let db = sqlx::PgPool::connect(&crate::core::config::DATABASE_URL)
+        .await
+        .map_err(db_err)?;
+
+    // Transfer faces from source back to target
+    let faces_redone = sqlx::query(&format!(
+        "UPDATE {} SET identity_id = $1, stranger_id = NULL WHERE identity_id = $2",
+        face_table
+    ))
+    .bind(history.target_identity.id as i32)
+    .bind(snapshot.source_identity_id as i32)
+    .execute(&db)
+    .await
+    .map_err(db_err)?;
+
+    // Update target metadata
+    sqlx::query(&format!(
+        "UPDATE {} SET metadata = $1 WHERE id = $2",
+        id_table
+    ))
+    .bind(&target_meta)
+    .bind(history.target_identity.id as i32)
+    .execute(&db)
+    .await
+    .map_err(db_err)?;
+
+    // Handle source identity: keep it as a 'merged' tombstone or remove it entirely,
+    // depending on the parameters of the original merge.
+    let source_sql = if history.merge_params.keep_history {
+        format!("UPDATE {} SET status = 'merged' WHERE id = $1", id_table)
+    } else {
+        format!("DELETE FROM {} WHERE id = $1", id_table)
+    };
+    sqlx::query(&source_sql)
+        .bind(snapshot.source_identity_id as i32)
+        .execute(&db)
+        .await
+        .map_err(db_err)?;
+
+    // Sync identity JSON files (best effort: a failure is logged, not returned)
+    let source_uuid_clean = snapshot.source_uuid.replace('-', "");
+    if let Err(e) =
+        crate::core::identity::storage::save_identity_file_by_pool(&db, &source_uuid_clean).await
+    {
+        tracing::warn!("[redo] Failed to sync source identity file: {}", e);
+    }
+    let target_uuid_clean = history.target_identity.uuid.replace('-', "");
+    if let Err(e) =
+        crate::core::identity::storage::save_identity_file_by_pool(&db, &target_uuid_clean).await
+    {
+        tracing::warn!("[redo] Failed to sync target identity file: {}", e);
+    }
+
+    // Mark as redone in MongoDB
+    mongo_store
+        .mark_as_redone(&merge_id, Some(&auth.user_id.to_string()))
+        .await
+        .map_err(|e| {
+            (
+                StatusCode::INTERNAL_SERVER_ERROR,
+                Json(serde_json::json!({"error": format!("Failed to mark as redone: {}", e)})),
+            )
+        })?;
+
+    Ok(Json(ApiResponse {
+        success: true,
+        message: format!(
+            "Redo merge completed: '{}' merged into '{}', {} faces transferred",
+            snapshot.source_name,
+            history.target_identity.name,
+            faces_redone.rows_affected()
+        ),
+        data: Some(serde_json::json!({
+            "merge_id": merge_id,
+            "faces_transferred": faces_redone.rows_affected(),
+            "aliases_added": history.aliases_added_to_target.len(),
+            "metadata_fields_added": history.metadata_fields_added.len()
+        })),
+    }))
+}
+
+// ── Bind Undo/Redo/History ──────────────────────────────────────────
+
+/// JSON request body shared by the `bind_undo` and `bind_redo` handlers.
+#[derive(Debug, Deserialize)]
+struct BindUndoRequest {
+    /// How many history records to process; the handlers treat a missing value or 0 as 1.
+    steps: Option<usize>,
+}
+
+/// JSON response body shared by the `bind_undo` and `bind_redo` handlers.
+#[derive(Debug, Serialize)]
+struct BindUndoResponse {
+    /// Set to `true` by the handlers; failures are reported through a separate error body.
+    success: bool,
+    /// Identity UUID from the request path with all dashes removed.
+    identity_uuid: String,
+    /// Operation name taken from the last record of the processed batch.
+    operation: String,
+    /// Number of history records in the processed batch (also used for redo).
+    undone_count: usize,
+    /// Number of face-detection rows updated while applying the snapshot data.
+    affected_rows: i64,
+}
+
+/// Rewrites `identity_id` on the face-detection rows that a history snapshot refers to.
+///
+/// The snapshot must hold a string `file_uuid` plus either a string `face_id` or an
+/// integer `trace_id`; when both are present `face_id` wins. `identity_id_value` supplies
+/// the new `identity_id`: `None`, or a JSON value that is not an integer, is bound as
+/// SQL `NULL`.
+///
+/// Returns the number of rows the UPDATE touched. Every failure (malformed snapshot or
+/// database error) is reported as a `500` with a JSON `{"error": ...}` body.
+async fn apply_bind_snapshot(
+    pool: &sqlx::PgPool,
+    face_table: &str,
+    snapshot: &serde_json::Value,
+    identity_id_value: Option<serde_json::Value>,
+) -> Result<i64, (StatusCode, Json<serde_json::Value>)> {
+    // One place that shapes every error this function can return.
+    let internal = |msg: String| {
+        (
+            StatusCode::INTERNAL_SERVER_ERROR,
+            Json(serde_json::json!({"error": msg})),
+        )
+    };
+
+    let file_uuid = snapshot
+        .get("file_uuid")
+        .and_then(|v| v.as_str())
+        .ok_or_else(|| internal("Missing file_uuid in snapshot".to_string()))?;
+
+    let new_identity = identity_id_value
+        .as_ref()
+        .and_then(serde_json::Value::as_i64);
+
+    let face_key = snapshot.get("face_id").and_then(|v| v.as_str());
+    let trace_key = snapshot.get("trace_id").and_then(|v| v.as_i64());
+
+    let outcome = match (face_key, trace_key) {
+        // A face id addresses a single detection and takes precedence over a trace id.
+        (Some(face_id), _) => {
+            let sql = format!(
+                "UPDATE {} SET identity_id = $1 WHERE file_uuid = $2 AND face_id = $3",
+                face_table
+            );
+            sqlx::query(&sql)
+                .bind(new_identity)
+                .bind(file_uuid)
+                .bind(face_id)
+                .execute(pool)
+                .await
+        }
+        // Otherwise fall back to addressing the rows by trace id.
+        (None, Some(trace_id)) => {
+            let sql = format!(
+                "UPDATE {} SET identity_id = $1 WHERE file_uuid = $2 AND trace_id = $3",
+                face_table
+            );
+            sqlx::query(&sql)
+                .bind(new_identity)
+                .bind(file_uuid)
+                .bind(trace_id as i32)
+                .execute(pool)
+                .await
+        }
+        (None, None) => {
+            return Err(internal(
+                "Snapshot has neither face_id nor trace_id".to_string(),
+            ));
+        }
+    };
+
+    outcome
+        .map(|done| done.rows_affected() as i64)
+        .map_err(|e| internal(e.to_string()))
+}
+
+/// Undoes the most recent bind/unbind/bind_trace operations of an identity
+/// (`POST /api/v1/identity/:identity_uuid/bind/undo`).
+///
+/// Up to `steps` (default 1, minimum 1) not-yet-undone history records are fetched newest
+/// first. For each record its `before_snapshot` is applied via `apply_bind_snapshot`
+/// (using the snapshot's `identity_id_before`), and the record is then flagged as undone.
+/// Every fetched record is reverted, so the history flags always match what was actually
+/// changed in the face table.
+///
+/// The response reports the operation name of the last record processed, the number of
+/// records processed, and the total number of face rows updated.
+///
+/// # Errors
+/// * `404` - no identity with this UUID.
+/// * `400` - nothing left to undo.
+/// * `500` - database failure or malformed snapshot. Records processed before the failure
+///   stay undone; the statements are not wrapped in a transaction.
+pub async fn bind_undo(
+    State(state): State<crate::api::types::AppState>,
+    // The extractor is kept so the route still requires an authenticated user.
+    Extension(_auth): Extension<crate::api::middleware::UserAuth>,
+    Path(identity_uuid): Path<String>,
+    Json(req): Json<BindUndoRequest>,
+) -> Result<Json<BindUndoResponse>, (StatusCode, Json<serde_json::Value>)> {
+    let uuid_clean = identity_uuid.replace('-', "");
+    let steps = req.steps.unwrap_or(1).max(1);
+    let id_table = crate::core::db::schema::table_name("identities");
+    let history_table = crate::core::db::schema::table_name("identity_history");
+    let face_table = crate::core::db::schema::table_name("face_detections");
+    let pool = state.db.pool();
+
+    let identity_id: i32 = sqlx::query_scalar(&format!(
+        "SELECT id FROM {} WHERE REPLACE(uuid::text, '-', '') = $1",
+        id_table
+    ))
+    .bind(&uuid_clean)
+    .fetch_optional(pool)
+    .await
+    .map_err(|e| {
+        (
+            StatusCode::INTERNAL_SERVER_ERROR,
+            Json(serde_json::json!({"error": format!("DB error: {}", e)})),
+        )
+    })?
+    .ok_or((
+        StatusCode::NOT_FOUND,
+        Json(serde_json::json!({"error": "Identity not found"})),
+    ))?;
+
+    let records: Vec<(i64, String, serde_json::Value)> = sqlx::query_as(&format!(
+        "SELECT id, operation, before_snapshot FROM {} WHERE identity_id = $1 AND is_undone = false AND operation IN ('bind','unbind','bind_trace') ORDER BY created_at DESC LIMIT $2",
+        history_table
+    ))
+    .bind(identity_id)
+    .bind(steps as i64)
+    .fetch_all(pool)
+    .await
+    .map_err(|e| {
+        (
+            StatusCode::INTERNAL_SERVER_ERROR,
+            Json(serde_json::json!({"error": format!("Failed to get history: {}", e)})),
+        )
+    })?;
+
+    // The last fetched record is the oldest one, i.e. the last one reverted below.
+    let operation = match records.last() {
+        Some((_, op, _)) => op.clone(),
+        None => {
+            return Err((
+                StatusCode::BAD_REQUEST,
+                Json(serde_json::json!({"error": "No bind undo operations available"})),
+            ));
+        }
+    };
+
+    let mark_sql = format!(
+        "UPDATE {} SET is_undone = true, undone_at = NOW() WHERE id = $1",
+        history_table
+    );
+
+    // Revert newest-first, and flag each record only after its snapshot was applied.
+    let mut affected_rows: i64 = 0;
+    for (history_id, _, before) in &records {
+        let identity_id_before = before.get("identity_id_before").cloned();
+        affected_rows +=
+            apply_bind_snapshot(pool, &face_table, before, identity_id_before).await?;
+
+        sqlx::query(&mark_sql)
+            .bind(history_id)
+            .execute(pool)
+            .await
+            .map_err(|e| {
+                (
+                    StatusCode::INTERNAL_SERVER_ERROR,
+                    Json(serde_json::json!({
+                        "error": format!("Failed to mark history as undone: {}", e)
+                    })),
+                )
+            })?;
+    }
+
+    Ok(Json(BindUndoResponse {
+        success: true,
+        identity_uuid: uuid_clean,
+        operation,
+        undone_count: records.len(),
+        affected_rows,
+    }))
+}
+
+/// Re-applies previously undone bind/unbind/bind_trace operations of an identity
+/// (`POST /api/v1/identity/:identity_uuid/bind/redo`).
+///
+/// Up to `steps` (default 1, minimum 1) undone history records are fetched oldest first,
+/// so a partial redo restores operations in the order they originally happened (the
+/// reverse of the newest-first order used by `bind_undo`). For each record its
+/// `after_snapshot` is applied via `apply_bind_snapshot` (using the snapshot's
+/// `identity_id_after`), and the record's undone flag is then cleared.
+///
+/// The response reuses `BindUndoResponse`: `undone_count` is the number of records
+/// redone, `operation` is the name of the last record processed.
+///
+/// # Errors
+/// * `404` - no identity with this UUID.
+/// * `400` - nothing left to redo.
+/// * `500` - database failure or malformed snapshot. Records processed before the failure
+///   stay redone; the statements are not wrapped in a transaction.
+pub async fn bind_redo(
+    State(state): State<crate::api::types::AppState>,
+    // The extractor is kept so the route still requires an authenticated user.
+    Extension(_auth): Extension<crate::api::middleware::UserAuth>,
+    Path(identity_uuid): Path<String>,
+    Json(req): Json<BindUndoRequest>,
+) -> Result<Json<BindUndoResponse>, (StatusCode, Json<serde_json::Value>)> {
+    let uuid_clean = identity_uuid.replace('-', "");
+    let steps = req.steps.unwrap_or(1).max(1);
+    let id_table = crate::core::db::schema::table_name("identities");
+    let history_table = crate::core::db::schema::table_name("identity_history");
+    let face_table = crate::core::db::schema::table_name("face_detections");
+    let pool = state.db.pool();
+
+    let identity_id: i32 = sqlx::query_scalar(&format!(
+        "SELECT id FROM {} WHERE REPLACE(uuid::text, '-', '') = $1",
+        id_table
+    ))
+    .bind(&uuid_clean)
+    .fetch_optional(pool)
+    .await
+    .map_err(|e| {
+        (
+            StatusCode::INTERNAL_SERVER_ERROR,
+            Json(serde_json::json!({"error": format!("DB error: {}", e)})),
+        )
+    })?
+    .ok_or((
+        StatusCode::NOT_FOUND,
+        Json(serde_json::json!({"error": "Identity not found"})),
+    ))?;
+
+    // Oldest undone record first: it is the one that was undone last, so it is the one
+    // that has to be redone first.
+    let records: Vec<(i64, String, serde_json::Value)> = sqlx::query_as(&format!(
+        "SELECT id, operation, after_snapshot FROM {} WHERE identity_id = $1 AND is_undone = true AND operation IN ('bind','unbind','bind_trace') ORDER BY created_at ASC LIMIT $2",
+        history_table
+    ))
+    .bind(identity_id)
+    .bind(steps as i64)
+    .fetch_all(pool)
+    .await
+    .map_err(|e| {
+        (
+            StatusCode::INTERNAL_SERVER_ERROR,
+            Json(serde_json::json!({"error": format!("Failed to get history: {}", e)})),
+        )
+    })?;
+
+    // The last fetched record is the last one re-applied below.
+    let operation = match records.last() {
+        Some((_, op, _)) => op.clone(),
+        None => {
+            return Err((
+                StatusCode::BAD_REQUEST,
+                Json(serde_json::json!({"error": "No bind redo operations available"})),
+            ));
+        }
+    };
+
+    let mark_sql = format!(
+        "UPDATE {} SET is_undone = false, undone_at = NULL WHERE id = $1",
+        history_table
+    );
+
+    // Re-apply in chronological order, clearing each flag only after its snapshot was applied.
+    let mut affected_rows: i64 = 0;
+    for (history_id, _, after) in &records {
+        let identity_id_after = after.get("identity_id_after").cloned();
+        affected_rows +=
+            apply_bind_snapshot(pool, &face_table, after, identity_id_after).await?;
+
+        sqlx::query(&mark_sql)
+            .bind(history_id)
+            .execute(pool)
+            .await
+            .map_err(|e| {
+                (
+                    StatusCode::INTERNAL_SERVER_ERROR,
+                    Json(serde_json::json!({
+                        "error": format!("Failed to mark history as redone: {}", e)
+                    })),
+                )
+            })?;
+    }
+
+    Ok(Json(BindUndoResponse {
+        success: true,
+        identity_uuid: uuid_clean,
+        operation,
+        undone_count: records.len(),
+        affected_rows,
+    }))
+}
+
+/// One bind-history row as returned by `bind_history`.
+#[derive(Debug, Serialize)]
+struct BindHistoryItem {
+    /// Value of the history row's `id` column.
+    history_id: i64,
+    /// Value of the `operation` column; the query only selects 'bind', 'unbind' and 'bind_trace'.
+    operation: String,
+    /// Value of the `is_undone` column.
+    is_undone: bool,
+    /// Value of the `created_at` column, if set.
+    created_at: Option<chrono::DateTime<chrono::Utc>>,
+    /// Value of the `undone_at` column, if set.
+    undone_at: Option<chrono::DateTime<chrono::Utc>>,
+}
+
+/// JSON body returned by `bind_history` on success.
+#[derive(Debug, Serialize)]
+struct BindHistoryResponse {
+    /// Set to `true` by the handler; failures are reported through a separate error body.
+    success: bool,
+    /// Identity UUID from the request path with all dashes removed.
+    identity_uuid: String,
+    /// Sum of `undo_stack_count` and `redo_stack_count`.
+    total: i64,
+    /// Number of bind-type history rows with `is_undone = false`.
+    undo_stack_count: i64,
+    /// Number of bind-type history rows with `is_undone = true`.
+    redo_stack_count: i64,
+    /// The requested page of history rows, newest first.
+    results: Vec<BindHistoryItem>,
+}
+
+/// Query-string parameters accepted by `bind_history`.
+#[derive(Debug, Deserialize)]
+struct BindHistoryQuery {
+    /// Rows per page; the handler defaults it to 20 and keeps it within 1 to 100.
+    limit: Option<usize>,
+    /// 1-based page number; the handler defaults it to 1 and treats 0 as 1.
+    page: Option<usize>,
+}
+
+/// Returns one page of an identity's bind/unbind/bind_trace history, newest first
+/// (`GET /api/v1/identity/:identity_uuid/bind/history`).
+///
+/// `limit` defaults to 20 and is clamped to `1..=100`; `page` is 1-based, defaults to 1
+/// and is never below 1. The row offset is computed with saturating arithmetic, so an
+/// absurdly large `page` yields an empty page instead of an arithmetic overflow.
+///
+/// Besides the page of rows, the response carries the number of rows that are not undone
+/// (`undo_stack_count`), the number that are undone (`redo_stack_count`), and their sum
+/// as `total`.
+///
+/// # Errors
+/// * `404` - no identity with this UUID.
+/// * `500` - database failure.
+pub async fn bind_history(
+    State(state): State<crate::api::types::AppState>,
+    Path(identity_uuid): Path<String>,
+    Query(params): Query<BindHistoryQuery>,
+) -> Result<Json<BindHistoryResponse>, (StatusCode, Json<serde_json::Value>)> {
+    let uuid_clean = identity_uuid.replace('-', "");
+    let limit = params.limit.unwrap_or(20).clamp(1, 100);
+    let page = params.page.unwrap_or(1).max(1);
+    // `page` is caller-controlled: saturate instead of overflowing, and never let the
+    // conversion produce a negative OFFSET.
+    let offset = i64::try_from((page - 1).saturating_mul(limit)).unwrap_or(i64::MAX);
+    let id_table = crate::core::db::schema::table_name("identities");
+    let history_table = crate::core::db::schema::table_name("identity_history");
+
+    let identity_id: i32 = sqlx::query_scalar(&format!(
+        "SELECT id FROM {} WHERE REPLACE(uuid::text, '-', '') = $1",
+        id_table
+    ))
+    .bind(&uuid_clean)
+    .fetch_optional(state.db.pool())
+    .await
+    .map_err(|e| {
+        (
+            StatusCode::INTERNAL_SERVER_ERROR,
+            Json(serde_json::json!({"error": format!("DB error: {}", e)})),
+        )
+    })?
+    .ok_or((
+        StatusCode::NOT_FOUND,
+        Json(serde_json::json!({"error": "Identity not found"})),
+    ))?;
+
+    // Rows that can still be undone.
+    let undo_stack_count: i64 = sqlx::query_scalar(&format!(
+        "SELECT COUNT(*) FROM {} WHERE identity_id = $1 AND is_undone = false AND operation IN ('bind','unbind','bind_trace')",
+        history_table
+    ))
+    .bind(identity_id)
+    .fetch_one(state.db.pool())
+    .await
+    .map_err(|e| {
+        (
+            StatusCode::INTERNAL_SERVER_ERROR,
+            Json(serde_json::json!({"error": format!("DB error: {}", e)})),
+        )
+    })?;
+
+    // Rows that were undone and can be redone.
+    let redo_stack_count: i64 = sqlx::query_scalar(&format!(
+        "SELECT COUNT(*) FROM {} WHERE identity_id = $1 AND is_undone = true AND operation IN ('bind','unbind','bind_trace')",
+        history_table
+    ))
+    .bind(identity_id)
+    .fetch_one(state.db.pool())
+    .await
+    .map_err(|e| {
+        (
+            StatusCode::INTERNAL_SERVER_ERROR,
+            Json(serde_json::json!({"error": format!("DB error: {}", e)})),
+        )
+    })?;
+
+    let rows = sqlx::query(&format!(
+        "SELECT id, operation, is_undone, created_at, undone_at FROM {} WHERE identity_id = $1 AND operation IN ('bind','unbind','bind_trace') ORDER BY created_at DESC LIMIT $2 OFFSET $3",
+        history_table
+    ))
+    .bind(identity_id)
+    .bind(limit as i64)
+    .bind(offset)
+    .fetch_all(state.db.pool())
+    .await
+    .map_err(|e| {
+        (
+            StatusCode::INTERNAL_SERVER_ERROR,
+            Json(serde_json::json!({"error": format!("DB error: {}", e)})),
+        )
+    })?;
+
+    let results: Vec<BindHistoryItem> = rows
+        .into_iter()
+        .map(|r| BindHistoryItem {
+            history_id: r.get::<i64, _>("id"),
+            operation: r.get::<String, _>("operation"),
+            is_undone: r.get::<bool, _>("is_undone"),
+            created_at: r.get::<Option<chrono::DateTime<chrono::Utc>>, _>("created_at"),
+            undone_at: r.get::<Option<chrono::DateTime<chrono::Utc>>, _>("undone_at"),
+        })
+        .collect();
+
+    // Every bind-type row is either undone or not, so the two counts add up to the total.
+    let total = undo_stack_count + redo_stack_count;
+
+    Ok(Json(BindHistoryResponse {
+        success: true,
+        identity_uuid: uuid_clean,
+        total,
+        undo_stack_count,
+        redo_stack_count,
+        results,
+    }))
+}
+
 pub fn identity_binding_routes() -> Router<crate::api::types::AppState> {
     Router::new()
         .route("/api/v1/identity/:identity_uuid/bind", post(bind_identity))
@@ -579,4 +1828,13 @@ pub fn identity_binding_routes() -> Router<crate::api::types::AppState> {
             "/api/v1/identity/:identity_uuid/traces",
             get(get_identity_traces),
         )
+        .route("/api/v1/identity/:identity_uuid/bind/undo", post(bind_undo))
+        .route("/api/v1/identity/:identity_uuid/bind/redo", post(bind_redo))
+        .route(
+            "/api/v1/identity/:identity_uuid/bind/history",
+            get(bind_history),
+        )
+        .route("/api/v1/identity/merge/:merge_id/undo", post(undo_merge))
+        .route("/api/v1/identity/merge/:merge_id/redo", post(redo_merge))
+        .route("/api/v1/identity/merge/history", get(get_merge_history))
 }
diff --git a/src/api/media_api.rs b/src/api/media_api.rs
index 2150e2f..407b4fa 100644
--- a/src/api/media_api.rs
+++ b/src/api/media_api.rs
@@ -57,6 +57,10 @@ pub fn bbox_routes() -> Router<crate::api::types::AppState> {
             "/api/v1/file/:file_uuid/trace/:trace_id/video",
             get(trace_video),
         )
+        .route(
+            "/api/v1/file/:file_uuid/stranger/:stranger_id/video",
+            get(stranger_video),
+        )
         .route("/api/v1/file/:file_uuid/video", get(stream_video))
         .route("/api/v1/file/:file_uuid/thumbnail", get(face_thumbnail))
         .route("/api/v1/file/:file_uuid/clip", get(video_clip))
@@ -210,8 +214,9 @@ async fn bbox_overlay_video(
     let start_sec = start_f as f64 / fps;
 
     // Get face bboxes
+    // frame_number is BIGINT (i64) in database
     let face_table = schema::table_name("face_detections");
-    let rows: Vec<(i32, i32, i32, i32, i32, Option<i32>, Option<String>)> = sqlx::query_as(
+    let rows: Vec<(i64, i32, i32, i32, i32, Option<i32>, Option<String>)> = sqlx::query_as(
         &format!("SELECT frame_number, x, y, width, height, trace_id, face_id FROM {} WHERE file_uuid = $1 AND frame_number BETWEEN $2 AND $3 ORDER BY frame_number", face_table)
     )
     .bind(face_fuid).bind(start_f).bind(end_f)
@@ -222,7 +227,7 @@ async fn bbox_overlay_video(
     let mut parts: Vec<String> = Vec::new();
     for (frame, x, y, w, h, trace_id, _) in &rows {
         let text = format!("t{}", trace_id.unwrap_or(0));
-        let offset = frame - start_f;
+        let offset = (*frame as i32) - start_f;
         parts.push(format!(
             "drawbox=x={}:y={}:w={}:h={}:color=red@0.8:thickness=4:enable='eq(n,{})'",
             x, y, w, h, offset
@@ -300,6 +305,15 @@ async fn trace_video(
     State(state): State<crate::api::types::AppState>,
     Path((file_uuid, trace_id)): Path<(String, i32)>,
     Query(params): Query<std::collections::HashMap<String, String>>,
+) -> Result<impl IntoResponse, StatusCode> {
+    trace_video_inner(&state, &file_uuid, trace_id, &params).await
+}
+
+async fn trace_video_inner(
+    state: &crate::api::types::AppState,
+    file_uuid: &str,
+    trace_id: i32,
+    params: &std::collections::HashMap<String, String>,
 ) -> Result<impl IntoResponse, StatusCode> {
     use axum::http::header;
 
@@ -317,8 +331,9 @@ async fn trace_video(
     let (video_path, fps, _width, _height) = row.ok_or(StatusCode::NOT_FOUND)?;
 
     // Query face detections to find frame range for target trace
+    // frame_number is BIGINT (i64) in database
     let face_table = schema::table_name("face_detections");
-    let rows: Vec<(i32, i32, i32, i32, i32)> = sqlx::query_as(&format!(
+    let rows: Vec<(i64, i32, i32, i32, i32)> = sqlx::query_as(&format!(
         "SELECT frame_number, x, y, width, height FROM {} WHERE file_uuid = $1 AND trace_id = $2 ORDER BY frame_number",
         face_table
     ))
@@ -371,11 +386,12 @@ async fn trace_video(
 
     // === DEBUG MODE: text overlay, list all traces in frame range ===
     let start_fn = (start_sec * fps) as i32;
-    let end_fn = ((start_sec + duration) * fps) as i32;
+    let end_fn = ((start_sec + duration) * fps) as i64;
 
     // Query all traces with identity names and bbox positions in the visible frame range
+    // frame_number is BIGINT (i64) in database
     let identities_table = schema::table_name("identities");
-    let all_rows: Vec<(i32, i32, i32, i32, i32, i32, Option<String>)> = sqlx::query_as(&format!(
+    let all_rows: Vec<(i32, i64, i32, i32, i32, i32, Option<String>)> = sqlx::query_as(&format!(
         "SELECT fd.trace_id, fd.frame_number, fd.x, fd.y, fd.width, fd.height, i.name \
          FROM {} fd \
          LEFT JOIN {} i ON fd.identity_id = i.id \
@@ -391,9 +407,10 @@ async fn trace_video(
     .unwrap_or_default();
 
     // Group frames by trace_id, compute start_frame per trace; collect bbox per frame
-    let mut trace_frames: HashMap<i32, Vec<i32>> = HashMap::new();
+    // frame_number is i64 (BIGINT), so HashMaps need i64 for frame values
+    let mut trace_frames: HashMap<i32, Vec<i64>> = HashMap::new();
     let mut trace_identity: HashMap<i32, String> = HashMap::new();
-    let mut bbox_per_frame: HashMap<(i32, i32), (i32, i32, i32, i32)> = HashMap::new(); // (tid, fn) -> (x, y, w, h)
+    let mut bbox_per_frame: HashMap<(i32, i64), (i32, i32, i32, i32)> = HashMap::new(); // (tid, fn) -> (x, y, w, h)
     for (tid, fn_, x, y, w, h, name_opt) in &all_rows {
         trace_frames.entry(*tid).or_default().push(*fn_);
         bbox_per_frame.insert((*tid, *fn_), (*x, *y, *w, *h));
@@ -417,7 +434,7 @@ async fn trace_video(
     .unwrap_or_else(|| "-".to_string());
 
     // Sort traces for consistent ordering
-    let mut sorted_traces: Vec<(i32, &Vec<i32>)> =
+    let mut sorted_traces: Vec<(i32, &Vec<i64>)> =
         trace_frames.iter().map(|(k, v)| (*k, v)).collect();
     sorted_traces.sort_by_key(|(tid, _)| *tid);
 
@@ -695,6 +712,7 @@ struct ThumbQuery {
     y: Option<i32>,
     w: Option<i32>,
     h: Option<i32>,
+    trace_id: Option<i32>,
 }
 
 async fn face_thumbnail(
@@ -717,15 +735,70 @@ async fn face_thumbnail(
         }
     };
 
-    let row: Option<(String,)> = sqlx::query_as(&format!(
-        "SELECT file_path FROM {} WHERE file_uuid = $1",
+    // Step 1: Check for pre-stored face crop if trace_id is provided
+    if let Some(trace_id) = q.trace_id {
+        let output_dir = crate::core::config::OUTPUT_DIR.as_str();
+        let cached_path = std::path::PathBuf::from(output_dir)
+            .join(".faces")
+            .join(&file_uuid)
+            .join(trace_id.to_string())
+            .join(format!("{}.jpg", frame));
+
+        if cached_path.exists() {
+            tracing::debug!("[thumbnail] Using cached face crop: {}", cached_path.display());
+            let bytes = tokio::fs::read(&cached_path)
+                .await
+                .map_err(|e| {
+                    tracing::warn!("[thumbnail] Failed to read cached file: {}", e);
+                    StatusCode::INTERNAL_SERVER_ERROR
+                })?;
+
+            // Validate cached JPEG
+            crate::core::thumbnail::validator::validate_jpeg(&bytes).map_err(|e| {
+                tracing::warn!("[thumbnail] Cached JPEG validation failed: {}", e);
+                StatusCode::INTERNAL_SERVER_ERROR
+            })?;
+
+            return Ok(Response::builder()
+                .status(StatusCode::OK)
+                .header(header::CONTENT_TYPE, "image/jpeg")
+                .header(header::CACHE_CONTROL, "public, max-age=86400")
+                .body(Body::from(bytes))
+                .unwrap());
+        }
+        
+        // Cached file not found, fallback to ffmpeg
+        tracing::debug!("[thumbnail] Cached file not found, falling back to ffmpeg");
+    }
+
+    // Step 2: Fallback to ffmpeg on-demand extraction
+    let row: Option<(String, Option<i64>, Option<i32>, Option<i32>)> = sqlx::query_as(&format!(
+        "SELECT file_path, total_frames, width, height FROM {} WHERE file_uuid = $1",
         videos_table
     ))
     .bind(&file_uuid)
     .fetch_optional(state.db.pool())
     .await
     .map_err(|_| StatusCode::INTERNAL_SERVER_ERROR)?;
-    let (file_path,) = row.ok_or(StatusCode::NOT_FOUND)?;
+    let (file_path, total_frames, video_width, video_height) = row.ok_or(StatusCode::NOT_FOUND)?;
+
+    if let Some(total) = total_frames {
+        if total > 0 {
+            crate::core::thumbnail::validator::validate_frame(frame, total).map_err(|e| {
+                tracing::warn!("[thumbnail] Frame validation failed: {}", e);
+                StatusCode::BAD_REQUEST
+            })?;
+        }
+    }
+
+    if let (Some(x), Some(y), Some(w), Some(h)) = (q.x, q.y, q.w, q.h) {
+        if let (Some(vw), Some(vh)) = (video_width, video_height) {
+            crate::core::thumbnail::validator::validate_crop(x, y, w, h, vw, vh).map_err(|e| {
+                tracing::warn!("[thumbnail] Crop validation failed: {}", e);
+                StatusCode::BAD_REQUEST
+            })?;
+        }
+    }
 
     let select = format!("select=eq(n\\,{})", frame);
     let vf = if let (Some(x), Some(y), Some(w), Some(h)) = (q.x, q.y, q.w, q.h) {
@@ -755,6 +828,11 @@ async fn face_thumbnail(
         return Err(StatusCode::INTERNAL_SERVER_ERROR);
     }
 
+    crate::core::thumbnail::validator::validate_jpeg(&output.stdout).map_err(|e| {
+        tracing::warn!("[thumbnail] JPEG validation failed: {}", e);
+        StatusCode::INTERNAL_SERVER_ERROR
+    })?;
+
     Ok(Response::builder()
         .status(StatusCode::OK)
         .header(header::CONTENT_TYPE, "image/jpeg")
@@ -849,3 +927,127 @@ async fn video_clip(
         .body(Body::from(output.stdout))
         .unwrap())
 }
+
+async fn stranger_video(
+    State(app): State<crate::api::types::AppState>, // shared application state
+    Path((file_uuid, stranger_id)): Path<(String, i32)>, // the two path segments
+    Query(query): Query<std::collections::HashMap<String, String>>, // raw query pairs
+) -> Result<impl IntoResponse, StatusCode> {
+    stranger_video_inner(&app, &file_uuid, stranger_id, &query).await // extractor shim only
+}
+
+/// Cuts an MP4 clip spanning every detection of `stranger_id` in the video `file_uuid`.
+///
+/// The clip runs from the first to the last detected frame, widened by `padding` seconds
+/// (query parameter, default 2.0) on both sides and clamped to the start of the video.
+/// Streams are copied, not re-encoded; audio is dropped when `parse_video_params` reports
+/// `"off"`. Returns 404 for an unknown video or stranger and 500 for any other failure.
+async fn stranger_video_inner(
+    state: &crate::api::types::AppState,
+    file_uuid: &str,
+    stranger_id: i32,
+    params: &std::collections::HashMap<String, String>,
+) -> Result<impl IntoResponse, StatusCode> {
+    use axum::http::header;
+    use uuid::Uuid;
+
+    tracing::info!("[stranger_video] Starting for file={}, stranger={}", file_uuid, stranger_id);
+
+    // Only normal mode is supported here, so the parsed mode is deliberately unused.
+    let (_mode, audio) = parse_video_params(params);
+    let mute = audio == "off";
+
+    let videos_table = schema::table_name("videos");
+    let video: Option<(String, f64)> = sqlx::query_as(&format!(
+        "SELECT file_path, COALESCE(fps, 24.0) FROM {} WHERE file_uuid = $1",
+        videos_table
+    ))
+    .bind(file_uuid)
+    .fetch_optional(state.db.pool())
+    .await
+    .map_err(|e| {
+        tracing::error!("[stranger_video] Video query error: {}", e);
+        StatusCode::INTERNAL_SERVER_ERROR
+    })?;
+    let (video_path, db_fps) = video.ok_or_else(|| {
+        tracing::warn!("[stranger_video] Video not found for uuid={}", file_uuid);
+        StatusCode::NOT_FOUND
+    })?;
+    // COALESCE only covers NULL; a zero, negative or non-finite fps would yield inf/NaN times.
+    let fps = if db_fps.is_finite() && db_fps > 0.0 { db_fps } else { 24.0 };
+    tracing::info!("[stranger_video] Found video: path={}, fps={}", video_path, fps);
+
+    // Only the frame range is needed, so aggregate in SQL instead of loading (and decoding
+    // the bounding box of) every detection row.
+    let face_table = schema::table_name("face_detections");
+    let (first, last, faces): (Option<i64>, Option<i64>, i64) = sqlx::query_as(&format!(
+        "SELECT MIN(frame_number)::bigint, MAX(frame_number)::bigint, COUNT(*) \
+         FROM {} WHERE file_uuid = $1 AND stranger_id = $2",
+        face_table
+    ))
+    .bind(file_uuid)
+    .bind(stranger_id)
+    .fetch_one(state.db.pool())
+    .await
+    .map_err(|e| {
+        // A failed query is a server fault; it must not be reported as "no faces" (404).
+        tracing::error!("[stranger_video] Face query error: {}", e);
+        StatusCode::INTERNAL_SERVER_ERROR
+    })?;
+    tracing::info!("[stranger_video] Found {} faces", faces);
+
+    // MIN/MAX are NULL exactly when no row matched.
+    let (first_frame, last_frame) = first.zip(last).ok_or_else(|| {
+        tracing::warn!("[stranger_video] No faces found for stranger_id={}", stranger_id);
+        StatusCode::NOT_FOUND
+    })?;
+
+    let padding = params
+        .get("padding")
+        .and_then(|raw| raw.parse::<f64>().ok())
+        // "NaN", "inf" and negative numbers parse successfully but make no sense here.
+        .filter(|secs| secs.is_finite() && *secs >= 0.0)
+        .unwrap_or(2.0);
+    let seek = (first_frame as f64 / fps - padding).max(0.0);
+    // Measured from the clamped seek point, so a clip starting near 0 does not run more
+    // than `padding` seconds past the last detection.
+    let duration = last_frame as f64 / fps + padding - seek;
+    tracing::info!("[stranger_video] Frame range: {} - {}, time: {:.2}s - {:.2}s",
+        first_frame, last_frame, seek, seek + duration);
+
+    let tmp = std::env::temp_dir().join(format!("stranger_{}.mp4", Uuid::new_v4()));
+    let out_path = tmp.clone();
+    // `.output()` blocks until ffmpeg exits, so run it off the async worker threads.
+    let run = tokio::task::spawn_blocking(move || {
+        let (ss, t) = (seek.to_string(), duration.to_string());
+        let mut cmd = ffmpeg_cmd();
+        cmd.args(["-ss", &ss, "-i", &video_path, "-t", &t, "-c", "copy"]);
+        if mute {
+            cmd.arg("-an");
+        }
+        // Pass the path itself so a non-UTF-8 temp dir cannot degrade to an empty argument.
+        cmd.arg("-y").arg(&out_path).output()
+    })
+    .await;
+
+    let data: Result<Vec<u8>, String> = match run {
+        Ok(Ok(out)) if out.status.success() => {
+            tokio::fs::read(&tmp).await.map_err(|e| format!("Read output error: {}", e))
+        }
+        Ok(Ok(out)) => Err(format!("ffmpeg failed: {}", String::from_utf8_lossy(&out.stderr))),
+        Ok(Err(e)) => Err(format!("ffmpeg spawn error: {}", e)),
+        Err(e) => Err(format!("ffmpeg task failed: {}", e)),
+    };
+    // Best-effort cleanup on every path; a failed ffmpeg run may leave a partial file.
+    let _ = tokio::fs::remove_file(&tmp).await;
+    let data = data.map_err(|msg| {
+        tracing::error!("[stranger_video] {}", msg);
+        StatusCode::INTERNAL_SERVER_ERROR
+    })?;
+    tracing::info!("[stranger_video] Returning video, size: {} bytes", data.len());
+    Ok(Response::builder()
+        .header(header::CONTENT_TYPE, "video/mp4")
+        .header(header::CONTENT_LENGTH, data.len())
+        .body(Body::from(data))
+        .expect("static header names and values are always valid"))
+}
diff --git a/src/api/mod.rs b/src/api/mod.rs
index d3d36b6..f348fa2 100644
--- a/src/api/mod.rs
+++ b/src/api/mod.rs
@@ -4,7 +4,6 @@ pub mod auth;
 pub mod docs;
 pub mod files;
 pub mod five_w1h_agent_api;
-pub mod processing;
 pub mod health;
 pub mod identities;
 pub mod identity_agent_api;
@@ -12,6 +11,7 @@ pub mod identity_api;
 pub mod identity_binding;
 pub mod media_api;
 pub mod middleware;
+pub mod processing;
 pub mod scan;
 pub mod search;
 pub mod server;
@@ -19,7 +19,5 @@ pub mod tmdb_api;
 pub mod trace_agent_api;
 pub mod types;
 pub mod universal_search;
-pub mod visual_chunk_search;
-pub mod visual_search;
 
 pub use server::start_server;
diff --git a/src/api/processing.rs b/src/api/processing.rs
index 4ef2f66..d286803 100644
--- a/src/api/processing.rs
+++ b/src/api/processing.rs
@@ -233,50 +233,54 @@ async fn trigger_processing(
         .await
         .map_err(|_| StatusCode::INTERNAL_SERVER_ERROR)?;
 
-    let processors_to_run: Vec<&str> = if let Some(procs) = &req.processors {
-        // 檢查 job 是否存在，不存在則 INSERT（state machine entry）
-        let existing_id: Option<i32> = sqlx::query_scalar(&format!(
-            "SELECT id FROM {monitor_jobs_table} WHERE uuid = $1"
-        ))
-        .bind(&file_uuid)
-        .fetch_optional(state.db.pool())
-        .await
-        .map_err(|_| StatusCode::INTERNAL_SERVER_ERROR)?;
-
-        if existing_id.is_none() {
-            state
-                .db
-                .create_monitor_job(&file_uuid, Some(&file_path))
-                .await
-                .map_err(|e| {
-                    tracing::error!(
-                        "[TRIGGER] Failed to create monitor job for {}: {}",
-                        file_uuid,
-                        e
-                    );
-                    StatusCode::INTERNAL_SERVER_ERROR
-                })?;
-        }
-
-        // UPDATE processors + reset 狀態讓 worker 可 pickup
-        let procs_db: Vec<String> = procs.iter().map(|s| s.to_string()).collect();
-        sqlx::query(&format!(
-            "UPDATE {monitor_jobs_table} SET processors = $1::text[], status = 'pending' WHERE uuid = $2"
-        ))
-        .bind(&procs_db)
-        .bind(&file_uuid)
-        .execute(state.db.pool())
-        .await
-        .map_err(|e| {
-            tracing::error!("[TRIGGER] Failed to update monitor job for {}: {}", file_uuid, e);
-            StatusCode::INTERNAL_SERVER_ERROR
-        })?;
-
-        procs.iter().map(|s| s.as_str()).collect()
+    let processors_to_run: Vec<String> = if let Some(procs) = &req.processors {
+        procs.iter().map(|s| s.to_string()).collect()
     } else {
-        vec![]
+        crate::core::db::ProcessorType::all()
+            .iter()
+            .map(|p| p.as_str().to_string())
+            .collect()
     };
 
+    // 確保 monitor_job 存在
+    let existing_id: Option<i32> = sqlx::query_scalar(&format!(
+        "SELECT id FROM {monitor_jobs_table} WHERE uuid = $1"
+    ))
+    .bind(&file_uuid)
+    .fetch_optional(state.db.pool())
+    .await
+    .map_err(|_| StatusCode::INTERNAL_SERVER_ERROR)?;
+
+    if existing_id.is_none() {
+        state
+            .db
+            .create_monitor_job(&file_uuid, Some(&file_path))
+            .await
+            .map_err(|e| {
+                tracing::error!(
+                    "[TRIGGER] Failed to create monitor job for {}: {}",
+                    file_uuid,
+                    e
+                );
+                StatusCode::INTERNAL_SERVER_ERROR
+            })?;
+    }
+
+    // UPDATE processors + reset 狀態讓 worker 可 pickup
+    sqlx::query(&format!(
+        "UPDATE {monitor_jobs_table} SET processors = $1::text[], status = 'pending' WHERE uuid = $2"
+    ))
+    .bind(&processors_to_run)
+    .bind(&file_uuid)
+    .execute(state.db.pool())
+    .await
+    .map_err(|e| {
+        tracing::error!("[TRIGGER] Failed to update monitor job for {}: {}", file_uuid, e);
+        StatusCode::INTERNAL_SERVER_ERROR
+    })?;
+
+    let processors_to_run_refs: Vec<&str> = processors_to_run.iter().map(|s| s.as_str()).collect();
+
     let notification = serde_json::json!({
         "action": "process",
         "file_uuid": file_uuid,
@@ -285,7 +289,7 @@ async fn trigger_processing(
         "file_type": file_type,
         "content_hash": content_hash,
         "output_dir": output_dir,
-        "processors": processors_to_run,
+        "processors": processors_to_run_refs,
     });
 
     let notification_key = format!("{}notifications", REDIS_KEY_PREFIX.as_str());
diff --git a/src/api/scan.rs b/src/api/scan.rs
index a875aef..26853a5 100644
--- a/src/api/scan.rs
+++ b/src/api/scan.rs
@@ -414,8 +414,6 @@ async fn get_ingestion_status(
         "SELECT COUNT(*) FROM {} WHERE file_uuid = '{file_uuid}'",
         schema::table_name("tkg_edges")
     ));
-    let scene_5w1h = count_sql!(&format!("SELECT COUNT(*) FROM {chunk} WHERE file_uuid = '{file_uuid}' AND chunk_type = 'cut' AND summary_text IS NOT NULL AND summary_text != ''"));
-
     let related_identities: Vec<IdentityRef> =
         match sqlx::query_as::<_, (String, String)>(&format!(
             "SELECT DISTINCT i.uuid::text, i.name FROM {identities} i \
@@ -491,11 +489,6 @@ async fn get_ingestion_status(
             Some(format!("{identity_count} identities matched"))
         ),
         step!("scene_metadata", scene_meta_ok, None),
-        step!(
-            "5w1h",
-            scene_5w1h > 0,
-            Some(format!("{scene_5w1h} scenes with 5W1H"))
-        ),
     ];
 
     Ok(Json(IngestionStatusResponse {
diff --git a/src/api/server.rs b/src/api/server.rs
index 1fdd558..8512b33 100644
--- a/src/api/server.rs
+++ b/src/api/server.rs
@@ -5,7 +5,7 @@ use tokio::time::timeout;
 use tower_http::cors::{Any, CorsLayer};
 
 use crate::core::cache::{MongoCache, RedisCache};
-use crate::core::db::{Database, PostgresDb};
+use crate::core::db::{Database, PostgresDb, QdrantDb};
 use crate::Embedder;
 
 use super::agent_api;
@@ -14,7 +14,6 @@ use super::auth;
 use super::docs;
 use super::files;
 use super::five_w1h_agent_api;
-use super::processing;
 use super::health;
 use super::identities;
 use super::identity_agent_api;
@@ -22,18 +21,18 @@ use super::identity_api;
 use super::identity_binding;
 use super::media_api;
 use super::middleware::unified_auth;
+use super::processing;
 use super::scan;
 use super::search::search_routes;
 use super::tmdb_api;
 use super::trace_agent_api;
 use super::types::AppState;
 use super::universal_search::universal_search_routes;
-use super::visual_search;
 
 pub async fn start_server(host: &str, port: u16) -> anyhow::Result<()> {
     health::init_server_state(host, port);
 
-    let embedder = std::sync::Arc::new(Embedder::new("nomic-embed-text-v2-moe:latest".to_string()));
+    let embedder = std::sync::Arc::new(Embedder::new("embeddinggemma-300m".to_string()));
 
     // ── ⚠️ WARNING: DO NOT move MongoCache::init() back to critical path ──
     //
@@ -57,6 +56,9 @@ pub async fn start_server(host: &str, port: u16) -> anyhow::Result<()> {
     let redis_cache = RedisCache::new()?;
     let db = PostgresDb::init().await?;
 
+    // Run migrations (create identity_history table if not exists)
+    PostgresDb::run_migrations(db.pool()).await?;
+
     let schema_health = health::check_schema_migrations(db.pool()).await;
     if schema_health.ok {
         tracing::info!(
@@ -89,8 +91,10 @@ pub async fn start_server(host: &str, port: u16) -> anyhow::Result<()> {
     let db = std::sync::Arc::new(db);
     let api_state = super::middleware::ApiState { db: db.clone() };
 
+    let qdrant = std::sync::Arc::new(QdrantDb::new());
     let state = AppState {
         db,
+        qdrant,
         embedder,
         embedder_model: "nomic-embed-text-v2-moe:latest".to_string(),
         mongo_cache,
@@ -129,7 +133,6 @@ pub async fn start_server(host: &str, port: u16) -> anyhow::Result<()> {
         .merge(auth::auth_routes())
         .merge(health::health_routes())
         .merge(docs::doc_routes())
-        .merge(visual_search::visual_search_routes())
         .merge(protected_routes)
         .layer(cors)
         .with_state(state);
diff --git a/src/api/trace_agent_api.rs b/src/api/trace_agent_api.rs
index d6e946e..ffff929 100644
--- a/src/api/trace_agent_api.rs
+++ b/src/api/trace_agent_api.rs
@@ -25,14 +25,19 @@ pub fn trace_agent_routes() -> Router<crate::api::types::AppState> {
             "/api/v1/file/:file_uuid/trace/:trace_id/thumbnail",
             get(get_trace_thumbnail),
         )
+        .route(
+            "/api/v1/file/:file_uuid/stranger/:stranger_id/representative-face",
+            get(get_stranger_representative_face),
+        )
+        .route(
+            "/api/v1/file/:file_uuid/stranger/:stranger_id/thumbnail",
+            get(get_stranger_thumbnail),
+        )
         .route(
             "/api/v1/file/:file_uuid/identities/:identity_uuid_a/co-occur-with/:identity_uuid_b",
             get(get_cooccurrence),
         )
-        .route(
-            "/api/v1/file/:file_uuid/tkg/rebuild",
-            post(rebuild_tkg),
-        )
+        .route("/api/v1/file/:file_uuid/tkg/rebuild", post(rebuild_tkg))
         .route(
             "/api/v1/file/:file_uuid/representative-frame",
             get(get_representative_frame),
@@ -54,8 +59,8 @@ struct TracesRequest {
 struct TraceInfo {
     trace_id: i32,
     face_count: i64,
-    start_frame: i32,
-    end_frame: i32,
+    start_frame: i64,
+    end_frame: i64,
     start_time: f64,
     end_time: f64,
     duration_sec: f64,
@@ -110,8 +115,8 @@ async fn list_traces_sorted(
         "SELECT tt.*, fd.id AS sample_face_id FROM (
             SELECT trace_id::int AS trace_id,
                    COUNT(*) AS face_count,
-                   MIN(frame_number)::int AS start_frame,
-                   MAX(frame_number)::int AS end_frame,
+                   MIN(frame_number)::bigint AS start_frame,
+                   MAX(frame_number)::bigint AS end_frame,
                    (MAX(frame_number) - MIN(frame_number))::float8 AS duration_sec,
                    AVG(confidence)::float8 AS avg_confidence
             FROM {}
@@ -132,7 +137,7 @@ async fn list_traces_sorted(
         crate::core::db::schema::table_name("face_detections"),
     );
 
-    let rows: Vec<(i32, i64, i32, i32, f64, f64, Option<i32>)> = sqlx::query_as(&query)
+    let rows: Vec<(i32, i64, i64, i64, f64, f64, Option<i32>)> = sqlx::query_as(&query)
         .bind(&file_uuid)
         .bind(min_faces)
         .bind(effective_limit)
@@ -193,8 +198,8 @@ struct TraceFacesQuery {
 #[derive(Debug, Serialize)]
 struct TraceFaceItem {
     id: i32,
-    start_frame: i32,
-    end_frame: i32,
+    start_frame: i64,
+    end_frame: i64,
     start_time: f64,
     end_time: f64,
     x: Option<i32>,
@@ -260,14 +265,14 @@ async fn list_trace_faces(
 
     let rows: Vec<(
         i32,
-        i32,
+        i64,
         Option<i32>,
         Option<i32>,
         Option<i32>,
         Option<i32>,
         f32,
     )> = sqlx::query_as(&format!(
-        "SELECT id, frame_number::int, x, y, width, height, confidence::float4 \
+        "SELECT id, frame_number, x, y, width, height, confidence::float4 \
                    FROM {} WHERE file_uuid = $1 AND trace_id = $2 \
                    ORDER BY frame_number ASC LIMIT $3 OFFSET $4",
         crate::core::db::schema::table_name("face_detections")
@@ -405,7 +410,8 @@ where
     let video_table = schema::table_name("videos");
 
     let fps: f64 = sqlx::query_scalar(&format!(
-        "SELECT COALESCE(fps, 25.0) FROM {} WHERE file_uuid = $1", video_table
+        "SELECT COALESCE(fps, 25.0) FROM {} WHERE file_uuid = $1",
+        video_table
     ))
     .bind(file_uuid)
     .fetch_optional(pool)
@@ -414,7 +420,8 @@ where
     .unwrap_or(25.0);
 
     let face_count: (i64,) = sqlx::query_as(&format!(
-        "SELECT COUNT(*) FROM {} WHERE file_uuid = $1 AND trace_id = $2", fd_table
+        "SELECT COUNT(*) FROM {} WHERE file_uuid = $1 AND trace_id = $2",
+        fd_table
     ))
     .bind(file_uuid)
     .bind(trace_id)
@@ -422,7 +429,15 @@ where
     .await
     .map_err(|e| err_fn(anyhow::anyhow!("{}", e)))?;
 
-    struct Candidate { frame: i64, x: i32, y: i32, w: i32, h: i32, conf: f64, score: f64 }
+    struct Candidate {
+        frame: i64,
+        x: i32,
+        y: i32,
+        w: i32,
+        h: i32,
+        conf: f64,
+        score: f64,
+    }
 
     let rows = sqlx::query_as::<_, (i64, i32, i32, i32, i32, f64)>(&format!(
         "SELECT frame_number::bigint, x, y, width, height, confidence::float8 \
@@ -431,7 +446,8 @@ where
          ORDER BY (width::float8 * height::float8) * confidence::float8 DESC LIMIT 10",
         fd_table
     ))
-    .bind(file_uuid).bind(trace_id)
+    .bind(file_uuid)
+    .bind(trace_id)
     .fetch_all(pool)
     .await
     .map_err(|e| err_fn(anyhow::anyhow!("{}", e)))?;
@@ -440,15 +456,25 @@ where
         return Err(err_fn(anyhow::anyhow!("No suitable face found")));
     }
 
-    let candidates: Vec<Candidate> = rows.into_iter()
+    let candidates: Vec<Candidate> = rows
+        .into_iter()
         .map(|(frame, x, y, w, h, conf)| {
             let score = (w as f64 * h as f64) * conf;
-            Candidate { frame, x, y, w, h, conf, score }
+            Candidate {
+                frame,
+                x,
+                y,
+                w,
+                h,
+                conf,
+                score,
+            }
         })
         .collect();
 
     let video_path: String = sqlx::query_scalar(&format!(
-        "SELECT file_path FROM {} WHERE file_uuid = $1", video_table
+        "SELECT file_path FROM {} WHERE file_uuid = $1",
+        video_table
     ))
     .bind(file_uuid)
     .fetch_optional(pool)
@@ -463,16 +489,31 @@ where
     for (i, c) in candidates.iter().enumerate() {
         let seek = c.frame as f64 / fps;
         if let Ok(output) = tokio::process::Command::new("ffmpeg")
-            .args(["-ss", &format!("{:.2}", seek), "-i", &video_path,
-                   "-vframes", "1", "-vf", &format!("crop={}:{}:{}:{},blurdetect", c.w, c.h, c.x, c.y),
-                   "-f", "null", "-"])
-            .output().await
+            .args([
+                "-ss",
+                &format!("{:.2}", seek),
+                "-i",
+                &video_path,
+                "-vframes",
+                "1",
+                "-vf",
+                &format!("crop={}:{}:{}:{},blurdetect", c.w, c.h, c.x, c.y),
+                "-f",
+                "null",
+                "-",
+            ])
+            .output()
+            .await
         {
             let stderr = String::from_utf8_lossy(&output.stderr);
             for line in stderr.lines() {
                 if let Some(blur_str) = line.split("blur mean: ").nth(1) {
                     if let Ok(blur) = blur_str.trim().parse::<f64>() {
-                        if blur < best_blur { best_blur = blur; best = c.frame; best_idx = i; }
+                        if blur < best_blur {
+                            best_blur = blur;
+                            best = c.frame;
+                            best_idx = i;
+                        }
                     }
                 }
             }
@@ -481,9 +522,17 @@ where
 
     let chosen = &candidates[best_idx];
     Ok(RepFaceSelection {
-        frame: chosen.frame, x: chosen.x, y: chosen.y, w: chosen.w, h: chosen.h,
-        conf: chosen.conf, blur: best_blur, score: chosen.score,
-        video_path, fps, face_count: face_count.0,
+        frame: chosen.frame,
+        x: chosen.x,
+        y: chosen.y,
+        w: chosen.w,
+        h: chosen.h,
+        conf: chosen.conf,
+        blur: best_blur,
+        score: chosen.score,
+        video_path,
+        fps,
+        face_count: face_count.0,
     })
 }
 
@@ -491,19 +540,36 @@ async fn get_representative_face(
     State(state): State<crate::api::types::AppState>,
     Path((file_uuid, trace_id)): Path<(String, i32)>,
 ) -> Result<Json<RepFaceResponse>, (StatusCode, Json<serde_json::Value>)> {
-    let sel = select_rep_face(state.db.pool(), &file_uuid, trace_id, |e| {
-        (StatusCode::INTERNAL_SERVER_ERROR, Json(serde_json::json!({"error": e.to_string()})))
-    }).await?;
+    get_representative_face_inner(&state, &file_uuid, trace_id).await
+}
+
+async fn get_representative_face_inner(
+    state: &crate::api::types::AppState,
+    file_uuid: &str,
+    trace_id: i32,
+) -> Result<Json<RepFaceResponse>, (StatusCode, Json<serde_json::Value>)> {
+    let sel = select_rep_face(state.db.pool(), file_uuid, trace_id, |e| {
+        (
+            StatusCode::INTERNAL_SERVER_ERROR,
+            Json(serde_json::json!({"error": e.to_string()})),
+        )
+    })
+    .await?;
 
     Ok(Json(RepFaceResponse {
         success: true,
-        file_uuid,
+        file_uuid: file_uuid.to_string(),
         trace_id,
         face_count: sel.face_count,
         representative: RepFaceResult {
             frame_number: sel.frame,
             timestamp_secs: sel.frame as f64 / sel.fps,
-            bbox: RepFaceBbox { x: sel.x, y: sel.y, width: sel.w, height: sel.h },
+            bbox: RepFaceBbox {
+                x: sel.x,
+                y: sel.y,
+                width: sel.w,
+                height: sel.h,
+            },
             confidence: sel.conf,
             quality_score: sel.score,
             blur_score: sel.blur,
@@ -515,34 +581,118 @@ async fn get_trace_thumbnail(
     State(state): State<crate::api::types::AppState>,
     Path((file_uuid, trace_id)): Path<(String, i32)>,
 ) -> Result<Response, (StatusCode, Json<serde_json::Value>)> {
+    get_trace_thumbnail_inner(&state, &file_uuid, trace_id).await
+}
+
+async fn get_trace_thumbnail_inner(
+    state: &crate::api::types::AppState,
+    file_uuid: &str,
+    trace_id: i32,
+) -> Result<Response, (StatusCode, Json<serde_json::Value>)> {
+    // Step 1: Check for pre-stored face crops in .faces/{file_uuid}/{trace_id}/
+    // For trace_id=0 (untracked/stranger), check unbound directory instead
+    let output_dir = crate::core::config::OUTPUT_DIR.as_str();
+    let trace_id_str = trace_id.to_string();
+    let trace_dir_name = if trace_id == 0 { "unbound" } else { &trace_id_str };
+    let trace_dir = std::path::PathBuf::from(output_dir)
+        .join(".faces")
+        .join(&file_uuid)
+        .join(trace_dir_name);
+
+    if trace_dir.exists() {
+        // Find any cached face crop in this trace directory
+        if let Ok(mut entries) = std::fs::read_dir(&trace_dir) {
+            while let Some(Ok(entry)) = entries.next() {
+                let path = entry.path();
+                if path.extension().map_or(false, |e| e == "jpg") {
+                    tracing::info!("[trace_thumbnail] Using cached face crop: {}", path.display());
+                    let bytes = tokio::fs::read(&path)
+                        .await
+                        .map_err(|e| {
+                            (
+                                StatusCode::INTERNAL_SERVER_ERROR,
+                                Json(serde_json::json!({"error": e.to_string()})),
+                            )
+                        })?;
+
+                    // Validate cached JPEG
+                    crate::core::thumbnail::validator::validate_jpeg(&bytes).map_err(|e| {
+                        tracing::warn!("[trace_thumbnail] Cached JPEG validation failed: {}", e);
+                        (
+                            StatusCode::INTERNAL_SERVER_ERROR,
+                            Json(serde_json::json!({"error": "Invalid cached JPEG"})),
+                        )
+                    })?;
+
+                    return Ok(Response::builder()
+                        .status(StatusCode::OK)
+                        .header(header::CONTENT_TYPE, "image/jpeg")
+                        .header(header::CACHE_CONTROL, "public, max-age=86400")
+                        .body(Body::from(bytes))
+                        .unwrap());
+                }
+            }
+        }
+    }
+
+    // Step 2: Fallback to ffmpeg on-demand extraction
     let sel = select_rep_face(state.db.pool(), &file_uuid, trace_id, |e| {
-        (StatusCode::INTERNAL_SERVER_ERROR, Json(serde_json::json!({"error": e.to_string()})))
-    }).await?;
+        (
+            StatusCode::INTERNAL_SERVER_ERROR,
+            Json(serde_json::json!({"error": e.to_string()})),
+        )
+    })
+    .await?;
 
     let seek = sel.frame as f64 / sel.fps;
     let tmp = std::env::temp_dir().join(format!("trace_{}_{}.jpg", file_uuid, trace_id));
 
+    tracing::debug!("[trace_thumbnail] Fallback to ffmpeg for trace {} frame {}", trace_id, sel.frame);
+
     let status = tokio::process::Command::new("ffmpeg")
         .args([
-            "-ss", &format!("{:.2}", seek),
-            "-i", &sel.video_path,
-            "-vframes", "1",
-            "-vf", &format!("crop={}:{}:{}:{},scale=320:320", sel.w, sel.h, sel.x, sel.y),
-            "-q:v", "2",
-            "-y", &tmp.to_string_lossy().to_string(),
+            "-ss",
+            &format!("{:.2}", seek),
+            "-i",
+            &sel.video_path,
+            "-vframes",
+            "1",
+            "-vf",
+            &format!("crop={}:{}:{}:{},scale=320:320", sel.w, sel.h, sel.x, sel.y),
+            "-q:v",
+            "2",
+            "-y",
+            &tmp.to_string_lossy().to_string(),
         ])
         .output()
         .await
         .map_err(|e| {
-            (StatusCode::INTERNAL_SERVER_ERROR, Json(serde_json::json!({"error": e.to_string()})))
+            (
+                StatusCode::INTERNAL_SERVER_ERROR,
+                Json(serde_json::json!({"error": e.to_string()})),
+            )
         })?;
 
     if !status.status.success() {
-        return Err((StatusCode::INTERNAL_SERVER_ERROR, Json(serde_json::json!({"error": "FFmpeg failed"}))));
+        return Err((
+            StatusCode::INTERNAL_SERVER_ERROR,
+            Json(serde_json::json!({"error": "FFmpeg failed"})),
+        ));
     }
 
     let bytes = tokio::fs::read(&tmp).await.map_err(|e| {
-        (StatusCode::INTERNAL_SERVER_ERROR, Json(serde_json::json!({"error": e.to_string()})))
+        (
+            StatusCode::INTERNAL_SERVER_ERROR,
+            Json(serde_json::json!({"error": e.to_string()})),
+        )
+    })?;
+
+    crate::core::thumbnail::validator::validate_jpeg(&bytes).map_err(|e| {
+        tracing::warn!("[trace_thumbnail] JPEG validation failed: {}", e);
+        (
+            StatusCode::INTERNAL_SERVER_ERROR,
+            Json(serde_json::json!({"error": "Invalid JPEG output"})),
+        )
     })?;
 
     let _ = tokio::fs::remove_file(&tmp).await;
@@ -605,10 +755,16 @@ async fn get_cooccurrence(
     .fetch_optional(state.db.pool())
     .await
     .map_err(|e| {
-        (StatusCode::INTERNAL_SERVER_ERROR, Json(serde_json::json!({"error": e.to_string()})))
+        (
+            StatusCode::INTERNAL_SERVER_ERROR,
+            Json(serde_json::json!({"error": e.to_string()})),
+        )
     })?
     .ok_or_else(|| {
-        (StatusCode::NOT_FOUND, Json(serde_json::json!({"error": "Identity A not found"})))
+        (
+            StatusCode::NOT_FOUND,
+            Json(serde_json::json!({"error": "Identity A not found"})),
+        )
     })?;
 
     let id_b = sqlx::query_as::<_, (i32, String)>(&format!(
@@ -619,31 +775,38 @@ async fn get_cooccurrence(
     .fetch_optional(state.db.pool())
     .await
     .map_err(|e| {
-        (StatusCode::INTERNAL_SERVER_ERROR, Json(serde_json::json!({"error": e.to_string()})))
+        (
+            StatusCode::INTERNAL_SERVER_ERROR,
+            Json(serde_json::json!({"error": e.to_string()})),
+        )
     })?
     .ok_or_else(|| {
-        (StatusCode::NOT_FOUND, Json(serde_json::json!({"error": "Identity B not found"})))
+        (
+            StatusCode::NOT_FOUND,
+            Json(serde_json::json!({"error": "Identity B not found"})),
+        )
     })?;
 
     // Stage 2: Find first frame where both identity_ids appear
-    let cooccur: Option<(i64,)> = sqlx::query_as(
-        &format!(
-            "SELECT MIN(fd.frame_number)::bigint FROM {} fd \
+    let cooccur: Option<(i64,)> = sqlx::query_as(&format!(
+        "SELECT MIN(fd.frame_number)::bigint FROM {} fd \
              WHERE fd.file_uuid = $1 AND fd.identity_id = $2 \
              AND fd.frame_number IN ( \
                SELECT frame_number FROM {} \
                WHERE file_uuid = $1 AND identity_id = $3 \
              )",
-            fd_table, fd_table
-        )
-    )
+        fd_table, fd_table
+    ))
     .bind(&file_uuid)
     .bind(id_a.0)
     .bind(id_b.0)
     .fetch_optional(state.db.pool())
     .await
     .map_err(|e| {
-        (StatusCode::INTERNAL_SERVER_ERROR, Json(serde_json::json!({"error": e.to_string()})))
+        (
+            StatusCode::INTERNAL_SERVER_ERROR,
+            Json(serde_json::json!({"error": e.to_string()})),
+        )
     })?;
 
     let (first_frame,) = cooccur.ok_or_else(|| {
@@ -653,13 +816,17 @@ async fn get_cooccurrence(
     // Get fps for timestamp
     let video_table = schema::table_name("videos");
     let fps: f64 = sqlx::query_scalar(&format!(
-        "SELECT COALESCE(fps, 25.0) FROM {} WHERE file_uuid = $1", video_table
+        "SELECT COALESCE(fps, 25.0) FROM {} WHERE file_uuid = $1",
+        video_table
     ))
     .bind(&file_uuid)
     .fetch_optional(state.db.pool())
     .await
     .map_err(|e| {
-        (StatusCode::INTERNAL_SERVER_ERROR, Json(serde_json::json!({"error": e.to_string()})))
+        (
+            StatusCode::INTERNAL_SERVER_ERROR,
+            Json(serde_json::json!({"error": e.to_string()})),
+        )
     })?
     .unwrap_or(25.0);
 
@@ -685,40 +852,67 @@ async fn get_cooccurrence(
     // Stage 4: Get representative faces for both traces (reusing select_rep_face)
     let rep_a = if let Some((tid,)) = trace_a {
         select_rep_face(state.db.pool(), &file_uuid, tid, |e| {
-            (StatusCode::INTERNAL_SERVER_ERROR, Json(serde_json::json!({"error": e.to_string()})))
-        }).await.ok().map(|sel| CoOccurRepFace {
+            (
+                StatusCode::INTERNAL_SERVER_ERROR,
+                Json(serde_json::json!({"error": e.to_string()})),
+            )
+        })
+        .await
+        .ok()
+        .map(|sel| CoOccurRepFace {
             frame_number: sel.frame,
-            bbox: RepFaceBbox { x: sel.x, y: sel.y, width: sel.w, height: sel.h },
+            bbox: RepFaceBbox {
+                x: sel.x,
+                y: sel.y,
+                width: sel.w,
+                height: sel.h,
+            },
             confidence: sel.conf,
             thumbnail_url: format!("/api/v1/file/{}/trace/{}/thumbnail", file_uuid, tid),
         })
-    } else { None };
+    } else {
+        None
+    };
 
     let rep_b = if let Some((tid,)) = trace_b {
         select_rep_face(state.db.pool(), &file_uuid, tid, |e| {
-            (StatusCode::INTERNAL_SERVER_ERROR, Json(serde_json::json!({"error": e.to_string()})))
-        }).await.ok().map(|sel| CoOccurRepFace {
+            (
+                StatusCode::INTERNAL_SERVER_ERROR,
+                Json(serde_json::json!({"error": e.to_string()})),
+            )
+        })
+        .await
+        .ok()
+        .map(|sel| CoOccurRepFace {
             frame_number: sel.frame,
-            bbox: RepFaceBbox { x: sel.x, y: sel.y, width: sel.w, height: sel.h },
+            bbox: RepFaceBbox {
+                x: sel.x,
+                y: sel.y,
+                width: sel.w,
+                height: sel.h,
+            },
             confidence: sel.conf,
             thumbnail_url: format!("/api/v1/file/{}/trace/{}/thumbnail", file_uuid, tid),
         })
-    } else { None };
+    } else {
+        None
+    };
 
     // Total co-occurrence frames (from TKG if available, otherwise from face_detections)
-    let total_cooccurrence_frames: i64 = sqlx::query_scalar(
-        &format!(
-            "SELECT COUNT(DISTINCT fd.frame_number)::bigint FROM {} fd \
+    let total_cooccurrence_frames: i64 = sqlx::query_scalar(&format!(
+        "SELECT COUNT(DISTINCT fd.frame_number)::bigint FROM {} fd \
              WHERE fd.file_uuid = $1 AND fd.identity_id = $2 \
              AND fd.frame_number IN ( \
                SELECT frame_number FROM {} \
                WHERE file_uuid = $1 AND identity_id = $3 \
              )",
-            fd_table, fd_table
-        )
-    )
-    .bind(&file_uuid).bind(id_a.0).bind(id_b.0)
-    .fetch_one(state.db.pool()).await
+        fd_table, fd_table
+    ))
+    .bind(&file_uuid)
+    .bind(id_a.0)
+    .bind(id_b.0)
+    .fetch_one(state.db.pool())
+    .await
     .unwrap_or(0);
 
     Ok(Json(CoOccurResponse {
@@ -758,12 +952,7 @@ async fn rebuild_tkg(
     State(state): State<crate::api::types::AppState>,
     Path(file_uuid): Path<String>,
 ) -> Json<TkgRebuildResponse> {
-    let result = crate::core::processor::tkg::build_tkg(
-        &state.db,
-        &file_uuid,
-        &OUTPUT_DIR,
-    )
-    .await;
+    let result = crate::core::processor::tkg::build_tkg(&state.db, &file_uuid, &OUTPUT_DIR).await;
 
     match result {
         Ok(r) => Json(TkgRebuildResponse {
@@ -807,14 +996,14 @@ async fn get_representative_frame(
     State(state): State<crate::api::types::AppState>,
     Path(file_uuid): Path<String>,
 ) -> Result<Json<RepFrameResponse>, (StatusCode, Json<serde_json::Value>)> {
-    let result = tkg::query_auto_representative_frame(
-        state.db.pool(),
-        &file_uuid,
-    )
-    .await
-    .map_err(|e| {
-        (StatusCode::NOT_FOUND, Json(serde_json::json!({"error": e.to_string()})))
-    })?;
+    let result = tkg::query_auto_representative_frame(state.db.pool(), &file_uuid)
+        .await
+        .map_err(|e| {
+            (
+                StatusCode::NOT_FOUND,
+                Json(serde_json::json!({"error": e.to_string()})),
+            )
+        })?;
 
     let fps = query_fps(state.db.pool(), &file_uuid).await;
 
@@ -843,3 +1032,59 @@ async fn query_fps(pool: &sqlx::PgPool, file_uuid: &str) -> f64 {
     .flatten()
     .unwrap_or(25.0)
 }
+
+async fn get_stranger_representative_face(
+    State(state): State<crate::api::types::AppState>,
+    Path((file_uuid, stranger_id)): Path<(String, i32)>,
+) -> Result<Json<RepFaceResponse>, (StatusCode, Json<serde_json::Value>)> {
+    let faces_table = crate::core::db::schema::table_name("face_detections");
+
+    let trace_id: i32 = sqlx::query_scalar(&format!(
+        "SELECT trace_id FROM {} WHERE file_uuid = $1 AND stranger_id = $2 LIMIT 1",
+        faces_table
+    ))
+    .bind(&file_uuid)
+    .bind(stranger_id)
+    .fetch_optional(state.db.pool())
+    .await
+    .map_err(|e| {
+        (
+            StatusCode::INTERNAL_SERVER_ERROR,
+            Json(serde_json::json!({"error": e.to_string()})),
+        )
+    })?
+    .ok_or((
+        StatusCode::NOT_FOUND,
+        Json(serde_json::json!({"error": "Stranger not found"})),
+    ))?;
+
+    get_representative_face_inner(&state, &file_uuid, trace_id).await
+}
+
+async fn get_stranger_thumbnail(
+    State(state): State<crate::api::types::AppState>,
+    Path((file_uuid, stranger_id)): Path<(String, i32)>,
+) -> Result<Response, (StatusCode, Json<serde_json::Value>)> {
+    let faces_table = crate::core::db::schema::table_name("face_detections");
+
+    let trace_id: i32 = sqlx::query_scalar(&format!(
+        "SELECT trace_id FROM {} WHERE file_uuid = $1 AND stranger_id = $2 LIMIT 1",
+        faces_table
+    ))
+    .bind(&file_uuid)
+    .bind(stranger_id)
+    .fetch_optional(state.db.pool())
+    .await
+    .map_err(|e| {
+        (
+            StatusCode::INTERNAL_SERVER_ERROR,
+            Json(serde_json::json!({"error": e.to_string()})),
+        )
+    })?
+    .ok_or((
+        StatusCode::NOT_FOUND,
+        Json(serde_json::json!({"error": "Stranger not found"})),
+    ))?;
+
+    get_trace_thumbnail_inner(&state, &file_uuid, trace_id).await
+}
diff --git a/src/api/types.rs b/src/api/types.rs
index 9bca68c..0669b0f 100644
--- a/src/api/types.rs
+++ b/src/api/types.rs
@@ -1,6 +1,7 @@
 #[derive(Clone)]
 pub struct AppState {
     pub db: std::sync::Arc<crate::core::db::PostgresDb>,
+    pub qdrant: std::sync::Arc<crate::core::db::QdrantDb>,
     pub embedder: std::sync::Arc<crate::Embedder>,
     pub embedder_model: String,
     pub mongo_cache: crate::core::cache::MongoCache,
diff --git a/src/api/universal_search.rs b/src/api/universal_search.rs
index 34cb15a..739c21d 100644
--- a/src/api/universal_search.rs
+++ b/src/api/universal_search.rs
@@ -60,13 +60,12 @@ pub struct UniversalSearchResponse {
 pub enum SearchResult {
     #[serde(rename = "chunk")]
     Chunk {
+        file_uuid: String,
         chunk_id: String,
         chunk_type: String,
-        // Primary: frame-accurate position
         start_frame: i64,
         end_frame: i64,
         fps: f64,
-        // Reference: time derived from frames (subject to FPS variation)
         start_time: f64,
         end_time: f64,
         score: f64,
@@ -76,9 +75,8 @@ pub enum SearchResult {
     },
     #[serde(rename = "frame")]
     Frame {
-        // Primary: exact frame number
+        file_uuid: String,
         frame_number: i64,
-        // Reference: time derived from frame (subject to FPS variation)
         timestamp: f64,
         score: f64,
         objects: Option<Vec<serde_json::Value>>,
@@ -88,6 +86,7 @@ pub enum SearchResult {
     },
     #[serde(rename = "person")]
     Person {
+        file_uuid: Option<String>,
         identity_id: i32,
         identity_uuid: String,
         name: Option<String>,
@@ -328,17 +327,15 @@ async fn search_chunks(
     db: &PostgresDb,
     req: &UniversalSearchRequest,
 ) -> Result<Vec<SearchResult>, anyhow::Error> {
-    // uuid is required for chunk search - chunk_id is only unique within a video
-    let uuid = match &req.file_uuid {
-        Some(u) => u.replace('\'', "''"),
-        None => return Err(anyhow::anyhow!("file_uuid is required for chunk search")),
-    };
-
     let chunk_table = schema::table_name("chunk");
     let mut sql = format!(
-        "SELECT chunk_id, chunk_type, start_time, end_time, (start_time * fps)::bigint as start_frame, (end_time * fps)::bigint as end_frame, fps, text_content, content FROM {} WHERE file_uuid = '{}'",
-        chunk_table, uuid
+        "SELECT file_uuid, chunk_id, chunk_type, start_time, end_time, (start_time * fps)::bigint as start_frame, (end_time * fps)::bigint as end_frame, fps, text_content, content FROM {} WHERE 1=1",
+        chunk_table
     );
+
+    if let Some(uuid) = &req.file_uuid {
+        sql.push_str(&format!(" AND file_uuid = '{}'", uuid.replace('\'', "''")));
+    }
     if let Some(tr) = &req.time_range {
         sql.push_str(&format!(
             " AND start_time >= {} AND end_time <= {}",
@@ -422,6 +419,7 @@ async fn search_chunks(
     sql.push_str(&format!(" LIMIT {}", req.page_size.unwrap_or(20)));
 
     let rows: Vec<(
+        String,
         String,
         String,
         f64,
@@ -437,6 +435,7 @@ async fn search_chunks(
         .into_iter()
         .map(
             |(
+                file_uuid,
                 chunk_id,
                 chunk_type,
                 start_time,
@@ -457,7 +456,6 @@ async fn search_chunks(
                         .and_then(|v| v.as_str())
                         .map(String::from)
                 });
-                // Simple scoring: if query matches, score 0.8
                 let score = if !req.query.is_empty()
                     && text.as_ref().map_or(false, |t| {
                         t.to_lowercase().contains(&req.query.to_lowercase())
@@ -468,6 +466,7 @@ async fn search_chunks(
                 };
 
                 SearchResult::Chunk {
+                    file_uuid,
                     chunk_id,
                     chunk_type,
                     start_time,
@@ -549,7 +548,7 @@ async fn search_frames_internal(
 
     let results: Vec<SearchResult> = rows
         .into_iter()
-        .map(|(frame_number, timestamp, yolo, ocr, face, _uuid)| {
+        .map(|(frame_number, timestamp, yolo, ocr, face, file_uuid)| {
             let objects = yolo.as_ref().and_then(|v| {
                 v.get("objects")
                     .map(|o| o.as_array().cloned().unwrap_or_default())
@@ -571,6 +570,7 @@ async fn search_frames_internal(
             });
 
             SearchResult::Frame {
+                file_uuid,
                 frame_number,
                 timestamp,
                 score: 0.7,
@@ -589,37 +589,54 @@ async fn search_persons_internal(
     db: &PostgresDb,
     req: &UniversalSearchRequest,
 ) -> Result<Vec<SearchResult>, anyhow::Error> {
-    let uuid = match &req.file_uuid {
-        Some(u) => u.replace('\'', "''"),
-        None => return Err(anyhow::anyhow!("file_uuid is required for person search")),
-    };
-
     let id_table = schema::table_name("identities");
     let fd_table = schema::table_name("face_detections");
     let mut sql = format!(
         "SELECT i.id, i.uuid::text, i.name, COUNT(fd.id) AS appearance_count, \
-         MIN(fd.timestamp_secs) AS first_time, MAX(fd.timestamp_secs) AS last_time \
-         FROM {} i JOIN {} fd ON fd.identity_id = i.id \
-         WHERE fd.file_uuid = '{}'",
-        id_table, fd_table, uuid
+         MIN(fd.timestamp_secs) AS first_time, MAX(fd.timestamp_secs) AS last_time, \
+         fd.file_uuid \
+         FROM {} i JOIN {} fd ON fd.identity_id = i.id WHERE 1=1",
+        id_table, fd_table
     );
 
+    if let Some(uuid) = &req.file_uuid {
+        sql.push_str(&format!(
+            " AND fd.file_uuid = '{}'",
+            uuid.replace('\'', "''")
+        ));
+    }
+
     if !req.query.is_empty() {
         let q = req.query.replace('\'', "''");
         sql.push_str(&format!(" AND i.name ILIKE '%{}%'", q));
     }
 
-    sql.push_str(" GROUP BY i.id, i.uuid, i.name");
+    sql.push_str(" GROUP BY i.id, i.uuid, i.name, fd.file_uuid");
     sql.push_str(" ORDER BY appearance_count DESC");
     sql.push_str(&format!(" LIMIT {}", req.page_size.unwrap_or(20)));
 
-    let rows: Vec<(i32, String, Option<String>, i64, Option<f64>, Option<f64>)> =
-        sqlx::query_as(&sql).fetch_all(db.pool()).await?;
+    let rows: Vec<(
+        i32,
+        String,
+        Option<String>,
+        i64,
+        Option<f64>,
+        Option<f64>,
+        String,
+    )> = sqlx::query_as(&sql).fetch_all(db.pool()).await?;
 
     let results: Vec<SearchResult> = rows
         .into_iter()
         .map(
-            |(identity_id, identity_uuid, name, appearance_count, first_time, last_time)| {
+            |(
+                identity_id,
+                identity_uuid,
+                name,
+                appearance_count,
+                first_time,
+                last_time,
+                file_uuid,
+            )| {
                 let score = if !req.query.is_empty()
                     && name.as_ref().map_or(false, |n| {
                         n.to_lowercase().contains(&req.query.to_lowercase())
@@ -630,6 +647,7 @@ async fn search_persons_internal(
                 };
 
                 SearchResult::Person {
+                    file_uuid: Some(file_uuid),
                     identity_id,
                     identity_uuid,
                     name,
diff --git a/src/api/visual_chunk_search.rs b/src/api/visual_chunk_search.rs
deleted file mode 100644
index 1b21221..0000000
--- a/src/api/visual_chunk_search.rs
+++ /dev/null
@@ -1,513 +0,0 @@
-//! Visual chunk search functionality.
-//!
-//! This module provides search capabilities for visual chunks based on:
-//! - Object classes (e.g., "person", "car", "envelope")
-//! - Confidence thresholds
-//! - Object counts
-//! - Spatial density
-//! - Object relationships
-
-use crate::core::chunk::types::{Chunk, ChunkRule, ChunkType};
-use crate::core::db::{schema, PostgresDb};
-use anyhow::Result;
-use serde_json::Value;
-use std::collections::HashMap;
-
-/// Criteria for searching visual chunks
-#[derive(Debug, Clone, serde::Serialize, serde::Deserialize)]
-pub struct VisualChunkSearchCriteria {
-    /// Minimum average confidence across frames
-    pub min_avg_confidence: Option<f32>,
-    /// Minimum number of frames with objects
-    pub min_frames_with_objects: Option<u32>,
-    /// Minimum number of unique object classes
-    pub min_unique_classes: Option<u32>,
-    /// Specific object classes to include (empty means all)
-    #[serde(default)]
-    pub required_classes: Vec<String>,
-    /// Object class counts to filter by
-    #[serde(default)]
-    pub class_counts: HashMap<String, (u32, u32)>,
-    /// Time range (optional)
-    pub time_range: Option<(f64, f64)>,
-}
-
-impl Default for VisualChunkSearchCriteria {
-    fn default() -> Self {
-        Self {
-            min_avg_confidence: None,
-            min_frames_with_objects: None,
-            min_unique_classes: None,
-            required_classes: Vec::new(),
-            class_counts: HashMap::new(),
-            time_range: None,
-        }
-    }
-}
-
-/// Search visual chunks based on criteria
-pub async fn search_visual_chunks(
-    db: &PostgresDb,
-    uuid: &str,
-    criteria: &VisualChunkSearchCriteria,
-) -> Result<Vec<Chunk>> {
-    // First, get all visual chunks for this video
-    let all_chunks = get_visual_chunks_by_uuid(db, uuid).await?;
-
-    // Apply filters
-    let filtered_chunks: Vec<Chunk> = all_chunks
-        .into_iter()
-        .filter(|chunk| {
-            // Check min avg confidence
-            if let Some(min_avg_confidence) = criteria.min_avg_confidence {
-                if let Some(content) = &chunk.content.as_object() {
-                    if let Some(metadata) = content.get("metadata") {
-                        if let Some(avg_confidence) = metadata.get("avg_confidence") {
-                            if let Some(conf) = avg_confidence.as_f64() {
-                                if conf < min_avg_confidence as f64 {
-                                    return false;
-                                }
-                            }
-                        }
-                    }
-                }
-            }
-
-            // Check min frames with objects
-            if let Some(min_frames) = criteria.min_frames_with_objects {
-                if let Some(stats) = &chunk.visual_stats {
-                    if let Some(frames_with_objects) = stats.get("frames_with_objects") {
-                        if let Some(count) = frames_with_objects.as_u64() {
-                            if count < min_frames as u64 {
-                                return false;
-                            }
-                        }
-                    }
-                }
-            }
-
-            // Check min unique classes
-            if let Some(min_unique_classes) = criteria.min_unique_classes {
-                if let Some(content) = &chunk.content.as_object() {
-                    if let Some(metadata) = content.get("metadata") {
-                        if let Some(unique_classes) = metadata.get("unique_classes") {
-                            if let Some(classes) = unique_classes.as_array() {
-                                if (classes.len() as u32) < min_unique_classes {
-                                    return false;
-                                }
-                            }
-                        }
-                    }
-                }
-            }
-
-            // Check required classes
-            if !criteria.required_classes.is_empty() {
-                if let Some(content) = &chunk.content.as_object() {
-                    if let Some(keyframe_objects) = content.get("keyframe_objects") {
-                        if let Some(objects) = keyframe_objects.as_array() {
-                            let mut found_all = true;
-                            for required_class in &criteria.required_classes {
-                                let mut found = false;
-                                for obj in objects {
-                                    if let Some(class_name) = obj.get("class_name") {
-                                        if let Some(class_str) = class_name.as_str() {
-                                            if class_str == required_class {
-                                                found = true;
-                                                break;
-                                            }
-                                        }
-                                    }
-                                }
-                                if !found {
-                                    found_all = false;
-                                    break;
-                                }
-                            }
-                            if !found_all {
-                                return false;
-                            }
-                        }
-                    }
-                }
-            }
-
-            // Check class counts
-            if !criteria.class_counts.is_empty() {
-                if let Some(content) = &chunk.content.as_object() {
-                    if let Some(metadata) = content.get("metadata") {
-                        if let Some(object_counts) = metadata.get("object_counts") {
-                            for (class, (min, max)) in &criteria.class_counts {
-                                if let Some(count_value) = object_counts.get(class) {
-                                    if let Some(count) = count_value.as_u64() {
-                                        if *min > 0 && count < *min as u64 {
-                                            return false;
-                                        }
-                                        if *max < u32::MAX && count > *max as u64 {
-                                            return false;
-                                        }
-                                    }
-                                } else if *min > 0 {
-                                    return false;
-                                }
-                            }
-                        } else if criteria.class_counts.values().any(|(min, _)| *min > 0) {
-                            return false;
-                        }
-                    }
-                }
-            }
-
-            // Check time range
-            if let Some((start_time, end_time)) = criteria.time_range {
-                // Calculate chunk time from frames
-                let chunk_start_time = chunk.start_frame as f64 / chunk.fps;
-                let chunk_end_time = chunk.end_frame as f64 / chunk.fps;
-
-                if chunk_start_time < start_time || chunk_end_time > end_time {
-                    return false;
-                }
-            }
-
-            true
-        })
-        .collect();
-
-    Ok(filtered_chunks)
-}
-
-/// Get all visual chunks for a video UUID
-async fn get_visual_chunks_by_uuid(db: &PostgresDb, uuid: &str) -> Result<Vec<Chunk>> {
-    let chunk_table = schema::table_name("chunk");
-    let sql = format!(
-        "SELECT file_id, file_uuid, chunk_id, chunk_type, fps, start_frame, end_frame, text_content, content, metadata, vector_id, visual_stats FROM {} WHERE file_uuid = '{}' AND chunk_type = 'visual' ORDER BY start_frame ASC",
-        chunk_table, uuid.replace('\'', "''")
-    );
-
-    let rows: Vec<(
-        i32,            // file_id
-        String,         // uuid
-        String,         // chunk_id
-        String,         // chunk_type
-        f64,            // fps
-        i64,            // start_frame
-        i64,            // end_frame
-        Option<String>, // text_content
-        Value,          // content
-        Option<Value>,  // metadata
-        Option<String>, // vector_id
-        Option<Value>,  // visual_stats
-    )> = sqlx::query_as(&sql).fetch_all(db.pool()).await?;
-
-    let mut chunks = Vec::new();
-    for row in rows {
-        let chunk_type = match row.3.as_str() {
-            "visual" => ChunkType::Visual,
-            "sentence" => ChunkType::Sentence,
-            "time_based" => ChunkType::TimeBased,
-            "cut" => ChunkType::Cut,
-            "trace" => ChunkType::Trace,
-            "story" => ChunkType::Story,
-            _ => ChunkType::TimeBased,
-        };
-
-        // Calculate frame_count
-        let frame_count = (row.6 - row.5) as i32;
-
-        chunks.push(Chunk {
-            file_id: row.0,
-            uuid: row.1,
-            chunk_id: row.2,
-            chunk_type,
-            rule: ChunkRule::Rule2, // Visual chunks use Rule2
-            fps: row.4,
-            start_frame: row.5,
-            end_frame: row.6,
-            text_content: row.7,
-            content: row.8,
-            metadata: row.9,
-            vector_id: row.10,
-            frame_count,
-            pre_chunk_ids: Vec::new(),
-            parent_chunk_id: None,
-            child_chunk_ids: Vec::new(),
-            visual_stats: row.11,
-        });
-    }
-
-    Ok(chunks)
-}
-
-/// Search visual chunks by object class
-pub async fn search_visual_chunks_by_class(
-    db: &PostgresDb,
-    uuid: &str,
-    object_class: &str,
-    min_count: Option<u32>,
-    max_count: Option<u32>,
-) -> Result<Vec<Chunk>> {
-    let all_chunks = get_visual_chunks_by_uuid(db, uuid).await?;
-
-    let filtered_chunks: Vec<Chunk> = all_chunks
-        .into_iter()
-        .filter(|chunk| {
-            // Check if chunk contains the object class
-            let mut contains_class = false;
-            if let Some(content) = &chunk.content.as_object() {
-                if let Some(keyframe_objects) = content.get("keyframe_objects") {
-                    if let Some(objects) = keyframe_objects.as_array() {
-                        for obj in objects {
-                            if let Some(class_name) = obj.get("class_name") {
-                                if let Some(class_str) = class_name.as_str() {
-                                    if class_str == object_class {
-                                        contains_class = true;
-                                        break;
-                                    }
-                                }
-                            }
-                        }
-                    }
-                }
-            }
-
-            if !contains_class {
-                return false;
-            }
-
-            // Check count in visual_stats
-            if let Some(stats) = &chunk.visual_stats {
-                if let Some(count) = stats.get(object_class) {
-                    if let Some(c) = count.as_u64() {
-                        if let Some(min) = min_count {
-                            if c < min as u64 {
-                                return false;
-                            }
-                        }
-                        if let Some(max) = max_count {
-                            if c > max as u64 {
-                                return false;
-                            }
-                        }
-                    }
-                }
-            }
-
-            true
-        })
-        .collect();
-
-    Ok(filtered_chunks)
-}
-
-/// Search visual chunks by spatial density
-pub async fn search_visual_chunks_by_density(
-    db: &PostgresDb,
-    uuid: &str,
-    min_density: f32,
-    max_density: Option<f32>,
-) -> Result<Vec<Chunk>> {
-    let all_chunks = get_visual_chunks_by_uuid(db, uuid).await?;
-
-    let filtered_chunks: Vec<Chunk> = all_chunks
-        .into_iter()
-        .filter(|chunk| {
-            if let Some(content) = &chunk.content.as_object() {
-                if let Some(metadata) = content.get("metadata") {
-                    if let Some(density_value) = metadata.get("spatial_density") {
-                        if let Some(density) = density_value.as_f64() {
-                            if density < min_density as f64 {
-                                return false;
-                            }
-                            if let Some(max_dens) = max_density {
-                                if density > max_dens as f64 {
-                                    return false;
-                                }
-                            }
-                            return true;
-                        }
-                    }
-                }
-            }
-            false
-        })
-        .collect();
-
-    Ok(filtered_chunks)
-}
-
-/// Find chunks containing specific object combinations
-pub async fn search_visual_chunks_by_combination(
-    db: &PostgresDb,
-    uuid: &str,
-    combination: &[(&str, u32)],
-) -> Result<Vec<Chunk>> {
-    let all_chunks = get_visual_chunks_by_uuid(db, uuid).await?;
-
-    let filtered_chunks: Vec<Chunk> = all_chunks
-        .into_iter()
-        .filter(|chunk| {
-            // Check if all required combinations are present
-            for (object_class, min_count) in combination {
-                let mut found = false;
-                if let Some(stats) = &chunk.visual_stats {
-                    if let Some(object_counts) = stats.get("object_counts") {
-                        if let Some(count_value) = object_counts.get(*object_class) {
-                            if let Some(count) = count_value.as_u64() {
-                                if count >= *min_count as u64 {
-                                    found = true;
-                                }
-                            }
-                        }
-                    }
-                }
-                if !found {
-                    return false;
-                }
-            }
-            true
-        })
-        .collect();
-
-    Ok(filtered_chunks)
-}
-
-/// Get visual chunk statistics
-pub async fn get_visual_chunk_statistics(
-    db: &PostgresDb,
-    uuid: &str,
-) -> Result<HashMap<String, Value>> {
-    let chunk_table = schema::table_name("chunk");
-    let sql = format!(
-        "SELECT 
-            COUNT(*) as total_chunks,
-            AVG((content->'metadata'->>'avg_confidence')::float) as avg_confidence,
-            MIN((content->'metadata'->>'avg_confidence')::float) as min_confidence,
-            MAX((content->'metadata'->>'avg_confidence')::float) as max_confidence,
-            SUM((content->'metadata'->>'object_count')::int) as total_objects,
-            AVG((content->'metadata'->>'spatial_density')::float) as avg_density
-        FROM {} 
-        WHERE file_uuid = '{}' 
-        AND chunk_type = 'visual'",
-        chunk_table,
-        uuid.replace('\'', "''")
-    );
-
-    let row: (
-        i64,
-        Option<f64>,
-        Option<f64>,
-        Option<f64>,
-        Option<i64>,
-        Option<f64>,
-    ) = sqlx::query_as(&sql).fetch_one(db.pool()).await?;
-
-    let mut stats = HashMap::new();
-    stats.insert("total_chunks".to_string(), Value::from(row.0));
-    stats.insert(
-        "avg_confidence".to_string(),
-        Value::from(row.1.unwrap_or(0.0)),
-    );
-    stats.insert(
-        "min_confidence".to_string(),
-        Value::from(row.2.unwrap_or(0.0)),
-    );
-    stats.insert(
-        "max_confidence".to_string(),
-        Value::from(row.3.unwrap_or(0.0)),
-    );
-    stats.insert("total_objects".to_string(), Value::from(row.4.unwrap_or(0)));
-    stats.insert("avg_density".to_string(), Value::from(row.5.unwrap_or(0.0)));
-
-    Ok(stats)
-}
-
-#[cfg(test)]
-mod tests {
-    use super::*;
-
-    #[test]
-    fn test_visual_chunk_search_criteria_default() {
-        let criteria = VisualChunkSearchCriteria::default();
-
-        assert_eq!(criteria.min_avg_confidence, None);
-        assert_eq!(criteria.min_frames_with_objects, None);
-        assert_eq!(criteria.min_unique_classes, None);
-        assert!(criteria.required_classes.is_empty());
-        assert!(criteria.class_counts.is_empty());
-        assert_eq!(criteria.time_range, None);
-    }
-
-    #[test]
-    fn test_visual_chunk_search_criteria_with_values() {
-        let mut criteria = VisualChunkSearchCriteria::default();
-        criteria.min_avg_confidence = Some(0.8);
-        criteria.min_frames_with_objects = Some(10);
-        criteria.min_unique_classes = Some(3);
-        criteria.required_classes = vec!["person".to_string(), "car".to_string()];
-        criteria.time_range = Some((0.0, 60.0));
-
-        assert_eq!(criteria.min_avg_confidence, Some(0.8));
-        assert_eq!(criteria.min_frames_with_objects, Some(10));
-        assert_eq!(criteria.min_unique_classes, Some(3));
-        assert_eq!(criteria.required_classes.len(), 2);
-        assert_eq!(criteria.time_range, Some((0.0, 60.0)));
-    }
-
-    #[test]
-    fn test_visual_chunk_search_criteria_serialization() {
-        let criteria = VisualChunkSearchCriteria {
-            min_avg_confidence: Some(0.85),
-            min_frames_with_objects: Some(5),
-            min_unique_classes: Some(2),
-            required_classes: vec!["person".to_string()],
-            class_counts: HashMap::new(),
-            time_range: Some((10.0, 30.0)),
-        };
-
-        let json = serde_json::to_string(&criteria).unwrap();
-        assert!(json.contains("min_avg_confidence"));
-        assert!(json.contains("required_classes"));
-
-        let deserialized: VisualChunkSearchCriteria = serde_json::from_str(&json).unwrap();
-        assert_eq!(deserialized.min_avg_confidence, Some(0.85));
-        assert_eq!(deserialized.required_classes.len(), 1);
-    }
-
-    #[test]
-    fn test_visual_chunk_search_criteria_with_class_counts() {
-        let mut criteria = VisualChunkSearchCriteria::default();
-        criteria.class_counts.insert("person".to_string(), (5, 20));
-        criteria.class_counts.insert("car".to_string(), (1, 10));
-
-        assert_eq!(criteria.class_counts.len(), 2);
-        assert_eq!(criteria.class_counts.get("person"), Some(&(5, 20)));
-        assert_eq!(criteria.class_counts.get("car"), Some(&(1, 10)));
-    }
-
-    #[test]
-    fn test_chunk_type_conversion() {
-        // Test chunk type string to enum conversion logic
-        let test_cases = vec![
-            ("visual", ChunkType::Visual),
-            ("sentence", ChunkType::Sentence),
-            ("time_based", ChunkType::TimeBased),
-            ("cut", ChunkType::Cut),
-            ("trace", ChunkType::Trace),
-            ("story", ChunkType::Story),
-            ("unknown", ChunkType::TimeBased), // Default fallback
-        ];
-
-        for (input, expected) in test_cases {
-            let chunk_type = match input {
-                "visual" => ChunkType::Visual,
-                "sentence" => ChunkType::Sentence,
-                "time_based" => ChunkType::TimeBased,
-                "cut" => ChunkType::Cut,
-                "trace" => ChunkType::Trace,
-                "story" => ChunkType::Story,
-                _ => ChunkType::TimeBased,
-            };
-            assert_eq!(chunk_type, expected);
-        }
-    }
-}
diff --git a/src/api/visual_search.rs b/src/api/visual_search.rs
deleted file mode 100644
index bdca397..0000000
--- a/src/api/visual_search.rs
+++ /dev/null
@@ -1,217 +0,0 @@
-use axum::{extract::State, http::StatusCode, response::Json, routing::post, Router};
-use serde::{Deserialize, Serialize};
-use sha2::{Digest, Sha256};
-
-use super::types::AppState;
-use super::visual_chunk_search;
-use crate::core::cache::keys;
-use crate::core::chunk::types::Chunk;
-use crate::core::db::{Database, PostgresDb};
-
-fn generate_visual_search_hash(
-    uuid: &str,
-    criteria: &visual_chunk_search::VisualChunkSearchCriteria,
-) -> String {
-    let data = serde_json::json!({
-        "uuid": uuid,
-        "criteria": criteria,
-    });
-    let mut hasher = Sha256::new();
-    hasher.update(data.to_string().as_bytes());
-    format!("{:x}", hasher.finalize())[..16].to_string()
-}
-
-#[derive(Debug, Deserialize)]
-struct VisualChunkSearchRequest {
-    file_uuid: String,
-    criteria: visual_chunk_search::VisualChunkSearchCriteria,
-}
-
-#[derive(Debug, Serialize)]
-struct VisualChunkSearchResponse {
-    chunks: Vec<Chunk>,
-    total: usize,
-}
-
-async fn search_visual_chunks(
-    State(state): State<AppState>,
-    Json(req): Json<VisualChunkSearchRequest>,
-) -> Result<Json<VisualChunkSearchResponse>, StatusCode> {
-    let criteria_hash = generate_visual_search_hash(&req.file_uuid, &req.criteria);
-    let cache_key = keys::visual_search(&req.file_uuid, &criteria_hash);
-    let ttl = state.mongo_cache.ttl_visual_search();
-
-    let chunks = state
-        .mongo_cache
-        .get_or_fetch(&cache_key, ttl, keys::CATEGORY_VISUAL_SEARCH, || async {
-            let db = PostgresDb::init()
-                .await
-                .map_err(|e| anyhow::anyhow!("PG init failed: {}", e))?;
-
-            visual_chunk_search::search_visual_chunks(&db, &req.file_uuid, &req.criteria)
-                .await
-                .map_err(|e| anyhow::anyhow!("Visual search failed: {}", e))
-        })
-        .await
-        .map_err(|e| {
-            tracing::error!("Visual chunk search failed: {}", e);
-            StatusCode::INTERNAL_SERVER_ERROR
-        })?;
-
-    Ok(Json(VisualChunkSearchResponse {
-        total: chunks.len(),
-        chunks,
-    }))
-}
-
-#[derive(Debug, Deserialize)]
-struct VisualChunkSearchByClassRequest {
-    uuid: String,
-    object_class: String,
-    min_count: Option<u32>,
-    max_count: Option<u32>,
-}
-
-#[derive(Debug, Deserialize)]
-struct VisualChunkSearchByDensityRequest {
-    uuid: String,
-    min_density: f32,
-    max_density: Option<f32>,
-}
-
-#[derive(Debug, Deserialize)]
-struct VisualChunkStatsRequest {
-    uuid: String,
-}
-
-async fn search_visual_chunks_by_class(
-    State(state): State<AppState>,
-    Json(req): Json<VisualChunkSearchByClassRequest>,
-) -> Result<Json<VisualChunkSearchResponse>, StatusCode> {
-    let db = PostgresDb::init()
-        .await
-        .map_err(|_| StatusCode::INTERNAL_SERVER_ERROR)?;
-
-    let chunks = visual_chunk_search::search_visual_chunks_by_class(
-        &db,
-        &req.uuid,
-        &req.object_class,
-        req.min_count,
-        req.max_count,
-    )
-    .await
-    .map_err(|e| {
-        tracing::error!("Visual chunk search by class failed: {}", e);
-        StatusCode::INTERNAL_SERVER_ERROR
-    })?;
-
-    Ok(Json(VisualChunkSearchResponse {
-        total: chunks.len(),
-        chunks,
-    }))
-}
-
-async fn search_visual_chunks_by_density(
-    State(state): State<AppState>,
-    Json(req): Json<VisualChunkSearchByDensityRequest>,
-) -> Result<Json<VisualChunkSearchResponse>, StatusCode> {
-    let db = PostgresDb::init()
-        .await
-        .map_err(|_| StatusCode::INTERNAL_SERVER_ERROR)?;
-
-    let chunks = visual_chunk_search::search_visual_chunks_by_density(
-        &db,
-        &req.uuid,
-        req.min_density,
-        req.max_density,
-    )
-    .await
-    .map_err(|e| {
-        tracing::error!("Visual chunk search by density failed: {}", e);
-        StatusCode::INTERNAL_SERVER_ERROR
-    })?;
-
-    Ok(Json(VisualChunkSearchResponse {
-        total: chunks.len(),
-        chunks,
-    }))
-}
-
-#[derive(Debug, Serialize)]
-struct VisualChunkStatsResponse {
-    uuid: String,
-    stats: std::collections::HashMap<String, serde_json::Value>,
-}
-
-async fn get_visual_chunk_stats(
-    State(state): State<AppState>,
-    Json(req): Json<VisualChunkStatsRequest>,
-) -> Result<Json<VisualChunkStatsResponse>, StatusCode> {
-    let db = PostgresDb::init()
-        .await
-        .map_err(|_| StatusCode::INTERNAL_SERVER_ERROR)?;
-
-    let stats = visual_chunk_search::get_visual_chunk_statistics(&db, &req.uuid)
-        .await
-        .map_err(|e| {
-            tracing::error!("Get visual chunk stats failed: {}", e);
-            StatusCode::INTERNAL_SERVER_ERROR
-        })?;
-
-    Ok(Json(VisualChunkStatsResponse {
-        uuid: req.uuid,
-        stats,
-    }))
-}
-
-#[derive(Debug, Deserialize)]
-struct VisualChunkSearchByCombinationRequest {
-    uuid: String,
-    combination: Vec<(String, u32)>,
-}
-
-async fn search_visual_chunks_by_combination(
-    State(state): State<AppState>,
-    Json(req): Json<VisualChunkSearchByCombinationRequest>,
-) -> Result<Json<VisualChunkSearchResponse>, StatusCode> {
-    let db = PostgresDb::init()
-        .await
-        .map_err(|_| StatusCode::INTERNAL_SERVER_ERROR)?;
-
-    let combination: Vec<(&str, u32)> = req
-        .combination
-        .iter()
-        .map(|(c, n)| (c.as_str(), *n))
-        .collect();
-
-    let chunks =
-        visual_chunk_search::search_visual_chunks_by_combination(&db, &req.uuid, &combination)
-            .await
-            .map_err(|e| {
-                tracing::error!("Visual chunk search by combination failed: {}", e);
-                StatusCode::INTERNAL_SERVER_ERROR
-            })?;
-
-    Ok(Json(VisualChunkSearchResponse {
-        total: chunks.len(),
-        chunks,
-    }))
-}
-
-pub fn visual_search_routes() -> Router<AppState> {
-    Router::new()
-        .route("/api/v1/search/visual", post(search_visual_chunks))
-        .route(
-            "/api/v1/search/visual/class",
-            post(search_visual_chunks_by_class),
-        )
-        .route(
-            "/api/v1/search/visual/density",
-            post(search_visual_chunks_by_density),
-        )
-        .route("/api/v1/search/visual/stats", post(get_visual_chunk_stats))
-        .route(
-            "/api/v1/search/visual/combination",
-            post(search_visual_chunks_by_combination),
-        )
-}
diff --git a/src/bin/check_db_schema.rs b/src/bin/check_db_schema.rs
new file mode 100644
index 0000000..04bc422
--- /dev/null
+++ b/src/bin/check_db_schema.rs
@@ -0,0 +1,51 @@
+use sqlx::postgres::PgPoolOptions;
+use sqlx::{PgPool, Row};
+
+/// Connection string used when `DATABASE_URL` is not set.
+const DEFAULT_DATABASE_URL: &str = "postgres://accusys@localhost:5432/momentry";
+
+/// Lists the columns of one `public` table, in ordinal order.
+const COLUMNS_SQL: &str = "SELECT column_name, data_type FROM information_schema.columns WHERE table_schema='public' AND table_name=$1 ORDER BY ordinal_position";
+
+/// Reports whether a `public.jobs` table exists.
+const JOBS_EXISTS_SQL: &str = "SELECT EXISTS (SELECT 1 FROM information_schema.tables WHERE table_schema='public' AND table_name='jobs')";
+
+/// Prints every column of `public.<table>` as `name: data_type`.
+///
+/// The table name is sent as a bind parameter rather than spliced into the
+/// SQL text, and column values are read with `try_get` so that an unexpected
+/// type becomes an `Err` instead of a panic.
+async fn print_table_columns(pool: &PgPool, table: &str) -> Result<(), sqlx::Error> {
+    let rows = sqlx::query(COLUMNS_SQL).bind(table).fetch_all(pool).await?;
+    println!("=== public.{} columns ===", table);
+    for row in &rows {
+        let col: String = row.try_get("column_name")?;
+        let typ: String = row.try_get("data_type")?;
+        println!("  {}: {}", col, typ);
+    }
+    Ok(())
+}
+
+/// Schema inspection helper: prints the columns of `public.videos` and
+/// `public.chunks_rule1`, then whether `public.jobs` exists.
+///
+/// Connects to `DATABASE_URL`, falling back to `DEFAULT_DATABASE_URL`.
+#[tokio::main]
+async fn main() -> Result<(), Box<dyn std::error::Error>> {
+    let url = std::env::var("DATABASE_URL").unwrap_or_else(|_| DEFAULT_DATABASE_URL.into());
+    let pool = PgPoolOptions::new()
+        .max_connections(1)
+        .connect(&url)
+        .await?;
+
+    for table in ["videos", "chunks_rule1"] {
+        print_table_columns(&pool, table).await?;
+    }
+
+    let exists: bool = sqlx::query_scalar(JOBS_EXISTS_SQL)
+        .fetch_one(&pool)
+        .await?;
+    println!("=== public.jobs exists: {} ===", exists);
+
+    Ok(())
+}
diff --git a/src/bin/sync_qdrant_from_pg.rs b/src/bin/sync_qdrant_from_pg.rs
new file mode 100644
index 0000000..7790d7a
--- /dev/null
+++ b/src/bin/sync_qdrant_from_pg.rs
@@ -0,0 +1,112 @@
+use anyhow::{Context, Result};
+use momentry_core::{Database, PostgresDb, QdrantDb, VectorPayload};
+
+/// One-off maintenance tool: re-publishes sentence-chunk embeddings that are
+/// already stored in PostgreSQL to Qdrant, for a fixed list of file UUIDs.
+///
+/// Per-chunk failures (an unparsable stored vector or a failed Qdrant upsert)
+/// are logged to stderr, counted, and skipped so that one bad row does not
+/// abort the remaining chunks and files. Database-level failures still abort.
+#[tokio::main]
+async fn main() -> Result<()> {
+    // NOTE(review): machine-specific absolute path; a missing file is ignored (`.ok()`).
+    dotenv::from_filename("/Users/accusys/momentry_core_0.1/.env.development").ok();
+    tracing_subscriber::fmt::init();
+
+    let pg = PostgresDb::init().await.context("Failed to init PostgreSQL")?;
+    let qdrant = QdrantDb::new();
+    let chunk_table = momentry_core::core::db::schema::table_name("chunk");
+
+    // The statement only depends on the table name, so build it once.
+    let select_sql = format!(
+        "SELECT chunk_id, text_content, start_frame, end_frame, \
+         start_time, end_time, embedding::text, content::text \
+         FROM {} \
+         WHERE file_uuid = $1 \
+           AND chunk_type = 'sentence' \
+           AND embedding IS NOT NULL \
+           AND (text_content IS NOT NULL AND text_content != '') \
+         ORDER BY id",
+        chunk_table
+    );
+
+    let uuids = vec![
+        "63acd3bb02b5b9dfbb9d6db499fcc864",
+        "a6fb22eebefaef17e62af874997c5944",
+        "d81e01261391b45c1a14ddd5f082733e",
+    ];
+
+    for uuid in &uuids {
+        let rows = sqlx::query_as::<_, (String, String, i64, i64, f64, f64, String, String)>(
+            &select_sql,
+        )
+        .bind(uuid)
+        .fetch_all(pg.pool())
+        .await?;
+
+        let total = rows.len();
+        println!("[{}] Found {} sentence chunks with embeddings to sync to Qdrant", uuid, total);
+
+        if total == 0 {
+            continue;
+        }
+
+        let start = std::time::Instant::now();
+        let mut stored = 0usize;
+        let mut errors = 0usize;
+
+        for (chunk_id, text, start_frame, end_frame, start_time, end_time, vector_text, _content_str) in &rows {
+            // The `embedding::text` column value is parsed as a JSON array of floats.
+            let vector: Vec<f32> = match serde_json::from_str(vector_text) {
+                Ok(v) => v,
+                Err(e) => {
+                    eprintln!("[ERROR] Failed to parse vector for {}: {}", chunk_id, e);
+                    errors += 1;
+                    continue;
+                }
+            };
+
+            let payload = VectorPayload {
+                file_uuid: uuid.to_string(),
+                chunk_id: chunk_id.clone(),
+                chunk_type: "sentence".to_string(),
+                start_frame: *start_frame,
+                end_frame: *end_frame,
+                start_time: *start_time,
+                end_time: *end_time,
+                text: Some(text.clone()),
+            };
+
+            if let Err(e) = qdrant.upsert_vector(chunk_id, &vector, payload).await {
+                eprintln!("[ERROR] Qdrant upsert failed for {}: {}", chunk_id, e);
+                errors += 1;
+                continue;
+            }
+
+            stored += 1;
+            if stored % 5000 == 0 || stored == total {
+                let elapsed = start.elapsed();
+                let rate = stored as f64 / elapsed.as_secs_f64();
+                println!(
+                    "  [{}] {}/{} ({:.1}%) | {:.0} vec/s | {} errors",
+                    uuid.get(..8).unwrap_or(uuid),
+                    stored, total,
+                    100.0 * stored as f64 / total as f64,
+                    rate, errors,
+                );
+            }
+        }
+
+        let elapsed = start.elapsed();
+        println!(
+            "[{}] Done! {}/{} vectors synced ({} errors) in {:.1}s ({:.0} vec/s avg)",
+            uuid.get(..8).unwrap_or(uuid),
+            stored, total, errors,
+            elapsed.as_secs_f64(),
+            stored as f64 / elapsed.as_secs_f64(),
+        );
+    }
+
+    println!("\nAll files synced to Qdrant!");
+    Ok(())
+}
diff --git a/src/bin/test_bson_deserialize.rs b/src/bin/test_bson_deserialize.rs
new file mode 100644
index 0000000..1402d5f
--- /dev/null
+++ b/src/bin/test_bson_deserialize.rs
@@ -0,0 +1,45 @@
+use bson::bson;
+use chrono::{DateTime, Utc};
+use serde::{Deserialize, Serialize};
+
+#[derive(Debug, Clone, Serialize, Deserialize)]
+struct TestIdentitySnapshot {
+    id: i32,
+    uuid: String,
+    name: String,
+    identity_type: Option<String>,
+    source: Option<String>,
+    status: String,
+    tmdb_id: Option<i32>,
+    tmdb_profile: Option<String>,
+    metadata: serde_json::Value,
+    #[serde(
+        with = "bson::serde_helpers::chrono_datetime_as_bson_datetime_optional",
+        default
+    )]
+    created_at: Option<DateTime<Utc>>,
+    face_count: i64,
+}
+
+fn main() {
+    // Simulate a MongoDB document
+    let doc = bson!({
+        "id": bson::Bson::Int32(21),
+        "uuid": "1524f6a1537f48a187526d44a236584f",
+        "name": "Albert Daumergue",
+        "identity_type": "people",
+        "source": "tmdb",
+        "status": "confirmed",
+        "tmdb_id": bson::Bson::Int32(1100817),
+        "tmdb_profile": bson::Bson::Null,
+        "metadata": {"role": "", "notes": "", "aliases": [], "starred": false},
+        "created_at": bson::Bson::DateTime(bson::DateTime::from_millis(1714641951963)),
+        "face_count": bson::Bson::Int64(0)
+    });
+
+    let result: Result<TestIdentitySnapshot, _> = bson::from_bson(doc);
+    match result {
+        Ok(s) => println!("Success! {:?}", s),
+        Err(e) => println!("Error: {}", e),
+    }
+}
diff --git a/src/bin/test_empty_array.rs b/src/bin/test_empty_array.rs
new file mode 100644
index 0000000..49ebe32
--- /dev/null
+++ b/src/bin/test_empty_array.rs
@@ -0,0 +1,25 @@
+use bson::bson;
+use serde::{Deserialize, Serialize};
+
+#[derive(Debug, Clone, Serialize, Deserialize)]
+struct FacesTransferred {
+    file_uuid: String,
+    face_ids: Vec<String>,
+    trace_ids: Vec<i32>,
+    count: i64,
+}
+
+/// Deserializes a BSON document with empty arrays into `FacesTransferred` and prints the outcome.
+fn main() {
+    let doc = bson!({
+        "file_uuid": "",
+        "face_ids": [],
+        "trace_ids": [],
+        "count": bson::Bson::Int64(0)
+    });
+
+    match bson::from_bson::<FacesTransferred>(doc) {
+        Ok(parsed) => println!("Success! trace_ids len: {}", parsed.trace_ids.len()),
+        Err(err) => println!("Error: {}", err),
+    }
+}
diff --git a/src/bin/test_full_deserialize.rs b/src/bin/test_full_deserialize.rs
new file mode 100644
index 0000000..c605ff3
--- /dev/null
+++ b/src/bin/test_full_deserialize.rs
@@ -0,0 +1,131 @@
+use bson::bson;
+use chrono::{DateTime, Utc};
+use serde::{Deserialize, Serialize};
+
+#[derive(Debug, Clone, Serialize, Deserialize)]
+struct IdentitySnapshot {
+    id: i32,
+    uuid: String,
+    name: String,
+    identity_type: Option<String>,
+    source: Option<String>,
+    status: String,
+    tmdb_id: Option<i32>,
+    tmdb_profile: Option<String>,
+    metadata: serde_json::Value,
+    #[serde(
+        with = "bson::serde_helpers::chrono_datetime_as_bson_datetime_optional",
+        default
+    )]
+    created_at: Option<DateTime<Utc>>,
+    face_count: i64,
+}
+
+#[derive(Debug, Clone, Serialize, Deserialize)]
+struct TargetIdentitySnapshot {
+    id: i32,
+    uuid: String,
+    name: String,
+    metadata_before: serde_json::Value,
+    metadata_after: Option<serde_json::Value>,
+}
+
+#[derive(Debug, Clone, Serialize, Deserialize)]
+struct AliasEntry {
+    name: String,
+    locale: String,
+    source: Option<String>,
+}
+
+#[derive(Debug, Clone, Serialize, Deserialize)]
+struct FacesTransferred {
+    file_uuid: String,
+    face_ids: Vec<String>,
+    trace_ids: Vec<i32>,
+    count: i64,
+}
+
+#[derive(Debug, Clone, Serialize, Deserialize)]
+struct MergeParams {
+    keep_history: bool,
+    cleared_stranger_id: bool,
+    performed_by_user: Option<String>,
+}
+
+#[derive(Debug, Clone, Serialize, Deserialize)]
+struct IdentityMergeHistory {
+    #[serde(rename = "_id", skip_serializing_if = "Option::is_none")]
+    id: Option<bson::oid::ObjectId>,
+    merge_id: String,
+    source_identity: IdentitySnapshot,
+    target_identity: TargetIdentitySnapshot,
+    aliases_added_to_target: Vec<AliasEntry>,
+    metadata_fields_added: Vec<String>,
+    faces_transferred: FacesTransferred,
+    merge_params: MergeParams,
+    #[serde(with = "bson::serde_helpers::chrono_datetime_as_bson_datetime")]
+    merged_at: DateTime<Utc>,
+    #[serde(with = "bson::serde_helpers::chrono_datetime_as_bson_datetime")]
+    undo_deadline: DateTime<Utc>,
+    undone: bool,
+    #[serde(
+        with = "bson::serde_helpers::chrono_datetime_as_bson_datetime_optional",
+        skip_serializing_if = "Option::is_none"
+    )]
+    undone_at: Option<DateTime<Utc>>,
+    undone_by: Option<String>,
+    undone_snapshot: Option<serde_json::Value>,
+    undo_expired: bool,
+}
+
+/// Deserializes a hand-built merge-history BSON document into `IdentityMergeHistory` and prints the outcome.
+fn main() {
+    let doc = bson!({
+        "merge_id": "test-id",
+        "source_identity": {
+            "id": bson::Bson::Int32(21),
+            "uuid": "test-uuid",
+            "name": "Test",
+            "identity_type": "people",
+            "source": "tmdb",
+            "status": "confirmed",
+            "tmdb_id": bson::Bson::Int32(123),
+            "tmdb_profile": bson::Bson::Null,
+            "metadata": {},
+            "created_at": bson::Bson::DateTime(bson::DateTime::from_millis(1714641951963)),
+            "face_count": bson::Bson::Int64(0)
+        },
+        "target_identity": {
+            "id": bson::Bson::Int32(22),
+            "uuid": "target-uuid",
+            "name": "Target",
+            "metadata_before": {},
+            "metadata_after": bson::Bson::Null
+        },
+        "aliases_added_to_target": [],
+        "metadata_fields_added": [],
+        "faces_transferred": {
+            "file_uuid": "",
+            "face_ids": [],
+            "trace_ids": [],
+            "count": bson::Bson::Int64(0)
+        },
+        "merge_params": {
+            "keep_history": false,
+            "cleared_stranger_id": true,
+            "performed_by_user": "0"
+        },
+        "merged_at": bson::Bson::DateTime(bson::DateTime::from_millis(1714641951963)),
+        "undo_deadline": bson::Bson::DateTime(bson::DateTime::from_millis(1714641951963)),
+        "undone": false,
+        "undone_at": bson::Bson::Null,
+        "undone_by": bson::Bson::Null,
+        "undone_snapshot": bson::Bson::Null,
+        "undo_expired": false
+    });
+
+    match bson::from_bson::<IdentityMergeHistory>(doc) {
+        Ok(history) => println!("Success! {:?}", history.merge_id),
+        Err(err) => println!("Error: {}", err),
+    }
+}
diff --git a/src/bin/test_number_types.rs b/src/bin/test_number_types.rs
new file mode 100644
index 0000000..48859ff
--- /dev/null
+++ b/src/bin/test_number_types.rs
@@ -0,0 +1,31 @@
+use bson::bson;
+use serde::{Deserialize, Serialize};
+
+#[derive(Debug, Clone, Serialize, Deserialize)]
+struct TestId {
+    id: i32,
+    tmdb_id: Option<i32>,
+}
+
+fn main() {
+    // Test Int32
+    let doc_int32 = bson!({
+        "id": bson::Bson::Int32(21),
+        "tmdb_id": bson::Bson::Int32(1100817)
+    });
+
+    let result1: Result<TestId, _> = bson::from_bson(doc_int32);
+    println!("Int32 test: {}", result1.is_ok());
+
+    // Test Double (a JavaScript Number may be stored as this type)
+    let doc_double = bson!({
+        "id": bson::Bson::Double(21.0),
+        "tmdb_id": bson::Bson::Double(1100817.0)
+    });
+
+    let result2: Result<TestId, _> = bson::from_bson(doc_double);
+    println!("Double test: {}", result2.is_ok());
+    if let Err(e) = result2 {
+        println!("Double error: {}", e);
+    }
+}
diff --git a/src/bin/vectorize_missing.rs b/src/bin/vectorize_missing.rs
new file mode 100644
index 0000000..785265f
--- /dev/null
+++ b/src/bin/vectorize_missing.rs
@@ -0,0 +1,122 @@
+use anyhow::{Context, Result};
+use momentry_core::{Database, Embedder, PostgresDb, QdrantDb, VectorPayload};
+use std::time::{Duration, Instant};
+
+/// One-off maintenance tool: embeds the sentence chunks of one hard-coded file
+/// that have no embedding yet, then calls `pg.store_vector` and `qdrant.upsert_vector`.
+///
+/// A failure at any per-chunk step (embedding, PostgreSQL store, Qdrant upsert)
+/// is logged to stderr, counted, and the chunk is skipped.
+#[tokio::main]
+async fn main() -> Result<()> {
+    dotenv::from_filename("/Users/accusys/momentry_core_0.1/.env.development").ok();
+    tracing_subscriber::fmt::init();
+
+    let pg = PostgresDb::init().await.context("Failed to init PostgreSQL")?;
+    let qdrant = QdrantDb::new();
+    let embedder = Embedder::new("embeddinggemma-300m".to_string());
+
+    let uuid = "63acd3bb02b5b9dfbb9d6db499fcc864";
+    let chunk_table = momentry_core::core::db::schema::table_name("chunk");
+
+    let select_sql = format!(
+        "SELECT chunk_id, text_content, start_frame, end_frame, \
+         start_time, end_time, content::text \
+         FROM {} \
+         WHERE file_uuid = $1 \
+           AND chunk_type = 'sentence' \
+           AND embedding IS NULL \
+           AND (text_content IS NOT NULL AND text_content != '') \
+         ORDER BY id",
+        chunk_table
+    );
+    let rows = sqlx::query_as::<_, (String, String, i64, i64, f64, f64, String)>(&select_sql)
+        .bind(uuid)
+        .fetch_all(pg.pool())
+        .await?;
+
+    let total = rows.len();
+    println!("Found {} sentence chunks without embedding for {}", total, uuid);
+
+    if total == 0 {
+        println!("Nothing to vectorize. Exiting.");
+        return Ok(());
+    }
+
+    let start = Instant::now();
+    let mut stored = 0usize;
+    let mut errors = 0usize;
+
+    for (chunk_id, text, start_frame, end_frame, start_time, end_time, _content_str) in &rows {
+        if text.is_empty() {
+            continue;
+        }
+
+        // Step 1: embed the sentence text.
+        let vector = match embedder.embed_document(text).await {
+            Ok(v) => v,
+            Err(e) => {
+                eprintln!("[ERROR] Embedding failed for {}: {}", chunk_id, e);
+                errors += 1;
+                continue;
+            }
+        };
+
+        // Step 2: hand the vector to PostgreSQL.
+        if let Err(e) = pg.store_vector(chunk_id, &vector, uuid).await {
+            eprintln!("[ERROR] PG store failed for {}: {}", chunk_id, e);
+            errors += 1;
+            continue;
+        }
+
+        // Step 3: upsert the same vector, with its chunk payload, into Qdrant.
+        let payload = VectorPayload {
+            file_uuid: uuid.to_string(),
+            chunk_id: chunk_id.clone(),
+            chunk_type: "sentence".to_string(),
+            start_frame: *start_frame,
+            end_frame: *end_frame,
+            start_time: *start_time,
+            end_time: *end_time,
+            text: Some(text.clone()),
+        };
+        if let Err(e) = qdrant.upsert_vector(chunk_id, &vector, payload).await {
+            eprintln!("[ERROR] Qdrant upsert failed for {}: {}", chunk_id, e);
+            errors += 1;
+            continue;
+        }
+
+        stored += 1;
+        if stored % 500 == 0 || stored == total {
+            let elapsed = start.elapsed();
+            let rate = stored as f64 / elapsed.as_secs_f64();
+            let eta = if stored < total {
+                let remaining = Duration::from_secs_f64((total - stored) as f64 / rate);
+                format!(" (ETA: {}s)", remaining.as_secs())
+            } else {
+                String::new()
+            };
+            println!(
+                "  [{}/{}] {:.1}% done | {:.0} vec/s | {} errors{}",
+                stored,
+                total,
+                100.0 * stored as f64 / total as f64,
+                rate,
+                errors,
+                eta,
+            );
+        }
+    }
+
+    let elapsed = start.elapsed();
+    println!(
+        "\nDone! {}/{} vectors stored ({} errors) in {:.1}s ({:.0} vec/s avg)",
+        stored,
+        total,
+        errors,
+        elapsed.as_secs_f64(),
+        stored as f64 / elapsed.as_secs_f64(),
+    );
+
+    Ok(())
+}
diff --git a/src/core/chunk/rule3_ingest.rs b/src/core/chunk/rule3_ingest.rs
index 58d5726..af66b91 100644
--- a/src/core/chunk/rule3_ingest.rs
+++ b/src/core/chunk/rule3_ingest.rs
@@ -1,6 +1,5 @@
 use crate::core::config::OUTPUT_DIR;
 use crate::core::db::schema;
-use crate::core::llm::client::generate_5w1h_summary;
 use anyhow::{Context, Result};
 use serde::Deserialize;
 use sqlx::PgPool;
@@ -115,19 +114,6 @@ pub async fn ingest_rule3(pool: &PgPool, file_uuid: &str) -> Result<usize> {
 
         let aggregated_text = texts.join(" ");
 
-        // 3. Call LLM for Summary
-        let summary = if !aggregated_text.is_empty() {
-            match generate_5w1h_summary(&aggregated_text).await {
-                Ok(s) => s,
-                Err(e) => {
-                    warn!("LLM Summary failed for scene {}: {}", scene.scene_number, e);
-                    "LLM Error".to_string()
-                }
-            }
-        } else {
-            "No Audio".to_string()
-        };
-
         info!(
             "Scene {}: {} -> {} ({} sentences)",
             scene.scene_number,
@@ -168,7 +154,7 @@ pub async fn ingest_rule3(pool: &PgPool, file_uuid: &str) -> Result<usize> {
         .bind(scene.end_frame as i64)
         .bind(&metadata)
         .bind(&aggregated_text)
-        .bind(&summary)
+        .bind(&String::new())
         .bind(&metadata)
         .bind(&child_ids)
         .execute(&mut *tx)
diff --git a/src/core/chunk/types.rs b/src/core/chunk/types.rs
index 0aa9ec6..fb5b09f 100644
--- a/src/core/chunk/types.rs
+++ b/src/core/chunk/types.rs
@@ -1,7 +1,6 @@
 use crate::core::time::FrameTime;
 use serde::{Deserialize, Serialize};
 
-// ==================== ChunkType ====================
 #[derive(Debug, Clone, Copy, Serialize, Deserialize, PartialEq)]
 #[serde(rename_all = "snake_case")]
 pub enum ChunkType {
@@ -10,7 +9,6 @@ pub enum ChunkType {
     Cut,
     Trace,
     Story,
-    Visual, // 視覺分片 (Phase 2.1)
 }
 
 impl ChunkType {
@@ -21,17 +19,15 @@ impl ChunkType {
             ChunkType::Cut => "cut",
             ChunkType::Trace => "trace",
             ChunkType::Story => "story",
-            ChunkType::Visual => "visual",
         }
     }
 }
 
-// ==================== ChunkRule ====================
 #[derive(Debug, Clone, Copy, Serialize, Deserialize, PartialEq)]
 #[serde(rename_all = "snake_case")]
 pub enum ChunkRule {
-    Rule1, // 直接轉換
-    Rule2, // 集合內容
+    Rule1,
+    Rule2,
 }
 
 impl ChunkRule {
@@ -43,73 +39,6 @@ impl ChunkRule {
     }
 }
 
-// ==================== 視覺分片相關結構 (Phase 2.1) ====================
-/// 邊界框
-#[derive(Debug, Clone, Serialize, Deserialize)]
-pub struct BoundingBox {
-    pub x: i32,
-    pub y: i32,
-    pub width: i32,
-    pub height: i32,
-}
-
-/// 檢測到的物件
-#[derive(Debug, Clone, Serialize, Deserialize)]
-pub struct DetectedObject {
-    /// 物件類別名稱
-    pub class_name: String,
-    /// 物件類別 ID
-    pub class_id: u32,
-    /// 信心值 (0.0-1.0)
-    pub confidence: f32,
-    /// 邊界框
-    pub bbox: Option<BoundingBox>,
-    /// 出現次數 (在分片內)
-    pub occurrence: u32,
-}
-
-/// 關鍵幀的物件列表
-#[derive(Debug, Clone, Serialize, Deserialize)]
-pub struct KeyframeObjects {
-    /// 關鍵幀時間 (秒) - 僅供參考，主要使用 frame_number
-    pub timestamp: f64,
-    /// 關鍵幀幀號 - 主要時間標示
-    pub frame_number: u64,
-    /// 檢測到的物件
-    pub objects: Vec<DetectedObject>,
-}
-
-/// 視覺元數據
-#[derive(Debug, Clone, Serialize, Deserialize)]
-pub struct VisualMetadata {
-    /// 總物件數量
-    pub object_count: u32,
-    /// 唯一物件類別列表
-    pub unique_classes: Vec<String>,
-    /// 最高信心值
-    pub max_confidence: f32,
-    /// 平均信心值
-    pub avg_confidence: f32,
-    /// 空間密度（每幀平均物件數）
-    pub spatial_density: f32,
-}
-
-/// 視覺分片內容
-#[derive(Debug, Clone, Serialize, Deserialize)]
-pub struct VisualChunkContent {
-    /// 關鍵幀物件列表，每個關鍵幀包含 frame_number
-    pub keyframe_objects: Vec<KeyframeObjects>,
-    /// 主要物件標籤（出現在大多數幀中的物件）
-    pub dominant_objects: Vec<String>,
-    /// 物件關係 (object1, relationship, object2) - 可選
-    pub object_relationships: Vec<(String, String, String)>,
-    /// 場景描述 - 可選
-    pub scene_description: Option<String>,
-    /// 視覺元數據
-    pub metadata: VisualMetadata,
-}
-
-// ==================== Chunk 主結構 ====================
 #[derive(Debug, Clone, Serialize, Deserialize)]
 pub struct Chunk {
     pub file_id: i32,
@@ -117,11 +46,8 @@ pub struct Chunk {
     pub chunk_id: String,
     pub chunk_type: ChunkType,
     pub rule: ChunkRule,
-    /// Frames per second (can be fractional, e.g., 29.97, 23.976)
     pub fps: f64,
-    /// Start frame (0-based) - 主要時間標示
     pub start_frame: i64,
-    /// End frame (exclusive) - 主要時間標示
     pub end_frame: i64,
     pub text_content: Option<String>,
     pub content: serde_json::Value,
@@ -129,13 +55,11 @@ pub struct Chunk {
     pub vector_id: Option<String>,
     pub frame_count: i32,
     pub pre_chunk_ids: Vec<i32>,
-    pub parent_chunk_id: Option<String>, // For parent-child chunk hierarchy
-    pub child_chunk_ids: Vec<String>,    // Child chunk IDs (for parent chunks)
-    pub visual_stats: Option<serde_json::Value>,
+    pub parent_chunk_id: Option<String>,
+    pub child_chunk_ids: Vec<String>,
 }
 
 impl Chunk {
-    /// 創建新分片
     pub fn new(
         file_id: i32,
         uuid: String,
@@ -166,167 +90,17 @@ impl Chunk {
             pre_chunk_ids: vec![],
             parent_chunk_id: None,
             child_chunk_ids: vec![],
-            visual_stats: None,
         }
     }
 
-    /// 創建視覺分片 (Phase 2.1)
-    pub fn new_visual(
-        file_id: i32,
-        uuid: String,
-        chunk_id: String,
-        start_frame: i64,
-        end_frame: i64,
-        fps: f64,
-        visual_content: VisualChunkContent,
-    ) -> Self {
-        let content = serde_json::to_value(&visual_content)
-            .unwrap_or_else(|_| serde_json::json!({"error": "Failed to serialize visual content"}));
-
-        Self::new(
-            file_id,
-            uuid,
-            chunk_id,
-            ChunkType::Visual,
-            ChunkRule::Rule2,
-            start_frame,
-            end_frame,
-            fps,
-            content,
-        )
-    }
-
-    /// 從 YOLO 幀創建視覺分片 (Phase 2.1)
-    pub fn from_yolo_frames(
-        file_id: i32,
-        uuid: String,
-        chunk_id: String,
-        start_frame: i64,
-        end_frame: i64,
-        fps: f64,
-        yolo_frames: Vec<crate::core::processor::yolo::YoloFrame>,
-    ) -> Self {
-        // 將 YOLO 幀轉換為關鍵幀物件
-        let keyframe_objects: Vec<KeyframeObjects> = yolo_frames
-            .iter()
-            .map(|frame| {
-                let objects: Vec<DetectedObject> = frame
-                    .objects
-                    .iter()
-                    .map(|obj| DetectedObject {
-                        class_name: obj.class_name.clone(),
-                        class_id: obj.class_id,
-                        confidence: obj.confidence,
-                        bbox: Some(BoundingBox {
-                            x: obj.x,
-                            y: obj.y,
-                            width: obj.width,
-                            height: obj.height,
-                        }),
-                        occurrence: 1,
-                    })
-                    .collect();
-
-                KeyframeObjects {
-                    timestamp: frame.timestamp,
-                    frame_number: frame.frame,
-                    objects,
-                }
-            })
-            .collect();
-
-        // 計算物件統計
-        let total_objects: u32 = yolo_frames.iter().map(|f| f.objects.len() as u32).sum();
-
-        // 收集所有物件類別
-        let all_classes: Vec<String> = yolo_frames
-            .iter()
-            .flat_map(|f| f.objects.iter().map(|o| o.class_name.clone()))
-            .collect();
-
-        // 獲取唯一類別
-        let unique_classes: Vec<String> = all_classes
-            .iter()
-            .cloned()
-            .collect::<std::collections::HashSet<_>>()
-            .into_iter()
-            .collect();
-
-        // 計算信心值統計
-        let confidences: Vec<f32> = yolo_frames
-            .iter()
-            .flat_map(|f| f.objects.iter().map(|o| o.confidence))
-            .collect();
-
-        let max_confidence = confidences.iter().copied().fold(0.0f32, f32::max);
-        let avg_confidence = if !confidences.is_empty() {
-            confidences.iter().sum::<f32>() / confidences.len() as f32
-        } else {
-            0.0
-        };
-
-        // 計算主要物件（出現在大多數幀中的物件）
-        let mut object_counts = std::collections::HashMap::new();
-        for frame in &yolo_frames {
-            let frame_classes: std::collections::HashSet<_> =
-                frame.objects.iter().map(|o| o.class_name.clone()).collect();
-            for class in frame_classes {
-                *object_counts.entry(class).or_insert(0) += 1;
-            }
-        }
-
-        let mut dominant_objects: Vec<String> = object_counts
-            .into_iter()
-            .filter(|(_, count)| *count as f32 / yolo_frames.len() as f32 > 0.5)
-            .map(|(class, _)| class)
-            .collect();
-        dominant_objects.sort();
-
-        // 創建視覺內容
-        let visual_content = VisualChunkContent {
-            keyframe_objects,
-            dominant_objects,
-            object_relationships: vec![], // 可選：後期添加關係檢測
-            scene_description: None,      // 可選：後期添加 LLM 生成的場景描述
-            metadata: VisualMetadata {
-                object_count: total_objects,
-                unique_classes,
-                max_confidence,
-                avg_confidence,
-                spatial_density: if yolo_frames.len() > 0 {
-                    total_objects as f32 / yolo_frames.len() as f32
-                } else {
-                    0.0
-                },
-            },
-        };
-
-        Self::new_visual(
-            file_id,
-            uuid,
-            chunk_id,
-            start_frame,
-            end_frame,
-            fps,
-            visual_content,
-        )
-    }
-
-    /// 將分片轉換為幀時間
     pub fn to_frame_time(&self) -> FrameTime {
-        // 使用第一個幀作為參考點
         FrameTime::from_frames(self.start_frame, self.fps)
     }
 
-    /// 檢查是否是父分片
     pub fn is_parent(&self) -> bool {
         self.parent_chunk_id.is_some()
     }
 
-    /// 從秒數創建新分片（舊版轉換）
-    ///
-    /// 這對於從存儲時間為秒的舊系統遷移很有用。
-    /// 幀數通過舍入 `seconds * fps` 計算。
     #[allow(clippy::too_many_arguments)]
     pub fn from_seconds(
         file_id: i32,
@@ -354,197 +128,82 @@ impl Chunk {
         )
     }
 
-    /// 返回開始時間為 `FrameTime`
     pub fn start_time(&self) -> FrameTime {
         FrameTime::from_frames(self.start_frame, self.fps)
     }
 
-    /// 返回結束時間為 `FrameTime`
     pub fn end_time(&self) -> FrameTime {
         FrameTime::from_frames(self.end_frame, self.fps)
     }
 
-    /// 返回持續時間的幀數
     pub fn duration_frames(&self) -> i64 {
         self.end_frame - self.start_frame
     }
 
-    /// 返回持續時間的秒數
     pub fn duration_seconds(&self) -> f64 {
         self.duration_frames() as f64 / self.fps
     }
 
-    /// 將開始時間格式化為 "seconds.frame" (例如："123.04")
     pub fn format_start_sec_frame(&self) -> String {
         self.start_time().format_sec_frame()
     }
 
-    /// 將結束時間格式化為 "seconds.frame" (例如："456.15")
     pub fn format_end_sec_frame(&self) -> String {
         self.end_time().format_sec_frame()
     }
 
-    /// 將開始時間格式化為 "HH:MM:SS"
     pub fn format_start_hms(&self) -> String {
         self.start_time().format_hms()
     }
 
-    /// 將結束時間格式化為 "HH:MM:SS"
     pub fn format_end_hms(&self) -> String {
         self.end_time().format_hms()
     }
 
-    /// 將開始時間格式化為 "HH:MM:SS.FF"
     pub fn format_start_hms_frame(&self) -> String {
         self.start_time().format_hms_frame()
     }
 
-    /// 將結束時間格式化為 "HH:MM:SS.FF"
     pub fn format_end_hms_frame(&self) -> String {
         self.end_time().format_hms_frame()
     }
 
-    /// 返回 (start_seconds, end_seconds) 元組用於兼容性
-    ///
-    /// 這在遷移期間提供向後兼容性。
-    /// 建議使用 `start_time()` 和 `end_time()` 方法。
     pub fn time_range_seconds(&self) -> (f64, f64) {
         (self.start_time().seconds(), self.end_time().seconds())
     }
 
-    /// 添加元數據
     pub fn with_metadata(mut self, metadata: serde_json::Value) -> Self {
         self.metadata = Some(metadata);
         self
     }
 
-    /// 添加向量 ID
     pub fn with_vector_id(mut self, vector_id: String) -> Self {
         self.vector_id = Some(vector_id);
         self
     }
 
-    /// 添加文本內容
     pub fn with_text_content(mut self, text: String) -> Self {
         self.text_content = Some(text);
         self
     }
 
-    /// 設置幀數
     pub fn with_frame_count(mut self, count: i32) -> Self {
         self.frame_count = count;
         self
     }
 
-    /// 設置前一個分片 ID
     pub fn with_pre_chunk_ids(mut self, ids: Vec<i32>) -> Self {
         self.pre_chunk_ids = ids;
         self
     }
 
-    /// 設置父分片 ID
     pub fn with_parent_chunk_id(mut self, parent_id: String) -> Self {
         self.parent_chunk_id = Some(parent_id);
         self
     }
 
-    /// 設置子分片 ID
     pub fn with_child_chunk_ids(mut self, child_ids: Vec<String>) -> Self {
         self.child_chunk_ids = child_ids;
         self
     }
 }
-
-// ==================== VisualChunkContent 輔助方法 ====================
-impl VisualChunkContent {
-    /// 計算兩個 YOLO 幀之間的相似度（基於物件組成）
-    pub fn frame_similarity(
-        frame1: &crate::core::processor::yolo::YoloFrame,
-        frame2: &crate::core::processor::yolo::YoloFrame,
-    ) -> f32 {
-        if frame1.objects.is_empty() && frame2.objects.is_empty() {
-            return 1.0; // 兩個空幀完全相似
-        }
-
-        if frame1.objects.is_empty() || frame2.objects.is_empty() {
-            return 0.0; // 一個空一個非空，不相似
-        }
-
-        // 創建物件類別名稱集合
-        let set1: std::collections::HashSet<String> = frame1
-            .objects
-            .iter()
-            .map(|o| o.class_name.clone())
-            .collect();
-        let set2: std::collections::HashSet<String> = frame2
-            .objects
-            .iter()
-            .map(|o| o.class_name.clone())
-            .collect();
-
-        // 計算 Jaccard 相似度
-        let intersection: Vec<_> = set1.intersection(&set2).collect();
-        let union: Vec<_> = set1.union(&set2).collect();
-
-        if union.is_empty() {
-            0.0
-        } else {
-            intersection.len() as f32 / union.len() as f32
-        }
-    }
-
-    /// 獲取視覺分片的摘要（使用關鍵幀的 frame_number）
-    pub fn summary(&self, fps: f64) -> String {
-        if self.keyframe_objects.is_empty() {
-            return "Empty visual chunk".to_string();
-        }
-
-        let first_frame = self.keyframe_objects.first().unwrap().frame_number;
-        let last_frame = self.keyframe_objects.last().unwrap().frame_number;
-
-        // 計算時間（僅供參考）
-        let start_time = if fps > 0.0 {
-            first_frame as f64 / fps
-        } else {
-            0.0
-        };
-        let end_time = if fps > 0.0 {
-            last_frame as f64 / fps
-        } else {
-            0.0
-        };
-        let duration = end_time - start_time;
-        let frame_count = self.keyframe_objects.len();
-
-        format!(
-            "Visual chunk: frames {} to {} (duration: {:.1}s, {} frames). Objects: {} total, {} unique. Dominant: {}",
-            first_frame,
-            last_frame,
-            duration,
-            frame_count,
-            self.metadata.object_count,
-            self.metadata.unique_classes.len(),
-            if self.dominant_objects.is_empty() {
-                "none".to_string()
-            } else {
-                self.dominant_objects.join(", ")
-            }
-        )
-    }
-
-    /// 檢查是否包含特定物件類別
-    pub fn contains_object(&self, class_name: &str) -> bool {
-        self.keyframe_objects
-            .iter()
-            .any(|ko| ko.objects.iter().any(|obj| obj.class_name == class_name))
-    }
-
-    /// 獲取信心值高於閾值的所有物件
-    pub fn high_confidence_objects(&self, threshold: f32) -> Vec<&DetectedObject> {
-        self.keyframe_objects
-            .iter()
-            .flat_map(|ko| ko.objects.iter())
-            .filter(|obj| obj.confidence >= threshold)
-            .collect()
-    }
-}
diff --git a/src/core/config.rs b/src/core/config.rs
index 78104f4..3612bb3 100644
--- a/src/core/config.rs
+++ b/src/core/config.rs
@@ -56,7 +56,7 @@ pub static REDIS_URL: Lazy<String> = Lazy::new(|| {
     env::var("REDIS_URL").unwrap_or_else(|_| {
         let password = env::var("REDIS_PASSWORD").unwrap_or_else(|_| "accusys".to_string());
         // Format: redis://[:password]@host:port (use default user)
-        format!("redis://:{}@localhost:6379", password)
+        format!("redis://default:{}@localhost:6379", password)
     })
 });
 
@@ -277,12 +277,14 @@ pub mod llm {
 }
 
 /// Ollama embedding endpoint (vector embeddings for text sync).
-pub static OLLAMA_URL: Lazy<String> =
-    Lazy::new(|| env::var("MOMENTRY_OLLAMA_URL").unwrap_or_else(|_| "http://127.0.0.1:11434".to_string()));
+pub static OLLAMA_URL: Lazy<String> = Lazy::new(|| {
+    env::var("MOMENTRY_OLLAMA_URL").unwrap_or_else(|_| "http://127.0.0.1:11434".to_string())
+});
 
 /// Text embedding server (comic-embed or alternative).
-pub static EMBED_URL: Lazy<String> =
-    Lazy::new(|| env::var("MOMENTRY_EMBED_URL").unwrap_or_else(|_| "http://127.0.0.1:11436".to_string()));
+pub static EMBED_URL: Lazy<String> = Lazy::new(|| {
+    env::var("MOMENTRY_EMBED_URL").unwrap_or_else(|_| "http://127.0.0.1:11436".to_string())
+});
 
 /// LLM health endpoint.
 pub static LLM_HEALTH_URL: Lazy<String> = Lazy::new(|| {
diff --git a/src/core/db/identity_merge_history.rs b/src/core/db/identity_merge_history.rs
new file mode 100644
index 0000000..d8c9f71
--- /dev/null
+++ b/src/core/db/identity_merge_history.rs
@@ -0,0 +1,604 @@
+use anyhow::{Context, Result};
+use bson::{doc, oid::ObjectId, DateTime as BsonDateTime, Document};
+use chrono::{DateTime, Utc};
+use mongodb::{Client, Collection, Database, IndexModel};
+use serde::{Deserialize, Serialize};
+use serde_json::Value as JsonValue;
+use uuid::Uuid;
+
+const COLLECTION_NAME: &str = "identity_merge_history";
+
+/// Converts a BSON document into relaxed Extended JSON.
+///
+/// If the document cannot be turned into a `Bson` value the error is dropped
+/// and `JsonValue::Null` is returned.
+///
+/// NOTE(review): no caller of this helper is visible in this file — confirm
+/// whether it is still needed.
+fn bson_doc_to_json(doc: &Document) -> JsonValue {
+    bson::to_bson(doc)
+        .map(|value| value.into_relaxed_extjson())
+        .unwrap_or(JsonValue::Null)
+}
+
+/// Serializes a JSON value into a BSON document.
+///
+/// If `bson::to_document` fails, the error is discarded and an empty
+/// document is returned instead.
+///
+/// NOTE(review): no caller of this helper is visible in this file — confirm
+/// whether it is still needed.
+fn json_value_to_bson_doc(value: &JsonValue) -> Document {
+    bson::to_document(value).unwrap_or_default()
+}
+
+/// Reads `key` from `doc` and returns it as relaxed Extended JSON.
+///
+/// A missing key yields `JsonValue::Null`.
+fn doc_field_to_json(doc: &Document, key: &str) -> JsonValue {
+    match doc.get(key) {
+        Some(value) => value.clone().into_relaxed_extjson(),
+        None => JsonValue::Null,
+    }
+}
+
+/// Converts a JSON value into a BSON value.
+///
+/// If `bson::to_bson` fails, the error is discarded and `Bson::Null` is
+/// returned instead.
+fn json_to_bson(value: &JsonValue) -> bson::Bson {
+    bson::to_bson(value).unwrap_or(bson::Bson::Null)
+}
+
+/// One identity-merge record as persisted in the `identity_merge_history`
+/// MongoDB collection.
+///
+/// Written with [`IdentityMergeHistory::to_document`] and read back with
+/// [`IdentityMergeHistory::from_document`].
+#[derive(Debug, Clone)]
+pub struct IdentityMergeHistory {
+    /// MongoDB `_id`; `to_document` only writes it when it is `Some`.
+    pub id: Option<ObjectId>,
+    /// Lookup key for the record; the store keeps a unique index on it.
+    pub merge_id: String,
+    /// Stored as the `source_identity` sub-document.
+    pub source_identity: IdentitySnapshot,
+    /// Stored as the `target_identity` sub-document.
+    pub target_identity: TargetIdentitySnapshot,
+    /// Stored as the `aliases_added_to_target` array.
+    pub aliases_added_to_target: Vec<AliasEntry>,
+    /// Stored as the `metadata_fields_added` array of strings.
+    pub metadata_fields_added: Vec<String>,
+    /// Stored as the `faces_transferred` sub-document.
+    pub faces_transferred: FacesTransferred,
+    /// Stored as the `merge_params` sub-document.
+    pub merge_params: MergeParams,
+    /// Stored as a BSON datetime under `merged_at`.
+    pub merged_at: DateTime<Utc>,
+    /// Compared against the current time by
+    /// `IdentityMergeHistoryStore::check_undo_deadline` and
+    /// `IdentityMergeHistoryStore::mark_expired_merges`.
+    pub undo_deadline: DateTime<Utc>,
+    /// Set to `true` by `IdentityMergeHistoryStore::mark_as_undone` and back
+    /// to `false` by `IdentityMergeHistoryStore::mark_as_redone`.
+    pub undone: bool,
+    /// Timestamp written by `mark_as_undone`; reset to null by `mark_as_redone`.
+    pub undone_at: Option<DateTime<Utc>>,
+    /// Caller-supplied value written by `mark_as_undone`; `mark_as_redone`
+    /// overwrites it with its own `redone_by` argument.
+    pub undone_by: Option<String>,
+    /// Written by `mark_as_undone`; reset to null by `mark_as_redone`.
+    pub undone_snapshot: Option<UndoneSnapshot>,
+    /// Set to `true` by `mark_expired_merges` for records that are not undone
+    /// and whose `undo_deadline` lies in the past.
+    pub undo_expired: bool,
+}
+
+/// Fields of the merge's source identity, stored as the `source_identity`
+/// sub-document of an [`IdentityMergeHistory`] record.
+///
+/// NOTE(review): presumably captured before the merge so the identity can be
+/// restored on undo — confirm against the code that builds this value.
+#[derive(Debug, Clone)]
+pub struct IdentitySnapshot {
+    pub id: i64,
+    pub uuid: String,
+    pub name: String,
+    pub identity_type: Option<String>,
+    pub source: Option<String>,
+    pub status: String,
+    pub tmdb_id: Option<i64>,
+    pub tmdb_profile: Option<String>,
+    /// Arbitrary JSON; converted to BSON when the record is written.
+    pub metadata: JsonValue,
+    pub created_at: Option<DateTime<Utc>>,
+    pub face_count: i64,
+}
+
+/// Fields of the merge's target identity, stored as the `target_identity`
+/// sub-document of an [`IdentityMergeHistory`] record.
+#[derive(Debug, Clone)]
+pub struct TargetIdentitySnapshot {
+    pub id: i64,
+    pub uuid: String,
+    pub name: String,
+    /// Stored under `metadata_before`.
+    /// NOTE(review): presumably the target's metadata prior to the merge — confirm.
+    pub metadata_before: JsonValue,
+    /// Stored under `metadata_after`; written as BSON null when `None`.
+    pub metadata_after: Option<JsonValue>,
+}
+
+/// One element of the `aliases_added_to_target` array of a merge record.
+#[derive(Debug, Clone, Serialize, Deserialize)]
+pub struct AliasEntry {
+    pub name: String,
+    /// `IdentityMergeHistory::from_document` falls back to `"en"` when the
+    /// stored alias has no string `locale`.
+    pub locale: String,
+    /// Left out of serde output entirely when `None`.
+    #[serde(skip_serializing_if = "Option::is_none")]
+    pub source: Option<String>,
+}
+
+/// Contents of the `faces_transferred` sub-document of a merge record.
+#[derive(Debug, Clone, Serialize, Deserialize)]
+pub struct FacesTransferred {
+    pub file_uuid: String,
+    /// When read back from MongoDB, only string entries of the stored array are kept.
+    pub face_ids: Vec<String>,
+    /// When read back from MongoDB, only 32-bit integer entries of the stored array are kept.
+    pub trace_ids: Vec<i32>,
+    /// Stored separately from the id lists; this is the value surfaced as
+    /// `MergeHistoryEntry::faces_transferred` in list queries.
+    pub count: i64,
+}
+
+/// Data recorded under `undone_snapshot` when a merge is marked as undone
+/// (see `IdentityMergeHistoryStore::mark_as_undone`).
+#[derive(Debug, Clone)]
+pub struct UndoneSnapshot {
+    pub source_identity_id: i64,
+    pub source_uuid: String,
+    pub source_name: String,
+    /// Arbitrary JSON; converted to BSON when written.
+    pub target_metadata_at_undo: JsonValue,
+}
+
+/// Contents of the `merge_params` sub-document of a merge record.
+///
+/// `IdentityMergeHistory::from_document` defaults both booleans to `true`
+/// when they are missing from the stored document.
+#[derive(Debug, Clone, Serialize, Deserialize)]
+pub struct MergeParams {
+    pub keep_history: bool,
+    pub cleared_stranger_id: bool,
+    pub performed_by_user: Option<String>,
+}
+
+/// Optional filters for `IdentityMergeHistoryStore::query_merge_history`.
+///
+/// Every field that is `Some` becomes an equality condition in the MongoDB
+/// filter; fields left as `None` do not restrict the result.
+#[derive(Debug, Clone, Serialize, Deserialize)]
+pub struct MergeHistoryQuery {
+    /// Matched against `source_identity.uuid`.
+    pub source_uuid: Option<String>,
+    /// Matched against `target_identity.uuid`.
+    pub target_uuid: Option<String>,
+    /// Matched against `merge_id`.
+    pub merge_id: Option<String>,
+    /// Matched against `undone`.
+    pub undone: Option<bool>,
+}
+
+/// Summary of one merge record as returned by
+/// `IdentityMergeHistoryStore::query_merge_history`.
+#[derive(Debug, Clone, Serialize, Deserialize)]
+pub struct MergeHistoryEntry {
+    pub merge_id: String,
+    /// Taken from `source_identity.name`.
+    pub source_name: String,
+    /// Taken from `target_identity.name`.
+    pub target_name: String,
+    /// Taken from `faces_transferred.count`.
+    pub faces_transferred: i64,
+    pub merged_at: DateTime<Utc>,
+    pub undo_deadline: DateTime<Utc>,
+    pub undone: bool,
+    pub undo_expired: bool,
+}
+
+impl IdentityMergeHistory {
+    /// Rebuilds a merge-history record from its stored BSON document.
+    ///
+    /// `source_identity`, `target_identity` and `faces_transferred` must be
+    /// present as sub-documents. Every other field is read leniently: a
+    /// missing or wrongly-typed value falls back to a default (empty string,
+    /// `0`, `false`, `None`, an empty list, or the default `DateTime<Utc>`),
+    /// except that both `merge_params` booleans default to `true` and an
+    /// alias `locale` defaults to `"en"`.
+    ///
+    /// # Errors
+    ///
+    /// Returns an error if any of the three required sub-documents is missing.
+    pub fn from_document(doc: &Document) -> Result<Self> {
+        let source = doc
+            .get_document("source_identity")
+            .context("Missing source_identity")?;
+        let target = doc
+            .get_document("target_identity")
+            .context("Missing target_identity")?;
+        let faces = doc
+            .get_document("faces_transferred")
+            .context("Missing faces_transferred")?;
+        // Optional sub-document; `None` makes every parameter take its default.
+        let merge_params = doc.get_document("merge_params").ok();
+
+        // Array entries that are not documents are skipped.
+        let aliases_added_to_target: Vec<AliasEntry> = doc
+            .get_array("aliases_added_to_target")
+            .map(|entries| {
+                entries
+                    .iter()
+                    .filter_map(|entry| entry.as_document())
+                    .map(|alias| AliasEntry {
+                        name: alias.get_str("name").unwrap_or("").to_string(),
+                        locale: alias.get_str("locale").unwrap_or("en").to_string(),
+                        source: alias.get_str("source").ok().map(String::from),
+                    })
+                    .collect()
+            })
+            .unwrap_or_default();
+
+        // Array entries that are not strings are skipped.
+        let metadata_fields_added: Vec<String> = doc
+            .get_array("metadata_fields_added")
+            .map(|fields| {
+                fields
+                    .iter()
+                    .filter_map(|field| field.as_str().map(String::from))
+                    .collect()
+            })
+            .unwrap_or_default();
+
+        // Absent (or null, as written by `mark_as_redone`) means "no snapshot".
+        let undone_snapshot = doc
+            .get_document("undone_snapshot")
+            .ok()
+            .map(|snapshot| UndoneSnapshot {
+                source_identity_id: snapshot.get_i64("source_identity_id").unwrap_or(0),
+                source_uuid: snapshot.get_str("source_uuid").unwrap_or("").to_string(),
+                source_name: snapshot.get_str("source_name").unwrap_or("").to_string(),
+                target_metadata_at_undo: doc_field_to_json(snapshot, "target_metadata_at_undo"),
+            });
+
+        Ok(IdentityMergeHistory {
+            id: doc.get_object_id("_id").ok(),
+            merge_id: doc.get_str("merge_id").unwrap_or("").to_string(),
+            source_identity: IdentitySnapshot {
+                id: source.get_i64("id").unwrap_or(0),
+                uuid: source.get_str("uuid").unwrap_or("").to_string(),
+                name: source.get_str("name").unwrap_or("").to_string(),
+                identity_type: source.get_str("identity_type").ok().map(String::from),
+                source: source.get_str("source").ok().map(String::from),
+                status: source.get_str("status").unwrap_or("").to_string(),
+                tmdb_id: source.get_i64("tmdb_id").ok(),
+                tmdb_profile: source.get_str("tmdb_profile").ok().map(String::from),
+                metadata: doc_field_to_json(source, "metadata"),
+                created_at: source
+                    .get_datetime("created_at")
+                    .map(|d| d.to_chrono())
+                    .ok(),
+                face_count: source.get_i64("face_count").unwrap_or(0),
+            },
+            target_identity: TargetIdentitySnapshot {
+                id: target.get_i64("id").unwrap_or(0),
+                uuid: target.get_str("uuid").unwrap_or("").to_string(),
+                name: target.get_str("name").unwrap_or("").to_string(),
+                metadata_before: doc_field_to_json(target, "metadata_before"),
+                metadata_after: target
+                    .get("metadata_after")
+                    .map(|b| b.clone().into_relaxed_extjson()),
+            },
+            aliases_added_to_target,
+            metadata_fields_added,
+            faces_transferred: FacesTransferred {
+                file_uuid: faces.get_str("file_uuid").unwrap_or("").to_string(),
+                face_ids: faces
+                    .get_array("face_ids")
+                    .map(|arr| {
+                        arr.iter()
+                            .filter_map(|b| b.as_str().map(String::from))
+                            .collect()
+                    })
+                    .unwrap_or_default(),
+                trace_ids: faces
+                    .get_array("trace_ids")
+                    .map(|arr| arr.iter().filter_map(|b| b.as_i32()).collect())
+                    .unwrap_or_default(),
+                count: faces.get_i64("count").unwrap_or(0),
+            },
+            merge_params: MergeParams {
+                keep_history: merge_params
+                    .and_then(|p| p.get_bool("keep_history").ok())
+                    .unwrap_or(true),
+                cleared_stranger_id: merge_params
+                    .and_then(|p| p.get_bool("cleared_stranger_id").ok())
+                    .unwrap_or(true),
+                performed_by_user: merge_params
+                    .and_then(|p| p.get_str("performed_by_user").ok())
+                    .map(String::from),
+            },
+            merged_at: doc
+                .get_datetime("merged_at")
+                .map(|d| d.to_chrono())
+                .unwrap_or_default(),
+            undo_deadline: doc
+                .get_datetime("undo_deadline")
+                .map(|d| d.to_chrono())
+                .unwrap_or_default(),
+            undone: doc.get_bool("undone").unwrap_or(false),
+            undone_at: doc.get_datetime("undone_at").map(|d| d.to_chrono()).ok(),
+            undone_by: doc.get_str("undone_by").ok().map(String::from),
+            undone_snapshot,
+            undo_expired: doc.get_bool("undo_expired").unwrap_or(false),
+        })
+    }
+
+    /// Serializes this record into the BSON layout stored in MongoDB.
+    ///
+    /// Optional fields that are `None` are written as BSON null rather than
+    /// being omitted. `_id` is the exception: it is only inserted when
+    /// `self.id` is set.
+    pub fn to_document(&self) -> Document {
+        let source = &self.source_identity;
+        let target = &self.target_identity;
+        let faces = &self.faces_transferred;
+        let params = &self.merge_params;
+
+        let aliases: Vec<Document> = self
+            .aliases_added_to_target
+            .iter()
+            .map(|alias| {
+                doc! {
+                    "name": &alias.name,
+                    "locale": &alias.locale,
+                    "source": alias.source.as_deref(),
+                }
+            })
+            .collect();
+
+        let undone_snapshot = self.undone_snapshot.as_ref().map(|snapshot| {
+            doc! {
+                "source_identity_id": snapshot.source_identity_id,
+                "source_uuid": &snapshot.source_uuid,
+                "source_name": &snapshot.source_name,
+                "target_metadata_at_undo": json_to_bson(&snapshot.target_metadata_at_undo),
+            }
+        });
+
+        let mut doc = doc! {
+            "merge_id": &self.merge_id,
+            "source_identity": {
+                "id": source.id,
+                "uuid": &source.uuid,
+                "name": &source.name,
+                "identity_type": source.identity_type.as_deref(),
+                "source": source.source.as_deref(),
+                "status": &source.status,
+                "tmdb_id": source.tmdb_id,
+                "tmdb_profile": source.tmdb_profile.as_deref(),
+                "metadata": json_to_bson(&source.metadata),
+                "created_at": source.created_at.map(BsonDateTime::from_chrono),
+                "face_count": source.face_count,
+            },
+            "target_identity": {
+                "id": target.id,
+                "uuid": &target.uuid,
+                "name": &target.name,
+                "metadata_before": json_to_bson(&target.metadata_before),
+                "metadata_after": target.metadata_after.as_ref().map(json_to_bson),
+            },
+            "aliases_added_to_target": aliases,
+            "metadata_fields_added": &self.metadata_fields_added,
+            "faces_transferred": {
+                "file_uuid": &faces.file_uuid,
+                "face_ids": &faces.face_ids,
+                "trace_ids": &faces.trace_ids,
+                "count": faces.count,
+            },
+            "merge_params": {
+                "keep_history": params.keep_history,
+                "cleared_stranger_id": params.cleared_stranger_id,
+                "performed_by_user": params.performed_by_user.as_deref(),
+            },
+            "merged_at": BsonDateTime::from_chrono(self.merged_at),
+            "undo_deadline": BsonDateTime::from_chrono(self.undo_deadline),
+            "undone": self.undone,
+            "undone_at": self.undone_at.map(BsonDateTime::from_chrono),
+            "undone_by": self.undone_by.as_deref(),
+            "undone_snapshot": undone_snapshot,
+            "undo_expired": self.undo_expired,
+        };
+
+        // `ObjectId` is `Copy`, so the id can be taken out of `&self` directly.
+        if let Some(oid) = self.id {
+            doc.insert("_id", oid);
+        }
+
+        doc
+    }
+}
+
+/// MongoDB-backed store for [`IdentityMergeHistory`] records.
+///
+/// Constructed with [`IdentityMergeHistoryStore::init`], which connects to
+/// MongoDB and ensures the collection's indexes exist.
+#[derive(Clone)]
+pub struct IdentityMergeHistoryStore {
+    // NOTE(review): `client` and `db` are only assigned in `init` and never
+    // read in this file — confirm whether they need to be kept.
+    client: Client,
+    db: Database,
+    /// Handle to the `identity_merge_history` collection, used by every query.
+    collection: Collection<Document>,
+}
+
+impl IdentityMergeHistoryStore {
+    /// Connects to MongoDB and returns a store bound to the
+    /// `identity_merge_history` collection.
+    ///
+    /// The connection URI and database name come from
+    /// `crate::core::config::MONGODB_URL` and
+    /// `crate::core::config::MONGODB_DATABASE`. The collection's indexes are
+    /// ensured before the store is returned.
+    ///
+    /// # Errors
+    ///
+    /// Returns an error if the client cannot be created or index creation fails.
+    pub async fn init() -> Result<Self> {
+        let client = Client::with_uri_str(crate::core::config::MONGODB_URL.as_str())
+            .await
+            .context("Failed to connect to MongoDB")?;
+        let db = client.database(crate::core::config::MONGODB_DATABASE.as_str());
+        let collection = db.collection::<Document>(COLLECTION_NAME);
+
+        let store = Self {
+            client,
+            db,
+            collection,
+        };
+        store.ensure_indexes().await?;
+
+        Ok(store)
+    }
+
+    /// Creates the indexes this store relies on: a unique index on
+    /// `merge_id`, a descending index on `merged_at`, and ascending indexes
+    /// on `source_identity.uuid` and `target_identity.uuid`.
+    ///
+    /// # Errors
+    ///
+    /// Returns an error if MongoDB rejects the index creation.
+    async fn ensure_indexes(&self) -> Result<()> {
+        // Index over `keys` with no extra options.
+        let plain_index = |keys: Document| IndexModel::builder().keys(keys).build();
+
+        let unique = mongodb::options::IndexOptions::builder()
+            .unique(true)
+            .build();
+
+        let indexes = vec![
+            IndexModel::builder()
+                .keys(doc! { "merge_id": 1 })
+                .options(unique)
+                .build(),
+            plain_index(doc! { "merged_at": -1 }),
+            plain_index(doc! { "source_identity.uuid": 1 }),
+            plain_index(doc! { "target_identity.uuid": 1 }),
+        ];
+
+        self.collection
+            .create_indexes(indexes, None)
+            .await
+            .context("Failed to create identity_merge_history indexes")?;
+
+        tracing::info!("MongoDB identity_merge_history indexes ensured");
+        Ok(())
+    }
+
+    /// Returns a fresh random (version 4) UUID rendered as a string, for use
+    /// as a record's `merge_id`.
+    pub fn generate_merge_id() -> String {
+        Uuid::new_v4().to_string()
+    }
+
+    /// Inserts `history` into the collection as a new document and logs a
+    /// one-line summary on success.
+    ///
+    /// NOTE(review): the collection has a unique index on `merge_id` (see
+    /// `ensure_indexes`), so inserting a second record with the same
+    /// `merge_id` is expected to fail — confirm callers never retry blindly.
+    ///
+    /// # Errors
+    ///
+    /// Returns an error if the insert fails.
+    pub async fn store_merge_history(&self, history: &IdentityMergeHistory) -> Result<()> {
+        let doc = history.to_document();
+        self.collection
+            .insert_one(doc, None)
+            .await
+            .context("Failed to store merge history in MongoDB")?;
+
+        tracing::info!(
+            "Stored merge history: merge_id={}, source={}, target={}, faces={}",
+            history.merge_id,
+            history.source_identity.name,
+            history.target_identity.name,
+            history.faces_transferred.count
+        );
+        Ok(())
+    }
+
+    /// Looks up a single merge record by `merge_id`.
+    ///
+    /// Returns `Ok(None)` when no document matches.
+    ///
+    /// # Errors
+    ///
+    /// Returns an error if the query fails or the stored document cannot be
+    /// parsed by `IdentityMergeHistory::from_document`.
+    pub async fn get_merge_history(&self, merge_id: &str) -> Result<Option<IdentityMergeHistory>> {
+        self.collection
+            .find_one(doc! { "merge_id": merge_id }, None)
+            .await
+            .context("Failed to get merge history from MongoDB")?
+            .map(|stored| {
+                IdentityMergeHistory::from_document(&stored)
+                    .context("Failed to parse merge history from MongoDB")
+            })
+            .transpose()
+    }
+
+    /// Returns one page of merge-history summaries matching `query`, together
+    /// with the total number of matching documents.
+    ///
+    /// * `query` - every `Some` field becomes an equality filter.
+    /// * `page` - 1-based page number; `0` is treated as the first page.
+    /// * `page_size` - maximum entries per page; `0` yields an empty page.
+    ///
+    /// Results are ordered newest first (`merged_at` descending, `_id` as a
+    /// tie-breaker) so that consecutive pages are stable. Skipping and
+    /// limiting are done by MongoDB instead of walking the whole cursor.
+    ///
+    /// # Errors
+    ///
+    /// Returns an error if counting, querying or reading the cursor fails.
+    pub async fn query_merge_history(
+        &self,
+        query: MergeHistoryQuery,
+        page: u32,
+        page_size: u32,
+    ) -> Result<(Vec<MergeHistoryEntry>, u64)> {
+        let mut filter = doc! {};
+
+        if let Some(source_uuid) = query.source_uuid {
+            filter.insert("source_identity.uuid", source_uuid);
+        }
+        if let Some(target_uuid) = query.target_uuid {
+            filter.insert("target_identity.uuid", target_uuid);
+        }
+        if let Some(merge_id) = query.merge_id {
+            filter.insert("merge_id", merge_id);
+        }
+        if let Some(undone) = query.undone {
+            filter.insert("undone", undone);
+        }
+
+        let total = self
+            .collection
+            .count_documents(filter.clone(), None)
+            .await
+            .context("Failed to count merge history")?;
+
+        // MongoDB treats `limit(0)` as "no limit", so an empty page has to be
+        // answered here rather than passed through to the server.
+        if page_size == 0 {
+            return Ok((Vec::new(), total));
+        }
+
+        // Widen to u64 before multiplying so large page numbers cannot
+        // overflow, and saturate so `page == 0` cannot underflow.
+        let skip = u64::from(page.saturating_sub(1)) * u64::from(page_size);
+        let options = mongodb::options::FindOptions::builder()
+            .sort(doc! { "merged_at": -1, "_id": -1 })
+            .skip(skip)
+            .limit(i64::from(page_size))
+            .build();
+
+        let mut cursor = self
+            .collection
+            .find(filter, options)
+            .await
+            .context("Failed to query merge history")?;
+
+        let mut results: Vec<MergeHistoryEntry> = Vec::new();
+        while cursor.advance().await.context("Failed to advance cursor")? {
+            let doc: Document = cursor
+                .deserialize_current()
+                .context("Failed to deserialize")?;
+            results.push(Self::summary_from_document(&doc));
+        }
+
+        Ok((results, total))
+    }
+
+    /// Builds the list-view summary for one stored merge document, using
+    /// empty/zero/`false` defaults for any missing or wrongly-typed field.
+    fn summary_from_document(doc: &Document) -> MergeHistoryEntry {
+        let nested_name = |key: &str| {
+            doc.get_document(key)
+                .map(|d| d.get_str("name").unwrap_or("").to_string())
+                .unwrap_or_default()
+        };
+
+        MergeHistoryEntry {
+            merge_id: doc.get_str("merge_id").unwrap_or("").to_string(),
+            source_name: nested_name("source_identity"),
+            target_name: nested_name("target_identity"),
+            faces_transferred: doc
+                .get_document("faces_transferred")
+                .map(|d| d.get_i64("count").unwrap_or(0))
+                .unwrap_or(0),
+            merged_at: doc
+                .get_datetime("merged_at")
+                .map(|d| d.to_chrono())
+                .unwrap_or_default(),
+            undo_deadline: doc
+                .get_datetime("undo_deadline")
+                .map(|d| d.to_chrono())
+                .unwrap_or_default(),
+            undone: doc.get_bool("undone").unwrap_or(false),
+            undo_expired: doc.get_bool("undo_expired").unwrap_or(false),
+        }
+    }
+
+    /// Marks the merge identified by `merge_id` as undone.
+    ///
+    /// Sets `undone` to `true`, stamps `undone_at` with the current time and
+    /// stores `undone_by` and `undone_snapshot` on the record.
+    ///
+    /// # Errors
+    ///
+    /// Returns an error if the update fails or if no record with this
+    /// `merge_id` exists (previously the latter was silently reported as
+    /// success).
+    pub async fn mark_as_undone(
+        &self,
+        merge_id: &str,
+        undone_by: Option<&str>,
+        undone_snapshot: UndoneSnapshot,
+    ) -> Result<()> {
+        let filter = doc! { "merge_id": merge_id };
+        let snapshot_doc = doc! {
+            "source_identity_id": undone_snapshot.source_identity_id,
+            "source_uuid": &undone_snapshot.source_uuid,
+            "source_name": &undone_snapshot.source_name,
+            "target_metadata_at_undo": json_to_bson(&undone_snapshot.target_metadata_at_undo),
+        };
+        let update = doc! {
+            "$set": {
+                "undone": true,
+                "undone_at": BsonDateTime::from_chrono(Utc::now()),
+                "undone_by": undone_by,
+                "undone_snapshot": snapshot_doc,
+            }
+        };
+
+        let result = self
+            .collection
+            .update_one(filter, update, None)
+            .await
+            .context("Failed to mark merge as undone")?;
+
+        // An update that matched nothing means the merge_id is unknown; do
+        // not log or report that as a successful undo.
+        if result.matched_count == 0 {
+            anyhow::bail!("Merge history not found: merge_id={}", merge_id);
+        }
+
+        tracing::info!("Marked merge {} as undone", merge_id);
+        Ok(())
+    }
+
+    /// Reverts an undo: clears the undo markers on the merge identified by
+    /// `merge_id` and opens a new undo window ending 24 hours from now.
+    ///
+    /// Sets `undone` and `undo_expired` to `false`, and resets `undone_at`
+    /// and `undone_snapshot` to null.
+    ///
+    /// # Errors
+    ///
+    /// Returns an error if the update fails or if no record with this
+    /// `merge_id` exists (previously the latter was silently reported as
+    /// success).
+    pub async fn mark_as_redone(&self, merge_id: &str, redone_by: Option<&str>) -> Result<()> {
+        let new_deadline = Utc::now() + chrono::Duration::hours(24);
+        let filter = doc! { "merge_id": merge_id };
+        let update = doc! {
+            "$set": {
+                "undone": false,
+                "undone_at": bson::Bson::Null,
+                // NOTE(review): the redoing user is stored in `undone_by`
+                // while `undone` is false — confirm this is intentional.
+                "undone_by": redone_by,
+                "undone_snapshot": bson::Bson::Null,
+                "undo_deadline": BsonDateTime::from_chrono(new_deadline),
+                "undo_expired": false
+            }
+        };
+
+        let result = self
+            .collection
+            .update_one(filter, update, None)
+            .await
+            .context("Failed to mark merge as redone")?;
+
+        // An update that matched nothing means the merge_id is unknown; do
+        // not log or report that as a successful redo.
+        if result.matched_count == 0 {
+            anyhow::bail!("Merge history not found: merge_id={}", merge_id);
+        }
+
+        tracing::info!(
+            "Marked merge {} as redone (new deadline: {})",
+            merge_id,
+            new_deadline
+        );
+        Ok(())
+    }
+
+    /// Reports whether the merge identified by `merge_id` is still inside
+    /// its undo window.
+    ///
+    /// Returns `Ok(true)` while the current time is not later than the
+    /// record's `undo_deadline`, `Ok(false)` afterwards.
+    ///
+    /// # Errors
+    ///
+    /// Returns an error if the lookup fails or no record with this
+    /// `merge_id` exists.
+    pub async fn check_undo_deadline(&self, merge_id: &str) -> Result<bool> {
+        let record = self
+            .get_merge_history(merge_id)
+            .await?
+            .context("Merge history not found")?;
+
+        Ok(Utc::now() <= record.undo_deadline)
+    }
+
+    /// Flags every merge whose undo window has closed.
+    ///
+    /// Sets `undo_expired` to `true` on all records that are not undone, not
+    /// yet flagged, and whose `undo_deadline` is earlier than the current
+    /// time. Returns the number of records modified.
+    ///
+    /// # Errors
+    ///
+    /// Returns an error if the bulk update fails.
+    pub async fn mark_expired_merges(&self) -> Result<u64> {
+        let expired_filter = doc! {
+            "undo_deadline": { "$lt": BsonDateTime::from_chrono(Utc::now()) },
+            "undone": false,
+            "undo_expired": false
+        };
+
+        let modified = self
+            .collection
+            .update_many(
+                expired_filter,
+                doc! { "$set": { "undo_expired": true } },
+                None,
+            )
+            .await
+            .context("Failed to mark expired merges")?
+            .modified_count;
+
+        if modified > 0 {
+            tracing::info!("Marked {} expired merges", modified);
+        }
+
+        Ok(modified)
+    }
+}
diff --git a/src/core/db/mod.rs b/src/core/db/mod.rs
index 019b547..9c6e5f5 100644
--- a/src/core/db/mod.rs
+++ b/src/core/db/mod.rs
@@ -32,17 +32,21 @@ pub trait VectorStore: Send + Sync {
     async fn search(&self, query_vector: &[f32], limit: usize) -> Result<Vec<SearchResult>>;
 }
 
+pub mod identity_merge_history;
 pub mod mongodb_db;
 pub mod postgres_db;
 pub mod qdrant_db;
 pub mod redis_client;
 pub mod redis_db;
-pub mod sync_db;
-
+pub use identity_merge_history::{
+    AliasEntry, FacesTransferred, IdentityMergeHistory, IdentityMergeHistoryStore,
+    IdentitySnapshot, MergeHistoryEntry, MergeHistoryQuery, MergeParams, TargetIdentitySnapshot,
+    UndoneSnapshot,
+};
 pub use mongodb_db::MongoDb;
 pub use postgres_db::{
-    Bm25Result, CandidateRecord, CreateApiKeyConfig, FileIdentityRecord, FileRecord,
-    HybridSearchResult, IdentityChunkRecord, IdentityDetailRecord, IdentityFaceRecord,
+    Bm25Result, CandidateRecord, CreateApiKeyConfig, FileFaceRecord, FileIdentityRecord,
+    FileRecord, HybridSearchResult, IdentityChunkRecord, IdentityDetailRecord, IdentityFaceRecord,
     IdentityFileRecord, MonitorJob, MonitorJobStats, MonitorJobStatus, PipelineType, PostgresDb,
     ProcessorJobStatus, ProcessorResult, ProcessorType, ResourceRecord, VideoRecord, VideoStatus,
 };
@@ -52,4 +56,3 @@ pub use redis_client::{
     ProgressMessage, RedisClient,
 };
 pub use redis_db::RedisDb;
-pub use sync_db::SyncDb;
diff --git a/src/core/db/mongodb_db.rs b/src/core/db/mongodb_db.rs
index 476c7c3..7a70b31 100644
--- a/src/core/db/mongodb_db.rs
+++ b/src/core/db/mongodb_db.rs
@@ -131,7 +131,6 @@ impl MongoDb {
                     pre_chunk_ids: vec![],
                     parent_chunk_id: doc.parent_chunk_id,
                     child_chunk_ids: doc.child_chunk_ids,
-                    visual_stats: None,
                 }
             })
             .collect();
@@ -190,7 +189,6 @@ impl MongoDb {
                     pre_chunk_ids: vec![],
                     parent_chunk_id: doc.parent_chunk_id,
                     child_chunk_ids: doc.child_chunk_ids,
-                    visual_stats: None,
                 }
             })
             .collect();
@@ -246,7 +244,6 @@ impl MongoDb {
                     pre_chunk_ids: vec![],
                     parent_chunk_id: doc.parent_chunk_id,
                     child_chunk_ids: doc.child_chunk_ids,
-                    visual_stats: None,
                 }
             })
             .collect();
diff --git a/src/core/db/qdrant_db.rs b/src/core/db/qdrant_db.rs
index d63897c..bd66b84 100644
--- a/src/core/db/qdrant_db.rs
+++ b/src/core/db/qdrant_db.rs
@@ -70,7 +70,7 @@ impl QdrantDb {
             return Ok(());
         }
 
-        let create_url = format!("{}/collections", self.base_url);
+        let create_url = format!("{}/collections/{}", self.base_url, self.collection_name);
         let body = serde_json::json!({
             "vectors": {
                 "size": vector_dim,
@@ -79,7 +79,7 @@ impl QdrantDb {
         });
 
         self.client
-            .post(&create_url)
+            .put(&create_url)
             .header("api-key", &self.api_key)
             .header("Content-Type", "application/json")
             .json(&body)
@@ -867,50 +867,6 @@ impl VectorStore for QdrantDb {
     }
 }
 
-/// Sync face embeddings from PostgreSQL to Qdrant for ANN search
-pub async fn sync_face_embeddings(file_uuid: &str) -> Result<()> {
-    use crate::core::config::DATABASE_URL;
-    use sqlx::Row;
-
-    let pool = sqlx::PgPool::connect(&DATABASE_URL).await?;
-    let table = crate::core::db::schema::table_name("face_detections");
-
-    let qdrant: QdrantDb = QdrantDb::new();
-
-    let query = format!(
-        "SELECT id, trace_id, frame_number, embedding FROM {} \
-         WHERE file_uuid = $1 AND embedding IS NOT NULL \
-         AND ((metadata->>'qc_ok')::boolean IS NULL OR (metadata->>'qc_ok')::boolean = true)",
-        table
-    );
-    let rows = sqlx::query(&query).bind(file_uuid).fetch_all(&pool).await?;
-
-    let mut count = 0u64;
-    for row in &rows {
-        let id: i32 = row.get(0);
-        let trace_id: Option<i32> = row.get(1);
-        let frame_number: i64 = row.get(2);
-        let embedding: Option<Vec<f32>> = row.get(3);
-
-        if let (Some(emb), Some(tid)) = (embedding, trace_id) {
-            if let Err(e) = qdrant
-                .upsert_face_embedding(id as u64, &emb, file_uuid, tid, frame_number)
-                .await
-            {
-                tracing::warn!("Qdrant upsert failed for face {}: {}", id, e);
-                continue;
-            }
-            count += 1;
-        }
-    }
-    tracing::info!(
-        "Synced {} face embeddings to Qdrant for {}",
-        count,
-        file_uuid
-    );
-    Ok(())
-}
-
 pub async fn sync_trace_embeddings(file_uuid: &str) -> Result<()> {
     use crate::core::config::DATABASE_URL;
     use sqlx::Row;
@@ -984,12 +940,22 @@ pub async fn sync_trace_embeddings(file_uuid: &str) -> Result<()> {
     }
 
     // Push to Qdrant in batches
+    // Point ID: first 8 bytes of SHA-256(file_uuid + "_" + trace_id), to avoid cross-file clashes
     for chunk in trace_avgs.chunks(500) {
         let batch: Vec<(u64, &[f32], Option<serde_json::Value>)> = chunk
             .iter()
             .map(|t| {
+                let point_id = {
+                    use sha2::{Digest, Sha256};
+                    let mut hasher = Sha256::new();
+                    hasher.update(file_uuid.as_bytes());
+                    hasher.update(b"_");
+                    hasher.update(t.tid.to_string().as_bytes());
+                    let hash = hasher.finalize();
+                    u64::from_be_bytes(hash[0..8].try_into().unwrap())
+                };
                 (
-                    t.tid as u64,
+                    point_id,
                     t.avg_emb.as_slice(),
                     Some(serde_json::json!({
                         "trace_id": t.tid,
diff --git a/src/core/db/redis_client.rs b/src/core/db/redis_client.rs
index 10d3887..9b4860f 100644
--- a/src/core/db/redis_client.rs
+++ b/src/core/db/redis_client.rs
@@ -319,7 +319,9 @@ impl RedisClient {
             "timestamp": chrono::Utc::now().to_rfc3339(),
         });
 
-        let _: usize = conn.publish(&channel, serde_json::to_string(&alert_json)?).await?;
+        let _: usize = conn
+            .publish(&channel, serde_json::to_string(&alert_json)?)
+            .await?;
 
         tracing::warn!(
             "Processor alert: {} | {} | {} | {}",
diff --git a/src/core/db/sync_db.rs b/src/core/db/sync_db.rs.bak
similarity index 97%
rename from src/core/db/sync_db.rs
rename to src/core/db/sync_db.rs.bak
index bd33bb2..205817a 100644
--- a/src/core/db/sync_db.rs
+++ b/src/core/db/sync_db.rs.bak
@@ -78,7 +78,10 @@ impl SyncDb {
     pub async fn embed_text(&self, text: &str) -> Result<Vec<f32>> {
         let client = reqwest::Client::new();
         let response = client
-            .post(&format!("{}/api/embeddings", crate::core::config::OLLAMA_URL.as_str()))
+            .post(&format!(
+                "{}/api/embeddings",
+                crate::core::config::OLLAMA_URL.as_str()
+            ))
             .json(&serde_json::json!({
                 "model": "all-minilm",
                 "prompt": text,
diff --git a/src/core/frame_cache.rs b/src/core/frame_cache.rs
index 317a696..b155702 100644
--- a/src/core/frame_cache.rs
+++ b/src/core/frame_cache.rs
@@ -78,12 +78,19 @@ impl FrameManager {
                 .and_then(|s| s.strip_suffix(".jpg"))
             {
                 if let Ok(frame_num) = num_str.parse::<u64>() {
-                    let timestamp = frame_num as f64 / fps;
-                    frames.push(CachedFrame {
-                        path: entry.path(),
-                        frame_number: frame_num,
-                        timestamp_secs: timestamp,
-                    });
+                    let frame_path = entry.path();
+                    if let Ok(data) = std::fs::read(&frame_path) {
+                        if crate::core::thumbnail::validator::is_valid_jpeg(&data) {
+                            let timestamp = frame_num as f64 / fps;
+                            frames.push(CachedFrame {
+                                path: frame_path,
+                                frame_number: frame_num,
+                                timestamp_secs: timestamp,
+                            });
+                        } else {
+                            info!("[FrameCache] Skipping invalid JPEG: {:?}", frame_path);
+                        }
+                    }
                 }
             }
         }
diff --git a/src/core/identity/storage.rs b/src/core/identity/storage.rs
index c76d5a9..e2f2e67 100644
--- a/src/core/identity/storage.rs
+++ b/src/core/identity/storage.rs
@@ -193,7 +193,7 @@ pub async fn save_identity_file_by_pool(pool: &sqlx::PgPool, uuid: &str) -> Resu
 
     let record = sqlx::query_as::<_, crate::core::db::IdentityDetailRecord>(
         &format!(
-            "SELECT id, uuid::text, name, identity_type, source, status, metadata, reference_data, \
+            "SELECT id::bigint, uuid::text, name, identity_type, source, status, metadata, COALESCE(reference_data, '{{}}'::jsonb) as reference_data, \
               NULL::real[] as voice_embedding, NULL::real[] as identity_embedding, \
               face_embedding::real[] as face_embedding, \
               tmdb_id, tmdb_profile, created_at::timestamptz as created_at, NULL::timestamptz as updated_at \
diff --git a/src/core/llm/function_calling.rs b/src/core/llm/function_calling.rs
index 1add57c..dd2c9ac 100644
--- a/src/core/llm/function_calling.rs
+++ b/src/core/llm/function_calling.rs
@@ -97,6 +97,68 @@ pub fn llm_vision_model() -> String {
     config::llm::VISION_MODEL.clone()
 }
 
+/// Call the vision LLM with text + base64 JPEG images. Returns the trimmed reply ("" if none).
+pub async fn call_llm_vision(
+    system_prompt: &str,
+    user_text: &str,
+    base64_images: Vec<String>,
+    max_tokens: u32,
+    timeout_secs: u64,
+) -> anyhow::Result<String> {
+    let mut content_parts: Vec<Value> = vec![json!({"type": "text", "text": user_text})];
+    for img in &base64_images {
+        content_parts.push(json!({
+            "type": "image_url",
+            "image_url": {"url": format!("data:image/jpeg;base64,{}", img)}
+        }));
+    }
+
+    let messages = json!([
+        {"role": "system", "content": system_prompt},
+        {"role": "user", "content": content_parts}
+    ]);
+
+    let req = json!({
+        "model": llm_vision_model(),
+        "messages": messages,
+        "temperature": 0.1,
+        "max_tokens": max_tokens,
+        "stream": false,
+    });
+
+    let client = reqwest::Client::builder()
+        .timeout(std::time::Duration::from_secs(timeout_secs))
+        .build()?;
+
+    let res = client.post(&llm_vision_url()).json(&req).send().await?;
+    if !res.status().is_success() {
+        let text = res.text().await.unwrap_or_default();
+        anyhow::bail!("Vision LLM API error: {}", text);
+    }
+
+    #[derive(Deserialize)]
+    struct VisionResponse {
+        choices: Vec<VisionChoice>,
+    }
+    #[derive(Deserialize)]
+    struct VisionChoice {
+        message: VisionMessage,
+    }
+    #[derive(Deserialize)]
+    struct VisionMessage {
+        content: Option<String>,
+    }
+
+    let vision_res: VisionResponse = res.json().await?;
+    let content = vision_res
+        .choices
+        .into_iter()
+        .next()
+        .and_then(|c| c.message.content)
+        .unwrap_or_default();
+    Ok(content.trim().to_string())
+}
+
 /// Build a tool definition JSON for function calling
 pub fn make_tool(name: &str, description: &str, properties: Value, required: Vec<&str>) -> ToolDef {
     ToolDef {
@@ -121,9 +183,11 @@ pub async fn call_llm(
     timeout_secs: u64,
 ) -> anyhow::Result<LlmResponse> {
     let client = reqwest::Client::builder()
-        .timeout(std::time::Duration::from_secs(
-            if timeout_secs > 0 { timeout_secs } else { *config::llm::CHAT_TIMEOUT_SECS },
-        ))
+        .timeout(std::time::Duration::from_secs(if timeout_secs > 0 {
+            timeout_secs
+        } else {
+            *config::llm::CHAT_TIMEOUT_SECS
+        }))
         .build()?;
 
     let req = ChatRequest {
@@ -135,11 +199,7 @@ pub async fn call_llm(
         tools,
     };
 
-    let res = client
-        .post(&llm_chat_url())
-        .json(&req)
-        .send()
-        .await?;
+    let res = client.post(&llm_chat_url()).json(&req).send().await?;
 
     if !res.status().is_success() {
         let text = res.text().await.unwrap_or_default();
@@ -147,13 +207,17 @@ pub async fn call_llm(
     }
 
     let chat_res: ChatResponse = res.json().await?;
-    let choice = chat_res.choices.into_iter().next()
+    let choice = chat_res
+        .choices
+        .into_iter()
+        .next()
         .ok_or_else(|| anyhow::anyhow!("Empty LLM response"))?;
 
     match choice.finish_reason.as_deref() {
         Some("tool_calls") => {
-            let calls = choice.message.tool_calls
-                .ok_or_else(|| anyhow::anyhow!("finish_reason=tool_calls but no tool_calls in message"))?;
+            let calls = choice.message.tool_calls.ok_or_else(|| {
+                anyhow::anyhow!("finish_reason=tool_calls but no tool_calls in message")
+            })?;
             Ok(LlmResponse::ToolCalls(calls))
         }
         _ => {
@@ -164,16 +228,18 @@ pub async fn call_llm(
 }
 
 /// Helper to build the system prompt + user messages
-pub fn build_conversation(system_prompt: &str, user_query: &str, history: Vec<ChatMessage>) -> Vec<ChatMessage> {
-    let mut messages = vec![
-        ChatMessage {
-            role: "system".to_string(),
-            content: Some(system_prompt.to_string()),
-            tool_calls: None,
-            tool_call_id: None,
-            name: None,
-        },
-    ];
+pub fn build_conversation(
+    system_prompt: &str,
+    user_query: &str,
+    history: Vec<ChatMessage>,
+) -> Vec<ChatMessage> {
+    let mut messages = vec![ChatMessage {
+        role: "system".to_string(),
+        content: Some(system_prompt.to_string()),
+        tool_calls: None,
+        tool_call_id: None,
+        name: None,
+    }];
     // Add history (user + assistant exchanges)
     messages.extend(history);
     // Add current user query
diff --git a/src/core/processor/asrx.rs b/src/core/processor/asrx.rs
index 50882bb..2ab85a2 100644
--- a/src/core/processor/asrx.rs
+++ b/src/core/processor/asrx.rs
@@ -18,12 +18,22 @@ pub struct AsrxResult {
 
 #[derive(Debug, Serialize, Deserialize)]
 pub struct AsrxSegment {
+    #[serde(alias = "start")]
     pub start_time: f64,
+    #[serde(alias = "end")]
     pub end_time: f64,
+    #[serde(default)]
     pub start_frame: u64,
+    #[serde(default)]
     pub end_frame: u64,
     pub text: String,
     pub speaker_id: Option<String>,
+    #[serde(default)]
+    pub language: Option<String>,
+    #[serde(default)]
+    pub lang_prob: Option<f64>,
+    #[serde(default)]
+    pub quality: Option<f64>,
 }
 
 pub async fn process_asrx(
@@ -32,24 +42,16 @@ pub async fn process_asrx(
     uuid: Option<&str>,
 ) -> Result<AsrxResult> {
     let executor = PythonExecutor::new()?;
-    let script_path = executor.script_path("asrx_processor_custom.py");
+    let script_path = executor.script_path("asrx_processor.py");
 
     tracing::info!(
-        "[ASRX] Starting speaker diarization (custom): {}",
+        "[ASRX] Starting hybrid speaker diarization: {}",
         video_path
     );
 
     if !script_path.exists() {
-        tracing::warn!("[ASRX] Custom script not found, falling back to original");
-        let fallback_path = executor.script_path("asrx_processor.py");
-        if !fallback_path.exists() {
-            tracing::warn!("[ASRX] No script found, returning empty result");
-            return Ok(AsrxResult {
-                language: None,
-                segments: vec![],
-                embeddings: None,
-            });
-        }
+        tracing::error!("[ASRX] Script not found: {:?}", script_path);
+        anyhow::bail!("asrx_processor.py not found");
     }
 
     tracing::info!(
@@ -65,6 +67,7 @@ pub async fn process_asrx(
 
     if let Some(u) = uuid {
         cmd.arg("--uuid").arg(u);
+        cmd.arg("--file-uuid").arg(u);
     }
 
     cmd.stdout(std::process::Stdio::piped())
@@ -126,6 +129,9 @@ mod tests {
                 end_frame: 75,
                 text: "Hello".to_string(),
                 speaker_id: Some("SPEAKER_00".to_string()),
+                language: None,
+                lang_prob: None,
+                quality: None,
             }],
             embeddings: None,
         };
@@ -173,7 +179,27 @@ mod tests {
             end_frame: 150,
             text: "Test".to_string(),
             speaker_id: None,
+            language: None,
+            lang_prob: None,
+            quality: None,
         };
         assert!(segment.end_time > segment.start_time);
     }
+
+    #[test]
+    fn test_asrx_backward_compat_old_format() {
+        let json = r#"{
+            "language": "en",
+            "segments": [
+                {"start": 10.0, "end": 12.5, "text": "Hello", "speaker_id": "SPEAKER_00"}
+            ]
+        }"#;
+        let result: AsrxResult = serde_json::from_str(json).unwrap();
+        assert_eq!(result.segments.len(), 1);
+        assert_eq!(result.segments[0].start_time, 10.0);
+        assert_eq!(result.segments[0].end_time, 12.5);
+        assert_eq!(result.segments[0].text, "Hello");
+        assert_eq!(result.segments[0].start_frame, 0);
+        assert_eq!(result.segments[0].end_frame, 0);
+    }
 }
diff --git a/src/core/processor/cut.rs b/src/core/processor/cut.rs
index dd705bc..890ca18 100644
--- a/src/core/processor/cut.rs
+++ b/src/core/processor/cut.rs
@@ -43,11 +43,15 @@ pub async fn process_cut(
     let script_path = executor.script_path("cut_processor.py");
 
     if !script_path.exists() {
-        return Ok(CutResult {
+        let empty_result = CutResult {
             frame_count: 0,
             fps: 0.0,
             scenes: vec![],
-        });
+        };
+        let json = serde_json::to_string_pretty(&empty_result)?;
+        std::fs::write(output_path, &json)
+            .with_context(|| format!("Failed to write {:?}", output_path))?;
+        return Ok(empty_result);
     }
 
     executor
@@ -127,18 +131,26 @@ fn try_native_cut(video_path: &str) -> Result<CutResult> {
         .context("Failed to run ffmpeg scene detection")?;
 
     let stderr_output = String::from_utf8_lossy(&scene_output.stderr);
+    let stdout_output = String::from_utf8_lossy(&scene_output.stdout);
     let mut scene_times: Vec<f64> = Vec::new();
 
-    // Parse ffmpeg showinfo output for scene changes
-    // Format: [Parsed_showinfo...] pts:123.456 pts_time:123.456 ...
-    for line in stderr_output.lines() {
-        if line.contains("pts_time:") {
-            if let Some(pos) = line.find("pts_time:") {
-                let rest = &line[pos + 9..];
-                let time_str = rest.split_whitespace().next().unwrap_or("");
-                if let Ok(t) = time_str.parse::<f64>() {
-                    scene_times.push(t);
-                }
+    // Parse ffprobe output for scene changes (check both stderr and stdout)
+    // Format: pts_time=123.456 or pts_time:123.456
+    for line in stderr_output.lines().chain(stdout_output.lines()) {
+        // Try pts_time= format (standard ffprobe output)
+        if let Some(pos) = line.find("pts_time=") {
+            let rest = &line[pos + 9..];
+            let time_str = rest.split_whitespace().next().unwrap_or("");
+            if let Ok(t) = time_str.parse::<f64>() {
+                scene_times.push(t);
+            }
+        }
+        // Try pts_time: format (showinfo filter output)
+        else if let Some(pos) = line.find("pts_time:") {
+            let rest = &line[pos + 9..];
+            let time_str = rest.split_whitespace().next().unwrap_or("");
+            if let Ok(t) = time_str.parse::<f64>() {
+                scene_times.push(t);
             }
         }
     }
diff --git a/src/core/processor/mod.rs b/src/core/processor/mod.rs
index 51ebb07..402958a 100644
--- a/src/core/processor/mod.rs
+++ b/src/core/processor/mod.rs
@@ -11,7 +11,6 @@ pub mod pose;
 pub mod scene_classification;
 pub mod story;
 pub mod tkg;
-pub mod visual_chunk;
 pub mod yolo;
 
 pub use asr::{process_asr, AsrResult, AsrSegment};
@@ -40,5 +39,4 @@ pub use tkg::{
     build_tkg, query_auto_representative_frame, FrameTraceInfo, MainIdentityInfo,
     RepresentativeFrameResult, TkgResult,
 };
-pub use visual_chunk::{process_visual_chunk, process_visual_chunk_advanced, VisualChunkResult};
 pub use yolo::{process_yolo, YoloFrame, YoloObject, YoloResult};
diff --git a/src/core/processor/tkg.rs b/src/core/processor/tkg.rs
index 52a6147..791a5d0 100644
--- a/src/core/processor/tkg.rs
+++ b/src/core/processor/tkg.rs
@@ -38,7 +38,10 @@ fn load_face_pose_data(output_dir: &str, file_uuid: &str) -> Result<Vec<FacePose
     let mut poses = Vec::new();
     if let Some(frames) = json.get("frames").and_then(|v| v.as_array()) {
         for frame_entry in frames {
-            let frame_num = frame_entry.get("frame").and_then(|v| v.as_i64()).unwrap_or(0);
+            let frame_num = frame_entry
+                .get("frame")
+                .and_then(|v| v.as_i64())
+                .unwrap_or(0);
             if let Some(faces) = frame_entry.get("faces").and_then(|v| v.as_array()) {
                 for face in faces {
                     let bbox = match face.get("bbox") {
@@ -68,7 +71,14 @@ fn load_face_pose_data(output_dir: &str, file_uuid: &str) -> Result<Vec<FacePose
 
 /// Match a face from face_detections (frame, x, y, w, h) to its pose in face.json
 /// Uses bbox center distance to find the best match when multiple faces per frame.
-fn get_pose_for_face(frame: i64, x: f64, y: f64, w: f64, h: f64, poses: &[FacePose]) -> Option<(f64, f64, f64)> {
+fn get_pose_for_face(
+    frame: i64,
+    x: f64,
+    y: f64,
+    w: f64,
+    h: f64,
+    poses: &[FacePose],
+) -> Option<(f64, f64, f64)> {
     let cx = x + w / 2.0;
     let cy = y + h / 2.0;
     let mut best_dist = f64::MAX;
@@ -86,8 +96,12 @@ fn get_pose_for_face(frame: i64, x: f64, y: f64, w: f64, h: f64, poses: &[FacePo
 }
 
 fn detect_mutual_gaze(
-    bbox_a_x: f64, bbox_a_w: f64, yaw_a: f64,
-    bbox_b_x: f64, bbox_b_w: f64, yaw_b: f64,
+    bbox_a_x: f64,
+    bbox_a_w: f64,
+    yaw_a: f64,
+    bbox_b_x: f64,
+    bbox_b_w: f64,
+    yaw_b: f64,
     threshold: f64,
 ) -> bool {
     let cx_a = bbox_a_x + bbox_a_w / 2.0;
@@ -138,12 +152,16 @@ struct AsrxSegmentEntry {
     #[serde(default)]
     speaker_id: String,
     #[serde(default)]
-    start_time: f64,
+    start: f64,
     #[serde(default)]
-    end_time: f64,
+    end: f64,
+    #[serde(default)]
+    text: String,
     #[allow(dead_code)]
+    #[serde(default)]
     start_frame: i64,
     #[allow(dead_code)]
+    #[serde(default)]
     end_frame: i64,
 }
 
@@ -195,7 +213,10 @@ pub struct TkgResult {
 pub async fn build_tkg(db: &PostgresDb, file_uuid: &str, output_dir: &str) -> Result<TkgResult> {
     let pool = db.pool();
     let pose_data = load_face_pose_data(output_dir, file_uuid).unwrap_or_default();
-    tracing::info!("[TKG] Loaded {} pose entries from face.json", pose_data.len());
+    tracing::info!(
+        "[TKG] Loaded {} pose entries from face.json",
+        pose_data.len()
+    );
 
     let n_face = build_face_trace_nodes(pool, file_uuid, &pose_data).await?;
     let n_objects = build_yolo_object_nodes(pool, file_uuid, output_dir).await?;
@@ -217,7 +238,11 @@ pub async fn build_tkg(db: &PostgresDb, file_uuid: &str, output_dir: &str) -> Re
 
 // ── Node builders ─────────────────────────────────────────────────
 
-async fn build_face_trace_nodes(pool: &PgPool, file_uuid: &str, pose_data: &[FacePose]) -> Result<usize> {
+async fn build_face_trace_nodes(
+    pool: &PgPool,
+    file_uuid: &str,
+    pose_data: &[FacePose],
+) -> Result<usize> {
     let face_table = t("face_detections");
     let nodes_table = t("tkg_nodes");
 
@@ -257,7 +282,10 @@ async fn build_face_trace_nodes(pool: &PgPool, file_uuid: &str, pose_data: &[Fac
     // Group by trace_id: trace_id → Vec<(frame, x, y, w, h)>
     let mut trace_frames: HashMap<i64, Vec<(i64, f64, f64, f64, f64)>> = HashMap::new();
     for (tid, frame, x, y, w, h) in &frame_rows {
-        trace_frames.entry(*tid).or_default().push((*frame, *x, *y, *w, *h));
+        trace_frames
+            .entry(*tid)
+            .or_default()
+            .push((*frame, *x, *y, *w, *h));
     }
 
     let mut count = 0;
@@ -274,7 +302,9 @@ async fn build_face_trace_nodes(pool: &PgPool, file_uuid: &str, pose_data: &[Fac
 
         if let Some(frames) = trace_frames.get(&tid) {
             for (frame, x, y, w, h) in frames {
-                if let Some((yaw, pitch, roll)) = get_pose_for_face(*frame, *x, *y, *w, *h, pose_data) {
+                if let Some((yaw, pitch, roll)) =
+                    get_pose_for_face(*frame, *x, *y, *w, *h, pose_data)
+                {
                     yaw_sum += yaw;
                     pitch_sum += pitch;
                     roll_sum += roll;
@@ -284,7 +314,11 @@ async fn build_face_trace_nodes(pool: &PgPool, file_uuid: &str, pose_data: &[Fac
         }
 
         let (avg_yaw, avg_pitch, avg_roll) = if pose_count > 0 {
-            (yaw_sum / pose_count as f64, pitch_sum / pose_count as f64, roll_sum / pose_count as f64)
+            (
+                yaw_sum / pose_count as f64,
+                pitch_sum / pose_count as f64,
+                roll_sum / pose_count as f64,
+            )
         } else {
             (0.0, 0.0, 0.0)
         };
@@ -401,8 +435,44 @@ async fn build_speaker_nodes(pool: &PgPool, file_uuid: &str, output_dir: &str) -
     let nodes_table = t("tkg_nodes");
     let mut count = 0;
 
+    // Group segments by speaker_id
+    let mut speaker_segments: HashMap<String, Vec<&AsrxSegmentEntry>> = HashMap::new();
+    for seg in &asrx.segments {
+        speaker_segments
+            .entry(seg.speaker_id.clone())
+            .or_default()
+            .push(seg);
+    }
+
     for (sid, stat) in &stats {
-        let props = serde_json::json!({ "segment_count": stat.count });
+        let segs = speaker_segments.get(sid);
+        let (full_text, segments_json) = if let Some(seg_list) = segs {
+            let full: String = seg_list
+                .iter()
+                .map(|s| s.text.trim())
+                .filter(|t| !t.is_empty())
+                .collect::<Vec<_>>()
+                .join(" ");
+            let segments: Vec<serde_json::Value> = seg_list
+                .iter()
+                .map(|s| {
+                    serde_json::json!({
+                        "start": s.start,
+                        "end": s.end,
+                        "text": s.text,
+                    })
+                })
+                .collect();
+            (full, serde_json::Value::Array(segments))
+        } else {
+            (String::new(), serde_json::Value::Array(vec![]))
+        };
+
+        let props = serde_json::json!({
+            "segment_count": stat.count,
+            "segments": segments_json,
+            "full_text": full_text,
+        });
 
         sqlx::query(&format!(
             r#"
@@ -576,8 +646,8 @@ async fn build_speaker_face_edges(
 
     // Calculate fps from last segment
     let last = asrx.segments.last().unwrap();
-    let fps = if last.end_time > 0.0 {
-        last.end_frame as f64 / last.end_time
+    let fps = if last.end > 0.0 {
+        last.end_frame as f64 / last.end
     } else {
         30.0
     };
@@ -604,8 +674,8 @@ async fn build_speaker_face_edges(
         let face_end_sec = *ef as f64 / fps;
 
         for seg in &asrx.segments {
-            let seg_start = seg.start_time;
-            let seg_end = seg.end_time;
+            let seg_start = seg.start;
+            let seg_end = seg.end;
             let overlap_start = face_start_sec.max(seg_start);
             let overlap_end = face_end_sec.min(seg_end);
 
@@ -669,7 +739,11 @@ async fn build_speaker_face_edges(
     Ok(edge_count)
 }
 
-async fn build_face_face_edges(pool: &PgPool, file_uuid: &str, pose_data: &[FacePose]) -> Result<usize> {
+async fn build_face_face_edges(
+    pool: &PgPool,
+    file_uuid: &str,
+    pose_data: &[FacePose],
+) -> Result<usize> {
     let face_table = t("face_detections");
     let nodes_table = t("tkg_nodes");
     let edges_table = t("tkg_edges");
@@ -722,8 +796,9 @@ async fn build_face_face_edges(pool: &PgPool, file_uuid: &str, pose_data: &[Face
             (Some(&(xa, ya, wa, ha)), Some(&(xb, yb, wb, hb))) => {
                 get_pose_for_face(*frame, xa, ya, wa, ha, pose_data)
                     .and_then(|(yaw_a, _, _)| {
-                        get_pose_for_face(*frame, xb, yb, wb, hb, pose_data)
-                            .map(|(yaw_b, _, _)| detect_mutual_gaze(xa, wa, yaw_a, xb, wb, yaw_b, 0.05))
+                        get_pose_for_face(*frame, xb, yb, wb, hb, pose_data).map(|(yaw_b, _, _)| {
+                            detect_mutual_gaze(xa, wa, yaw_a, xb, wb, yaw_b, 0.05)
+                        })
                     })
                     .unwrap_or(false)
             }
@@ -770,7 +845,11 @@ async fn build_face_face_edges(pool: &PgPool, file_uuid: &str, pose_data: &[Face
         };
 
         let frames: Vec<i64> = frame_data.iter().map(|(f, _)| *f).collect();
-        let gaze_frames: Vec<i64> = frame_data.iter().filter(|(_, g)| *g).map(|(f, _)| *f).collect();
+        let gaze_frames: Vec<i64> = frame_data
+            .iter()
+            .filter(|(_, g)| *g)
+            .map(|(f, _)| *f)
+            .collect();
         let gaze_count = gaze_frames.len() as i64;
         let has_gaze = gaze_count > 0;
 
@@ -793,8 +872,13 @@ async fn build_face_face_edges(pool: &PgPool, file_uuid: &str, pose_data: &[Face
                 }
             }
             let (avg_ya, avg_yb) = if gaze_sample > 0 {
-                (yaw_a_sum / gaze_sample as f64, yaw_b_sum / gaze_sample as f64)
-            } else { (0.0, 0.0) };
+                (
+                    yaw_a_sum / gaze_sample as f64,
+                    yaw_b_sum / gaze_sample as f64,
+                )
+            } else {
+                (0.0, 0.0)
+            };
 
             serde_json::json!({
                 "first_frame": frames[0],
@@ -902,9 +986,14 @@ pub async fn query_auto_representative_frame(
     .context("Failed to detect main identities")?;
 
     let main_ids: Vec<(i32, String, String, i64)> = mains;
-    let main_idents: Vec<MainIdentityInfo> = main_ids.iter().map(|(_, u, n, c)|
-        MainIdentityInfo { identity_uuid: u.clone(), name: n.clone(), face_count: *c }
-    ).collect();
+    let main_idents: Vec<MainIdentityInfo> = main_ids
+        .iter()
+        .map(|(_, u, n, c)| MainIdentityInfo {
+            identity_uuid: u.clone(),
+            name: n.clone(),
+            face_count: *c,
+        })
+        .collect();
 
     let frame_number: Option<i64> = if main_ids.len() >= 2 {
         let id_a = main_ids[0].0;
@@ -915,16 +1004,20 @@ pub async fn query_auto_representative_frame(
              AND trace_id IS NOT NULL GROUP BY trace_id ORDER BY COUNT(*) DESC LIMIT 1",
             fd_table
         ))
-        .bind(file_uuid).bind(id_a)
-        .fetch_optional(pool).await?;
+        .bind(file_uuid)
+        .bind(id_a)
+        .fetch_optional(pool)
+        .await?;
 
         let trace_b: Option<(i32,)> = sqlx::query_as(&format!(
             "SELECT trace_id FROM {} WHERE file_uuid = $1 AND identity_id = $2 \
              AND trace_id IS NOT NULL GROUP BY trace_id ORDER BY COUNT(*) DESC LIMIT 1",
             fd_table
         ))
-        .bind(file_uuid).bind(id_b)
-        .fetch_optional(pool).await?;
+        .bind(file_uuid)
+        .bind(id_b)
+        .fetch_optional(pool)
+        .await?;
 
         match (trace_a, trace_b) {
             (Some((ta,)), Some((tb,))) => {
@@ -940,11 +1033,18 @@ pub async fn query_auto_representative_frame(
                      LIMIT 1",
                     edges_table, nodes_table, nodes_table
                 ))
-                .bind(file_uuid).bind(ta).bind(tb)
-                .fetch_optional(pool).await?;
+                .bind(file_uuid)
+                .bind(ta)
+                .bind(tb)
+                .fetch_optional(pool)
+                .await?;
 
                 if let Some((f,)) = tkg_frame {
-                    if f <= half_frame { Some(f) } else { None }
+                    if f <= half_frame {
+                        Some(f)
+                    } else {
+                        None
+                    }
                 } else {
                     sqlx::query_scalar::<_, i64>(&format!(
                         "SELECT MIN(fd_a.frame_number)::bigint \
@@ -954,8 +1054,12 @@ pub async fn query_auto_representative_frame(
                          AND fd_b.identity_id = $3 AND fd_a.frame_number <= $4",
                         fd_table, fd_table
                     ))
-                    .bind(file_uuid).bind(id_a).bind(id_b).bind(half_frame)
-                    .fetch_optional(pool).await?
+                    .bind(file_uuid)
+                    .bind(id_a)
+                    .bind(id_b)
+                    .bind(half_frame)
+                    .fetch_optional(pool)
+                    .await?
                 }
             }
             _ => None,
@@ -976,8 +1080,11 @@ pub async fn query_auto_representative_frame(
                      LIMIT 1",
                     fd_table
                 ))
-                .bind(file_uuid).bind(first_id).bind(half_frame)
-                .fetch_optional(pool).await?
+                .bind(file_uuid)
+                .bind(first_id)
+                .bind(half_frame)
+                .fetch_optional(pool)
+                .await?
             } else {
                 None
             }
@@ -995,20 +1102,25 @@ pub async fn query_auto_representative_frame(
                  LIMIT 1",
                 fd_table
             ))
-            .bind(file_uuid).bind(half_frame)
-            .fetch_optional(pool).await?
+            .bind(file_uuid)
+            .bind(half_frame)
+            .fetch_optional(pool)
+            .await?
         }
     };
 
-    let frame_number = frame_number.ok_or_else(|| anyhow::anyhow!("No faces found in this file"))?;
+    let frame_number =
+        frame_number.ok_or_else(|| anyhow::anyhow!("No faces found in this file"))?;
 
     let face_quality: f64 = sqlx::query_scalar::<_, f64>(&format!(
         "SELECT COALESCE(MAX((width::float8 * height::float8) * confidence::float8), 0) \
          FROM {} WHERE file_uuid = $1 AND frame_number = $2",
         fd_table
     ))
-    .bind(file_uuid).bind(frame_number)
-    .fetch_one(pool).await?;
+    .bind(file_uuid)
+    .bind(frame_number)
+    .fetch_one(pool)
+    .await?;
 
     let traces: Vec<FrameTraceInfo> = sqlx::query_as::<_, (i32, Option<String>, Option<String>, i32, i32, i32, i32, f64)>(&format!(
         "SELECT fd.trace_id, i.uuid::text, i.name, fd.x, fd.y, fd.width, fd.height, fd.confidence::float8 \
diff --git a/src/core/processor/visual_chunk.rs b/src/core/processor/visual_chunk.rs
deleted file mode 100644
index b94ba61..0000000
--- a/src/core/processor/visual_chunk.rs
+++ /dev/null
@@ -1,594 +0,0 @@
-//! 視覺分片處理器 (Phase 2.2)
-//!
-//! 從 YOLO 結果生成視覺分片
-
-use anyhow::{Context, Result};
-use serde::{Deserialize, Serialize};
-use std::time::Duration;
-
-use super::executor::PythonExecutor;
-use super::yolo::{YoloFrame, YoloResult};
-
-const VISUAL_CHUNK_TIMEOUT: Duration = Duration::from_secs(3600);
-
-/// 視覺分片處理結果
-#[derive(Debug, Serialize, Deserialize, Clone, Default)]
-pub struct VisualChunkResult {
-    /// 生成的視覺分片數量
-    pub chunk_count: u32,
-    /// 處理的總幀數
-    pub total_frames: u32,
-    /// 檢測到的總物件數
-    pub total_objects: u32,
-    /// 唯一物件類別數
-    pub unique_classes: u32,
-    /// 生成的視覺分片
-    pub chunks: Vec<crate::core::chunk::Chunk>,
-}
-
-/// 從 YOLO 結果生成視覺分片
-pub async fn process_visual_chunk(
-    file_id: i32,
-    uuid: String,
-    video_path: &str,
-    yolo_result: &YoloResult,
-    chunk_index_offset: u32,
-    fps: f64,
-) -> Result<VisualChunkResult> {
-    tracing::info!(
-        "[VisualChunk] Starting visual chunk generation for video: {}, {} frames",
-        video_path,
-        yolo_result.frames.len()
-    );
-
-    if yolo_result.frames.is_empty() {
-        tracing::warn!("[VisualChunk] No YOLO frames to process");
-        return Ok(VisualChunkResult {
-            chunk_count: 0,
-            total_frames: 0,
-            total_objects: 0,
-            unique_classes: 0,
-            chunks: vec![],
-        });
-    }
-
-    // 策略 1: 固定幀數分片（每 N 幀一個分片）
-    let chunks = create_fixed_frame_chunks(file_id, &uuid, yolo_result, chunk_index_offset, fps);
-
-    // 統計信息
-    let total_objects: u32 = yolo_result
-        .frames
-        .iter()
-        .map(|f| f.objects.len() as u32)
-        .sum();
-    let all_classes: Vec<String> = yolo_result
-        .frames
-        .iter()
-        .flat_map(|f| f.objects.iter().map(|o| o.class_name.clone()))
-        .collect();
-    let unique_classes: u32 = all_classes
-        .iter()
-        .cloned()
-        .collect::<std::collections::HashSet<_>>()
-        .len() as u32;
-
-    tracing::info!(
-        "[VisualChunk] Generated {} visual chunks from {} frames, {} total objects, {} unique classes",
-        chunks.len(),
-        yolo_result.frames.len(),
-        total_objects,
-        unique_classes
-    );
-
-    Ok(VisualChunkResult {
-        chunk_count: chunks.len() as u32,
-        total_frames: yolo_result.frames.len() as u32,
-        total_objects,
-        unique_classes,
-        chunks,
-    })
-}
-
-/// 創建固定幀數分片（每 N 幀一個分片）
-fn create_fixed_frame_chunks(
-    file_id: i32,
-    uuid: &str,
-    yolo_result: &YoloResult,
-    chunk_index_offset: u32,
-    fps: f64,
-) -> Vec<crate::core::chunk::Chunk> {
-    let mut chunks = Vec::new();
-
-    // 配置：每 30 幀創建一個分片（約 1 秒，如果 fps=30）
-    let frames_per_chunk = 30;
-    let total_frames = yolo_result.frames.len();
-
-    if total_frames == 0 {
-        return chunks;
-    }
-
-    let mut chunk_index = chunk_index_offset;
-    let mut start_idx = 0;
-
-    while start_idx < total_frames {
-        let end_idx = std::cmp::min(start_idx + frames_per_chunk, total_frames);
-
-        // 獲取這個分片的幀
-        let chunk_frames: Vec<YoloFrame> = yolo_result.frames[start_idx..end_idx]
-            .iter()
-            .cloned()
-            .collect();
-
-        if chunk_frames.is_empty() {
-            break;
-        }
-
-        // 計算幀範圍
-        let start_frame = chunk_frames.first().unwrap().frame as i64;
-        let end_frame = chunk_frames.last().unwrap().frame as i64 + 1; // exclusive
-
-        // 創建視覺分片
-        let chunk = crate::core::chunk::Chunk::from_yolo_frames(
-            file_id,
-            uuid.to_string(),
-            format!("vis_{}", chunk_index),
-            start_frame,
-            end_frame,
-            fps,
-            chunk_frames,
-        );
-
-        chunks.push(chunk);
-
-        // 更新索引
-        start_idx = end_idx;
-        chunk_index += 1;
-    }
-
-    chunks
-}
-
-/// 基於物件相似度創建分片
-fn create_similarity_based_chunks(
-    file_id: i32,
-    uuid: &str,
-    yolo_result: &YoloResult,
-    chunk_index_offset: u32,
-    fps: f64,
-    similarity_threshold: f32,
-    min_frames_per_chunk: usize,
-) -> Vec<crate::core::chunk::Chunk> {
-    let mut chunks = Vec::new();
-
-    if yolo_result.frames.is_empty() {
-        return chunks;
-    }
-
-    let mut current_chunk_frames: Vec<YoloFrame> = Vec::new();
-    let mut chunk_index = chunk_index_offset;
-    let mut current_start_frame = 0;
-
-    for (i, frame) in yolo_result.frames.iter().enumerate() {
-        if current_chunk_frames.is_empty() {
-            current_chunk_frames.push(frame.clone());
-            current_start_frame = frame.frame as i64;
-            continue;
-        }
-
-        // 檢查相似度（簡化版本：檢查物件類別是否相同）
-        let last_frame = current_chunk_frames.last().unwrap();
-        let similarity = calculate_frame_similarity(last_frame, frame);
-
-        if similarity >= similarity_threshold {
-            // 相似度高，加入當前分片
-            current_chunk_frames.push(frame.clone());
-        } else {
-            // 相似度低，創建新分片
-            if current_chunk_frames.len() >= min_frames_per_chunk {
-                let end_frame = current_chunk_frames.last().unwrap().frame as i64 + 1;
-
-                let chunk = crate::core::chunk::Chunk::from_yolo_frames(
-                    file_id,
-                    uuid.to_string(),
-                    format!("vis_{}", chunk_index),
-                    current_start_frame,
-                    end_frame,
-                    fps,
-                    current_chunk_frames.clone(),
-                );
-
-                chunks.push(chunk);
-                chunk_index += 1;
-            }
-
-            // 開始新的分片
-            current_chunk_frames = vec![frame.clone()];
-            current_start_frame = frame.frame as i64;
-        }
-    }
-
-    // 處理最後一個分片
-    if current_chunk_frames.len() >= min_frames_per_chunk {
-        let end_frame = current_chunk_frames.last().unwrap().frame as i64 + 1;
-
-        let chunk = crate::core::chunk::Chunk::from_yolo_frames(
-            file_id,
-            uuid.to_string(),
-            format!("vis_{}", chunk_index),
-            current_start_frame,
-            end_frame,
-            fps,
-            current_chunk_frames,
-        );
-
-        chunks.push(chunk);
-    }
-
-    chunks
-}
-
-/// 計算兩個幀之間的相似度（基於物件類別）
-fn calculate_frame_similarity(frame1: &YoloFrame, frame2: &YoloFrame) -> f32 {
-    if frame1.objects.is_empty() && frame2.objects.is_empty() {
-        return 1.0;
-    }
-
-    if frame1.objects.is_empty() || frame2.objects.is_empty() {
-        return 0.0;
-    }
-
-    let set1: std::collections::HashSet<String> = frame1
-        .objects
-        .iter()
-        .map(|o| o.class_name.clone())
-        .collect();
-    let set2: std::collections::HashSet<String> = frame2
-        .objects
-        .iter()
-        .map(|o| o.class_name.clone())
-        .collect();
-
-    let intersection: Vec<_> = set1.intersection(&set2).collect();
-    let union: Vec<_> = set1.union(&set2).collect();
-
-    if union.is_empty() {
-        0.0
-    } else {
-        intersection.len() as f32 / union.len() as f32
-    }
-}
-
-/// 使用 Python 腳本生成視覺分片（進階版本）
-pub async fn process_visual_chunk_advanced(
-    video_path: &str,
-    output_path: &str,
-    uuid: Option<&str>,
-) -> Result<VisualChunkResult> {
-    let executor = PythonExecutor::new()?;
-    let script_path = executor.script_path("visual_chunk_processor.py");
-
-    tracing::info!(
-        "[VisualChunk] Starting advanced visual chunk generation: {}",
-        video_path
-    );
-
-    if !script_path.exists() {
-        tracing::warn!("[VisualChunk] Script not found, using basic generation");
-        // 這裡可以回退到基本生成方法
-        return Ok(VisualChunkResult {
-            chunk_count: 0,
-            total_frames: 0,
-            total_objects: 0,
-            unique_classes: 0,
-            chunks: vec![],
-        });
-    }
-
-    let yolo_path = uuid.map(|u| {
-        std::path::PathBuf::from(crate::core::config::OUTPUT_DIR.as_str())
-            .join(format!("{}.yolo.json", u))
-            .to_string_lossy()
-            .to_string()
-    });
-    let args: &[&str] = if let Some(ref yp) = yolo_path {
-        &[video_path, output_path, "--yolo-result", yp]
-    } else {
-        &[video_path, output_path]
-    };
-    let result = match executor
-        .run(
-            "visual_chunk_processor.py",
-            args,
-            uuid,
-            "VisualChunk",
-            Some(VISUAL_CHUNK_TIMEOUT),
-        )
-        .await
-    {
-        Ok(_) => match std::fs::read_to_string(output_path) {
-            Ok(json_str) => match serde_json::from_str::<VisualChunkResult>(&json_str) {
-                Ok(r) => r,
-                Err(e) => {
-                    tracing::warn!(
-                        "[VisualChunk] Failed to parse output ({}), returning empty",
-                        e
-                    );
-                    VisualChunkResult::default()
-                }
-            },
-            Err(e) => {
-                tracing::warn!(
-                    "[VisualChunk] Failed to read output ({}), returning empty",
-                    e
-                );
-                VisualChunkResult::default()
-            }
-        },
-        Err(e) => {
-            tracing::warn!(
-                "[VisualChunk] Failed to run script ({}), returning empty",
-                e
-            );
-            VisualChunkResult::default()
-        }
-    };
-
-    tracing::info!(
-        "[VisualChunk] Advanced generation result: {} chunks, {} frames",
-        result.chunk_count,
-        result.total_frames
-    );
-
-    Ok(result)
-}
-
-#[cfg(test)]
-mod tests {
-    use super::*;
-
-    #[test]
-    fn test_calculate_frame_similarity() {
-        use crate::core::processor::yolo::{YoloFrame, YoloObject};
-
-        let frame1 = YoloFrame {
-            frame: 0,
-            timestamp: 0.0,
-            objects: vec![
-                YoloObject {
-                    class_name: "person".to_string(),
-                    class_id: 0,
-                    x: 100,
-                    y: 200,
-                    width: 50,
-                    height: 100,
-                    confidence: 0.95,
-                },
-                YoloObject {
-                    class_name: "car".to_string(),
-                    class_id: 2,
-                    x: 300,
-                    y: 150,
-                    width: 80,
-                    height: 60,
-                    confidence: 0.87,
-                },
-            ],
-        };
-
-        let frame2 = YoloFrame {
-            frame: 1,
-            timestamp: 0.033,
-            objects: vec![
-                YoloObject {
-                    class_name: "person".to_string(),
-                    class_id: 0,
-                    x: 110,
-                    y: 210,
-                    width: 52,
-                    height: 102,
-                    confidence: 0.92,
-                },
-                YoloObject {
-                    class_name: "car".to_string(),
-                    class_id: 2,
-                    x: 310,
-                    y: 155,
-                    width: 82,
-                    height: 62,
-                    confidence: 0.85,
-                },
-            ],
-        };
-
-        let frame3 = YoloFrame {
-            frame: 2,
-            timestamp: 0.066,
-            objects: vec![YoloObject {
-                class_name: "dog".to_string(),
-                class_id: 16,
-                x: 150,
-                y: 250,
-                width: 40,
-                height: 60,
-                confidence: 0.78,
-            }],
-        };
-
-        // 相同物件的幀應該高度相似
-        let similarity_same = calculate_frame_similarity(&frame1, &frame2);
-        assert!((similarity_same - 1.0).abs() < 0.001);
-
-        // 不同物件的幀應該不相似
-        let similarity_diff = calculate_frame_similarity(&frame1, &frame3);
-        assert!((similarity_diff - 0.0).abs() < 0.001);
-
-        // 空幀應該完全相似
-        let empty_frame = YoloFrame {
-            frame: 3,
-            timestamp: 0.1,
-            objects: vec![],
-        };
-        let similarity_empty = calculate_frame_similarity(&empty_frame, &empty_frame);
-        assert!((similarity_empty - 1.0).abs() < 0.001);
-    }
-
-    #[tokio::test]
-    async fn test_create_fixed_frame_chunks() {
-        use crate::core::processor::yolo::{YoloFrame, YoloObject, YoloResult};
-
-        // 創建測試 YOLO 結果（60 幀，每幀都有物件）
-        let mut frames = Vec::new();
-        for i in 0..60 {
-            frames.push(YoloFrame {
-                frame: i as u64,
-                timestamp: i as f64 / 30.0, // 假設 fps=30
-                objects: vec![YoloObject {
-                    class_name: "person".to_string(),
-                    class_id: 0,
-                    x: 100,
-                    y: 200,
-                    width: 50,
-                    height: 100,
-                    confidence: 0.9,
-                }],
-            });
-        }
-
-        let yolo_result = YoloResult {
-            frame_count: 60,
-            fps: 30.0,
-            frames,
-        };
-
-        let chunks = create_fixed_frame_chunks(1, "test-uuid", &yolo_result, 0, 30.0);
-
-        // 60 幀，每 30 幀一個分片，應該有 2 個分片
-        assert_eq!(chunks.len(), 2);
-
-        // 檢查第一個分片
-        let first_chunk = &chunks[0];
-        assert_eq!(
-            first_chunk.chunk_type,
-            crate::core::chunk::ChunkType::Visual
-        );
-        assert_eq!(first_chunk.start_frame, 0);
-        assert_eq!(first_chunk.end_frame, 30); // exclusive
-        assert_eq!(first_chunk.frame_count, 30);
-
-        // 檢查第二個分片
-        let second_chunk = &chunks[1];
-        assert_eq!(
-            second_chunk.chunk_type,
-            crate::core::chunk::ChunkType::Visual
-        );
-        assert_eq!(second_chunk.start_frame, 30);
-        assert_eq!(second_chunk.end_frame, 60); // exclusive
-        assert_eq!(second_chunk.frame_count, 30);
-    }
-
-    #[test]
-    fn test_create_similarity_based_chunks() {
-        use crate::core::processor::yolo::{YoloFrame, YoloObject, YoloResult};
-
-        // 創建測試 YOLO 結果
-        let frames = vec![
-            YoloFrame {
-                // 幀 0-4: 都有 person 和 car
-                frame: 0,
-                timestamp: 0.0,
-                objects: vec![
-                    YoloObject {
-                        class_name: "person".to_string(),
-                        class_id: 0,
-                        x: 100,
-                        y: 200,
-                        width: 50,
-                        height: 100,
-                        confidence: 0.9,
-                    },
-                    YoloObject {
-                        class_name: "car".to_string(),
-                        class_id: 2,
-                        x: 300,
-                        y: 150,
-                        width: 80,
-                        height: 60,
-                        confidence: 0.8,
-                    },
-                ],
-            },
-            YoloFrame {
-                // 幀 1
-                frame: 1,
-                timestamp: 0.033,
-                objects: vec![
-                    YoloObject {
-                        class_name: "person".to_string(),
-                        class_id: 0,
-                        x: 110,
-                        y: 210,
-                        width: 52,
-                        height: 102,
-                        confidence: 0.88,
-                    },
-                    YoloObject {
-                        class_name: "car".to_string(),
-                        class_id: 2,
-                        x: 310,
-                        y: 155,
-                        width: 82,
-                        height: 62,
-                        confidence: 0.78,
-                    },
-                ],
-            },
-            YoloFrame {
-                // 幀 5-9: 只有 dog
-                frame: 5,
-                timestamp: 0.166,
-                objects: vec![YoloObject {
-                    class_name: "dog".to_string(),
-                    class_id: 16,
-                    x: 150,
-                    y: 250,
-                    width: 40,
-                    height: 60,
-                    confidence: 0.7,
-                }],
-            },
-            YoloFrame {
-                // 幀 6
-                frame: 6,
-                timestamp: 0.2,
-                objects: vec![YoloObject {
-                    class_name: "dog".to_string(),
-                    class_id: 16,
-                    x: 155,
-                    y: 255,
-                    width: 42,
-                    height: 62,
-                    confidence: 0.68,
-                }],
-            },
-        ];
-
-        let yolo_result = YoloResult {
-            frame_count: 7,
-            fps: 30.0,
-            frames,
-        };
-
-        let chunks = create_similarity_based_chunks(
-            1,
-            "test-uuid",
-            &yolo_result,
-            0,
-            30.0,
-            0.5, // similarity threshold
-            2,   // min frames per chunk
-        );
-
-        // 應該有 2 個分片：一個是 person+car，一個是 dog
-        assert_eq!(chunks.len(), 2);
-    }
-}
diff --git a/src/core/thumbnail/mod.rs b/src/core/thumbnail/mod.rs
index ee1a9c9..41d6c5c 100644
--- a/src/core/thumbnail/mod.rs
+++ b/src/core/thumbnail/mod.rs
@@ -1,3 +1,5 @@
+pub mod validator;
+
 use anyhow::{Context, Result};
 use serde::{Deserialize, Serialize};
 use std::path::{Path, PathBuf};
diff --git a/src/core/thumbnail/validator.rs b/src/core/thumbnail/validator.rs
new file mode 100644
index 0000000..456104f
--- /dev/null
+++ b/src/core/thumbnail/validator.rs
@@ -0,0 +1,234 @@
+//! Validation helpers for thumbnail extraction.
+//!
+//! Provides cheap byte-level JPEG framing checks plus bounds checks for frame
+//! numbers and crop rectangles. Nothing here decodes image data.
+
+use anyhow::{bail, Result};
+
+/// Minimum byte length [`validate_jpeg`] accepts.
+pub const JPEG_MIN_SIZE: usize = 100;
+/// Leading bytes [`validate_jpeg`] requires: the SOI marker `FF D8` followed by `FF`.
+pub const JPEG_SOI_MARKER: [u8; 3] = [0xFF, 0xD8, 0xFF];
+/// Trailing bytes [`validate_jpeg`] requires: the EOI marker `FF D9`.
+pub const JPEG_EOI_MARKER: [u8; 2] = [0xFF, 0xD9];
+
+/// Checks that `data` is framed like a complete JPEG.
+///
+/// Three checks run in order: length is at least [`JPEG_MIN_SIZE`], the buffer
+/// starts with [`JPEG_SOI_MARKER`], and it ends with [`JPEG_EOI_MARKER`].
+///
+/// # Errors
+///
+/// Returns an error describing the first check that fails.
+pub fn validate_jpeg(data: &[u8]) -> Result<()> {
+    if data.len() < JPEG_MIN_SIZE {
+        bail!(
+            "JPEG too small: {} bytes (minimum {})",
+            data.len(),
+            JPEG_MIN_SIZE
+        );
+    }
+
+    // The length check above keeps the slices used in the messages in bounds.
+    if !data.starts_with(&JPEG_SOI_MARKER) {
+        bail!(
+            "Invalid JPEG header: expected {:02X?}, got {:02X?}",
+            JPEG_SOI_MARKER,
+            &data[..JPEG_SOI_MARKER.len()]
+        );
+    }
+
+    if !data.ends_with(&JPEG_EOI_MARKER) {
+        bail!(
+            "Incomplete JPEG: missing EOI marker, got {:02X?}",
+            &data[data.len() - JPEG_EOI_MARKER.len()..]
+        );
+    }
+
+    Ok(())
+}
+
+/// Returns `true` when [`validate_jpeg`] accepts `data`.
+pub fn is_valid_jpeg(data: &[u8]) -> bool {
+    validate_jpeg(data).is_ok()
+}
+
+/// Returns `true` when `data` is at least [`JPEG_MIN_SIZE`] bytes long.
+pub fn jpeg_size_ok(data: &[u8]) -> bool {
+    data.len() >= JPEG_MIN_SIZE
+}
+
+/// Returns `true` when `data` starts with [`JPEG_SOI_MARKER`].
+pub fn jpeg_header_ok(data: &[u8]) -> bool {
+    data.starts_with(&JPEG_SOI_MARKER)
+}
+
+/// Returns `true` when `data` ends with [`JPEG_EOI_MARKER`].
+pub fn jpeg_footer_ok(data: &[u8]) -> bool {
+    data.ends_with(&JPEG_EOI_MARKER)
+}
+
+/// Checks that `frame` lies in `0..=total_frames`.
+///
+/// The upper bound is inclusive: `frame == total_frames` is accepted.
+///
+/// # Errors
+///
+/// Returns an error when `frame` is negative or greater than `total_frames`.
+pub fn validate_frame(frame: i64, total_frames: i64) -> Result<()> {
+    if frame < 0 {
+        bail!("Frame number cannot be negative: {}", frame);
+    }
+    if frame > total_frames {
+        bail!("Frame {} exceeds total frames {}", frame, total_frames);
+    }
+    Ok(())
+}
+
+/// Checks that the crop rectangle `(x, y, w, h)` fits inside the video frame.
+///
+/// `x` and `y` must be non-negative, `w` and `h` strictly positive, and the
+/// rectangle's right and bottom edges must not pass `video_width` and
+/// `video_height`.
+///
+/// # Errors
+///
+/// Returns an error naming the first constraint that is violated.
+pub fn validate_crop(
+    x: i32,
+    y: i32,
+    w: i32,
+    h: i32,
+    video_width: i32,
+    video_height: i32,
+) -> Result<()> {
+    if x < 0 || y < 0 || w <= 0 || h <= 0 {
+        bail!(
+            "Invalid crop parameters: x={}, y={}, w={}, h={} (must be positive)",
+            x,
+            y,
+            w,
+            h
+        );
+    }
+
+    // Sum in i64: `x + w` in i32 overflows for large inputs, which panics in
+    // debug builds and wraps negative in release, letting the crop through.
+    let right = i64::from(x) + i64::from(w);
+    if right > i64::from(video_width) {
+        bail!(
+            "Crop width exceeds video: x+w={} > video_width={}",
+            right,
+            video_width
+        );
+    }
+    let bottom = i64::from(y) + i64::from(h);
+    if bottom > i64::from(video_height) {
+        bail!(
+            "Crop height exceeds video: y+h={} > video_height={}",
+            bottom,
+            video_height
+        );
+    }
+    Ok(())
+}
+
+#[cfg(test)]
+mod tests {
+    use super::*;
+
+    /// Builds a 101-byte buffer framed like a JPEG: SOI, bytes 0x00..=0x5F, EOI.
+    fn sample_jpeg() -> Vec<u8> {
+        let mut bytes = JPEG_SOI_MARKER.to_vec();
+        bytes.extend(0x00..=0x5F_u8);
+        bytes.extend_from_slice(&JPEG_EOI_MARKER);
+        bytes
+    }
+
+    #[test]
+    fn test_validate_jpeg_valid() {
+        assert!(validate_jpeg(&sample_jpeg()).is_ok());
+    }
+
+    #[test]
+    fn test_validate_jpeg_too_small() {
+        let small_data = vec![0xFF, 0xD8, 0xFF, 0xFF, 0xD9];
+        assert!(validate_jpeg(&small_data).is_err());
+    }
+
+    #[test]
+    fn test_validate_jpeg_invalid_header() {
+        // Full-size buffer, so the failure comes from the header check rather
+        // than from the minimum-size check.
+        let mut invalid_header = sample_jpeg();
+        invalid_header[..3].fill(0x00);
+        let err = validate_jpeg(&invalid_header).unwrap_err();
+        assert!(err.to_string().contains("Invalid JPEG header"));
+    }
+
+    #[test]
+    fn test_validate_jpeg_missing_footer() {
+        // Full-size buffer with the final EOI byte overwritten.
+        let mut missing_footer = sample_jpeg();
+        let last = missing_footer.len() - 1;
+        missing_footer[last] = 0x00;
+        let err = validate_jpeg(&missing_footer).unwrap_err();
+        assert!(err.to_string().contains("missing EOI marker"));
+    }
+
+    #[test]
+    fn test_validate_frame_valid() {
+        assert!(validate_frame(500, 1000).is_ok());
+        assert!(validate_frame(0, 1000).is_ok());
+        assert!(validate_frame(1000, 1000).is_ok());
+    }
+
+    #[test]
+    fn test_validate_frame_exceeds() {
+        assert!(validate_frame(1001, 1000).is_err());
+        assert!(validate_frame(-1, 1000).is_err());
+    }
+
+    #[test]
+    fn test_validate_crop_valid() {
+        assert!(validate_crop(100, 100, 200, 200, 1920, 1080).is_ok());
+        assert!(validate_crop(0, 0, 1920, 1080, 1920, 1080).is_ok());
+    }
+
+    #[test]
+    fn test_validate_crop_exceeds_width() {
+        assert!(validate_crop(1800, 100, 200, 200, 1920, 1080).is_err());
+    }
+
+    #[test]
+    fn test_validate_crop_exceeds_height() {
+        assert!(validate_crop(100, 900, 200, 200, 1920, 1080).is_err());
+    }
+
+    #[test]
+    fn test_validate_crop_negative() {
+        assert!(validate_crop(-1, 100, 200, 200, 1920, 1080).is_err());
+        assert!(validate_crop(100, -1, 200, 200, 1920, 1080).is_err());
+    }
+
+    #[test]
+    fn test_validate_crop_overflow() {
+        // `x + w` / `y + h` would overflow i32 here; both must be rejected.
+        assert!(validate_crop(i32::MAX, 0, 1, 1, 1920, 1080).is_err());
+        assert!(validate_crop(0, i32::MAX, 1, 1, 1920, 1080).is_err());
+    }
+
+    #[test]
+    fn test_is_valid_jpeg() {
+        assert!(is_valid_jpeg(&sample_jpeg()));
+        assert!(!is_valid_jpeg(&[0xFF, 0xD8, 0xFF, 0xFF, 0xD9])); // too small
+    }
+
+    #[test]
+    fn test_jpeg_helpers() {
+        let valid_jpeg = sample_jpeg();
+        assert!(jpeg_size_ok(&valid_jpeg));
+        assert!(jpeg_header_ok(&valid_jpeg));
+        assert!(jpeg_footer_ok(&valid_jpeg));
+    }
+}
diff --git a/src/core/tmdb/probe.rs b/src/core/tmdb/probe.rs
index d010117..b9ff9a3 100644
--- a/src/core/tmdb/probe.rs
+++ b/src/core/tmdb/probe.rs
@@ -91,22 +91,21 @@ async fn upsert_identities_from_disk(
                 {
                     Ok(identity_file) => {
                         let identities_table = crate::core::db::schema::table_name("identities");
+                        let uuid_clean = identity_file.identity_uuid.replace('-', "");
                         let result = sqlx::query(&format!(
                             "INSERT INTO {} (uuid, name, identity_type, source, status, tmdb_id, tmdb_profile, metadata) \
-                             VALUES ($1::uuid, $2, 'people', 'tmdb', 'confirmed', $3, $4, $5::jsonb) \
+                             VALUES (gen_random_uuid(), $1, 'people', 'tmdb', 'confirmed', $2, $3, $4::jsonb) \
                              ON CONFLICT (tmdb_id) WHERE tmdb_id IS NOT NULL DO UPDATE SET \
-                             uuid = COALESCE({}.uuid, $1::uuid), \
                              tmdb_profile = COALESCE(EXCLUDED.tmdb_profile, {}.tmdb_profile), \
-                             metadata = {}.metadata || $5::jsonb",
-                            identities_table, identities_table, identities_table, identities_table
-                        ))
-                        .bind(&identity_file.identity_uuid)
-                        .bind(&identity_file.name)
-                        .bind(identity_file.tmdb_id)
-                        .bind(&identity_file.tmdb_profile)
-                        .bind(&identity_file.metadata)
-                        .execute(db.pool())
-                        .await;
+                             metadata = jsonb_deep_merge({}.metadata, $4::jsonb)",
+                             identities_table, identities_table, identities_table
+                         ))
+                         .bind(&identity_file.name)
+                         .bind(identity_file.tmdb_id)
+                         .bind(&identity_file.tmdb_profile)
+                         .bind(&identity_file.metadata)
+                         .execute(db.pool())
+                         .await;
 
                         match result {
                             Ok(_) => {
@@ -226,7 +225,7 @@ pub async fn create_identities_from_data(
              VALUES ($1, 'people', 'tmdb', 'confirmed', $2, $3, $4::jsonb) \
              ON CONFLICT (tmdb_id) WHERE tmdb_id IS NOT NULL DO UPDATE SET \
              tmdb_profile = COALESCE(EXCLUDED.tmdb_profile, {}.tmdb_profile), \
-             metadata = {}.metadata || $4::jsonb \
+             metadata = jsonb_deep_merge({}.metadata, $4::jsonb) \
              RETURNING uuid",
              identities_table, identities_table, identities_table
         ))
diff --git a/src/playground.rs b/src/playground.rs
index a36fa6e..eead128 100644
--- a/src/playground.rs
+++ b/src/playground.rs
@@ -2426,7 +2426,7 @@ async fn main() -> Result<()> {
                 .await
                 .context("Failed to init PostgreSQL")?;
             let qdrant = QdrantDb::init().await.context("Failed to init Qdrant")?;
-            let embedder = Embedder::new("nomic-embed-text-v2-moe:latest".to_string());
+            let embedder = Embedder::new("embeddinggemma-300m".to_string());
 
             let target_uuid = if uuid == "all" {
                 None
diff --git a/src/verification/verifier.rs b/src/verification/verifier.rs
index d6bab51..cb1f1c5 100644
--- a/src/verification/verifier.rs
+++ b/src/verification/verifier.rs
@@ -41,7 +41,6 @@ pub fn verify_output(processor: &ProcessorType, file_uuid: &str) -> Verification
     let proc_name = processor.as_str();
     let filename = match processor {
         ProcessorType::Story => format!("{}.story_story.json", file_uuid),
-        ProcessorType::FiveW1H => format!("{}.story_llm.json", file_uuid),
         _ => format!("{}.{}.json", file_uuid, proc_name),
     };
     let output_path = PathBuf::from(OUTPUT_DIR.as_str()).join(&filename);
@@ -65,7 +64,7 @@ pub fn verify_output(processor: &ProcessorType, file_uuid: &str) -> Verification
     };
 
     match processor {
-        ProcessorType::Asr | ProcessorType::Asrx => {
+        ProcessorType::Asrx => {
             let segs = value.get("segments").and_then(|v| v.as_array());
             match segs {
                 Some(_) => VerificationResult::ok(proc_name, file_uuid),
@@ -105,18 +104,8 @@ pub fn verify_output(processor: &ProcessorType, file_uuid: &str) -> Verification
                 None => VerificationResult::ok(proc_name, file_uuid),
             }
         }
-        ProcessorType::VisualChunk => VerificationResult::ok(proc_name, file_uuid),
         ProcessorType::Story => VerificationResult::ok(proc_name, file_uuid),
-        ProcessorType::FiveW1H => {
-            let scenes = value.get("scenes").and_then(|v| v.as_array());
-            match scenes {
-                Some(s) if s.is_empty() => {
-                    VerificationResult::fail(proc_name, file_uuid, "0 scenes")
-                }
-                Some(_) => VerificationResult::ok(proc_name, file_uuid),
-                None => VerificationResult::ok(proc_name, file_uuid),
-            }
-        }
+        _ => VerificationResult::ok(proc_name, file_uuid),
     }
 }
 
diff --git a/src/worker/job_worker.rs b/src/worker/job_worker.rs
index ffc5b23..55b0023 100644
--- a/src/worker/job_worker.rs
+++ b/src/worker/job_worker.rs
@@ -91,6 +91,7 @@ impl JobWorker {
         self.processor_pool.sweep_stale().await;
 
         // Reset stale running jobs: jobs stuck in 'running' with no active processor results
+        // Exclude jobs where all processor_results are completed (waiting for ingestion)
         let monitor_jobs_table = schema::table_name("monitor_jobs");
         let processor_results_table = schema::table_name("processor_results");
         if let Err(e) = sqlx::query(&format!(
@@ -99,8 +100,13 @@ impl JobWorker {
              AND id NOT IN (
                  SELECT DISTINCT job_id FROM {}
                  WHERE status IN ('pending', 'running')
+             )
+             AND id NOT IN (
+                 SELECT job_id FROM {}
+                 GROUP BY job_id
+                 HAVING bool_and(status = 'completed')
              )",
-            monitor_jobs_table, processor_results_table
+            monitor_jobs_table, processor_results_table, processor_results_table
         ))
         .execute(self.db.pool())
         .await
@@ -197,9 +203,9 @@ impl JobWorker {
                     job.processors.len()
                 };
                 let should_retry = self
-                    .check_and_complete_job(job.id, &job.uuid, expected_count)
+                    .check_and_complete_job(job.id, &job.uuid, &job.processors, expected_count)
                     .await
-                    .is_ok();
+                    .unwrap_or(false);
                 if should_retry && self.processor_pool.can_start().await {
                     if let Err(e) = self.process_job(job.clone()).await {
                         error!("Failed to reprocess job {}: {}", job.uuid, e);
@@ -708,14 +714,14 @@ impl JobWorker {
         } else {
             job.processors.len()
         };
-        self.check_and_complete_job(job.id, &job.uuid, expected_count)
+        self.check_and_complete_job(job.id, &job.uuid, &job.processors, expected_count)
             .await?;
 
         Ok(())
     }
 
     /// 檢查所有入庫步驟是否已完成（與 ingestion-status endpoint 同步邏輯）
-    async fn ingestion_complete(pool: &PgPool, uuid: &str) -> bool {
+    async fn ingestion_complete(pool: &PgPool, uuid: &str, job_processors: &[String]) -> bool {
         let chunk_t = schema::table_name("chunk");
         let fd_t = schema::table_name("face_detections");
 
@@ -730,18 +736,30 @@ impl JobWorker {
         }
 
         let fu = uuid;
-        let rule1 = check!(&format!(
-            "SELECT 1 FROM {chunk_t} WHERE file_uuid = '{fu}' AND chunk_type = 'sentence' LIMIT 1"
-        ));
-        let vector = check!(&format!("SELECT 1 FROM {chunk_t} WHERE file_uuid = '{fu}' AND chunk_type = 'sentence' AND embedding IS NOT NULL LIMIT 1"));
-        let rule3 = check!(&format!(
-            "SELECT 1 FROM {chunk_t} WHERE file_uuid = '{fu}' AND chunk_type = 'cut' LIMIT 1"
-        ));
-        let trace = check!(&format!("SELECT COUNT(DISTINCT trace_id) FROM {fd_t} WHERE file_uuid = '{fu}' AND trace_id IS NOT NULL"));
+        // Only check conditions relevant to the job's processors
+        let has_asr_or_asrx = job_processors.is_empty()
+            || job_processors.iter().any(|p| p == "asrx" || p == "asr");
+        let has_cut = job_processors.is_empty()
+            || job_processors.iter().any(|p| p == "cut");
+        let has_face = job_processors.is_empty()
+            || job_processors.iter().any(|p| p == "face");
+
+        let rule1 = !has_asr_or_asrx
+            || check!(&format!(
+                "SELECT 1 FROM {chunk_t} WHERE file_uuid = '{fu}' AND chunk_type = 'sentence' LIMIT 1"
+            ));
+        let vector = !has_asr_or_asrx
+            || check!(&format!("SELECT 1 FROM {chunk_t} WHERE file_uuid = '{fu}' AND chunk_type = 'sentence' AND embedding IS NOT NULL LIMIT 1"));
+        let rule3 = !has_cut
+            || check!(&format!(
+                "SELECT 1 FROM {chunk_t} WHERE file_uuid = '{fu}' AND chunk_type = 'cut' LIMIT 1"
+            ));
+        let trace = !has_face
+            || check!(&format!("SELECT COUNT(DISTINCT trace_id) FROM {fd_t} WHERE file_uuid = '{fu}' AND trace_id IS NOT NULL"));
         let all_ok = rule1 && vector && rule3 && trace;
         if !all_ok {
             tracing::info!(
-                "[Ingestion] waiting: rule1={rule1} vector={vector} rule3={rule3} trace={trace}"
+                "[Ingestion] waiting (uuid={fu}): rule1={rule1} vector={vector} rule3={rule3} trace={trace}"
             );
         }
         all_ok
@@ -751,8 +769,9 @@ impl JobWorker {
         &self,
         job_id: i32,
         uuid: &str,
+        job_processors: &[String],
         expected_count: usize,
-    ) -> Result<()> {
+    ) -> Result<bool> {
         let results = self.db.get_processor_results_by_job(job_id).await?;
 
         info!(
@@ -831,10 +850,29 @@ impl JobWorker {
             .await?;
 
         if has_asrx {
-            info!("📝 Prerequisites met for Rule 1 Chunking. Starting ingestion...");
-            let db_clone = self.db.clone();
-            let uuid_clone = uuid.to_string();
-            tokio::spawn(async move {
+            // Guard: only spawn Rule 1 if sentence chunks don't exist yet.
+            // EXISTS always returns exactly one BOOL row, so it decodes cleanly as `bool`;
+            // a bare `SELECT 1` is INT4 in Postgres and fails sqlx's type check as i64.
+            let chunk_t = schema::table_name("chunk");
+            let already_spawned: bool = sqlx::query_scalar::<_, bool>(
+                &format!(
+                    "SELECT EXISTS(SELECT 1 FROM {chunk_t} WHERE file_uuid = $1 AND chunk_type = 'sentence')"
+                ),
+            )
+            .bind(uuid)
+            .fetch_one(self.db.pool())
+            .await?;
+
+            if already_spawned {
+                info!(
+                    "✅ Rule 1 already completed for {}, skipping spawn",
+                    uuid
+                );
+            } else {
+                info!("📝 Prerequisites met for Rule 1 Chunking. Starting ingestion...");
+                let db_clone = self.db.clone();
+                let uuid_clone = uuid.to_string();
+                tokio::spawn(async move {
                 match db_clone.get_video_by_uuid(&uuid_clone).await {
                     Ok(Some(video)) => {
                         let fps = video.fps;
@@ -886,6 +924,7 @@ impl JobWorker {
                     Err(e) => error!("Failed to get video info for chunking: {}", e),
                 }
             });
+            }
         }
 
         if all_completed {
@@ -1031,12 +1070,12 @@ impl JobWorker {
                 });
             }
 
-            if !Self::ingestion_complete(self.db.pool(), uuid).await {
+            if !Self::ingestion_complete(self.db.pool(), uuid, job_processors).await {
                 info!(
                     "Job {}: all processors done, waiting for ingestion...",
                     job_id
                 );
-                return Ok(());
+                return Ok(false);
             }
 
             self.db
@@ -1114,7 +1153,7 @@ impl JobWorker {
                 .await?;
         }
 
-        Ok(())
+        Ok(false)
     }
 
     pub async fn shutdown(&self) {
diff --git a/src/worker/processor.rs b/src/worker/processor.rs
index 4c95aad..9702404 100644
--- a/src/worker/processor.rs
+++ b/src/worker/processor.rs
@@ -7,8 +7,6 @@ use std::sync::Arc;
 use tokio::sync::{mpsc, RwLock};
 use tracing::{error, info, warn};
 
-
-
 /// Guard that ensures processor pool cleanup runs even if the task panics.
 struct ProcessorCleanupGuard {
     job_id: i32,
@@ -28,17 +26,23 @@ impl Drop for ProcessorCleanupGuard {
             warn!("[ProcessorCleanupGuard] running lock contended");
         }
         if let Ok(mut guard) = self.running_count.try_write() {
-            if *guard > 0 { *guard -= 1; }
+            if *guard > 0 {
+                *guard -= 1;
+            }
         }
         match self.pipeline {
             PipelineType::Frame => {
                 if let Ok(mut guard) = self.frame_count.try_write() {
-                    if *guard > 0 { *guard -= 1; }
+                    if *guard > 0 {
+                        *guard -= 1;
+                    }
                 }
             }
             PipelineType::Time => {
                 if let Ok(mut guard) = self.time_count.try_write() {
-                    if *guard > 0 { *guard -= 1; }
+                    if *guard > 0 {
+                        *guard -= 1;
+                    }
                 }
             }
             PipelineType::Cross => {} // cross pipeline not tracked in slot counts
@@ -66,7 +70,6 @@ use crate::core::processor::face::FaceResult;
 use crate::core::processor::ocr::OcrResult;
 use crate::core::processor::pose::PoseResult;
 use crate::core::processor::scene_classification::SceneClassificationResult;
-use crate::core::processor::visual_chunk::VisualChunkResult;
 use crate::core::processor::yolo::YoloResult;
 use crate::worker::resources::SystemResources;
 
@@ -518,32 +521,10 @@ impl ProcessorPool {
         let total_frames = video.as_ref().map(|v| v.total_frames as i32).unwrap_or(0);
 
         match processor_type {
-            ProcessorType::Asr => {
-                let result =
-                    processor::process_asr(video_path, output_path.to_str().unwrap(), uuid).await?;
-                let chunks_produced = result.segments.len() as i32;
-                tracing::info!(
-                    "ASR completed, storing {} segments for {}",
-                    chunks_produced,
-                    job.uuid
-                );
-                if let Err(e) = Self::store_asr_chunks(db, &job.uuid, &result).await {
-                    tracing::error!("Failed to store ASR chunks for {}: {}", job.uuid, e);
-                }
-                Ok(ProcessorOutput {
-                    data: serde_json::to_value(result)?,
-                    chunks_produced,
-                    frames_processed: total_frames,
-                    total_frames,
-                    retry_count: 0,
-                    pid: 0,
-                })
-            }
             ProcessorType::Cut => {
                 let cut_path =
                     std::path::Path::new(&output_dir).join(format!("{}.cut.json", job.uuid));
                 let result = if cut_path.exists() {
-                    // CUT 在 register 階段已完成，直接載入
                     let content =
                         std::fs::read_to_string(&cut_path).context("Failed to read cut.json")?;
                     serde_json::from_str(&content).context("Failed to parse cut.json")?
@@ -624,10 +605,6 @@ impl ProcessorPool {
                 if let Err(e) = Self::store_face_chunks(db, &job.uuid, &result).await {
                     tracing::error!("Failed to store FACE chunks for {}: {}", job.uuid, e);
                 }
-                // 將 face embedding 寫入 Qdrant
-                if let Err(e) = Self::store_face_embeddings_to_qdrant(&job.uuid, &result).await {
-                    tracing::error!("Failed to store face embeddings to Qdrant: {}", e);
-                }
                 Ok(ProcessorOutput {
                     data: serde_json::to_value(result)?,
                     chunks_produced,
@@ -685,31 +662,6 @@ impl ProcessorPool {
                     pid: 0,
                 })
             }
-            ProcessorType::VisualChunk => {
-                let result = processor::process_visual_chunk_advanced(
-                    video_path,
-                    output_path.to_str().unwrap(),
-                    uuid,
-                )
-                .await?;
-                let chunks_produced = result.chunk_count as i32;
-                tracing::info!(
-                    "VisualChunk completed, storing {} chunks for {}",
-                    chunks_produced,
-                    job.uuid
-                );
-                if let Err(e) = Self::store_visual_chunk_chunks(db, &job.uuid, &result).await {
-                    tracing::error!("Failed to store VisualChunk chunks for {}: {}", job.uuid, e);
-                }
-                Ok(ProcessorOutput {
-                    data: serde_json::to_value(result)?,
-                    chunks_produced,
-                    frames_processed: total_frames,
-                    total_frames,
-                    retry_count: 0,
-                    pid: 0,
-                })
-            }
             ProcessorType::Scene => {
                 let scene_path =
                     std::path::Path::new(&output_dir).join(format!("{}.scene.json", job.uuid));
@@ -717,7 +669,6 @@ impl ProcessorPool {
                     std::path::Path::new(&output_dir).join(format!("{}.scene.err", job.uuid));
                 let scene_tmp =
                     std::path::Path::new(&output_dir).join(format!("{}.scene.tmp", job.uuid));
-                // 優先順序：.err（跳過）→ .json（載入）→ .tmp（等待或重新執行）
                 let result = if scene_err.exists() {
                     tracing::warn!("Scene previously failed for {}, skipping", job.uuid);
                     return Ok(ProcessorOutput {
@@ -1009,72 +960,6 @@ impl ProcessorPool {
         Ok(())
     }
 
-    /// 將 face embeddings 寫入 Qdrant momentry_dev_face collection
-    pub async fn store_face_embeddings_to_qdrant(
-        uuid: &str,
-        face_result: &FaceResult,
-    ) -> Result<()> {
-        let qdrant = QdrantDb::new();
-        let collection = format!(
-            "{}{}",
-            crate::core::config::REDIS_KEY_PREFIX
-                .as_str()
-                .trim_end_matches(':'),
-            "_face"
-        );
-
-        // 確保 collection 存在（dim=512 for FaceNet）
-        if let Err(e) = qdrant.ensure_collection(&collection, 512).await {
-            tracing::error!("Failed to ensure Qdrant face collection: {}", e);
-            return Ok(());
-        }
-
-        let mut count = 0;
-        for frame in &face_result.frames {
-            for face in &frame.faces {
-                if let Some(embedding) = &face.embedding {
-                    if embedding.len() != 512 {
-                        continue;
-                    }
-                    // 使用 hash 作為 Qdrant point ID（需要 unsigned integer）
-                    // 使用 frame number 作為 Qdrant point ID（u64）
-                    let point_id = frame.frame as u64;
-
-                    let payload = serde_json::json!({
-                        "file_uuid": uuid,
-                        "face_id": face.face_id,
-                        "frame": frame.frame,
-                        "timestamp": frame.timestamp,
-                        "x": face.x,
-                        "y": face.y,
-                        "width": face.width,
-                        "height": face.height,
-                        "confidence": face.confidence,
-                    });
-
-                    if let Err(e) = qdrant
-                        .upsert_vector_to_collection(
-                            &collection,
-                            point_id,
-                            embedding,
-                            Some(payload),
-                        )
-                        .await
-                    {
-                        tracing::error!("Failed to upsert face vector {}: {}", point_id, e);
-                    } else {
-                        count += 1;
-                    }
-                }
-            }
-        }
-
-        if count > 0 {
-            tracing::info!("Stored {} face embeddings to Qdrant for {}", count, uuid);
-        }
-        Ok(())
-    }
-
     /// 將 voice embeddings 寫入 Qdrant momentry_dev_voice collection
     pub async fn store_voice_embeddings_to_qdrant(
         uuid: &str,
@@ -1106,9 +991,22 @@ impl ProcessorPool {
                 if emb.len() != 192 {
                     continue;
                 }
+                // Point ID: hash(file_uuid + speaker_id + index) for global uniqueness
+                let point_id = {
+                    use sha2::{Digest, Sha256};
+                    let mut hasher = Sha256::new();
+                    hasher.update(uuid.as_bytes());
+                    hasher.update(b"_");
+                    hasher.update(segment.speaker_id.clone().unwrap_or_default().as_bytes());
+                    hasher.update(b"_");
+                    hasher.update(i.to_string().as_bytes());
+                    let hash = hasher.finalize();
+                    u64::from_be_bytes(hash[0..8].try_into().unwrap())
+                };
+
                 let payload = serde_json::json!({
                     "file_uuid": uuid,
-                    "speaker_id": segment.speaker_id,
+                    "speaker_id": segment.speaker_id.clone().unwrap_or_default(),
                     "segment_index": i,
                     "start_frame": segment.start_frame,
                     "end_frame": segment.end_frame,
@@ -1117,7 +1015,7 @@ impl ProcessorPool {
                 });
 
                 if let Err(e) = qdrant
-                    .upsert_vector_to_collection(&collection, i as u64, emb, Some(payload))
+                    .upsert_vector_to_collection(&collection, point_id, emb, Some(payload))
                     .await
                 {
                     tracing::error!("Failed to upsert voice vector {}: {}", i, e);
@@ -1174,6 +1072,7 @@ impl ProcessorPool {
         );
 
         let mut pre_chunks_to_store = Vec::new();
+        let mut speaker_detections = Vec::new();
 
         for (i, segment) in asrx_result.segments.iter().enumerate() {
             let data = serde_json::json!({
@@ -1184,28 +1083,23 @@ impl ProcessorPool {
 
             // ASRX is time-based, so we use segment index or start time as coordinate.
             pre_chunks_to_store.push((i as i64, Some(segment.start_time), data, None, None));
+
+            speaker_detections.push((
+                segment.speaker_id.clone().unwrap_or_default(),
+                segment.start_time,
+                segment.end_time,
+                segment.text.clone(),
+                None::<String>,     // chunk_id: unknown yet, filled later
+                0.0,                 // confidence: updated after binding
+            ));
         }
 
         db.store_raw_pre_chunks_batch(uuid, "asrx", &pre_chunks_to_store)
             .await?;
-        Ok(())
-    }
-
-    pub async fn store_visual_chunk_chunks(
-        db: &PostgresDb,
-        uuid: &str,
-        visual_chunk_result: &VisualChunkResult,
-    ) -> Result<()> {
-        for (i, chunk) in visual_chunk_result.chunks.iter().enumerate() {
-            match db.store_chunk(chunk).await {
-                Ok(_) => {
-                    tracing::info!("Stored VisualChunk chunk {} for video {}", i, uuid);
-                }
-                Err(e) => {
-                    tracing::error!("Failed to store VisualChunk chunk {}: {}", i, e);
-                }
-            }
-        }
+        db.store_raw_pre_chunks_batch(uuid, "asr", &pre_chunks_to_store)
+            .await?;
+        db.store_speaker_detections_batch(uuid, &speaker_detections)
+            .await?;
         Ok(())
     }
 
@@ -1256,7 +1150,7 @@ impl ProcessorPool {
             });
             let chunk_table = crate::core::db::schema::table_name("chunk");
             let _ = sqlx::query(&format!(
-                "UPDATE {} SET metadata = metadata || $1::jsonb WHERE file_uuid=$2 AND chunk_id=$3",
+                "UPDATE {} SET metadata = jsonb_deep_merge(COALESCE(metadata, '{{}}'::jsonb), $1::jsonb) WHERE file_uuid=$2 AND chunk_id=$3",
                 chunk_table
             ))
             .bind(&meta)
diff --git a/tests/visual_chunk_concept.rs b/tests/visual_chunk_concept.rs
deleted file mode 100644
index f613062..0000000
--- a/tests/visual_chunk_concept.rs
+++ /dev/null
@@ -1,451 +0,0 @@
-//! 視覺分片概念驗證測試
-//!
-//! 此測試驗證視覺分片的數據結構和基本功能
-
-/// 視覺分片類型
-#[derive(Debug, Clone, Copy, PartialEq)]
-pub enum ChunkType {
-    TimeBased,
-    Sentence,
-    Cut,
-    Trace,
-    Story,
-    Visual, // 視覺分片 (Phase 2.1)
-}
-
-impl ChunkType {
-    pub fn as_str(&self) -> &'static str {
-        match self {
-            ChunkType::TimeBased => "time",
-            ChunkType::Sentence => "sentence",
-            ChunkType::Cut => "cut",
-            ChunkType::Trace => "trace",
-            ChunkType::Story => "story",
-            ChunkType::Visual => "visual",
-        }
-    }
-}
-
-/// 檢測到的物件
-#[derive(Debug, Clone)]
-pub struct DetectedObject {
-    /// 物件類別名稱
-    pub class_name: String,
-    /// 物件類別 ID
-    pub class_id: u32,
-    /// 信心值 (0.0-1.0)
-    pub confidence: f32,
-    /// 邊界框 (x, y, width, height)
-    pub bbox: Option<(i32, i32, i32, i32)>,
-}
-
-/// 關鍵幀的物件列表
-#[derive(Debug, Clone)]
-pub struct KeyframeObjects {
-    /// 關鍵幀時間 (秒)
-    pub timestamp: f64,
-    /// 關鍵幀幀號
-    pub frame_number: u64,
-    /// 檢測到的物件
-    pub objects: Vec<DetectedObject>,
-}
-
-/// 視覺分片內容
-#[derive(Debug, Clone)]
-pub struct VisualChunkContent {
-    pub start_time: f64,
-    pub end_time: f64,
-    pub keyframe_objects: Vec<KeyframeObjects>,
-    pub dominant_objects: Vec<String>,
-    pub scene_description: Option<String>,
-    pub metadata: VisualMetadata,
-}
-
-/// 視覺元數據
-#[derive(Debug, Clone)]
-pub struct VisualMetadata {
-    pub object_count: u32,
-    pub unique_classes: Vec<String>,
-    pub max_confidence: f32,
-    pub avg_confidence: f32,
-    pub spatial_density: f32, // objects per frame
-}
-
-impl VisualChunkContent {
-    /// 獲取視覺分片的摘要
-    pub fn summary(&self) -> String {
-        let duration = self.end_time - self.start_time;
-        let frame_count = self.keyframe_objects.len();
-
-        format!(
-            "視覺分片: {:.1}s 到 {:.1}s (持續時間: {:.1}s, {} 幀). 物件: {} 個總計, {} 個唯一. 主要物件: {}",
-            self.start_time,
-            self.end_time,
-            duration,
-            frame_count,
-            self.metadata.object_count,
-            self.metadata.unique_classes.len(),
-            if self.dominant_objects.is_empty() {
-                "無".to_string()
-            } else {
-                self.dominant_objects.join(", ")
-            }
-        )
-    }
-
-    /// 檢查是否包含特定物件類別
-    pub fn contains_object(&self, class_name: &str) -> bool {
-        self.keyframe_objects
-            .iter()
-            .any(|ko| ko.objects.iter().any(|obj| obj.class_name == class_name))
-    }
-}
-
-/// 模擬 YOLO 結果
-#[derive(Debug, Clone)]
-pub struct MockYoloResult {
-    pub frames: Vec<MockYoloFrame>,
-}
-
-#[derive(Debug, Clone)]
-pub struct MockYoloFrame {
-    pub frame: u64,
-    pub timestamp: f64,
-    pub objects: Vec<MockYoloObject>,
-}
-
-#[derive(Debug, Clone)]
-pub struct MockYoloObject {
-    pub class_name: String,
-    pub class_id: u32,
-    pub x: i32,
-    pub y: i32,
-    pub width: i32,
-    pub height: i32,
-    pub confidence: f32,
-}
-
-impl MockYoloResult {
-    /// 從模擬 YOLO 結果創建視覺分片
-    pub fn to_visual_chunk(&self, start_frame: u64, end_frame: u64) -> Option<VisualChunkContent> {
-        let frames: Vec<_> = self
-            .frames
-            .iter()
-            .filter(|f| f.frame >= start_frame && f.frame <= end_frame)
-            .collect();
-
-        if frames.is_empty() {
-            return None;
-        }
-
-        // 轉換幀為關鍵幀物件
-        let keyframe_objects: Vec<KeyframeObjects> = frames
-            .iter()
-            .map(|frame| {
-                let objects: Vec<DetectedObject> = frame
-                    .objects
-                    .iter()
-                    .map(|obj| DetectedObject {
-                        class_name: obj.class_name.clone(),
-                        class_id: obj.class_id,
-                        confidence: obj.confidence,
-                        bbox: Some((obj.x, obj.y, obj.width, obj.height)),
-                    })
-                    .collect();
-                KeyframeObjects {
-                    timestamp: frame.timestamp,
-                    frame_number: frame.frame,
-                    objects,
-                }
-            })
-            .collect();
-
-        // 計算元數據
-        let total_objects: u32 = frames.iter().map(|f| f.objects.len() as u32).sum();
-        let all_classes: Vec<String> = frames
-            .iter()
-            .flat_map(|f| f.objects.iter().map(|o| o.class_name.clone()))
-            .collect();
-        let unique_classes: Vec<String> = all_classes
-            .iter()
-            .cloned()
-            .collect::<std::collections::HashSet<_>>()
-            .into_iter()
-            .collect();
-        let confidences: Vec<f32> = frames
-            .iter()
-            .flat_map(|f| f.objects.iter().map(|o| o.confidence))
-            .collect();
-        let max_confidence = confidences.iter().copied().fold(0.0f32, f32::max);
-        let avg_confidence = if !confidences.is_empty() {
-            confidences.iter().sum::<f32>() / confidences.len() as f32
-        } else {
-            0.0
-        };
-
-        let start_time = frames.first().map(|f| f.timestamp).unwrap_or(0.0);
-        let end_time = frames.last().map(|f| f.timestamp).unwrap_or(0.0);
-
-        // 查找主要物件（出現在大多數幀中的物件）
-        let mut object_counts = std::collections::HashMap::new();
-        for frame in &frames {
-            let frame_classes: std::collections::HashSet<_> =
-                frame.objects.iter().map(|o| o.class_name.clone()).collect();
-            for class in frame_classes {
-                *object_counts.entry(class).or_insert(0) += 1;
-            }
-        }
-
-        let mut dominant_objects: Vec<String> = object_counts
-            .into_iter()
-            .filter(|(_, count)| *count as f32 / frames.len() as f32 > 0.5) // 出現在 >50% 的幀中
-            .map(|(class, _)| class)
-            .collect();
-        dominant_objects.sort();
-
-        Some(VisualChunkContent {
-            start_time,
-            end_time,
-            keyframe_objects,
-            dominant_objects,
-            scene_description: None, // 可由 LLM 後期生成
-            metadata: VisualMetadata {
-                object_count: total_objects,
-                unique_classes,
-                max_confidence,
-                avg_confidence,
-                spatial_density: if frames.len() > 0 {
-                    total_objects as f32 / frames.len() as f32
-                } else {
-                    0.0
-                },
-            },
-        })
-    }
-}
-
-#[cfg(test)]
-mod tests {
-    use super::*;
-
-    #[test]
-    fn test_chunk_type_visual() {
-        let chunk_type = ChunkType::Visual;
-        assert_eq!(chunk_type.as_str(), "visual");
-        assert_eq!(chunk_type, ChunkType::Visual);
-    }
-
-    #[test]
-    fn test_visual_chunk_creation() {
-        // 創建模擬 YOLO 結果
-        let yolo_result = MockYoloResult {
-            frames: vec![
-                MockYoloFrame {
-                    frame: 0,
-                    timestamp: 0.0,
-                    objects: vec![
-                        MockYoloObject {
-                            class_name: "person".to_string(),
-                            class_id: 0,
-                            x: 100,
-                            y: 200,
-                            width: 50,
-                            height: 100,
-                            confidence: 0.95,
-                        },
-                        MockYoloObject {
-                            class_name: "car".to_string(),
-                            class_id: 2,
-                            x: 300,
-                            y: 150,
-                            width: 80,
-                            height: 60,
-                            confidence: 0.87,
-                        },
-                    ],
-                },
-                MockYoloFrame {
-                    frame: 1,
-                    timestamp: 0.033, // 1/30 秒
-                    objects: vec![MockYoloObject {
-                        class_name: "person".to_string(),
-                        class_id: 0,
-                        x: 110,
-                        y: 210,
-                        width: 52,
-                        height: 102,
-                        confidence: 0.92,
-                    }],
-                },
-            ],
-        };
-
-        // 從 YOLO 結果創建視覺分片
-        let chunk = yolo_result.to_visual_chunk(0, 1).unwrap();
-
-        // 驗證分片屬性
-        assert_eq!(chunk.start_time, 0.0);
-        assert_eq!(chunk.end_time, 0.033);
-        assert_eq!(chunk.metadata.object_count, 3);
-        assert_eq!(chunk.metadata.unique_classes.len(), 2);
-        assert!(chunk
-            .metadata
-            .unique_classes
-            .contains(&"person".to_string()));
-        assert!(chunk.metadata.unique_classes.contains(&"car".to_string()));
-        assert_eq!(chunk.dominant_objects, vec!["person"]);
-        assert_eq!(chunk.keyframe_objects.len(), 2);
-    }
-
-    #[test]
-    fn test_visual_chunk_content_methods() {
-        let content = VisualChunkContent {
-            start_time: 0.0,
-            end_time: 5.0,
-            keyframe_objects: vec![KeyframeObjects {
-                timestamp: 0.0,
-                frame_number: 0,
-                objects: vec![
-                    DetectedObject {
-                        class_name: "person".to_string(),
-                        class_id: 0,
-                        confidence: 0.95,
-                        bbox: Some((100, 200, 50, 100)),
-                    },
-                    DetectedObject {
-                        class_name: "car".to_string(),
-                        class_id: 2,
-                        confidence: 0.87,
-                        bbox: Some((300, 150, 80, 60)),
-                    },
-                ],
-            }],
-            dominant_objects: vec!["person".to_string()],
-            scene_description: Some("一個人站在車旁".to_string()),
-            metadata: VisualMetadata {
-                object_count: 2,
-                unique_classes: vec!["person".to_string(), "car".to_string()],
-                max_confidence: 0.95,
-                avg_confidence: 0.91,
-                spatial_density: 2.0,
-            },
-        };
-
-        // 測試摘要方法
-        let summary = content.summary();
-        assert!(summary.contains("視覺分片"));
-        assert!(summary.contains("person"));
-        assert!(summary.contains("車"));
-
-        // 測試 contains_object 方法
-        assert!(content.contains_object("person"));
-        assert!(content.contains_object("car"));
-        assert!(!content.contains_object("dog"));
-    }
-
-    #[test]
-    fn test_frame_similarity_concept() {
-        // 測試幀相似度計算概念
-        let frame1_objects = vec![
-            DetectedObject {
-                class_name: "person".to_string(),
-                class_id: 0,
-                confidence: 0.95,
-                bbox: Some((100, 200, 50, 100)),
-            },
-            DetectedObject {
-                class_name: "car".to_string(),
-                class_id: 2,
-                confidence: 0.87,
-                bbox: Some((300, 150, 80, 60)),
-            },
-        ];
-
-        let frame2_objects = vec![
-            DetectedObject {
-                class_name: "person".to_string(),
-                class_id: 0,
-                confidence: 0.92,
-                bbox: Some((110, 210, 52, 102)),
-            },
-            DetectedObject {
-                class_name: "car".to_string(),
-                class_id: 2,
-                confidence: 0.85,
-                bbox: Some((310, 155, 82, 62)),
-            },
-        ];
-
-        // 創建集合
-        let set1: std::collections::HashSet<String> = frame1_objects
-            .iter()
-            .map(|o| o.class_name.clone())
-            .collect();
-        let set2: std::collections::HashSet<String> = frame2_objects
-            .iter()
-            .map(|o| o.class_name.clone())
-            .collect();
-
-        // 計算交集和聯集
-        let intersection: Vec<_> = set1.intersection(&set2).collect();
-        let union: Vec<_> = set1.union(&set2).collect();
-
-        // 驗證相似度
-        assert_eq!(intersection.len(), 2); // person, car
-        assert_eq!(union.len(), 2); // person, car
-        assert_eq!(intersection.len() as f32 / union.len() as f32, 1.0); // 完全相似
-    }
-
-    #[test]
-    fn test_dominant_objects_detection() {
-        let yolo_result = MockYoloResult {
-            frames: vec![
-                MockYoloFrame {
-                    frame: 0,
-                    timestamp: 0.0,
-                    objects: vec![MockYoloObject {
-                        class_name: "person".to_string(),
-                        class_id: 0,
-                        x: 100,
-                        y: 200,
-                        width: 50,
-                        height: 100,
-                        confidence: 0.95,
-                    }],
-                },
-                MockYoloFrame {
-                    frame: 1,
-                    timestamp: 0.033,
-                    objects: vec![MockYoloObject {
-                        class_name: "person".to_string(),
-                        class_id: 0,
-                        x: 110,
-                        y: 210,
-                        width: 52,
-                        height: 102,
-                        confidence: 0.92,
-                    }],
-                },
-                MockYoloFrame {
-                    frame: 2,
-                    timestamp: 0.066,
-                    objects: vec![MockYoloObject {
-                        class_name: "car".to_string(),
-                        class_id: 2,
-                        x: 300,
-                        y: 150,
-                        width: 80,
-                        height: 60,
-                        confidence: 0.87,
-                    }],
-                },
-            ],
-        };
-
-        let chunk = yolo_result.to_visual_chunk(0, 2).unwrap();
-
-        // person 出現在 2/3 幀中（67% > 50%），car 出現在 1/3 幀中（33% < 50%）
-        assert_eq!(chunk.dominant_objects, vec!["person"]);
-        assert!(!chunk.dominant_objects.contains(&"car".to_string()));
-    }
-}