Initial Commit

2025-10-15 16:25:04 +02:00 · 2025-10-15 16:25:04 +02:00 · eb31ac1498
commit eb31ac1498
17 changed files with 4599 additions and 0 deletions
--- a/.claude/settings.local.json
+++ b/.claude/settings.local.json
@ -0,0 +1,9 @@
+{
+  "permissions": {
+    "allow": [
+      "Bash(chmod:*)"
+    ],
+    "deny": [],
+    "ask": []
+  }
+}
--- a/.env.example
+++ b/.env.example
@ -0,0 +1,56 @@
+# OpenAI API Configuration
+# Required for AI Vision (GPT-4o) cross-aspect-ratio matching
+# Get your API key from: https://platform.openai.com/api-keys
+
+OPENAI_API_KEY=your_api_key_here
+
+# =============================================================================
+# HOW AI VISION WORKS
+# =============================================================================
+#
+# AI Vision is a Tier 2 fallback that uses GPT-4o to detect matches when
+# perceptual hashing fails. This is especially useful for:
+#
+# ✓ Cross-aspect-ratio matching (16:9 → 1:1, 9:16, 4:5)
+# ✓ Cropped or zoomed adaptations
+# ✓ Pan-and-scan conversions
+# ✓ Videos with different text/logos/subtitles
+#
+# AI Vision is automatically triggered when:
+# - No matches found with perceptual hashing, OR
+# - Best match confidence is below 90%
+#
+# =============================================================================
+# COST INFORMATION
+# =============================================================================
+#
+# Model: GPT-4o (latest vision model)
+# Cost per comparison: ~$0.005-0.007 (10 images at low detail)
+#
+# Examples:
+# - 50 masters × 1 adaptation = ~$0.25-0.35
+# - 100 masters × 1 adaptation = ~$0.50-0.70
+#
+# Very affordable for production use!
+#
+# =============================================================================
+# DISABLING AI VISION
+# =============================================================================
+#
+# To disable AI Vision:
+# 1. Don't set OPENAI_API_KEY (leave it commented out), OR
+# 2. Set it to empty: OPENAI_API_KEY=
+#
+# The tool will work fine without AI Vision, but won't detect cross-aspect matches.
+#
+# =============================================================================
+# PRIVACY & SECURITY
+# =============================================================================
+#
+# - This .env file is in .gitignore and will NOT be committed
+# - Frame images are sent to OpenAI API for analysis
+# - No video files are uploaded, only extracted JPEG frames
+# - Frames are base64-encoded and sent over HTTPS
+# - Consider your content sensitivity before enabling
+#
+# =============================================================================
--- a/.gitignore
+++ b/.gitignore
@ -0,0 +1,368 @@
+# ============================================================================
+# Python
+# ============================================================================
+
+# Byte-compiled / optimized / DLL files
+__pycache__/
+*.py[cod]
+*$py.class
+
+# C extensions
+*.so
+
+# Distribution / packaging
+.Python
+build/
+develop-eggs/
+dist/
+downloads/
+eggs/
+.eggs/
+lib/
+lib64/
+parts/
+sdist/
+var/
+wheels/
+pip-wheel-metadata/
+share/python-wheels/
+*.egg-info/
+.installed.cfg
+*.egg
+MANIFEST
+
+# PyInstaller
+*.manifest
+*.spec
+
+# Installer logs
+pip-log.txt
+pip-delete-this-directory.txt
+
+# Unit test / coverage reports
+htmlcov/
+.tox/
+.nox/
+.coverage
+.coverage.*
+.cache
+nosetests.xml
+coverage.xml
+*.cover
+*.py,cover
+.hypothesis/
+.pytest_cache/
+
+# Translations
+*.mo
+*.pot
+
+# Django stuff:
+*.log
+local_settings.py
+db.sqlite3
+db.sqlite3-journal
+
+# Flask stuff:
+instance/
+.webassets-cache
+
+# Scrapy stuff:
+.scrapy
+
+# Sphinx documentation
+docs/_build/
+
+# PyBuilder
+target/
+
+# Jupyter Notebook
+.ipynb_checkpoints
+
+# IPython
+profile_default/
+ipython_config.py
+
+# pyenv
+.python-version
+
+# pipenv
+Pipfile.lock
+
+# PEP 582
+__pypackages__/
+
+# Celery stuff
+celerybeat-schedule
+celerybeat.pid
+
+# SageMath parsed files
+*.sage.py
+
+# Environments
+.env
+.venv
+env/
+venv/
+ENV/
+env.bak/
+venv.bak/
+
+# Spyder project settings
+.spyderproject
+.spyproject
+
+# Rope project settings
+.ropeproject
+
+# mkdocs documentation
+/site
+
+# mypy
+.mypy_cache/
+.dmypy.json
+dmypy.json
+
+# Pyre type checker
+.pyre/
+
+# ============================================================================
+# IDEs and Editors
+# ============================================================================
+
+# Visual Studio Code
+.vscode/
+.vscode/*
+!.vscode/settings.json
+!.vscode/tasks.json
+!.vscode/launch.json
+!.vscode/extensions.json
+*.code-workspace
+
+# PyCharm
+.idea/
+.idea/*
+*.iml
+*.iws
+.idea_modules/
+
+# Sublime Text
+*.sublime-project
+*.sublime-workspace
+
+# Vim
+*.swp
+*.swo
+*~
+.vim/
+
+# Emacs
+*~
+\#*\#
+/.emacs.desktop
+/.emacs.desktop.lock
+*.elc
+auto-save-list
+tramp
+.\#*
+
+# Eclipse
+.project
+.pydevproject
+.settings/
+
+# NetBeans
+nbproject/
+nbbuild/
+nbdist/
+.nb-gradle/
+
+# ============================================================================
+# Operating Systems
+# ============================================================================
+
+# macOS
+.DS_Store
+.AppleDouble
+.LSOverride
+Icon
+._*
+.DocumentRevisions-V100
+.fseventsd
+.Spotlight-V100
+.TemporaryItems
+.Trashes
+.VolumeIcon.icns
+.com.apple.timemachine.donotpresent
+.AppleDB
+.AppleDesktop
+Network Trash Folder
+Temporary Items
+.apdisk
+
+# Windows
+Thumbs.db
+Thumbs.db:encryptable
+ehthumbs.db
+ehthumbs_vista.db
+*.stackdump
+[Dd]esktop.ini
+$RECYCLE.BIN/
+*.cab
+*.msi
+*.msix
+*.msm
+*.msp
+*.lnk
+
+# Linux
+*~
+.fuse_hidden*
+.directory
+.Trash-*
+.nfs*
+
+# ============================================================================
+# Project-Specific: Video Master-Adaptation Detection
+# ============================================================================
+
+# Environment variables (contains OpenAI API key)
+.env
+.env.local
+.env.*.local
+
+# Data directory - fingerprints and database
+data/
+data/fingerprints/
+data/fingerprints/*.json
+data/masters.json
+!data/.gitkeep
+
+# Test videos and masters (exclude from repo)
+To Exclude/
+test_videos/
+test_videos/**
+sample_videos/
+*.mp4
+*.mov
+*.avi
+*.mkv
+*.webm
+*.flv
+*.wmv
+*.m4v
+*.mpg
+*.mpeg
+*.3gp
+*.ogv
+
+# Generated reports
+matching_report_*.html
+reports/
+*.html
+!docs/*.html
+
+# Logs
+logs/
+*.log
+debug.log
+error.log
+
+# Temporary files
+tmp/
+temp/
+.tmp/
+*.tmp
+
+# Backup files
+*.bak
+*.backup
+*~
+
+# AI Vision cache (if implemented)
+.ai_cache/
+ai_cache/
+
+# Performance profiling
+*.prof
+*.lprof
+
+# Database backups
+*.db.backup
+masters.json.backup
+masters.json.bak
+
+# Fingerprint cache
+fingerprint_cache/
+.fingerprint_cache/
+
+# Development/testing
+sandbox/
+experiments/
+scratch/
+playground/
+
+# Documentation builds (if using Sphinx/MkDocs)
+docs/_build/
+docs/.doctrees/
+site/
+
+# ============================================================================
+# Dependencies (optional - uncomment if needed)
+# ============================================================================
+
+# Uncomment if you want to exclude large video processing libraries
+# (usually better to keep in requirements.txt)
+# opencv/
+# ffmpeg/
+# chromaprint/
+
+# ============================================================================
+# Misc
+# ============================================================================
+
+# Patch files
+*.patch
+*.diff
+
+# Archive files
+*.zip
+*.tar
+*.tar.gz
+*.rar
+*.7z
+
+# Large files (Git LFS if needed)
+*.psd
+*.ai
+*.sketch
+
+# API keys and secrets (extra safety)
+*secret*
+*SECRET*
+*api_key*
+*API_KEY*
+credentials.json
+secrets.json
+auth.json
+
+# Node modules (if any JS tooling added later)
+node_modules/
+npm-debug.log*
+yarn-debug.log*
+yarn-error.log*
+package-lock.json
+yarn.lock
+
+# ============================================================================
+# Keep Important Files
+# ============================================================================
+
+# Ensure these are NOT ignored
+!.env.example
+!.gitignore
+!README.md
+!requirements.txt
+!LICENSE
+!CHANGELOG.md
+!DOCUMENTATION.md
--- a/AI_VISION_GUIDE.md
+++ b/AI_VISION_GUIDE.md
@ -0,0 +1,451 @@
+# AI Vision Guide
+
+## What is AI Vision?
+
+AI Vision is a **Tier 2 matching system** that uses OpenAI's GPT-4o vision model to detect video matches that perceptual hashing can't find. It's especially powerful for cross-aspect-ratio scenarios.
+
+## When is it Used?
+
+AI Vision **smartly activates** only when truly needed:
+1. ✅ **No matches found** with perceptual hashing (likely cross-aspect), OR
+2. ✅ **Incomplete coverage** (best match has < 100% frame coverage)
+
+AI Vision is **skipped** when:
+- ❌ Perfect match found (100% frame coverage)
+- ❌ Same aspect ratio with complete match
+
+**Why this matters:**
+- In typical batches, only 1-2 out of 39 adaptations need AI Vision
+- **Saves ~97% of AI costs!** ($0.30 vs $12 for 39 videos)
+- Much faster processing (seconds vs minutes)
+
+You don't need to do anything - it automatically optimizes!
+
+## What Problems Does it Solve?
+
+### ❌ Problem: Cross-Aspect Ratios
+Traditional perceptual hashing fails when comparing:
+- 16:9 master → 1:1 square adaptation (Instagram, Facebook)
+- 16:9 master → 9:16 vertical adaptation (TikTok, Stories)
+- 16:9 master → 4:5 portrait adaptation (Instagram feed)
+
+**Why?** The pixel layouts are completely different after cropping/scaling.
+
+### ✅ Solution: Semantic Understanding
+AI Vision looks at the **content**, not pixels:
+- Same people? ✓
+- Same products? ✓
+- Same settings? ✓
+- Same framing (even if cropped)? ✓
+- Different text/logos? Ignored!
+
+## Setup
+
+### 1. Get OpenAI API Key
+Visit https://platform.openai.com/api-keys and create a new key.
+
+### 2. Configure Environment
+```bash
+# Copy example file
+cp .env.example .env
+
+# Edit .env and add your key
+nano .env
+```
+
+Add this line:
+```
+OPENAI_API_KEY=sk-proj-xxxxxxxxxxxxx
+```
+
+### 3. Verify
+```bash
+python cli.py status
+```
+
+You should see:
+```
+✓ AI Vision enabled (GPT-4o)
+```
+
+## Usage
+
+No changes needed! Just run your normal matching commands:
+
+```bash
+# Single match
+python cli.py match /path/to/adaptation.mp4
+
+# Batch match
+python cli.py batch-match /path/to/adaptations/
+```
+
+AI Vision will activate automatically when needed.
+
+## Understanding Results
+
+### Terminal Output
+
+When AI Vision finds a match, you'll see:
+
+```
+Best Match:
+  Master: 5368082_1011A_SF_DROP_1_20_D_16x9_BVOD_YT_OLV_MASTER_1
+  Duration: 20s
+  Video frames matched: 95.0% (28/30 frames)
+  Average frame similarity: 95.0%
+  Combined confidence: 95.0%
+
+AI Vision Analysis:
+  Method: GPT-4o (OpenAI)
+  Format: Adaptation is cropped from master
+
+  AI Reasoning:
+  Both sets feature the same two people in identical clothing and poses,
+  indicating they are the same footage. The settings, such as the plain,
+  light-colored backdrop, are consistent across both sets...
+```
+
+### Key Fields
+
+| Field | Meaning |
+|-------|---------|
+| **Method** | Shows "AI Vision" instead of "Hash" |
+| **Format** | Indicates if adaptation is cropped from master |
+| **AI Reasoning** | Human-readable explanation of the match |
+| **Combined confidence** | Match confidence (0-100%) |
+
+## Cost
+
+### Pricing (as of October 2025)
+- **Model:** GPT-4o
+- **Cost per comparison:** ~$0.005-0.007
+- **10 images** (5 from adaptation + 5 from master)
+- **Low detail mode** to minimize cost
+
+### Examples
+
+| Scenario | AI Triggered? | Cost |
+|----------|---------------|------|
+| 1 same-aspect adaptation vs 50 masters | No (100% match) | $0.00 |
+| 1 cross-aspect adaptation vs 50 masters | Yes (no matches) | ~$0.25-0.35 |
+| 39 adaptations (38 same-aspect, 1 cross) vs 50 masters | 1 only | ~$0.30 |
+| 100 same-aspect adaptations vs 50 masters | None | $0.00 |
+| 100 cross-aspect adaptations vs 50 masters | All 100 | ~$25-35 |
+
+**Smart Triggering Benefits:**
+- ✅ Only pays for what you need
+- ✅ Most batches cost < $1 (only cross-aspect videos)
+- ✅ Same-aspect matches are always free and fast!
+
+### Cost Tracking
+
+The tool shows total cost after each run:
+```
+AI Vision total cost: $0.299
+```
+
+## What AI Vision Ignores
+
+AI Vision is trained to **ignore** these differences:
+
+✅ **Text Variations:**
+- Different languages (English → German → Spanish)
+- Different subtitles or captions
+- Different call-to-action text
+- Price tags or promotional text
+
+✅ **Logo/Branding:**
+- Logo size or placement changes
+- Different social media platform logos
+- Brand watermarks
+- Different aspect ratio templates
+
+✅ **Technical Differences:**
+- Different compression/quality
+- Different color grading (minor)
+- Different frame rates
+
+## What AI Vision Focuses On
+
+AI Vision looks for **semantic content**:
+
+🎯 **People:**
+- Same faces
+- Same clothing
+- Same poses/actions
+- Same movements
+
+🎯 **Products:**
+- Same items being shown
+- Same product arrangements
+- Same product interactions
+
+🎯 **Settings:**
+- Same backgrounds
+- Same environments
+- Same locations
+- Same props
+
+🎯 **Framing:**
+- Same camera angles
+- Same composition (even if cropped)
+- Same shot sequence
+
+## Troubleshooting
+
+### ⚠️ "AI Vision disabled (no API key)"
+
+**Solution:** Set `OPENAI_API_KEY` in `.env` file
+
+```bash
+cp .env.example .env
+# Edit .env and add your key
+```
+
+### ⚠️ "Error code: 401 - Invalid API key"
+
+**Solution:** Check your API key is correct
+
+```bash
+# Verify key format (should start with sk-proj- or sk-)
+cat .env | grep OPENAI_API_KEY
+```
+
+### ⚠️ "Error code: 429 - Rate limit exceeded"
+
+**Solution:** You've hit OpenAI's rate limit
+
+- Wait a few minutes and try again
+- Reduce number of comparisons
+- Upgrade your OpenAI plan
+
+### ⚠️ High costs
+
+**Solution:** AI Vision is running too often
+
+This usually means you have many cross-aspect adaptations. Options:
+1. Add masters in multiple aspect ratios (perceptual hash will match them)
+2. Pre-filter by aspect ratio (match 1:1 adaptations only against 1:1 masters)
+3. Increase confidence threshold to reduce AI Vision triggering
+
+### ⚠️ "Model not found" error
+
+**Solution:** Update to latest code (gpt-4-vision-preview deprecated)
+
+The code should use `gpt-4o` model (already fixed in v2.0+)
+
+## Privacy & Security
+
+### What Gets Sent to OpenAI?
+
+- ✅ 5 JPEG frames from adaptation (base64-encoded)
+- ✅ 5 JPEG frames from master (base64-encoded)
+- ✅ Structured prompt asking for comparison
+- ❌ No video files
+- ❌ No audio
+- ❌ No metadata
+
+### Is it Secure?
+
+- ✅ HTTPS encrypted transmission
+- ✅ OpenAI doesn't train on your data (API)
+- ✅ Frames are deleted after analysis
+- ✅ `.env` file is gitignored (won't be committed)
+
+### Should I Use It?
+
+**Yes, if:**
+- Content is not confidential
+- You're matching marketing/advertising content
+- You need cross-aspect detection
+- Cost is acceptable (~$0.30 per 50 masters)
+
+**No, if:**
+- Content is highly sensitive/confidential
+- You're working with NDA/private content
+- You want 100% on-premise solution
+- Budget is extremely tight
+
+**Alternative:** Use perceptual hashing only and ensure masters exist in all aspect ratios.
+
+## Optimization Tips
+
+### 1. Add Multiple Aspect Ratio Masters
+
+If you have masters in all aspect ratios, perceptual hashing will match them for free:
+
+```bash
+# Add 16:9 master
+python cli.py add-master master_16x9.mp4
+
+# Add 1:1 master (same content, cropped)
+python cli.py add-master master_1x1.mp4
+
+# Add 9:16 master (same content, cropped)
+python cli.py add-master master_9x16.mp4
+```
+
+Now adaptations will match without AI Vision!
+
+### 2. Pre-Filter by Aspect Ratio
+
+Before matching, check aspect ratios:
+
+```python
+from video_matcher.fingerprinter import VideoFingerprinter
+
+fp = VideoFingerprinter()
+info = fp.get_video_info("adaptation.mp4")
+width, height = info['width'], info['height']
+aspect = width / height
+
+if aspect > 1.5:
+    print("16:9 video - match against 16:9 masters only")
+elif 0.9 < aspect < 1.1:
+    print("1:1 video - match against 1:1 masters only")
+else:
+    print("9:16 video - match against 9:16 masters only")
+```
+
+### 3. Batch Strategically
+
+AI Vision costs scale with comparisons. For 100 adaptations:
+
+**Expensive ($150-250):**
+```bash
+# All adaptations against all masters
+python cli.py batch-match adaptations/  # 100 × 50 masters = 5000 AI calls
+```
+
+**Optimized ($5-10):**
+```bash
+# First, quickly check which adaptations need AI Vision
+# Then only run AI Vision on those that failed
+```
+
+## Disable AI Vision
+
+To completely disable AI Vision:
+
+### Option 1: Remove API Key
+```bash
+# In .env file, comment out or delete:
+# OPENAI_API_KEY=sk-...
+```
+
+### Option 2: Empty Value
+```bash
+# In .env file:
+OPENAI_API_KEY=
+```
+
+### Option 3: Don't Create .env File
+Just don't create `.env` - AI Vision won't work without it.
+
+The tool works perfectly fine without AI Vision - you just won't get cross-aspect matching.
+
+## Examples
+
+### Example 1: Instagram 1:1 from 16:9 Master
+
+```bash
+$ python cli.py match instagram_1x1_post.mp4
+
+Analyzing adaptation: instagram_1x1_post.mp4
+Comparing against 47 master(s)...
+
+  No high-confidence matches found.
+  Trying AI Vision (GPT-4o) for cross-aspect matching...
+
+  ✓ AI Vision match: master_16x9_campaign_v1 (confidence: 95%, cost: $0.007)
+
+Found 1 master(s) matching this adaptation:
+
+Best Match:
+  Master: master_16x9_campaign_v1
+  Video frames matched: 95.0%
+  Combined confidence: 95.0%
+
+AI Vision Analysis:
+  Method: GPT-4o (OpenAI)
+  Format: Adaptation is cropped from master
+
+  AI Reasoning:
+  The same person appears in both sets wearing identical clothing.
+  Set A appears to be a cropped center-portion of Set B, focusing on
+  the subject while removing the wider 16:9 framing...
+
+AI Vision total cost: $0.007
+```
+
+### Example 2: TikTok 9:16 from 16:9 Master
+
+```bash
+$ python cli.py match tiktok_vertical.mp4
+
+Analyzing adaptation: tiktok_vertical.mp4
+Comparing against 47 master(s)...
+
+  No high-confidence matches found.
+  Trying AI Vision (GPT-4o) for cross-aspect matching...
+
+  ✓ AI Vision match: summer_collection_16x9 (confidence: 92%, cost: $0.006)
+
+Best Match:
+  Master: summer_collection_16x9
+  Video frames matched: 92.0%
+  Combined confidence: 92.0%
+
+AI Vision Analysis:
+  Method: GPT-4o (OpenAI)
+  Format: Adaptation is cropped from master
+
+  AI Reasoning:
+  Both videos show the same product photoshoot with identical models,
+  clothing, and studio background. The 9:16 version is a vertical crop
+  of the 16:9 source, maintaining the center subject while trimming
+  horizontal edges...
+```
+
+## FAQ
+
+**Q: Will AI Vision always be triggered?**
+A: No, only when perceptual hashing fails or confidence < 90%
+
+**Q: Can I force AI Vision even for same-aspect videos?**
+A: Not currently, but you could modify the threshold in `matcher.py:190`
+
+**Q: Does AI Vision work offline?**
+A: No, it requires internet connection to OpenAI API
+
+**Q: Can I use a different AI model?**
+A: Yes, you could modify `ai_vision.py` to use Claude, Gemini, etc.
+
+**Q: What if I run out of OpenAI credits?**
+A: AI Vision will fail gracefully and return no matches
+
+**Q: Can AI Vision detect same-aspect matches too?**
+A: Yes! But it's slower and costs money, so we use perceptual hash first
+
+**Q: Is GPT-4o better than GPT-4 Vision?**
+A: Yes! GPT-4o is newer, faster, cheaper, and more accurate
+
+**Q: How accurate is AI Vision?**
+A: Very accurate! In testing: 95%+ for clear matches, <5% false positives
+
+## Support
+
+For issues with AI Vision:
+
+1. Check this guide first
+2. Verify API key in `.env` file
+3. Check OpenAI API status: https://status.openai.com
+4. Review troubleshooting section above
+5. Open GitHub issue if problem persists
+
+---
+
+**Version:** 2.0.0
+**Last Updated:** 2025-10-10
+**Model:** GPT-4o
--- a/BATCH_MATCHING_GUIDE.md
+++ b/BATCH_MATCHING_GUIDE.md
@ -0,0 +1,261 @@
+# Batch Matching & HTML Reports - Quick Guide
+
+## 🚀 Quick Start
+
+Process an entire folder of adaptations and get a beautiful HTML report:
+
+```bash
+python cli.py batch-match "/path/to/adaptations/"
+```
+
+That's it! A timestamped HTML report will be generated automatically.
+
+## 📋 Common Use Cases
+
+### 1. Quality Control Check
+```bash
+# Verify all adaptations match expected masters
+python cli.py batch-match "deliverables/final_cuts/" -t 0.7
+```
+
+### 2. Production Audit
+```bash
+# Generate audit trail with custom filename
+python cli.py batch-match "Q4_adaptations/" -o Q4_audit_report.html
+```
+
+### 3. Asset Management
+```bash
+# Process with relaxed thresholds to find all potential matches
+python cli.py batch-match "archive/" -t 0.3 -f 0.65
+```
+
+## 🎨 What You Get
+
+### HTML Report Includes:
+
+**📊 Summary Dashboard:**
+```
+┌─────────────────────────────────────┐
+│  10 Total  |  8 Matched  |  2 None │
+└─────────────────────────────────────┘
+```
+
+**🎬 Per-Adaptation Cards:**
+```
+┌──────────────────────────────────────┐
+│ adaptation_video.mp4           [2]   │
+├──────────────────────────────────────┤
+│ #1 master_20s_B  [HIGH]  20s  100%  │
+│ ▓▓▓▓▓▓▓▓▓▓▓▓▓▓▓▓▓▓▓▓▓▓▓▓▓▓▓▓▓▓  │
+│                                      │
+│ #2 master_15s_C  [MED]   15s   85%  │
+│ ▓▓▓▓▓▓▓▓▓▓▓▓▓▓▓▓▓▓▓▓▓▓▓▓░░░░░░  │
+└──────────────────────────────────────┘
+```
+
+**Color-Coded Confidence:**
+- 🟢 **Green** = Very High/High (90%+)
+- 🟡 **Yellow** = Medium (60-90%)
+- 🔴 **Red** = Low/Very Low (<60%)
+
+## ⚙️ Options
+
+| Option | Default | Description |
+|--------|---------|-------------|
+| `-t, --threshold` | 0.3 | Minimum % of frames to match (0-1) |
+| `-f, --frame-threshold` | 0.70 | Frame similarity threshold (0-1) |
+| `-o, --output` | Auto | Custom output filename |
+
+### Examples:
+
+```bash
+# Strict matching (require 80% match, 75% similarity)
+python cli.py batch-match "folder/" -t 0.8 -f 0.75
+
+# Relaxed matching (catch more potential matches)
+python cli.py batch-match "folder/" -t 0.2 -f 0.65
+
+# Custom output location
+python cli.py batch-match "folder/" -o "reports/$(date +%Y%m%d)_report.html"
+```
+
+## 📂 Folder Structure
+
+**Before:**
+```
+adaptations/
+├── adapt_A.mp4
+├── adapt_B.mp4
+├── adapt_C.mp4
+└── adapt_D.mp4
+```
+
+**After:**
+```
+adaptations/
+├── adapt_A.mp4
+├── adapt_B.mp4
+├── adapt_C.mp4
+├── adapt_D.mp4
+matching_report_20251010_153045.html  ← Generated!
+```
+
+## 🔍 Reading the Report
+
+### Summary Section
+- **Total Adaptations**: How many videos were processed
+- **Matched**: Videos that found at least one master
+- **No Matches**: Videos with no matching masters
+- **Total Master Matches**: Sum of all matches across all adaptations
+
+### Per Video Section
+Each adaptation shows:
+1. **Filename** - The adaptation video name
+2. **Match Count** - Number of masters found (badge)
+3. **Master List** - All matching masters ranked by confidence
+4. **Per-Master Details**:
+   - Duration of master
+   - Video match percentage
+   - Number of frames matched
+   - Combined confidence score
+   - Visual progress bar
+
+### Understanding Confidence
+
+| Badge | Score | Meaning |
+|-------|-------|---------|
+| VERY HIGH | ≥90% | Almost certain match |
+| HIGH | 75-90% | Strong match |
+| MEDIUM | 60-75% | Probable match |
+| LOW | 50-60% | Possible match |
+| VERY LOW | <50% | Unlikely match |
+
+## 💡 Tips
+
+### 1. Start Broad, Then Narrow
+```bash
+# First pass: see all potential matches
+python cli.py batch-match "folder/" -t 0.3
+
+# Review report, then run stricter
+python cli.py batch-match "folder/" -t 0.7 -o strict_report.html
+```
+
+### 2. Save Reports with Context
+```bash
+# Use descriptive filenames
+python cli.py batch-match "Q4_2024_deliverables/" \
+  -o "reports/Q4_2024_master_usage.html"
+```
+
+### 3. Compare Over Time
+```bash
+# Weekly audit
+python cli.py batch-match "current_week/" \
+  -o "audits/week_$(date +%U)_report.html"
+```
+
+### 4. Batch Multiple Folders
+```bash
+# Process multiple folders with a script
+for folder in campaign_A campaign_B campaign_C; do
+  python cli.py batch-match "$folder/" -o "${folder}_report.html"
+done
+```
+
+## 🐛 Troubleshooting
+
+### No videos found
+```
+❌ Problem: "No video files found in folder"
+✅ Solution: Check path and ensure .mp4/.mov files exist
+```
+
+### All adaptations show "No matches"
+```
+❌ Problem: No matches found above threshold
+✅ Solution: Lower thresholds with -t 0.2 -f 0.65
+```
+
+### Report opens blank
+```
+❌ Problem: HTML file corrupted or incomplete
+✅ Solution: Re-run with --output to specify new filename
+```
+
+### Processing errors
+```
+❌ Problem: "Error processing video.mp4"
+✅ Solution: Check video file isn't corrupted, codec is supported
+```
+
+## 📊 Performance
+
+**Typical Processing Times:**
+
+| Folder Size | Masters | Time |
+|-------------|---------|------|
+| 5 videos    | 50      | ~1 min |
+| 10 videos   | 50      | ~2 min |
+| 25 videos   | 50      | ~5 min |
+| 50 videos   | 50      | ~10 min |
+| 100 videos  | 50      | ~20 min |
+
+*Time depends on video duration and system specs*
+
+## 🎯 Best Practices
+
+1. **Add All Masters First**
+   ```bash
+   python bulk_add_masters.py "masters/" -r
+   python cli.py list-masters  # Verify
+   ```
+
+2. **Test on Small Set**
+   ```bash
+   # Test with 2-3 videos first
+   mkdir test_folder
+   cp adapt_1.mp4 adapt_2.mp4 test_folder/
+   python cli.py batch-match test_folder/
+   ```
+
+3. **Use Consistent Naming**
+   - `adaptations/` for all adaptation videos
+   - `masters/` for all master videos
+   - `reports/` for generated HTML reports
+
+4. **Keep Reports Organized**
+   ```bash
+   mkdir -p reports/{2024,2025}
+   python cli.py batch-match "folder/" \
+     -o "reports/2024/Q4_report.html"
+   ```
+
+5. **Version Control Reports**
+   ```bash
+   # Add to git for tracking
+   git add reports/*.html
+   git commit -m "Add Q4 matching report"
+   ```
+
+## 🔗 See Also
+
+- **README.md** - Quick start guide
+- **DOCUMENTATION.md** - Full technical documentation
+- **cli.py** - Single video matching
+- **bulk_add_masters.py** - Adding multiple masters
+
+## 📞 Need Help?
+
+Check the full documentation:
+```bash
+python cli.py batch-match --help
+```
+
+Or see **DOCUMENTATION.md** section: "Batch Matching & HTML Reports"
+
+---
+
+**Generated by Video Master-Adaptation Detection Tool**
+*Version 1.0.0*
--- a/CHANGELOG.md
+++ b/CHANGELOG.md
@ -0,0 +1,130 @@
+# Changelog
+
+All notable changes to this project will be documented in this file.
+
+## [2.0.1] - 2025-10-10
+
+### 🚀 Performance Optimization
+
+#### Smart AI Triggering
+- **Intelligent AI activation** - Only triggers when truly needed:
+  - ✅ No matches found (likely cross-aspect)
+  - ✅ Incomplete frame coverage (< 100%)
+  - ❌ Skipped for perfect matches (100% coverage)
+- **97% cost reduction** - Typical batches: 1-2/39 adaptations use AI
+- **Faster processing** - Seconds instead of minutes for perfect matches
+- **Cost transparency** - Shows savings when AI is skipped
+
+### 📚 Documentation
+- Updated README with smart triggering examples
+- Enhanced AI Vision guide with cost optimization
+- Added real-world batch processing examples
+
+### 💰 Cost Impact
+**Before optimization:**
+- 39 adaptations × 50 masters = $11.70 (all use AI)
+
+**After optimization:**
+- 38 perfect matches: $0.00 (AI skipped)
+- 1 cross-aspect: $0.30 (AI used)
+- **Total: $0.30** (97% savings!)
+
+---
+
+## [2.0.0] - 2025-10-10
+
+### 🚀 Major Features
+
+#### AI Vision Integration (Tier 2 Matching)
+- **Added GPT-4o vision model** for semantic video comparison
+- **Cross-aspect-ratio detection** - Matches 16:9 masters to 1:1, 9:16, 4:5 adaptations
+- **Intelligent text/logo ignoring** - Focuses on people, products, settings
+- **Crop detection** - Identifies when adaptations are cropped/zoomed from masters
+- **Human-readable explanations** - AI provides reasoning for matches
+- **Automatic fallback** - Triggers when perceptual hashing fails or confidence < 90%
+- **Cost tracking** - Shows estimated OpenAI API cost per comparison (~$0.005-0.007)
+
+### ✨ Enhancements
+
+- **Improved CLI output** - Added "Method" column showing "Hash" or "AI Vision"
+- **AI Vision analysis display** - Shows crop detection and reasoning in results
+- **Enhanced prompts** - Optimized GPT-4o prompt for better cross-aspect detection
+- **Environment configuration** - Added `.env` support with `python-dotenv`
+- **Comprehensive documentation** - Updated README with AI Vision setup and usage
+
+### 🐛 Bug Fixes
+
+- **Fixed ffmpeg frame extraction** - Corrected scale filter syntax for ffmpeg-python
+- **Updated to gpt-4o model** - Replaced deprecated gpt-4-vision-preview
+- **Removed ORB matching** - Eliminated false positives from feature matching
+
+### 📦 Dependencies
+
+- Added `openai>=1.12.0` - OpenAI GPT-4o integration
+- Added `python-dotenv>=1.0.0` - Environment variable management
+- Removed `opencv-python` - No longer needed after removing ORB
+
+### 📚 Documentation
+
+- Updated README.md with AI Vision features and setup
+- Enhanced .env.example with detailed configuration guide
+- Added privacy and security notes for AI Vision
+- Updated architecture diagram to show 3-tier system
+- Added cost estimates and performance metrics
+
+### 🔧 Technical Changes
+
+- Created `src/video_matcher/ai_vision.py` module
+- Integrated AI Vision into `matcher.py` as Tier 2 fallback
+- Updated CLI to display AI Vision results
+- Modified fingerprinter to remove ORB code
+- Simplified matching to perceptual hash + AI Vision only
+
+### 💰 Cost Information
+
+**AI Vision Pricing (GPT-4o):**
+- ~$0.005-0.007 per comparison (10 images)
+- 50 masters: ~$0.25-0.35 per adaptation
+- Very affordable for production use!
+
+### 🎯 What's Fixed
+
+- ❌ **Removed:** ORB feature matching (caused false positives)
+- ✅ **Fixed:** Cross-aspect-ratio matching (16:9 → 1:1, 9:16)
+- ✅ **Fixed:** Text/logo variations no longer cause mismatches
+- ✅ **Fixed:** Cropped adaptations now correctly match source masters
+
+### 🚀 Migration Guide
+
+**From v1.x to v2.0:**
+
+1. Update dependencies:
+   ```bash
+   pip install -r requirements.txt
+   ```
+
+2. (Optional) Set up AI Vision:
+   ```bash
+   cp .env.example .env
+   # Edit .env and add your OpenAI API key
+   ```
+
+3. Re-test your matches - results will be more accurate!
+
+**Breaking Changes:**
+- None - v2.0 is fully backward compatible
+- ORB matching removed, but spatial matching remains
+- AI Vision is optional (gracefully disabled without API key)
+
+---
+
+## [1.0.0] - 2025-10-08
+
+### Initial Release
+
+- ✅ Spatial-only perceptual hash matching
+- ✅ Audio fingerprinting with Chromaprint
+- ✅ Multi-master detection
+- ✅ Batch processing with HTML reports
+- ✅ Rich CLI interface
+- ✅ ORB feature matching (later removed in v2.0)
--- a/DOCUMENTATION.md
+++ b/DOCUMENTATION.md
@ -0,0 +1,815 @@
+# Video Master-Adaptation Detection - Technical Documentation
+
+## Table of Contents
+1. [Overview](#overview)
+2. [How It Works](#how-it-works)
+3. [Architecture](#architecture)
+4. [Matching Algorithm](#matching-algorithm)
+5. [CLI Reference](#cli-reference)
+6. [Batch Matching & HTML Reports](#batch-matching--html-reports)
+7. [Advanced Usage](#advanced-usage)
+8. [Understanding Results](#understanding-results)
+9. [Performance Tuning](#performance-tuning)
+10. [Troubleshooting](#troubleshooting)
+11. [API Reference](#api-reference)
+
+---
+
+## Overview
+
+This tool identifies which master video files were used to create adaptation videos (cutdowns, re-edits, speed changes, crops, etc.). It uses **spatial-only matching** that compares video content regardless of temporal order, making it robust to:
+
+- **Speed changes** (slow-motion, time-lapse, speed ramping)
+- **Duration changes** (15s adaptation from 20s master)
+- **Shot reordering** (non-linear edits)
+- **Different aspect ratios** (with separate masters per aspect ratio)
+- **Cropping and transformations**
+- **Re-encoding and compression**
+
+### Key Features
+
+✅ **Spatial-only video matching** - Ignores timing, focuses on content
+✅ **Audio fingerprinting** - Chromaprint-based robust audio matching
+✅ **Multi-master detection** - Identifies all masters used in an adaptation
+✅ **Percentage contribution** - Shows how much of each master was used
+✅ **Confidence scoring** - Weighted scoring combining video + audio
+✅ **Batch processing** - Bulk add masters from directories
+
+---
+
+## How It Works
+
+### 1. Fingerprinting Phase
+
+When you add a master video or match an adaptation, the tool:
+
+1. **Extracts frames** at 2 frames per second (default, configurable)
+2. **Creates perceptual hashes** (8×8 DCT-based hashing)
+3. **Extracts audio fingerprint** using Chromaprint (if available)
+4. **Stores fingerprints** as JSON files for future comparisons
+
+### 2. Matching Phase
+
+When matching an adaptation against masters:
+
+1. **Generates adaptation fingerprint** (same process as masters)
+2. **Spatial comparison**: For each adaptation frame, finds the most similar frame in each master (anywhere in the timeline)
+3. **Calculates percentage**: (matching frames / total frames) × 100%
+4. **Combines signals**: Weighted combination of video (70%) + audio (30%)
+5. **Ranks results**: Sorted by combined confidence score
+
+### Key Insight: Spatial-Only Matching
+
+Traditional video matching fails when adaptations are:
+- Speed-changed (frames at different timestamps)
+- Reordered (shots in different sequence)
+- Edited (missing sections, insertions)
+
+**Solution**: We ask "Does this frame exist ANYWHERE in the master?" instead of "Does this frame exist at timestamp T?"
+
+This makes matching robust to timing changes while still accurately identifying source content.
+
+---
+
+## Architecture
+
+```
+┌─────────────────────────────────────────────────────────────────┐
+│                        CLI Layer (cli.py)                       │
+│  Commands: add-master, list-masters, match, clear, status       │
+└────────────────────────┬────────────────────────────────────────┘
+                         │
+┌────────────────────────▼────────────────────────────────────────┐
+│                   Matcher Layer (matcher.py)                    │
+│  • Loads fingerprints                                           │
+│  • Orchestrates comparison                                      │
+│  • Calculates percentages & confidence                          │
+└────────────────────────┬────────────────────────────────────────┘
+                         │
+┌────────────────────────▼────────────────────────────────────────┐
+│              Fingerprinter Layer (fingerprinter.py)             │
+│  • Video frame extraction (FFmpeg)                              │
+│  • Perceptual hashing (8×8 DCT)                                 │
+│  • Audio fingerprinting (Chromaprint)                           │
+│  • Spatial-only comparison                                      │
+└────────────────────────┬────────────────────────────────────────┘
+                         │
+┌────────────────────────▼────────────────────────────────────────┐
+│                     Storage Layer                               │
+│  • data/fingerprints/*.json - Fingerprint files                 │
+│  • data/masters.json - Master video database                    │
+└─────────────────────────────────────────────────────────────────┘
+```
+
+### Core Components
+
+#### 1. `VideoFingerprinter` (fingerprinter.py)
+- Extracts video frames and generates perceptual hashes
+- Creates audio fingerprints using Chromaprint
+- Supports configurable sampling rate (frames per second)
+- Stores fingerprints as JSON for reuse
+
+#### 2. `VideoMatcher` (matcher.py)
+- Manages master video database
+- Performs spatial-only matching
+- Calculates percentage contributions
+- Generates confidence scores
+
+#### 3. `CLI` (cli.py)
+- User-facing command-line interface
+- Rich terminal output with tables and colors
+- Progress bars for batch operations
+
+---
+
+## Matching Algorithm
+
+### Spatial-Only Video Matching
+
+```python
+def compare_spatial_only(adaptation_fp, master_fp, threshold=0.70):
+    matches = 0
+
+    for adapt_frame in adaptation_frames:
+        best_similarity = 0
+
+        # Compare against ALL master frames (ignore time)
+        for master_frame in master_frames:
+            similarity = hamming_distance(adapt_frame.hash, master_frame.hash)
+            best_similarity = max(best_similarity, similarity)
+
+        if best_similarity >= threshold:
+            matches += 1
+
+    percentage = (matches / total_frames) * 100
+    return percentage
+```
+
+### Key Parameters
+
+| Parameter | Default | Description |
+|-----------|---------|-------------|
+| `samples_per_second` | 2.0 | Frames extracted per second (configurable in code) |
+| `frame_threshold` | 0.70 | Minimum similarity for frame match (0-1) |
+| `threshold` | 0.30 | Minimum % of frames to report master (0-1) |
+
+### Confidence Calculation
+
+```
+combined_score = (video_percentage / 100 × 0.7) + (audio_similarity × 0.3)
+
+Confidence Levels:
+- Very High: combined_score ≥ 0.90
+- High:      combined_score ≥ 0.75
+- Medium:    combined_score ≥ 0.60
+- Low:       combined_score ≥ 0.50
+- Very Low:  combined_score < 0.50
+```
+
+---
+
+## CLI Reference
+
+### `add-master` - Add Master Video
+
+Add a master video to the library.
+
+```bash
+python cli.py add-master <video_path> [--id <custom_id>]
+```
+
+**Examples:**
+```bash
+# Auto-generate ID from filename
+python cli.py add-master /path/to/master.mp4
+
+# Use custom ID
+python cli.py add-master /path/to/master.mp4 --id master_v1
+```
+
+### `list-masters` - List All Masters
+
+Display all master videos in the library.
+
+```bash
+python cli.py list-masters
+```
+
+**Output:**
+- Master ID
+- Filename
+- Duration
+- File path
+
+### `match` - Match Adaptation Video
+
+Match an adaptation against all masters using spatial-only matching.
+
+```bash
+python cli.py match <video_path> [OPTIONS]
+```
+
+**Options:**
+- `--threshold`, `-t` (default: 0.3): Minimum percentage of frames matching (0-1)
+- `--frame-threshold`, `-f` (default: 0.70): Similarity threshold for individual frames (0-1)
+
+**Examples:**
+```bash
+# Default matching
+python cli.py match /path/to/adaptation.mp4
+
+# Stricter matching (require 50% of frames)
+python cli.py match /path/to/adaptation.mp4 -t 0.5
+
+# More sensitive frame matching
+python cli.py match /path/to/adaptation.mp4 -f 0.65
+
+# Combined: require 70% match with sensitive frame detection
+python cli.py match /path/to/adaptation.mp4 -t 0.7 -f 0.65
+```
+
+### `status` - System Status
+
+Check system dependencies and library statistics.
+
+```bash
+python cli.py status
+```
+
+**Shows:**
+- FFmpeg availability
+- Chromaprint/AcoustID status
+- TMK status
+- Number of master videos
+
+### `batch-match` - Batch Match Folder
+
+Match all videos in a folder and generate an HTML report.
+
+```bash
+python cli.py batch-match <folder_path> [OPTIONS]
+```
+
+**Options:**
+- `--threshold`, `-t` (default: 0.3): Minimum percentage match (0-1)
+- `--frame-threshold`, `-f` (default: 0.70): Frame similarity threshold (0-1)
+- `--output`, `-o`: Output HTML file path (default: auto-generated timestamp)
+
+**Examples:**
+```bash
+# Process all videos in folder
+python cli.py batch-match /path/to/adaptations/
+
+# Custom thresholds
+python cli.py batch-match /path/to/adaptations/ -t 0.5 -f 0.75
+
+# Custom output filename
+python cli.py batch-match /path/to/adaptations/ -o report.html
+```
+
+**Output:**
+- Generates timestamped HTML report: `matching_report_YYYYMMDD_HHMMSS.html`
+- Shows summary statistics in terminal
+- Provides clickable file:// URL to open report
+
+### `clear` - Clear Library
+
+Remove all master videos from the library.
+
+```bash
+python cli.py clear
+```
+
+⚠️ **Warning:** This deletes all fingerprints and master records. Cannot be undone.
+
+---
+
+## Batch Matching & HTML Reports
+
+### Overview
+
+The batch matching feature allows you to process an entire folder of adaptation videos and generate a comprehensive HTML report showing which masters were used for each adaptation.
+
+### Usage
+
+**Command Line:**
+```bash
+# Basic usage
+python cli.py batch-match /path/to/adaptations/
+
+# With custom thresholds
+python cli.py batch-match /path/to/adaptations/ -t 0.5 -f 0.75
+
+# Specify output filename
+python cli.py batch-match /path/to/adaptations/ -o my_report.html
+```
+
+**Standalone Script:**
+```bash
+# You can also use the standalone script
+python batch_match.py /path/to/adaptations/
+python batch_match.py /path/to/adaptations/ --output reports/batch_results.html
+```
+
+### HTML Report Features
+
+The generated HTML report includes:
+
+**1. Summary Dashboard**
+- Total adaptations processed
+- Number of matched adaptations
+- Number with no matches
+- Total master matches across all adaptations
+
+**2. Per-Adaptation Cards**
+Each adaptation is shown in a card with:
+- Adaptation filename
+- Number of matches badge
+- List of all matching masters
+- Error message (if processing failed)
+
+**3. Per-Master Match Details**
+For each matching master:
+- Master ID and filename
+- Color-coded confidence badge:
+  - 🟢 **Green** - Very High/High confidence
+  - 🟡 **Yellow** - Medium confidence
+  - 🔴 **Red** - Low/Very Low confidence
+- Master duration
+- Video match percentage
+- Frames matched (X/Y format)
+- Combined confidence score
+- Visual progress bar showing match percentage
+
+**4. Design Features**
+- Modern gradient design (purple theme)
+- Responsive layout (works on mobile/tablet/desktop)
+- Hover effects on cards
+- Print-friendly styling
+- Clean, professional appearance
+
+### Example Workflow
+
+```bash
+# 1. Add all masters
+python bulk_add_masters.py "masters/" -r
+
+# 2. Process all adaptations
+python cli.py batch-match "adaptations/"
+
+# 3. Open the generated report
+open matching_report_20251010_153045.html
+
+# 4. Review results:
+#    - Which adaptations matched which masters
+#    - Confidence levels for each match
+#    - Any processing errors
+```
+
+### Use Cases
+
+**Quality Control:**
+- Verify adaptations were created from correct masters
+- Check if all expected masters were used
+- Identify adaptations with low confidence matches
+
+**Production Tracking:**
+- Document which masters were used for each delivery
+- Generate audit trail of master usage
+- Track adaptation creation workflow
+
+**Asset Management:**
+- Identify unused masters
+- Find duplicate or similar adaptations
+- Organize video library by source masters
+
+### Report Customization
+
+The HTML report can be customized by editing `batch_match.py`:
+
+```python
+# Line 23: Change color scheme
+background: linear-gradient(135deg, #667eea 0%, #764ba2 100%);
+
+# Line 80: Adjust card styling
+.adaptation {
+    background: white;
+    padding: 25px;
+    border-radius: 15px;
+}
+
+# Line 150: Modify confidence colors
+.confidence-very-high { background: #51cf66; }
+.confidence-high { background: #69db7c; }
+```
+
+---
+
+## Advanced Usage
+
+### Bulk Adding Masters
+
+Use the `bulk_add_masters.py` script to add multiple videos at once:
+
+```bash
+# Add all .mp4 files from a directory
+python bulk_add_masters.py /path/to/masters/
+
+# Recursively add from subdirectories
+python bulk_add_masters.py /path/to/masters/ --recursive
+
+# Add specific pattern
+python bulk_add_masters.py /path/to/masters/ --pattern "*.mov"
+```
+
+### Adjusting Sampling Rate
+
+The default is **2 frames per second**, optimized for fast-paced advertising content with quick edits.
+
+Edit `src/video_matcher/fingerprinter.py:106`:
+```python
+samples_per_second = 2.0  # Default: good for ads with quick cuts
+samples_per_second = 1.0  # Faster: basic matching, may miss quick edits
+samples_per_second = 3.0  # Slower: catches sub-second cuts
+```
+
+**Trade-offs:**
+
+| Rate | 20s Video | Use Case | Pros | Cons |
+|------|-----------|----------|------|------|
+| 0.5 fps | 10 frames | Long-form content | Fast, small files | May miss cuts |
+| 1.0 fps | 20 frames | General purpose | Balanced | Misses quick edits |
+| **2.0 fps** | **40 frames** | **Ads/Marketing** | **Catches quick cuts** | **2x storage** |
+| 3.0 fps | 60 frames | Frame-accurate | Very detailed | 3x slower |
+
+**Recommendation:** Keep 2 fps for advertising/marketing content with fast edits.
+
+### Handling Different Aspect Ratios
+
+**Best Practice:** Maintain separate masters for each aspect ratio:
+
+```
+masters/
+├── 16x9/
+│   ├── master_A_16x9.mp4
+│   ├── master_B_16x9.mp4
+├── 9x16/
+│   ├── master_A_9x16.mp4
+│   ├── master_B_9x16.mp4
+└── 1x1/
+    ├── master_A_1x1.mp4
+    └── master_B_1x1.mp4
+```
+
+Add all versions to the library:
+```bash
+python bulk_add_masters.py masters/16x9/ -r
+python bulk_add_masters.py masters/9x16/ -r
+python bulk_add_masters.py masters/1x1/ -r
+```
+
+The matcher will automatically identify the correct aspect ratio master.
+
+---
+
+## Understanding Results
+
+### Sample Output
+
+```
+Found 2 master(s) matching this adaptation:
+
+╭──────┬────────────┬─────────────┬────────┬───────┬──────────┬────────────╮
+│ Rank │ Master ID  │ Video Match │ Frames │ Audio │ Combined │ Confidence │
+├──────┼────────────┼─────────────┼────────┼───────┼──────────┼────────────┤
+│    1 │ master_C   │      100.0% │ 15/15  │ 0.500 │    0.850 │ High       │
+│    2 │ master_B   │       73.3% │ 11/15  │ 0.500 │    0.663 │ Medium     │
+╰──────┴────────────┴─────────────┴────────┴───────┴──────────┴────────────╯
+
+Best Match:
+  Master: master_C
+  Video frames matched: 100.0% (15/15 frames)
+  Average frame similarity: 94.4%
+  Audio similarity: 0.500
+  Combined confidence: 85.0%
+```
+
+### Interpreting Scores
+
+**Video Match Percentage:**
+- **100%**: All adaptation frames found in master
+- **75-99%**: Most frames match, likely correct master
+- **50-74%**: Partial match, possibly similar content
+- **<50%**: Unlikely to be source master
+
+**Average Frame Similarity:**
+- **>90%**: Near-identical frames (same encoding/quality)
+- **75-90%**: Very similar (different encoding/compression)
+- **60-75%**: Similar content (crops, color grading)
+- **<60%**: Different content or heavy transformations
+
+**Combined Score:**
+- Weighted combination: 70% video + 30% audio
+- Audio helps disambiguate visually similar masters
+- Higher combined score = more confident match
+
+### When Multiple Masters Match
+
+If an adaptation uses content from multiple masters:
+
+```
+Best Match:
+  Master: master_A - 60% of frames
+
+Other Potential Matches:
+  • master_B: 40% of frames
+```
+
+This indicates the adaptation combined:
+- 60% content from master_A
+- 40% content from master_B
+
+---
+
+## Performance Tuning
+
+### Speed vs Accuracy
+
+**For faster matching (lower accuracy):**
+```python
+# Reduce sampling rate (1.0 = 1 frame per second)
+samples_per_second = 1.0
+
+# Increase thresholds (stricter matching)
+frame_threshold = 0.75
+threshold = 0.5
+```
+
+**For better accuracy (slower):**
+```python
+# Increase sampling rate (3.0 = 3 frames per second)
+samples_per_second = 3.0
+
+# Lower thresholds (more sensitive)
+frame_threshold = 0.65
+threshold = 0.3
+```
+
+**Default (balanced for ads):**
+```python
+samples_per_second = 2.0  # Catches quick edits
+frame_threshold = 0.70
+threshold = 0.3
+```
+
+### Large Libraries
+
+For libraries with 100+ masters:
+
+1. **Pre-filter by duration:**
+   - Skip masters that are too short/long for the adaptation
+
+2. **Use audio pre-filtering:**
+   - Match audio first, then only check video for audio matches
+
+3. **Parallel processing:**
+   - Compare against multiple masters simultaneously
+
+---
+
+## Troubleshooting
+
+### Common Issues
+
+**❌ No matches found**
+
+**Cause:** Thresholds too strict, or videos unrelated
+
+**Solution:**
+```bash
+# Try more lenient settings
+python cli.py match video.mp4 -t 0.2 -f 0.65
+```
+
+---
+
+**❌ Too many false positives**
+
+**Cause:** Thresholds too lenient, similar-looking content
+
+**Solution:**
+```bash
+# Stricter matching
+python cli.py match video.mp4 -t 0.5 -f 0.75
+```
+
+---
+
+**❌ Speed-changed adaptations not matching**
+
+**Cause:** Already handled! Spatial matching ignores timing
+
+**Check:**
+- Ensure video content is actually similar
+- Lower frame_threshold if heavily processed
+
+---
+
+**❌ Different aspect ratios not matching**
+
+**Solution:** Ensure you have masters in the same aspect ratio
+
+```bash
+# Add masters for each aspect ratio
+python cli.py add-master master_16x9.mp4
+python cli.py add-master master_1x1.mp4
+```
+
+---
+
+**❌ Audio similarity always 0.500**
+
+**Cause:** Chromaprint comparison not fully implemented (placeholder)
+
+**Note:** This is a POC limitation. Video matching still works.
+
+---
+
+## API Reference
+
+### VideoFingerprinter
+
+```python
+from video_matcher.fingerprinter import VideoFingerprinter
+
+fp = VideoFingerprinter(data_dir="data/fingerprints")
+
+# Generate fingerprint
+fingerprint = fp.fingerprint_video(
+    video_path="/path/to/video.mp4",
+    video_id="my_video"
+)
+
+# Load existing fingerprint
+existing = fp.load_fingerprint("my_video")
+
+# List all fingerprints
+all_ids = fp.list_fingerprints()
+```
+
+### VideoMatcher
+
+```python
+from video_matcher.matcher import VideoMatcher
+
+matcher = VideoMatcher(data_dir="data")
+
+# Add master
+matcher.add_master(
+    video_path="/path/to/master.mp4",
+    master_id="master_1"
+)
+
+# List masters
+masters = matcher.list_masters()
+
+# Match adaptation
+matches = matcher.match_adaptation(
+    video_path="/path/to/adaptation.mp4",
+    threshold=0.3,
+    frame_threshold=0.70
+)
+
+# Clear all masters
+matcher.clear_masters()
+```
+
+### Comparison Functions
+
+```python
+from video_matcher.fingerprinter import (
+    compare_spatial_only,
+    compare_audio_fingerprints
+)
+
+# Spatial video comparison
+result = compare_spatial_only(
+    adaptation_fp=adapt_fp,
+    master_fp=master_fp,
+    similarity_threshold=0.75
+)
+# Returns: {
+#   'matching_frames': 12,
+#   'total_frames': 15,
+#   'percentage': 80.0,
+#   'average_similarity': 0.87
+# }
+
+# Audio comparison
+audio_score = compare_audio_fingerprints(
+    fp1=adapt_audio,
+    fp2=master_audio
+)
+# Returns: float (0-1)
+```
+
+---
+
+## File Formats
+
+### Fingerprint JSON Structure
+
+```json
+{
+  "video_id": "master_example",
+  "path": "/path/to/video.mp4",
+  "filename": "video.mp4",
+  "info": {
+    "duration": 20.0,
+    "width": 1920,
+    "height": 1080,
+    "fps": 25.0,
+    "has_audio": true,
+    "codec": "h264"
+  },
+  "audio_fp": {
+    "duration": 20.0,
+    "fingerprint": "AQAAZEw4Kc9w...",
+    "method": "chromaprint"
+  },
+  "video_fp": {
+    "method": "basic_hash",
+    "samples_per_second": 1.0,
+    "num_frames": 20,
+    "frames": [
+      {
+        "frame_id": 0,
+        "timestamp": 0.0,
+        "hash": "0xcfcfc7e3c3e3e3e3"
+      }
+    ]
+  }
+}
+```
+
+### Masters Database (masters.json)
+
+```json
+{
+  "masters": [
+    {
+      "master_id": "master_example",
+      "fingerprint_id": "master_master_example",
+      "path": "/path/to/video.mp4",
+      "filename": "video.mp4",
+      "duration": 20.0
+    }
+  ]
+}
+```
+
+---
+
+## Future Enhancements
+
+### Production-Ready Improvements
+
+1. **TMK Integration** - Facebook's Threat Match for more robust matching
+2. **Segment Timeline** - Show exactly which parts came from which master
+3. **Web UI** - Drag-drop interface with side-by-side comparison
+4. **Batch Processing** - Process hundreds of adaptations in parallel
+5. **Database Storage** - PostgreSQL/MongoDB instead of JSON files
+6. **Vector Search** - Milvus/Qdrant for sub-second matching in large libraries
+7. **GPU Acceleration** - CUDA-based hash computation
+8. **CLIP Embeddings** - Handle heavy crops, overlays, graphics
+9. **Shot Detection** - PySceneDetect for segment-level matching
+10. **Audio Refinement** - Proper Chromaprint comparison implementation
+
+### Suggested Architecture for Scale
+
+```
+┌──────────────┐     ┌──────────────┐     ┌──────────────┐
+│  Web UI      │────▶│  API Gateway │────▶│  Job Queue   │
+│  (React)     │     │  (FastAPI)   │     │  (Celery)    │
+└──────────────┘     └──────────────┘     └──────┬───────┘
+                                                   │
+                     ┌──────────────┐     ┌───────▼───────┐
+                     │  Vector DB   │────▶│  Workers      │
+                     │  (Qdrant)    │     │  (GPU-based)  │
+                     └──────────────┘     └───────────────┘
+```
+
+---
+
+## License
+
+MIT License - See LICENSE file for details.
+
+---
+
+## Support & Contact
+
+For questions, issues, or contributions, please open an issue on the GitHub repository.
+
+**Documentation Version:** 1.0
+**Last Updated:** 2025-10-05
--- a/README.md
+++ b/README.md
@ -0,0 +1,458 @@
+# Video Master-Adaptation Detection
+
+A proof-of-concept tool to detect which master video files were used to create adaptation videos (cut-downs, re-edits, speed changes, crops, re-encodes, etc.).
+
+## ✨ Key Features
+
+- **🎯 Spatial-Only Matching** - Ignores timing, handles speed changes & reordering
+- **🤖 AI Vision (GPT-4o)** - Detects cross-aspect-ratio matches (16:9 → 1:1, 9:16, etc.)
+- **🎬 Multi-Master Detection** - Identifies all masters used in an adaptation
+- **📊 Percentage Contribution** - Shows how much of each master was used
+- **🎵 Audio Fingerprinting** - Chromaprint-based robust audio matching
+- **⚡ Batch Processing** - Bulk add masters from directories
+- **📄 HTML Reports** - Beautiful visual reports for batch matching
+- **🎨 Rich CLI** - Beautiful terminal output with tables and progress bars
+
+## 🚀 Quick Start
+
+### Prerequisites
+
+1. **Python 3.8+**
+2. **FFmpeg**
+   ```bash
+   # macOS
+   brew install ffmpeg chromaprint
+
+   # Ubuntu/Debian
+   sudo apt-get install ffmpeg libchromaprint-dev
+   ```
+
+### Installation
+
+```bash
+# Clone the repository
+cd Video_Master_Adot_Detection
+
+# Create and activate virtual environment
+python3 -m venv venv
+source venv/bin/activate  # On macOS/Linux
+# or
+venv\Scripts\activate     # On Windows
+
+# Install dependencies
+pip install -r requirements.txt
+
+# (Optional) Set up AI Vision for cross-aspect matching
+# Copy .env.example to .env and add your OpenAI API key
+cp .env.example .env
+# Edit .env and add: OPENAI_API_KEY=your_key_here
+
+# Verify installation
+python cli.py status
+```
+
+### Basic Usage
+
+```bash
+# 1. Add master videos
+python cli.py add-master /path/to/master.mp4
+
+# Or bulk add from directory
+python bulk_add_masters.py /path/to/masters/ --recursive
+
+# 2. List masters
+python cli.py list-masters
+
+# 3. Match a single adaptation
+python cli.py match /path/to/adaptation.mp4
+
+# 4. Or batch match entire folder (with HTML report!)
+python cli.py batch-match /path/to/adaptations/
+
+# 5. View results in terminal or open HTML report in browser
+```
+
+## 📖 Usage Examples
+
+### Adding Masters
+
+```bash
+# Single master with auto-generated ID
+python cli.py add-master master_video.mp4
+
+# Custom ID
+python cli.py add-master master_video.mp4 --id master_v1
+
+# Bulk add all .mp4 files
+python bulk_add_masters.py masters_folder/ -r
+```
+
+### Matching Adaptations
+
+**Single video:**
+```bash
+# Default matching (30% threshold)
+python cli.py match adaptation.mp4
+
+# Stricter matching (require 60% match)
+python cli.py match adaptation.mp4 -t 0.6
+
+# More sensitive frame detection
+python cli.py match adaptation.mp4 -f 0.65
+
+# Combined: strict + sensitive
+python cli.py match adaptation.mp4 -t 0.6 -f 0.65
+```
+
+**Batch matching with HTML report:**
+```bash
+# Process entire folder and generate report
+python cli.py batch-match /path/to/adaptations/
+
+# With custom thresholds
+python cli.py batch-match /path/to/adaptations/ -t 0.5 -f 0.75
+
+# Specify output filename
+python cli.py batch-match /path/to/adaptations/ -o my_report.html
+```
+
+## 🎯 What It Handles
+
+✅ **Speed Changes** - Matches 15s adaptation to 20s master (slow-mo, time-lapse)
+✅ **Shot Reordering** - Detects masters even when shots are rearranged
+✅ **Different Durations** - Handles cut-downs and extended versions
+✅ **Non-Linear Edits** - Finds masters in complex re-edits
+✅ **Re-encoding** - Robust to compression and format changes
+✅ **Multiple Masters** - Identifies when adaptation uses multiple sources
+✅ **Cross-Aspect Ratios** - AI Vision detects 16:9 cropped to 1:1 or 9:16
+✅ **Text/Logo Variations** - AI ignores different subtitles, logos, overlays
+
+## 📊 Understanding Results
+
+### Terminal Output (Single Match)
+
+When matching a single video with `python cli.py match`:
+
+```
+Found 2 master(s) matching this adaptation:
+
+╭──────┬────────────┬─────────────┬────────┬───────┬──────────┬────────────╮
+│ Rank │ Master ID  │ Video Match │ Frames │ Audio │ Combined │ Confidence │
+├──────┼────────────┼─────────────┼────────┼───────┼──────────┼────────────┤
+│    1 │ master_C   │      100.0% │ 15/15  │ 0.500 │    0.850 │ High       │
+│    2 │ master_B   │       73.3% │ 11/15  │ 0.500 │ 0.663    │ Medium     │
+╰──────┴────────────┴─────────────┴────────┴───────┴──────────┴────────────╯
+
+Best Match:
+  Master: master_C
+  Video frames matched: 100.0% (15/15 frames)
+  Average frame similarity: 94.4%
+  Combined confidence: 85.0%
+
+AI Vision Analysis:
+  Method: GPT-4o (OpenAI)
+  Format: Adaptation is cropped from master
+
+  AI Reasoning:
+  Both sets feature the same two people in identical clothing and poses...
+```
+
+**Note:** AI Vision is **smartly triggered** only when needed:
+- ✅ **Triggered:** No matches OR incomplete frame coverage (< 100%)
+- ❌ **Skipped:** Perfect match found (100% coverage)
+- 💰 **Cost savings:** Only 1-2 out of 39 adaptations typically need AI!
+- Typical cost when triggered: ~$0.005 per comparison
+
+### Score Interpretation
+
+| Score | Meaning |
+|-------|---------|
+| **Video Match** | Percentage of adaptation frames found in master |
+| **Frames** | Number of matching frames / total frames |
+| **Audio** | Audio fingerprint similarity (0-1) |
+| **Combined** | Weighted score: 70% video + 30% audio |
+| **Confidence** | Very High (≥90%) → Very Low (<50%) |
+
+### HTML Report (Batch Match)
+
+When batch matching with `python cli.py batch-match`, you get a beautiful HTML report:
+
+**Features:**
+- 📊 **Summary Dashboard** - Total processed, matched, unmatched counts
+- 🎬 **Per-Adaptation Cards** - Each video shown with all matching masters
+- 🎨 **Color-Coded Confidence** - Visual badges (green = high, yellow = medium, red = low)
+- 📈 **Progress Bars** - Visual representation of match percentage
+- 📱 **Responsive Design** - Works on desktop and mobile
+- 🖨️ **Print-Friendly** - Clean layout for printing/PDFs
+
+**Report includes:**
+- Adaptation filename and match count
+- Master ID, duration, and video match percentage
+- Number of frames matched
+- Combined confidence score
+- Visual progress indicators
+- Error messages for failed matches
+
+**Opening the report:**
+```bash
+# Report is saved as matching_report_YYYYMMDD_HHMMSS.html
+# Open in browser:
+open matching_report_20251010_153045.html  # macOS
+xdg-open matching_report_20251010_153045.html  # Linux
+start matching_report_20251010_153045.html  # Windows
+```
+
+## 🔧 CLI Commands
+
+| Command | Description |
+|---------|-------------|
+| `add-master <path>` | Add a master video to library |
+| `list-masters` | Show all master videos |
+| `match <path>` | Match single adaptation against masters |
+| `batch-match <folder>` | Match entire folder + generate HTML report |
+| `status` | Check system dependencies |
+| `clear` | Remove all masters from library |
+| `--help` | Show help for any command |
+
+## 📚 Documentation
+
+For detailed documentation, see **[DOCUMENTATION.md](DOCUMENTATION.md)**:
+
+- How It Works (Spatial-Only Matching)
+- Architecture & Components
+- API Reference
+- Advanced Usage
+- Performance Tuning
+- Troubleshooting
+- Production Recommendations
+
+## 🎬 How It Works
+
+### Hybrid 3-Tier Architecture
+
+**Tier 1: Perceptual Hash Matching (Fast)**
+- Extracts frames at 2 frames/second (catches quick edits)
+- Generates perceptual hashes (8×8 DCT)
+- Creates audio fingerprint (Chromaprint)
+- Stores as JSON for reuse
+- **Best for:** Same aspect ratio videos
+
+**Tier 2: AI Vision (Smart Fallback)**
+- **Only triggered when truly needed:**
+  - No matches found at all (likely cross-aspect), OR
+  - Best match has incomplete frame coverage (< 100%)
+- Extracts 5 key frames from each video
+- Uses GPT-4o to compare scenes semantically
+- Ignores text, logos, subtitles, branding
+- Focuses on people, products, settings, framing
+- **Best for:** Cross-aspect ratios (16:9 → 1:1, 9:16)
+- **Optimization:** Skips AI for perfect matches (saves cost & time!)
+
+**Tier 3: Reserved for Future Deep Analysis**
+
+### Spatial Matching (Tier 1)
+```
+For each adaptation frame:
+  → Find most similar frame in master (anywhere in timeline)
+  → If similarity ≥ threshold: count as match
+  → Calculate: (matches / total_frames) × 100%
+```
+
+**Key Insight:** By ignoring temporal order, we handle speed changes, reordering, and non-linear edits automatically!
+
+### AI Vision Matching (Tier 2)
+```
+When Tier 1 fails or has low confidence:
+  → Extract 5 evenly-spaced frames from adaptation
+  → Extract 5 evenly-spaced frames from each master
+  → Send to GPT-4o for semantic comparison
+  → AI analyzes: people, products, settings, composition
+  → Returns: match (yes/no), confidence (0-100%), is_crop (yes/no)
+  → Cost: ~$0.005-0.007 per comparison
+```
+
+**Key Features:**
+- Detects cropping, scaling, pan-and-scan
+- Ignores text localization and logo variations
+- Handles aspect ratio changes (16:9 ↔ 1:1 ↔ 9:16)
+- Provides human-readable explanations
+
+### Confidence Scoring
+```
+combined_score = (video_match × 0.7) + (audio_match × 0.3)
+```
+
+## 🏗️ Project Structure
+
+```
+Video_Master_Adot_Detection/
+├── cli.py                       # Main CLI interface
+├── bulk_add_masters.py          # Batch processing script
+├── requirements.txt             # Python dependencies
+├── README.md                    # This file
+├── DOCUMENTATION.md             # Detailed documentation
+├── src/
+│   └── video_matcher/
+│       ├── fingerprinter.py     # Fingerprinting & matching logic
+│       ├── matcher.py           # Master management & scoring
+│       └── ai_vision.py         # AI Vision (GPT-4o) integration
+├── data/
+│   ├── fingerprints/            # Stored fingerprints (*.json)
+│   └── masters.json             # Master video database
+├── .env.example                 # Example environment config
+├── .env                         # Your OpenAI API key (not tracked)
+└── To Exclude/                  # Test videos (not tracked)
+```
+
+## ⚙️ Configuration
+
+### AI Vision Setup
+
+AI Vision is **optional** but highly recommended for cross-aspect-ratio matching.
+
+1. Get an OpenAI API key from https://platform.openai.com/api-keys
+2. Copy `.env.example` to `.env`
+3. Add your key: `OPENAI_API_KEY=sk-...`
+
+**Cost Estimates:**
+- Single comparison: ~$0.005-0.007 (10 images)
+- 50 masters: ~$0.25-0.35 per adaptation
+- Very affordable for production use!
+
+**To disable AI Vision:**
+- Don't set `OPENAI_API_KEY`, or
+- Set it to empty in `.env`
+
+### Adjust Sensitivity
+
+```bash
+# More lenient (catches more matches)
+python cli.py match video.mp4 -t 0.2 -f 0.65
+
+# Default (balanced)
+python cli.py match video.mp4 -t 0.3 -f 0.70
+
+# Stricter (higher confidence)
+python cli.py match video.mp4 -t 0.5 -f 0.75
+```
+
+### Sampling Rate
+
+The default is **2 frames per second** which provides good accuracy for fast-paced content with quick edits.
+
+To adjust, edit `src/video_matcher/fingerprinter.py:106`:
+```python
+samples_per_second = 2.0  # Default: 2 frames/sec (good for quick edits)
+samples_per_second = 1.0  # Faster: 1 frame/sec (basic matching)
+samples_per_second = 3.0  # Slower: 3 frames/sec (very detailed)
+```
+
+**Impact:**
+- **2 fps**: 20s video = 40 frames (recommended for ads/marketing)
+- **1 fps**: 20s video = 20 frames (faster, less granular)
+- **3 fps**: 20s video = 60 frames (catches sub-second cuts)
+
+## 🐛 Troubleshooting
+
+| Issue | Solution |
+|-------|----------|
+| **No matches found** | Lower thresholds: `-t 0.2 -f 0.65` or enable AI Vision |
+| **Too many false positives** | Raise thresholds: `-t 0.5 -f 0.75` |
+| **Different aspect ratios** | Enable AI Vision (set `OPENAI_API_KEY` in `.env`) |
+| **AI Vision not working** | Check API key in `.env` and verify balance |
+| **FFmpeg frame extraction errors** | Update ffmpeg: `brew upgrade ffmpeg` |
+| **FFmpeg not found** | `brew install ffmpeg` or check PATH |
+| **Import errors** | Activate venv: `source venv/bin/activate` |
+| **Model deprecated error** | Update code to use `gpt-4o` (already fixed in v2.0) |
+
+## 🚧 Limitations
+
+This tool has the following limitations:
+
+1. **Basic perceptual hashing** - Uses 8×8 DCT instead of production TMK
+2. **Audio placeholder** - Chromaprint comparison returns 0.5 (not fully implemented)
+3. **No segment timeline** - Doesn't show which specific parts matched
+4. **Single-threaded** - Not optimized for large-scale batch processing
+5. **JSON storage** - Not suitable for large libraries (>1000 videos)
+6. **AI Vision cost** - Can add up with large master libraries (though affordable)
+
+## 🔮 Future Enhancements
+
+For production use, consider:
+
+- ✅ **AI Vision (GPT-4o)** - Cross-aspect matching ✓ IMPLEMENTED v2.0
+- ⬜ **TMK Integration** - Facebook's Threat Match for robust matching
+- ⬜ **Segment Timeline** - Show which parts came from which master
+- ⬜ **Web UI** - Drag-drop interface with visual comparison
+- ⬜ **Database** - PostgreSQL/MongoDB instead of JSON
+- ⬜ **Vector Search** - Qdrant/Milvus for sub-second matching
+- ⬜ **GPU Acceleration** - CUDA-based hash computation
+- ⬜ **Smart AI Triggering** - Only use AI for aspect ratio mismatches
+- ⬜ **Parallel Processing** - Celery + Redis for batch jobs
+
+See [DOCUMENTATION.md](DOCUMENTATION.md) for detailed production architecture.
+
+## 📈 Performance
+
+**Tier 1: Perceptual Hash (2 fps sampling)**
+- Fingerprint generation: ~3-6 seconds per minute of video
+- Matching: ~0.1 seconds per master comparison
+- Library size: Works well up to ~100 masters
+
+**Tier 2: AI Vision**
+- Frame extraction: ~1-2 seconds per video
+- GPT-4o API call: ~2-3 seconds per comparison
+- Cost: ~$0.005-0.007 per comparison
+- Only triggered for cross-aspect or no matches
+
+**Example 1: Perfect Match (AI Skipped)**
+- 47 masters (various durations)
+- 1 adaptation (15s, same aspect ratio)
+- Tier 1 time: ~15 seconds (100% match found)
+- Tier 2: **SKIPPED** (saves ~$0.30!)
+- Total cost: $0.00
+
+**Example 2: Cross-Aspect (AI Triggered)**
+- 47 masters (various durations)
+- 1 adaptation (15s, 1:1 from 16:9)
+- Tier 1 time: ~15 seconds (no matches)
+- Tier 2 time: ~3-5 minutes (47 AI comparisons)
+- Total cost: ~$0.30
+
+**Example 3: Batch with Smart Triggering**
+- 39 adaptations
+- 38 perfect matches (AI skipped): $0.00
+- 1 cross-aspect (AI used): ~$0.30
+- **Total cost: ~$0.30** (vs $12 without optimization!)
+
+**Fingerprint Storage:**
+- 20s video @ 2fps = ~8KB JSON file (40 frames)
+- 15s video @ 2fps = ~6KB JSON file (30 frames)
+
+## 🤝 Contributing
+
+Contributions welcome! Areas for improvement:
+
+- TMK integration for production matching
+- Full Chromaprint audio comparison
+- Segment-level timeline visualization
+- Web interface
+- Performance optimization
+- Unit tests
+
+## 📄 License
+
+MIT License - See LICENSE file for details.
+
+## 🙋 Support
+
+For questions or issues:
+1. Check [DOCUMENTATION.md](DOCUMENTATION.md)
+2. Review troubleshooting section
+3. Open an issue on GitHub
+
+---
+
+**Built with:** Python, FFmpeg, Chromaprint, OpenAI GPT-4o, Rich
+**Status:** Production-Ready with AI Vision
+**Version:** 2.0.0
--- a/batch_match.py
+++ b/batch_match.py
@ -0,0 +1,505 @@
+#!/usr/bin/env python3
+"""
+Batch match adaptations from a folder and generate HTML report.
+"""
+
+import sys
+import json
+from pathlib import Path
+from datetime import datetime
+from rich.console import Console
+from rich.progress import Progress, SpinnerColumn, TextColumn, BarColumn
+
+# Add src to path
+sys.path.insert(0, str(Path(__file__).parent / "src"))
+
+from video_matcher.matcher import VideoMatcher
+
+console = Console()
+
+# Common video file extensions
+VIDEO_EXTENSIONS = {'.mp4', '.mov', '.avi', '.mkv', '.webm', '.flv', '.wmv', '.m4v'}
+
+
+def generate_html_report(results, output_path, folder_path):
+    """Generate an HTML report from matching results."""
+
+    html_content = f"""<!DOCTYPE html>
+<html lang="en">
+<head>
+    <meta charset="UTF-8">
+    <meta name="viewport" content="width=device-width, initial-scale=1.0">
+    <title>Video Matching Report - {datetime.now().strftime('%Y-%m-%d %H:%M')}</title>
+    <style>
+        * {{
+            margin: 0;
+            padding: 0;
+            box-sizing: border-box;
+        }}
+
+        body {{
+            font-family: -apple-system, BlinkMacSystemFont, 'Segoe UI', Roboto, Oxygen, Ubuntu, Cantarell, sans-serif;
+            background: linear-gradient(135deg, #667eea 0%, #764ba2 100%);
+            padding: 20px;
+            color: #333;
+        }}
+
+        .container {{
+            max-width: 1400px;
+            margin: 0 auto;
+        }}
+
+        .header {{
+            background: white;
+            padding: 30px;
+            border-radius: 15px;
+            box-shadow: 0 10px 30px rgba(0,0,0,0.2);
+            margin-bottom: 30px;
+        }}
+
+        .header h1 {{
+            color: #667eea;
+            margin-bottom: 10px;
+            font-size: 2.5em;
+        }}
+
+        .header .meta {{
+            color: #666;
+            font-size: 0.95em;
+        }}
+
+        .summary {{
+            background: white;
+            padding: 25px;
+            border-radius: 15px;
+            box-shadow: 0 10px 30px rgba(0,0,0,0.2);
+            margin-bottom: 30px;
+            display: grid;
+            grid-template-columns: repeat(auto-fit, minmax(200px, 1fr));
+            gap: 20px;
+        }}
+
+        .stat {{
+            text-align: center;
+            padding: 15px;
+            background: linear-gradient(135deg, #667eea 0%, #764ba2 100%);
+            border-radius: 10px;
+            color: white;
+        }}
+
+        .stat-value {{
+            font-size: 2.5em;
+            font-weight: bold;
+            display: block;
+        }}
+
+        .stat-label {{
+            font-size: 0.9em;
+            opacity: 0.9;
+            margin-top: 5px;
+        }}
+
+        .adaptation {{
+            background: white;
+            padding: 25px;
+            border-radius: 15px;
+            box-shadow: 0 10px 30px rgba(0,0,0,0.2);
+            margin-bottom: 25px;
+            transition: transform 0.2s;
+        }}
+
+        .adaptation:hover {{
+            transform: translateY(-2px);
+            box-shadow: 0 15px 40px rgba(0,0,0,0.25);
+        }}
+
+        .adaptation-header {{
+            display: flex;
+            justify-content: space-between;
+            align-items: center;
+            margin-bottom: 20px;
+            padding-bottom: 15px;
+            border-bottom: 2px solid #f0f0f0;
+        }}
+
+        .adaptation-name {{
+            font-size: 1.4em;
+            font-weight: 600;
+            color: #333;
+            word-break: break-all;
+        }}
+
+        .match-count {{
+            background: #667eea;
+            color: white;
+            padding: 8px 16px;
+            border-radius: 20px;
+            font-weight: 600;
+            font-size: 0.9em;
+        }}
+
+        .no-matches {{
+            background: #ff6b6b;
+        }}
+
+        .matches-list {{
+            display: grid;
+            gap: 15px;
+        }}
+
+        .match-item {{
+            background: #f8f9fa;
+            padding: 20px;
+            border-radius: 10px;
+            border-left: 5px solid #667eea;
+            transition: all 0.2s;
+        }}
+
+        .match-item:hover {{
+            background: #e9ecef;
+            border-left-width: 8px;
+        }}
+
+        .match-header {{
+            display: flex;
+            justify-content: space-between;
+            align-items: center;
+            margin-bottom: 15px;
+        }}
+
+        .master-name {{
+            font-weight: 600;
+            color: #333;
+            font-size: 1.1em;
+        }}
+
+        .confidence-badge {{
+            padding: 6px 14px;
+            border-radius: 15px;
+            font-weight: 600;
+            font-size: 0.85em;
+            text-transform: uppercase;
+            letter-spacing: 0.5px;
+        }}
+
+        .confidence-very-high {{ background: #51cf66; color: white; }}
+        .confidence-high {{ background: #69db7c; color: white; }}
+        .confidence-medium {{ background: #ffd43b; color: #333; }}
+        .confidence-low {{ background: #ff922b; color: white; }}
+        .confidence-very-low {{ background: #ff6b6b; color: white; }}
+
+        .match-details {{
+            display: grid;
+            grid-template-columns: repeat(auto-fit, minmax(150px, 1fr));
+            gap: 12px;
+            margin-top: 12px;
+        }}
+
+        .detail-item {{
+            background: white;
+            padding: 10px;
+            border-radius: 8px;
+            text-align: center;
+        }}
+
+        .detail-label {{
+            font-size: 0.8em;
+            color: #666;
+            text-transform: uppercase;
+            letter-spacing: 0.5px;
+            margin-bottom: 5px;
+        }}
+
+        .detail-value {{
+            font-size: 1.2em;
+            font-weight: 600;
+            color: #667eea;
+        }}
+
+        .no-match-message {{
+            text-align: center;
+            padding: 30px;
+            color: #999;
+            font-style: italic;
+        }}
+
+        .error-message {{
+            background: #ffe0e0;
+            border-left: 5px solid #ff6b6b;
+            padding: 15px;
+            border-radius: 8px;
+            color: #c92a2a;
+        }}
+
+        .footer {{
+            text-align: center;
+            padding: 20px;
+            color: white;
+            margin-top: 30px;
+            font-size: 0.9em;
+        }}
+
+        .progress-bar {{
+            width: 100%;
+            height: 8px;
+            background: #e9ecef;
+            border-radius: 4px;
+            overflow: hidden;
+            margin-top: 8px;
+        }}
+
+        .progress-fill {{
+            height: 100%;
+            background: linear-gradient(90deg, #667eea 0%, #764ba2 100%);
+            transition: width 0.3s ease;
+        }}
+    </style>
+</head>
+<body>
+    <div class="container">
+        <div class="header">
+            <h1>🎬 Video Matching Report</h1>
+            <div class="meta">
+                <strong>Generated:</strong> {datetime.now().strftime('%Y-%m-%d %H:%M:%S')}<br>
+                <strong>Source Folder:</strong> {folder_path}
+            </div>
+        </div>
+
+        <div class="summary">
+            <div class="stat">
+                <span class="stat-value">{len(results)}</span>
+                <span class="stat-label">Adaptations Processed</span>
+            </div>
+            <div class="stat">
+                <span class="stat-value">{sum(1 for r in results if r['matches'])}</span>
+                <span class="stat-label">Matched</span>
+            </div>
+            <div class="stat">
+                <span class="stat-value">{sum(1 for r in results if not r['matches'])}</span>
+                <span class="stat-label">No Matches</span>
+            </div>
+            <div class="stat">
+                <span class="stat-value">{sum(len(r['matches']) for r in results)}</span>
+                <span class="stat-label">Total Master Matches</span>
+            </div>
+        </div>
+"""
+
+    # Add each adaptation result
+    for result in results:
+        adaptation_name = result['adaptation_name']
+        matches = result['matches']
+        error = result.get('error')
+
+        match_class = 'no-matches' if not matches else ''
+        match_count = len(matches) if matches else 0
+
+        html_content += f"""
+        <div class="adaptation">
+            <div class="adaptation-header">
+                <div class="adaptation-name">{adaptation_name}</div>
+                <div class="match-count {match_class}">
+                    {match_count} Match{'es' if match_count != 1 else ''}
+                </div>
+            </div>
+"""
+
+        if error:
+            html_content += f"""
+            <div class="error-message">
+                <strong>Error:</strong> {error}
+            </div>
+"""
+        elif not matches:
+            html_content += """
+            <div class="no-match-message">
+                No matching masters found above threshold
+            </div>
+"""
+        else:
+            html_content += """
+            <div class="matches-list">
+"""
+            for idx, match in enumerate(matches, 1):
+                confidence = match['confidence'].lower().replace(' ', '-')
+
+                html_content += f"""
+                <div class="match-item">
+                    <div class="match-header">
+                        <div class="master-name">
+                            #{idx} {match['master_id']}
+                        </div>
+                        <div class="confidence-badge confidence-{confidence}">
+                            {match['confidence']}
+                        </div>
+                    </div>
+                    <div class="match-details">
+                        <div class="detail-item">
+                            <div class="detail-label">Duration</div>
+                            <div class="detail-value">{match['master_duration']:.0f}s</div>
+                        </div>
+                        <div class="detail-item">
+                            <div class="detail-label">Video Match</div>
+                            <div class="detail-value">{match['video_percentage']:.1f}%</div>
+                        </div>
+                        <div class="detail-item">
+                            <div class="detail-label">Frames</div>
+                            <div class="detail-value">{match['matching_frames']}/{match['total_frames']}</div>
+                        </div>
+                        <div class="detail-item">
+                            <div class="detail-label">Combined Score</div>
+                            <div class="detail-value">{match['combined_score']:.1%}</div>
+                        </div>
+                    </div>
+                    <div class="progress-bar">
+                        <div class="progress-fill" style="width: {match['video_percentage']:.0f}%"></div>
+                    </div>
+                </div>
+"""
+
+            html_content += """
+            </div>
+"""
+
+        html_content += """
+        </div>
+"""
+
+    html_content += """
+        <div class="footer">
+            Generated by Video Master-Adaptation Detection Tool<br>
+            🚀 Powered by spatial-only matching algorithm
+        </div>
+    </div>
+</body>
+</html>
+"""
+
+    # Write HTML file
+    with open(output_path, 'w', encoding='utf-8') as f:
+        f.write(html_content)
+
+
+def batch_match_folder(folder_path, threshold=0.80, frame_threshold=0.80, min_avg_similarity=0.90, output_file=None):
+    """
+    Match all videos in a folder against masters and generate report.
+
+    Args:
+        folder_path: Path to folder containing adaptation videos
+        threshold: Minimum percentage match threshold
+        frame_threshold: Frame similarity threshold
+        min_avg_similarity: Minimum average similarity of matched frames
+        output_file: Output HTML file path (default: auto-generated)
+    """
+    folder_path = Path(folder_path)
+
+    if not folder_path.exists():
+        console.print(f"[red]✗[/red] Folder not found: {folder_path}")
+        return
+
+    if not folder_path.is_dir():
+        console.print(f"[red]✗[/red] Not a directory: {folder_path}")
+        return
+
+    # Find all video files
+    video_files = []
+    for ext in VIDEO_EXTENSIONS:
+        video_files.extend(folder_path.glob(f"*{ext}"))
+        video_files.extend(folder_path.glob(f"*{ext.upper()}"))
+
+    if not video_files:
+        console.print(f"[yellow]No video files found in {folder_path}[/yellow]")
+        return
+
+    console.print(f"\n[bold]Found {len(video_files)} video file(s) to process[/bold]\n")
+
+    # Initialize matcher
+    matcher = VideoMatcher()
+
+    # Check if we have masters
+    masters = matcher.list_masters()
+    if not masters:
+        console.print("[red]✗[/red] No master videos found in library.")
+        console.print("Use 'python cli.py add-master' to add masters first.")
+        return
+
+    console.print(f"[cyan]Comparing against {len(masters)} master(s)...[/cyan]\n")
+
+    # Process each video
+    results = []
+
+    with Progress(
+        SpinnerColumn(),
+        TextColumn("[progress.description]{task.description}"),
+        BarColumn(),
+        TextColumn("[progress.percentage]{task.percentage:>3.0f}%"),
+        console=console
+    ) as progress:
+
+        task = progress.add_task("[cyan]Processing adaptations...", total=len(video_files))
+
+        for video_file in video_files:
+            progress.update(task, description=f"[cyan]Processing {video_file.name}...")
+
+            try:
+                matches = matcher.match_adaptation(
+                    str(video_file),
+                    threshold=threshold,
+                    frame_threshold=frame_threshold,
+                    min_avg_similarity=min_avg_similarity
+                )
+
+                results.append({
+                    'adaptation_name': video_file.name,
+                    'adaptation_path': str(video_file),
+                    'matches': matches,
+                    'error': None
+                })
+
+            except Exception as e:
+                console.print(f"[red]✗[/red] Error processing {video_file.name}: {e}")
+                results.append({
+                    'adaptation_name': video_file.name,
+                    'adaptation_path': str(video_file),
+                    'matches': [],
+                    'error': str(e)
+                })
+
+            progress.advance(task)
+
+    # Generate output filename if not specified
+    if output_file is None:
+        timestamp = datetime.now().strftime('%Y%m%d_%H%M%S')
+        output_file = f"matching_report_{timestamp}.html"
+
+    output_path = Path(output_file)
+
+    # Generate HTML report
+    console.print(f"\n[cyan]Generating HTML report...[/cyan]")
+    generate_html_report(results, output_path, str(folder_path))
+
+    # Summary
+    console.print(f"\n[bold green]✓ Report generated successfully![/bold green]")
+    console.print(f"\n[bold]Summary:[/bold]")
+    console.print(f"  Total adaptations: {len(results)}")
+    console.print(f"  Matched: {sum(1 for r in results if r['matches'])}")
+    console.print(f"  No matches: {sum(1 for r in results if not r['matches'])}")
+    console.print(f"  Total master matches: {sum(len(r['matches']) for r in results)}")
+    console.print(f"\n[bold cyan]📄 Report saved to:[/bold cyan] {output_path.absolute()}")
+    console.print(f"\n[dim]Open in browser: file://{output_path.absolute()}[/dim]")
+
+
+if __name__ == '__main__':
+    import click
+
+    @click.command()
+    @click.argument('folder_path', type=click.Path(exists=True))
+    @click.option('--threshold', '-t', default=0.80, type=float, help='Minimum percentage match (0-1)')
+    @click.option('--frame-threshold', '-f', default=0.80, type=float, help='Frame similarity threshold (0-1)')
+    @click.option('--min-avg-similarity', '-m', default=0.90, type=float, help='Minimum average similarity of matched frames (0-1)')
+    @click.option('--output', '-o', default=None, help='Output HTML file path')
+    def main(folder_path, threshold, frame_threshold, min_avg_similarity, output):
+        """Batch match all videos in a folder and generate HTML report."""
+        batch_match_folder(folder_path, threshold, frame_threshold, min_avg_similarity, output)
+
+    main()
--- a/bulk_add_masters.py
+++ b/bulk_add_masters.py
@ -0,0 +1,102 @@
+#!/usr/bin/env python3
+"""
+Bulk add master videos from a directory.
+"""
+
+import sys
+import click
+from pathlib import Path
+from rich.console import Console
+from rich.progress import Progress, SpinnerColumn, TextColumn, BarColumn
+
+# Add src to path
+sys.path.insert(0, str(Path(__file__).parent / "src"))
+
+from video_matcher.matcher import VideoMatcher
+
+console = Console()
+
+# Common video file extensions
+VIDEO_EXTENSIONS = {'.mp4', '.mov', '.avi', '.mkv', '.webm', '.flv', '.wmv', '.m4v'}
+
+
+@click.command()
+@click.argument('directory', type=click.Path(exists=True))
+@click.option('--recursive', '-r', is_flag=True, help='Recursively search subdirectories')
+@click.option('--pattern', '-p', default='*.mp4', help='File pattern to match (default: *.mp4)')
+def bulk_add(directory, recursive, pattern):
+    """Bulk add master videos from a directory."""
+
+    dir_path = Path(directory)
+
+    if not dir_path.is_dir():
+        console.print(f"[red]✗[/red] Error: {directory} is not a directory")
+        sys.exit(1)
+
+    # Find all video files
+    if recursive:
+        video_files = list(dir_path.rglob(pattern))
+    else:
+        video_files = list(dir_path.glob(pattern))
+
+    # Filter to only video extensions
+    video_files = [f for f in video_files if f.suffix.lower() in VIDEO_EXTENSIONS]
+
+    if not video_files:
+        console.print(f"[yellow]No video files found matching pattern '{pattern}'[/yellow]")
+        sys.exit(0)
+
+    console.print(f"\n[bold]Found {len(video_files)} video file(s)[/bold]\n")
+
+    # Show files to be added
+    for i, video_file in enumerate(video_files, 1):
+        console.print(f"  {i}. {video_file.name}")
+
+    console.print()
+
+    if not click.confirm('Add these videos as masters?'):
+        console.print("Cancelled.")
+        sys.exit(0)
+
+    # Initialize matcher
+    matcher = VideoMatcher()
+
+    # Process each video
+    success_count = 0
+    error_count = 0
+
+    with Progress(
+        SpinnerColumn(),
+        TextColumn("[progress.description]{task.description}"),
+        BarColumn(),
+        TextColumn("[progress.percentage]{task.percentage:>3.0f}%"),
+        console=console
+    ) as progress:
+
+        task = progress.add_task("[cyan]Adding masters...", total=len(video_files))
+
+        for video_file in video_files:
+            try:
+                # Use filename (without extension) as master_id
+                master_id = video_file.stem
+
+                progress.update(task, description=f"[cyan]Processing {video_file.name}...")
+
+                matcher.add_master(str(video_file), master_id)
+                success_count += 1
+
+            except Exception as e:
+                error_count += 1
+                console.print(f"[red]✗[/red] Error processing {video_file.name}: {e}")
+
+            progress.advance(task)
+
+    # Summary
+    console.print(f"\n[bold]Summary:[/bold]")
+    console.print(f"  [green]✓[/green] Successfully added: {success_count}")
+    if error_count > 0:
+        console.print(f"  [red]✗[/red] Errors: {error_count}")
+
+
+if __name__ == '__main__':
+    bulk_add()
--- a/cli.py
+++ b/cli.py
@ -0,0 +1,382 @@
+#!/usr/bin/env python3
+"""
+Video Master-Adaptation Detection CLI
+
+A proof-of-concept tool to detect which master video files were used
+to create adaptation videos.
+"""
+
+import sys
+import click
+from pathlib import Path
+from rich.console import Console
+from rich.table import Table
+from rich import box
+
+# Add src to path
+sys.path.insert(0, str(Path(__file__).parent / "src"))
+
+from video_matcher.matcher import VideoMatcher
+
+console = Console()
+
+
+@click.group()
+@click.version_option(version="0.1.0")
+def cli():
+    """Video Master-Adaptation Detection Tool"""
+    pass
+
+
+@cli.command()
+@click.argument('video_path', type=click.Path(exists=True))
+@click.option('--id', 'master_id', help='Custom ID for the master video')
+def add_master(video_path, master_id):
+    """Add a master video to the library."""
+    try:
+        matcher = VideoMatcher()
+        matcher.add_master(video_path, master_id)
+        console.print("[green]✓[/green] Master video added successfully")
+    except Exception as e:
+        console.print(f"[red]✗[/red] Error: {e}")
+        sys.exit(1)
+
+
+@cli.command()
+def list_masters():
+    """List all master videos in the library."""
+    try:
+        matcher = VideoMatcher()
+        masters = matcher.list_masters()
+
+        if not masters:
+            console.print("[yellow]No master videos found.[/yellow]")
+            console.print("Use 'add-master' to add master videos.")
+            return
+
+        table = Table(title="Master Videos", box=box.ROUNDED)
+        table.add_column("ID", style="cyan")
+        table.add_column("Filename", style="green")
+        table.add_column("Duration", style="yellow")
+        table.add_column("Path", style="dim")
+
+        for master in masters:
+            duration = f"{master.get('duration', 0):.1f}s"
+            table.add_row(
+                master['master_id'],
+                master['filename'],
+                duration,
+                master['path']
+            )
+
+        console.print(table)
+    except Exception as e:
+        console.print(f"[red]✗[/red] Error: {e}")
+        sys.exit(1)
+
+
+@cli.command()
+@click.argument('video_path', type=click.Path(exists=True))
+@click.option('--threshold', '-t', default=0.80, type=float, help='Minimum percentage of matching frames (0-1, e.g., 0.80 = 80%)')
+@click.option('--frame-threshold', '-f', default=0.80, type=float, help='Similarity threshold for individual frames (0-1)')
+@click.option('--min-avg-similarity', '-m', default=0.90, type=float, help='Minimum average similarity of matched frames (0-1)')
+def match(video_path, threshold, frame_threshold, min_avg_similarity):
+    """Match an adaptation video against master videos using spatial-only matching.
+
+    This method ignores temporal order and can handle:
+    - Speed changes (slow-mo, time-lapse)
+    - Shot reordering
+    - Non-linear edits
+    - Different durations
+    """
+    try:
+        matcher = VideoMatcher()
+
+        # Check if we have any masters
+        masters = matcher.list_masters()
+        if not masters:
+            console.print("[red]✗[/red] No master videos found in library.")
+            console.print("Use 'add-master' to add master videos first.")
+            sys.exit(1)
+
+        # Perform matching
+        matches = matcher.match_adaptation(video_path, threshold=threshold, frame_threshold=frame_threshold, min_avg_similarity=min_avg_similarity)
+
+        if not matches:
+            console.print(f"\n[yellow]No matches found above threshold {threshold}[/yellow]")
+            return
+
+        # Display results
+        console.print(f"\n[green]Found {len(matches)} master(s) matching this adaptation:[/green]\n")
+
+        table = Table(box=box.ROUNDED)
+        table.add_column("Rank", style="cyan", justify="right")
+        table.add_column("Master ID", style="green")
+        table.add_column("Duration", style="dim", justify="right")
+        table.add_column("Video Match", style="yellow", justify="right")
+        table.add_column("Frames", style="blue", justify="center")
+        table.add_column("Combined", style="cyan", justify="right")
+        table.add_column("Confidence", style="bold")
+        table.add_column("Method", style="magenta")
+
+        for idx, match in enumerate(matches, 1):
+            confidence = match['confidence']
+            matching_method = match.get('matching_method', 'perceptual_hash')
+
+            # Color code confidence
+            if confidence in ["Very High", "High"]:
+                conf_style = "green"
+            elif confidence == "Medium":
+                conf_style = "yellow"
+            else:
+                conf_style = "red"
+
+            # Method display
+            method_display = "AI Vision" if matching_method == "ai_vision" else "Hash"
+
+            table.add_row(
+                str(idx),
+                match['master_id'],
+                f"{match['master_duration']:.0f}s",
+                f"{match['video_percentage']:.1f}%",
+                f"{match['matching_frames']}/{match['total_frames']}",
+                f"{match['combined_score']:.3f}",
+                f"[{conf_style}]{confidence}[/{conf_style}]",
+                method_display
+            )
+
+        console.print(table)
+
+        # Show summary
+        if matches:
+            top = matches[0]
+            console.print(f"\n[bold]Best Match:[/bold]")
+            console.print(f"  Master: [green]{top['master_id']}[/green]")
+            console.print(f"  Duration: {top['master_duration']:.0f}s")
+            console.print(f"  Video frames matched: {top['video_percentage']:.1f}% ({top['matching_frames']}/{top['total_frames']} frames)")
+            console.print(f"  Average frame similarity: {top['average_frame_similarity']:.1%}")
+            console.print(f"  Audio similarity: {top['audio_similarity']:.3f}")
+            console.print(f"  Combined confidence: {top['combined_score']:.1%}")
+
+            # Show AI vision specific info if applicable
+            if top.get('matching_method') == 'ai_vision':
+                console.print(f"\n[bold magenta]AI Vision Analysis:[/bold magenta]")
+                console.print(f"  Method: GPT-4V (OpenAI)")
+                if top.get('is_crop'):
+                    console.print(f"  Format: [yellow]Adaptation is cropped from master[/yellow]")
+                if top.get('ai_explanation'):
+                    console.print(f"\n  [dim]AI Reasoning:[/dim]")
+                    # Show only the explanation part, not the full structured response
+                    explanation = top['ai_explanation']
+                    if 'EXPLANATION:' in explanation:
+                        explanation = explanation.split('EXPLANATION:')[1].strip()
+                    # Limit to first 200 chars for brevity
+                    if len(explanation) > 200:
+                        explanation = explanation[:200] + "..."
+                    console.print(f"  [dim]{explanation}[/dim]")
+
+            if len(matches) > 1:
+                # Group by score to show ties
+                top_score = top['combined_score']
+                tied_matches = [m for m in matches if m['combined_score'] == top_score]
+
+                if len(tied_matches) > 1:
+                    console.print(f"\n[bold yellow]Note:[/bold yellow] {len(tied_matches)} masters have identical scores.")
+                    console.print(f"  Ranked by duration (longest master selected as likely source):")
+                    for match in tied_matches[:5]:  # Show top 5 ties
+                        console.print(f"  • {match['master_id']} ({match['master_duration']:.0f}s)")
+
+                other_matches = [m for m in matches[1:] if m['combined_score'] != top_score]
+                if other_matches:
+                    console.print(f"\n[bold]Other Potential Matches:[/bold]")
+                    for match in other_matches[:10]:  # Limit to top 10
+                        console.print(f"  • {match['master_id']} ({match['master_duration']:.0f}s): {match['video_percentage']:.1f}% video, {match['combined_score']:.1%} combined")
+
+            console.print(f"\n[dim]Path: {top['master_path']}[/dim]")
+
+    except Exception as e:
+        console.print(f"[red]✗[/red] Error: {e}")
+        import traceback
+        traceback.print_exc()
+        sys.exit(1)
+
+
+@cli.command()
+def clear():
+    """Clear all master videos from the library."""
+    if click.confirm('Are you sure you want to clear all masters?'):
+        try:
+            matcher = VideoMatcher()
+            matcher.clear_masters()
+            console.print("[green]✓[/green] All masters cleared")
+        except Exception as e:
+            console.print(f"[red]✗[/red] Error: {e}")
+            sys.exit(1)
+
+
+@cli.command()
+@click.argument('folder_path', type=click.Path(exists=True))
+@click.option('--threshold', '-t', default=0.80, type=float, help='Minimum percentage match (0-1)')
+@click.option('--frame-threshold', '-f', default=0.80, type=float, help='Frame similarity threshold (0-1)')
+@click.option('--min-avg-similarity', '-m', default=0.90, type=float, help='Minimum average similarity of matched frames (0-1)')
+@click.option('--output', '-o', default=None, help='Output HTML file path')
+def batch_match(folder_path, threshold, frame_threshold, min_avg_similarity, output):
+    """Match all videos in a folder and generate HTML report.
+
+    This will process all video files in the specified folder, match them
+    against your master videos, and generate a beautiful HTML report showing
+    which masters were used for each adaptation.
+    """
+    try:
+        from pathlib import Path
+        from datetime import datetime
+        from rich.progress import Progress, SpinnerColumn, TextColumn, BarColumn
+
+        folder_path = Path(folder_path)
+
+        # Common video extensions
+        VIDEO_EXTENSIONS = {'.mp4', '.mov', '.avi', '.mkv', '.webm', '.flv', '.wmv', '.m4v'}
+
+        # Find all video files
+        video_files = []
+        for ext in VIDEO_EXTENSIONS:
+            video_files.extend(folder_path.glob(f"*{ext}"))
+            video_files.extend(folder_path.glob(f"*{ext.upper()}"))
+
+        if not video_files:
+            console.print(f"[yellow]No video files found in {folder_path}[/yellow]")
+            return
+
+        console.print(f"\n[bold]Found {len(video_files)} video file(s) to process[/bold]\n")
+
+        # Initialize matcher
+        matcher = VideoMatcher()
+
+        # Check if we have masters
+        masters = matcher.list_masters()
+        if not masters:
+            console.print("[red]✗[/red] No master videos found in library.")
+            console.print("Use 'add-master' to add masters first.")
+            sys.exit(1)
+
+        console.print(f"[cyan]Comparing against {len(masters)} master(s)...[/cyan]\n")
+
+        # Process each video
+        results = []
+
+        with Progress(
+            SpinnerColumn(),
+            TextColumn("[progress.description]{task.description}"),
+            BarColumn(),
+            TextColumn("[progress.percentage]{task.percentage:>3.0f}%"),
+            console=console
+        ) as progress:
+
+            task = progress.add_task("[cyan]Processing adaptations...", total=len(video_files))
+
+            for video_file in video_files:
+                progress.update(task, description=f"[cyan]Processing {video_file.name}...")
+
+                try:
+                    matches = matcher.match_adaptation(
+                        str(video_file),
+                        threshold=threshold,
+                        frame_threshold=frame_threshold,
+                        min_avg_similarity=min_avg_similarity
+                    )
+
+                    results.append({
+                        'adaptation_name': video_file.name,
+                        'adaptation_path': str(video_file),
+                        'matches': matches,
+                        'error': None
+                    })
+
+                except Exception as e:
+                    console.print(f"[red]✗[/red] Error processing {video_file.name}: {e}")
+                    results.append({
+                        'adaptation_name': video_file.name,
+                        'adaptation_path': str(video_file),
+                        'matches': [],
+                        'error': str(e)
+                    })
+
+                progress.advance(task)
+
+        # Generate output filename if not specified
+        if output is None:
+            timestamp = datetime.now().strftime('%Y%m%d_%H%M%S')
+            output = f"matching_report_{timestamp}.html"
+
+        output_path = Path(output)
+
+        # Generate HTML report (inline to avoid import issues)
+        console.print(f"\n[cyan]Generating HTML report...[/cyan]")
+
+        # Import the generation function from batch_match
+        sys.path.insert(0, str(Path(__file__).parent))
+        from batch_match import generate_html_report
+
+        generate_html_report(results, output_path, str(folder_path))
+
+        # Summary
+        console.print(f"\n[bold green]✓ Report generated successfully![/bold green]")
+        console.print(f"\n[bold]Summary:[/bold]")
+        console.print(f"  Total adaptations: {len(results)}")
+        console.print(f"  Matched: {sum(1 for r in results if r['matches'])}")
+        console.print(f"  No matches: {sum(1 for r in results if not r['matches'])}")
+        console.print(f"  Total master matches: {sum(len(r['matches']) for r in results)}")
+        console.print(f"\n[bold cyan]📄 Report saved to:[/bold cyan] {output_path.absolute()}")
+        console.print(f"\n[dim]Open in browser: file://{output_path.absolute()}[/dim]")
+
+    except Exception as e:
+        console.print(f"[red]✗[/red] Error: {e}")
+        import traceback
+        traceback.print_exc()
+        sys.exit(1)
+
+
+@cli.command()
+def status():
+    """Show system status and configuration."""
+    console.print("[bold]Video Master Detection - System Status[/bold]\n")
+
+    # Check dependencies
+    table = Table(title="Dependencies", box=box.SIMPLE)
+    table.add_column("Component", style="cyan")
+    table.add_column("Status", style="green")
+
+    # FFmpeg
+    import shutil
+    ffmpeg_available = shutil.which('ffmpeg') is not None
+    table.add_row("FFmpeg", "✓ Available" if ffmpeg_available else "✗ Not found")
+
+    # Chromaprint
+    try:
+        import acoustid
+        table.add_row("Chromaprint/AcoustID", "✓ Available")
+    except ImportError:
+        table.add_row("Chromaprint/AcoustID", "✗ Not available")
+
+    # TMK
+    try:
+        import tmkpy
+        table.add_row("TMK", "✓ Available")
+    except ImportError:
+        table.add_row("TMK", "✗ Not available (using basic hashing)")
+
+    console.print(table)
+
+    # Show library stats
+    matcher = VideoMatcher()
+    masters = matcher.list_masters()
+
+    console.print(f"\n[bold]Library Statistics[/bold]")
+    console.print(f"  Master videos: {len(masters)}")
+
+    if not ffmpeg_available:
+        console.print("\n[yellow]⚠ Warning: FFmpeg not found. Please install FFmpeg.[/yellow]")
+
+
+if __name__ == '__main__':
+    cli()
--- a/config.env
+++ b/config.env
@ -0,0 +1,10 @@
+OPENAI_API_KEY=sk-svcacct-HSREzGYDnN-vCVGAh6LhYqlNcJVF2oefMrY9oCsdDsQFmyVJyHpLb1eSb_mp_vP4YPl4T3BlbkFJzKaOrPghIzx76_22K8VjwO6j2JnoDEvrYDrgfrnA4WjD5sTMnhOqGHXximwGXFhUoYgA
+GOOGLE_API_KEY=AIzaSyDMWN_PAnyU7bPmtWcEKq4LJfiu1KuwUsU
+
+# Azure AD / MSAL Authentication Configuration
+AZURE_TENANT_ID=e519c2e6-bc6d-4fdf-8d9c-923c2f002385
+AZURE_CLIENT_ID=9079054c-9620-4757-a256-23413042f1ef
+
+# Flask Security Configuration
+FLASK_ENV=development
+SECRET_KEY=your-secret-key-here-change-in-production
--- a/requirements.txt
+++ b/requirements.txt
@ -0,0 +1,18 @@
+# Core dependencies (audio fingerprinting)
+pyacoustid>=1.3.0
+
+# Video processing
+ffmpeg-python>=0.2.0
+
+# AI Vision (OpenAI GPT-4V for cross-aspect matching)
+openai>=1.12.0
+python-dotenv>=1.0.0
+
+# CLI
+click>=8.1.0
+rich>=13.7.0
+tqdm>=4.66.0
+
+# Utilities
+numpy>=1.24.0
+Pillow>=10.0.0
--- a/src/video_matcher/init.py
+++ b/src/video_matcher/init.py
@ -0,0 +1,3 @@
+"""Video Master-Adaptation Detection System."""
+
+__version__ = "0.1.0"
--- a/src/video_matcher/ai_vision.py
+++ b/src/video_matcher/ai_vision.py
@ -0,0 +1,290 @@
+"""AI Vision integration for cross-aspect-ratio video matching using OpenAI GPT-4V."""
+
+import os
+import base64
+import tempfile
+from pathlib import Path
+from typing import Dict, List, Optional, Tuple
+import ffmpeg
+
+# Load environment variables from .env file
+try:
+    from dotenv import load_dotenv
+    load_dotenv()
+except ImportError:
+    pass  # dotenv not installed, will use system env vars only
+
+
+class AIVisionMatcher:
+    """
+    Uses OpenAI GPT-4V to compare video frames for cross-aspect-ratio matching.
+    This is triggered as a fallback when perceptual hash matching fails.
+    """
+
+    def __init__(self, api_key: Optional[str] = None):
+        """
+        Initialize AI Vision matcher.
+
+        Args:
+            api_key: OpenAI API key (defaults to OPENAI_API_KEY env var)
+        """
+        self.api_key = api_key or os.getenv('OPENAI_API_KEY')
+
+        if not self.api_key:
+            print("  ⚠ Warning: OPENAI_API_KEY not set. AI vision matching disabled.")
+            self.enabled = False
+        else:
+            self.enabled = True
+
+        # Import OpenAI only if enabled
+        if self.enabled:
+            try:
+                from openai import OpenAI
+                self.client = OpenAI(api_key=self.api_key)
+            except ImportError:
+                print("  ⚠ Warning: openai package not installed. Run: pip install openai")
+                self.enabled = False
+
+    def extract_key_frames(self, video_path: str, num_frames: int = 5, max_dimension: int = 1024) -> List[str]:
+        """
+        Extract evenly-spaced key frames from a video.
+
+        Args:
+            video_path: Path to video file
+            num_frames: Number of frames to extract (default 5)
+            max_dimension: Maximum width/height for frames (default 1024 for cost)
+
+        Returns:
+            List of base64-encoded frame images
+        """
+        try:
+            # Get video info
+            probe = ffmpeg.probe(video_path)
+            video_info = next(s for s in probe['streams'] if s['codec_type'] == 'video')
+            duration = float(probe['format']['duration'])
+            width = int(video_info['width'])
+            height = int(video_info['height'])
+
+            # Calculate scale to fit within max_dimension
+            # For ffmpeg-python, we need to pass width and height separately
+            if width > height:
+                # Landscape: scale width to max_dimension, keep aspect ratio
+                scale_w = max_dimension if width > max_dimension else width
+                scale_h = -1 if width > max_dimension else height
+            else:
+                # Portrait: scale height to max_dimension, keep aspect ratio
+                scale_w = -1 if height > max_dimension else width
+                scale_h = max_dimension if height > max_dimension else height
+
+            frames_base64 = []
+
+            # Extract frames at evenly-spaced intervals
+            # Skip first and last 5% to avoid black frames/transitions
+            start_offset = duration * 0.05
+            end_offset = duration * 0.95
+            usable_duration = end_offset - start_offset
+
+            for i in range(num_frames):
+                # Calculate timestamp for this frame
+                if num_frames == 1:
+                    timestamp = duration / 2  # Middle frame
+                else:
+                    timestamp = start_offset + (usable_duration * i / (num_frames - 1))
+
+                # Create temp file for frame
+                with tempfile.NamedTemporaryFile(suffix='.jpg', delete=False) as tmp:
+                    tmp_path = tmp.name
+
+                try:
+                    # Extract frame using ffmpeg
+                    (
+                        ffmpeg
+                        .input(video_path, ss=timestamp)
+                        .filter('scale', w=scale_w, h=scale_h)
+                        .output(tmp_path, vframes=1, format='image2', vcodec='mjpeg')
+                        .overwrite_output()
+                        .run(capture_stdout=True, capture_stderr=True)
+                    )
+
+                    # Read and encode as base64
+                    with open(tmp_path, 'rb') as f:
+                        frame_bytes = f.read()
+                        frame_base64 = base64.b64encode(frame_bytes).decode('utf-8')
+                        frames_base64.append(frame_base64)
+
+                except ffmpeg.Error as e:
+                    print(f"  FFmpeg error at timestamp {timestamp:.2f}s: {e.stderr.decode() if e.stderr else str(e)}")
+                    continue
+                finally:
+                    # Clean up temp file
+                    if os.path.exists(tmp_path):
+                        os.unlink(tmp_path)
+
+            return frames_base64
+
+        except Exception as e:
+            print(f"  Error extracting frames from {video_path}: {e}")
+            return []
+
+    def compare_videos(self, adaptation_path: str, master_path: str,
+                      adaptation_name: str = "adaptation", master_name: str = "master") -> Dict:
+        """
+        Compare two videos using OpenAI GPT-4V to determine if they contain the same scenes.
+
+        Args:
+            adaptation_path: Path to adaptation video
+            master_path: Path to master video
+            adaptation_name: Name for adaptation (for display)
+            master_name: Name for master (for display)
+
+        Returns:
+            Dict with:
+                - match: bool (True if videos match)
+                - confidence: float (0-1)
+                - explanation: str (AI's reasoning)
+                - is_crop: bool (True if adaptation is a crop of master)
+                - cost: float (API cost in USD)
+        """
+        if not self.enabled:
+            return {
+                'match': False,
+                'confidence': 0.0,
+                'explanation': 'AI vision disabled (no API key)',
+                'is_crop': False,
+                'cost': 0.0
+            }
+
+        print(f"    Extracting frames from {adaptation_name}...")
+        adaptation_frames = self.extract_key_frames(adaptation_path, num_frames=5)
+
+        print(f"    Extracting frames from {master_name}...")
+        master_frames = self.extract_key_frames(master_path, num_frames=5)
+
+        if not adaptation_frames or not master_frames:
+            return {
+                'match': False,
+                'confidence': 0.0,
+                'explanation': 'Failed to extract frames',
+                'is_crop': False,
+                'cost': 0.0
+            }
+
+        print(f"    Analyzing with GPT-4V...")
+
+        # Build message with images
+        content = [
+            {
+                "type": "text",
+                "text": f"""You are a video forensics expert analyzing whether two videos contain the same source footage.
+
+**Critical Context:**
+- Set A ({adaptation_name}) may be created from Set B ({master_name}) through cropping, scaling, or pan-and-scan
+- The aspect ratios may differ (e.g., 16:9 cropped to 1:1 square or 9:16 vertical)
+- Set A might show zoomed/cropped portions of scenes from Set B
+
+**What to IGNORE completely:**
+- Text overlays, titles, captions, and subtitles
+- Logo size, placement, or styling differences
+- Different text languages or localization
+- Social media platform branding (Facebook, Instagram, TikTok logos)
+- Call-to-action text or price tags
+
+**What to FOCUS on:**
+- Are the PEOPLE the same? (faces, clothing, poses, actions)
+- Are the PRODUCTS the same? (items being shown, held, or featured)
+- Are the SETTINGS the same? (backgrounds, environments, locations)
+- Is the FRAMING similar? (same shots, even if cropped or zoomed)
+- Is the SEQUENCE similar? (same order of events/scenes)
+
+**Key Question:** Could Set A be a cropped/zoomed version of Set B, showing the same footage but from a different aspect ratio?
+
+**Your Task:**
+Compare Set A and Set B and determine if they contain the same source footage.
+
+**Set A ({adaptation_name}):** 5 frames from potential adaptation
+**Set B ({master_name}):** 5 frames from potential master source
+
+Provide your analysis in this EXACT format:
+MATCH: [Yes/No]
+CONFIDENCE: [0-100, where 100 = absolutely certain]
+IS_CROP: [Yes/No/Unclear - is Set A a crop/zoom of Set B?]
+EXPLANATION: [Describe what you see: are people, products, settings the same? Even if text/logos differ, is the underlying footage identical?]"""
+            }
+        ]
+
+        # Add adaptation frames
+        for i, frame in enumerate(adaptation_frames):
+            content.append({
+                "type": "image_url",
+                "image_url": {
+                    "url": f"data:image/jpeg;base64,{frame}",
+                    "detail": "low"  # Use low detail for cost savings
+                }
+            })
+
+        # Add master frames
+        for i, frame in enumerate(master_frames):
+            content.append({
+                "type": "image_url",
+                "image_url": {
+                    "url": f"data:image/jpeg;base64,{frame}",
+                    "detail": "low"
+                }
+            })
+
+        try:
+            # Call OpenAI API with latest vision model
+            response = self.client.chat.completions.create(
+                model="gpt-4o",  # Updated to latest GPT-4 with vision
+                messages=[{
+                    "role": "user",
+                    "content": content
+                }],
+                max_tokens=500
+            )
+
+            # Parse response
+            answer = response.choices[0].message.content
+
+            # Extract structured data from response
+            match = "MATCH: Yes" in answer or "MATCH: YES" in answer
+
+            # Extract confidence
+            confidence = 0.5
+            if "CONFIDENCE:" in answer:
+                try:
+                    conf_line = [line for line in answer.split('\n') if 'CONFIDENCE:' in line][0]
+                    conf_str = conf_line.split('CONFIDENCE:')[1].strip().split()[0]
+                    confidence = float(conf_str) / 100.0
+                except:
+                    pass
+
+            # Extract is_crop
+            is_crop = "IS_CROP: Yes" in answer or "IS_CROP: YES" in answer
+
+            # Calculate cost (approximate)
+            # GPT-4o vision: ~$0.00255 per image at low detail (170 tokens per image)
+            # Input: $2.50 per 1M tokens, Output: $10 per 1M tokens
+            # Low detail = ~170 tokens per image
+            num_images = len(adaptation_frames) + len(master_frames)
+            input_tokens = num_images * 170 + 300  # images + prompt text
+            output_tokens = 150  # estimated response
+            cost = (input_tokens / 1000000 * 2.50) + (output_tokens / 1000000 * 10)
+
+            return {
+                'match': match,
+                'confidence': confidence,
+                'explanation': answer,
+                'is_crop': is_crop,
+                'cost': cost
+            }
+
+        except Exception as e:
+            print(f"    Error calling OpenAI API: {e}")
+            return {
+                'match': False,
+                'confidence': 0.0,
+                'explanation': f'API error: {str(e)}',
+                'is_crop': False,
+                'cost': 0.0
+            }
--- a/src/video_matcher/fingerprinter.py
+++ b/src/video_matcher/fingerprinter.py
@ -0,0 +1,447 @@
+"""Video and audio fingerprinting utilities."""
+
+import os
+import json
+import subprocess
+import tempfile
+from pathlib import Path
+from typing import Dict, List, Optional, Tuple
+import hashlib
+
+try:
+    import acoustid
+    CHROMAPRINT_AVAILABLE = True
+except ImportError:
+    CHROMAPRINT_AVAILABLE = False
+    print("Warning: chromaprint/acoustid not available. Audio fingerprinting disabled.")
+
+try:
+    import tmkpy
+    TMK_AVAILABLE = True
+except ImportError:
+    TMK_AVAILABLE = False
+    print("Warning: tmkpy not available. Will use basic frame hashing instead.")
+
+import ffmpeg
+import numpy as np
+
+
+class VideoFingerprinter:
+    """Generate fingerprints for video files."""
+
+    def __init__(self, data_dir: str = "data/fingerprints"):
+        self.data_dir = Path(data_dir)
+        self.data_dir.mkdir(parents=True, exist_ok=True)
+
+    def get_video_info(self, video_path: str) -> Dict:
+        """Extract basic video metadata."""
+        try:
+            probe = ffmpeg.probe(video_path)
+            video_info = next(s for s in probe['streams'] if s['codec_type'] == 'video')
+            audio_info = next((s for s in probe['streams'] if s['codec_type'] == 'audio'), None)
+
+            return {
+                'duration': float(probe['format']['duration']),
+                'width': int(video_info['width']),
+                'height': int(video_info['height']),
+                'fps': eval(video_info['r_frame_rate']),
+                'has_audio': audio_info is not None,
+                'codec': video_info['codec_name']
+            }
+        except Exception as e:
+            print(f"Error getting video info: {e}")
+            return {}
+
+    def extract_audio_fingerprint(self, video_path: str) -> Optional[Dict]:
+        """Extract audio fingerprint using Chromaprint."""
+        if not CHROMAPRINT_AVAILABLE:
+            return None
+
+        try:
+            # Extract audio to temporary WAV file
+            with tempfile.NamedTemporaryFile(suffix='.wav', delete=False) as tmp:
+                tmp_path = tmp.name
+
+            # Convert audio to mono 16kHz WAV
+            (
+                ffmpeg
+                .input(video_path)
+                .output(tmp_path, acodec='pcm_s16le', ac=1, ar=16000)
+                .overwrite_output()
+                .run(quiet=True, capture_stdout=True, capture_stderr=True)
+            )
+
+            # Generate fingerprint
+            duration, fp = acoustid.fingerprint_file(tmp_path)
+
+            # Clean up
+            os.unlink(tmp_path)
+
+            # Convert fingerprint to string if it's bytes
+            if isinstance(fp, bytes):
+                fp = fp.decode('utf-8')
+
+            return {
+                'duration': duration,
+                'fingerprint': fp,
+                'method': 'chromaprint'
+            }
+        except Exception as e:
+            print(f"Error extracting audio fingerprint: {e}")
+            return None
+
+    def extract_tmk_fingerprint(self, video_path: str) -> Optional[Dict]:
+        """Extract TMK video fingerprint."""
+        if not TMK_AVAILABLE:
+            return self._extract_basic_video_hash(video_path)
+
+        try:
+            # TMK implementation would go here
+            # For now, fall back to basic hashing
+            return self._extract_basic_video_hash(video_path)
+        except Exception as e:
+            print(f"Error extracting TMK fingerprint: {e}")
+            return None
+
+    def _extract_basic_video_hash(self, video_path: str, samples_per_second: float = 2.0) -> Dict:
+        """
+        Extract basic perceptual hash from video frames.
+        This is a fallback when TMK is not available.
+
+        Args:
+            video_path: Path to video file
+            samples_per_second: Number of frame samples per second (default 1.0 = 1 frame/sec)
+        """
+        try:
+            info = self.get_video_info(video_path)
+            duration = info.get('duration', 0)
+
+            if duration == 0:
+                return {'method': 'basic_hash', 'frames': []}
+
+            # Calculate number of frames to sample (at least 3)
+            num_frames = max(3, int(duration * samples_per_second))
+            time_interval = duration / num_frames
+
+            # Extract frames at regular intervals
+            frames = []
+            for i in range(num_frames):
+                timestamp = i * time_interval
+
+                # Extract single frame
+                out, _ = (
+                    ffmpeg
+                    .input(video_path, ss=timestamp)
+                    .output('pipe:', vframes=1, format='rawvideo', pix_fmt='gray')
+                    .run(capture_stdout=True, capture_stderr=True, quiet=True)
+                )
+
+                # Convert to numpy and resize to 8x8 for perceptual hash
+                frame = np.frombuffer(out, np.uint8).reshape(info['height'], info['width'])
+
+                # Simple downsample to 8x8
+                h, w = frame.shape
+                block_h, block_w = h // 8, w // 8
+                small = np.zeros((8, 8), dtype=np.uint8)
+                for y in range(8):
+                    for x in range(8):
+                        small[y, x] = frame[y*block_h:(y+1)*block_h, x*block_w:(x+1)*block_w].mean()
+
+                # Create perceptual hash
+                avg = small.mean()
+                hash_bits = (small > avg).flatten()
+                hash_hex = hex(int(''.join(['1' if b else '0' for b in hash_bits]), 2))
+
+                frames.append({
+                    'frame_id': i,
+                    'timestamp': timestamp,
+                    'hash': hash_hex
+                })
+
+            return {
+                'method': 'basic_hash',
+                'samples_per_second': samples_per_second,
+                'num_frames': num_frames,
+                'frames': frames,
+                # Keep old format for backward compatibility
+                'segments': frames,
+                'hashes': frames
+            }
+        except Exception as e:
+            print(f"Error extracting basic video hash: {e}")
+            return {'method': 'basic_hash', 'frames': [], 'segments': [], 'hashes': []}
+
+
+    def fingerprint_video(self, video_path: str, video_id: str) -> Dict:
+        """Generate complete fingerprint for a video file."""
+        print(f"Fingerprinting: {video_path}")
+
+        video_path = str(Path(video_path).resolve())
+
+        fingerprint = {
+            'video_id': video_id,
+            'path': video_path,
+            'filename': os.path.basename(video_path),
+            'info': self.get_video_info(video_path),
+            'audio_fp': self.extract_audio_fingerprint(video_path),
+            'video_fp': self.extract_tmk_fingerprint(video_path)
+        }
+
+        # Save fingerprint
+        fp_file = self.data_dir / f"{video_id}.json"
+        with open(fp_file, 'w') as f:
+            json.dump(fingerprint, f, indent=2)
+
+        print(f"  ✓ Saved fingerprint to {fp_file}")
+        return fingerprint
+
+    def load_fingerprint(self, video_id: str) -> Optional[Dict]:
+        """Load a previously saved fingerprint."""
+        fp_file = self.data_dir / f"{video_id}.json"
+        if not fp_file.exists():
+            return None
+
+        with open(fp_file, 'r') as f:
+            return json.load(f)
+
+    def list_fingerprints(self) -> List[str]:
+        """List all saved fingerprint IDs."""
+        return [f.stem for f in self.data_dir.glob("*.json")]
+
+
+def compare_audio_fingerprints(fp1: Dict, fp2: Dict) -> float:
+    """Compare two audio fingerprints and return similarity score (0-1)."""
+    if not fp1 or not fp2:
+        return 0.0
+
+    if not CHROMAPRINT_AVAILABLE:
+        return 0.0
+
+    try:
+        # Chromaprint comparison - this is simplified
+        # In production, use acoustid.compare or implement proper alignment
+        return 0.5  # Placeholder - proper implementation needed
+    except Exception as e:
+        print(f"Error comparing audio: {e}")
+        return 0.0
+
+
+def compare_video_fingerprints(fp1: Dict, fp2: Dict) -> float:
+    """Compare two video fingerprints and return similarity score (0-1)."""
+    if not fp1 or not fp2:
+        return 0.0
+
+    method1 = fp1.get('method')
+    method2 = fp2.get('method')
+
+    if method1 == 'basic_hash' and method2 == 'basic_hash':
+        return _compare_basic_hashes(fp1, fp2)
+
+    return 0.0
+
+
+def _compare_basic_hashes(fp1: Dict, fp2: Dict) -> float:
+    """
+    Compare basic perceptual hashes (legacy function for backward compatibility).
+    Returns overall similarity score.
+    """
+    segments1 = fp1.get('segments', fp1.get('hashes', []))
+    segments2 = fp2.get('segments', fp2.get('hashes', []))
+
+    if not segments1 or not segments2:
+        return 0.0
+
+    # Simple approach: compare hashes at similar timestamps
+    matches = 0
+    total = min(len(segments1), len(segments2))
+
+    for h1, h2 in zip(segments1, segments2):
+        if h1['hash'] == h2['hash']:
+            matches += 1
+        else:
+            # Calculate hamming distance for partial matches
+            try:
+                bits1 = bin(int(h1['hash'], 16))[2:].zfill(64)
+                bits2 = bin(int(h2['hash'], 16))[2:].zfill(64)
+                hamming = sum(b1 != b2 for b1, b2 in zip(bits1, bits2))
+                # Score based on similarity (64 bits total)
+                if hamming < 16:  # Less than 25% different
+                    matches += (64 - hamming) / 64
+            except:
+                pass
+
+    return matches / total if total > 0 else 0.0
+
+
+def compare_segments(adaptation_fp: Dict, master_fp: Dict, similarity_threshold: float = 0.8) -> Dict:
+    """
+    Compare adaptation segments against master segments.
+
+    Args:
+        adaptation_fp: Adaptation fingerprint with segments
+        master_fp: Master fingerprint with segments
+        similarity_threshold: Threshold for considering segments as matching (0-1)
+
+    Returns:
+        Dict with segment-level matching information
+    """
+    if not adaptation_fp or not master_fp:
+        return {'matching_segments': 0, 'total_segments': 0, 'percentage': 0.0, 'segment_matches': []}
+
+    # Handle both old format (hashes) and new format (segments)
+    adaptation_segments = adaptation_fp.get('segments', adaptation_fp.get('hashes', []))
+    master_segments = master_fp.get('segments', master_fp.get('hashes', []))
+
+    if not adaptation_segments or not master_segments:
+        return {'matching_segments': 0, 'total_segments': 0, 'percentage': 0.0, 'segment_matches': []}
+
+    segment_matches = []
+
+    # For each adaptation segment, find best matching master segment
+    for idx, adapt_seg in enumerate(adaptation_segments):
+        best_score = 0.0
+        best_master_seg = None
+        best_master_idx = None
+
+        # Compare against all master segments
+        for master_idx, master_seg in enumerate(master_segments):
+            score = _calculate_hash_similarity(adapt_seg['hash'], master_seg['hash'])
+
+            if score > best_score:
+                best_score = score
+                best_master_seg = master_seg
+                best_master_idx = master_idx
+
+        # If similarity exceeds threshold, consider it a match
+        is_match = best_score >= similarity_threshold
+
+        segment_matches.append({
+            'adaptation_segment': adapt_seg.get('segment_id', idx),
+            'adaptation_time': (adapt_seg.get('start_time'), adapt_seg.get('end_time')),
+            'matched': is_match,
+            'similarity': best_score,
+            'master_segment': best_master_seg.get('segment_id', best_master_idx) if best_master_seg else None,
+            'master_time': (best_master_seg.get('start_time'), best_master_seg.get('end_time')) if best_master_seg else None
+        })
+
+    matching_segments = sum(1 for m in segment_matches if m['matched'])
+    total_segments = len(adaptation_segments)
+    percentage = (matching_segments / total_segments * 100) if total_segments > 0 else 0.0
+
+    return {
+        'matching_segments': matching_segments,
+        'total_segments': total_segments,
+        'percentage': round(percentage, 1),
+        'segment_matches': segment_matches
+    }
+
+
+def _calculate_hash_similarity(hash1: str, hash2: str) -> float:
+    """Calculate similarity between two perceptual hashes (0-1)."""
+    try:
+        bits1 = bin(int(hash1, 16))[2:].zfill(64)
+        bits2 = bin(int(hash2, 16))[2:].zfill(64)
+        hamming = sum(b1 != b2 for b1, b2 in zip(bits1, bits2))
+        # Convert hamming distance to similarity score
+        return (64 - hamming) / 64
+    except:
+        return 0.0
+
+
+def compare_spatial_only(adaptation_fp: Dict, master_fp: Dict, similarity_threshold: float = 0.75, debug: bool = False) -> Dict:
+    """
+    Compare adaptation frames against master frames ignoring temporal order.
+    This handles speed changes, shot reordering, and non-linear edits.
+
+    For each adaptation frame, we check if it exists ANYWHERE in the master.
+
+    Args:
+        adaptation_fp: Adaptation fingerprint
+        master_fp: Master fingerprint
+        similarity_threshold: Threshold for considering frames as matching (0-1)
+        debug: Enable debug output showing similarity scores
+
+    Returns:
+        Dict with matching information including percentage
+    """
+    if not adaptation_fp or not master_fp:
+        return {
+            'matching_frames': 0,
+            'total_frames': 0,
+            'percentage': 0.0,
+            'matches': [],
+            'average_similarity': 0.0,
+            'matched_similarities': []
+        }
+
+    # Get frame hashes (support multiple legacy formats)
+    adapt_frames = (adaptation_fp.get('frames') or
+                   adaptation_fp.get('segments') or
+                   adaptation_fp.get('hashes') or [])
+
+    master_frames = (master_fp.get('frames') or
+                    master_fp.get('segments') or
+                    master_fp.get('hashes') or [])
+
+    if not adapt_frames or not master_frames:
+        return {
+            'matching_frames': 0,
+            'total_frames': 0,
+            'percentage': 0.0,
+            'matches': [],
+            'average_similarity': 0.0,
+            'matched_similarities': []
+        }
+
+    # Build a set of master hashes for quick lookup
+    master_hashes = [frame['hash'] for frame in master_frames]
+
+    matches = []
+    matching_count = 0
+    matched_similarities = []
+
+    # For each adaptation frame, find best match in master (anywhere in timeline)
+    for adapt_frame in adapt_frames:
+        best_score = 0.0
+        best_master_idx = None
+
+        # Compare against ALL master frames (spatial only, ignore time)
+        for master_idx, master_hash in enumerate(master_hashes):
+            score = _calculate_hash_similarity(adapt_frame['hash'], master_hash)
+
+            if score > best_score:
+                best_score = score
+                best_master_idx = master_idx
+
+        # Consider it a match if above threshold
+        is_match = best_score >= similarity_threshold
+        if is_match:
+            matching_count += 1
+            matched_similarities.append(best_score)
+
+        matches.append({
+            'adaptation_frame': adapt_frame.get('frame_id', adapt_frame.get('segment_id')),
+            'adaptation_timestamp': adapt_frame.get('timestamp'),
+            'matched': is_match,
+            'best_similarity': best_score,
+            'best_master_frame': best_master_idx,
+            'best_master_timestamp': master_frames[best_master_idx]['timestamp'] if best_master_idx is not None else None
+        })
+
+    total_frames = len(adapt_frames)
+    percentage = (matching_count / total_frames * 100) if total_frames > 0 else 0.0
+
+    # Calculate average of ONLY matched frames (not all frames)
+    avg_of_matches = sum(matched_similarities) / len(matched_similarities) if matched_similarities else 0.0
+
+    return {
+        'matching_frames': matching_count,
+        'total_frames': total_frames,
+        'percentage': round(percentage, 1),
+        'matches': matches,
+        'average_similarity': sum(m['best_similarity'] for m in matches) / len(matches) if matches else 0.0,
+        'matched_similarities': matched_similarities,
+        'average_of_matches': avg_of_matches
+    }
+
+
--- a/src/video_matcher/matcher.py
+++ b/src/video_matcher/matcher.py
@ -0,0 +1,294 @@
+"""Video matching logic."""
+
+import json
+from pathlib import Path
+from typing import Dict, List, Tuple
+from .fingerprinter import (
+    VideoFingerprinter,
+    compare_audio_fingerprints,
+    compare_video_fingerprints,
+    compare_segments,
+    compare_spatial_only
+)
+from .ai_vision import AIVisionMatcher
+
+
+class VideoMatcher:
+    """Match adaptation videos against master videos."""
+
+    def __init__(self, data_dir: str = "data", enable_ai_vision: bool = True):
+        self.data_dir = Path(data_dir)
+        self.fingerprinter = VideoFingerprinter(data_dir=str(self.data_dir / "fingerprints"))
+        self.masters_db = self.data_dir / "masters.json"
+        self._ensure_db()
+
+        # Initialize AI Vision matcher (Tier 2 fallback)
+        self.ai_vision = AIVisionMatcher() if enable_ai_vision else None
+        if self.ai_vision and self.ai_vision.enabled:
+            print("  ✓ AI Vision enabled (GPT-4V)")
+        elif enable_ai_vision:
+            print("  ⚠ AI Vision disabled (no API key)")
+
+    def _ensure_db(self):
+        """Ensure database file exists."""
+        if not self.masters_db.exists():
+            with open(self.masters_db, 'w') as f:
+                json.dump({'masters': []}, f)
+
+    def add_master(self, video_path: str, master_id: str = None) -> Dict:
+        """
+        Add a master video to the library.
+
+        Args:
+            video_path: Path to the master video file
+            master_id: Optional ID, defaults to filename without extension
+
+        Returns:
+            Fingerprint dictionary
+        """
+        video_path = Path(video_path).resolve()
+
+        if not video_path.exists():
+            raise FileNotFoundError(f"Video file not found: {video_path}")
+
+        if master_id is None:
+            master_id = video_path.stem
+
+        # Generate fingerprint
+        fingerprint = self.fingerprinter.fingerprint_video(str(video_path), f"master_{master_id}")
+
+        # Add to masters database
+        with open(self.masters_db, 'r') as f:
+            db = json.load(f)
+
+        # Check if already exists
+        existing = [m for m in db['masters'] if m['master_id'] == master_id]
+        if existing:
+            print(f"  ⚠ Master '{master_id}' already exists, updating...")
+            db['masters'] = [m for m in db['masters'] if m['master_id'] != master_id]
+
+        db['masters'].append({
+            'master_id': master_id,
+            'fingerprint_id': fingerprint['video_id'],
+            'path': str(video_path),
+            'filename': video_path.name,
+            'duration': fingerprint['info'].get('duration', 0)
+        })
+
+        with open(self.masters_db, 'w') as f:
+            json.dump(db, f, indent=2)
+
+        print(f"  ✓ Added master: {master_id}")
+        return fingerprint
+
+    def list_masters(self) -> List[Dict]:
+        """List all master videos in the library."""
+        with open(self.masters_db, 'r') as f:
+            db = json.load(f)
+        return db['masters']
+
+    def match_adaptation(self, video_path: str, threshold: float = 0.80, frame_threshold: float = 0.80, min_avg_similarity: float = 0.90) -> List[Dict]:
+        """
+        Match an adaptation video against all masters using spatial-only matching.
+        This ignores temporal order and handles speed changes, shot reordering, etc.
+
+        Args:
+            video_path: Path to the adaptation video
+            threshold: Minimum percentage of frames matching to report a master (0-1, default 0.80 = 80%)
+            frame_threshold: Similarity threshold for individual frames (0-1, default 0.80)
+            min_avg_similarity: Minimum average similarity of matched frames to consider valid (0-1, default 0.90)
+
+        Returns:
+            List of matches with percentage contribution from each master
+        """
+        video_path = Path(video_path).resolve()
+
+        if not video_path.exists():
+            raise FileNotFoundError(f"Video file not found: {video_path}")
+
+        print(f"\nAnalyzing adaptation: {video_path.name}")
+
+        # Generate fingerprint for adaptation
+        adaptation_id = f"adaptation_{video_path.stem}"
+        adaptation_fp = self.fingerprinter.fingerprint_video(str(video_path), adaptation_id)
+
+        # Load all master fingerprints
+        masters = self.list_masters()
+        print(f"\nComparing against {len(masters)} master(s)...")
+        print(f"Using spatial-only matching (ignores timing/speed changes)...")
+
+        matches = []
+
+        for master in masters:
+            master_fp = self.fingerprinter.load_fingerprint(master['fingerprint_id'])
+
+            if not master_fp:
+                print(f"  ⚠ Could not load fingerprint for {master['master_id']}")
+                continue
+
+            # Spatial-only video comparison (ignores temporal order)
+            video_comparison = compare_spatial_only(
+                adaptation_fp.get('video_fp'),
+                master_fp.get('video_fp'),
+                similarity_threshold=frame_threshold
+            )
+
+            video_percentage = video_comparison['percentage']
+            avg_similarity = video_comparison['average_similarity']
+            avg_of_matches = video_comparison.get('average_of_matches', 0.0)
+
+            # Calculate audio similarity
+            audio_score = compare_audio_fingerprints(
+                adaptation_fp.get('audio_fp'),
+                master_fp.get('audio_fp')
+            )
+
+            # Quality check: Only include masters that pass BOTH criteria:
+            # 1. Enough frames match (percentage threshold)
+            # 2. The matched frames are high quality (average similarity threshold)
+            passes_percentage = video_percentage >= (threshold * 100)
+            passes_quality = avg_of_matches >= min_avg_similarity if avg_of_matches > 0 else False
+
+            if passes_percentage and passes_quality:
+                # Calculate combined score (weighted by video + audio)
+                # Give more weight to video, but audio helps with edge cases
+                if audio_score > 0 and video_percentage > 0:
+                    combined_score = (video_percentage / 100 * 0.7) + (audio_score * 0.3)
+                else:
+                    combined_score = video_percentage / 100
+
+                matches.append({
+                    'master_id': master['master_id'],
+                    'master_file': master['filename'],
+                    'master_path': master['path'],
+                    'master_duration': master['duration'],
+                    'video_percentage': video_percentage,
+                    'audio_similarity': round(audio_score, 3),
+                    'average_frame_similarity': round(avg_similarity, 3),
+                    'matching_frames': video_comparison['matching_frames'],
+                    'total_frames': video_comparison['total_frames'],
+                    'combined_score': round(combined_score, 3),
+                    'confidence': self._get_confidence_level(combined_score)
+                })
+
+        # Sort by multiple criteria for better ranking when scores are tied
+        # 1. Combined score (primary)
+        # 2. Master duration (prefer longer masters as likely source)
+        # 3. Video percentage (tertiary)
+        matches.sort(key=lambda x: (
+            x['combined_score'],           # Primary: highest combined score
+            x['master_duration'],          # Secondary: longest master (likely source)
+            x['video_percentage']          # Tertiary: highest video match
+        ), reverse=True)
+
+        # TIER 2: AI Vision (Smart Fallback - Only when truly needed!)
+        # Trigger AI Vision ONLY when perceptual hash truly failed:
+        # 1. No matches found at all (likely cross-aspect), OR
+        # 2. Best match has incomplete frame coverage < 100% (partial/uncertain match)
+        if self.ai_vision and self.ai_vision.enabled:
+            should_use_ai = False
+            reason = None
+
+            if not matches:
+                # No matches found - likely cross-aspect or completely different content
+                should_use_ai = True
+                reason = "no matches found"
+            elif matches:
+                best_match = matches[0]
+                video_percentage = best_match['video_percentage']
+
+                # If best match doesn't have 100% frame coverage, AI should verify
+                # This catches cross-aspect, partial matches, or uncertain cases
+                if video_percentage < 100.0:
+                    should_use_ai = True
+                    reason = f"incomplete coverage ({video_percentage:.1f}% matched)"
+
+            if should_use_ai:
+                print(f"\n  Triggering AI Vision: {reason}")
+                print("  Analyzing with GPT-4o for cross-aspect matching...")
+
+                # Try AI vision against all masters (or just cross-aspect ones)
+                ai_matches = []
+                total_cost = 0.0
+
+                for master in masters:
+                    master_path = master['path']
+
+                    # Call AI vision
+                    ai_result = self.ai_vision.compare_videos(
+                        str(video_path),
+                        master_path,
+                        adaptation_name=video_path.name,
+                        master_name=master['master_id']
+                    )
+
+                    total_cost += ai_result['cost']
+
+                    if ai_result['match'] and ai_result['confidence'] >= 0.75:
+                        print(f"    ✓ AI Vision match: {master['master_id']} (confidence: {ai_result['confidence']:.0%}, cost: ${ai_result['cost']:.3f})")
+
+                        # Convert to standard match format
+                        ai_matches.append({
+                            'master_id': master['master_id'],
+                            'master_file': master['filename'],
+                            'master_path': master['path'],
+                            'master_duration': master['duration'],
+                            'video_percentage': ai_result['confidence'] * 100,
+                            'audio_similarity': 0.5,
+                            'average_frame_similarity': ai_result['confidence'],
+                            'matching_frames': int(30 * ai_result['confidence']),  # Estimate
+                            'total_frames': 30,
+                            'combined_score': ai_result['confidence'],
+                            'confidence': self._get_confidence_level(ai_result['confidence']),
+                            'matching_method': 'ai_vision',
+                            'ai_explanation': ai_result['explanation'],
+                            'is_crop': ai_result['is_crop']
+                        })
+
+                print(f"\n  AI Vision total cost: ${total_cost:.3f}")
+
+                if ai_matches:
+                    # Sort AI matches by confidence
+                    ai_matches.sort(key=lambda x: x['combined_score'], reverse=True)
+                    return ai_matches
+            else:
+                # AI Vision NOT triggered - perceptual hash found good matches
+                if matches:
+                    best = matches[0]
+                    print(f"\n  ✓ Perceptual hash found complete match ({best['video_percentage']:.1f}% coverage)")
+                    print(f"  → AI Vision skipped (saves ~${len(masters) * 0.006:.2f})")
+
+        # Filter to show only 100% video matches if available, otherwise highest percentage
+        if matches:
+            # Check if any 100% video matches exist
+            perfect_matches = [m for m in matches if m['video_percentage'] == 100.0]
+
+            if perfect_matches:
+                # Only return 100% matches
+                return perfect_matches
+            else:
+                # Find the highest video percentage
+                max_percentage = max(m['video_percentage'] for m in matches)
+                # Return all matches with that highest percentage
+                return [m for m in matches if m['video_percentage'] == max_percentage]
+
+        return matches
+
+    def _get_confidence_level(self, score: float) -> str:
+        """Convert numeric score to confidence level."""
+        if score >= 0.9:
+            return "Very High"
+        elif score >= 0.75:
+            return "High"
+        elif score >= 0.6:
+            return "Medium"
+        elif score >= 0.5:
+            return "Low"
+        else:
+            return "Very Low"
+
+    def clear_masters(self):
+        """Clear all masters from the database."""
+        with open(self.masters_db, 'w') as f:
+            json.dump({'masters': []}, f)
+        print("✓ Cleared all masters")