Coldaine · Coldaine · Feb 16, 2026 · Jan 6, 2026 · Jan 7, 2026 · Jan 7, 2026
diff --git a/.github/workflows/visual-tests.yml b/.github/workflows/visual-tests.yml
@@ -0,0 +1,270 @@
+# Captures overlay screenshots under a virtual X server, optionally validates
+# them with Claude vision, and runs the overlay unit tests in a second job.
+name: Visual Tests
+
+on:
+  # Manual trigger with options
+  workflow_dispatch:
+    inputs:
+      # Consulted by the "Validate screenshots with Claude" step on manual runs.
+      run_claude_validation:
+        description: 'Run Claude vision validation'
+        required: false
+        default: true
+        type: boolean
+      # Interpreter version for the visual-test job; quoted so it stays a string.
+      python_version:
+        description: 'Python version'
+        required: false
+        default: '3.11'
+        type: string
+
+  # Also run on PRs that touch overlay code
+  pull_request:
+    # Only these paths trigger the workflow on pull requests.
+    paths:
+      - 'sage/overlay.py'
+      - 'scripts/visual_test_overlay.py'
+      - 'scripts/validate_screenshots.py'
+      - 'tests/**/test_overlay*.py'
+
+jobs:
+  visual-test:
+    name: Capture & Validate Screenshots
+    runs-on: ubuntu-latest
+
+    steps:
+      # Fetch the repository so the scripts/ paths used by later steps exist.
+      - name: Checkout code
+        uses: actions/checkout@v4
+
+      # `inputs.python_version` is only populated on workflow_dispatch; the
+      # `|| '3.11'` fallback supplies the version for pull_request runs.
+      - name: Set up Python ${{ inputs.python_version || '3.11' }}
+        uses: actions/setup-python@v5
+        with:
+          python-version: ${{ inputs.python_version || '3.11' }}
+          # Reuse pip's download cache between runs.
+          cache: 'pip'
+
+      # System packages for the headless GUI run: xcb/xkb/EGL/GL libraries
+      # (the capture step selects QT_QPA_PLATFORM=xcb), xvfb for the virtual
+      # display, and imagemagick for the `montage` command used further down.
+      # NOTE(review): scrot is not invoked by this workflow directly; presumably
+      # the capture script uses it - confirm or drop it.
+      - name: Install system dependencies
+        run: |
+          sudo apt-get update
+          sudo apt-get install -y \
+            libdbus-1-dev \
+            libxcb-cursor0 \
+            libxcb-icccm4 \
+            libxcb-image0 \
+            libxcb-keysyms1 \
+            libxcb-randr0 \
+            libxcb-render-util0 \
+            libxcb-shape0 \
+            libxcb-xinerama0 \
+            libxcb-xfixes0 \
+            libxkbcommon-x11-0 \
+            x11-utils \
+            xvfb \
+            libegl1 \
+            libgl1 \
+            libglib2.0-0 \
+            scrot \
+            imagemagick
+
+      # Dependencies are listed explicitly and the project itself is installed
+      # with `--no-deps`, so nothing declared in the package metadata (such as
+      # the dbus extra mentioned below) is pulled in.
+      # NOTE(review): `anthropic` is presumably required by
+      # scripts/validate_screenshots.py - confirm.
+      - name: Install Python dependencies
+        run: |
+          python -m pip install --upgrade pip
+          # Install without dbus extra to avoid build issues in CI
+          pip install pydantic pyyaml PySide6 watchdog
+          pip install pytest pytest-cov pytest-qt ruff mypy types-PyYAML
+          pip install anthropic
+          pip install -e . --no-deps
+
+      # Runs the capture script under a virtual X server and publishes the
+      # number of screenshots as the `screenshot_count` step output.
+      - name: Run visual tests (capture screenshots)
+        id: capture
+        # The script below uses bash arrays and `shopt`, so pin the shell.
+        shell: bash
+        run: |
+          # Create screenshots directory
+          mkdir -p screenshots
+
+          # Run visual test script under xvfb with xcb platform.
+          # The exit code is held back so that the screenshot count is still
+          # written to the step outputs when the script fails part-way; the
+          # always() summary step reads that output.
+          set +e
+          xvfb-run -a --server-args="-screen 0 1920x1080x24" \
+            python scripts/visual_test_overlay.py
+          CAPTURE_EXIT_CODE=$?
+          set -e
+
+          # List captured screenshots
+          echo "Captured screenshots:"
+          ls -la screenshots/
+
+          # Count screenshots for summary (glob expansion, not `ls` parsing)
+          shopt -s nullglob
+          SCREENSHOTS=(screenshots/overlay_test_*.png)
+          shopt -u nullglob
+          SCREENSHOT_COUNT=${#SCREENSHOTS[@]}
+          echo "screenshot_count=$SCREENSHOT_COUNT" >> "$GITHUB_OUTPUT"
+
+          # Propagate a capture-script failure now that the count is recorded
+          if [ "$CAPTURE_EXIT_CODE" -ne 0 ]; then
+            echo "::error::Screenshot capture script exited with code $CAPTURE_EXIT_CODE"
+            exit "$CAPTURE_EXIT_CODE"
+          fi
+
+          # Require all 5 screenshots
+          if [ "$SCREENSHOT_COUNT" -lt 5 ]; then
+            echo "::error::Expected 5 screenshots, only captured $SCREENSHOT_COUNT"
+            exit 1
+          fi
+        env:
+          QT_QPA_PLATFORM: xcb
+          DISPLAY: ':99'
+
+      # Optional convenience image: tiles every captured screenshot into
+      # screenshots/montage.png. A montage failure never fails the step.
+      - name: Generate screenshot montage
+        if: success()
+        run: |
+          # Nothing to tile when no screenshot matches the pattern
+          ls screenshots/overlay_test_*.png > /dev/null 2>&1 || exit 0
+
+          # Create a montage of all screenshots for easy review
+          montage screenshots/overlay_test_*.png \
+            -tile 2x3 -geometry +5+5 \
+            -background '#1a1a1a' -title 'Overlay Visual Tests' \
+            screenshots/montage.png \
+            || echo "Montage creation skipped"
+
+      # Sends the captured screenshots to the validation script and records the
+      # verdict in the `validation_passed` step output:
+      #   true    - script exited 0
+      #   false   - script exited 1
+      #   error   - any other exit code
+      #   skipped - no ANTHROPIC_API_KEY available
+      # The step itself never fails; "Check validation result" decides later.
+      - name: Validate screenshots with Claude
+        id: validate
+        # The `secrets` context cannot be referenced in a step-level `if:`, so
+        # this condition only looks at the trigger. Whether a key is actually
+        # present is checked inside the script via the env var set below.
+        if: ${{ github.event_name == 'pull_request' || (github.event_name == 'workflow_dispatch' && inputs.run_claude_validation == true) }}
+        run: |
+          # Without a key (secret not configured, or not exposed to this run)
+          # report "skipped" instead of calling the API; the notice step that
+          # follows prints the setup instructions.
+          if [ -z "$ANTHROPIC_API_KEY" ]; then
+            echo "validation_passed=skipped" >> "$GITHUB_OUTPUT"
+            exit 0
+          fi
+
+          echo "Running Claude vision validation..."
+
+          # Run validation and capture exit code
+          set +e
+          python scripts/validate_screenshots.py screenshots/ \
+            --output screenshots/validation_report.json
+          VALIDATION_EXIT_CODE=$?
+          set -e
+
+          # Store result for later steps
+          if [ "$VALIDATION_EXIT_CODE" -eq 0 ]; then
+            echo "validation_passed=true" >> "$GITHUB_OUTPUT"
+            echo "✅ All visual validations passed!"
+          elif [ "$VALIDATION_EXIT_CODE" -eq 1 ]; then
+            echo "validation_passed=false" >> "$GITHUB_OUTPUT"
+            echo "❌ Some visual validations failed"
+          else
+            echo "validation_passed=error" >> "$GITHUB_OUTPUT"
+            echo "⚠️ Validation encountered an error"
+          fi
+
+          exit 0  # Don't fail here, we'll check in a later step
+        env:
+          ANTHROPIC_API_KEY: ${{ secrets.ANTHROPIC_API_KEY }}
+
+      # Shown when the validate step was bypassed by its `if:` or bailed out
+      # because no API key was available.
+      - name: Skip validation notice
+        if: ${{ steps.validate.outcome == 'skipped' || steps.validate.outputs.validation_passed == 'skipped' }}
+        run: |
+          echo "⚠️ Claude validation skipped"
+          echo ""
+          echo "To enable automated visual validation:"
+          echo "1. Go to Settings → Secrets and variables → Actions"
+          echo "2. Click 'New repository secret'"
+          echo "3. Name: ANTHROPIC_API_KEY"
+          echo "4. Value: Your Anthropic API key"
+      # Publishes everything under screenshots/ (images, montage, validation
+      # report when present) as a build artifact.
+      - name: Upload screenshots
+        # always(): keep whatever was captured even when an earlier step failed.
+        if: always()
+        uses: actions/upload-artifact@v4
+        with:
+          # Exactly one `name` key: the duplicated entries left behind by the
+          # review suggestion are collapsed to the suggested run-number form.
+          name: overlay-screenshots-${{ github.run_number }}
+          path: screenshots/
+          retention-days: 30
+
+      # Writes the Markdown job summary: capture count, validation outcome (from
+      # screenshots/validation_report.json when it exists) and the scenario
+      # table. Runs on every outcome, so it must not abort on a bad report.
+      - name: Generate summary
+        if: always()
+        run: |
+          # Print one field of the report's "summary" object, or "n/a" when the
+          # report is malformed or the field is missing (instead of failing
+          # this always() step under `set -e`).
+          report_field() {
+            python3 -c "import json, sys; print(json.load(open(sys.argv[1]))['summary'][sys.argv[2]])" \
+              screenshots/validation_report.json "$1" 2>/dev/null || echo "n/a"
+          }
+
+          # Everything inside the braces is appended to the summary file once.
+          {
+            echo "## 🖼️ Visual Test Results"
+            echo ""
+
+            # Screenshot capture results ('0' when the capture step set no output)
+            echo "### 📸 Screenshot Capture"
+            echo "**Screenshots captured:** ${{ steps.capture.outputs.screenshot_count || '0' }}"
+            echo ""
+
+            # Validation results
+            echo "### 🤖 Claude Vision Validation"
+            if [ -f screenshots/validation_report.json ]; then
+              # Parse and display results nicely
+              PASSED=$(report_field passed)
+              FAILED=$(report_field failed)
+              RATE=$(report_field pass_rate)
+
+              if [ "$FAILED" = "0" ]; then
+                echo "✅ **All validations passed!**"
+              elif [ "$FAILED" = "n/a" ]; then
+                echo "⚠️ **Validation report could not be parsed**"
+              else
+                echo "❌ **Some validations failed**"
+              fi
+              echo ""
+              echo "| Metric | Value |"
+              echo "|--------|-------|"
+              echo "| Passed | $PASSED |"
+              echo "| Failed | $FAILED |"
+              echo "| Pass Rate | $RATE |"
+              echo ""
+
+              echo "<details><summary>Full Validation Report</summary>"
+              echo ""
+              echo '```json'
+              cat screenshots/validation_report.json
+              echo '```'
+              echo "</details>"
+            else
+              # No report can mean several things, so do not blame the key alone.
+              echo "⚠️ No validation report found (validation was disabled for this run, ANTHROPIC_API_KEY is not configured, or the validator stopped before writing a report)"
+              echo ""
+              echo "To enable:"
+              echo "1. Go to **Settings → Secrets → Actions**"
+              echo "2. Add secret: \`ANTHROPIC_API_KEY\`"
+            fi
+            echo ""
+
+            # Test scenarios table
+            echo "### 📋 Test Scenarios"
+            echo "| Test | Description |"
+            echo "|------|-------------|"
+            echo "| 01_empty | Empty overlay (no suggestions) |"
+            echo "| 02_suggestions | Demo suggestions displayed |"
+            echo "| 03_single | Single suggestion chip |"
+            echo "| 04_max_three | Maximum 3 suggestions (from 4 input) |"
+            echo "| 05_cleared | Suggestions cleared |"
+            echo ""
+            echo "📦 Download the **overlay-screenshots** artifact to review images manually."
+          } >> "$GITHUB_STEP_SUMMARY"
+
+      # Deferred failure: the validate step always exits 0 and records its
+      # verdict in `validation_passed`; this step fails the job when that
+      # verdict is 'false'.
+      # NOTE(review): an 'error' verdict (validator exit code other than 0 or 1)
+      # does not fail the job here - confirm that leniency is intended.
+      - name: Check validation result
+        if: ${{ steps.validate.outputs.validation_passed == 'false' }}
+        run: |
+          echo "❌ Claude validation found issues with the screenshots"
+          echo "Check the validation report in the artifacts for details"
+          exit 1
+
+  # Run standard overlay unit tests
+  # Independent of the visual-test job (no `needs:`); always uses Python 3.11.
+  overlay-unit-tests:
+    name: Overlay Unit Tests
+    runs-on: ubuntu-latest
+
+    steps:
+      - name: Checkout code
+        uses: actions/checkout@v4
+
+      - name: Set up Python 3.11
+        uses: actions/setup-python@v5
+        with:
+          python-version: '3.11'
+          cache: 'pip'
+
+      # Same library set as the visual-test job minus the screenshot tooling
+      # (x11-utils, libglib2.0-0, scrot, imagemagick).
+      - name: Install system dependencies
+        run: |
+          sudo apt-get update
+          sudo apt-get install -y \
+            libdbus-1-dev \
+            libxcb-cursor0 \
+            libxcb-icccm4 \
+            libxcb-image0 \
+            libxcb-keysyms1 \
+            libxcb-randr0 \
+            libxcb-render-util0 \
+            libxcb-shape0 \
+            libxcb-xinerama0 \
+            libxcb-xfixes0 \
+            libxkbcommon-x11-0 \
+            xvfb \
+            libegl1 \
+            libgl1
+
+      # Explicit dependency list plus a `--no-deps` editable install of the
+      # project, mirroring the visual-test job (without `anthropic`).
+      - name: Install Python dependencies
+        run: |
+          python -m pip install --upgrade pip
+          # Install without dbus extra to avoid build issues
+          pip install pydantic pyyaml PySide6 watchdog
+          pip install pytest pytest-cov pytest-qt ruff mypy types-PyYAML
+          pip install -e . --no-deps
+
+      # Runs the two overlay test modules under a virtual X server.
+      # NOTE(review): `--no-cov` presumably overrides coverage options set in
+      # the project's pytest configuration - confirm.
+      - name: Run overlay tests
+        run: |
+          xvfb-run -a pytest tests/unit/test_overlay.py tests/e2e/test_overlay_signal.py -v --no-cov
+        env:
+          QT_QPA_PLATFORM: xcb
diff --git a/.gitignore b/.gitignore
@@ -62,3 +62,6 @@ config/*.local.yaml
 
 # DBus temp files
 *.pyc
+
+# Screenshots (generated by visual tests)
+screenshots/
diff --git a/README.md b/README.md
@@ -3,6 +3,7 @@
 > Context-aware keyboard shortcut suggestions for KDE Plasma (Wayland)
 
 [![CI](https://github.com/Coldaine/ShortcutSage/actions/workflows/ci.yml/badge.svg)](https://github.com/Coldaine/ShortcutSage/actions/workflows/ci.yml)
+[![Visual Tests](https://github.com/Coldaine/ShortcutSage/actions/workflows/visual-tests.yml/badge.svg)](https://github.com/Coldaine/ShortcutSage/actions/workflows/visual-tests.yml)
 [![Python 3.11+](https://img.shields.io/badge/python-3.11+-blue.svg)](https://www.python.org/downloads/)
 [![Code style: ruff](https://img.shields.io/badge/code%20style-ruff-000000.svg)](https://github.com/astral-sh/ruff)
 
@@ -107,9 +108,48 @@ shortcut-sage overlay --demo
 - Listens for DBus `Suggestions` signals from the daemon; `--demo` fills placeholder data without DBus
 - Honors `Qt.WindowDoesNotAcceptFocus` so it never steals focus while you work
 
+## Automated Visual Testing
+
+The overlay UI is validated using automated screenshot testing with Claude vision:
+
+- **GitHub Actions**: Captures screenshots under xvfb in CI
+- **Claude Vision**: Validates screenshots against specific criteria
+- **5 test scenarios**: Empty, 2 suggestions, single, max 3 (truncation), cleared
+- **Artifacts**: Screenshots available for manual review
+
+See [docs/plans/visual-test-checklist.md](docs/plans/visual-test-checklist.md) for details.
+
 ## Development
 
-### Running Tests
+### Quick Commands (using justfile)
+
+```bash
+# Setup environment
+just setup
+
+# Run all tests
+just test
+
+# Run tests without Qt/DBus (headless CI compatible)
+just test-headless
+
+# Run visual tests (requires graphical environment)
+just test-visual
+
+# Lint and format
+just lint
+just format
+
+# Simulate CI locally
+just ci
+
+# Run daemon/overlay
+just daemon
+just overlay
+just demo
+```
+
+### Running Tests Manually
 
 ```bash
 # All tests with coverage
@@ -123,6 +163,13 @@ pytest tests/integration
 
 # End-to-end tests (requires KDE)
 pytest tests/e2e
+
+# Visual tests (captures screenshots)
+python scripts/visual_test_overlay.py
+
+# Validate screenshots with Claude
+export ANTHROPIC_API_KEY='your-key'
+python scripts/validate_screenshots.py screenshots/
 ```
 
 ### Code Quality