mirror of
https://github.com/Comfy-Org/ComfyUI_frontend.git
synced 2026-04-24 08:19:51 +00:00
Compare commits
7 Commits
test-draft
...
bl-selecti
| Author | SHA1 | Date | |
|---|---|---|---|
|
|
4bdfb57f9b | ||
|
|
ebd20a815e | ||
|
|
9616b91700 | ||
|
|
939d1a0e44 | ||
|
|
df6723415b | ||
|
|
83ff415815 | ||
|
|
87d3111d5c |
22
.github/workflows/ci-tests-e2e.yaml
vendored
22
.github/workflows/ci-tests-e2e.yaml
vendored
@@ -143,7 +143,7 @@ jobs:
|
|||||||
merge-reports:
|
merge-reports:
|
||||||
needs: [playwright-tests-chromium-sharded]
|
needs: [playwright-tests-chromium-sharded]
|
||||||
runs-on: ubuntu-latest
|
runs-on: ubuntu-latest
|
||||||
if: ${{ !cancelled() }}
|
if: ${{ always() && !cancelled() }}
|
||||||
steps:
|
steps:
|
||||||
- name: Checkout repository
|
- name: Checkout repository
|
||||||
uses: actions/checkout@v5
|
uses: actions/checkout@v5
|
||||||
@@ -169,6 +169,26 @@ jobs:
|
|||||||
PLAYWRIGHT_JSON_OUTPUT_NAME=playwright-report/report.json \
|
PLAYWRIGHT_JSON_OUTPUT_NAME=playwright-report/report.json \
|
||||||
pnpm exec playwright merge-reports --reporter=json ./all-blob-reports
|
pnpm exec playwright merge-reports --reporter=json ./all-blob-reports
|
||||||
|
|
||||||
|
- name: Build failed screenshot manifest
|
||||||
|
if: ${{ needs.playwright-tests-chromium-sharded.result == 'failure' }}
|
||||||
|
run: |
|
||||||
|
set -euo pipefail
|
||||||
|
if ! pnpm tsx scripts/cicd/build-failed-screenshot-manifest.ts; then
|
||||||
|
echo "ERROR: Failed to generate screenshot manifest"
|
||||||
|
echo "This may indicate an issue with the Playwright JSON report or the manifest script"
|
||||||
|
exit 1
|
||||||
|
fi
|
||||||
|
working-directory: ComfyUI_frontend
|
||||||
|
|
||||||
|
- name: Upload failed screenshot manifest
|
||||||
|
if: ${{ needs.playwright-tests-chromium-sharded.result == 'failure' }}
|
||||||
|
uses: actions/upload-artifact@v4
|
||||||
|
with:
|
||||||
|
name: failed-screenshot-tests
|
||||||
|
path: ComfyUI_frontend/ci-rerun/*.txt
|
||||||
|
retention-days: 7
|
||||||
|
if-no-files-found: ignore
|
||||||
|
|
||||||
- name: Upload HTML report
|
- name: Upload HTML report
|
||||||
uses: actions/upload-artifact@v4
|
uses: actions/upload-artifact@v4
|
||||||
with:
|
with:
|
||||||
|
|||||||
@@ -1,4 +1,12 @@
|
|||||||
# Setting test expectation screenshots for Playwright
|
# Setting test expectation screenshots for Playwright
|
||||||
|
#
|
||||||
|
# This workflow uses a selective snapshot update strategy:
|
||||||
|
# 1. When tests fail in CI, they generate a manifest of failed test locations (file:line)
|
||||||
|
# 2. This workflow downloads that manifest from the failed test run artifacts
|
||||||
|
# 3. Only the failed tests are re-run with --update-snapshots (much faster than running all tests)
|
||||||
|
# 4. Updated snapshots are committed back to the PR branch
|
||||||
|
#
|
||||||
|
# Trigger: Add label "New Browser Test Expectations" OR comment "/update-playwright" on PR
|
||||||
name: "PR: Update Playwright Expectations"
|
name: "PR: Update Playwright Expectations"
|
||||||
|
|
||||||
on:
|
on:
|
||||||
@@ -16,7 +24,7 @@ jobs:
|
|||||||
runs-on: ubuntu-latest
|
runs-on: ubuntu-latest
|
||||||
if: >
|
if: >
|
||||||
( github.event_name == 'pull_request' && github.event.label.name == 'New Browser Test Expectations' ) ||
|
( github.event_name == 'pull_request' && github.event.label.name == 'New Browser Test Expectations' ) ||
|
||||||
( github.event.issue.pull_request &&
|
( github.event.issue.pull_request &&
|
||||||
github.event_name == 'issue_comment' &&
|
github.event_name == 'issue_comment' &&
|
||||||
(
|
(
|
||||||
github.event.comment.author_association == 'OWNER' ||
|
github.event.comment.author_association == 'OWNER' ||
|
||||||
@@ -55,43 +63,211 @@ jobs:
|
|||||||
uses: actions/checkout@v5
|
uses: actions/checkout@v5
|
||||||
with:
|
with:
|
||||||
ref: ${{ steps.get-branch.outputs.branch }}
|
ref: ${{ steps.get-branch.outputs.branch }}
|
||||||
|
|
||||||
- name: Setup Frontend
|
- name: Setup Frontend
|
||||||
uses: ./.github/actions/setup-frontend
|
uses: ./.github/actions/setup-frontend
|
||||||
with:
|
with:
|
||||||
include_build_step: true
|
include_build_step: true
|
||||||
|
|
||||||
- name: Setup ComfyUI Server
|
- name: Setup ComfyUI Server
|
||||||
uses: ./.github/actions/setup-comfyui-server
|
uses: ./.github/actions/setup-comfyui-server
|
||||||
with:
|
with:
|
||||||
launch_server: true
|
launch_server: true
|
||||||
|
|
||||||
- name: Setup Playwright
|
- name: Setup Playwright
|
||||||
uses: ./.github/actions/setup-playwright
|
uses: ./.github/actions/setup-playwright
|
||||||
- name: Run Playwright tests and update snapshots
|
|
||||||
|
- name: Locate failed screenshot manifest artifact
|
||||||
|
id: locate-manifest
|
||||||
|
uses: actions/github-script@v8
|
||||||
|
with:
|
||||||
|
script: |
|
||||||
|
const { owner, repo } = context.repo
|
||||||
|
let headSha = ''
|
||||||
|
if (context.eventName === 'pull_request') {
|
||||||
|
headSha = context.payload.pull_request.head.sha
|
||||||
|
} else if (context.eventName === 'issue_comment') {
|
||||||
|
const prNumber = context.payload.issue.number
|
||||||
|
const pr = await github.rest.pulls.get({ owner, repo, pull_number: prNumber })
|
||||||
|
headSha = pr.data.head.sha
|
||||||
|
}
|
||||||
|
|
||||||
|
if (!headSha) {
|
||||||
|
core.setOutput('run_id', '')
|
||||||
|
core.setOutput('has_manifest', 'false')
|
||||||
|
return
|
||||||
|
}
|
||||||
|
|
||||||
|
const { data } = await github.rest.actions.listWorkflowRuns({
|
||||||
|
owner,
|
||||||
|
repo,
|
||||||
|
workflow_id: 'tests-ci.yaml',
|
||||||
|
head_sha: headSha,
|
||||||
|
event: 'pull_request',
|
||||||
|
per_page: 1,
|
||||||
|
})
|
||||||
|
const run = data.workflow_runs?.[0]
|
||||||
|
|
||||||
|
let has = 'false'
|
||||||
|
let runId = ''
|
||||||
|
if (run) {
|
||||||
|
runId = String(run.id)
|
||||||
|
const { data: { artifacts = [] } } = await github.rest.actions.listWorkflowRunArtifacts({
|
||||||
|
owner,
|
||||||
|
repo,
|
||||||
|
run_id: run.id,
|
||||||
|
per_page: 100,
|
||||||
|
})
|
||||||
|
if (artifacts.some(a => a.name === 'failed-screenshot-tests' && !a.expired)) has = 'true'
|
||||||
|
}
|
||||||
|
core.setOutput('run_id', runId)
|
||||||
|
core.setOutput('has_manifest', has)
|
||||||
|
|
||||||
|
- name: Download failed screenshot manifest
|
||||||
|
if: steps.locate-manifest.outputs.has_manifest == 'true'
|
||||||
|
uses: actions/download-artifact@v4
|
||||||
|
with:
|
||||||
|
run-id: ${{ steps.locate-manifest.outputs.run_id }}
|
||||||
|
name: failed-screenshot-tests
|
||||||
|
path: ci-rerun
|
||||||
|
|
||||||
|
- name: Re-run failed screenshot tests and update snapshots
|
||||||
id: playwright-tests
|
id: playwright-tests
|
||||||
run: pnpm exec playwright test --update-snapshots
|
|
||||||
continue-on-error: true
|
continue-on-error: true
|
||||||
|
run: |
|
||||||
|
set -euo pipefail
|
||||||
|
|
||||||
|
echo "━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━"
|
||||||
|
echo "Selective Snapshot Update"
|
||||||
|
echo "━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━"
|
||||||
|
echo ""
|
||||||
|
|
||||||
|
# Check if manifest exists
|
||||||
|
if [ ! -d ci-rerun ]; then
|
||||||
|
echo "ERROR: No manifest found in ci-rerun/ directory"
|
||||||
|
echo " This means no failed screenshot tests were detected in the latest CI run."
|
||||||
|
echo " Please ensure tests have been run and failures were recorded."
|
||||||
|
exit 1
|
||||||
|
fi
|
||||||
|
|
||||||
|
shopt -s nullglob
|
||||||
|
files=(ci-rerun/*.txt)
|
||||||
|
|
||||||
|
if [ ${#files[@]} -eq 0 ]; then
|
||||||
|
echo "ERROR: No manifest files found in ci-rerun/"
|
||||||
|
echo " Expected files like: chromium.txt, chromium-2x.txt, mobile-chrome.txt"
|
||||||
|
exit 1
|
||||||
|
fi
|
||||||
|
|
||||||
|
echo "Found ${#files[@]} project manifest(s):"
|
||||||
|
for f in "${files[@]}"; do
|
||||||
|
project="$(basename "$f" .txt)"
|
||||||
|
count=$(grep -c . "$f" 2>/dev/null || echo "0")
|
||||||
|
echo " - $project: $count failed test(s)"
|
||||||
|
done
|
||||||
|
echo ""
|
||||||
|
|
||||||
|
# Re-run tests per project
|
||||||
|
total_tests=0
|
||||||
|
for f in "${files[@]}"; do
|
||||||
|
project="$(basename "$f" .txt)"
|
||||||
|
mapfile -t lines < "$f"
|
||||||
|
filtered=( )
|
||||||
|
|
||||||
|
# Validate and sanitize test paths to prevent command injection
|
||||||
|
for l in "${lines[@]}"; do
|
||||||
|
# Skip empty lines
|
||||||
|
[ -z "$l" ] && continue
|
||||||
|
|
||||||
|
# Validate format: must be browser_tests/...spec.ts:number
|
||||||
|
if [[ "$l" =~ ^browser_tests/.+\.spec\.ts:[0-9]+$ ]]; then
|
||||||
|
filtered+=("$l")
|
||||||
|
else
|
||||||
|
echo "WARNING: Skipping invalid test path: $l"
|
||||||
|
fi
|
||||||
|
done
|
||||||
|
|
||||||
|
if [ ${#filtered[@]} -eq 0 ]; then
|
||||||
|
echo "WARNING: Skipping $project (no valid tests in manifest)"
|
||||||
|
continue
|
||||||
|
fi
|
||||||
|
|
||||||
|
echo "━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━"
|
||||||
|
echo "Updating snapshots for project: $project"
|
||||||
|
echo " Re-running ${#filtered[@]} failed test(s)..."
|
||||||
|
echo "━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━"
|
||||||
|
|
||||||
|
PLAYWRIGHT_JSON_OUTPUT_NAME=playwright-report/report.json \
|
||||||
|
pnpm exec playwright test --project="$project" --update-snapshots \
|
||||||
|
--reporter=line --reporter=html \
|
||||||
|
"${filtered[@]}"
|
||||||
|
|
||||||
|
total_tests=$((total_tests + ${#filtered[@]}))
|
||||||
|
echo ""
|
||||||
|
done
|
||||||
|
|
||||||
|
echo "━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━"
|
||||||
|
echo "Completed snapshot updates for $total_tests test(s)"
|
||||||
|
echo "━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━"
|
||||||
|
|
||||||
- uses: actions/upload-artifact@v4
|
- uses: actions/upload-artifact@v4
|
||||||
if: always()
|
if: always()
|
||||||
with:
|
with:
|
||||||
name: playwright-report
|
name: playwright-report
|
||||||
path: ./playwright-report/
|
path: ./playwright-report/
|
||||||
retention-days: 30
|
retention-days: 30
|
||||||
|
|
||||||
- name: Debugging info
|
- name: Debugging info
|
||||||
run: |
|
run: |
|
||||||
echo "PR: ${{ github.event.issue.number }}"
|
echo "PR: ${{ github.event.issue.number }}"
|
||||||
echo "Branch: ${{ steps.get-branch.outputs.branch }}"
|
echo "Branch: ${{ steps.get-branch.outputs.branch }}"
|
||||||
git status
|
git status
|
||||||
|
|
||||||
- name: Commit updated expectations
|
- name: Commit updated expectations
|
||||||
|
id: commit
|
||||||
run: |
|
run: |
|
||||||
git config --global user.name 'github-actions'
|
git config --global user.name 'github-actions'
|
||||||
git config --global user.email 'github-actions@github.com'
|
git config --global user.email 'github-actions@github.com'
|
||||||
git add browser_tests
|
git add browser_tests
|
||||||
if git diff --cached --quiet; then
|
if git diff --cached --quiet; then
|
||||||
echo "No changes to commit"
|
echo "No expectation updates detected; skipping commit."
|
||||||
|
echo "changed=false" >> $GITHUB_OUTPUT
|
||||||
else
|
else
|
||||||
|
# Count changed snapshots
|
||||||
|
changed_count=$(git diff --cached --name-only browser_tests | wc -l)
|
||||||
|
echo "changed=true" >> $GITHUB_OUTPUT
|
||||||
|
echo "count=$changed_count" >> $GITHUB_OUTPUT
|
||||||
|
|
||||||
git commit -m "[automated] Update test expectations"
|
git commit -m "[automated] Update test expectations"
|
||||||
git push origin ${{ steps.get-branch.outputs.branch }}
|
git push origin ${{ steps.get-branch.outputs.branch }}
|
||||||
fi
|
fi
|
||||||
|
|
||||||
|
- name: Generate workflow summary
|
||||||
|
if: always()
|
||||||
|
run: |
|
||||||
|
echo "## Snapshot Update Summary" >> $GITHUB_STEP_SUMMARY
|
||||||
|
echo "" >> $GITHUB_STEP_SUMMARY
|
||||||
|
|
||||||
|
if [ "${{ steps.commit.outputs.changed }}" = "true" ]; then
|
||||||
|
echo "**${{ steps.commit.outputs.count }} snapshot(s) updated**" >> $GITHUB_STEP_SUMMARY
|
||||||
|
echo "" >> $GITHUB_STEP_SUMMARY
|
||||||
|
echo "<details>" >> $GITHUB_STEP_SUMMARY
|
||||||
|
echo "<summary>View updated files</summary>" >> $GITHUB_STEP_SUMMARY
|
||||||
|
echo "" >> $GITHUB_STEP_SUMMARY
|
||||||
|
echo "\`\`\`" >> $GITHUB_STEP_SUMMARY
|
||||||
|
git diff HEAD~1 --name-only browser_tests 2>/dev/null || echo "No git history available" >> $GITHUB_STEP_SUMMARY
|
||||||
|
echo "\`\`\`" >> $GITHUB_STEP_SUMMARY
|
||||||
|
echo "</details>" >> $GITHUB_STEP_SUMMARY
|
||||||
|
elif [ "${{ steps.commit.outputs.changed }}" = "false" ]; then
|
||||||
|
echo "No snapshot changes detected" >> $GITHUB_STEP_SUMMARY
|
||||||
|
else
|
||||||
|
echo "WARNING: Snapshot update may have failed - check logs above" >> $GITHUB_STEP_SUMMARY
|
||||||
|
fi
|
||||||
|
echo "" >> $GITHUB_STEP_SUMMARY
|
||||||
|
echo "---" >> $GITHUB_STEP_SUMMARY
|
||||||
|
echo "" >> $GITHUB_STEP_SUMMARY
|
||||||
|
echo "**Strategy:** Selective snapshot update (only failed tests re-run)" >> $GITHUB_STEP_SUMMARY
|
||||||
|
|
||||||
- name: Add Done Reaction
|
- name: Add Done Reaction
|
||||||
uses: peter-evans/create-or-update-comment@e8674b075228eee787fea43ef493e45ece1004c9
|
uses: peter-evans/create-or-update-comment@e8674b075228eee787fea43ef493e45ece1004c9
|
||||||
if: github.event_name == 'issue_comment'
|
if: github.event_name == 'issue_comment'
|
||||||
|
|||||||
755
docs/PLAYWRIGHT_SELECTIVE_RERUN_ALTERNATIVES.md
Normal file
755
docs/PLAYWRIGHT_SELECTIVE_RERUN_ALTERNATIVES.md
Normal file
@@ -0,0 +1,755 @@
|
|||||||
|
# Playwright Selective Test Rerun Alternatives
|
||||||
|
|
||||||
|
This document analyzes alternatives for selectively re-running only failed Playwright tests for snapshot updates, comparing native Playwright features with the current custom manifest approach used in this project.
|
||||||
|
|
||||||
|
## Table of Contents
|
||||||
|
- [Current Approach](#current-approach)
|
||||||
|
- [Native Playwright Features](#native-playwright-features)
|
||||||
|
- [Playwright Reporter Options](#playwright-reporter-options)
|
||||||
|
- [GitHub Actions Integration Patterns](#github-actions-integration-patterns)
|
||||||
|
- [Third-Party Solutions](#third-party-solutions)
|
||||||
|
- [Comparison and Recommendations](#comparison-and-recommendations)
|
||||||
|
|
||||||
|
---
|
||||||
|
|
||||||
|
## Current Approach
|
||||||
|
|
||||||
|
### Implementation
|
||||||
|
The project currently uses a **custom manifest-based approach** that:
|
||||||
|
|
||||||
|
1. **Generates a manifest** of failed screenshot tests after CI runs
|
||||||
|
- Script: `scripts/cicd/build-failed-screenshot-manifest.ts`
|
||||||
|
- Parses JSON report to find tests with failed screenshot assertions
|
||||||
|
- Creates per-project text files: `ci-rerun/{project}.txt`
|
||||||
|
- Format: `file_path:line_number` (e.g., `browser_tests/menu.test.ts:42`)
|
||||||
|
|
||||||
|
2. **Stores manifest as GitHub artifact**
|
||||||
|
- Artifact name: `failed-screenshot-tests`
|
||||||
|
- Retention: 7 days
|
||||||
|
- Only uploaded when chromium sharded tests fail
|
||||||
|
|
||||||
|
3. **Downloads manifest in update workflow**
|
||||||
|
- Workflow: `.github/workflows/update-playwright-expectations.yaml`
|
||||||
|
- Triggered by: PR label "New Browser Test Expectations" or `/update-playwright` comment
|
||||||
|
- Falls back to full test suite if manifest not found
|
||||||
|
|
||||||
|
4. **Re-runs only failed tests**
|
||||||
|
```bash
|
||||||
|
for f in ci-rerun/*.txt; do
|
||||||
|
project="$(basename "$f" .txt)"
|
||||||
|
mapfile -t lines < "$f"
|
||||||
|
# Filter empty lines
|
||||||
|
pnpm exec playwright test --project="$project" --update-snapshots "${filtered[@]}"
|
||||||
|
done
|
||||||
|
```
|
||||||
|
|
||||||
|
### Advantages
|
||||||
|
- ✅ Works across workflow runs and different trigger mechanisms
|
||||||
|
- ✅ Survives beyond single workflow execution
|
||||||
|
- ✅ Precise control over which tests to re-run
|
||||||
|
- ✅ Supports multiple projects with separate manifests
|
||||||
|
- ✅ Works with sharded test runs (merged report)
|
||||||
|
- ✅ Platform-agnostic approach (works on any CI/CD platform)
|
||||||
|
|
||||||
|
### Disadvantages
|
||||||
|
- ❌ Custom implementation requires maintenance
|
||||||
|
- ❌ Requires parsing JSON report format (could break with Playwright updates)
|
||||||
|
- ❌ Additional artifact storage needed
|
||||||
|
- ❌ More complex than native solutions
|
||||||
|
|
||||||
|
---
|
||||||
|
|
||||||
|
## Native Playwright Features
|
||||||
|
|
||||||
|
### 1. `--last-failed` CLI Flag
|
||||||
|
|
||||||
|
**Availability:** Playwright v1.44.0+ (May 2024)
|
||||||
|
|
||||||
|
#### How It Works
|
||||||
|
```bash
|
||||||
|
# First run - execute all tests
|
||||||
|
npx playwright test
|
||||||
|
|
||||||
|
# Second run - only re-run failed tests
|
||||||
|
npx playwright test --last-failed
|
||||||
|
```
|
||||||
|
|
||||||
|
Playwright maintains a `.last-run.json` file in the `test-results/` directory that tracks failed tests.
|
||||||
|
|
||||||
|
#### CLI Examples
|
||||||
|
```bash
|
||||||
|
# Run only failed tests from last run
|
||||||
|
npx playwright test --last-failed
|
||||||
|
|
||||||
|
# Update snapshots for only failed tests
|
||||||
|
npx playwright test --last-failed --update-snapshots
|
||||||
|
|
||||||
|
# Combine with project filtering
|
||||||
|
npx playwright test --last-failed --project=chromium
|
||||||
|
|
||||||
|
# Debug failed tests
|
||||||
|
npx playwright test --last-failed --debug
|
||||||
|
```
|
||||||
|
|
||||||
|
#### File Location and Format
|
||||||
|
- **Location:** `test-results/.last-run.json`
|
||||||
|
- **Format:** JSON object containing failed test information
|
||||||
|
- **Structure:** Contains a `failedTests: []` array with test identifiers
|
||||||
|
- **Persistence:** Cleared when all tests pass on subsequent run
|
||||||
|
|
||||||
|
#### Advantages
|
||||||
|
- ✅ Built into Playwright (no custom code)
|
||||||
|
- ✅ Simple CLI flag
|
||||||
|
- ✅ Automatically maintained by Playwright
|
||||||
|
- ✅ Works with all Playwright features (debug, UI mode, etc.)
|
||||||
|
|
||||||
|
#### Limitations
|
||||||
|
- ❌ **Not designed for CI/CD distributed testing** (per Playwright maintainers)
|
||||||
|
- ❌ **Intended for local development only** ("inner loop scenario")
|
||||||
|
- ❌ Cleared on new test runs (doesn't persist across clean environments)
|
||||||
|
- ❌ **GitHub Actions starts with clean environment** - `.last-run.json` not available on retry
|
||||||
|
- ❌ **Doesn't work with sharded tests** - each shard creates its own `.last-run.json`
|
||||||
|
- ❌ No native way to merge `.last-run.json` across shards
|
||||||
|
- ❌ Not designed for cross-workflow persistence
|
||||||
|
|
||||||
|
#### CI/CD Workaround (Not Recommended)
|
||||||
|
To use `--last-failed` in GitHub Actions, you would need to:
|
||||||
|
|
||||||
|
```yaml
|
||||||
|
- name: Run Playwright tests
|
||||||
|
id: playwright-test
|
||||||
|
run: npx playwright test
|
||||||
|
|
||||||
|
- name: Upload last run state
|
||||||
|
if: failure()
|
||||||
|
uses: actions/upload-artifact@v4
|
||||||
|
with:
|
||||||
|
name: last-run-state
|
||||||
|
path: test-results/.last-run.json
|
||||||
|
|
||||||
|
# In retry workflow:
|
||||||
|
- name: Download last run state
|
||||||
|
uses: actions/download-artifact@v4
|
||||||
|
with:
|
||||||
|
name: last-run-state
|
||||||
|
path: test-results/
|
||||||
|
|
||||||
|
- name: Rerun failed tests
|
||||||
|
run: npx playwright test --last-failed --update-snapshots
|
||||||
|
```
|
||||||
|
|
||||||
|
**Why This Isn't Ideal:**
|
||||||
|
- Playwright maintainers explicitly state this is not the intended use case
|
||||||
|
- Doesn't work well with sharded tests (multiple `.last-run.json` files)
|
||||||
|
- Requires manual artifact management
|
||||||
|
- More complex than the current custom approach for this use case
|
||||||
|
|
||||||
|
### 2. File:Line Syntax for Specific Tests
|
||||||
|
|
||||||
|
Playwright supports running tests at specific line numbers:
|
||||||
|
|
||||||
|
```bash
|
||||||
|
# Run a specific test at line 42
|
||||||
|
npx playwright test tests/example.spec.ts:42
|
||||||
|
|
||||||
|
# Multiple tests
|
||||||
|
npx playwright test tests/file1.spec.ts:10 tests/file2.spec.ts:25
|
||||||
|
|
||||||
|
# With snapshot updates
|
||||||
|
npx playwright test tests/example.spec.ts:42 --update-snapshots
|
||||||
|
|
||||||
|
# With project selection
|
||||||
|
npx playwright test --project=chromium tests/example.spec.ts:42
|
||||||
|
```
|
||||||
|
|
||||||
|
This is **exactly the format** the current custom manifest uses, making it compatible with Playwright's native CLI.
|
||||||
|
|
||||||
|
### 3. Test Filtering Options
|
||||||
|
|
||||||
|
```bash
|
||||||
|
# Filter by grep pattern
|
||||||
|
npx playwright test -g "screenshot"
|
||||||
|
|
||||||
|
# Inverse grep
|
||||||
|
npx playwright test --grep-invert "mobile"
|
||||||
|
|
||||||
|
# By project
|
||||||
|
npx playwright test --project=chromium
|
||||||
|
|
||||||
|
# Multiple projects
|
||||||
|
npx playwright test --project=chromium --project=firefox
|
||||||
|
|
||||||
|
# Specific directory
|
||||||
|
npx playwright test tests/screenshots/
|
||||||
|
```
|
||||||
|
|
||||||
|
---
|
||||||
|
|
||||||
|
## Playwright Reporter Options
|
||||||
|
|
||||||
|
### 1. JSON Reporter
|
||||||
|
|
||||||
|
**Purpose:** Machine-readable test results
|
||||||
|
|
||||||
|
#### Configuration
|
||||||
|
```typescript
|
||||||
|
// playwright.config.ts
|
||||||
|
export default defineConfig({
|
||||||
|
reporter: [
|
||||||
|
['json', { outputFile: 'results.json' }]
|
||||||
|
]
|
||||||
|
})
|
||||||
|
```
|
||||||
|
|
||||||
|
Or via environment variable:
|
||||||
|
```bash
|
||||||
|
PLAYWRIGHT_JSON_OUTPUT_NAME=results.json npx playwright test --reporter=json
|
||||||
|
```
|
||||||
|
|
||||||
|
#### Output Structure
|
||||||
|
```json
|
||||||
|
{
|
||||||
|
"stats": {
|
||||||
|
"expected": 100,
|
||||||
|
"unexpected": 5,
|
||||||
|
"flaky": 2,
|
||||||
|
"skipped": 3
|
||||||
|
},
|
||||||
|
"suites": [
|
||||||
|
{
|
||||||
|
"title": "Test Suite",
|
||||||
|
"specs": [
|
||||||
|
{
|
||||||
|
"file": "browser_tests/example.test.ts",
|
||||||
|
"line": 42,
|
||||||
|
"tests": [
|
||||||
|
{
|
||||||
|
"projectId": "chromium",
|
||||||
|
"results": [
|
||||||
|
{
|
||||||
|
"status": "failed",
|
||||||
|
"attachments": [
|
||||||
|
{ "contentType": "image/png" }
|
||||||
|
]
|
||||||
|
}
|
||||||
|
]
|
||||||
|
}
|
||||||
|
]
|
||||||
|
}
|
||||||
|
]
|
||||||
|
}
|
||||||
|
]
|
||||||
|
}
|
||||||
|
```
|
||||||
|
|
||||||
|
**This is the format** the current `build-failed-screenshot-manifest.ts` script parses.
|
||||||
|
|
||||||
|
#### Advantages
|
||||||
|
- ✅ Stable, documented JSON schema (`@playwright/test/reporter`)
|
||||||
|
- ✅ Includes all test metadata (file, line, project, status, attachments)
|
||||||
|
- ✅ Can be used programmatically
|
||||||
|
- ✅ Supports multiple reporters simultaneously
|
||||||
|
|
||||||
|
#### Current Project Usage
|
||||||
|
```yaml
|
||||||
|
# In tests-ci.yaml
|
||||||
|
PLAYWRIGHT_JSON_OUTPUT_NAME=playwright-report/report.json \
|
||||||
|
pnpm exec playwright test --project=${{ matrix.browser }} \
|
||||||
|
--reporter=list \
|
||||||
|
--reporter=html \
|
||||||
|
--reporter=json
|
||||||
|
```
|
||||||
|
|
||||||
|
### 2. Blob Reporter
|
||||||
|
|
||||||
|
**Purpose:** Merging sharded test reports
|
||||||
|
|
||||||
|
#### Configuration
|
||||||
|
```typescript
|
||||||
|
// playwright.config.ts
|
||||||
|
export default defineConfig({
|
||||||
|
reporter: process.env.CI ? 'blob' : 'html'
|
||||||
|
})
|
||||||
|
```
|
||||||
|
|
||||||
|
#### Usage with Sharding
|
||||||
|
```bash
|
||||||
|
# Run sharded test with blob output
|
||||||
|
npx playwright test --shard=1/4 --reporter=blob
|
||||||
|
|
||||||
|
# Merge blob reports
|
||||||
|
npx playwright merge-reports --reporter=html ./all-blob-reports
|
||||||
|
npx playwright merge-reports --reporter=json ./all-blob-reports
|
||||||
|
```
|
||||||
|
|
||||||
|
#### Current Project Usage
|
||||||
|
```yaml
|
||||||
|
# Sharded chromium tests
|
||||||
|
- run: pnpm exec playwright test --project=chromium --shard=${{ matrix.shardIndex }}/${{ matrix.shardTotal }} --reporter=blob
|
||||||
|
env:
|
||||||
|
PLAYWRIGHT_BLOB_OUTPUT_DIR: ../blob-report
|
||||||
|
|
||||||
|
# Merge reports job
|
||||||
|
- run: |
|
||||||
|
pnpm exec playwright merge-reports --reporter=html ./all-blob-reports
|
||||||
|
PLAYWRIGHT_JSON_OUTPUT_NAME=playwright-report/report.json \
|
||||||
|
pnpm exec playwright merge-reports --reporter=json ./all-blob-reports
|
||||||
|
```
|
||||||
|
|
||||||
|
#### Advantages
|
||||||
|
- ✅ Designed for distributed testing
|
||||||
|
- ✅ Can merge into any reporter format (HTML, JSON, etc.)
|
||||||
|
- ✅ Preserves all test information across shards
|
||||||
|
|
||||||
|
#### Blob Reporter and `--last-failed`
|
||||||
|
- ❌ Blob reports **do not contain** a merged `.last-run.json`
|
||||||
|
- ❌ Each shard creates its own `.last-run.json` that isn't included in blob
|
||||||
|
- ❌ GitHub issue [#30924](https://github.com/microsoft/playwright/issues/30924) requests this feature (currently unsupported)
|
||||||
|
|
||||||
|
### 3. Multiple Reporters
|
||||||
|
|
||||||
|
You can use multiple reporters simultaneously:
|
||||||
|
|
||||||
|
```typescript
|
||||||
|
export default defineConfig({
|
||||||
|
reporter: [
|
||||||
|
['list'], // Terminal output
|
||||||
|
['html'], // Browse results
|
||||||
|
['json', { outputFile: 'results.json' }], // Programmatic parsing
|
||||||
|
['junit', { outputFile: 'results.xml' }] // CI integration
|
||||||
|
]
|
||||||
|
})
|
||||||
|
```
|
||||||
|
|
||||||
|
Or via CLI:
|
||||||
|
```bash
|
||||||
|
npx playwright test --reporter=list --reporter=html --reporter=json
|
||||||
|
```
|
||||||
|
|
||||||
|
---
|
||||||
|
|
||||||
|
## GitHub Actions Integration Patterns
|
||||||
|
|
||||||
|
### Pattern 1: Comment-Triggered Workflow (JupyterLab Approach)
|
||||||
|
|
||||||
|
**Example:** [jupyterlab/jupyterlab-git](https://github.com/jupyterlab/jupyterlab-git/blob/main/.github/workflows/update-integration-tests.yml)
|
||||||
|
|
||||||
|
```yaml
|
||||||
|
name: Update Playwright Snapshots
|
||||||
|
|
||||||
|
on:
|
||||||
|
issue_comment:
|
||||||
|
types: [created, edited]
|
||||||
|
|
||||||
|
permissions:
|
||||||
|
contents: write
|
||||||
|
pull-requests: write
|
||||||
|
|
||||||
|
jobs:
|
||||||
|
update-snapshots:
|
||||||
|
# Only run for authorized users on PRs with specific comment
|
||||||
|
if: >
|
||||||
|
(github.event.issue.author_association == 'OWNER' ||
|
||||||
|
github.event.issue.author_association == 'COLLABORATOR' ||
|
||||||
|
github.event.issue.author_association == 'MEMBER'
|
||||||
|
) && github.event.issue.pull_request &&
|
||||||
|
contains(github.event.comment.body, 'please update snapshots')
|
||||||
|
runs-on: ubuntu-latest
|
||||||
|
|
||||||
|
steps:
|
||||||
|
- name: React to the triggering comment
|
||||||
|
run: gh api repos/${{ github.repository }}/issues/comments/${{ github.event.comment.id }}/reactions --raw-field 'content=+1'
|
||||||
|
env:
|
||||||
|
GITHUB_TOKEN: ${{ secrets.GITHUB_TOKEN }}
|
||||||
|
|
||||||
|
- name: Checkout
|
||||||
|
uses: actions/checkout@v4
|
||||||
|
with:
|
||||||
|
token: ${{ secrets.GITHUB_TOKEN }}
|
||||||
|
|
||||||
|
- name: Checkout PR branch
|
||||||
|
run: gh pr checkout ${{ github.event.issue.number }}
|
||||||
|
env:
|
||||||
|
GH_TOKEN: ${{ secrets.GITHUB_TOKEN }}
|
||||||
|
|
||||||
|
- name: Setup and run tests
|
||||||
|
run: |
|
||||||
|
npm ci
|
||||||
|
npx playwright install --with-deps
|
||||||
|
npx playwright test --update-snapshots
|
||||||
|
|
||||||
|
- name: Commit and push
|
||||||
|
run: |
|
||||||
|
git config user.name 'github-actions'
|
||||||
|
git config user.email 'github-actions@github.com'
|
||||||
|
git add .
|
||||||
|
git diff --cached --quiet || git commit -m "Update snapshots"
|
||||||
|
git push
|
||||||
|
```
|
||||||
|
|
||||||
|
#### Advantages
|
||||||
|
- ✅ Simple comment-based trigger
|
||||||
|
- ✅ Visual feedback (reaction on comment)
|
||||||
|
- ✅ Authorization checks built-in
|
||||||
|
- ✅ Auto-commits to PR branch
|
||||||
|
|
||||||
|
#### Limitations
|
||||||
|
- ❌ Runs **all** tests with `--update-snapshots` (not selective)
|
||||||
|
- ❌ No integration with failed test information from CI
|
||||||
|
|
||||||
|
### Pattern 2: Label-Based Trigger + Manifest (Current Approach)
|
||||||
|
|
||||||
|
```yaml
|
||||||
|
name: Update Playwright Expectations
|
||||||
|
|
||||||
|
on:
|
||||||
|
pull_request:
|
||||||
|
types: [labeled]
|
||||||
|
issue_comment:
|
||||||
|
types: [created]
|
||||||
|
|
||||||
|
jobs:
|
||||||
|
test:
|
||||||
|
if: >
|
||||||
|
( github.event_name == 'pull_request' &&
|
||||||
|
github.event.label.name == 'New Browser Test Expectations' ) ||
|
||||||
|
( github.event.issue.pull_request &&
|
||||||
|
startsWith(github.event.comment.body, '/update-playwright') )
|
||||||
|
|
||||||
|
steps:
|
||||||
|
# ... setup steps ...
|
||||||
|
|
||||||
|
- name: Locate failed screenshot manifest artifact
|
||||||
|
id: locate-manifest
|
||||||
|
uses: actions/github-script@v8
|
||||||
|
with:
|
||||||
|
script: |
|
||||||
|
const { owner, repo } = context.repo
|
||||||
|
let headSha = ''
|
||||||
|
if (context.eventName === 'pull_request') {
|
||||||
|
headSha = context.payload.pull_request.head.sha
|
||||||
|
} else if (context.eventName === 'issue_comment') {
|
||||||
|
const prNumber = context.payload.issue.number
|
||||||
|
const pr = await github.rest.pulls.get({ owner, repo, pull_number: prNumber })
|
||||||
|
headSha = pr.data.head.sha
|
||||||
|
}
|
||||||
|
|
||||||
|
const { data } = await github.rest.actions.listWorkflowRuns({
|
||||||
|
owner, repo,
|
||||||
|
workflow_id: 'tests-ci.yaml',
|
||||||
|
head_sha: headSha,
|
||||||
|
per_page: 1,
|
||||||
|
})
|
||||||
|
const run = data.workflow_runs?.[0]
|
||||||
|
|
||||||
|
let has = 'false'
|
||||||
|
if (run) {
|
||||||
|
const { data: { artifacts = [] } } = await github.rest.actions.listWorkflowRunArtifacts({
|
||||||
|
owner, repo, run_id: run.id
|
||||||
|
})
|
||||||
|
if (artifacts.some(a => a.name === 'failed-screenshot-tests' && !a.expired))
|
||||||
|
has = 'true'
|
||||||
|
}
|
||||||
|
core.setOutput('has_manifest', has)
|
||||||
|
|
||||||
|
- name: Download failed screenshot manifest
|
||||||
|
if: steps.locate-manifest.outputs.has_manifest == 'true'
|
||||||
|
uses: actions/download-artifact@v4
|
||||||
|
with:
|
||||||
|
run-id: ${{ steps.locate-manifest.outputs.run_id }}
|
||||||
|
name: failed-screenshot-tests
|
||||||
|
path: ComfyUI_frontend/ci-rerun
|
||||||
|
|
||||||
|
- name: Re-run failed screenshot tests
|
||||||
|
run: |
|
||||||
|
if [ ! -d ci-rerun ]; then
|
||||||
|
echo "No manifest found; running full suite"
|
||||||
|
pnpm exec playwright test --update-snapshots
|
||||||
|
exit 0
|
||||||
|
fi
|
||||||
|
|
||||||
|
for f in ci-rerun/*.txt; do
|
||||||
|
project="$(basename "$f" .txt)"
|
||||||
|
mapfile -t lines < "$f"
|
||||||
|
filtered=()
|
||||||
|
for l in "${lines[@]}"; do
|
||||||
|
[ -n "$l" ] && filtered+=("$l")
|
||||||
|
done
|
||||||
|
|
||||||
|
if [ ${#filtered[@]} -gt 0 ]; then
|
||||||
|
echo "Re-running ${#filtered[@]} tests for project $project"
|
||||||
|
pnpm exec playwright test --project="$project" --update-snapshots "${filtered[@]}"
|
||||||
|
fi
|
||||||
|
done
|
||||||
|
```
|
||||||
|
|
||||||
|
#### Advantages
|
||||||
|
- ✅ **Selective** - only re-runs failed screenshot tests
|
||||||
|
- ✅ Works across different trigger mechanisms (label or comment)
|
||||||
|
- ✅ Fallback to full suite if manifest not found
|
||||||
|
- ✅ Per-project manifests support multiple browser configurations
|
||||||
|
- ✅ Handles sharded tests via merged report
|
||||||
|
|
||||||
|
### Pattern 3: WordPress/Openverse Approach (Always Update)
|
||||||
|
|
||||||
|
Proposed pattern (not fully implemented):
|
||||||
|
1. CI always runs with `--update-snapshots` flag
|
||||||
|
2. If snapshots change, create/update a secondary branch
|
||||||
|
3. Open PR targeting the original PR branch
|
||||||
|
4. Developer reviews snapshot changes before merging
|
||||||
|
|
||||||
|
#### Advantages
|
||||||
|
- ✅ Always generates correct snapshots
|
||||||
|
- ✅ Snapshot changes are visible in separate PR
|
||||||
|
- ✅ No test failures due to mismatched snapshots
|
||||||
|
|
||||||
|
#### Limitations
|
||||||
|
- ❌ Creates multiple PRs
|
||||||
|
- ❌ More complex merge workflow
|
||||||
|
- ❌ Potential for snapshot changes to mask real issues
|
||||||
|
|
||||||
|
### Pattern 4: Manual Workflow Dispatch
|
||||||
|
|
||||||
|
```yaml
|
||||||
|
name: Update Snapshots
|
||||||
|
|
||||||
|
on:
|
||||||
|
workflow_dispatch:
|
||||||
|
inputs:
|
||||||
|
update-snapshots:
|
||||||
|
description: 'Update snapshots'
|
||||||
|
type: boolean
|
||||||
|
default: false
|
||||||
|
test-pattern:
|
||||||
|
description: 'Test pattern (optional)'
|
||||||
|
type: string
|
||||||
|
required: false
|
||||||
|
|
||||||
|
jobs:
|
||||||
|
test:
|
||||||
|
runs-on: ubuntu-latest
|
||||||
|
steps:
|
||||||
|
- uses: actions/checkout@v4
|
||||||
|
|
||||||
|
- name: Setup
|
||||||
|
run: |
|
||||||
|
npm ci
|
||||||
|
npx playwright install --with-deps
|
||||||
|
|
||||||
|
- name: Run tests
|
||||||
|
run: |
|
||||||
|
if [ "${{ inputs.update-snapshots }}" = "true" ]; then
|
||||||
|
FLAGS="--update-snapshots"
|
||||||
|
fi
|
||||||
|
|
||||||
|
PATTERN="${{ inputs.test-pattern }}"
|
||||||
|
npx playwright test ${PATTERN} ${FLAGS}
|
||||||
|
```
|
||||||
|
|
||||||
|
#### Advantages
|
||||||
|
- ✅ Full manual control
|
||||||
|
- ✅ Can specify test patterns
|
||||||
|
- ✅ Simple to understand
|
||||||
|
|
||||||
|
#### Limitations
|
||||||
|
- ❌ Requires manual triggering
|
||||||
|
- ❌ Not integrated with CI failures
|
||||||
|
|
||||||
|
---
|
||||||
|
|
||||||
|
## Third-Party Solutions
|
||||||
|
|
||||||
|
### Currents.dev - Last Failed GitHub Action
|
||||||
|
|
||||||
|
**Repository:** [currents-dev/playwright-last-failed](https://github.com/currents-dev/playwright-last-failed)
|
||||||
|
|
||||||
|
#### Purpose
|
||||||
|
Helps run last failed Playwright tests using Currents' cloud-based caching service.
|
||||||
|
|
||||||
|
#### Usage
|
||||||
|
```yaml
|
||||||
|
- name: Playwright Last Failed action
|
||||||
|
id: last-failed-action
|
||||||
|
uses: currents-dev/playwright-last-failed@v1
|
||||||
|
with:
|
||||||
|
pw-output-dir: test-results
|
||||||
|
matrix-index: ${{ matrix.shard }}
|
||||||
|
matrix-total: ${{ strategy.job-total }}
|
||||||
|
```
|
||||||
|
|
||||||
|
#### How It Works
|
||||||
|
- Uses Currents' cloud service to persist failed test information
|
||||||
|
- Supports sharded tests via matrix parameters
|
||||||
|
- Enables selective rerun of failed tests across workflow retries
|
||||||
|
|
||||||
|
#### Advantages
|
||||||
|
- ✅ Works with sharded tests
|
||||||
|
- ✅ Persists across workflow runs
|
||||||
|
- ✅ Supports GitHub Actions retry mechanism
|
||||||
|
- ✅ Handles distributed testing
|
||||||
|
|
||||||
|
#### Limitations
|
||||||
|
- ❌ **Requires Currents subscription** (third-party paid service)
|
||||||
|
- ❌ Dependency on external service
|
||||||
|
- ❌ Data sent to third-party cloud
|
||||||
|
- ❌ Additional cost
|
||||||
|
- ❌ Vendor lock-in
|
||||||
|
|
||||||
|
#### Recommendation
|
||||||
|
**Not suitable for this project** due to:
|
||||||
|
- External service dependency
|
||||||
|
- Cost implications
|
||||||
|
- The current custom solution is already working well
|
||||||
|
|
||||||
|
---
|
||||||
|
|
||||||
|
## Comparison and Recommendations
|
||||||
|
|
||||||
|
### Feature Matrix
|
||||||
|
|
||||||
|
| Feature | Current Approach | `--last-failed` | Currents | Comment Trigger Only |
|
||||||
|
|---------|-----------------|-----------------|----------|---------------------|
|
||||||
|
| Works with sharded tests | ✅ Yes | ❌ No | ✅ Yes | ✅ Yes |
|
||||||
|
| Persists across workflows | ✅ Yes | ❌ No | ✅ Yes | N/A |
|
||||||
|
| Selective reruns | ✅ Yes | ✅ Yes | ✅ Yes | ❌ No (runs all) |
|
||||||
|
| No external dependencies | ✅ Yes | ✅ Yes | ❌ No | ✅ Yes |
|
||||||
|
| Simple implementation | ⚠️ Medium | ✅ Simple | ✅ Simple | ✅ Simple |
|
||||||
|
| Maintenance overhead | ⚠️ Medium | ✅ Low | ✅ Low | ✅ Low |
|
||||||
|
| Works in CI/CD | ✅ Yes | ⚠️ Workaround | ✅ Yes | ✅ Yes |
|
||||||
|
| Cost | ✅ Free | ✅ Free | ❌ Paid | ✅ Free |
|
||||||
|
| Supports multiple projects | ✅ Yes | ✅ Yes | ✅ Yes | ✅ Yes |
|
||||||
|
|
||||||
|
### Why `--last-failed` Isn't Suitable (Currently)
|
||||||
|
|
||||||
|
1. **Not designed for CI/CD:** Playwright maintainers explicitly state it's for "inner loop scenario (local development)"
|
||||||
|
2. **Doesn't work with sharded tests:** Each shard creates its own `.last-run.json` with no native merge
|
||||||
|
3. **Clean environment issue:** GitHub Actions starts fresh, losing `.last-run.json`
|
||||||
|
4. **Feature request pending:** GitHub issue [#30924](https://github.com/microsoft/playwright/issues/30924) requests blob report integration (not yet implemented)
|
||||||
|
|
||||||
|
### Recommendations
|
||||||
|
|
||||||
|
#### Short Term: Keep Current Approach
|
||||||
|
**Verdict: The current custom manifest approach is the best solution for this project's needs.**
|
||||||
|
|
||||||
|
**Reasons:**
|
||||||
|
1. ✅ **Works perfectly with sharded tests** - merges results across 8 shards
|
||||||
|
2. ✅ **Persists across workflows** - artifact storage for 7 days
|
||||||
|
3. ✅ **Selective reruns** - only failed screenshot tests
|
||||||
|
4. ✅ **No external dependencies** - fully self-contained
|
||||||
|
5. ✅ **Uses stable Playwright JSON format** - typed via `@playwright/test/reporter`
|
||||||
|
6. ✅ **Already working well** - proven in production
|
||||||
|
|
||||||
|
**Minor Improvements:**
|
||||||
|
```typescript
|
||||||
|
// Add version check to warn if JSON schema changes
|
||||||
|
import { version } from '@playwright/test/package.json'
|
||||||
|
if (major(version) !== 1) {
|
||||||
|
console.warn('Playwright major version changed - verify JSON schema compatibility')
|
||||||
|
}
|
||||||
|
|
||||||
|
// Add more robust error handling
|
||||||
|
try {
|
||||||
|
const report: JSONReport = JSON.parse(raw)
|
||||||
|
} catch (error) {
|
||||||
|
throw new Error(`Failed to parse Playwright JSON report: ${error.message}`)
|
||||||
|
}
|
||||||
|
|
||||||
|
// Consider adding tests for the manifest builder
|
||||||
|
// e.g., tests/cicd/build-failed-screenshot-manifest.test.ts
|
||||||
|
```
|
||||||
|
|
||||||
|
#### Long Term: Monitor Playwright Development
|
||||||
|
|
||||||
|
**Watch for these features:**
|
||||||
|
1. **Blob report + `.last-run.json` merge** - GitHub issue [#30924](https://github.com/microsoft/playwright/issues/30924)
|
||||||
|
2. **Native CI/CD support for `--last-failed`** - may never happen (by design)
|
||||||
|
3. **Report merging improvements** - GitHub issue [#33094](https://github.com/microsoft/playwright/issues/33094)
|
||||||
|
|
||||||
|
**Migration path if native support improves:**
|
||||||
|
```yaml
|
||||||
|
# Future potential approach (if Playwright adds this feature)
|
||||||
|
- name: Merge reports with last-run
|
||||||
|
run: |
|
||||||
|
npx playwright merge-reports --reporter=html ./all-blob-reports
|
||||||
|
npx playwright merge-reports --reporter=last-failed ./all-blob-reports
|
||||||
|
|
||||||
|
- name: Upload merged last-run
|
||||||
|
uses: actions/upload-artifact@v4
|
||||||
|
with:
|
||||||
|
name: last-run-state
|
||||||
|
path: test-results/.last-run.json
|
||||||
|
|
||||||
|
# In update workflow
|
||||||
|
- name: Download last-run state
|
||||||
|
uses: actions/download-artifact@v4
|
||||||
|
with:
|
||||||
|
name: last-run-state
|
||||||
|
path: test-results/
|
||||||
|
|
||||||
|
- name: Update snapshots for failed tests
|
||||||
|
run: npx playwright test --last-failed --update-snapshots
|
||||||
|
```
|
||||||
|
|
||||||
|
**However, this is speculative** - Playwright maintainers have indicated `--last-failed` is not intended for CI/CD.
|
||||||
|
|
||||||
|
#### Alternative: Simplify to Full Suite Reruns
|
||||||
|
|
||||||
|
If the custom manifest becomes too complex to maintain, consider:
|
||||||
|
|
||||||
|
```yaml
|
||||||
|
- name: Re-run ALL screenshot tests
|
||||||
|
run: |
|
||||||
|
# Simple grep-based filtering for screenshot tests
|
||||||
|
npx playwright test -g "screenshot" --update-snapshots
|
||||||
|
```
|
||||||
|
|
||||||
|
**Trade-offs:**
|
||||||
|
- ✅ Much simpler
|
||||||
|
- ✅ No custom scripts
|
||||||
|
- ❌ Slower (runs all screenshot tests, not just failed ones)
|
||||||
|
- ❌ Potentially updates snapshots that weren't actually failing
|
||||||
|
|
||||||
|
---
|
||||||
|
|
||||||
|
## Conclusion
|
||||||
|
|
||||||
|
The current custom manifest approach is **well-designed** and **appropriate** for this project's requirements:
|
||||||
|
|
||||||
|
1. **Handles sharded tests** - critical for CI performance
|
||||||
|
2. **Selective reruns** - saves time and resources
|
||||||
|
3. **Stable implementation** - uses documented Playwright JSON schema
|
||||||
|
4. **No external dependencies** - fully controlled
|
||||||
|
|
||||||
|
While `--last-failed` is a nice feature for **local development**, Playwright's own documentation and maintainer comments confirm it's **not suitable for distributed CI/CD testing**, which is exactly what this project needs.
|
||||||
|
|
||||||
|
The only potentially better solution (Currents) requires a paid external service, which adds cost and complexity without significant benefits over the current approach.
|
||||||
|
|
||||||
|
**Recommendation: Keep the current implementation**, with minor improvements to error handling and documentation. Monitor Playwright development for native improvements, but don't expect `--last-failed` to become a viable alternative for this use case.
|
||||||
|
|
||||||
|
---
|
||||||
|
|
||||||
|
## References
|
||||||
|
|
||||||
|
### Official Playwright Documentation
|
||||||
|
- [Command Line](https://playwright.dev/docs/test-cli)
|
||||||
|
- [Reporters](https://playwright.dev/docs/test-reporters)
|
||||||
|
- [Test Sharding](https://playwright.dev/docs/test-sharding)
|
||||||
|
- [CI/CD Setup](https://playwright.dev/docs/ci-intro)
|
||||||
|
|
||||||
|
### Community Resources
|
||||||
|
- [Playwright Solutions: How to Run Failures Only](https://playwrightsolutions.com/how-to-run-failures-only-from-the-last-playwright-run/)
|
||||||
|
- [Medium: How to Run Only Last Failed Tests](https://medium.com/@testerstalk/how-to-run-only-last-failed-tests-in-playwright-e5e41472594a)
|
||||||
|
- [Medium: Streamlining Visual Regression Testing](https://medium.com/@haleywardo/streamlining-playwright-visual-regression-testing-with-github-actions-e077fd33c27c)
|
||||||
|
|
||||||
|
### GitHub Issues
|
||||||
|
- [#30924 - Last-failed with blob reports](https://github.com/microsoft/playwright/issues/30924)
|
||||||
|
- [#33094 - Merging main run with --last-failed](https://github.com/microsoft/playwright/issues/33094)
|
||||||
|
- [#28254 - Feature request for --last-failed](https://github.com/microsoft/playwright/issues/28254)
|
||||||
|
|
||||||
|
### Example Implementations
|
||||||
|
- [JupyterLab Git - Update Integration Tests](https://github.com/jupyterlab/jupyterlab-git/blob/main/.github/workflows/update-integration-tests.yml)
|
||||||
|
- [WordPress Openverse - Discussion #4535](https://github.com/WordPress/openverse/issues/4535)
|
||||||
|
|
||||||
|
### Third-Party Tools
|
||||||
|
- [Currents - Playwright Last Failed Action](https://github.com/currents-dev/playwright-last-failed)
|
||||||
|
- [Currents - Re-run Only Failed Tests](https://docs.currents.dev/guides/re-run-only-failed-tests)
|
||||||
482 lines added: docs/SNAPSHOT_UPDATE_FROM_ACTUALS.md (new file)
@@ -0,0 +1,482 @@
|
|||||||
|
# Snapshot Update from Actual Files (Fast Approach)
|
||||||
|
|
||||||
|
**Date:** 2025-10-08
|
||||||
|
**Status:** Proposed Optimization
|
||||||
|
|
||||||
|
## Overview
|
||||||
|
|
||||||
|
When Playwright snapshot tests fail, Playwright **already generates the new ("actual") snapshots**. Instead of re-running tests with `--update-snapshots`, we can extract these actual snapshots from the `test-results/` directory and copy them to overwrite the expected snapshots.
|
||||||
|
|
||||||
|
**Performance improvement:** ~2-5 minutes → **~10-30 seconds**
|
||||||
|
|
||||||
|
## How Playwright Stores Snapshots
|
||||||
|
|
||||||
|
### Expected (Baseline) Snapshots
|
||||||
|
|
||||||
|
Stored in: `<test-file>-snapshots/<snapshot-name>-<project>-<platform>.png`
|
||||||
|
|
||||||
|
**Example:**
|
||||||
|
```
|
||||||
|
browser_tests/tests/interaction.spec.ts-snapshots/default-chromium-linux.png
|
||||||
|
```
|
||||||
|
|
||||||
|
### Failed Test Artifacts
|
||||||
|
|
||||||
|
When a snapshot test fails, Playwright creates:
|
||||||
|
|
||||||
|
```
|
||||||
|
test-results/<test-hash>/
|
||||||
|
├── <snapshot-name>-actual.png # The NEW screenshot
|
||||||
|
├── <snapshot-name>-expected.png # Copy of baseline
|
||||||
|
└── <snapshot-name>-diff.png # Visual diff
|
||||||
|
```
|
||||||
|
|
||||||
|
**Example:**
|
||||||
|
```
|
||||||
|
test-results/interaction-default-chromium-67af3c/
|
||||||
|
├── default-1-actual.png
|
||||||
|
├── default-1-expected.png
|
||||||
|
└── default-1-diff.png
|
||||||
|
```
|
||||||
|
|
||||||
|
## Current Approach vs. Proposed Approach
|
||||||
|
|
||||||
|
### Current: Re-run Tests with `--update-snapshots`
|
||||||
|
|
||||||
|
```yaml
|
||||||
|
# Current workflow (.github/workflows/update-playwright-expectations.yaml)
|
||||||
|
- name: Re-run failed screenshot tests and update snapshots
|
||||||
|
run: |
|
||||||
|
# Download manifest of failed tests
|
||||||
|
# For each project: chromium, chromium-2x, etc.
|
||||||
|
# Run: playwright test --project="$project" --update-snapshots test1.spec.ts:42 test2.spec.ts:87 ...
|
||||||
|
```
|
||||||
|
|
||||||
|
**Time:** ~2-5 minutes (depends on # of failed tests)
|
||||||
|
|
||||||
|
**Why slow:**
|
||||||
|
- Re-executes tests (browser startup, navigation, interactions)
|
||||||
|
- Waits for elements, animations, etc.
|
||||||
|
- Generates HTML report
|
||||||
|
- Each test takes 5-15 seconds
|
||||||
|
|
||||||
|
### Proposed: Copy Actual → Expected
|
||||||
|
|
||||||
|
```yaml
|
||||||
|
# Proposed workflow
|
||||||
|
- name: Download test artifacts (includes test-results/)
|
||||||
|
- name: Copy actual snapshots to expected locations
|
||||||
|
run: pnpm tsx scripts/cicd/update-snapshots-from-actuals.ts
|
||||||
|
- name: Commit and push
|
||||||
|
```
|
||||||
|
|
||||||
|
**Time:** ~10-30 seconds (just file operations)
|
||||||
|
|
||||||
|
**Why fast:**
|
||||||
|
- No test execution
|
||||||
|
- No browser startup
|
||||||
|
- Just file copying
|
||||||
|
- Parallel file operations
|
||||||
|
|
||||||
|
## Implementation Plan
|
||||||
|
|
||||||
|
### Step 1: Modify tests-ci.yaml
|
||||||
|
|
||||||
|
Currently, test artifacts upload only the `playwright-report/` directory.
|
||||||
|
|
||||||
|
**Add test-results/ to artifacts:**
|
||||||
|
|
||||||
|
```yaml
|
||||||
|
# .github/workflows/tests-ci.yaml
|
||||||
|
- uses: actions/upload-artifact@v4
|
||||||
|
if: always()
|
||||||
|
with:
|
||||||
|
name: playwright-results-${{ matrix.browser }} # New artifact
|
||||||
|
path: |
|
||||||
|
ComfyUI_frontend/test-results/**/*-actual.png
|
||||||
|
ComfyUI_frontend/test-results/**/*-expected.png
|
||||||
|
ComfyUI_frontend/test-results/**/*-diff.png
|
||||||
|
retention-days: 7
|
||||||
|
```
|
||||||
|
|
||||||
|
**Optimization:** Only upload actual snapshots for failed tests (saves artifact storage)
|
||||||
|
|
||||||
|
### Step 2: Create Script to Map Actuals → Expected
|
||||||
|
|
||||||
|
**File:** `scripts/cicd/update-snapshots-from-actuals.ts`
|
||||||
|
|
||||||
|
```typescript
|
||||||
|
import type { JSONReport, JSONReportTestResult } from '@playwright/test/reporter'
|
||||||
|
import fs from 'node:fs'
|
||||||
|
import fsp from 'node:fs/promises'
|
||||||
|
import path from 'node:path'
|
||||||
|
|
||||||
|
interface SnapshotMapping {
|
||||||
|
actualPath: string // test-results/.../snapshot-1-actual.png
|
||||||
|
expectedPath: string // browser_tests/tests/foo.spec.ts-snapshots/snapshot-chromium-linux.png
|
||||||
|
testFile: string
|
||||||
|
testName: string
|
||||||
|
project: string
|
||||||
|
}
|
||||||
|
|
||||||
|
async function main() {
|
||||||
|
const reportPath = path.join('playwright-report', 'report.json')
|
||||||
|
|
||||||
|
if (!fs.existsSync(reportPath)) {
|
||||||
|
console.log('No report.json found - no failed tests to update')
|
||||||
|
return
|
||||||
|
}
|
||||||
|
|
||||||
|
const raw = await fsp.readFile(reportPath, 'utf8')
|
||||||
|
const report: JSONReport = JSON.parse(raw)
|
||||||
|
|
||||||
|
const mappings: SnapshotMapping[] = []
|
||||||
|
|
||||||
|
// Parse JSON report to extract snapshot paths
|
||||||
|
function collectFailedSnapshots(suite: any) {
|
||||||
|
if (!suite) return
|
||||||
|
|
||||||
|
for (const childSuite of suite.suites ?? []) {
|
||||||
|
collectFailedSnapshots(childSuite)
|
||||||
|
}
|
||||||
|
|
||||||
|
for (const spec of suite.specs ?? []) {
|
||||||
|
for (const test of spec.tests) {
|
||||||
|
const lastResult = test.results[test.results.length - 1]
|
||||||
|
|
||||||
|
if (lastResult?.status !== 'failed') continue
|
||||||
|
|
||||||
|
// Check if test has image attachments (indicates screenshot test)
|
||||||
|
const imageAttachments = lastResult.attachments.filter(
|
||||||
|
(att: any) => att?.contentType?.startsWith('image/')
|
||||||
|
)
|
||||||
|
|
||||||
|
if (imageAttachments.length === 0) continue
|
||||||
|
|
||||||
|
// Extract snapshot mapping from attachments
|
||||||
|
for (const attachment of imageAttachments) {
|
||||||
|
const attachmentPath = attachment.path
|
||||||
|
|
||||||
|
if (!attachmentPath || !attachmentPath.includes('-actual.png')) {
|
||||||
|
continue
|
||||||
|
}
|
||||||
|
|
||||||
|
// Parse test-results path to determine expected location
|
||||||
|
// test-results/interaction-default-chromium-67af3c/default-1-actual.png
|
||||||
|
// → browser_tests/tests/interaction.spec.ts-snapshots/default-chromium-linux.png
|
||||||
|
|
||||||
|
const actualPath = attachmentPath
|
||||||
|
const expectedPath = inferExpectedPath(actualPath, spec.file, test.projectId)
|
||||||
|
|
||||||
|
if (expectedPath) {
|
||||||
|
mappings.push({
|
||||||
|
actualPath,
|
||||||
|
expectedPath,
|
||||||
|
testFile: spec.file,
|
||||||
|
testName: test.annotations[0]?.description || test.title,
|
||||||
|
project: test.projectId
|
||||||
|
})
|
||||||
|
}
|
||||||
|
}
|
||||||
|
}
|
||||||
|
}
|
||||||
|
}
|
||||||
|
|
||||||
|
collectFailedSnapshots(report)
|
||||||
|
|
||||||
|
if (mappings.length === 0) {
|
||||||
|
console.log('No failed snapshot tests found')
|
||||||
|
return
|
||||||
|
}
|
||||||
|
|
||||||
|
console.log(`Found ${mappings.length} snapshots to update`)
|
||||||
|
|
||||||
|
// Copy actual → expected
|
||||||
|
let successCount = 0
|
||||||
|
let errorCount = 0
|
||||||
|
|
||||||
|
for (const mapping of mappings) {
|
||||||
|
try {
|
||||||
|
if (!fs.existsSync(mapping.actualPath)) {
|
||||||
|
console.warn(`⚠️ Actual file not found: ${mapping.actualPath}`)
|
||||||
|
errorCount++
|
||||||
|
continue
|
||||||
|
}
|
||||||
|
|
||||||
|
// Ensure expected directory exists
|
||||||
|
const expectedDir = path.dirname(mapping.expectedPath)
|
||||||
|
await fsp.mkdir(expectedDir, { recursive: true })
|
||||||
|
|
||||||
|
// Copy actual → expected
|
||||||
|
await fsp.copyFile(mapping.actualPath, mapping.expectedPath)
|
||||||
|
|
||||||
|
console.log(`✓ Updated: ${path.basename(mapping.expectedPath)}`)
|
||||||
|
successCount++
|
||||||
|
} catch (error) {
|
||||||
|
console.error(`✗ Failed to update ${mapping.expectedPath}:`, error)
|
||||||
|
errorCount++
|
||||||
|
}
|
||||||
|
}
|
||||||
|
|
||||||
|
console.log(`\n✅ Successfully updated ${successCount} snapshots`)
|
||||||
|
if (errorCount > 0) {
|
||||||
|
console.log(`⚠️ Failed to update ${errorCount} snapshots`)
|
||||||
|
process.exit(1)
|
||||||
|
}
|
||||||
|
}
|
||||||
|
|
||||||
|
/**
|
||||||
|
* Infer the expected snapshot path from the actual path
|
||||||
|
*
|
||||||
|
* Actual: test-results/interaction-default-chromium-67af3c/default-1-actual.png
|
||||||
|
* Expected: browser_tests/tests/interaction.spec.ts-snapshots/default-chromium-linux.png
|
||||||
|
*/
|
||||||
|
function inferExpectedPath(actualPath: string, testFile: string, projectId: string): string | null {
|
||||||
|
try {
|
||||||
|
// Extract snapshot name from actual path
|
||||||
|
// "default-1-actual.png" → "default"
|
||||||
|
const actualFilename = path.basename(actualPath)
|
||||||
|
const snapshotName = actualFilename.replace(/-\d+-actual\.png$/, '')
|
||||||
|
|
||||||
|
// Determine platform (linux, darwin, win32)
|
||||||
|
const platform = process.platform === 'linux' ? 'linux'
|
||||||
|
: process.platform === 'darwin' ? 'darwin'
|
||||||
|
: 'win32'
|
||||||
|
|
||||||
|
// Build expected path
|
||||||
|
const testDir = path.dirname(testFile)
|
||||||
|
const testBasename = path.basename(testFile)
|
||||||
|
const snapshotsDir = path.join(testDir, `${testBasename}-snapshots`)
|
||||||
|
const expectedFilename = `${snapshotName}-${projectId}-${platform}.png`
|
||||||
|
|
||||||
|
return path.join(snapshotsDir, expectedFilename)
|
||||||
|
} catch (error) {
|
||||||
|
console.error(`Failed to infer expected path for ${actualPath}:`, error)
|
||||||
|
return null
|
||||||
|
}
|
||||||
|
}
|
||||||
|
|
||||||
|
main().catch((err) => {
|
||||||
|
console.error('Failed to update snapshots:', err)
|
||||||
|
process.exit(1)
|
||||||
|
})
|
||||||
|
```
|
||||||
|
|
||||||
|
### Step 3: Better Approach - Use Playwright's Attachment Metadata
|
||||||
|
|
||||||
|
The JSON reporter actually includes the **expected snapshot path** in the attachments!
|
||||||
|
|
||||||
|
**Simplified script:**
|
||||||
|
|
||||||
|
```typescript
|
||||||
|
async function main() {
|
||||||
|
const report: JSONReport = JSON.parse(await fsp.readFile('playwright-report/report.json', 'utf8'))
|
||||||
|
|
||||||
|
const updates: Array<{ actual: string; expected: string }> = []
|
||||||
|
|
||||||
|
for (const result of getAllTestResults(report)) {
|
||||||
|
if (result.status !== 'failed') continue
|
||||||
|
|
||||||
|
for (const attachment of result.attachments) {
|
||||||
|
// Playwright includes both actual and expected in attachments
|
||||||
|
if (attachment.name?.includes('-actual') && attachment.path) {
|
||||||
|
const actualPath = attachment.path
|
||||||
|
|
||||||
|
// Find corresponding expected attachment
|
||||||
|
const expectedAttachment = result.attachments.find(
|
||||||
|
att => att.name === attachment.name.replace('-actual', '-expected')
|
||||||
|
)
|
||||||
|
|
||||||
|
if (expectedAttachment?.path) {
|
||||||
|
// The expected path in attachment points to the test-results copy
|
||||||
|
// But we can infer the real expected path from the attachment metadata
|
||||||
|
const expectedPath = inferRealExpectedPath(expectedAttachment)
|
||||||
|
updates.push({ actual: actualPath, expected: expectedPath })
|
||||||
|
}
|
||||||
|
}
|
||||||
|
}
|
||||||
|
}
|
||||||
|
|
||||||
|
// Copy files
|
||||||
|
for (const { actual, expected } of updates) {
|
||||||
|
await fsp.copyFile(actual, expected)
|
||||||
|
console.log(`✓ Updated: ${path.relative(process.cwd(), expected)}`)
|
||||||
|
}
|
||||||
|
}
|
||||||
|
```
|
||||||
|
|
||||||
|
### Step 4: Update GitHub Actions Workflow
|
||||||
|
|
||||||
|
```yaml
|
||||||
|
# .github/workflows/update-playwright-expectations.yaml
|
||||||
|
name: Update Playwright Expectations
|
||||||
|
|
||||||
|
on:
|
||||||
|
issue_comment:
|
||||||
|
types: [created]
|
||||||
|
|
||||||
|
jobs:
|
||||||
|
update:
|
||||||
|
if: |
|
||||||
|
github.event.issue.pull_request &&
|
||||||
|
contains(github.event.comment.body, '/update-snapshots') &&
|
||||||
|
contains(fromJSON('["OWNER", "MEMBER", "COLLABORATOR"]'),
|
||||||
|
github.event.comment.author_association)
|
||||||
|
runs-on: ubuntu-latest
|
||||||
|
steps:
|
||||||
|
- name: React to comment
|
||||||
|
uses: actions/github-script@v8
|
||||||
|
with:
|
||||||
|
script: |
|
||||||
|
github.rest.reactions.createForIssueComment({
|
||||||
|
comment_id: context.payload.comment.id,
|
||||||
|
content: '+1'
|
||||||
|
})
|
||||||
|
|
||||||
|
- name: Checkout PR
|
||||||
|
run: gh pr checkout ${{ github.event.issue.number }}
|
||||||
|
env:
|
||||||
|
GH_TOKEN: ${{ secrets.GITHUB_TOKEN }}
|
||||||
|
|
||||||
|
- name: Setup Frontend
|
||||||
|
uses: ./.github/actions/setup-frontend
|
||||||
|
|
||||||
|
- name: Get latest failed test run
|
||||||
|
id: get-run
|
||||||
|
uses: actions/github-script@v8
|
||||||
|
with:
|
||||||
|
script: |
|
||||||
|
const pr = await github.rest.pulls.get({
|
||||||
|
owner: context.repo.owner,
|
||||||
|
repo: context.repo.repo,
|
||||||
|
pull_number: context.payload.issue.number
|
||||||
|
})
|
||||||
|
|
||||||
|
const runs = await github.rest.actions.listWorkflowRuns({
|
||||||
|
owner: context.repo.owner,
|
||||||
|
repo: context.repo.repo,
|
||||||
|
workflow_id: 'tests-ci.yaml',
|
||||||
|
head_sha: pr.data.head.sha,
|
||||||
|
per_page: 1
|
||||||
|
})
|
||||||
|
|
||||||
|
core.setOutput('run_id', runs.data.workflow_runs[0]?.id || '')
|
||||||
|
|
||||||
|
- name: Download test results
|
||||||
|
uses: actions/download-artifact@v4
|
||||||
|
with:
|
||||||
|
run-id: ${{ steps.get-run.outputs.run_id }}
|
||||||
|
pattern: playwright-results-*
|
||||||
|
path: ComfyUI_frontend/test-results
|
||||||
|
merge-multiple: true
|
||||||
|
|
||||||
|
- name: Download JSON report
|
||||||
|
uses: actions/download-artifact@v4
|
||||||
|
with:
|
||||||
|
run-id: ${{ steps.get-run.outputs.run_id }}
|
||||||
|
pattern: playwright-report-*
|
||||||
|
path: ComfyUI_frontend/playwright-report
|
||||||
|
merge-multiple: true
|
||||||
|
|
||||||
|
- name: Update snapshots from actuals
|
||||||
|
working-directory: ComfyUI_frontend
|
||||||
|
run: pnpm tsx scripts/cicd/update-snapshots-from-actuals.ts
|
||||||
|
|
||||||
|
- name: Commit and push
|
||||||
|
working-directory: ComfyUI_frontend
|
||||||
|
run: |
|
||||||
|
git config user.name 'github-actions'
|
||||||
|
git config user.email 'github-actions@github.com'
|
||||||
|
git add browser_tests/**/*-snapshots/*.png
|
||||||
|
|
||||||
|
if git diff --cached --quiet; then
|
||||||
|
echo "No snapshot changes detected"
|
||||||
|
else
|
||||||
|
git commit -m "[automated] Update test expectations"
|
||||||
|
git push
|
||||||
|
fi
|
||||||
|
```
|
||||||
|
|
||||||
|
## Performance Comparison
|
||||||
|
|
||||||
|
### Current Approach: Re-run Tests
|
||||||
|
|
||||||
|
| Step | Time |
|
||||||
|
|------|------|
|
||||||
|
| Download manifest | 5s |
|
||||||
|
| Install Playwright browsers | 20s |
|
||||||
|
| Re-run 50 failed tests | 2-3 min |
|
||||||
|
| Generate report | 10s |
|
||||||
|
| Commit and push | 10s |
|
||||||
|
| **Total** | **~3-4 min** |
|
||||||
|
|
||||||
|
### Proposed Approach: Copy Actuals
|
||||||
|
|
||||||
|
| Step | Time |
|
||||||
|
|------|------|
|
||||||
|
| Download test-results artifacts | 10s |
|
||||||
|
| Download JSON report | 2s |
|
||||||
|
| Run copy script | 5s |
|
||||||
|
| Commit and push | 10s |
|
||||||
|
| **Total** | **~30s** |
|
||||||
|
|
||||||
|
**Speedup: 6-8x faster** ⚡
|
||||||
|
|
||||||
|
## Advantages
|
||||||
|
|
||||||
|
✅ **Much faster** - No test re-execution
|
||||||
|
✅ **Simpler** - No need for manifest generation
|
||||||
|
✅ **Fewer dependencies** - No Playwright browser install needed
|
||||||
|
✅ **Less resource usage** - No ComfyUI server, no browser processes
|
||||||
|
✅ **More reliable** - File operations are deterministic
|
||||||
|
✅ **Already tested** - The snapshots were generated during the actual test run
|
||||||
|
|
||||||
|
## Disadvantages / Edge Cases
|
||||||
|
|
||||||
|
❌ **New snapshots** - If a test creates a snapshot for the first time, there's no existing expected file. This is rare and can be handled by fallback to re-running.
|
||||||
|
|
||||||
|
❌ **Deleted tests** - Old snapshots won't be cleaned up automatically. Could add a cleanup step.
|
||||||
|
|
||||||
|
❌ **Multiple projects** - Each project (chromium, chromium-2x, mobile-chrome) generates separate actuals. The script needs to handle all of them.
|
||||||
|
|
||||||
|
❌ **Artifact storage** - Storing test-results/ increases artifact size. Mitigation: Only upload `-actual.png` files, not traces/videos.
|
||||||
|
|
||||||
|
## Hybrid Approach (Recommended)
|
||||||
|
|
||||||
|
Use the fast copy approach **with fallback**:
|
||||||
|
|
||||||
|
```yaml
|
||||||
|
- name: Update snapshots
|
||||||
|
run: |
|
||||||
|
# Try fast approach first
|
||||||
|
if pnpm tsx scripts/cicd/update-snapshots-from-actuals.ts; then
|
||||||
|
echo "✓ Updated snapshots from actuals"
|
||||||
|
else
|
||||||
|
echo "⚠ Fast update failed, falling back to re-running tests"
|
||||||
|
# Fallback to current approach
|
||||||
|
pnpm exec playwright test --update-snapshots --project=chromium ...
|
||||||
|
fi
|
||||||
|
```
|
||||||
|
|
||||||
|
## Implementation Checklist
|
||||||
|
|
||||||
|
- [ ] Create `scripts/cicd/update-snapshots-from-actuals.ts`
|
||||||
|
- [ ] Update `tests-ci.yaml` to upload `test-results/` artifacts
|
||||||
|
- [ ] Update `update-playwright-expectations.yaml` to use new script
|
||||||
|
- [ ] Add fallback logic for edge cases
|
||||||
|
- [ ] Test with actual PR
|
||||||
|
- [ ] Update documentation
|
||||||
|
- [ ] Consider switching from label trigger → comment trigger (`/update-snapshots`)
|
||||||
|
|
||||||
|
## Related Links
|
||||||
|
|
||||||
|
- **Playwright snapshot docs:** https://playwright.dev/docs/test-snapshots
|
||||||
|
- **JSON reporter types:** `@playwright/test/reporter`
|
||||||
|
- **GitHub Actions artifacts:** https://docs.github.com/en/actions/using-workflows/storing-workflow-data-as-artifacts
|
||||||
|
- **Issue #22064:** Playwright feature request for better snapshot file alignment
|
||||||
|
|
||||||
|
## Conclusion
|
||||||
|
|
||||||
|
This approach is **significantly faster** and **simpler** than re-running tests. The main trade-off is artifact storage size, but this can be mitigated by only uploading actual snapshots (not traces/videos).
|
||||||
|
|
||||||
|
**Recommendation:** Implement this as the primary approach with fallback to re-running tests for edge cases.
|
||||||
87 lines added: scripts/cicd/build-failed-screenshot-manifest.ts (new file)
@@ -0,0 +1,87 @@
|
|||||||
|
import type {
|
||||||
|
JSONReport,
|
||||||
|
JSONReportSpec,
|
||||||
|
JSONReportSuite,
|
||||||
|
JSONReportTestResult
|
||||||
|
} from '@playwright/test/reporter'
|
||||||
|
import fs from 'node:fs'
|
||||||
|
import fsp from 'node:fs/promises'
|
||||||
|
import path from 'node:path'
|
||||||
|
|
||||||
|
const argv = process.argv.slice(2)
|
||||||
|
const getArg = (flag: string, fallback: string) => {
|
||||||
|
const i = argv.indexOf(flag)
|
||||||
|
if (i >= 0 && i + 1 < argv.length) return argv[i + 1]
|
||||||
|
return fallback
|
||||||
|
}
|
||||||
|
|
||||||
|
async function main() {
|
||||||
|
// Defaults mirror the workflow layout
|
||||||
|
const reportPath = getArg(
|
||||||
|
'--report',
|
||||||
|
path.join('playwright-report', 'report.json')
|
||||||
|
)
|
||||||
|
const outDir = getArg('--out', path.join('ci-rerun'))
|
||||||
|
|
||||||
|
if (!fs.existsSync(reportPath)) {
|
||||||
|
throw Error(`Report not found at ${reportPath}`)
|
||||||
|
}
|
||||||
|
|
||||||
|
const raw = await fsp.readFile(reportPath, 'utf8')
|
||||||
|
|
||||||
|
let data: JSONReport
|
||||||
|
try {
|
||||||
|
data = JSON.parse(raw)
|
||||||
|
} catch (error) {
|
||||||
|
throw new Error(
|
||||||
|
`Failed to parse Playwright JSON report at ${reportPath}. ` +
|
||||||
|
`The report file may be corrupted or incomplete. ` +
|
||||||
|
`Error: ${error instanceof Error ? error.message : String(error)}`
|
||||||
|
)
|
||||||
|
}
|
||||||
|
|
||||||
|
const hasScreenshotSignal = (r: JSONReportTestResult) => {
|
||||||
|
return r.attachments.some((att) => att?.contentType?.startsWith('image/'))
|
||||||
|
}
|
||||||
|
|
||||||
|
const out = new Map<string, Set<string>>()
|
||||||
|
|
||||||
|
const collectFailedScreenshots = (suite?: JSONReportSuite) => {
|
||||||
|
if (!suite) return
|
||||||
|
const childSuites = suite.suites ?? []
|
||||||
|
for (const childSuite of childSuites) collectFailedScreenshots(childSuite)
|
||||||
|
const specs: JSONReportSpec[] = suite.specs ?? []
|
||||||
|
for (const spec of specs) {
|
||||||
|
const file = spec.file
|
||||||
|
const line = spec.line
|
||||||
|
const loc = `${file}:${line}`
|
||||||
|
for (const test of spec.tests) {
|
||||||
|
const project = test.projectId
|
||||||
|
const last = test.results[test.results.length - 1]
|
||||||
|
const failedScreenshot =
|
||||||
|
last && last.status === 'failed' && hasScreenshotSignal(last)
|
||||||
|
if (!failedScreenshot) continue
|
||||||
|
if (!out.has(project)) out.set(project, new Set())
|
||||||
|
const projectSet = out.get(project)
|
||||||
|
if (projectSet) {
|
||||||
|
projectSet.add(loc)
|
||||||
|
}
|
||||||
|
}
|
||||||
|
}
|
||||||
|
}
|
||||||
|
|
||||||
|
const report: JSONReport = data
|
||||||
|
const rootSuites = report.suites ?? []
|
||||||
|
for (const suite of rootSuites) collectFailedScreenshots(suite)
|
||||||
|
|
||||||
|
await fsp.mkdir(outDir, { recursive: true })
|
||||||
|
for (const [project, set] of out.entries()) {
|
||||||
|
const f = path.join(outDir, `${project}.txt`)
|
||||||
|
await fsp.writeFile(f, Array.from(set).join('\n') + '\n', 'utf8')
|
||||||
|
}
|
||||||
|
}
|
||||||
|
|
||||||
|
main().catch((err) => {
|
||||||
|
console.error('Manifest generation failed:', err)
|
||||||
|
process.exit(1)
|
||||||
|
})
|
||||||
@@ -1,11 +1,8 @@
|
|||||||
import { beforeEach, describe, expect, it, vi } from 'vitest'
|
import { beforeEach, describe, expect, it, vi } from 'vitest'
|
||||||
|
|
||||||
import { layoutStore } from '@/renderer/core/layout/store/layoutStore'
|
import { layoutStore } from '@/renderer/core/layout/store/layoutStore'
|
||||||
import {
|
import { LayoutSource } from '@/renderer/core/layout/types'
|
||||||
type LayoutChange,
|
import type { LayoutChange, NodeLayout } from '@/renderer/core/layout/types'
|
||||||
LayoutSource,
|
|
||||||
type NodeLayout
|
|
||||||
} from '@/renderer/core/layout/types'
|
|
||||||
|
|
||||||
describe('layoutStore CRDT operations', () => {
|
describe('layoutStore CRDT operations', () => {
|
||||||
beforeEach(() => {
|
beforeEach(() => {
|
||||||
|
|||||||
@@ -1,10 +1,10 @@
|
|||||||
import { beforeEach, describe, expect, it, vi } from 'vitest'
|
import { beforeEach, describe, expect, it, vi } from 'vitest'
|
||||||
import { computed, shallowRef } from 'vue'
|
import { computed, shallowRef } from 'vue'
|
||||||
|
|
||||||
import {
|
import { useGraphNodeManager } from '@/composables/graph/useGraphNodeManager'
|
||||||
type GraphNodeManager,
|
import type {
|
||||||
type VueNodeData,
|
GraphNodeManager,
|
||||||
useGraphNodeManager
|
VueNodeData
|
||||||
} from '@/composables/graph/useGraphNodeManager'
|
} from '@/composables/graph/useGraphNodeManager'
|
||||||
import { useVueNodeLifecycle } from '@/composables/graph/useVueNodeLifecycle'
|
import { useVueNodeLifecycle } from '@/composables/graph/useVueNodeLifecycle'
|
||||||
import type {
|
import type {
|
||||||
|
|||||||
Reference in New Issue
Block a user