Merge remote-tracking branch 'origin/main' into link-gh-action-with-webview

Svilen-Stefanov · Svilen-Stefanov · commit ba5d7787eaec · 2026-06-11T18:38:35.000+02:00
# Conflicts:
#	.codeboarding/analysis.json
#	.codeboarding/health/health_report.json
diff --git a/.codeboarding/analysis.json b/.codeboarding/analysis.json
@@ -1,7 +1,7 @@
 {
   "metadata": {
-    "generated_at": "2026-06-11T15:51:00.405452+00:00",
-    "commit_hash": "7e07060289fb7516657e6c428fdec5e631fbfd72",
+    "generated_at": "2026-06-11T16:36:04.958976+00:00",
+    "commit_hash": "e9aa6435ce9f0ffe6726d5c1a3758980f79f1c3b",
     "repo_name": "CodeBoarding-action",
     "depth_level": 1,
     "file_coverage_summary": {
@@ -14,7 +14,7 @@
       }
     }
   },
-  "description": "The CodeBoarding-action pipeline automates structural code analysis and visualization by orchestrating engine execution across Git branches, generating visual diffs of code changes, and integrating these insights into GitHub PRs via IDE-specific deep links.",
+  "description": "The CodeBoarding system orchestrates the analysis of git repositories, performs structural diffing between analysis states, and generates actionable visual feedback for pull requests by integrating with developer environments.",
   "files": {
     "scripts/cb_engine.py": {
       "method_keys": [
@@ -377,8 +377,8 @@
   },
   "components": [
     {
-      "name": "Analysis Orchestrator",
-      "description": "Coordinates the execution flow of the CodeBoarding engine, managing the lifecycle of base, head, and health analysis runs. The unclustered connections reveal a complex internal state machine (scripts.cb_engine.run_base, scripts.cb_engine.run_head, scripts.cb_engine.run_health, scripts.cb_engine.validate_base_analysis) that defines the core pipeline logic of the GitHub Action.",
+      "name": "Engine Orchestrator",
+      "description": "Manages the execution environment and lifecycle of the CodeBoarding analysis engine. It handles the checkout of different git references, executes the analysis, and validates the integrity of the generated data before downstream processing.",
       "key_entities": [
         {
           "qualified_name": "scripts.cb_engine.main",
@@ -429,8 +429,8 @@
       "can_expand": true
     },
     {
-      "name": "Visual Diff Generator",
-      "description": "Transforms raw analysis data and structural changes into visual representations, specifically Mermaid.js diagrams, highlighting architectural shifts. The new connections (scripts.diff_to_mermaid._diff_components, scripts.diff_to_mermaid._diff_relations, scripts.diff_to_mermaid._has_structural_changes) indicate a sophisticated logic for identifying architectural regressions or evolutions.",
+      "name": "Visual Diff Engine",
+      "description": "The core analytical component that compares two sets of analysis data. It identifies structural modifications (additions, removals, or changes in relationships), filters for relevance to reduce diagram noise, and renders the final architectural diff using Mermaid.js syntax.",
       "key_entities": [
         {
           "qualified_name": "scripts.diff_to_mermaid.main",
@@ -451,10 +451,10 @@
           "reference_end_line": 521
         },
         {
-          "qualified_name": "scripts.diff_to_mermaid._diff_components",
+          "qualified_name": "scripts.diff_to_mermaid._filter_changed",
           "reference_file": "scripts/diff_to_mermaid.py",
-          "reference_start_line": 162,
-          "reference_end_line": 207
+          "reference_start_line": 312,
+          "reference_end_line": 354
         }
       ],
       "source_cluster_ids": [
@@ -503,8 +503,8 @@
       "can_expand": true
     },
     {
-      "name": "UX & Integration Layer",
-      "description": "Manages the interaction between the action and the GitHub environment, including the generation of PR comments, status updates, and user-facing links. The addition of scripts.build_cta.py introduces specific logic for generating 'Call to Action' links and webview integrations, expanding the layer's responsibility from simple reporting to interactive developer experience (DevEx) tooling.",
+      "name": "Engagement & Feedback Manager",
+      "description": "Enhances the PR comment with interactive elements. It detects the developer's environment and generates deep-links to local IDEs or the CodeBoarding dashboard, transforming a static diagram into an actionable entry point for code review.",
       "key_entities": [
         {
           "qualified_name": "scripts.build_cta.main",
@@ -545,18 +545,18 @@
   ],
   "components_relations": [
     {
-      "relation": "Provides analysis artifacts to",
-      "src_name": "Analysis Orchestrator",
-      "dst_name": "Visual Diff Generator",
+      "relation": "Supplies validated JSON analysis files to",
+      "src_name": "Engine Orchestrator",
+      "dst_name": "Visual Diff Engine",
       "src_id": "1",
       "dst_id": "2",
       "edge_count": 0,
       "is_static": false
     },
     {
-      "relation": "Passes rendered diagrams to",
-      "src_name": "Visual Diff Generator",
-      "dst_name": "UX & Integration Layer",
+      "relation": "Provides structural context and identified changes to",
+      "src_name": "Visual Diff Engine",
+      "dst_name": "Engagement & Feedback Manager",
       "src_id": "2",
       "dst_id": "3",
       "edge_count": 0,
diff --git a/.codeboarding/health/health_report.json b/.codeboarding/health/health_report.json
@@ -1,13 +1,13 @@
 {
   "repository_name": "CodeBoarding-action",
-  "timestamp": "2026-06-11T15:50:45.582495+00:00",
-  "overall_score": 0.9996183206106869,
+  "timestamp": "2026-06-11T16:35:41.927521+00:00",
+  "overall_score": 0.999609375,
   "check_summaries": [
     {
       "check_name": "function_size",
       "description": "Checks that functions/methods do not exceed line count thresholds",
       "check_type": "standard",
-      "total_entities_checked": 43,
+      "total_entities_checked": 42,
       "findings_count": 0,
       "warning_count": 0,
       "score": 1.0,
@@ -17,7 +17,7 @@
       "check_name": "fan_out",
       "description": "Checks efferent coupling: how many other functions each function calls",
       "check_type": "standard",
-      "total_entities_checked": 43,
+      "total_entities_checked": 42,
       "findings_count": 0,
       "warning_count": 0,
       "score": 1.0,
@@ -27,7 +27,7 @@
       "check_name": "fan_in",
       "description": "Checks afferent coupling: how many other functions call each function",
       "check_type": "standard",
-      "total_entities_checked": 43,
+      "total_entities_checked": 42,
       "findings_count": 0,
       "warning_count": 0,
       "score": 1.0,
@@ -43,6 +43,24 @@
       "score": 1.0,
       "finding_groups": []
     },
+    {
+      "check_name": "circular_dependencies",
+      "description": "Detects circular dependencies between packages",
+      "check_type": "circular_dependencies",
+      "cycles": [],
+      "packages_checked": 1,
+      "packages_in_cycles": 0
+    },
+    {
+      "check_name": "package_instability",
+      "description": "Computes Martin's instability metric (I = Ce / (Ca + Ce)) per package",
+      "check_type": "standard",
+      "total_entities_checked": 0,
+      "findings_count": 0,
+      "warning_count": 0,
+      "score": 1.0,
+      "finding_groups": []
+    },
     {
       "check_name": "unused_code_diagnostics",
       "description": "Detects unused imports, variables, functions, and dead code via LSP diagnostics",
diff --git a/.github/workflows/refresh-baseline.yml b/.github/workflows/refresh-baseline.yml
@@ -0,0 +1,192 @@
+# One-off / on-demand baseline refresh for THIS repo's own committed analysis.
+#
+# Why this exists: the webview "explore in browser" link compares a PR's head
+# against the analysis.json committed at the PR base (a commit on main). That base
+# is only meaningful if main's committed analysis.json is current. The PR review
+# workflow never writes to main, so without this, main's baseline goes stale and
+# every PR diffs against an outdated snapshot.
+#
+# Run it manually (Actions -> "Refresh CodeBoarding baseline" -> Run workflow) to
+# regenerate .codeboarding/analysis.json against main's current tree and commit it.
+# It generates a FRESH full analysis (LLM) for main's HEAD and stamps it (via
+# --source-sha) with that analyzed commit, i.e. the parent of the refresh commit.
+# This is the manually-triggered "baseline keeper" from docs/COMMIT_STRATEGY.md.
+
+name: Refresh CodeBoarding baseline
+
+on:
+  workflow_dispatch:
+    inputs:
+      depth_level:
+        description: 'Analysis depth (1-3). Match the review workflow for a comparable baseline.'
+        required: false
+        default: '1'
+
+permissions:
+  contents: write   # commit the regenerated analysis.json to main
+
+concurrency:
+  group: codeboarding-refresh-baseline
+  cancel-in-progress: false
+
+jobs:
+  refresh:
+    runs-on: ubuntu-latest
+    timeout-minutes: 60
+    steps:
+      # Root checkout: provides the action's own scripts (cb_engine.py) AND is where
+      # the regenerated analysis.json is committed back. The engine and the analyzed
+      # tree go into SEPARATE subdirectories so the engine never analyzes itself.
+      - name: Checkout this repo (main)
+        uses: actions/checkout@v4
+        with:
+          fetch-depth: 0
+
+      # Second checkout of this same repo as the analysis TARGET, isolated from the
+      # action scripts + engine at the workspace root (mirrors the review action's
+      # target-repo/ layout so the engine analyzes only the repo's own tree).
+      - name: Checkout analysis target
+        uses: actions/checkout@v4
+        with:
+          path: target-repo
+          fetch-depth: 0
+
+      - name: Read engine ref from action.yml
+        id: engine
+        shell: bash
+        run: |
+          # Default to action.yml's engine_ref input default (the engine the review workflow pins).
+          # `|| true`: under bash -eo pipefail a no-match grep would abort before the fallback below.
+          REF="$(grep -A3 "engine_ref:" action.yml | grep "default:" | head -1 | sed -E "s/.*default: *'?([^'\"]+)'?.*/\1/" || true)"
+          echo "ref=${REF:-v0.12.0}" >> "$GITHUB_OUTPUT"
+          echo "Engine ref: ${REF:-v0.12.0}"
+
+      - name: Checkout CodeBoarding engine
+        uses: actions/checkout@v4
+        with:
+          repository: CodeBoarding/CodeBoarding
+          ref: ${{ steps.engine.outputs.ref }}
+          path: codeboarding-engine
+          persist-credentials: false
+
+      - uses: actions/setup-python@v5
+        with:
+          python-version: '3.13'
+      - uses: actions/setup-node@v4
+        with:
+          node-version: '20'
+      - uses: astral-sh/setup-uv@v4
+        with:
+          enable-cache: true
+
+      - name: Cache uv venv (engine)
+        uses: actions/cache@v4
+        with:
+          path: codeboarding-engine/.venv
+          key: cb-uv-${{ runner.os }}-${{ hashFiles('codeboarding-engine/pyproject.toml', 'codeboarding-engine/uv.lock') }}
+
+      - name: Cache LSP servers
+        uses: actions/cache@v4
+        with:
+          path: |
+            codeboarding-engine/static_analyzer/servers/node_modules
+            codeboarding-engine/static_analyzer/servers/bin
+          key: cb-lsp-${{ runner.os }}-v1
+          restore-keys: cb-lsp-${{ runner.os }}-
+
+      - name: Install Python dependencies
+        working-directory: codeboarding-engine
+        shell: bash
+        run: |
+          test -d .venv || uv venv
+          uv pip install -e .
+
+      - name: Install LSP servers
+        working-directory: codeboarding-engine
+        shell: bash
+        run: uv run python install.py --auto-install-npm
+
+      - name: Generate baseline analysis for main
+        id: gen
+        working-directory: codeboarding-engine
+        shell: bash
+        env:
+          STATIC_ANALYSIS_CONFIG: ${{ github.workspace }}/codeboarding-engine/static_analysis_config.yml
+          PROJECT_ROOT: ${{ github.workspace }}/codeboarding-engine
+          DIAGRAM_DEPTH_LEVEL: ${{ inputs.depth_level }}
+          CACHING_DOCUMENTATION: 'false'
+          ENABLE_MONITORING: 'false'
+          ACTION_PATH: ${{ github.workspace }}
+          TARGET: ${{ github.workspace }}/target-repo
+          OUT_DIR: ${{ runner.temp }}/cb-baseline
+          REPO_NAME: ${{ github.event.repository.name }}
+          DEPTH: ${{ inputs.depth_level }}
+          MAIN_SHA: ${{ github.sha }}
+          # Key + model pins live in SECRETS (not vars) in this repo, same as the
+          # review workflow consumes them. Read raw here; normalize in the script.
+          RAW_OPENROUTER_API_KEY: ${{ secrets.OPENROUTER_API_KEY }}
+          RAW_AGENT_MODEL: ${{ secrets.AGENT_MODEL }}
+          RAW_PARSING_MODEL: ${{ secrets.PARSING_MODEL }}
+        run: |
+          # Normalize EXACTLY like the review action's key prep (action.yml). A raw
+          # secret can carry surrounding whitespace/newlines, wrapping quotes, or a
+          # leading "OPENROUTER_API_KEY=" prefix; any of those land in the
+          # Authorization header and OpenRouter rejects it as "Missing Authentication
+          # header" (a 401 that looks like a bad key but is a malformed header).
+          # The previous fix stripped only whitespace, leaving quotes/prefix → still 401.
+          _strip() { printf '%s' "$1" | tr -d '[:space:]' | sed -e 's/^"//;s/"$//' -e "s/^'//;s/'\$//"; }
+          KEY="$(_strip "$RAW_OPENROUTER_API_KEY")"
+          # Drop a leading "OPENROUTER_API_KEY=" if the secret was stored with it.
+          case "$KEY" in OPENROUTER_API_KEY=*) KEY="${KEY#OPENROUTER_API_KEY=}";; esac
+          KEY="$(_strip "$KEY")"
+          [ -n "$KEY" ] || { echo "::error::OPENROUTER_API_KEY secret is not set."; exit 1; }
+          echo "::add-mask::$KEY"
+          export OPENROUTER_API_KEY="$KEY"
+          AGENT_MODEL="$(_strip "$RAW_AGENT_MODEL")"
+          PARSING_MODEL="$(_strip "$RAW_PARSING_MODEL")"
+          export AGENT_MODEL="${AGENT_MODEL:-google/gemini-3-flash-preview}"
+          export PARSING_MODEL="${PARSING_MODEL:-google/gemini-3.1-flash-lite-preview}"
+          echo "Provider: openrouter; key length: ${#OPENROUTER_API_KEY}"
+          # Preflight the key against OpenRouter so a malformed/expired key fails here
+          # with a clear message instead of deep inside the engine's retry loop.
+          PRE=$(curl -sS -o /dev/null -w "%{http_code}" -H "Authorization: Bearer $OPENROUTER_API_KEY" \
+            --max-time 10 https://openrouter.ai/api/v1/auth/key || echo "curl-fail")
+          echo "OpenRouter /auth/key preflight: HTTP $PRE"
+          [ "$PRE" = "200" ] || { echo "::error::OpenRouter rejected the key (HTTP $PRE). Check the OPENROUTER_API_KEY secret value (no quotes/prefix/newline)."; exit 1; }
+          mkdir -p "$OUT_DIR"
+          # Run the same full-analysis path the review action uses for a base.
+          uv run python "$ACTION_PATH/scripts/cb_engine.py" base \
+            --repo "$TARGET" \
+            --out "$OUT_DIR" \
+            --name "$REPO_NAME" \
+            --run-id "${GITHUB_RUN_ID}-${GITHUB_RUN_ATTEMPT}-baseline" \
+            --depth "$DEPTH" \
+            --source-sha "$MAIN_SHA"
+          [ -f "$OUT_DIR/analysis.json" ] || { echo "::error::Baseline analysis ran but analysis.json is missing."; exit 1; }
+          # Optional health report, if the engine produced one.
+          uv run python "$ACTION_PATH/scripts/cb_engine.py" health \
+            --artifact-dir "$OUT_DIR" \
+            --repo "$TARGET" \
+            --name "$REPO_NAME" \
+            --issues-out "${RUNNER_TEMP}/cb-issues.txt" || true
+
+      - name: Commit baseline to main
+        shell: bash
+        env:
+          OUT_DIR: ${{ runner.temp }}/cb-baseline
+        run: |
+          mkdir -p .codeboarding/health
+          cp "$OUT_DIR/analysis.json" .codeboarding/analysis.json
+          if [ -f "$OUT_DIR/health/health_report.json" ]; then
+            cp "$OUT_DIR/health/health_report.json" .codeboarding/health/health_report.json
+          fi
+          git add .codeboarding/analysis.json .codeboarding/health/health_report.json 2>/dev/null || git add .codeboarding/analysis.json
+          if git diff --cached --quiet; then
+            echo "::notice::Baseline already current; nothing to commit."
+            exit 0
+          fi
+          git config user.name "codeboarding[bot]"
+          git config user.email "codeboarding[bot]@users.noreply.github.com"
+          git commit -m "chore(codeboarding): refresh architecture baseline [skip ci]"
+          git push
+          echo "Committed refreshed baseline to ${GITHUB_REF_NAME} ($(git rev-parse --short HEAD))."