#!/usr/bin/env bash # ───────────────────────────────────────────────────────────────────────────── # UBS Meta-Runner (v1.0) # Unified dispatcher for Ultimate Bug Scanner across JS/TS, Python, C/C++, Rust, Go, Java, Ruby, Swift, C# # - Detects languages # - Ensures modules (lazy download) # - Runs modules concurrently # - Merges outputs (text/json/sarif) with jq # ───────────────────────────────────────────────────────────────────────────── # ───────────────────────────────────────────────────────────────────────────── # Bail early on ancient bash (macOS ships bash 3.2 which lacks associative # arrays, `declare -A`, `readarray`, etc.). Keep this check before `set -E` # so it works even under the stock /bin/bash. # ───────────────────────────────────────────────────────────────────────────── if [ "${BASH_VERSINFO[0]:-0}" -lt 4 ]; then echo "ERROR: UBS requires bash >= 4.0 (you have ${BASH_VERSION:-unknown})." >&2 echo "" >&2 echo "macOS ships bash 3.2 due to licensing. Install a modern bash with:" >&2 echo " brew install bash" >&2 echo "" >&2 echo "Then re-run this script with: /opt/homebrew/bin/bash $0 \"\$@\"" >&2 echo "Or add /opt/homebrew/bin/bash to /etc/shells and chsh." >&2 exit 1 fi set -Eeuo pipefail shopt -s lastpipe || true trap '' SIGPIPE 2>/dev/null || true UBS_VERSION="5.0.7" REPO_RAW="https://raw.githubusercontent.com/Dicklesworthstone/ultimate_bug_scanner/master" MODULE_PATH_TEMPLATE="$REPO_RAW/modules/ubs-%s.sh" # Known-good module digests (sha256) for supply-chain verification. 
# Map of language key -> pinned sha256 of its downloadable scanner module.
declare -A MODULE_CHECKSUMS=(
  [cpp]='7feb11e7e8ad5bcd2771a7f809521233bc69fd97a97ff07d0ca4e40d2831b910'
  [csharp]='f3d38ad3842780263765d8b6718cc459514119f780cc1d39c9425bf0bf9a51a1'
  [golang]='464d15de72457a522806ec92d9b4a8a24c7b23233baa2204225b41cb7b540858'
  [java]='e91cf81a39f9323292b7cd0778a9ee56ed879a25eaea612ac4c289dce8c6560b'
  [js]='21d267683f91b226880185a7ae63a1de65ebdbc88bcf299c0e398ce749c9a66c'
  [python]='8c4a4dc6ededeaeeed5080755c0b23ab4821a2b63633493fc1f332280da029b9'
  [ruby]='90d4279f66795ba08d49b99a881466e8078068bc704eaa7cab3f73751af4c5af'
  [rust]='8c183151bf2416f9a4c98060a96d28dd2365e9d01a20c98852473ec6d6661784'
  [swift]='1429436c7de226ef2302dc8860e9737a44cbf23028da97437a0c89baa6b7870b'
)
# Helper assets used by some modules (AST correlation and type narrowing).
# Keys are repo-relative paths; values are pinned sha256 digests.
declare -A HELPER_CHECKSUMS=(
  ['helpers/async_task_handles_csharp.py']='a1efff32352dab3dafce18e96a39a1bd2fa4085305ba1604a799fbd3e09d3022'
  ['helpers/resource_lifecycle_cpp.py']='efc9f28047a23246589399309acacea675d2fe2354d011e4c667fdcaebf7dfa8'
  ['helpers/resource_lifecycle_csharp.py']='6a3562049d3e616781ccf941a56a8abc1925fd6b0d95d510a66a35118ee95f28'
  ['helpers/resource_lifecycle_go.go']='10215d2c772dd7905a7e9c60a56899a9d702f1c950e1bfd30d4eb90b190e38bd'
  ['helpers/resource_lifecycle_java.py']='c005da1519eaa751ccf6fa45f99f884aaa30492f91b7c1b527f7f9b782df39f1'
  ['helpers/resource_lifecycle_py.py']='1e884ff42c988fa6a19f9b8f8375bde2334ebcde61735bc4f10b7dc3c900483e'
  ['helpers/resource_lifecycle_ruby.py']='beffcd5bcac833e4dba7f49e04e296837846eff46580eab27565d1cb429b1dc2'
  ['helpers/resource_lifecycle_swift.py']='33a78e83acdffaf0d05b05d240bff5f408d55cd9798d0ae01bd69c36f3afbd0f'
  ['helpers/type_narrowing_csharp.py']='b9b0c16f67608dfc79addcb44d0638ef7e4af96840220bdd671e98ac1f5ca12c'
  ['helpers/type_narrowing_kotlin.py']='6f0f4482e8c349d15ac2830956baf193eedd2461d1ef836267c78da86c78ad79'
  ['helpers/type_narrowing_rust.py']='355ad60ce6dffb9a7c63169cb83705854612c931e2e8c3a166a81b0cb810647f'
  ['helpers/type_narrowing_swift.py']='f950bafa92391964e4779c77d37dcc11b0ffeab9bc351be439b4709c0f01b41a'
  ['helpers/type_narrowing_ts.js']='e129ecf4fb0999dd868780a2a67f422a3cc4ecc17866f21a2a27abfa202bf631'
)
# ─────────────────────────────────────────────────────────────────────────────
# Capabilities & helpers (must be defined before first use)
# ─────────────────────────────────────────────────────────────────────────────
# need_cmd NAME — succeed iff NAME is resolvable as a command.
need_cmd(){ command -v "$1" >/dev/null 2>&1; }
# date_iso — stable UTC ISO-8601 timestamp in CI mode, local time otherwise.
date_iso(){ if [[ "${CI_MODE:-0}" -eq 1 ]]; then date -u '+%Y-%m-%dT%H:%M:%SZ'; else date '+%Y-%m-%d %H:%M:%S'; fi; }
# json_escape STR — escape backslash, quote, LF, CR and TAB for embedding in
# JSON string literals. Other control characters are NOT escaped here.
json_escape(){
  local s="${1:-}"
  s=${s//\\/\\\\}
  s=${s//\"/\\\"}
  s=${s//$'\n'/\\n}
  s=${s//$'\r'/\\r}
  s=${s//$'\t'/\\t}
  printf '%s' "$s"
}
# load_ignore_patterns FILE — parse a .ubsignore-style file (one glob per
# line, '#' comments) and append the de-duplicated patterns to
# GLOBAL_EXCLUDE_PATTERNS (comma-separated). Silently a no-op if FILE is
# missing; warns and skips if python3 is unavailable.
load_ignore_patterns(){
  local file="$1"
  [[ -f "$file" ]] || return 0
  if ! need_cmd python3; then
    say "${YELLOW}${WARN}${RESET} python3 is required to parse ignore file $file (skipping)"
    return 0
  fi
  local csv
  csv=$(python3 - "$file" <<'PY' 2>/dev/null
import sys, pathlib
path = pathlib.Path(sys.argv[1])
if not path.exists():
    sys.exit(0)
patterns = []
seen = set()
for raw in path.read_text().splitlines():
    stripped = raw.strip()
    if not stripped or stripped.startswith('#'):
        continue
    stripped = stripped.rstrip('/')
    if stripped.startswith('./'):
        stripped = stripped[2:]
    if not stripped or stripped in seen:
        continue
    seen.add(stripped)
    patterns.append(stripped)
print(",".join(patterns))
PY
)
  csv="${csv//$'\n'/}"
  csv="${csv%,}"
  if [[ -n "$csv" ]]; then
    if [[ -n "$GLOBAL_EXCLUDE_PATTERNS" ]]; then
      GLOBAL_EXCLUDE_PATTERNS="$GLOBAL_EXCLUDE_PATTERNS,$csv"
    else
      GLOBAL_EXCLUDE_PATTERNS="$csv"
    fi
    local human="${csv//,/ }"
    say "${DIM}${INFO}${RESET} Ignoring paths from ${file} → ${human}"
  fi
}
# Repo-relative helper assets to download; digests live in HELPER_CHECKSUMS.
HELPER_ASSETS=(
  "helpers/async_task_handles_csharp.py"
  "helpers/resource_lifecycle_cpp.py"
  "helpers/resource_lifecycle_csharp.py"
  "helpers/resource_lifecycle_py.py"
  "helpers/resource_lifecycle_go.go"
  "helpers/resource_lifecycle_java.py"
  "helpers/resource_lifecycle_ruby.py"
  "helpers/resource_lifecycle_swift.py"
  "helpers/type_narrowing_csharp.py"
  "helpers/type_narrowing_ts.js"
  "helpers/type_narrowing_rust.py"
  "helpers/type_narrowing_kotlin.py"
  "helpers/type_narrowing_swift.py"
)
HELPERS_READY=0
# Pinned ast-grep release for tool-cache auto-provisioning (JS/TS accuracy).
AST_GREP_VERSION="0.40.1"
AST_GREP_BASE_URL="https://github.com/ast-grep/ast-grep/releases/download/${AST_GREP_VERSION}"
TOOLS_DIR_DEFAULT="${XDG_DATA_HOME:-$HOME/.local/share}/ubs/tools"
TOOLS_DIR="${UBS_TOOLS_DIR:-$TOOLS_DIR_DEFAULT}"
# Known-good ast-grep asset digests (sha256) for supply-chain verification.
declare -A AST_GREP_ASSET_SHA256=(
  [aarch64-apple-darwin]='d40d260d6a2c6c6963079e79d3c57e7988b2de08edca7cfa6c270b5fef591dd7'
  [x86_64-apple-darwin]='1ffefbce66ceb4eabd307157ca02991d9734adfb43ac9f4b298788e935b6e04a'
  [aarch64-unknown-linux-gnu]='24f7d0a99dfa45cf65c6e175e1bceaac24f04d2b84807d832c4205a17d2270ab'
  [x86_64-unknown-linux-gnu]='774d6080dedbf8859a51e78d2be1cb84715454627b3995c2ff533ed755975012'
  [x86_64-pc-windows-msvc]='4ac3d772c3d87aff8913708219ad3ca73cff2fff4846fd12f9967e87e55fc94e'
)
# Colors (respect NO_COLOR or non-tty)
if [[ -n "${NO_COLOR:-}" || ! -t 1 ]]; then
  RED= GREEN= YELLOW= BLUE= MAGENTA= CYAN= WHITE= GRAY= BOLD= DIM= RESET=
else
  RED='\033[0;31m'; GREEN='\033[0;32m'; YELLOW='\033[1;33m'; BLUE='\033[0;34m'
  MAGENTA='\033[0;35m'; CYAN='\033[0;36m'; WHITE='\033[1;37m'; GRAY='\033[0;90m'
  BOLD='\033[1m'; DIM='\033[2m'; RESET='\033[0m'
fi
CHECK="✓"; WARN="⚠"; INFO="ℹ"; X="✗"
# say MSG… — human-facing output. When the selected FORMAT is a machine
# format (json/jsonl/sarif/toon), route to stderr so stdout stays parseable.
say(){
  if [[ "${FORMAT:-text}" == "json" || "${FORMAT:-text}" == "jsonl" || "${FORMAT:-text}" == "sarif" || "${FORMAT:-text}" == "toon" ]]; then
    echo -e "$*" >&2
  else
    echo -e "$*"
  fi
}
# say_err MSG… — always stderr.
say_err(){ echo -e "$*" >&2; }
# looks_like_toon_rust_encoder BIN — return 0 iff BIN appears to be the Rust
# `tru` TOON encoder (probed via --help banner or --version prefix). The
# Node.js `toon` CLI is rejected by basename before any probe is run.
looks_like_toon_rust_encoder(){
  local bin="${1:-}"
  [[ -z "$bin" ]] && return 1
  # Hard ban: never accept (or invoke) the Node.js encoder as the TOON backend.
  local base="${bin##*/}"
  if [[ "$base" == "toon" || "$base" == "toon.exe" ]]; then
    return 1
  fi
  # `tru --help` begins with "TOON reference implementation in Rust (JSON <-> TOON)".
  # `tru --version` prints "tru X.Y.Z".
  local help ver
  help="$("$bin" --help 2>&1 | head -n 5 || true)"
  if [[ "$help" == *"TOON reference implementation in Rust"* ]]; then
    return 0
  fi
  ver="$("$bin" --version 2>&1 | head -n 1 || true)"
  if [[ "$ver" =~ ^tru[[:space:]][0-9] ]]; then
    return 0
  fi
  return 1
}
# print_with_permalinks FILE — echo FILE, appending a GitHub blob permalink
# "(URL#Lnn)" to lines that start with "path:line[:col]". Falls back to plain
# cat when GIT_BLOB_BASE is unset or the python rewrite fails.
print_with_permalinks(){
  local file="$1"
  if [[ -z "$file" || ! -s "$file" ]]; then return; fi
  if [[ -z "$GIT_BLOB_BASE" ]]; then
    cat "$file"
    return
  fi
  python3 - "$SOURCE_PROJECT_DIR" "$GIT_BLOB_BASE" "$file" <<'PY' 2>/dev/null || cat "$file"
import sys, pathlib, re
root = pathlib.Path(sys.argv[1]).resolve()
blob = sys.argv[2].rstrip('/')
input_path = pathlib.Path(sys.argv[3])
pattern = re.compile(r'^(\s*)((?:[A-Za-z]:)?[^:]+?):(\d+)(?::(\d+))?')
def to_url(path_str, line):
    candidate = pathlib.Path(path_str)
    if not candidate.is_absolute():
        candidate = root / candidate
    try:
        resolved = candidate.resolve(strict=True)
    except Exception:
        return None
    if not resolved.is_file():
        return None
    try:
        rel = resolved.relative_to(root)
    except Exception:
        return None
    return f"{blob}/{rel.as_posix()}#L{line}"
with input_path.open('r', encoding='utf-8', errors='ignore') as fh:
    for raw in fh:
        m = pattern.match(raw)
        if not m:
            sys.stdout.write(raw)
            continue
        path_str = (m.group(2) or "").strip()
        url = to_url(path_str, m.group(3))
        if not url:
            sys.stdout.write(raw)
            continue
        sys.stdout.write(raw.rstrip('\n') + f" ({url})\n")
PY
}
# ERR trap handler: report exit code, offending line and command, then exit
# with the same status. Installed with set -E so it fires inside functions.
on_err(){ local ec=$? ln=${BASH_LINENO[0]:-?} cmd=${BASH_COMMAND:-?}; say "${RED}${BOLD}Error${RESET}${DIM} (exit $ec)${RESET} ${WHITE}line $ln:${RESET} $cmd"; exit $ec; }
trap on_err ERR
# ─────────────────────────────────────────────────────────────────────────────
# CLI
# ─────────────────────────────────────────────────────────────────────────────
PROJECT_DIR="."
# Format precedence: CLI > UBS_OUTPUT_FORMAT > TOON_DEFAULT_FORMAT > "text"
FORMAT="${UBS_OUTPUT_FORMAT:-${TOON_DEFAULT_FORMAT:-text}}"  # text|json|jsonl|sarif|toon
# TOON encoder binary (default: tru from toon_rust; never use the Node.js `toon` CLI)
# Resolution order: TOON_TRU_BIN > TOON_BIN > tru
TOON_BIN="${TOON_TRU_BIN:-${TOON_BIN:-tru}}"
CI_MODE=0
FAIL_ON_WARNING=0
VERBOSE=0
QUIET=0
ONLY_LANGS=""     # csv: js,python,cpp,rust
EXCLUDE_LANGS=""  # csv
IGNORE_FILE=""
DEFAULT_IGNORES="node_modules,venv,.venv,env,.env,site-packages,dist,build,vendor,target,bin,obj,.idea,.vscode,.git,.hg,.svn,__pycache__,.mypy_cache,.pytest_cache,.ruff_cache,coverage,.gradle,DerivedData,bundler,gems,wheels"
# Safety guards: maximum directory size (MB) and whether to refuse home/root dirs
MAX_DIR_SIZE_MB="${UBS_MAX_DIR_SIZE_MB:-1000}"  # 1GB default; set 0 to disable
SKIP_SIZE_CHECK="${UBS_SKIP_SIZE_CHECK:-0}"
REFUSE_HOME_ROOT="${UBS_REFUSE_HOME_ROOT:-1}"   # 1 = refuse, 0 = allow
GLOBAL_EXCLUDE_PATTERNS="$DEFAULT_IGNORES"
FILTERED_PROJECT_DIR=""
MODULE_DIR_DEFAULT="${XDG_DATA_HOME:-$HOME/.local/share}/ubs/modules"
MODULE_DIR="$MODULE_DIR_DEFAULT"
UPDATE_MODULES=0
JOBS="${JOBS:-0}"
SKIP_TYPE_NARROWING=0
CSHARP_MODULE_ARGS=()
MODE="scan"
SESSION_ENTRIES=1
SESSION_RAW=0
SESSION_LOG_DIR_OVERRIDE=""
VERIFY_MODULE_ERR=""
VERIFY_HELPER_ERR=""
ALL_LANGS=(js python cpp rust golang java ruby swift csharp)
UPDATE_ONLY=0
FORCE_SELF_UPDATE=0
CATEGORY_FILTER=""
COMPARISON_FILE=""
REPORT_JSON_PATH=""
HTML_REPORT_PATH=""
SHAREABLE_MODE=0
GIT_MODE=""    # staged, diff, or empty
SCAN_FILES=()  # explicit file list from --files or multiple positional args
GIT_REMOTE_URL=""
GIT_REMOTE_HTTP=""
GIT_COMMIT_SHA=""
GIT_BLOB_BASE=""
SARIF_AUTOMATION_ID=""
SHOW_VERSION=0
BEADS_JSONL_PATH=""
SUGGEST_IGNORE=0
JSONL_DETAIL=1  # 1=include findings, 0=summary only (for backward compat)
# Tool cache / JS AST engine
AST_GREP_BIN=""
AST_GREP_SOURCE=""
# Subcommand detection: a leading "doctor" or "sessions"/"session-log" word
# switches MODE before option parsing.
if [[ "${1:-}" == "doctor" ]]; then
  MODE="doctor"
  shift
elif [[ "${1:-}" == "sessions" || "${1:-}" == "session-log" ]]; then
  MODE="sessions"
  shift
fi
# usage — print full CLI help to stderr.
# FIX: was `cat <&2`, which redirected stdin from fd 2 and left the help text
# to be executed as shell commands; restored the intended heredoc.
usage() {
  cat <<USAGE >&2
Usage:
  ubs [options] [PROJECT_DIR]
  ubs [options] FILE1 FILE2 ...
  ubs --files FILE1,FILE2,... [options] [PROJECT_DIR]
  ubs doctor [options]
  ubs sessions [--entries N] [--raw]

Options:
  --format=FMT           text|json|jsonl|sarif|toon (default: text)
  --version              Print version and exit
  --ci                   CI mode (stable timestamps)
  --fail-on-warning      Exit non-zero if warnings or critical exist
  -v, --verbose          Pass -v to child scanners (if supported)
  -q, --quiet            Reduce console output (also passes -q to scanners)
  --only=CSV             Restrict to languages: js,python,c,cpp,rust,golang,java,ruby,swift,csharp,cs
  --exclude=CSV          Exclude languages
  --module-dir=DIR       Where to store/lookup modules (default: $MODULE_DIR_DEFAULT)
  --category=CSV         Focus on category packs (e.g., resource-lifecycle for AST lifecycle analyzers)
  --comparison=FILE      Baseline JSON to diff combined results against
  --report-json=FILE     Write combined summary JSON to FILE
  --html-report=FILE     Emit shareable HTML report to FILE
  --beads-jsonl=FILE     Also write combined findings to JSONL for Beads/strung
  --jsonl-summary-only   JSONL output: emit only summary counts, no individual findings
  --suggest-ignore       Print large-directory ignore suggestions (without modifying files)
  --update               Update the installed ubs binary and exit
  --non-interactive      No-op (accepted for installer/cron compatibility)
  --update-modules       Force re-download of modules before run
  --jobs=N               Parallelism hint (passed to children if supported)
  --ignore-file=PATH     Read additional ignore globs (default: PROJECT/.ubsignore if present)
  --skip-size-check      Skip directory size guard (use with care)
  --skip-type-narrowing  Skip JS/Rust/Kotlin/Swift/C# type narrowing checks (falls back to basic heuristics)
  --no-dotnet            Pass through to the C# module: skip dotnet checks
  --no-build             Pass through to the C# module: skip dotnet build
  --no-test              Pass through to the C# module: skip dotnet test
  --no-format            Pass through to the C# module: skip dotnet format
  --no-deps              Pass through to the C# module: skip dotnet package checks
  --dotnet-target=PATH   Pass through to the C# module: select solution/project for dotnet commands
  --no-auto-update       Disable auto-update (even if UBS_ENABLE_AUTO_UPDATE=1)
  --staged               Scan only files staged for commit (git index)
  --diff, --git-diff     Scan only modified files (working tree vs HEAD)
  --files=F1,F2,...      Scan only the listed files (comma or space separated)
  -h, --help             Show this help

Environment Variables:
  UBS_OUTPUT_FORMAT=FMT    Default output format (text|json|jsonl|sarif|toon)
                           Overridden by --format CLI flag
  TOON_DEFAULT_FORMAT=FMT  Global fallback format if UBS_OUTPUT_FORMAT not set
  TOON_TRU_BIN=PATH        Explicit path to tru encoder (overrides TOON_BIN)
  TOON_BIN=PATH            TOON encoder binary (default: tru)
                           Set to a specific toon_rust encoder path if needed (do not use Node.js toon)
  UBS_MAX_DIR_SIZE_MB=N    Max directory size in MB before refusing to scan (default: 1000)
                           Set to 0 to disable this safety check
  UBS_SKIP_SIZE_CHECK=1    Skip directory size guard entirely
  UBS_REFUSE_HOME_ROOT=0|1 Whether to refuse scanning \$HOME or / (default: 1)
                           Set to 0 to allow scanning these directories

Examples:
  ubs .                          # auto-detect languages and scan
  ubs --staged                   # scan only staged files (pre-commit style)
  ubs --diff                     # scan only modified files (quick check)
  ubs --files=a.js,b.py .        # scan specific files in current dir
  ubs src/a.js src/b.py          # multiple positional args (same effect)
  ubs --format=json --ci .       # machine-readable combined JSON
  ubs --format=toon .            # TOON format (~50% smaller than JSON)
  ubs --only=js,python .         # restrict language set
  ubs doctor --fix               # validate cached modules & redownload corrupted copies
  ubs sessions --entries 1       # view the most recent installer summary
  UBS_OUTPUT_FORMAT=toon ubs .   # set default format via env var
  UBS_MAX_DIR_SIZE_MB=0 ubs .    # disable size check for large directories
USAGE
}
# doctor_usage — help for the `ubs doctor` subcommand (same heredoc fix).
doctor_usage(){
  cat <<DOC >&2
Usage: ubs doctor [options]

Options:
  --module-dir=DIR  Override the module cache directory (default: $MODULE_DIR_DEFAULT)
  --fix             Automatically download or refresh cached modules
  -h, --help        Show this help message
DOC
}
# sessions_usage — help for the `ubs sessions` subcommand (same heredoc fix).
sessions_usage(){
  cat <<SESS >&2
Usage: ubs sessions [options]

Options:
  --entries=N       Show the last N install sessions (default: 1)
  --raw             Print the entire session log as-is
  --config-dir=DIR  Override the config directory (defaults to \$XDG_CONFIG_HOME/ubs)
  -h, --help        Show this help message
SESS
}
# show_session_history ENTRIES RAW OVERRIDE_DIR — display the installer's
# session.md log. RAW=1 dumps the file; otherwise the last ENTRIES blocks
# (separated by "---" lines) are printed via python3. Exits the process.
show_session_history(){
  local entries="$1"
  local raw="$2"
  local override="$3"
  local base_dir
  if [[ -n "$override" ]]; then
    base_dir="$override"
  else
    base_dir="${XDG_CONFIG_HOME:-$HOME/.config}/ubs"
  fi
  local log_file="$base_dir/session.md"
  if [[ ! -f "$log_file" ]]; then
    say "${RED}$X no session history found${RESET} (expected at ${log_file})"
    exit 1
  fi
  # Sanitize ENTRIES: non-numeric or <1 falls back to 1.
  local entries_int=1
  if [[ "$entries" =~ ^[0-9]+$ ]]; then
    entries_int="$entries"
  fi
  if [[ "$entries_int" -lt 1 ]]; then
    entries_int=1
  fi
  if [[ "$raw" -eq 1 ]]; then
    say "${BLUE}${INFO}${RESET} Showing session log from ${log_file}"
    cat "$log_file"
    exit 0
  fi
  if ! need_cmd python3; then
    say "${RED}$X python3 required${RESET} to format session history"
    exit 1
  fi
  say "${BLUE}${INFO}${RESET} Showing last ${entries_int} session(s) from ${log_file}"
  python3 - "$log_file" "$entries_int" <<'PY' 2>/dev/null
import sys, pathlib
path = pathlib.Path(sys.argv[1])
entries = max(1, int(sys.argv[2]))
text = path.read_text(encoding='utf-8', errors='ignore').strip()
if not text:
    print("No session entries recorded.")
    sys.exit(1)
sections = [block.strip() for block in text.split('\n---\n') if block.strip()]
if not sections:
    print("No session entries recorded.")
    sys.exit(1)
subset = sections[-entries:]
for idx, block in enumerate(subset):
    print(block)
    if idx != len(subset) - 1:
        print("\n---\n")
PY
}
DOCTOR_FIX=0
# Per-mode option parsing. Each unknown option prints the relevant usage and
# exits 2; value-taking long options accept both --opt=V and --opt V forms.
if [[ "$MODE" == "doctor" ]]; then
  while [[ $# -gt 0 ]]; do
    case "$1" in
      --module-dir=*) MODULE_DIR="${1#*=}"; shift;;
      --module-dir)
        if [[ $# -lt 2 ]]; then doctor_usage; exit 2; fi
        shift; MODULE_DIR="$1"; shift;;
      --fix) DOCTOR_FIX=1; shift;;
      -h|--help) doctor_usage; exit 0;;
      *)
        say "${RED}$X unknown doctor option${RESET}: $1"
        doctor_usage
        exit 2
        ;;
    esac
  done
elif [[ "$MODE" == "sessions" ]]; then
  while [[ $# -gt 0 ]]; do
    case "$1" in
      --entries=*) SESSION_ENTRIES="${1#*=}"; shift;;
      --entries)
        if [[ $# -lt 2 ]]; then sessions_usage; exit 2; fi
        shift; SESSION_ENTRIES="$1"; shift;;
      --raw) SESSION_RAW=1; shift;;
      --config-dir=*) SESSION_LOG_DIR_OVERRIDE="${1#*=}"; shift;;
      --config-dir)
        if [[ $# -lt 2 ]]; then sessions_usage; exit 2; fi
        shift; SESSION_LOG_DIR_OVERRIDE="$1"; shift;;
      -h|--help) sessions_usage; exit 0;;
      *)
        say "${RED}$X unknown sessions option${RESET}: $1"
        sessions_usage
        exit 2
        ;;
    esac
  done
else
  while [[ $# -gt 0 ]]; do
    case "$1" in
      --format=*) FORMAT="${1#*=}"; shift;;
      --version|-V) SHOW_VERSION=1; shift;;
      --ci) CI_MODE=1; shift;;
      --fail-on-warning) FAIL_ON_WARNING=1; shift;;
      -v|--verbose) VERBOSE=1; shift;;
      -q|--quiet) QUIET=1; shift;;
      --update) UPDATE_ONLY=1; FORCE_SELF_UPDATE=1; shift;;
      --non-interactive) shift;;
      --only=*) ONLY_LANGS="${1#*=}"; shift;;
      --exclude=*) EXCLUDE_LANGS="${1#*=}"; shift;;
      --category=*) CATEGORY_FILTER="${1#*=}"; shift;;
      --category)
        if [[ $# -lt 2 ]]; then usage; exit 2; fi
        shift; CATEGORY_FILTER="$1"; shift;;
      --comparison=*|--baseline=*) COMPARISON_FILE="${1#*=}"; SHAREABLE_MODE=1; SARIF_AUTOMATION_ID="ubs-comparison"; shift;;
      --comparison|--baseline)
        if [[ $# -lt 2 ]]; then usage; exit 2; fi
        shift; COMPARISON_FILE="$1"; SHAREABLE_MODE=1; SARIF_AUTOMATION_ID="ubs-comparison"; shift;;
      --report-json=*) REPORT_JSON_PATH="${1#*=}"; SHAREABLE_MODE=1; shift;;
      --report-json)
        if [[ $# -lt 2 ]]; then usage; exit 2; fi
        shift; REPORT_JSON_PATH="$1"; SHAREABLE_MODE=1; shift;;
      --html-report=*) HTML_REPORT_PATH="${1#*=}"; SHAREABLE_MODE=1; shift;;
      --html-report)
        if [[ $# -lt 2 ]]; then usage; exit 2; fi
        shift; HTML_REPORT_PATH="$1"; SHAREABLE_MODE=1; shift;;
      --beads-jsonl=*) BEADS_JSONL_PATH="${1#*=}"; shift;;
      --beads-jsonl)
        if [[ $# -lt 2 ]]; then usage; exit 2; fi
        shift; BEADS_JSONL_PATH="$1"; shift;;
      --suggest-ignore) SUGGEST_IGNORE=1; shift;;
      --jsonl-summary-only) JSONL_DETAIL=0; shift;;
      --ignore-file=*) IGNORE_FILE="${1#*=}"; shift;;
      --skip-size-check) SKIP_SIZE_CHECK=1; shift;;
      --module-dir=*) MODULE_DIR="${1#*=}"; shift;;
      --module-dir)
        if [[ $# -lt 2 ]]; then usage; exit 2; fi
        shift; MODULE_DIR="$1"; shift;;
      --update-modules) UPDATE_MODULES=1; shift;;
      --jobs=*) JOBS="${1#*=}"; shift;;
      --skip-type-narrowing) SKIP_TYPE_NARROWING=1; shift;;
      --no-dotnet|--no-build|--no-test|--no-format|--no-deps)
        CSHARP_MODULE_ARGS+=("$1")
        shift;;
      --dotnet-target=*)
        CSHARP_MODULE_ARGS+=("$1")
        shift;;
      --dotnet-target)
        if [[ $# -lt 2 ]]; then usage; exit 2; fi
        CSHARP_MODULE_ARGS+=("$1" "$2")
        shift 2;;
      --no-auto-update) export UBS_NO_AUTO_UPDATE=1; shift;;
      --staged) GIT_MODE="staged"; shift;;
      --diff|--git-diff) GIT_MODE="diff"; shift;;
      --files=*) IFS=',' read -r -a _f <<<"${1#*=}"; SCAN_FILES+=("${_f[@]}"); shift;;
      --files)
        if [[ $# -lt 2 ]]; then usage; exit 2; fi
        shift; IFS=',' read -r -a _f <<<"$1"; SCAN_FILES+=("${_f[@]}"); shift;;
      --profile=*)
        export UBS_PROFILE="${1#*=}"
        if [[ "$UBS_PROFILE" == "strict" ]]; then FAIL_ON_WARNING=1; fi
        shift;;
      --skip=*)
        export UBS_SKIP_CATEGORIES="${1#*=}"
        shift;;
      -h|--help) usage; exit 0;;
      *)
        if [[ "$PROJECT_DIR" == "." ]]; then
          # First positional arg: could be a directory OR a file
          if [[ -d "$1" ]]; then
            PROJECT_DIR="$1"
          else
            SCAN_FILES+=("$1")
          fi
        else
          # Additional positional args: accumulate as files
          SCAN_FILES+=("$1")
        fi
        shift;;
    esac
  done
  # Canonicalize PROJECT_DIR (absolute, symlink-free); a file target keeps its
  # basename appended to the canonicalized parent directory.
  if [[ "$UPDATE_ONLY" -eq 1 ]]; then
    PROJECT_DIR="$(pwd -P)"
  else
    if [[ -d "$PROJECT_DIR" ]]; then
      if ! PROJECT_DIR="$(cd "$PROJECT_DIR" 2>/dev/null && pwd -P)"; then
        say "${RED}$X cannot access project directory${RESET}: $PROJECT_DIR"
        exit 2
      fi
    elif [[ -f "$PROJECT_DIR" ]]; then
      proj_dir="$(dirname "$PROJECT_DIR")"
      proj_base="$(basename "$PROJECT_DIR")"
      if ! proj_dir="$(cd "$proj_dir" 2>/dev/null && pwd -P)"; then
        say "${RED}$X cannot access project path${RESET}: $PROJECT_DIR"
        exit 2
      fi
      PROJECT_DIR="$proj_dir/$proj_base"
    else
      say "${RED}$X path not found${RESET}: $PROJECT_DIR"
      exit 2
    fi
  fi
fi
SOURCE_PROJECT_DIR="$PROJECT_DIR"
TARGETED_SCAN_MODE=0
if [[ -n "$GIT_MODE" || ${#SCAN_FILES[@]} -gt 0 ]]; then
  TARGETED_SCAN_MODE=1
fi
if [[ "$SHOW_VERSION" -eq 1 ]]; then
  short_sha=""
  # NOTE(review): this queries git in the *current working directory*, not
  # SOURCE_PROJECT_DIR — presumably intended to tag a from-checkout run of
  # ubs itself; confirm before changing.
  if git rev-parse --short HEAD >/dev/null 2>&1; then
    short_sha="$(git rev-parse --short HEAD 2>/dev/null || true)"
  fi
  say "UBS Meta-Runner v${UBS_VERSION}${short_sha:+ (git $short_sha)}"
  exit 0
fi
# Load ignore patterns early so size checks can respect .ubsignore
if [[ "$MODE" != "doctor" && "$UPDATE_ONLY" -eq 0 ]]; then
  if [[ -z "$IGNORE_FILE" && -f "$SOURCE_PROJECT_DIR/.ubsignore" ]]; then
    IGNORE_FILE="$SOURCE_PROJECT_DIR/.ubsignore"
  fi
  if [[ -n "$IGNORE_FILE" ]]; then
    load_ignore_patterns "$IGNORE_FILE"
  fi
fi
# ─────────────────────────────────────────────────────────────────────────────
# Safety guards: prevent disk exhaustion when scanning large or sensitive
# dirs.  (FIX: the word "dirs" continued the previous comment line but sat at
# the start of a new line, so bash executed the `dirs` builtin at top level,
# printing the directory stack into the runner's output. Folded into comment.)
# Fixes GitHub issue #12: UBS copies entire scan directory to /tmp
# ─────────────────────────────────────────────────────────────────────────────
# Check 1: Refuse to scan home directory or root (unless explicitly allowed)
if [[ "$TARGETED_SCAN_MODE" -eq 0 && "$REFUSE_HOME_ROOT" -eq 1 && -d "$SOURCE_PROJECT_DIR" ]]; then
  resolved_dir="$(cd "$SOURCE_PROJECT_DIR" 2>/dev/null && pwd -P)"
  if [[ "$resolved_dir" == "$HOME" ]]; then
    say "${RED}${X}${RESET} ${BOLD}Refusing to scan home directory${RESET}"
    say "${DIM}UBS copies the scan target to /tmp, which can exhaust disk space on large directories.${RESET}"
    say "${DIM}If you really want to scan \$HOME, set${RESET} UBS_REFUSE_HOME_ROOT=0"
    exit 2
  fi
  if [[ "$resolved_dir" == "/" ]]; then
    say "${RED}${X}${RESET} ${BOLD}Refusing to scan root directory${RESET}"
    say "${DIM}UBS copies the scan target to /tmp, which can exhaust disk space.${RESET}"
    say "${DIM}If you really want to scan /, set${RESET} UBS_REFUSE_HOME_ROOT=0"
    exit 2
  fi
fi
# dir_size_mb_filtered DIR [PATTERNS_CSV] — print DIR's size in whole MB,
# excluding entries matching the comma-separated glob patterns. Prefers GNU
# du when its --exclude is usable; falls back to a python walk (handles
# path-based patterns and BSD/macOS du); prints "0" if neither is available.
dir_size_mb_filtered(){
  local dir="$1"
  local patterns_csv="${2:-}"
  local result=""
  local du_can_exclude=0
  if need_cmd du; then
    local -a du_args=()
    if [[ -n "$patterns_csv" ]] && du --help 2>/dev/null | grep -q -- '--exclude'; then
      # du --exclude matches patterns against each entry's basename, not the
      # full relative path. Path-based patterns (containing '/') silently
      # fail to match anything, causing the size calculation to ignore the
      # exclusion entirely (GitHub issue #16). Detect this and fall through
      # to the Python fallback which handles path-based patterns correctly.
      local has_path_pattern=0
      local -a pats=()
      IFS=',' read -r -a pats <<<"$patterns_csv"
      for pat in "${pats[@]}"; do
        if [[ -n "$pat" ]]; then
          du_args+=( "--exclude=$pat" )
          [[ "$pat" == */* ]] && has_path_pattern=1
        fi
      done
      [[ "$has_path_pattern" -eq 0 ]] && du_can_exclude=1
    fi
    # Only use du when no patterns are needed or du supports --exclude
    # AND all patterns are simple (no path separators); otherwise fall
    # through to the Python fallback which handles exclusions correctly
    # on all platforms (fixes macOS/BSD du which lacks --exclude, and
    # path-based patterns which du --exclude silently ignores — #16).
    if [[ -z "$patterns_csv" || "$du_can_exclude" -eq 1 ]]; then
      result=$(du -sm "${du_args[@]}" "$dir" 2>/dev/null | cut -f1)
      if [[ "$result" =~ ^[0-9]+$ ]]; then
        echo "$result"
        return 0
      fi
      # Fall back to KB units (du -sk) and convert, truncating to whole MB.
      result=$(du -sk "${du_args[@]}" "$dir" 2>/dev/null | cut -f1)
      if [[ "$result" =~ ^[0-9]+$ ]]; then
        echo $((result / 1024))
        return 0
      fi
    fi
  fi
  if need_cmd python3; then
    python3 - "$dir" "$patterns_csv" <<'PY'
import fnmatch
import os
import pathlib
import sys
root = pathlib.Path(sys.argv[1]).resolve()
patterns_csv = sys.argv[2] if len(sys.argv) > 2 else ""
patterns = [p for p in patterns_csv.split(",") if p]
def excluded(rel_path, name):
    for pat in patterns:
        if fnmatch.fnmatch(rel_path, pat) or fnmatch.fnmatch(name, pat):
            return True
        for part in pathlib.Path(rel_path).parts:
            if fnmatch.fnmatch(part, pat):
                return True
    return False
total = 0
for base, dirs, files in os.walk(root, topdown=True):
    rel_root = os.path.relpath(base, root)
    pruned = []
    for d in dirs:
        rel = os.path.join(rel_root, d) if rel_root != "." else d
        if excluded(rel, d):
            continue
        pruned.append(d)
    dirs[:] = pruned
    for f in files:
        rel = os.path.join(rel_root, f) if rel_root != "." else f
        if excluded(rel, f):
            continue
        try:
            total += (pathlib.Path(base) / f).stat().st_size
        except OSError:
            pass
print(int(total / 1024 / 1024))
PY
    return 0
  fi
  echo "0"
}
# Check 2: Refuse directories larger than MAX_DIR_SIZE_MB (unless set to 0)
if [[ "$TARGETED_SCAN_MODE" -eq 0 && "$SKIP_SIZE_CHECK" -eq 0 && "$MAX_DIR_SIZE_MB" -gt 0 && -d "$SOURCE_PROJECT_DIR" ]]; then
  dir_size_mb="$(dir_size_mb_filtered "$SOURCE_PROJECT_DIR" "$GLOBAL_EXCLUDE_PATTERNS")"
  if [[ "${QUIET:-0}" -eq 0 ]]; then
    say "${DIM}${INFO}${RESET} Scan size after ignores: ${dir_size_mb}MB (limit ${MAX_DIR_SIZE_MB}MB)"
  fi
  if [[ "$dir_size_mb" -gt "$MAX_DIR_SIZE_MB" ]]; then
    say "${RED}${X}${RESET} ${BOLD}Directory too large (after ignores)${RESET}: ${dir_size_mb}MB exceeds limit of ${MAX_DIR_SIZE_MB}MB"
    say "${DIM}UBS copies the scan target to /tmp before analysis, which can exhaust disk space.${RESET}"
    say "${DIM}This safety check prevents accidental scans of large directories like \$HOME.${RESET}"
    say ""
    say "${DIM}Options:${RESET}"
    say "${DIM}  • Scan a smaller subdirectory instead${RESET}"
    say "${DIM}  • Increase the limit:${RESET} UBS_MAX_DIR_SIZE_MB=5000 ubs ..."
    say "${DIM}  • Disable the check:${RESET} UBS_MAX_DIR_SIZE_MB=0 ubs ..."
    exit 2
  fi
fi
# Category packs: currently only "resource-lifecycle" is recognized; it
# narrows the language set (unless --only was given) and exports the filter
# for child modules. Unknown filters warn and are discarded.
if [[ -n "$CATEGORY_FILTER" ]]; then
  CATEGORY_FILTER="${CATEGORY_FILTER,,}"
  if [[ "$CATEGORY_FILTER" == "resource-lifecycle" ]]; then
    SHAREABLE_MODE=$((SHAREABLE_MODE+0))
    if [[ -z "$ONLY_LANGS" ]]; then
      ONLY_LANGS="python,golang,java,swift,csharp"
    fi
    export UBS_CATEGORY_FILTER="$CATEGORY_FILTER"
  else
    say "${YELLOW}${WARN}${RESET} Unknown category filter: $CATEGORY_FILTER"
    CATEGORY_FILTER=""
    unset UBS_CATEGORY_FILTER
  fi
else
  unset UBS_CATEGORY_FILTER
fi
# ensure_dir DIR — mkdir -p or die with exit 1.
ensure_dir(){ mkdir -p "$1" 2>/dev/null || { say "${RED}$X cannot create $1${RESET}"; exit 1; }; }
script_dir(){
  # Resolve the real directory of this script, following symlinks.
  # Critical for macOS Homebrew where /opt/homebrew/bin/ubs is a relative
  # symlink (e.g. ../Cellar/ubs/5.0.7/bin/ubs). We must resolve the
  # relative target against the *symlink's* parent dir, not CWD.
  #
  # The set -E (errtrace) flag causes the ERR trap to fire inside
  # functions. Guard every cd so a failed cd never triggers on_err
  # and kills the script.
  # Fast path: use realpath if available (Linux, macOS 12.3+, Homebrew coreutils)
  local self="${BASH_SOURCE[0]}"
  if command -v realpath >/dev/null 2>&1; then
    local rp
    rp="$(realpath "$self" 2>/dev/null)" || true
    if [[ -n "$rp" ]]; then
      dirname "$rp"
      return 0
    fi
  fi
  # Fallback: manual symlink-chase loop
  local source="$self"
  while [ -L "$source" ]; do
    local link_dir
    link_dir="$(cd -P "$(dirname "$source")" 2>/dev/null && pwd)" || link_dir=""
    source="$(readlink "$source")" || true
    # If readlink returned a relative path, resolve it against the
    # directory that contained the symlink we just read.
    if [[ "$source" != /* && -n "$link_dir" ]]; then
      source="$link_dir/$source"
    fi
  done
  # Use dirname + cd -P to canonicalize; || true prevents ERR trap on failure
  local resolved
  resolved="$(cd -P "$(dirname "$source")" 2>/dev/null && pwd)" || true
  if [[ -n "$resolved" ]]; then
    echo "$resolved"
  else
    # Last resort: return dirname as-is (non-canonical but usable)
    dirname "$source"
  fi
}
# prepare_metrics_dir DIR — recreate DIR empty (best-effort, never fatal).
prepare_metrics_dir(){
  local dir="$1"
  rm -rf "$dir" 2>/dev/null || true
  mkdir -p "$dir" 2>/dev/null || true
}
# finalize_module_dir — normalize MODULE_DIR (strip trailing slashes, default
# when empty), create it, and canonicalize to an absolute physical path.
finalize_module_dir(){
  local configured="${MODULE_DIR:-}"
  if [[ -z "$configured" ]]; then
    MODULE_DIR="$MODULE_DIR_DEFAULT"
  else
    MODULE_DIR="$configured"
    while [[ "$MODULE_DIR" == */ && "$MODULE_DIR" != "/" ]]; do
      MODULE_DIR="${MODULE_DIR%/}"
    done
    [[ -z "$MODULE_DIR" ]] && MODULE_DIR="$MODULE_DIR_DEFAULT"
  fi
  ensure_dir "$MODULE_DIR"
  local resolved
  if resolved=$(cd "$MODULE_DIR" 2>/dev/null && pwd -P); then
    MODULE_DIR="$resolved"
  fi
}
# resolve_git_metadata — populate GIT_REMOTE_URL / GIT_COMMIT_SHA /
# GIT_REMOTE_HTTP / GIT_BLOB_BASE from the repo containing
# SOURCE_PROJECT_DIR. Only GitHub remotes (ssh, https, git) yield a blob
# base for permalinks; anything else clears GIT_BLOB_BASE.
resolve_git_metadata(){
  local root
  if ! root=$(git -C "$SOURCE_PROJECT_DIR" rev-parse --show-toplevel 2>/dev/null); then
    return
  fi
  local remote commit
  remote=$(git -C "$root" config --get remote.origin.url 2>/dev/null || true)
  commit=$(git -C "$root" rev-parse HEAD 2>/dev/null || true)
  [[ -n "$remote" && -n "$commit" ]] || return
  GIT_REMOTE_URL="$remote"
  GIT_COMMIT_SHA="$commit"
  GIT_REMOTE_HTTP=""
  case "$remote" in
    git@github.com:*)
      local path_part=${remote#git@github.com:}
      path_part=${path_part%.git}
      GIT_REMOTE_HTTP="https://github.com/${path_part}"
      GIT_BLOB_BASE="https://github.com/${path_part}/blob/${commit}"
      ;;
    https://github.com/*)
      local path_part=${remote#https://github.com/}
      path_part=${path_part%.git}
      GIT_REMOTE_HTTP="https://github.com/${path_part}"
      GIT_BLOB_BASE="https://github.com/${path_part}/blob/${commit}"
      ;;
    git://github.com/*)
      local path_part=${remote#git://github.com/}
      path_part=${path_part%.git}
      GIT_REMOTE_HTTP="https://github.com/${path_part}"
      GIT_BLOB_BASE="https://github.com/${path_part}/blob/${commit}"
      ;;
    *)
      GIT_BLOB_BASE=""
      ;;
  esac
}
# prepare_git_workspace MODE — build a shadow workspace in $TMPDIR_RUN
# containing only the files reported by `git diff --name-only` (MODE=staged
# uses the index, otherwise working tree vs HEAD), restricted to the scan
# subtree and filtered by GLOBAL_EXCLUDE_PATTERNS. Repoints PROJECT_DIR at
# the shadow copy. Exits 0 when nothing changed; exits non-zero on missing
# git/rsync or when outside a repo.
prepare_git_workspace(){
  local mode="$1"
  if ! need_cmd git; then
    say "${RED}$X git not found; cannot run --$mode${RESET}"
    exit 1
  fi
  local scan_root="$SOURCE_PROJECT_DIR"
  if [[ -f "$scan_root" ]]; then
    scan_root="$(dirname "$scan_root")"
  fi
  local repo_root
  if ! repo_root="$(git -C "$scan_root" rev-parse --show-toplevel 2>/dev/null)"; then
    say "${RED}$X not a git repository; cannot run --$mode${RESET}"
    exit 1
  fi
  # scan_rel: scan_root relative to repo_root ("" when scanning the whole repo).
  local scan_rel=""
  if [[ "$scan_root" == "$repo_root" ]]; then
    scan_rel=""
  elif [[ "$scan_root" == "$repo_root/"* ]]; then
    scan_rel="${scan_root#"$repo_root"/}"
  else
    say "${RED}$X scan path is outside git root; cannot run --$mode${RESET}"
    exit 1
  fi
  # Changed files (Added/Copied/Modified/Renamed only — deletions excluded).
  local raw_files=()
  if [[ "$mode" == "staged" ]]; then
    while IFS= read -r file; do [[ -n "$file" ]] && raw_files+=("$file"); done < <(
      git -C "$repo_root" diff --name-only --cached --diff-filter=ACMR
    )
  else
    while IFS= read -r file; do [[ -n "$file" ]] && raw_files+=("$file"); done < <(
      git -C "$repo_root" diff --name-only --diff-filter=ACMR HEAD
    )
  fi
  # Keep only files under the scan subtree, re-rooted relative to it.
  local files=()
  if [[ -n "$scan_rel" ]]; then
    for file in "${raw_files[@]}"; do
      if [[ "$file" == "$scan_rel/"* ]]; then
        files+=("${file#"$scan_rel"/}")
      fi
    done
  else
    files=("${raw_files[@]}")
  fi
  # Apply .ubsignore / GLOBAL_EXCLUDE_PATTERNS filtering to the staged file list
  # so that ignored paths are never copied into the shadow workspace.
  if [[ -n "$GLOBAL_EXCLUDE_PATTERNS" && ${#files[@]} -gt 0 ]] && need_cmd python3; then
    local filtered_csv
    filtered_csv=$(printf '%s\n' "${files[@]}" | python3 -c "
import sys, fnmatch, pathlib
patterns = sys.argv[1].split(',')
for line in sys.stdin:
    f = line.rstrip('\n')
    if not f:
        continue
    name = pathlib.PurePosixPath(f).name
    excluded = False
    for pat in patterns:
        if not pat:
            continue
        if fnmatch.fnmatch(f, pat) or fnmatch.fnmatch(name, pat):
            excluded = True
            break
        for part in pathlib.PurePosixPath(f).parts:
            if fnmatch.fnmatch(part, pat):
                excluded = True
                break
        if excluded:
            break
    if not excluded:
        print(f)
" "$GLOBAL_EXCLUDE_PATTERNS" 2>/dev/null) || true
    if [[ -n "$filtered_csv" ]]; then
      local filtered_files=()
      while IFS= read -r f; do
        [[ -n "$f" ]] && filtered_files+=("$f")
      done <<<"$filtered_csv"
      files=("${filtered_files[@]}")
    else
      files=()
    fi
  fi
  if [[ ${#files[@]} -eq 0 ]]; then
    say "${GREEN}${CHECK} No changed files to scan.${RESET}"
    exit 0
  fi
  if ! need_cmd rsync; then
    say "${RED}$X rsync not found; required for --$mode${RESET}"
    exit 1
  fi
  local dest="$TMPDIR_RUN/git_scan"
  rm -rf "$dest" 2>/dev/null || true
  ensure_dir "$dest"
  say "${BLUE}${INFO} Preparing shadow workspace for $mode files (${#files[@]} detected)${RESET}"
  # Use rsync with --files-from to copy only the target files while preserving hierarchy
  local file_list="$TMPDIR_RUN/files_to_scan.txt"
  printf "%s\n" "${files[@]}" > "$file_list"
  if rsync -a --files-from="$file_list" "$scan_root/" "$dest/" >/dev/null 2>&1; then
    FILTERED_PROJECT_DIR="$dest"
    PROJECT_DIR="$FILTERED_PROJECT_DIR"
    say "${DIM}${INFO}${RESET} Scanning shadow workspace at ${FILTERED_PROJECT_DIR}"
  else
    say "${RED}$X Failed to prepare shadow workspace${RESET}"
    exit 1
  fi
}
# Copy an explicit list of files (from --files or multiple positional args)
# into a shadow workspace so the rest of the pipeline scans only those files.
prepare_files_workspace(){ local scan_root="$SOURCE_PROJECT_DIR" if [[ -f "$scan_root" ]]; then scan_root="$(dirname "$scan_root")" fi # Resolve each path relative to scan_root; reject missing files local resolved=() local f rel for f in "${SCAN_FILES[@]}"; do [[ -z "$f" ]] && continue if [[ "$f" == /* ]]; then # Absolute path — make it relative to scan_root if [[ -f "$f" ]]; then rel="${f#"$scan_root"/}" resolved+=("$rel") else say "${RED}$X file not found${RESET}: $f" exit 2 fi elif [[ -f "$scan_root/$f" ]]; then resolved+=("$f") elif [[ -f "$f" ]]; then # Relative to cwd, convert to relative to scan_root local abs abs="$(cd "$(dirname "$f")" && pwd -P)/$(basename "$f")" rel="${abs#"$scan_root"/}" resolved+=("$rel") else say "${RED}$X file not found${RESET}: $f" exit 2 fi done if [[ ${#resolved[@]} -eq 0 ]]; then say "${RED}$X no valid files specified for explicit file scan${RESET}" exit 2 fi if ! need_cmd rsync; then say "${RED}$X rsync not found; required for explicit file scans${RESET}" exit 1 fi local dest="$TMPDIR_RUN/files_scan" rm -rf "$dest" 2>/dev/null || true ensure_dir "$dest" say "${BLUE}${INFO} Preparing shadow workspace for ${#resolved[@]} specified file(s)${RESET}" local file_list="$TMPDIR_RUN/explicit_files.txt" printf "%s\n" "${resolved[@]}" > "$file_list" if rsync -a --files-from="$file_list" "$scan_root/" "$dest/" >/dev/null 2>&1; then FILTERED_PROJECT_DIR="$dest" PROJECT_DIR="$FILTERED_PROJECT_DIR" say "${DIM}${INFO}${RESET} Scanning shadow workspace at ${FILTERED_PROJECT_DIR}" else say "${RED}$X Failed to prepare files workspace${RESET}" exit 1 fi } checksum_tool_name(){ if need_cmd sha256sum; then echo "sha256sum"; return 0; fi if need_cmd shasum; then echo "shasum -a 256"; return 0; fi if need_cmd openssl; then echo "openssl dgst -sha256"; return 0; fi return 1 } compute_sha256(){ local path="$1" if need_cmd sha256sum; then sha256sum "$path" | awk '{print $1}'; return 0; fi if need_cmd shasum; then shasum -a 256 "$path" | awk '{print $1}'; 
return 0; fi
  if need_cmd openssl; then openssl dgst -sha256 "$path" | awk '{print $NF}'; return 0; fi
  return 1
}
# ─────────────────────────────────────────────────────────────────────────────
# Tool cache: ast-grep (JS/TS accuracy)
# ─────────────────────────────────────────────────────────────────────────────
# Map `uname -s` to the OS half of a Rust-style target triple.
detect_os_target(){
  local raw
  raw="$(uname -s 2>/dev/null | tr '[:upper:]' '[:lower:]')"
  case "$raw" in
    darwin) echo "apple-darwin"; return 0 ;;
    linux) echo "unknown-linux-gnu"; return 0 ;;
    msys*|mingw*|cygwin*) echo "pc-windows-msvc"; return 0 ;;
  esac
  return 1
}
# Map `uname -m` to the architecture half of the target triple.
detect_arch_target(){
  local raw
  raw="$(uname -m 2>/dev/null)"
  case "$raw" in
    x86_64|amd64) echo "x86_64"; return 0 ;;
    arm64|aarch64) echo "aarch64"; return 0 ;;
  esac
  return 1
}
# Combine arch + OS into the release-asset triple, e.g. aarch64-apple-darwin.
ast_grep_target_triple(){
  local arch os
  arch="$(detect_arch_target)" || return 1
  os="$(detect_os_target)" || return 1
  echo "${arch}-${os}"
}
# Search $PATH for a working ast-grep (or its `sg` alias); print the first
# candidate that passes verify_ast_grep_bin.
find_ast_grep_in_path(){
  local -a dirs
  IFS=':' read -r -a dirs <<<"${PATH:-}"
  local name dir candidate
  for name in ast-grep sg; do
    for dir in "${dirs[@]}"; do
      [[ -n "$dir" ]] || continue
      candidate="$dir/$name"
      [[ -x "$candidate" ]] || continue
      if verify_ast_grep_bin "$candidate"; then
        echo "$candidate"
        return 0
      fi
    done
  done
  return 1
}
# Fetch $1 into $2 with curl or wget.
# FIX: both branches previously executed an unconditional `return 0` after the
# transfer, so a failed curl/wget (network error, HTTP 404 under -f) was
# reported as success — callers like ensure_ast_grep_tool_cache only noticed
# via later emptiness/checksum checks. (set -e does not help here: it is
# suspended while the function runs in an `if !` condition.) Propagate the
# downloader's real exit status instead.
download_url_to_file(){
  local url="$1" dest="$2"
  if need_cmd curl; then
    curl -fsSL "$url" -o "$dest"
    return $?
  fi
  if need_cmd wget; then
    wget -q "$url" -O "$dest"
    return $?
  fi
  return 1
}
# Extract one member of a zip archive to an explicit output path.
# Prefers python3 (no extra tooling); falls back to unzip -p.
extract_zip_member(){
  local zip_path="$1" member="$2" out_path="$3"
  if need_cmd python3; then
    python3 - "$zip_path" "$member" "$out_path" <<'PY' 2>/dev/null || return 1
import sys, zipfile
from pathlib import Path
zip_path, member, out_path = sys.argv[1:4]
z = zipfile.ZipFile(zip_path)
if member not in z.namelist():
    raise SystemExit(2)
dest = Path(out_path)
dest.parent.mkdir(parents=True, exist_ok=True)
with z.open(member) as src, dest.open('wb') as out:
    out.write(src.read())
PY
    return 0
  fi
  if need_cmd unzip; then
    unzip -p "$zip_path" "$member" >"$out_path"
    # FIX: was `return 0`, which masked unzip failures and could leave an
    # empty/partial $out_path behind looking like a successful extraction.
    return $?
  fi
  return 1
}
# Download, verify (sha256-pinned), and unpack the ast-grep release asset for
# this platform into the tool cache. Prints the binary path on success.
# Returns 1 on download/verify/extract failure, 2 when no sha256 tool exists.
ensure_ast_grep_tool_cache(){
  local target expected asset url tool_root zip_path bin_name bin_path
  target="$(ast_grep_target_triple)" || return 1
  expected="${AST_GREP_ASSET_SHA256[$target]:-}"
  [[ -n "$expected" ]] || return 1
  asset="app-${target}.zip"
  url="${AST_GREP_BASE_URL}/${asset}"
  tool_root="$TOOLS_DIR/ast-grep/${AST_GREP_VERSION}/${target}"
  zip_path="$tool_root/$asset"
  bin_name="ast-grep"
  if [[ "$target" == *pc-windows-msvc ]]; then
    bin_name="ast-grep.exe"
  fi
  bin_path="$tool_root/$bin_name"
  ensure_dir "$tool_root"
  # Re-download when the cached archive is missing or fails its pin.
  local need_download=0
  if [[ ! -f "$zip_path" ]]; then
    need_download=1
  else
    local current_sha
    if ! current_sha="$(compute_sha256 "$zip_path")"; then
      return 2
    fi
    [[ "$current_sha" == "$expected" ]] || need_download=1
  fi
  if [[ "$need_download" -eq 1 ]]; then
    [[ "${QUIET:-0}" -eq 0 ]] && say_err "${DIM}${INFO}${RESET} Downloading ast-grep ${AST_GREP_VERSION} (${target})..."
    local tmp_zip
    tmp_zip="$(mktemp -t ubs-ast-grep.XXXXXX 2>/dev/null || mktemp "${TMPDIR:-/tmp}/ubs-ast-grep.XXXXXX" 2>/dev/null)" || {
      say_err "${RED}$X failed to create temp file for module download${RESET}"
      return 1
    }
    if ! download_url_to_file "$url" "$tmp_zip"; then
      say_err "${RED}${X}${RESET} failed to download ast-grep: $url"
      say_err "${DIM}Install ast-grep manually (https://ast-grep.github.io/) or re-run install.sh.${RESET}"
      return 1
    fi
    # Verify before the archive ever enters the cache (supply-chain pin).
    local sha
    if ! sha="$(compute_sha256 "$tmp_zip")"; then
      say_err "${RED}${X}${RESET} cannot verify ast-grep download (no sha256 tool available)"
      return 2
    fi
    if [[ "$sha" != "$expected" ]]; then
      say_err "${RED}${X}${RESET} ast-grep checksum mismatch for ${asset}"
      say_err "${DIM}Expected: ${expected}${RESET}"
      say_err "${DIM}Got: ${sha}${RESET}"
      return 1
    fi
    mv "$tmp_zip" "$zip_path"
  fi
  if ! extract_zip_member "$zip_path" "$bin_name" "$bin_path"; then
    say_err "${RED}${X}${RESET} failed to extract ${bin_name} from ${zip_path}"
    return 1
  fi
  chmod +x "$bin_path" 2>/dev/null || true
  if ! verify_ast_grep_bin "$bin_path"; then
    say_err "${RED}${X}${RESET} extracted ast-grep did not execute correctly: $bin_path"
    return 1
  fi
  echo "$bin_path"
}
# Locate or provision ast-grep; sets AST_GREP_BIN and AST_GREP_SOURCE.
# Prefers a working binary already on $PATH; otherwise auto-provisions the
# pinned release into the tool cache after checking prerequisites.
ensure_ast_grep(){
  local found
  if found="$(find_ast_grep_in_path)"; then
    AST_GREP_BIN="$found"
    AST_GREP_SOURCE="path"
    return 0
  fi
  local target
  target="$(ast_grep_target_triple)" || {
    say_err "${RED}${X}${RESET} Environment error: unsupported platform for ast-grep tool cache"
    return 1
  }
  if [[ -z "${AST_GREP_ASSET_SHA256[$target]:-}" ]]; then
    say_err "${RED}${X}${RESET} Environment error: no ast-grep asset configured for $target"
    return 1
  fi
  if ! ( need_cmd curl || need_cmd wget ); then
    say_err "${RED}${X}${RESET} Environment error: need curl or wget to auto-provision ast-grep"
    return 1
  fi
  if ! checksum_tool_name >/dev/null 2>&1; then
    say_err "${RED}${X}${RESET} Environment error: need sha256sum, shasum, or openssl to verify ast-grep downloads"
    return 1
  fi
  if ! ( need_cmd python3 || need_cmd unzip ); then
    say_err "${RED}${X}${RESET} Environment error: need python3 or unzip to extract ast-grep tool cache"
    return 1
  fi
  found="$(ensure_ast_grep_tool_cache)" || return $?
  AST_GREP_BIN="$found"
  AST_GREP_SOURCE="cache"
  return 0
}
# Print where the cached ast-grep binary would live for this platform
# (whether or not it exists yet).
ast_grep_cached_bin_path(){
  local target bin_name
  target="$(ast_grep_target_triple)" || return 1
  bin_name="ast-grep"
  if [[ "$target" == *pc-windows-msvc ]]; then
    bin_name="ast-grep.exe"
  fi
  echo "$TOOLS_DIR/ast-grep/${AST_GREP_VERSION}/${target}/${bin_name}"
}
# Smoke-test an ast-grep candidate binary: version banner, `scan -h`, and a
# real pattern run against a scratch file.
verify_ast_grep_bin(){
  local bin="$1"
  [[ -n "$bin" && -x "$bin" ]] || return 1
  "$bin" --version 2>&1 | grep -qi "ast-grep" || return 1
  "$bin" scan -h >/dev/null 2>&1 || return 1
  # UBS depends on JSON-stream output for AST-powered rules. Confirm the binary
  # supports `--json=stream` (via either `run -p` or the legacy `--pattern` form).
local tmpdir tmpfile
  # Probe with a throwaway JS file; try modern `run -p` first, then the
  # legacy `--pattern` spelling. Clean the scratch dir on every exit path.
  tmpdir="$(mktemp -d 2>/dev/null || mktemp -d -t ubs-ag-verify.XXXXXX)" || return 1
  tmpfile="$tmpdir/verify.js"
  printf 'const x = 1; x = 2;\n' >"$tmpfile" 2>/dev/null || true
  if "$bin" run -p '$X = $Y' "$tmpfile" --json=stream >/dev/null 2>&1; then
    [[ -n "$tmpdir" && "$tmpdir" != "/" ]] && rm -rf "$tmpdir" 2>/dev/null || true
    return 0
  fi
  if "$bin" --pattern '$X = $Y' "$tmpfile" --json=stream >/dev/null 2>&1; then
    [[ -n "$tmpdir" && "$tmpdir" != "/" ]] && rm -rf "$tmpdir" 2>/dev/null || true
    return 0
  fi
  [[ -n "$tmpdir" && "$tmpdir" != "/" ]] && rm -rf "$tmpdir" 2>/dev/null || true
  return 1
}
# Stdin→stdout filter that drops findings whose source line (or the line just
# above it) carries a suppression marker (ubs:ignore / ubs: disable / nolint /
# noqa). Lines that do not look like "file:line[:col]" findings pass through
# unchanged. Degrades to plain `cat` when python3 is unavailable.
apply_inline_suppressions(){
  if ! need_cmd python3; then cat; return 0; fi
  local py_script
  py_script="$(mktemp -t ubs_suppress.XXXXXX 2>/dev/null || mktemp -t ubs_suppress)"
  # NOTE: heredoc body is program data — kept verbatim.
  cat >"$py_script" <<'PY'
import sys, re, io
from pathlib import Path
# Robust I/O handling for varied environments
try:
    input_stream = io.TextIOWrapper(sys.stdin.buffer, encoding='utf-8', errors='replace')
    output_stream = io.TextIOWrapper(sys.stdout.buffer, encoding='utf-8', errors='replace')
except Exception:
    input_stream = sys.stdin
    output_stream = sys.stdout
ANSI_ESCAPE = re.compile(r'\x1B(?:[@-Z\\-_]|\[[0-?]*[ -/]*[@-~])')
FINDING_PATTERN = re.compile(r'^\s*((?:[A-Za-z]:)?[^:]+?):(\d+)(?::(\d+))?')
SUPPRESSION_MARKERS = ["ubs:ignore", "ubs: disable", "nolint", "noqa"]
def strip_ansi(text):
    return ANSI_ESCAPE.sub('', text)
def has_suppression(line_content):
    if not line_content:
        return False
    lower = line_content.lower()
    return any(m in lower for m in SUPPRESSION_MARKERS)
def main():
    lines = []
    try:
        # Read all lines first to ensure we consume the stream (prevents SIGPIPE upstream)
        lines = input_stream.readlines()
        file_cache = {}
        for line in lines:
            clean_line = strip_ansi(line)
            match = FINDING_PATTERN.match(clean_line)
            if not match:
                output_stream.write(line)
                continue
            file_path_str = (match.group(1) or "").strip()
            try:
                line_no = int(match.group(2))
            except ValueError:
                output_stream.write(line)
                continue
            if file_path_str not in file_cache:
                try:
                    p = Path(file_path_str)
                    # Check existence relative to CWD
                    if p.is_file():
                        file_cache[file_path_str] = p.read_text(encoding='utf-8', errors='replace').splitlines()
                    else:
                        file_cache[file_path_str] = None
                except:
                    file_cache[file_path_str] = None
            content = file_cache[file_path_str]
            suppressed = False
            if content:
                idx = line_no - 1
                # Check line itself (idx) and previous line (idx-1) for comments
                if 0 <= idx < len(content) and has_suppression(content[idx]):
                    suppressed = True
                elif 0 <= idx-1 < len(content) and has_suppression(content[idx-1]):
                    suppressed = True
            if not suppressed:
                output_stream.write(line)
    except Exception as e:
        # If python fails, we MUST consume stdin and dump to stdout to avoid breaking the pipe
        sys.stderr.write(f"[ubs] warning: inline suppression failed ({e}); passthrough enabled\n")
        try:
            # Try to dump what we read plus the rest
            for l in lines:
                output_stream.write(l)
            output_stream.write(input_stream.read())
        except:
            pass
if __name__ == "__main__":
    main()
PY
  python3 "$py_script"
  rm -f "$py_script"
}
# True when $1 lives inside the managed module cache ($MODULE_DIR) — only
# cached files are held to the pinned checksums; custom/bundled modules are
# exempt from verification.
should_verify_module_path(){
  local path="$1"
  [[ -n "$path" && -n "$MODULE_DIR" ]] || return 1
  if [[ "$MODULE_DIR" == "/" ]]; then
    [[ "$path" == /* ]]
  else
    case "$path" in
      "$MODULE_DIR"/*) return 0;;
      *) return 1;;
    esac
  fi
}
# Verify a cached language module against MODULE_CHECKSUMS.
# Status: 0 ok/exempt/unpinned, 1 missing-or-mismatch, 2 no checksum tool.
# Detail for the caller is left in VERIFY_MODULE_ERR.
verify_module_checksum(){
  local lang="$1" path="$2"
  local expected="${MODULE_CHECKSUMS[$lang]:-}"
  VERIFY_MODULE_ERR=""
  # Outside the managed cache, or no pin recorded → nothing to verify.
  should_verify_module_path "$path" || return 0
  [[ -n "$expected" ]] || return 0
  if [[ ! -f "$path" ]]; then
    VERIFY_MODULE_ERR="module file not found at $path"
    return 1
  fi
  local actual
  if ! actual="$(compute_sha256 "$path")"; then
    VERIFY_MODULE_ERR="unable to compute checksum (install sha256sum, shasum, or openssl)"
    return 2
  fi
  if [[ "$actual" != "$expected" ]]; then
    VERIFY_MODULE_ERR="checksum mismatch for $lang (expected $expected, got $actual)"
    return 1
  fi
  return 0
}
# Same contract as verify_module_checksum, for helper assets keyed by their
# relative path in HELPER_CHECKSUMS; detail goes to VERIFY_HELPER_ERR.
verify_helper_checksum(){
  local rel="$1" path="$2"
  local expected="${HELPER_CHECKSUMS[$rel]:-}"
  VERIFY_HELPER_ERR=""
  should_verify_module_path "$path" || return 0
  [[ -n "$expected" ]] || return 0
  if [[ ! -f "$path" ]]; then
    VERIFY_HELPER_ERR="helper file not found at $path"
    return 1
  fi
  local actual
  if ! actual="$(compute_sha256 "$path")"; then
    VERIFY_HELPER_ERR="unable to compute checksum (install sha256sum, shasum, or openssl)"
    return 2
  fi
  if [[ "$actual" != "$expected" ]]; then
    VERIFY_HELPER_ERR="checksum mismatch for $rel (expected $expected, got $actual)"
    return 1
  fi
  return 0
}
# Doctor tallies, updated by doctor_report and read by run_doctor's summary.
DOCTOR_FAILS=0
DOCTOR_WARNINGS=0
# Print one doctor line at the given level; err/warn bump the tallies.
doctor_report(){
  local level="$1" message="$2"
  case "$level" in
    ok) say " ${GREEN}${CHECK}${RESET} $message" ;;
    warn)
      DOCTOR_WARNINGS=$((DOCTOR_WARNINGS+1))
      say " ${YELLOW}${WARN}${RESET} $message"
      ;;
    info) say " ${CYAN}${INFO}${RESET} $message" ;;
    err)
      DOCTOR_FAILS=$((DOCTOR_FAILS+1))
      say " ${RED}${X}${RESET} $message"
      ;;
  esac
}
# Audit every cached helper asset; with fix=1 re-download missing/corrupt ones.
doctor_check_cached_helpers(){
  local fix="$1"
  local rel helper_path verify_status
  for rel in "${HELPER_ASSETS[@]:-}"; do
    helper_path="$MODULE_DIR/$rel"
    if [[ -f "$helper_path" ]]; then
      if verify_helper_checksum "$rel" "$helper_path"; then
        doctor_report ok "helper checksum verified ($helper_path)"
      else
        verify_status=$?
if [[ $verify_status -eq 2 ]]; then
          # Status 2: no sha256 tool available at all — --fix cannot help.
          doctor_report err "helper $rel: $VERIFY_HELPER_ERR"
        else
          if [[ "$fix" -eq 1 ]]; then
            say " ${DIM}Refreshing helper $rel...${RESET}"
            if download_helper_asset "$rel" "$helper_path"; then
              doctor_report ok "helper refreshed and verified ($rel)"
            else
              doctor_report err "Failed to refresh helper $rel: ${VERIFY_HELPER_ERR:-see logs}"
            fi
          else
            doctor_report err "helper $rel: $VERIFY_HELPER_ERR (re-run with --fix)"
          fi
        fi
      fi
    else
      # Helper not present in the cache yet.
      if [[ "$fix" -eq 1 ]]; then
        say " ${DIM}Caching helper $rel...${RESET}"
        if download_helper_asset "$rel" "$helper_path"; then
          doctor_report ok "helper downloaded and verified ($rel)"
        else
          doctor_report err "Failed to download helper $rel: ${VERIFY_HELPER_ERR:-see logs}"
        fi
      else
        doctor_report warn "helper $rel not cached yet (use --fix to pre-download)"
      fi
    fi
  done
}
# Environment diagnostics. With fix=1, attempts repairs (downloads modules,
# helpers, and ast-grep). Reports via doctor_report, which feeds the
# DOCTOR_FAILS / DOCTOR_WARNINGS tallies.
run_doctor(){
  local fix="$1"
  DOCTOR_FAILS=0
  DOCTOR_WARNINGS=0
  say "${BOLD}UBS Doctor${RESET}"
  doctor_report info "Module cache: ${DIM}$MODULE_DIR${RESET}"
  doctor_report info "Tool cache: ${DIM}$TOOLS_DIR${RESET}"
  local checksum_tool
  if checksum_tool=$(checksum_tool_name); then
    doctor_report ok "Checksum tool available: $checksum_tool"
  else
    doctor_report err "No checksum tool found (install sha256sum, shasum, or openssl)"
  fi
  if need_cmd curl; then
    doctor_report ok "curl available for module downloads"
  elif need_cmd wget; then
    doctor_report ok "wget available for module downloads"
  else
    doctor_report warn "Neither curl nor wget present; network module updates will fail"
  fi
  if [[ -w "$MODULE_DIR" ]]; then
    doctor_report ok "Module cache is writable"
  else
    doctor_report err "Module cache is not writable: $MODULE_DIR"
  fi
  # External dependency readiness (JS/TS AST engine)
  # Resolution order: UBS_AST_GREP_BIN override → $PATH → tool cache.
  local ast_bin="" ast_source="" ast_version=""
  if [[ -n "${UBS_AST_GREP_BIN:-}" ]]; then
    if [[ -x "${UBS_AST_GREP_BIN}" ]]; then
      ast_bin="${UBS_AST_GREP_BIN}"
      ast_source="env"
    else
      # Override may be a bare command name rather than a path.
      local resolved
      resolved="$(command -v "${UBS_AST_GREP_BIN}" 2>/dev/null || true)"
      if [[ -n "$resolved" && -x "$resolved" ]]; then
        ast_bin="$resolved"
        ast_source="env"
      fi
    fi
  fi
  if [[ -z "$ast_bin" ]]; then
    if ast_bin="$(find_ast_grep_in_path 2>/dev/null)"; then
      ast_source="path"
    else
      ast_bin=""
    fi
  fi
  if [[ -z "$ast_bin" ]]; then
    local cached
    cached="$(ast_grep_cached_bin_path 2>/dev/null || true)"
    if [[ -n "$cached" && -x "$cached" ]]; then
      ast_bin="$cached"
      ast_source="cache"
    fi
  fi
  if [[ -n "$ast_bin" ]] && verify_ast_grep_bin "$ast_bin"; then
    ast_version="$("$ast_bin" --version 2>/dev/null | head -n 1 || true)"
    doctor_report ok "ast-grep: ready (${ast_source}) ${DIM}${ast_version}${RESET}"
    doctor_report info "ast-grep bin: ${DIM}$ast_bin${RESET}"
  else
    if [[ "$fix" -eq 1 ]]; then
      if ensure_ast_grep; then
        ast_version="$("$AST_GREP_BIN" --version 2>/dev/null | head -n 1 || true)"
        doctor_report ok "ast-grep: installed (${AST_GREP_SOURCE}) ${DIM}${ast_version}${RESET}"
        doctor_report info "ast-grep bin: ${DIM}${AST_GREP_BIN}${RESET}"
      else
        doctor_report err "ast-grep: missing/unusable (JS/TS scans will fail)."
      fi
    else
      doctor_report warn "ast-grep: missing/unusable (JS/TS scans will fail). Run: ubs doctor --fix"
    fi
  fi
  # Per-language module audit; cached_modules gates the helper audit later.
  local lang module_path verify_status cached_modules=0
  for lang in "${ALL_LANGS[@]}"; do
    module_path="$(resolve_module_path "$lang")"
    if should_verify_module_path "$module_path"; then
      cached_modules=1
      if [[ -f "$module_path" ]]; then
        if verify_module_checksum "$lang" "$module_path"; then
          doctor_report ok "$lang module checksum verified ($module_path)"
        else
          verify_status=$?
if [[ $verify_status -eq 2 ]]; then
            # Status 2: no sha256 tool — re-downloading cannot fix this.
            doctor_report err "$lang module: $VERIFY_MODULE_ERR"
          else
            if [[ "$fix" -eq 1 ]]; then
              say " ${DIM}Refreshing $lang module...${RESET}"
              if download_module "$lang" "$module_path"; then
                doctor_report ok "$lang module refreshed and verified"
              else
                doctor_report err "Failed to refresh $lang module: ${VERIFY_MODULE_ERR:-see logs}"
              fi
            else
              doctor_report err "$lang module: $VERIFY_MODULE_ERR (re-run with --fix)"
            fi
          fi
        fi
      else
        # Module not cached yet.
        if [[ "$fix" -eq 1 ]]; then
          say " ${DIM}Caching $lang module...${RESET}"
          if download_module "$lang" "$module_path"; then
            doctor_report ok "$lang module downloaded and verified"
          else
            doctor_report err "Failed to download $lang module: ${VERIFY_MODULE_ERR:-see logs}"
          fi
        else
          doctor_report warn "$lang module not cached yet (use --fix to pre-download)"
        fi
      fi
    else
      # Module resolved outside the managed cache (PATH or local modules/):
      # checksum pinning does not apply there.
      if [[ -x "$module_path" ]]; then
        doctor_report info "$lang module supplied by $(dirname "$module_path") (custom/bundled, checksum skipped)"
      else
        doctor_report warn "$lang module expected at $module_path but is not executable"
      fi
    fi
  done
  # Helper audit only matters when at least one module comes from the cache.
  if [[ "$cached_modules" -eq 1 ]]; then
    doctor_check_cached_helpers "$fix"
  fi
  if [[ $DOCTOR_FAILS -gt 0 ]]; then
    say "${RED}${X}${RESET} Doctor detected $DOCTOR_FAILS blocking issue(s)."
    return 1
  fi
  if [[ $DOCTOR_WARNINGS -gt 0 ]]; then
    say "${YELLOW}${WARN}${RESET} Doctor completed with $DOCTOR_WARNINGS warning(s)."
  else
    say "${GREEN}${CHECK}${RESET} Environment looks good."
fi return 0 } apply_ignore_filters(){ [[ -n "$GLOBAL_EXCLUDE_PATTERNS" ]] || return 0 [[ -d "$SOURCE_PROJECT_DIR" ]] || return 0 local dest="$TMPDIR_RUN/scan" rm -rf "$dest" 2>/dev/null || true ensure_dir "$dest" local -a patterns IFS=',' read -r -a patterns <<<"$GLOBAL_EXCLUDE_PATTERNS" # Helper: check if destination has at least one file (copy succeeded meaningfully) dest_has_files() { [[ -n "$(find "$dest" -type f 2>/dev/null | head -n 1)" ]] } # Try rsync first (fastest and most reliable) if need_cmd rsync; then local -a args=(-a --delete) for pat in "${patterns[@]}"; do [[ -z "$pat" ]] && continue args+=( "--exclude=$pat" ) done if rsync "${args[@]}" "$SOURCE_PROJECT_DIR"/ "$dest"/ >/dev/null 2>&1 && dest_has_files; then FILTERED_PROJECT_DIR="$dest" PROJECT_DIR="$FILTERED_PROJECT_DIR" say "${DIM}${INFO}${RESET} Created filtered scan workspace at ${FILTERED_PROJECT_DIR}" return 0 fi # Rsync failed or produced empty result; clean up and try next method rm -rf "$dest" 2>/dev/null || true ensure_dir "$dest" fi # Fallback: use tar with --exclude (commonly available on Windows via Git Bash/MSYS) if need_cmd tar; then local -a tar_excludes=() for pat in "${patterns[@]}"; do [[ -z "$pat" ]] && continue tar_excludes+=( "--exclude=$pat" ) done if (cd "$SOURCE_PROJECT_DIR" && tar cf - "${tar_excludes[@]}" . 
2>/dev/null) | (cd "$dest" && tar xf - 2>/dev/null) && dest_has_files; then FILTERED_PROJECT_DIR="$dest" PROJECT_DIR="$FILTERED_PROJECT_DIR" say "${DIM}${INFO}${RESET} Created filtered scan workspace at ${FILTERED_PROJECT_DIR} (tar fallback)" return 0 fi # Tar failed or produced empty result; clean up and try next method rm -rf "$dest" 2>/dev/null || true ensure_dir "$dest" fi # Python fallback (most reliable cross-platform) if need_cmd python3; then local patterns_json patterns_json=$(printf '%s\n' "${patterns[@]}" | python3 -c "import sys, json; print(json.dumps([l.strip() for l in sys.stdin if l.strip()]))" 2>/dev/null) if [[ -n "$patterns_json" ]] && python3 - "$SOURCE_PROJECT_DIR" "$dest" "$patterns_json" <<'PY' 2>/dev/null import sys, os, shutil, json, fnmatch, pathlib src = pathlib.Path(sys.argv[1]).resolve() dst = pathlib.Path(sys.argv[2]).resolve() patterns = json.loads(sys.argv[3]) def should_exclude(rel_path, name): for pat in patterns: if fnmatch.fnmatch(rel_path, pat) or fnmatch.fnmatch(name, pat): return True # Check path components for part in pathlib.Path(rel_path).parts: if fnmatch.fnmatch(part, pat): return True return False for root, dirs, files in os.walk(src, topdown=True): root_path = pathlib.Path(root) rel_root = root_path.relative_to(src) dst_root = dst / rel_root # Filter directories (modifying dirs in-place prunes traversal) dirs[:] = [d for d in dirs if not should_exclude(str(rel_root / d), d)] # Create destination directory dst_root.mkdir(parents=True, exist_ok=True) # Copy files that aren't excluded for f in files: rel_file = str(rel_root / f) if str(rel_root) != '.' 
else f if not should_exclude(rel_file, f): try: shutil.copy2(root_path / f, dst_root / f) except (OSError, shutil.Error): pass # Skip files that can't be copied PY then if dest_has_files; then FILTERED_PROJECT_DIR="$dest" PROJECT_DIR="$FILTERED_PROJECT_DIR" say "${DIM}${INFO}${RESET} Created filtered scan workspace at ${FILTERED_PROJECT_DIR} (python fallback)" return 0 fi fi fi say "${YELLOW}${WARN}${RESET} Failed to apply ignore filters; scanning original tree" rm -rf "$dest" 2>/dev/null || true } restore_original_paths(){ local file="$1" [[ -n "$FILTERED_PROJECT_DIR" && -f "$file" ]] || return 0 if ! need_cmd python3; then return 0; fi python3 - "$FILTERED_PROJECT_DIR" "$SOURCE_PROJECT_DIR" "$file" <<'PY' 2>/dev/null || true import sys, pathlib src = sys.argv[1] dst = sys.argv[2] path = pathlib.Path(sys.argv[3]) try: data = path.read_text() except OSError: sys.exit(0) path.write_text(data.replace(src, dst)) PY } if [[ "$MODE" == "sessions" ]]; then show_session_history "$SESSION_ENTRIES" "$SESSION_RAW" "$SESSION_LOG_DIR_OVERRIDE" exit 0 fi # Detectors (fast ripgrep if available, else find) detect_lang(){ local lang="$1" found=1 case "$lang" in js) if need_cmd rg; then rg -q --hidden -g '!node_modules/**' -g '!dist/**' -g '!build/**' -g '!coverage/**' -g '!*.min.*' -g '!venv/**' -g '!.venv/**' \ -g '*.{js,jsx,ts,tsx,mjs,cjs}' -g 'package.json' . "$PROJECT_DIR" 2>/dev/null && found=0 else find "$PROJECT_DIR" \( -name node_modules -o -name dist -o -name build -o -name coverage -o -name venv -o -name .venv -o -name .git \) -prune -o \ -type f \( -name '*.js' -o -name '*.jsx' -o -name '*.ts' -o -name '*.tsx' -o -name '*.mjs' -o -name '*.cjs' -o -name 'package.json' \) -print -quit 2>/dev/null | grep -q . && found=0 fi ;; python) if need_cmd rg; then rg -q --hidden -g '!venv/**' -g '!.venv/**' -g '!**/__pycache__/**' -g '!build/**' -g '!dist/**' \ -g '*.py' -g 'pyproject.toml' -g 'requirements.txt' -g 'setup.py' . 
"$PROJECT_DIR" 2>/dev/null && found=0 else find "$PROJECT_DIR" \( -name venv -o -name .venv -o -name __pycache__ -o -name build -o -name dist -o -name .git \) -prune -o \ -type f \( -name '*.py' -o -name 'pyproject.toml' -o -name 'requirements.txt' -o -name 'setup.py' \) -print -quit 2>/dev/null | grep -q . && found=0 fi ;; c) if need_cmd rg; then rg -q --hidden -g '!build/**' -g '!out/**' -g '!**/.cache/**' \ -g '*.{c,h}' -g 'Makefile' -g 'compile_commands.json' . "$PROJECT_DIR" 2>/dev/null && found=0 else find "$PROJECT_DIR" \( -name build -o -name out -o -name .cache -o -name .git \) -prune -o \ -type f \( -name '*.c' -o -name '*.h' -o -name 'Makefile' -o -name 'compile_commands.json' \) -print -quit 2>/dev/null | grep -q . && found=0 fi ;; cpp) if need_cmd rg; then rg -q --hidden -g '!build/**' -g '!out/**' -g '!**/.cache/**' \ -g '*.{c,cc,cpp,cxx,h,hh,hpp,hxx}' -g 'CMakeLists.txt' -g 'compile_commands.json' . "$PROJECT_DIR" 2>/dev/null && found=0 else find "$PROJECT_DIR" \( -name build -o -name out -o -name .cache -o -name .git \) -prune -o \ -type f \( -name '*.c' -o -name '*.cc' -o -name '*.cpp' -o -name '*.cxx' -o -name '*.h' -o -name '*.hh' -o -name '*.hpp' -o -name '*.hxx' -o -name 'CMakeLists.txt' -o -name 'compile_commands.json' \) -print -quit 2>/dev/null | grep -q . && found=0 fi ;; rust) if need_cmd rg; then rg -q --hidden -g '!target/**' -g '!**/.cargo/**' -g '*.rs' -g 'Cargo.toml' . "$PROJECT_DIR" 2>/dev/null && found=0 else find "$PROJECT_DIR" \( -name target -o -name .cargo -o -name .git \) -prune -o \ -type f \( -name '*.rs' -o -name 'Cargo.toml' \) -print -quit 2>/dev/null | grep -q . && found=0 fi ;; golang) if need_cmd rg; then rg -q --hidden -g '!vendor/**' -g '!bin/**' -g '!dist/**' -g '!build/**' \ -g '*.go' -g 'go.mod' -g 'go.sum' -g 'go.work' . 
"$PROJECT_DIR" 2>/dev/null && found=0 else find "$PROJECT_DIR" \( -name vendor -o -name bin -o -name dist -o -name build -o -name .git \) -prune -o \ -type f \( -name '*.go' -o -name 'go.mod' -o -name 'go.sum' -o -name 'go.work' \) -print -quit 2>/dev/null | grep -q . && found=0 fi ;; java) if need_cmd rg; then rg -q --hidden -g '!target/**' -g '!build/**' -g '!out/**' -g '!dist/**' \ -g '*.java' -g '*.kt' -g '*.kts' -g 'pom.xml' -g 'build.gradle' -g 'build.gradle.kts' -g 'settings.gradle' -g 'settings.gradle.kts' -g 'gradlew' -g 'mvnw' . "$PROJECT_DIR" 2>/dev/null && found=0 else find "$PROJECT_DIR" \( -name target -o -name build -o -name out -o -name dist -o -name .git \) -prune -o \ -type f \( -name '*.java' -o -name '*.kt' -o -name '*.kts' -o -name 'pom.xml' -o -name 'build.gradle' -o -name 'build.gradle.kts' -o -name 'settings.gradle' -o -name 'settings.gradle.kts' -o -name 'gradlew' -o -name 'mvnw' \) -print -quit 2>/dev/null | grep -q . && found=0 fi ;; ruby) if need_cmd rg; then rg -q --hidden -g '!vendor/bundle/**' -g '!tmp/**' -g '!dist/**' \ -g '*.rb' -g 'Gemfile' -g 'Gemfile.lock' -g '*.gemspec' -g 'Rakefile' . "$PROJECT_DIR" 2>/dev/null && found=0 else find "$PROJECT_DIR" \( -name vendor -o -name bundle -o -name tmp -o -name dist -o -name .git \) -prune -o \ -type f \( -name '*.rb' -o -name 'Gemfile' -o -name 'Gemfile.lock' -o -name '*.gemspec' -o -name 'Rakefile' \) -print -quit 2>/dev/null | grep -q . && found=0 fi ;; swift) if need_cmd rg; then rg -q --hidden -g '!DerivedData/**' -g '!build/**' -g '!buck-out/**' -g '!dist/**' \ -g '*.swift' -g '*.metal' -g 'Package.swift' -g '*.xcodeproj/project.pbxproj' -g '*.xcworkspace/contents.xcworkspacedata' . 
"$PROJECT_DIR" 2>/dev/null && found=0 else find "$PROJECT_DIR" \( -name DerivedData -o -name build -o -name buck-out -o -name dist -o -name .git \) -prune -o \ -type f \( -name '*.swift' -o -name '*.metal' -o -name 'Package.swift' -o -name '*.xcodeproj' -o -name '*.xcworkspace' \) -print -quit 2>/dev/null | grep -q . && found=0 fi ;; csharp) if need_cmd rg; then rg -q --hidden -g '!bin/**' -g '!obj/**' -g '!packages/**' -g '!dist/**' -g '!build/**' -g '!coverage/**' -g '!TestResults/**' \ -g '*.cs' -g '*.csx' -g '*.csproj' -g '*.sln' -g 'Directory.Build.props' -g 'Directory.Build.targets' -g 'global.json' -g 'nuget.config' . "$PROJECT_DIR" 2>/dev/null && found=0 else find "$PROJECT_DIR" \( -name bin -o -name obj -o -name packages -o -name dist -o -name build -o -name coverage -o -name TestResults -o -name .git \) -prune -o \ -type f \( -name '*.cs' -o -name '*.csx' -o -name '*.csproj' -o -name '*.sln' -o -name 'Directory.Build.props' -o -name 'Directory.Build.targets' -o -name 'global.json' -o -name 'nuget.config' \) -print -quit 2>/dev/null | grep -q . 
&& found=0 fi ;; esac return $found } # ───────────────────────────────────────────────────────────────────────────── # Module resolution & download # ───────────────────────────────────────────────────────────────────────────── resolve_module_path(){ local lang="$1" local base="ubs-$lang" local sd md sd="$(script_dir)" md="$MODULE_DIR" # Priority: PATH → local modules/ → XDG module dir if command -v "$base" >/dev/null 2>&1; then command -v "$base"; return 0; fi if [ -x "$sd/modules/$base.sh" ]; then echo "$sd/modules/$base.sh"; return 0; fi if [ -x "$md/$base.sh" ]; then echo "$md/$base.sh"; return 0; fi echo "$md/$base.sh" } download_module(){ local lang="$1" path="$2" ensure_dir "$(dirname "$path")" local url; url=$(printf '%s' "$MODULE_PATH_TEMPLATE" | sed "s/%s/$lang/") say "${BLUE}${INFO}${RESET} fetching module ${BOLD}$lang${RESET} → ${DIM}$path${RESET}" local tmp tmp="$(mktemp -t "ubs-${lang}.XXXXXX" 2>/dev/null || mktemp "${TMPDIR:-/tmp}/ubs-${lang}.XXXXXX" 2>/dev/null)" || { say "${RED}$X failed to create temp file for module download${RESET}" return 1 } if need_cmd curl; then if ! curl -fsSL "$url" -o "$tmp"; then say "${RED}$X failed to download module ${BOLD}$lang${RESET}" rm -f "$tmp" 2>/dev/null || true return 1 fi elif need_cmd wget; then if ! wget -q "$url" -O "$tmp"; then say "${RED}$X failed to download module ${BOLD}$lang${RESET}" rm -f "$tmp" 2>/dev/null || true return 1 fi else say "${RED}$X neither curl nor wget available${RESET}" rm -f "$tmp" 2>/dev/null || true return 1 fi # sanity checks if [ ! -s "$tmp" ]; then say "${RED}$X empty module file for $lang${RESET}" rm -f "$tmp" 2>/dev/null || true return 1 fi local head; head="$(head -n 1 "$tmp" | tr -d '\r')" if [[ ! "$head" =~ ^#! 
]]; then
  say "${RED}$X module missing shebang (lang=$lang)${RESET}"
  rm -f "$tmp" 2>/dev/null || true
  return 1
fi
# Supply-chain check: compare the downloaded module against the pinned sha256
# in MODULE_CHECKSUMS (top of file). VERIFY_MODULE_ERR is a global that carries
# the failure reason back to callers.
if should_verify_module_path "$path"; then
  VERIFY_MODULE_ERR=""
  local expected="${MODULE_CHECKSUMS[$lang]:-}"
  if [[ -n "$expected" ]]; then
    local sha
    if ! sha="$(compute_sha256 "$tmp")"; then
      VERIFY_MODULE_ERR="unable to compute checksum (install sha256sum, shasum, or openssl)"
    elif [[ "$sha" != "$expected" ]]; then
      VERIFY_MODULE_ERR="checksum mismatch for $lang (expected $expected, got $sha)"
    fi
  fi
  if [[ -n "${VERIFY_MODULE_ERR:-}" ]]; then
    local err_msg="${VERIFY_MODULE_ERR}"
    say "${RED}$X failed to verify module ${BOLD}$lang${RESET}: $err_msg"
    rm -f "$tmp" 2>/dev/null || true
    return 1
  fi
fi
# Move the verified temp file into its final location; chmod is best-effort.
if ! mv "$tmp" "$path"; then
  say "${RED}$X failed to finalize module ${BOLD}$lang${RESET} to ${DIM}$path${RESET}"
  rm -f "$tmp" 2>/dev/null || true
  return 1
fi
chmod +x "$path" 2>/dev/null || true
return 0
}

# download_helper_asset REL PATH
# Fetch a helper asset (AST correlation / type-narrowing script) from the repo
# into PATH, verifying its sha256 against HELPER_CHECKSUMS when verification is
# enabled for PATH. Returns 0 on success, 1 on any download/verify failure.
# Sets VERIFY_HELPER_ERR (global) with the failure reason.
download_helper_asset(){
  local rel="$1" path="$2"
  ensure_dir "$(dirname "$path")"
  local url="${REPO_RAW}/modules/${rel}"
  say "${BLUE}${INFO}${RESET} fetching helper ${BOLD}$rel${RESET} → ${DIM}$path${RESET}"
  local tmp
  # Two mktemp forms: BSD/macOS needs -t with a template; fall back to TMPDIR.
  tmp="$(mktemp -t "ubs-helper.XXXXXX" 2>/dev/null || mktemp "${TMPDIR:-/tmp}/ubs-helper.XXXXXX" 2>/dev/null)" || {
    say "${RED}$X failed to create temp file for helper download${RESET}"
    return 1
  }
  # Prefer curl, then wget; no downloader at all is a hard failure.
  if need_cmd curl; then
    if ! curl -fsSL "$url" -o "$tmp"; then
      say "${RED}$X failed to download helper ${BOLD}$rel${RESET}"
      rm -f "$tmp" 2>/dev/null || true
      return 1
    fi
  elif need_cmd wget; then
    if ! wget -q "$url" -O "$tmp"; then
      say "${RED}$X failed to download helper ${BOLD}$rel${RESET}"
      rm -f "$tmp" 2>/dev/null || true
      return 1
    fi
  else
    say "${RED}$X neither curl nor wget available${RESET}"
    rm -f "$tmp" 2>/dev/null || true
    return 1
  fi
  # An empty body (e.g. swallowed 404) counts as failure.
  if [ ! -s "$tmp" ]; then
    say "${RED}$X empty helper file for $rel${RESET}"
    rm -f "$tmp" 2>/dev/null || true
    return 1
  fi
  if should_verify_module_path "$path"; then
    VERIFY_HELPER_ERR=""
    local expected="${HELPER_CHECKSUMS[$rel]:-}"
    if [[ -n "$expected" ]]; then
      local sha
      if ! sha="$(compute_sha256 "$tmp")"; then
        VERIFY_HELPER_ERR="unable to compute checksum (install sha256sum, shasum, or openssl)"
      elif [[ "$sha" != "$expected" ]]; then
        VERIFY_HELPER_ERR="checksum mismatch for $rel (expected $expected, got $sha)"
      fi
    fi
    if [[ -n "${VERIFY_HELPER_ERR:-}" ]]; then
      local err_msg="${VERIFY_HELPER_ERR}"
      say "${RED}$X failed to verify helper ${BOLD}$rel${RESET}: $err_msg"
      rm -f "$tmp" 2>/dev/null || true
      return 1
    fi
  fi
  if ! mv "$tmp" "$path"; then
    say "${RED}$X failed to finalize helper ${BOLD}$rel${RESET} to ${DIM}$path${RESET}"
    rm -f "$tmp" 2>/dev/null || true
    return 1
  fi
  return 0
}

# ensure_helper_asset REL
# Make sure the cached helper REL exists under MODULE_DIR and passes checksum
# verification; re-download once if the cached copy is corrupt. A verify exit
# code of 2 (from verify_helper_checksum) is treated as fatal, not refreshable.
ensure_helper_asset(){
  local rel="$1"
  local path="$MODULE_DIR/$rel"
  if [ "$UPDATE_MODULES" -eq 1 ] || [ ! -f "$path" ]; then
    download_helper_asset "$rel" "$path" || return 1
  fi
  if should_verify_module_path "$path" && [ -f "$path" ]; then
    if ! verify_helper_checksum "$rel" "$path"; then
      local verify_code=$?
      if [[ $verify_code -eq 2 ]]; then
        say "${RED}$X ${VERIFY_HELPER_ERR}${RESET}"
        rm -f "$path" 2>/dev/null || true
        return 1
      fi
      say "${YELLOW}${WARN}${RESET} cached helper $rel failed verification (${VERIFY_HELPER_ERR:-corrupt}); refreshing..."
      download_helper_asset "$rel" "$path" || { rm -f "$path" 2>/dev/null || true; return 1; }
    fi
  fi
  return 0
}

# ensure_cached_helpers [MODE]
# Ensure every helper in HELPER_ASSETS is cached and valid. MODE is "scan"
# (default; failures are soft — warn and continue) or "doctor" (return the
# failure count so the doctor report can surface it). HELPERS_READY is a
# global memo so scan mode only does this once per run.
ensure_cached_helpers(){
  local mode="${1:-scan}" # scan|doctor
  if [[ "$mode" == "scan" && "${UPDATE_MODULES:-0}" -eq 0 && "${HELPERS_READY:-0}" -eq 1 ]]; then
    return 0
  fi
  local failures=0
  local rel
  # ${HELPER_ASSETS[@]:-} guards the empty-array case under `set -u`.
  for rel in "${HELPER_ASSETS[@]:-}"; do
    if ! ensure_helper_asset "$rel"; then
      failures=$((failures+1))
      if [[ "$mode" == "scan" ]]; then
        say "${YELLOW}${WARN}${RESET} helper unavailable: ${DIM}$rel${RESET} (${VERIFY_HELPER_ERR:-download/verification failed}); continuing with reduced accuracy"
      fi
    fi
  done
  if [[ "$failures" -eq 0 ]]; then
    HELPERS_READY=1
  fi
  if [[ "$mode" == "doctor" ]]; then
    return "$failures"
  fi
  return 0
}

# ensure_module LANG PATH
# Ensure the per-language scanner module exists at PATH (download on demand or
# when --update was given), verify its checksum, and refresh once on mismatch.
# Also triggers helper caching since modules depend on the helper assets.
ensure_module(){
  local lang="$1" path="$2"
  if [ "$UPDATE_MODULES" -eq 1 ] || [ ! -x "$path" ]; then
    download_module "$lang" "$path" || return 1
  fi
  if should_verify_module_path "$path" && [ -x "$path" ]; then
    if ! verify_module_checksum "$lang" "$path"; then
      local verify_code=$?
      if [[ $verify_code -eq 2 ]]; then
        say "${RED}$X ${VERIFY_MODULE_ERR}${RESET}"
        return 1
      fi
      say "${YELLOW}${WARN}${RESET} cached $lang module failed verification (${VERIFY_MODULE_ERR:-corrupt}); refreshing..."
      download_module "$lang" "$path" || return 1
    fi
    ensure_cached_helpers "scan" || true
  fi
  return 0
}

# ─────────────────────────────────────────────────────────────────────────────
# Self-update logic
# ─────────────────────────────────────────────────────────────────────────────
# check_and_update_self "$@"
# Opt-in auto-updater: compares the remote UBS_VERSION string against ours and
# replaces $0 in place, then re-execs with the original arguments. All failure
# paths return 0 so a broken update check never blocks a scan.
# NOTE(review): the replacement script is NOT checksum/signature verified
# before exec — confirm whether that is acceptable for this threat model.
check_and_update_self(){
  # Auto-update is opt-in (security-first). Enable by setting:
  #   UBS_ENABLE_AUTO_UPDATE=1
  # Always skip in CI, or when explicitly disabled via UBS_NO_AUTO_UPDATE / --no-auto-update.
  if [[ "${FORCE_SELF_UPDATE:-0}" -eq 0 ]]; then
    [[ "${UBS_ENABLE_AUTO_UPDATE:-0}" -eq 1 ]] || return 0
    if [[ "${UBS_NO_AUTO_UPDATE:-0}" -eq 1 || "${CI_MODE:-0}" -eq 1 ]]; then return 0; fi
  fi
  # Only update if we're running the installed binary (not a local repo script)
  # Heuristic: if the script dir contains .git, we're likely in a dev environment
  if [[ -d "$(script_dir)/.git" ]]; then return 0; fi
  # Or if we are not writable
  if [[ ! -w "$0" ]]; then return 0; fi
  local self_path="$0"
  local remote_url="$REPO_RAW/ubs"
  local last_check_file="${XDG_CACHE_HOME:-$HOME/.cache}/ubs/last_update_check"
  ensure_dir "$(dirname "$last_check_file")"
  # Check at most once every 24 hours
  if [[ "${FORCE_SELF_UPDATE:-0}" -eq 0 && -f "$last_check_file" ]]; then
    local last_check
    last_check=$(cat "$last_check_file" 2>/dev/null || echo 0)
    local now
    now=$(date +%s)
    if (( now - last_check < 86400 )); then
      return 0
    fi
  fi
  if [[ "${QUIET:-0}" -eq 0 ]]; then
    say_err "${DIM}Checking for updates...${RESET}"
  fi
  # Fetch remote version string or hash from the script itself
  # We look for UBS_VERSION="X.Y.Z"
  local remote_content
  if need_cmd curl; then
    remote_content=$(curl -fsSL "$remote_url") || return 0
  elif need_cmd wget; then
    remote_content=$(wget -qO- "$remote_url") || return 0
  else
    return 0
  fi
  local remote_version
  remote_version=$(printf '%s' "$remote_content" | grep -oE 'UBS_VERSION="[0-9.]+"' | head -n1 | cut -d'"' -f2)
  if [[ -z "$remote_version" ]]; then return 0; fi
  # Any version difference triggers an update (no semver comparison).
  if [[ "$remote_version" != "$UBS_VERSION" ]]; then
    if [[ "${QUIET:-0}" -eq 0 ]]; then
      say_err "${BLUE}${INFO}${RESET} Updating ubs from ${UBS_VERSION} to ${remote_version}..."
    fi
    # Write new content to temp file
    local tmp_self
    tmp_self="$(mktemp -t ubs-self.XXXXXX 2>/dev/null || mktemp "${TMPDIR:-/tmp}/ubs-self.XXXXXX" 2>/dev/null)"
    printf '%s' "$remote_content" > "$tmp_self"
    chmod +x "$tmp_self"
    # Move over current script
    if mv "$tmp_self" "$self_path"; then
      if [[ "${QUIET:-0}" -eq 0 ]]; then
        say_err "${GREEN}${CHECK}${RESET} Updated successfully."
      fi
      # Update check timestamp
      date +%s > "$last_check_file"
      # Re-exec self to run the new version (caller passes the original "$@").
      exec "$self_path" "$@"
    else
      rm -f "$tmp_self"
      say_err "${YELLOW}${WARN}${RESET} Failed to update ubs binary."
    fi
  else
    # Update check timestamp even if no update found
    date +%s > "$last_check_file"
  fi
}

# ── Top-level dispatch: doctor mode, self-update, run workspace setup ────────
finalize_module_dir
resolve_git_metadata || true # Git metadata is optional; don't fail on repos without remotes
if [[ "$MODE" == "doctor" ]]; then
  run_doctor "$DOCTOR_FIX"
  exit $?
fi
# Run auto-update before main logic
check_and_update_self "$@"
if [[ "$UPDATE_ONLY" -eq 1 ]]; then
  [[ "${QUIET:-0}" -eq 0 ]] && say_err "${GREEN}${CHECK}${RESET} Update check complete."
  exit 0
fi
# ─────────────────────────────────────────────────────────────────────────────
# Execution / aggregation
# ─────────────────────────────────────────────────────────────────────────────
# Per-run scratch dir; removed by the EXIT trap below.
TMPDIR_RUN="$(mktemp -d 2>/dev/null || mktemp -d -t ubsrun.XXXXXX)"
cleanup(){
  local dir="${TMPDIR_RUN:-}"
  # Refuse to rm -rf an empty path or "/".
  [[ -n "$dir" && "$dir" != "/" ]] || return 0
  rm -rf "$dir" 2>/dev/null || true
}
trap cleanup EXIT
COMBINED_JSON_FILE="$TMPDIR_RUN/combined.json"
if [[ "$TARGETED_SCAN_MODE" -eq 0 ]]; then
  apply_ignore_filters
fi
if [[ "$SUGGEST_IGNORE" -eq 1 ]]; then
  suggest_ignore_candidates
fi
# Git-diff scans and explicit file lists each get a prepared workspace.
if [[ -n "$GIT_MODE" ]]; then
  prepare_git_workspace "$GIT_MODE"
elif [[ ${#SCAN_FILES[@]} -gt 0 ]]; then
  prepare_files_workspace
fi
# Normalize language alias to module name (e.g. "c" -> "cpp").
normalize_lang(){ case "$1" in c) echo "cpp" ;; cs|csharp|csharp-dotnet|dotnet|c#) echo "csharp" ;; *) echo "$1" ;; esac } # Build selected language set select_langs(){ local detected=() for L in "${ALL_LANGS[@]}"; do detect_lang "$L" && detected+=("$L") done # apply --only / --exclude local filtered=() i if [[ -n "$ONLY_LANGS" ]]; then IFS=',' read -r -a want <<<"$ONLY_LANGS" for i in "${detected[@]}"; do for w in "${want[@]}"; do [[ "$i" == "$w" ]] && filtered+=("$i"); done done # Also accept aliases: --only=c should match detected cpp for w in "${want[@]}"; do local nw; nw="$(normalize_lang "$w")" if [[ "$nw" != "$w" ]]; then for i in "${detected[@]}"; do [[ "$i" == "$nw" ]] && filtered+=("$i") done fi done else filtered=("${detected[@]}") fi if [[ -n "$EXCLUDE_LANGS" ]]; then IFS=',' read -r -a drop <<<"$EXCLUDE_LANGS" local keep=() for i in "${filtered[@]}"; do local skip=0; for d in "${drop[@]}"; do [[ "$i" == "$d" || "$(normalize_lang "$d")" == "$i" ]] && skip=1; done [[ $skip -eq 0 ]] && keep+=("$i") done filtered=("${keep[@]}") fi # Normalize all language names to module names and deduplicate. 
local normalized=() seen_langs="" for i in "${filtered[@]}"; do local n; n="$(normalize_lang "$i")" if [[ " $seen_langs " != *" $n "* ]]; then normalized+=("$n") seen_langs="$seen_langs $n" fi done echo "${normalized[@]}" } # Run a module job run_lang(){ local lang="$1" module="$2" fmt="$3" local out_txt="$TMPDIR_RUN/$lang.txt" local out_json="$TMPDIR_RUN/$lang.json" local out_sarif="$TMPDIR_RUN/$lang.sarif" local out_findings="$TMPDIR_RUN/$lang.findings.json" local err="$TMPDIR_RUN/$lang.err" local status_file="$TMPDIR_RUN/$lang.status" local metrics_dir="$TMPDIR_RUN/$lang.metrics" local module_status=0 local start_ts=$SECONDS if [[ "${QUIET:-0}" -eq 0 ]]; then say_err "${DIM}Scanning $lang...${RESET}" fi local args=() [[ "$CI_MODE" -eq 1 ]] && args+=("--ci") [[ "$FAIL_ON_WARNING" -eq 1 ]] && args+=("--fail-on-warning") [[ "$VERBOSE" -eq 1 ]] && args+=('-v') [[ "${QUIET:-0}" -eq 1 ]] && args+=('-q') [[ "$JOBS" -gt 0 ]] && args+=("--jobs=$JOBS") if [[ "$lang" == "csharp" && ${#CSHARP_MODULE_ARGS[@]} -gt 0 ]]; then args+=("${CSHARP_MODULE_ARGS[@]}") fi if [[ -n "$GLOBAL_EXCLUDE_PATTERNS" && ${#SCAN_FILES[@]} -eq 0 ]]; then args+=("--exclude=$GLOBAL_EXCLUDE_PATTERNS") fi [[ -n "${UBS_SKIP_CATEGORIES:-}" ]] && args+=("--skip=$UBS_SKIP_CATEGORIES") args+=("$PROJECT_DIR") case "$fmt" in json|jsonl|toon) prepare_metrics_dir "$metrics_dir" local -a report_args=() if [[ "$lang" == "js" ]]; then report_args=(--report-json="$out_findings") elif [[ "$lang" == "csharp" ]]; then report_args=(--emit-findings-json="$out_findings") fi if UBS_METRICS_DIR="$metrics_dir" UBS_LANG="$lang" UBS_SKIP_TYPE_NARROWING="$SKIP_TYPE_NARROWING" \ "$module" "${args[@]}" "${report_args[@]}" --format=json >"$out_json" 2>"$err"; then module_status=0 else module_status=$? fi restore_original_paths "$out_json" # Modules that implement --format=json must emit a UBS summary *object*. 
# If they emit other JSON types (e.g., an array of findings), fall back to # text mode so we can still produce a stable combined summary. if need_cmd jq && jq -e 'type=="object" and (.files|type)=="number" and (.critical|type)=="number" and (.warning|type)=="number" and (.info|type)=="number"' "$out_json" >/dev/null 2>&1; then jq --arg language "$lang" '. + {language: $language}' "$out_json" > "$out_json.tmp" && mv "$out_json.tmp" "$out_json" attach_metrics_to_json "$out_json" "$metrics_dir" else prepare_metrics_dir "$metrics_dir" if UBS_METRICS_DIR="$metrics_dir" UBS_LANG="$lang" UBS_SKIP_TYPE_NARROWING="$SKIP_TYPE_NARROWING" \ "$module" "${args[@]}" "${report_args[@]}" 2>>"$err" | apply_inline_suppressions >"$out_txt" 2>>"$err"; then module_status=0 else module_status="${PIPESTATUS[0]}" fi restore_original_paths "$out_txt" parse_text_to_json "$lang" "$out_txt" "$out_json" attach_metrics_to_json "$out_json" "$metrics_dir" fi ;; sarif) prepare_metrics_dir "$metrics_dir" if UBS_METRICS_DIR="$metrics_dir" UBS_LANG="$lang" UBS_SKIP_TYPE_NARROWING="$SKIP_TYPE_NARROWING" \ "$module" "${args[@]}" --format=sarif >"$out_sarif" 2>"$err"; then module_status=0 else module_status=$? fi restore_original_paths "$out_sarif" if need_cmd jq && jq -e . 
"$out_sarif" >/dev/null 2>&1; then parse_sarif_to_json "$lang" "$out_sarif" "$out_json" || true attach_metrics_to_json "$out_json" "$metrics_dir" 2>/dev/null || true else prepare_metrics_dir "$metrics_dir" if UBS_METRICS_DIR="$metrics_dir" UBS_LANG="$lang" UBS_SKIP_TYPE_NARROWING="$SKIP_TYPE_NARROWING" \ "$module" "${args[@]}" 2>>"$err" | apply_inline_suppressions >"$out_txt" 2>>"$err"; then module_status=0 else module_status="${PIPESTATUS[0]}" fi restore_original_paths "$out_txt" minimal_sarif_from_text "$lang" "$out_txt" >"$out_sarif" parse_text_to_json "$lang" "$out_txt" "$out_json" attach_metrics_to_json "$out_json" "$metrics_dir" fi ;; text|*) prepare_metrics_dir "$metrics_dir" if UBS_METRICS_DIR="$metrics_dir" UBS_LANG="$lang" UBS_SKIP_TYPE_NARROWING="$SKIP_TYPE_NARROWING" \ "$module" "${args[@]}" 2>"$err" | apply_inline_suppressions >"$out_txt" 2>>"$err"; then module_status=0 else module_status="${PIPESTATUS[0]}" fi restore_original_paths "$out_txt" parse_text_to_json "$lang" "$out_txt" "$out_json" attach_metrics_to_json "$out_json" "$metrics_dir" ;; esac local duration=$((SECONDS - start_ts)) if [[ "${QUIET:-0}" -eq 0 ]]; then say_err "${DIM}Finished $lang (${duration}s)${RESET}" fi echo "$module_status" >"$status_file" return "$module_status" } # Parse legacy text logs → JSON summary (robust to colors) parse_text_to_json(){ local lang="$1" txt="$2" json="$3" local critical=0 warning=0 info=0 files=0 # Strip ANSI, normalize local cleaned; cleaned="$(sed -E 's/\x1B\[[0-9;]*[mK]//g' "$txt" | tr -d '\r\0')" critical=$(printf '%s\n' "$cleaned" | grep -E 'Critical issues:|CRITICAL' | grep -Eo '[0-9]+' | tail -n1 || true) warning=$(printf '%s\n' "$cleaned" | grep -E 'Warning issues:|Warning' | grep -Eo '[0-9]+' | tail -n1 || true) info=$(printf '%s\n' "$cleaned" | grep -E 'Info items:|Info' | grep -Eo '[0-9]+' | tail -n1 || true) files=$(printf '%s\n' "$cleaned" | grep -E 'Files scanned:' | grep -Eo '[0-9]+' | tail -n1 || true) if [[ -z "$files" ]]; then 
    # Fallback counter format: "Files: N".
    files=$(printf '%s\n' "$cleaned" \
      | grep -E 'Files:[[:space:]]*[0-9]+' \
      | head -n1 \
      | grep -Eo '[0-9]+' \
      | head -n1 || true)
  fi
  critical=${critical:-0}; warning=${warning:-0}; info=${info:-0}; files=${files:-0}
  local proj_display
  proj_display="$(json_escape "${SOURCE_PROJECT_DIR:-$PROJECT_DIR}")"
  # NOTE(review): the next line appears truncated in this source — the heredoc
  # body of the JSON summary template, the end of parse_text_to_json, and the
  # opening of the metrics-attach function seem to have been stripped.
  # Preserved verbatim; restore from upstream before relying on it.
  cat >"$json" </dev/null)
  [[ ${#files[@]} -gt 0 ]] || return 0
  if command -v python3 >/dev/null 2>&1; then
    # Merge each per-metric JSON object into the summary's "extras" map.
    python3 - "$json_path" "${files[@]}" <<'PY'
import json, sys
from pathlib import Path
json_path = Path(sys.argv[1])
with json_path.open() as fh:
    data = json.load(fh)
if not isinstance(data, dict):
    sys.exit(0)
extras = data.get("extras", {})
for extra_path in map(Path, sys.argv[2:]):
    try:
        payload = json.loads(extra_path.read_text())
    except Exception:
        # Unreadable/invalid metric files are skipped silently.
        continue
    if isinstance(payload, dict):
        extras.update(payload)
if extras:
    data["extras"] = extras
json_path.write_text(json.dumps(data))
PY
  fi
}

# minimal_sarif_from_text LANG TXT
# Synthesize a minimal SARIF document from a module's text output counters
# (used when the module cannot emit SARIF itself).
minimal_sarif_from_text(){
  local lang="$1" txt="$2"
  local critical=0 warning=0 info=0
  local cleaned
  cleaned="$(sed -E 's/\x1B\[[0-9;]*[mK]//g' "$txt" | tr -d '\r')"
  critical=$(printf '%s\n' "$cleaned" | grep -E 'Critical issues:|CRITICAL' | grep -Eo '[0-9]+' | tail -n1 || true)
  warning=$(printf '%s\n' "$cleaned" | grep -E 'Warning issues:|Warning' | grep -Eo '[0-9]+' | tail -n1 || true)
  info=$(printf '%s\n' "$cleaned" | grep -E 'Info items:|Info' | grep -Eo '[0-9]+' | tail -n1 || true)
  # NOTE(review): truncated span — the SARIF template heredoc and the opening
  # of parse_sarif_to_json (including its `critical=` jq counter) appear to be
  # missing here. Preserved verbatim; restore from upstream.
  cat </dev/null || echo 0)
  warning=$(jq '[.runs[]?.results[]? | select((.level // "warning") == "warning")] | length' "$sarif" 2>/dev/null || echo 0)
  info=$(jq '[.runs[]?.results[]? | select((.level // "warning") == "note")] | length' "$sarif" 2>/dev/null || echo 0)
  files=$(jq '[.runs[]?.results[]?.locations[]?.physicalLocation?.artifactLocation?.uri?]
    | unique | length' "$sarif" 2>/dev/null || echo 0)
  critical=${critical:-0}; warning=${warning:-0}; info=${info:-0}; files=${files:-0}
  local proj_display
  proj_display="$(json_escape "${SOURCE_PROJECT_DIR:-$PROJECT_DIR}")"
  # NOTE(review): truncated span — the JSON summary heredoc plus the start of
  # merge_json_scanners (which builds $base_json and $findings_jsons) appear
  # to be missing. Preserved verbatim; restore from upstream.
  cat >"$json" < findings array
  local findings_map="{}"
  local fm_parts=""
  for f in "${findings_jsons[@]}"; do
    [[ -f "$f" ]] || continue
    local lang_name
    lang_name=$(basename "$f" .findings.json)
    local part
    part=$(jq -c --arg lang "$lang_name" '{($lang): .findings}' "$f" 2>/dev/null) || continue
    [[ -n "$part" ]] && fm_parts+="$part"$'\n'
  done
  if [[ -n "$fm_parts" ]]; then
    findings_map=$(printf '%s' "$fm_parts" | jq -s 'add // {}')
  fi
  # Merge findings into each scanner entry (only if we have valid findings_map)
  if [[ -n "$findings_map" && "$findings_map" != "{}" && "$findings_map" != "null" ]]; then
    echo "$base_json" | jq --argjson fm "$findings_map" '
      .scanners |= map(
        if .language and $fm[.language] then . + {findings: $fm[.language]} else . end
      )'
  else
    echo "$base_json"
  fi
  else
    echo "$base_json"
  fi
}

# generate_combined_json
# Materialize the merged per-language summary into COMBINED_JSON_FILE once;
# later callers reuse the cached file. Returns 1 when jq is unavailable.
generate_combined_json(){
  [[ -n "$COMBINED_JSON_FILE" ]] || return 1
  if [[ -s "$COMBINED_JSON_FILE" ]]; then return 0; fi
  if ! need_cmd jq; then return 1; fi
  merge_json_scanners >"$COMBINED_JSON_FILE" 2>/dev/null || return 1
  return 0
}

# merge_sarif_runs
# Fuse all per-language *.sarif files into one SARIF 2.1.0 document on stdout,
# attaching git provenance / automation details when available. Degrades
# gracefully: empty run list when nothing to merge, first artifact when jq is
# missing, and SIGPIPE from truncated consumers is not treated as an error.
merge_sarif_runs(){
  local sarifs=( "$TMPDIR_RUN"/*.sarif )
  # Check if any sarif files exist (glob might expand to literal if no matches)
  if [[ ${#sarifs[@]} -eq 0 ]] || [[ ! -f "${sarifs[0]}" ]]; then
    say "${YELLOW}${WARN}${RESET} No SARIF files found to merge"
    echo '{"version":"2.1.0","runs":[]}'
    return 0
  fi
  if ! need_cmd jq; then
    say "${YELLOW}${WARN}${RESET} jq not found; cannot merge SARIF; printing first artifact"
    cat "${sarifs[0]}"
    return 0
  fi
  # Filter to only valid JSON files
  local valid_sarifs=()
  for f in "${sarifs[@]}"; do
    if [[ -f "$f" ]] && jq -e . "$f" >/dev/null 2>&1; then
      valid_sarifs+=("$f")
    else
      say_err "${DIM}Skipping invalid SARIF: $f${RESET}"
    fi
  done
  if [[ ${#valid_sarifs[@]} -eq 0 ]]; then
    say "${YELLOW}${WARN}${RESET} No valid SARIF files to merge"
    echo '{"version":"2.1.0","runs":[]}'
    return 0
  fi
  # Accept either raw SARIF root or wrapped under "sarifLog"
  # Note: (... | add) // [] handles the case where add returns null (empty/null arrays)
  local jq_err="$TMPDIR_RUN/sarif-merge.err"
  if jq -s --arg repo "$GIT_REMOTE_HTTP" --arg rev "$GIT_COMMIT_SHA" --arg auto "$SARIF_AUTOMATION_ID" '
    def toRuns(x): if x.sarifLog? then (x.sarifLog.runs // []) elif x.version? and x.runs? then (x.runs // []) else [] end;
    def attachMeta(run):
      (if ($repo|length) > 0 then run + {versionControlProvenance:[{repositoryUri:$repo, revisionId:$rev}]} else run end)
      | (if ($auto|length) > 0 then . + {automationDetails:{id:$auto}} else . end);
    {"version":"2.1.0","runs": ((map(toRuns(.)) | add) // [] | map(attachMeta(.)))}' "${valid_sarifs[@]}" 2>"$jq_err"; then
    return 0
  fi
  # Common when the user truncates output: `ubs --format=sarif ... | head -n 20`.
  # Do not treat SIGPIPE/EPIPE as a fatal error.
  if grep -q "Broken pipe" "$jq_err" 2>/dev/null; then
    return 0
  fi
  say_err "${YELLOW}${WARN}${RESET} Failed to merge SARIF runs"
  cat "$jq_err" >&2 || true
  return 1
}

# write_jsonl_summary DEST
# Emit the combined results as JSONL: per-finding lines (when JSONL_DETAIL=1),
# per-scanner summary lines, and a final totals line. Writes to DEST when
# non-empty, otherwise to stdout.
write_jsonl_summary(){
  local dest="$1"
  if ! generate_combined_json; then return 1; fi
  local tmp="$TMPDIR_RUN/combined.jsonl"
  local ts="$(date_iso)"
  if ! need_cmd jq; then return 1; fi
  if [[ "${JSONL_DETAIL:-1}" -eq 1 ]]; then
    # Detailed mode: emit each finding as its own JSONL line
    jq -c --arg project "$SOURCE_PROJECT_DIR" --arg ts "$ts" '
      .scanners[] as $s | ($s.findings // [])[] | {type:"finding", project:$project, language:$s.language} + .
    ' "$COMBINED_JSON_FILE" >"$tmp" 2>/dev/null || true
    # Also emit scanner summaries
    jq -c --arg project "$SOURCE_PROJECT_DIR" --arg ts "$ts" '
      .scanners[] | {type:"scanner", project:$project, language, files, critical, warning, info, timestamp:(.timestamp // $ts)}
    ' "$COMBINED_JSON_FILE" >>"$tmp"
  else
    # Summary-only mode (legacy behavior)
    jq -c --arg project "$SOURCE_PROJECT_DIR" --arg ts "$ts" '
      .scanners[] | {type:"scanner", project:$project, language, files, critical, warning, info, timestamp:(.timestamp // $ts)}
    ' "$COMBINED_JSON_FILE" >"$tmp"
  fi
  # Always emit totals
  jq -c --arg project "$SOURCE_PROJECT_DIR" --arg ts "$ts" '
    {type:"totals", project:$project, files:(.totals.files//0), critical:(.totals.critical//0), warning:(.totals.warning//0), info:(.totals.info//0), timestamp:(.timestamp // $ts)}
  ' "$COMBINED_JSON_FILE" >>"$tmp"
  if [[ -n "$dest" ]]; then
    mkdir -p "$(dirname "$dest")"
    cp "$tmp" "$dest"
  else
    cat "$tmp"
  fi
}

# suggest_ignore_candidates
# Print top-level directories with more than `threshold` files that are not
# already covered by DEFAULT_IGNORES, as .ubsignore suggestions.
suggest_ignore_candidates(){
  local threshold=200
  IFS=',' read -r -a defaults <<<"$DEFAULT_IGNORES"
  say "${BLUE}${INFO}${RESET} Ignore suggestions (directories with >${threshold} files not already default-ignored):"
  find "$PROJECT_DIR" -maxdepth 1 -mindepth 1 -type d 2>/dev/null | while read -r d; do
    local base=$(basename "$d")
    local skip=0
    for df in "${defaults[@]}"; do [[ "$base" == "$df" ]] && skip=1; done
    [[ "$skip" -eq 1 ]] && continue
    local count=$(find "$d" -type f 2>/dev/null | wc -l | awk '{print $1+0}')
    if [[ "$count" -gt $threshold ]]; then
      say " ${GRAY}$base${RESET} (${count} files) → consider adding to .ubsignore"
    fi
  done
}

# ─────────────────────────────────────────────────────────────────────────────
# Banner & preflight
# ─────────────────────────────────────────────────────────────────────────────
# NOTE(review): the banner art's internal spacing appears mangled by source
# collapsing; it is cosmetic only (quoted heredoc, no expansion).
if [[ "${FORMAT:-text}" == "text" ]]; then
  say "${BOLD}${CYAN}"
  cat <<'BANNER'
╔══════════════════════════════════════════════════════════════════════════════╗
║ ██╗ ██╗██╗ ████████╗██╗███╗ ███╗ █████╗ ████████╗███████╗ ║
║ ██║ ██║██║ ╚══██╔══╝██║████╗ ████║██╔══██╗╚══██╔══╝██╔════╝ ║
║ ██║ ██║██║ ██║ ██║██╔████╔██║███████║ ██║ █████╗ ║
║ ██║ ██║██║ ██║ ██║██║╚██╔╝██║██╔══██║ ██║ ██╔══╝ ║
║ ╚██████╔╝███████╗██║ ██║██║ ╚═╝ ██║██║ ██║ ██║ ███████╗ ║
║ ╚═════╝ ╚══════╝╚═╝ ╚═╝╚═╝ ╚═╝╚═╝ ╚═╝ ╚═╝ ╚══════╝ ║
║ ║
║ ██████╗ ██╗ ██╗ ██████╗ __ __ ║
║ ██╔══██╗██║ ██║██╔════╝ \ `-'"-'` / ║
║ ██████╔╝██║ ██║██║ ███╗ / \_ _/ \ ║
║ ██╔══██╗██║ ██║██║ ██║ | d\_/b | ║
║ ██████╔╝╚██████╔╝╚██████╔╝ .'\ V /'. ║
║ ╚═════╝ ╚═════╝ ╚═════╝ / '-...-' \ ║
║ | / \ | ║
║ \/\ /\/ ║
║ ==(||)---(||)== ║
║ ║
║ ███████╗ ██████╗ █████╗ ███╗ ██╗███╗ ██╗███████╗██████╗ ║
║ ██╔════╝ ██╔═══╝ ██╔══██╗████╗ ██║████╗ ██║██╔════╝██╔══██╗ ║
║ ███████╗ ██║ ███████║██╔██╗ ██║██╔██╗ ██║█████╗ ██████╔╝ ║
║ ╚════██║ ██║ ██╔══██║██║╚██╗██║██║╚██╗██║██╔══╝ ██╔══██╗ ║
║ ███████║ ██████╗ ██║ ██║██║ ╚████║██║ ╚████║███████╗██║ ██║ ║
║ ╚══════╝ ╚═════╝ ╚═╝╚═╝ ╚═══╝╚═╝ ╚═══╝╚══════╝╚═╝ ╚═╝ ║
║ ║
║ JS / TS • PYTHON • C / C++ • RUST • GO • JAVA • RUBY • SWIFT • C# ║
║ UBS: ULTIMATE BUG SCANNER • SARIF FUSION ☄️ ║
║ ║
║ ║
║ Night Owl QA ║
║ “We see bugs before you do.” ║
╚══════════════════════════════════════════════════════════════════════════════╝
BANNER
  say "${RESET}"
fi
say "${CYAN}${BOLD}UBS Meta-Runner v${UBS_VERSION}${RESET} ${DIM}$(date_iso)${RESET}"
say "${WHITE}Project:${RESET} ${CYAN}$SOURCE_PROJECT_DIR${RESET}"
say "${WHITE}Format:${RESET} ${CYAN}$FORMAT${RESET}"
# Word-splitting is intentional here: select_langs echoes space-separated
# module names (no spaces within a name).
langs=( $(select_langs) )
if [[ ${#langs[@]} -eq 0 ]]; then
  say "${YELLOW}${WARN}${RESET} no recognizable languages in ${PROJECT_DIR}"
  exit 0
fi
say "${WHITE}Detected:${RESET} ${CYAN}${langs[*]}${RESET}"
# Ensure ast-grep is available for JS/TS runs (tool-cache auto-provisioning).
if [[ " ${langs[*]} " == *" js "* ]]; then if ensure_ast_grep; then export UBS_AST_GREP_BIN="$AST_GREP_BIN" if [[ "${QUIET:-0}" -eq 0 ]]; then say_err "${DIM}${INFO}${RESET} ast-grep (${AST_GREP_SOURCE}): ${AST_GREP_BIN}" fi else say_err "${RED}${X}${RESET} Environment error: ast-grep is required for accurate JS/TS scanning." say_err "${DIM}Fix: install ast-grep (https://ast-grep.github.io/) or run the UBS installer.${RESET}" if [[ "$FORMAT" == "json" || "$FORMAT" == "jsonl" || "$FORMAT" == "toon" ]]; then printf '{"error":"environment","exit_code":2,"failed_modules":["js"]}\n' fi exit 2 fi fi # Resolve & ensure modules declare -A MODULE_PATHS for L in "${langs[@]}"; do p="$(resolve_module_path "$L")" ensure_module "$L" "$p" || { say "${RED}$X failed to ensure module for $L${RESET}"; exit 1; } MODULE_PATHS["$L"]="$p" done # ───────────────────────────────────────────────────────────────────────────── # Execute modules concurrently # ───────────────────────────────────────────────────────────────────────────── declare -A PID_LANG=() pids=() for L in "${langs[@]}"; do run_lang "$L" "${MODULE_PATHS[$L]}" "$FORMAT" & pid=$! pids+=("$pid") PID_LANG["$pid"]="$L" done # Wait & collect statuses status=0 HAS_ENV_ERROR=0 ENV_ERROR_LANGS=() for pid in "${pids[@]}"; do rc=0 if wait "$pid"; then rc=0 else rc=$? 
fi if [[ "$rc" -eq 2 ]]; then HAS_ENV_ERROR=1 ENV_ERROR_LANGS+=("${PID_LANG[$pid]:-unknown}") fi if [[ "$rc" -gt "$status" ]]; then status="$rc" fi done # ───────────────────────────────────────────────────────────────────────────── # Environment error handling (exit code 2) # ───────────────────────────────────────────────────────────────────────────── env_error_excerpt(){ local lang="$1" local err_file="$TMPDIR_RUN/$lang.err" local txt_file="$TMPDIR_RUN/$lang.txt" if [[ -s "$err_file" ]]; then sed -E 's/\x1B\[[0-9;]*[mK]//g' "$err_file" | tail -n 50 return 0 fi if [[ -s "$txt_file" ]]; then sed -E 's/\x1B\[[0-9;]*[mK]//g' "$txt_file" \ | awk 'f{print} /Environment error:/{f=1}' \ | tail -n 50 fi } emit_env_error_report(){ say_err "${RED}${X}${RESET} Environment error: one or more scanners could not run correctly." say_err "${DIM}This is a tooling/dependency problem, not a code-quality failure.${RESET}" for lang in "${ENV_ERROR_LANGS[@]}"; do say_err "" say_err "${RED}${X}${RESET} ${BOLD}${lang}${RESET} (exit 2)" env_error_excerpt "$lang" | sed 's/^/ /' >&2 || true done } emit_env_error_json(){ local proj; proj="$(json_escape "${SOURCE_PROJECT_DIR:-$PROJECT_DIR}")" local modules_json="" local first=1 for lang in "${ENV_ERROR_LANGS[@]}"; do local lang_json; lang_json="$(json_escape "$lang")" if [[ $first -eq 1 ]]; then modules_json="\"$lang_json\"" first=0 else modules_json+=",\"$lang_json\"" fi done printf '{"error":"environment","exit_code":2,"project":"%s","failed_modules":[%s]}\n' "$proj" "$modules_json" } # ───────────────────────────────────────────────────────────────────────────── # Emit unified result # ───────────────────────────────────────────────────────────────────────────── case "$FORMAT" in json) if [[ "$HAS_ENV_ERROR" -eq 1 ]]; then emit_env_error_report emit_env_error_json status=2 else if generate_combined_json; then cat "$COMBINED_JSON_FILE" else if ! 
merge_json_scanners; then say "${RED}$X could not produce combined JSON${RESET}" [[ "$status" -lt 1 ]] && status=1 fi fi fi ;; jsonl) if [[ "$HAS_ENV_ERROR" -eq 1 ]]; then emit_env_error_report emit_env_error_json status=2 else if write_jsonl_summary ""; then : else say "${RED}$X could not produce JSONL output${RESET}" [[ "$status" -lt 1 ]] && status=1 fi fi ;; sarif) if [[ "$HAS_ENV_ERROR" -eq 1 ]]; then emit_env_error_report status=2 else merge_sarif_runs fi ;; toon) if [[ "$HAS_ENV_ERROR" -eq 1 ]]; then emit_env_error_report emit_env_error_json status=2 else # Check if TOON encoder is available (UBS_TEST_FORCE_NO_TOON=1 forces fallback for testing) # TOON_BIN can be set to toon_rust's tru binary for better performance toon_skip_reason="" if [[ "${UBS_TEST_FORCE_NO_TOON:-0}" == "1" ]]; then toon_skip_reason="disabled by UBS_TEST_FORCE_NO_TOON=1" elif ! command -v "$TOON_BIN" >/dev/null 2>&1; then toon_skip_reason="not found in PATH" elif ! looks_like_toon_rust_encoder "$TOON_BIN"; then toon_skip_reason="does not appear to be toon_rust (expected tru)" fi if [[ -z "$toon_skip_reason" ]]; then if generate_combined_json; then "$TOON_BIN" --encode < "$COMBINED_JSON_FILE" else if ! merge_json_scanners | "$TOON_BIN" --encode; then say "${RED}$X could not produce TOON output${RESET}" [[ "$status" -lt 1 ]] && status=1 fi fi else say_err "${YELLOW}Warning: $TOON_BIN (TOON encoder) $toon_skip_reason; falling back to --format=json${RESET}" if generate_combined_json; then cat "$COMBINED_JSON_FILE" else if ! 
merge_json_scanners; then say "${RED}$X could not produce combined JSON${RESET}" [[ "$status" -lt 1 ]] && status=1 fi fi fi fi ;; text|*) for L in "${langs[@]}"; do say "\n${MAGENTA}${BOLD}──────── $L ────────${RESET}" if [ -s "$TMPDIR_RUN/$L.txt" ]; then print_with_permalinks "$TMPDIR_RUN/$L.txt" elif [ -s "$TMPDIR_RUN/$L.json" ]; then say "${DIM}[json summary]${RESET}" cat "$TMPDIR_RUN/$L.json" elif [ -s "$TMPDIR_RUN/$L.sarif" ]; then say "${DIM}[sarif summary]${RESET}" cat "$TMPDIR_RUN/$L.sarif" fi done if [[ "$HAS_ENV_ERROR" -eq 1 ]]; then say "\n${RED}${BOLD}──────── Environment Error ────────${RESET}" say "${RED}${X}${RESET} One or more scanners could not run correctly (exit 2)." say "${DIM}This is a tooling/dependency problem, not a code-quality failure.${RESET}" say "${DIM}See the affected scanner output above for remediation guidance.${RESET}" status=2 else # Combined human summary (if JSON pieces exist) if need_cmd jq && ls "$TMPDIR_RUN"/*.json >/dev/null 2>&1; then say "\n${WHITE}${BOLD}──────── Combined Summary ────────${RESET}" if generate_combined_json; then jq -r '"Files: \(.totals.files)\nCritical: \(.totals.critical)\nWarning: \(.totals.warning)\nInfo: \(.totals.info)"' "$COMBINED_JSON_FILE" totals=$(jq -r '.totals' "$COMBINED_JSON_FILE") else merge_json_scanners | jq -r '"Files: \(.totals.files)\nCritical: \(.totals.critical)\nWarning: \(.totals.warning)\nInfo: \(.totals.info)"' totals=$(merge_json_scanners | jq -r '.totals') fi crit=$(printf '%s' "$totals" | jq -r '.critical') warn=$(printf '%s' "$totals" | jq -r '.warning') desired=0 if [[ "$FAIL_ON_WARNING" -eq 1 && $((crit+warn)) -gt 0 ]]; then desired=1; fi if [[ "$FAIL_ON_WARNING" -eq 0 && "$crit" -gt 0 ]]; then desired=1; fi if [[ "$desired" -gt "$status" ]]; then status="$desired"; fi fi fi ;; esac # Ensure exit status reflects merged totals in machine formats too. 
# Some modules emit machine output but always exit 0; the meta-runner should still fail
# when critical findings exist (or warnings in --fail-on-warning mode).
if [[ "$HAS_ENV_ERROR" -eq 0 && ( "$FORMAT" == "json" || "$FORMAT" == "jsonl" || "$FORMAT" == "sarif" || "$FORMAT" == "toon" ) ]]; then
  if need_cmd jq && generate_combined_json; then
    crit=$(jq -r '.totals.critical // 0' "$COMBINED_JSON_FILE" 2>/dev/null || echo 0)
    warn=$(jq -r '.totals.warning // 0' "$COMBINED_JSON_FILE" 2>/dev/null || echo 0)
    crit=${crit:-0}; warn=${warn:-0}
    desired=0
    if [[ "$FAIL_ON_WARNING" -eq 1 && $((crit + warn)) -gt 0 ]]; then desired=1; fi
    if [[ "$FAIL_ON_WARNING" -eq 0 && "$crit" -gt 0 ]]; then desired=1; fi
    # Only ever raise the status; never mask a worse module exit code.
    if [[ "$desired" -gt "$status" ]]; then status="$desired"; fi
  fi
fi
# Environment errors short-circuit all artifact generation.
if [[ "$HAS_ENV_ERROR" -eq 1 ]]; then
  [[ -n "$BEADS_JSONL_PATH" ]] && say_err "${YELLOW}${WARN}${RESET} Skipping Beads JSONL export due to environment error."
  [[ -n "$REPORT_JSON_PATH" || -n "$HTML_REPORT_PATH" || -n "$COMPARISON_FILE" ]] \
    && say_err "${YELLOW}${WARN}${RESET} Skipping shareable artifacts due to environment error."
  exit "$status"
fi
if [[ -n "$BEADS_JSONL_PATH" ]]; then
  if ! write_jsonl_summary "$BEADS_JSONL_PATH"; then
    say "${YELLOW}${WARN}${RESET} Could not write Beads JSONL to $BEADS_JSONL_PATH"
  else
    say "${DIM}${INFO}${RESET} Beads JSONL written to $BEADS_JSONL_PATH"
  fi
fi
# Shareable artifacts (JSON report / HTML report / baseline comparison) are
# built by an inline python3 program from the combined JSON.
SHAREABLE_REQUEST=0
if [[ "$HAS_ENV_ERROR" -eq 0 ]]; then
  [[ -n "$REPORT_JSON_PATH" || -n "$HTML_REPORT_PATH" || -n "$COMPARISON_FILE" ]] && SHAREABLE_REQUEST=1
fi
if [[ "$HAS_ENV_ERROR" -eq 0 && $SHAREABLE_REQUEST -eq 1 ]]; then
  if generate_combined_json; then
    SHAREABLE_JSON_FILE="$COMBINED_JSON_FILE"
    SHAREABLE_TIMESTAMP="$(date_iso)"
    if ! need_cmd python3; then
      say "${YELLOW}${WARN}${RESET} python3 not available; cannot build shareable artifacts"
    else
      # Heredoc program; 1>&2 keeps its status print off the machine-format
      # stdout stream.
      python3 - "$SHAREABLE_JSON_FILE" "${COMPARISON_FILE:-}" \
        "${REPORT_JSON_PATH:-}" "${HTML_REPORT_PATH:-}" \
        "${GIT_REMOTE_HTTP:-}" "${GIT_COMMIT_SHA:-}" "${GIT_BLOB_BASE:-}" \
        "$SHAREABLE_TIMESTAMP" <<'PY' 1>&2
import json, sys, pathlib, datetime, html
combined_path, baseline_path, out_json, out_html, repo_url, commit, blob_base, ts = sys.argv[1:9]
root = pathlib.Path(combined_path)
if not root.exists():
    sys.exit(0)
combined = json.loads(root.read_text())
def load_optional(path):
    # Best-effort load of an optional JSON file; None on any failure.
    if not path:
        return None
    p = pathlib.Path(path)
    if not p.exists():
        return None
    try:
        return json.loads(p.read_text())
    except Exception:
        return None
baseline = load_optional(baseline_path)
shareable = combined.copy()
shareable["generated_at"] = ts
if repo_url:
    git = {"repository": repo_url}
    if commit:
        git["commit"] = commit
    if blob_base:
        git["blob_base"] = blob_base
    shareable["git"] = git
def get_totals(doc):
    # Coerce the totals block to ints, tolerating missing/None values.
    if not doc:
        return {"files":0,"critical":0,"warning":0,"info":0}
    t = doc.get("totals", {})
    return {
        "files": int(t.get("files", 0) or 0),
        "critical": int(t.get("critical", 0) or 0),
        "warning": int(t.get("warning", 0) or 0),
        "info": int(t.get("info", 0) or 0),
    }
cur_totals = get_totals(combined)
base_totals = get_totals(baseline)
if baseline is not None:
    shareable["comparison"] = {
        "baseline_path": baseline_path,
        "delta": {
            "critical": cur_totals["critical"] - base_totals["critical"],
            "warning": cur_totals["warning"] - base_totals["warning"],
            "info": cur_totals["info"] - base_totals["info"],
        },
        "baseline_totals": base_totals,
    }
if out_json:
    out_path = pathlib.Path(out_json)
    out_path.parent.mkdir(parents=True, exist_ok=True)
    out_path.write_text(json.dumps(shareable, indent=2), encoding="utf-8")
if out_html:
    # NOTE(review): the HTML markup in the f-strings below appears truncated
    # in this source — table/row tags seem to have been stripped, leaving
    # only the cell text. Preserved verbatim; restore from upstream.
    totals_html = f"""
MetricCurrentBaselineΔ
Critical{cur_totals['critical']}{base_totals['critical']}{cur_totals['critical']-base_totals['critical']}
Warning{cur_totals['warning']}{base_totals['warning']}{cur_totals['warning']-base_totals['warning']}
Info{cur_totals['info']}{base_totals['info']}{cur_totals['info']-base_totals['info']}
"""
    scanners = shareable.get("scanners", [])
    scanner_rows = []
    for entry in scanners:
        lang = entry.get("language", "-")
        ct = entry.get("critical", entry.get("totals", {}).get("critical"))
        wt = entry.get("warning", entry.get("totals", {}).get("warning"))
        it = entry.get("info", entry.get("totals", {}).get("info"))
        scanner_rows.append(f"{html.escape(str(lang))}{ct or 0}{wt or 0}{it or 0}")
    scanners_html = "\n".join(scanner_rows)
    # NOTE(review): same truncation applies to this document template.
    doc = f"""
UBS Report

Ultimate Bug Scanner Report

Generated {html.escape(ts)}
{totals_html}

Per-language totals

{scanners_html}
LanguageCriticalWarningInfo
"""
    out_path = pathlib.Path(out_html)
    out_path.parent.mkdir(parents=True, exist_ok=True)
    out_path.write_text(doc, encoding="utf-8")
print(f"Shareable summary written (critical={cur_totals['critical']}, warning={cur_totals['warning']}, info={cur_totals['info']})")
PY
    fi
  else
    say "${YELLOW}${WARN}${RESET} jq not available; cannot build shareable artifacts"
  fi
fi
exit "$status"