From 47c7371f1dd952ef0cc5283114aa30395e264658 Mon Sep 17 00:00:00 2001
From: Mauricio Gomes <mauricio@edge14.com>
Date: Sat, 21 Feb 2026 13:01:41 -0500
Subject: [PATCH 01/26] add performance and benchmarking roadmap track

---
 ROADMAP.md | 51 +++++++++++++++++++++++++++++++++++++++++++++++++++
 1 file changed, 51 insertions(+)

diff --git a/ROADMAP.md b/ROADMAP.md
index 7f51d9b..771ecbd 100644
--- a/ROADMAP.md
+++ b/ROADMAP.md
@@ -367,3 +367,54 @@ Goal: lock the language and embedding API for long-term support.
 - [x] Zero known P0/P1 correctness bugs.
 - [x] CI green across supported platforms and Go versions.
 - [x] Release process rehearsed and repeatable.
+
+---
+
+## v1.1.0 - Performance and Benchmarking
+
+Goal: make performance improvements measurable, repeatable, and protected against regressions.
+
+### Runtime Performance
+
+- [ ] Profile evaluator hotspots and prioritize top 3 CPU paths by cumulative time.
+- [ ] Reduce `Script.Call` overhead for short-running scripts (frame/env setup and teardown).
+- [ ] Optimize method dispatch and member access fast paths.
+- [ ] Reduce allocations in common collection transforms (`map`, `select`, `reduce`, `chunk`, `window`).
+- [ ] Optimize typed argument/return validation for nested composite types.
+
+### Memory and Allocation Discipline
+
+- [ ] Reduce transient allocations in stdlib JSON/Regex/String helper paths.
+- [ ] Reduce temporary map/array churn in module and capability boundary code paths.
+- [ ] Add per-benchmark allocation targets (`allocs/op`) for hot runtime paths.
+- [ ] Add focused regression tests for high-allocation call patterns.
+
+### Benchmark Coverage
+
+- [ ] Expand benchmark suite for compile, call, control-flow, and typed-runtime workloads.
+- [ ] Add capability-heavy benchmarks (db/events/context adapters + contract validation).
+- [ ] Add module-system benchmarks (`require`, cache hits, cache misses, cycle paths).
+- [ ] Add stdlib benchmarks for JSON/Regex/Time/String/Array/Hash hot operations.
+- [ ] Add representative end-to-end benchmarks using `tests/complex/*.vibe` workloads.
+
+### Benchmark Tooling and CI
+
+- [ ] Add a single benchmark runner command/script with stable flags and output format.
+- [ ] Persist benchmark baselines in versioned artifacts for release comparison.
+- [ ] Add PR-time benchmark smoke checks with threshold-based alerts.
+- [ ] Add scheduled full benchmark runs with trend reporting.
+- [ ] Document benchmark interpretation and triage workflow.
+
+### Profiling and Diagnostics
+
+- [ ] Add reproducible CPU profile capture workflow for compile and runtime benchmarks.
+- [ ] Add memory profile capture workflow for allocation-heavy scenarios.
+- [ ] Add flamegraph generation instructions and hotspot triage checklist.
+- [ ] Add a short "performance playbook" for validating optimizations before merge.
+
+### v1.1.0 Definition of Done
+
+- [ ] Benchmarks cover runtime, capability, module, and stdlib hot paths.
+- [ ] CI reports benchmark deltas for guarded smoke benchmarks.
+- [ ] Measurable improvements are achieved versus v1.0.0 baselines.
+- [ ] Performance and benchmarking workflows are documented and maintainable.

From 368a3fc331956096374c8b6eb4a270b70cceb3d3 Mon Sep 17 00:00:00 2001
From: Mauricio Gomes <mauricio@edge14.com>
Date: Sat, 21 Feb 2026 13:13:42 -0500
Subject: [PATCH 02/26] add stable benchmark runner script and tooling docs

---
 Justfile                 |  2 +-
 docs/tooling.md          | 17 +++++++
 scripts/bench_runtime.sh | 98 ++++++++++++++++++++++++++++++++++++++++
 3 files changed, 116 insertions(+), 1 deletion(-)
 create mode 100755 scripts/bench_runtime.sh

diff --git a/Justfile b/Justfile
index 7df0e2a..ceabbac 100644
--- a/Justfile
+++ b/Justfile
@@ -4,7 +4,7 @@ test:
 	go test ./...
 
 bench:
-	go test ./vibes -run '^$' -bench '^BenchmarkExecution' -benchmem
+	scripts/bench_runtime.sh
 
 lint:
 	gofmt -l . | (! read)
diff --git a/docs/tooling.md b/docs/tooling.md
index bb903fa..52d71ff 100644
--- a/docs/tooling.md
+++ b/docs/tooling.md
@@ -66,3 +66,20 @@ REPL command set:
 
 - `:help`, `:vars`, `:globals`, `:functions`, `:types`
 - `:last_error`, `:clear`, `:reset`, `:quit`
+
+## Benchmark Runner
+
+Use the benchmark runner script for stable local perf baselines.
+
+```bash
+scripts/bench_runtime.sh
+```
+
+Common options:
+
+- `--pattern '^BenchmarkExecution(ArrayPipeline|TallyLoop)$'`
+- `--count 5`
+- `--benchtime 2s`
+- `--out benchmarks/array_vs_tally.txt`
+
+The script is also wired into `just bench`.
diff --git a/scripts/bench_runtime.sh b/scripts/bench_runtime.sh
new file mode 100755
index 0000000..7032c5a
--- /dev/null
+++ b/scripts/bench_runtime.sh
@@ -0,0 +1,98 @@
+#!/usr/bin/env bash
+set -euo pipefail
+
+usage() {
+  cat >&2 <<'EOF'
+usage: scripts/bench_runtime.sh [options]
+
+Runs VibeScript Go benchmarks with stable defaults and records output.
+
+options:
+  --count <n>        Benchmark count (default: 3)
+  --benchtime <dur>  Benchtime passed to `go test` (default: 1s)
+  --pattern <regex>  Benchmark regex (default: ^BenchmarkExecution)
+  --package <path>   Go package to benchmark (default: ./vibes)
+  --cpu <list>       CPU list for `go test -cpu` (default: 1)
+  --out <file>       Output file (default: benchmarks/latest.txt)
+  -h, --help         Show this help
+EOF
+}
+
+count="3"
+benchtime="1s"
+pattern="^BenchmarkExecution"
+pkg="./vibes"
+cpu="1"
+out_file="benchmarks/latest.txt"
+
+while [[ $# -gt 0 ]]; do
+  case "$1" in
+    --count)
+      count="${2:-}"
+      shift 2
+      ;;
+    --benchtime)
+      benchtime="${2:-}"
+      shift 2
+      ;;
+    --pattern)
+      pattern="${2:-}"
+      shift 2
+      ;;
+    --package)
+      pkg="${2:-}"
+      shift 2
+      ;;
+    --cpu)
+      cpu="${2:-}"
+      shift 2
+      ;;
+    --out)
+      out_file="${2:-}"
+      shift 2
+      ;;
+    -h|--help)
+      usage
+      exit 0
+      ;;
+    *)
+      echo "unknown argument: $1" >&2
+      usage
+      exit 2
+      ;;
+  esac
+done
+
+mkdir -p "$(dirname "$out_file")"
+
+go_version="$(go version)"
+git_commit="$(git rev-parse --short HEAD 2>/dev/null || echo unknown)"
+timestamp="$(date -u +%Y-%m-%dT%H:%M:%SZ)"
+
+command=(
+  go test "$pkg"
+  -run '^$'
+  -bench "$pattern"
+  -benchmem
+  -count "$count"
+  -benchtime "$benchtime"
+  -cpu "$cpu"
+)
+
+{
+  echo "# VibeScript benchmark run"
+  echo "# timestamp: $timestamp"
+  echo "# git_commit: $git_commit"
+  echo "# go_version: $go_version"
+  echo "# package: $pkg"
+  echo "# bench_pattern: $pattern"
+  echo "# count: $count"
+  echo "# benchtime: $benchtime"
+  echo "# cpu: $cpu"
+  echo "# command: ${command[*]}"
+  echo
+  "${command[@]}"
+} | tee "$out_file"
+
+echo
+echo "benchmark output written to $out_file"

From fb9313359da32bc3c769d96cf86ed224f86b0d3e Mon Sep 17 00:00:00 2001
From: Mauricio Gomes <mauricio@edge14.com>
Date: Sat, 21 Feb 2026 13:15:46 -0500
Subject: [PATCH 03/26] retarget performance roadmap milestone to pre-1.0 track

---
 ROADMAP.md | 6 +++---
 1 file changed, 3 insertions(+), 3 deletions(-)

diff --git a/ROADMAP.md b/ROADMAP.md
index 771ecbd..f6c6385 100644
--- a/ROADMAP.md
+++ b/ROADMAP.md
@@ -370,7 +370,7 @@ Goal: lock the language and embedding API for long-term support.
 
 ---
 
-## v1.1.0 - Performance and Benchmarking
+## v0.20.0 - Performance and Benchmarking (1.0 Push)
 
 Goal: make performance improvements measurable, repeatable, and protected against regressions.
 
@@ -412,9 +412,9 @@ Goal: make performance improvements measurable, repeatable, and protected agains
 - [ ] Add flamegraph generation instructions and hotspot triage checklist.
 - [ ] Add a short "performance playbook" for validating optimizations before merge.
 
-### v1.1.0 Definition of Done
+### v0.20.0 Definition of Done
 
 - [ ] Benchmarks cover runtime, capability, module, and stdlib hot paths.
 - [ ] CI reports benchmark deltas for guarded smoke benchmarks.
-- [ ] Measurable improvements are achieved versus v1.0.0 baselines.
+- [ ] Measurable improvements are achieved before the v1.0.0 release tag.
 - [ ] Performance and benchmarking workflows are documented and maintainable.

From 293063c0b656f2f36c2e03e621ca398289eb0c15 Mon Sep 17 00:00:00 2001
From: Mauricio Gomes <mauricio@edge14.com>
Date: Sat, 21 Feb 2026 13:19:37 -0500
Subject: [PATCH 04/26] add benchmark smoke thresholds and CI gate

---
 .github/workflows/benchmarks.yml |  5 +-
 ROADMAP.md                       |  4 +-
 benchmarks/smoke_thresholds.txt  | 13 +++++
 docs/tooling.md                  | 12 ++++
 scripts/bench_smoke_check.sh     | 99 ++++++++++++++++++++++++++++++++
 5 files changed, 130 insertions(+), 3 deletions(-)
 create mode 100644 benchmarks/smoke_thresholds.txt
 create mode 100755 scripts/bench_smoke_check.sh

diff --git a/.github/workflows/benchmarks.yml b/.github/workflows/benchmarks.yml
index b792d9a..cb7d685 100644
--- a/.github/workflows/benchmarks.yml
+++ b/.github/workflows/benchmarks.yml
@@ -18,10 +18,13 @@ jobs:
         with:
           go-version-file: go.mod
 
+      - name: Benchmark smoke gates
+        run: ./scripts/bench_smoke_check.sh
+
       - name: Run benchmarks
         run: |
           mkdir -p .bench
-          go test ./vibes -run '^$' -bench '^BenchmarkExecution' -benchmem | tee .bench/benchmark.txt
+          scripts/bench_runtime.sh --count 1 --out .bench/benchmark.txt
 
       - name: Publish benchmark summary
         run: |
diff --git a/ROADMAP.md b/ROADMAP.md
index f6c6385..2104fbb 100644
--- a/ROADMAP.md
+++ b/ROADMAP.md
@@ -399,9 +399,9 @@ Goal: make performance improvements measurable, repeatable, and protected agains
 
 ### Benchmark Tooling and CI
 
-- [ ] Add a single benchmark runner command/script with stable flags and output format.
+- [x] Add a single benchmark runner command/script with stable flags and output format.
 - [ ] Persist benchmark baselines in versioned artifacts for release comparison.
-- [ ] Add PR-time benchmark smoke checks with threshold-based alerts.
+- [x] Add PR-time benchmark smoke checks with threshold-based alerts.
 - [ ] Add scheduled full benchmark runs with trend reporting.
 - [ ] Document benchmark interpretation and triage workflow.
 
diff --git a/benchmarks/smoke_thresholds.txt b/benchmarks/smoke_thresholds.txt
new file mode 100644
index 0000000..bb2391f
--- /dev/null
+++ b/benchmarks/smoke_thresholds.txt
@@ -0,0 +1,13 @@
+# Benchmark smoke thresholds for CI guardrails.
+# Format:
+# <benchmark_name> <max_ns_per_op> <max_allocs_per_op>
+#
+# Keep thresholds intentionally loose enough to avoid platform flake,
+# but tight enough to catch obvious regressions.
+
+BenchmarkExecutionArithmeticLoop 5000000 1000
+BenchmarkExecutionMethodDispatchLoop 8000000 6000
+BenchmarkExecutionCapabilityFindLoop 12000000 9000
+BenchmarkExecutionJSONStringifyLoop 3000000 4000
+BenchmarkExecutionRegexReplaceAllLoop 4000000 4000
+BenchmarkExecutionTallyLoop 10000000 2000
diff --git a/docs/tooling.md b/docs/tooling.md
index 52d71ff..9634614 100644
--- a/docs/tooling.md
+++ b/docs/tooling.md
@@ -83,3 +83,15 @@ Common options:
 - `--out benchmarks/array_vs_tally.txt`
 
 The script is also wired into `just bench`.
+
+## Benchmark Smoke Gates
+
+Use the smoke-check script to catch obvious performance regressions before
+running the full suite:
+
+```bash
+scripts/bench_smoke_check.sh
+```
+
+Thresholds live in `benchmarks/smoke_thresholds.txt` and are checked against
+both `ns/op` and `allocs/op`.
diff --git a/scripts/bench_smoke_check.sh b/scripts/bench_smoke_check.sh
new file mode 100755
index 0000000..90dca43
--- /dev/null
+++ b/scripts/bench_smoke_check.sh
@@ -0,0 +1,99 @@
+#!/usr/bin/env bash
+set -euo pipefail
+
+threshold_file="${1:-benchmarks/smoke_thresholds.txt}"
+
+if [[ ! -f "$threshold_file" ]]; then
+  echo "threshold file not found: $threshold_file" >&2
+  exit 2
+fi
+
+declare -A max_ns
+declare -A max_allocs
+benchmarks=()
+
+while read -r name ns allocs; do
+  if [[ -z "${name:-}" || "${name:0:1}" == "#" ]]; then
+    continue
+  fi
+  benchmarks+=("$name")
+  max_ns["$name"]="$ns"
+  max_allocs["$name"]="$allocs"
+done < "$threshold_file"
+
+if [[ ${#benchmarks[@]} -eq 0 ]]; then
+  echo "no benchmark thresholds configured in $threshold_file" >&2
+  exit 2
+fi
+
+pattern="^($(IFS='|'; echo "${benchmarks[*]}"))$"
+tmp_out="$(mktemp)"
+trap 'rm -f "$tmp_out"' EXIT
+
+go test ./vibes \
+  -run '^$' \
+  -bench "$pattern" \
+  -benchmem \
+  -count 1 \
+  -benchtime 100ms \
+  -cpu 1 | tee "$tmp_out"
+
+declare -A actual_ns
+declare -A actual_allocs
+
+while read -r bench ns allocs; do
+  actual_ns["$bench"]="$ns"
+  actual_allocs["$bench"]="$allocs"
+done < <(
+  awk '
+    /^Benchmark/ {
+      bench=$1
+      sub(/-[0-9]+$/, "", bench)
+      ns=""
+      allocs=""
+      for (i = 1; i <= NF; i++) {
+        if ($i == "ns/op") ns=$(i-1)
+        if ($i == "allocs/op") allocs=$(i-1)
+      }
+      if (bench != "" && ns != "" && allocs != "") {
+        print bench, ns, allocs
+      }
+    }
+  ' "$tmp_out"
+)
+
+failures=0
+
+echo
+printf "%-40s %12s %12s %12s %12s\n" "Benchmark" "ns/op" "max_ns/op" "allocs/op" "max_allocs"
+for bench in "${benchmarks[@]}"; do
+  ns="${actual_ns[$bench]:-}"
+  allocs="${actual_allocs[$bench]:-}"
+  max_ns_value="${max_ns[$bench]}"
+  max_allocs_value="${max_allocs[$bench]}"
+
+  if [[ -z "$ns" || -z "$allocs" ]]; then
+    echo "missing benchmark result for $bench" >&2
+    failures=$((failures + 1))
+    continue
+  fi
+
+  printf "%-40s %12s %12s %12s %12s\n" "$bench" "$ns" "$max_ns_value" "$allocs" "$max_allocs_value"
+
+  if (( ns > max_ns_value )); then
+    echo "regression: $bench ns/op $ns exceeds $max_ns_value" >&2
+    failures=$((failures + 1))
+  fi
+  if (( allocs > max_allocs_value )); then
+    echo "regression: $bench allocs/op $allocs exceeds $max_allocs_value" >&2
+    failures=$((failures + 1))
+  fi
+done
+
+if (( failures > 0 )); then
+  echo "benchmark smoke check failed ($failures regression signals)" >&2
+  exit 1
+fi
+
+echo
+echo "benchmark smoke check passed"

From cbe5e6a8fbb672a9f86ff720daaf5277ad040a89 Mon Sep 17 00:00:00 2001
From: Mauricio Gomes <mauricio@edge14.com>
Date: Sat, 21 Feb 2026 13:20:45 -0500
Subject: [PATCH 05/26] add benchmark profile capture workflow and docs

---
 Justfile                 |   3 ++
 ROADMAP.md               |   4 +-
 docs/tooling.md          |  21 ++++++++
 scripts/bench_profile.sh | 111 +++++++++++++++++++++++++++++++++++++++
 4 files changed, 137 insertions(+), 2 deletions(-)
 create mode 100755 scripts/bench_profile.sh

diff --git a/Justfile b/Justfile
index ceabbac..3381d10 100644
--- a/Justfile
+++ b/Justfile
@@ -6,6 +6,9 @@ test:
 bench:
 	scripts/bench_runtime.sh
 
+bench-profile pattern='^BenchmarkExecutionArrayPipeline$':
+	scripts/bench_profile.sh --pattern "{{pattern}}"
+
 lint:
 	gofmt -l . | (! read)
 	golangci-lint run --timeout=10m
diff --git a/ROADMAP.md b/ROADMAP.md
index 2104fbb..97a405a 100644
--- a/ROADMAP.md
+++ b/ROADMAP.md
@@ -407,8 +407,8 @@ Goal: make performance improvements measurable, repeatable, and protected agains
 
 ### Profiling and Diagnostics
 
-- [ ] Add reproducible CPU profile capture workflow for compile and runtime benchmarks.
-- [ ] Add memory profile capture workflow for allocation-heavy scenarios.
+- [x] Add reproducible CPU profile capture workflow for compile and runtime benchmarks.
+- [x] Add memory profile capture workflow for allocation-heavy scenarios.
 - [ ] Add flamegraph generation instructions and hotspot triage checklist.
 - [ ] Add a short "performance playbook" for validating optimizations before merge.
 
diff --git a/docs/tooling.md b/docs/tooling.md
index 9634614..707c81f 100644
--- a/docs/tooling.md
+++ b/docs/tooling.md
@@ -95,3 +95,24 @@ scripts/bench_smoke_check.sh
 
 Thresholds live in `benchmarks/smoke_thresholds.txt` and are checked against
 both `ns/op` and `allocs/op`.
+
+## Benchmark Profiling
+
+Capture benchmark CPU/memory profiles plus `pprof` top summaries:
+
+```bash
+scripts/bench_profile.sh --pattern '^BenchmarkExecutionArrayPipeline$'
+```
+
+Artifacts are written under `benchmarks/profiles/<timestamp>/`:
+
+- `bench.txt`
+- `cpu.out`, `cpu.top.txt`
+- `mem.out`, `mem.top.txt`
+- `meta.txt`
+
+This is also available as:
+
+```bash
+just bench-profile
+```
diff --git a/scripts/bench_profile.sh b/scripts/bench_profile.sh
new file mode 100755
index 0000000..4a9b2b1
--- /dev/null
+++ b/scripts/bench_profile.sh
@@ -0,0 +1,111 @@
+#!/usr/bin/env bash
+set -euo pipefail
+
+usage() {
+  cat >&2 <<'EOF'
+usage: scripts/bench_profile.sh [options]
+
+Runs a benchmark with CPU and memory profiles and writes profile summaries.
+
+options:
+  --pattern <regex>   Benchmark regex (default: ^BenchmarkExecutionArrayPipeline$)
+  --package <path>    Go package to benchmark (default: ./vibes)
+  --benchtime <dur>   Benchtime passed to `go test` (default: 1s)
+  --count <n>         Benchmark count (default: 1)
+  --cpu <list>        CPU list for `go test -cpu` (default: 1)
+  --outdir <path>     Output directory (default: benchmarks/profiles/<timestamp>)
+  -h, --help          Show this help
+EOF
+}
+
+pattern="^BenchmarkExecutionArrayPipeline$"
+pkg="./vibes"
+benchtime="1s"
+count="1"
+cpu="1"
+timestamp="$(date -u +%Y%m%dT%H%M%SZ)"
+outdir="benchmarks/profiles/${timestamp}"
+
+while [[ $# -gt 0 ]]; do
+  case "$1" in
+    --pattern)
+      pattern="${2:-}"
+      shift 2
+      ;;
+    --package)
+      pkg="${2:-}"
+      shift 2
+      ;;
+    --benchtime)
+      benchtime="${2:-}"
+      shift 2
+      ;;
+    --count)
+      count="${2:-}"
+      shift 2
+      ;;
+    --cpu)
+      cpu="${2:-}"
+      shift 2
+      ;;
+    --outdir)
+      outdir="${2:-}"
+      shift 2
+      ;;
+    -h|--help)
+      usage
+      exit 0
+      ;;
+    *)
+      echo "unknown argument: $1" >&2
+      usage
+      exit 2
+      ;;
+  esac
+done
+
+mkdir -p "$outdir"
+
+bench_out="${outdir}/bench.txt"
+cpu_profile="${outdir}/cpu.out"
+mem_profile="${outdir}/mem.out"
+cpu_top="${outdir}/cpu.top.txt"
+mem_top="${outdir}/mem.top.txt"
+meta="${outdir}/meta.txt"
+
+command=(
+  go test "$pkg"
+  -run '^$'
+  -bench "$pattern"
+  -benchmem
+  -count "$count"
+  -benchtime "$benchtime"
+  -cpu "$cpu"
+  -cpuprofile "$cpu_profile"
+  -memprofile "$mem_profile"
+)
+
+{
+  echo "timestamp=${timestamp}"
+  echo "pattern=${pattern}"
+  echo "package=${pkg}"
+  echo "benchtime=${benchtime}"
+  echo "count=${count}"
+  echo "cpu=${cpu}"
+  echo "go_version=$(go version)"
+  echo "git_commit=$(git rev-parse --short HEAD 2>/dev/null || echo unknown)"
+  echo "command=${command[*]}"
+} > "$meta"
+
+"${command[@]}" | tee "$bench_out"
+
+go tool pprof -top -nodecount=60 "$cpu_profile" > "$cpu_top"
+go tool pprof -top -nodecount=60 "$mem_profile" > "$mem_top"
+
+echo
+echo "profile output written to ${outdir}"
+echo "  bench: ${bench_out}"
+echo "  cpu profile: ${cpu_profile}"
+echo "  mem profile: ${mem_profile}"
+echo "  cpu top: ${cpu_top}"
+echo "  mem top: ${mem_top}"

From c6c221fdfe7367380f28d5c156fe9de6e4967e8a Mon Sep 17 00:00:00 2001
From: Mauricio Gomes <mauricio@edge14.com>
Date: Sat, 21 Feb 2026 13:53:29 -0500
Subject: [PATCH 06/26] expand benchmark coverage across runtime workloads

---
 benchmarks/smoke_thresholds.txt     |   5 +
 scripts/bench_runtime.sh            |   4 +-
 vibes/execution_benchmark_test.go   |   5 +-
 vibes/performance_benchmark_test.go | 373 ++++++++++++++++++++++++++++
 4 files changed, 384 insertions(+), 3 deletions(-)
 create mode 100644 vibes/performance_benchmark_test.go

diff --git a/benchmarks/smoke_thresholds.txt b/benchmarks/smoke_thresholds.txt
index bb2391f..f3df605 100644
--- a/benchmarks/smoke_thresholds.txt
+++ b/benchmarks/smoke_thresholds.txt
@@ -6,8 +6,13 @@
 # but tight enough to catch obvious regressions.
 
 BenchmarkExecutionArithmeticLoop 5000000 1000
+BenchmarkExecutionArrayPipeline 30000000 20000
 BenchmarkExecutionMethodDispatchLoop 8000000 6000
 BenchmarkExecutionCapabilityFindLoop 12000000 9000
+BenchmarkExecutionCapabilityWorkflowLoop 14000000 15000
+BenchmarkExecutionJSONParseLoop 3000000 5000
 BenchmarkExecutionJSONStringifyLoop 3000000 4000
 BenchmarkExecutionRegexReplaceAllLoop 4000000 4000
 BenchmarkExecutionTallyLoop 10000000 2000
+BenchmarkCallShortScript 20000 60
+BenchmarkModuleRequireCacheHit 120000 220
diff --git a/scripts/bench_runtime.sh b/scripts/bench_runtime.sh
index 7032c5a..c8fbad5 100755
--- a/scripts/bench_runtime.sh
+++ b/scripts/bench_runtime.sh
@@ -10,7 +10,7 @@ Runs VibeScript Go benchmarks with stable defaults and records output.
 options:
   --count <n>        Benchmark count (default: 3)
   --benchtime <dur>  Benchtime passed to `go test` (default: 1s)
-  --pattern <regex>  Benchmark regex (default: ^BenchmarkExecution)
+  --pattern <regex>  Benchmark regex (default: ^Benchmark)
   --package <path>   Go package to benchmark (default: ./vibes)
   --cpu <list>       CPU list for `go test -cpu` (default: 1)
   --out <file>       Output file (default: benchmarks/latest.txt)
@@ -20,7 +20,7 @@ EOF
 
 count="3"
 benchtime="1s"
-pattern="^BenchmarkExecution"
+pattern="^Benchmark"
 pkg="./vibes"
 cpu="1"
 out_file="benchmarks/latest.txt"
diff --git a/vibes/execution_benchmark_test.go b/vibes/execution_benchmark_test.go
index 01396ac..09d8162 100644
--- a/vibes/execution_benchmark_test.go
+++ b/vibes/execution_benchmark_test.go
@@ -8,7 +8,10 @@ import (
 type benchmarkDBCapability struct{}
 
 func (benchmarkDBCapability) Find(ctx context.Context, req DBFindRequest) (Value, error) {
-	return NewHash(map[string]Value{"score": NewInt(1)}), nil
+	return NewHash(map[string]Value{
+		"id":    req.ID,
+		"score": NewInt(1),
+	}), nil
 }
 
 func (benchmarkDBCapability) Query(ctx context.Context, req DBQueryRequest) (Value, error) {
diff --git a/vibes/performance_benchmark_test.go b/vibes/performance_benchmark_test.go
new file mode 100644
index 0000000..356bf10
--- /dev/null
+++ b/vibes/performance_benchmark_test.go
@@ -0,0 +1,373 @@
+package vibes
+
+import (
+	"context"
+	"os"
+	"path/filepath"
+	"testing"
+)
+
+type benchmarkEventsCapability struct{}
+
+func (benchmarkEventsCapability) Publish(ctx context.Context, req EventPublishRequest) (Value, error) {
+	return NewHash(map[string]Value{
+		"topic": NewString(req.Topic),
+		"ok":    NewBool(true),
+	}), nil
+}
+
+func benchmarkContextResolver(context.Context) (Value, error) {
+	return NewHash(map[string]Value{
+		"player_id": NewString("player-1"),
+		"tenant_id": NewString("tenant-1"),
+	}), nil
+}
+
+func benchmarkSourceFromFile(b *testing.B, rel string) string {
+	b.Helper()
+	path := filepath.Join("..", filepath.FromSlash(rel))
+	source, err := os.ReadFile(path)
+	if err != nil {
+		b.Fatalf("read %s: %v", path, err)
+	}
+	return string(source)
+}
+
+func benchmarkEngineWithModules() *Engine {
+	return MustNewEngine(Config{
+		StepQuota:        2_000_000,
+		MemoryQuotaBytes: 2 << 20,
+		ModulePaths:      []string{filepath.FromSlash("testdata/modules")},
+	})
+}
+
+func BenchmarkCompileControlFlowWorkload(b *testing.B) {
+	source := benchmarkSourceFromFile(b, "tests/complex/loops.vibe")
+	engine := benchmarkEngine()
+
+	b.ReportAllocs()
+	b.ResetTimer()
+	for range b.N {
+		if _, err := engine.Compile(source); err != nil {
+			b.Fatalf("compile failed: %v", err)
+		}
+	}
+}
+
+func BenchmarkCompileTypedWorkload(b *testing.B) {
+	source := benchmarkSourceFromFile(b, "tests/complex/typed.vibe")
+	engine := benchmarkEngine()
+
+	b.ReportAllocs()
+	b.ResetTimer()
+	for range b.N {
+		if _, err := engine.Compile(source); err != nil {
+			b.Fatalf("compile failed: %v", err)
+		}
+	}
+}
+
+func BenchmarkCompileMassiveWorkload(b *testing.B) {
+	source := benchmarkSourceFromFile(b, "tests/complex/massive.vibe")
+	engine := benchmarkEngine()
+
+	b.ReportAllocs()
+	b.ResetTimer()
+	for range b.N {
+		if _, err := engine.Compile(source); err != nil {
+			b.Fatalf("compile failed: %v", err)
+		}
+	}
+}
+
+func BenchmarkCallShortScript(b *testing.B) {
+	script := compileScriptWithEngine(b, benchmarkEngine(), `def run
+  1
+end`)
+
+	b.ReportAllocs()
+	b.ResetTimer()
+	for range b.N {
+		if _, err := script.Call(context.Background(), "run", nil, CallOptions{}); err != nil {
+			b.Fatalf("call failed: %v", err)
+		}
+	}
+}
+
+func BenchmarkCallControlFlowWorkload(b *testing.B) {
+	script := compileScriptWithEngine(b, benchmarkEngine(), `def run(limit)
+  i = 0
+  total = 0
+
+  while i < limit
+    i = i + 1
+    if i % 2 == 0
+      next
+    end
+    if i > 75
+      break
+    end
+    total = total + i
+  end
+
+  total
+end`)
+
+	args := []Value{NewInt(200)}
+	b.ReportAllocs()
+	b.ResetTimer()
+	for range b.N {
+		if _, err := script.Call(context.Background(), "run", args, CallOptions{}); err != nil {
+			b.Fatalf("call failed: %v", err)
+		}
+	}
+}
+
+func BenchmarkCallTypedCompositeValidation(b *testing.B) {
+	script := compileScriptWithEngine(b, benchmarkEngine(), `def run(rows: array<{ id: string, values: array<int> }>) -> int
+  total = 0
+  rows.each do |row: { id: string, values: array<int> }|
+    row[:values].each do |value: int|
+      total = total + value
+    end
+  end
+  total
+end`)
+
+	rows := make([]Value, 40)
+	for i := range rows {
+		values := make([]Value, 4)
+		for j := range values {
+			values[j] = NewInt(int64(i + j))
+		}
+		rows[i] = NewHash(map[string]Value{
+			"id":     NewString("row"),
+			"values": NewArray(values),
+		})
+	}
+
+	args := []Value{NewArray(rows)}
+	b.ReportAllocs()
+	b.ResetTimer()
+	for range b.N {
+		if _, err := script.Call(context.Background(), "run", args, CallOptions{}); err != nil {
+			b.Fatalf("call failed: %v", err)
+		}
+	}
+}
+
+func BenchmarkExecutionCapabilityWorkflowLoop(b *testing.B) {
+	script := compileScriptWithEngine(b, benchmarkEngine(), `def run(n)
+  total = 0
+  for i in 1..n
+    player_id = ctx[:player_id]
+    row = db.find("Player", player_id)
+    events.publish("scores.seen", { player_id: row[:id], score: row[:score] })
+    total = total + row[:score]
+  end
+  total
+end`)
+
+	args := []Value{NewInt(200)}
+	opts := CallOptions{Capabilities: []CapabilityAdapter{
+		MustNewDBCapability("db", benchmarkDBCapability{}),
+		MustNewEventsCapability("events", benchmarkEventsCapability{}),
+		MustNewContextCapability("ctx", benchmarkContextResolver),
+	}}
+
+	b.ReportAllocs()
+	b.ResetTimer()
+	for range b.N {
+		if _, err := script.Call(context.Background(), "run", args, opts); err != nil {
+			b.Fatalf("call failed: %v", err)
+		}
+	}
+}
+
+func BenchmarkExecutionTimeParseFormatLoop(b *testing.B) {
+	script := compileScriptWithEngine(b, benchmarkEngine(), `def run(raw, n)
+  out = ""
+  for i in 1..n
+    out = Time.parse(raw).format("2006-01-02T15:04:05Z07:00")
+  end
+  out
+end`)
+
+	args := []Value{NewString("2026-02-21T12:45:00Z"), NewInt(80)}
+	b.ReportAllocs()
+	b.ResetTimer()
+	for range b.N {
+		if _, err := script.Call(context.Background(), "run", args, CallOptions{}); err != nil {
+			b.Fatalf("call failed: %v", err)
+		}
+	}
+}
+
+func BenchmarkExecutionStringNormalizeLoop(b *testing.B) {
+	script := compileScriptWithEngine(b, benchmarkEngine(), `def run(text, n)
+  out = ""
+  for i in 1..n
+    out = text.squish.downcase.split(" ").join("-")
+  end
+  out
+end`)
+
+	args := []Value{NewString("  VibeScript   Runtime   Benchmarks  "), NewInt(80)}
+	b.ReportAllocs()
+	b.ResetTimer()
+	for range b.N {
+		if _, err := script.Call(context.Background(), "run", args, CallOptions{}); err != nil {
+			b.Fatalf("call failed: %v", err)
+		}
+	}
+}
+
+func BenchmarkExecutionHashTransformLoop(b *testing.B) {
+	script := compileScriptWithEngine(b, benchmarkEngine(), `def run(payload, n)
+  out = {}
+  for i in 1..n
+    merged = payload.merge({ seen: i })
+    selected = merged.slice(:id, :name, :score, :seen)
+    out = selected.transform_values do |value|
+      value
+    end
+  end
+  out
+end`)
+
+	payload := NewHash(map[string]Value{
+		"id":       NewString("player-7"),
+		"name":     NewString("alex"),
+		"score":    NewInt(42),
+		"active":   NewBool(true),
+		"region":   NewString("us-east-1"),
+		"attempts": NewInt(3),
+	})
+	args := []Value{payload, NewInt(80)}
+
+	b.ReportAllocs()
+	b.ResetTimer()
+	for range b.N {
+		if _, err := script.Call(context.Background(), "run", args, CallOptions{}); err != nil {
+			b.Fatalf("call failed: %v", err)
+		}
+	}
+}
+
+func BenchmarkModuleRequireCacheHit(b *testing.B) {
+	engine := benchmarkEngineWithModules()
+	script := compileScriptWithEngine(b, engine, `def run(value)
+  mod = require("helper")
+  mod.double(value)
+end`)
+
+	args := []Value{NewInt(12)}
+	b.ReportAllocs()
+	b.ResetTimer()
+	for range b.N {
+		if _, err := script.Call(context.Background(), "run", args, CallOptions{}); err != nil {
+			b.Fatalf("call failed: %v", err)
+		}
+	}
+}
+
+func BenchmarkModuleRequireCacheMiss(b *testing.B) {
+	moduleRoot := b.TempDir()
+	modulePath := filepath.Join(moduleRoot, "dynamic.vibe")
+	if err := os.WriteFile(modulePath, []byte("def value\n  7\nend\n"), 0o644); err != nil {
+		b.Fatalf("write module: %v", err)
+	}
+
+	engine := MustNewEngine(Config{
+		StepQuota:        2_000_000,
+		MemoryQuotaBytes: 2 << 20,
+		ModulePaths:      []string{moduleRoot},
+	})
+	script := compileScriptWithEngine(b, engine, `def run
+  mod = require("dynamic")
+  mod.value
+end`)
+
+	b.ReportAllocs()
+	b.ResetTimer()
+	for range b.N {
+		engine.ClearModuleCache()
+		if _, err := script.Call(context.Background(), "run", nil, CallOptions{}); err != nil {
+			b.Fatalf("call failed: %v", err)
+		}
+	}
+}
+
+func BenchmarkModuleRequireCyclePath(b *testing.B) {
+	moduleRoot := b.TempDir()
+	if err := os.WriteFile(filepath.Join(moduleRoot, "a.vibe"), []byte(`require("b")
+def value
+  1
+end
+`), 0o644); err != nil {
+		b.Fatalf("write module a: %v", err)
+	}
+	if err := os.WriteFile(filepath.Join(moduleRoot, "b.vibe"), []byte(`require("a")
+def value
+  2
+end
+`), 0o644); err != nil {
+		b.Fatalf("write module b: %v", err)
+	}
+
+	engine := MustNewEngine(Config{
+		StepQuota:        2_000_000,
+		MemoryQuotaBytes: 2 << 20,
+		ModulePaths:      []string{moduleRoot},
+	})
+	script := compileScriptWithEngine(b, engine, `def run
+  require("a")
+end`)
+
+	b.ReportAllocs()
+	b.ResetTimer()
+	for range b.N {
+		if _, err := script.Call(context.Background(), "run", nil, CallOptions{}); err == nil {
+			b.Fatalf("expected cycle error")
+		}
+	}
+}
+
+func BenchmarkComplexRunAnalytics(b *testing.B) {
+	engine := benchmarkEngine()
+	script := compileScriptFromFileWithEngine(b, engine, filepath.Join("..", "tests", "complex", "analytics.vibe"))
+
+	b.ReportAllocs()
+	b.ResetTimer()
+	for range b.N {
+		if _, err := script.Call(context.Background(), "run", nil, CallOptions{}); err != nil {
+			b.Fatalf("call failed: %v", err)
+		}
+	}
+}
+
+func BenchmarkComplexRunTyped(b *testing.B) {
+	engine := benchmarkEngine()
+	script := compileScriptFromFileWithEngine(b, engine, filepath.Join("..", "tests", "complex", "typed.vibe"))
+
+	b.ReportAllocs()
+	b.ResetTimer()
+	for range b.N {
+		if _, err := script.Call(context.Background(), "run", nil, CallOptions{}); err != nil {
+			b.Fatalf("call failed: %v", err)
+		}
+	}
+}
+
+func BenchmarkComplexRunMassive(b *testing.B) {
+	engine := benchmarkEngine()
+	script := compileScriptFromFileWithEngine(b, engine, filepath.Join("..", "tests", "complex", "massive.vibe"))
+
+	b.ReportAllocs()
+	b.ResetTimer()
+	for range b.N {
+		if _, err := script.Call(context.Background(), "run", nil, CallOptions{}); err != nil {
+			b.Fatalf("call failed: %v", err)
+		}
+	}
+}

From 5e20a8124f7f031eeda92f0eeb7ba0d74e50f816 Mon Sep 17 00:00:00 2001
From: Mauricio Gomes <mauricio@edge14.com>
Date: Sat, 21 Feb 2026 13:53:35 -0500
Subject: [PATCH 07/26] add benchmark baselines and scheduled trend reporting

---
 .github/workflows/benchmarks.yml      |  59 +++++++++--
 benchmarks/baselines/README.md        |  26 +++++
 benchmarks/baselines/v0.20.0-full.txt |  41 ++++++++
 benchmarks/baselines/v0.20.0-pr.txt   |  41 ++++++++
 docs/tooling.md                       |  66 +++++++++++-
 scripts/bench_compare_baseline.sh     | 140 ++++++++++++++++++++++++++
 scripts/bench_smoke_check.sh          |   6 +-
 7 files changed, 370 insertions(+), 9 deletions(-)
 create mode 100644 benchmarks/baselines/README.md
 create mode 100644 benchmarks/baselines/v0.20.0-full.txt
 create mode 100644 benchmarks/baselines/v0.20.0-pr.txt
 create mode 100755 scripts/bench_compare_baseline.sh

diff --git a/.github/workflows/benchmarks.yml b/.github/workflows/benchmarks.yml
index cb7d685..06bb92d 100644
--- a/.github/workflows/benchmarks.yml
+++ b/.github/workflows/benchmarks.yml
@@ -5,6 +5,8 @@ on:
     branches: [master]
   pull_request:
   workflow_dispatch:
+  schedule:
+    - cron: "0 6 * * 1"
 
 jobs:
   benchmark:
@@ -18,26 +20,71 @@ jobs:
         with:
           go-version-file: go.mod
 
+      - name: Configure benchmark profile
+        run: |
+          if [[ "${{ github.event_name }}" == "schedule" ]]; then
+            echo "BENCH_COUNT=1" >> "$GITHUB_ENV"
+            echo "BENCH_TIME=2s" >> "$GITHUB_ENV"
+            echo "BENCH_BASELINE=benchmarks/baselines/v0.20.0-full.txt" >> "$GITHUB_ENV"
+            echo "BENCH_PROFILE=full" >> "$GITHUB_ENV"
+          else
+            echo "BENCH_COUNT=1" >> "$GITHUB_ENV"
+            echo "BENCH_TIME=1s" >> "$GITHUB_ENV"
+            echo "BENCH_BASELINE=benchmarks/baselines/v0.20.0-pr.txt" >> "$GITHUB_ENV"
+            echo "BENCH_PROFILE=pr" >> "$GITHUB_ENV"
+          fi
+
       - name: Benchmark smoke gates
-        run: ./scripts/bench_smoke_check.sh
+        if: github.event_name != 'schedule'
+        run: |
+          set -o pipefail
+          mkdir -p .bench
+          ./scripts/bench_smoke_check.sh | tee .bench/smoke.txt
 
       - name: Run benchmarks
         run: |
           mkdir -p .bench
-          scripts/bench_runtime.sh --count 1 --out .bench/benchmark.txt
+          scripts/bench_runtime.sh \
+            --count "$BENCH_COUNT" \
+            --benchtime "$BENCH_TIME" \
+            --out ".bench/benchmark-$BENCH_PROFILE.txt"
+
+      - name: Compare benchmark trend against baseline
+        run: |
+          ./scripts/bench_compare_baseline.sh \
+            "$BENCH_BASELINE" \
+            ".bench/benchmark-$BENCH_PROFILE.txt" | tee ".bench/trend-$BENCH_PROFILE.txt"
 
       - name: Publish benchmark summary
         run: |
           {
-            echo "## Benchmark Results"
+            if [[ -f .bench/smoke.txt ]]; then
+              echo "## Benchmark Smoke Gates"
+              echo ""
+              echo '```text'
+              cat .bench/smoke.txt
+              echo '```'
+              echo ""
+            fi
+            echo "## Benchmark Trend vs Baseline ($BENCH_PROFILE)"
+            echo ""
+            echo '```text'
+            cat ".bench/trend-$BENCH_PROFILE.txt"
+            echo '```'
+            echo ""
+            echo "## Benchmark Results ($BENCH_PROFILE)"
             echo ""
             echo '```text'
-            cat .bench/benchmark.txt
+            cat ".bench/benchmark-$BENCH_PROFILE.txt"
             echo '```'
           } >> "$GITHUB_STEP_SUMMARY"
 
       - name: Upload benchmark artifact
         uses: actions/upload-artifact@v4
         with:
-          name: benchmark-results
-          path: .bench/benchmark.txt
+          name: benchmark-results-${{ github.event_name }}-${{ github.run_number }}
+          path: |
+            .bench/benchmark-*.txt
+            .bench/trend-*.txt
+            .bench/smoke.txt
+          if-no-files-found: warn
diff --git a/benchmarks/baselines/README.md b/benchmarks/baselines/README.md
new file mode 100644
index 0000000..0c2d73f
--- /dev/null
+++ b/benchmarks/baselines/README.md
@@ -0,0 +1,26 @@
+# Benchmark Baselines
+
+This directory stores versioned benchmark baseline artifacts for release
+comparison.
+
+## Files
+
+- `v0.20.0-pr.txt`: baseline for PR/push benchmark profile.
+  - Generated with: `scripts/bench_runtime.sh --count 1 --benchtime 1s`
+- `v0.20.0-full.txt`: baseline for scheduled full benchmark profile.
+  - Generated with: `scripts/bench_runtime.sh --count 1 --benchtime 2s`
+
+## Usage
+
+Compare a current run against a baseline:
+
+```bash
+scripts/bench_compare_baseline.sh benchmarks/baselines/v0.20.0-pr.txt benchmarks/latest.txt
+```
+
+## Updating Baselines
+
+1. Run benchmark profile with stable settings for the target release.
+2. Write output to a new versioned file in this directory.
+3. Keep prior baseline files for historical comparison.
+4. Update workflow/docs references if the active baseline changes.
diff --git a/benchmarks/baselines/v0.20.0-full.txt b/benchmarks/baselines/v0.20.0-full.txt
new file mode 100644
index 0000000..ed81407
--- /dev/null
+++ b/benchmarks/baselines/v0.20.0-full.txt
@@ -0,0 +1,41 @@
+# VibeScript benchmark run
+# timestamp: 2026-02-21T18:34:37Z
+# git_commit: cbe5e6a
+# go_version: go version go1.26.0 darwin/arm64
+# package: ./vibes
+# bench_pattern: ^Benchmark
+# count: 1
+# benchtime: 2s
+# cpu: 1
+# command: go test ./vibes -run ^$ -bench ^Benchmark -benchmem -count 1 -benchtime 2s -cpu 1
+
+goos: darwin
+goarch: arm64
+pkg: github.com/mgomes/vibescript/vibes
+cpu: Apple M1 Max
+BenchmarkExecutionArithmeticLoop         	    1971	   1041766 ns/op	    9144 B/op	     553 allocs/op
+BenchmarkExecutionArrayPipeline          	     139	  17398372 ns/op	  928432 B/op	   15350 allocs/op
+BenchmarkExecutionMethodDispatchLoop     	     841	   2829313 ns/op	  199664 B/op	    2779 allocs/op
+BenchmarkExecutionCapabilityFindLoop     	     541	   4433641 ns/op	  395376 B/op	    5571 allocs/op
+BenchmarkExecutionJSONParseLoop          	    2347	   1093538 ns/op	  206192 B/op	    3723 allocs/op
+BenchmarkExecutionJSONStringifyLoop      	    3628	    663761 ns/op	  102724 B/op	    2464 allocs/op
+BenchmarkExecutionRegexReplaceAllLoop    	    3571	    732541 ns/op	  157950 B/op	    2750 allocs/op
+BenchmarkExecutionTallyLoop              	     697	   3442165 ns/op	 2252168 B/op	    1097 allocs/op
+BenchmarkCompileControlFlowWorkload      	  180141	     13414 ns/op	    9664 B/op	     180 allocs/op
+BenchmarkCompileTypedWorkload            	  128024	     18808 ns/op	   12616 B/op	     230 allocs/op
+BenchmarkCompileMassiveWorkload          	   12726	    191940 ns/op	  144816 B/op	    2243 allocs/op
+BenchmarkCallShortScript                 	  427030	      5683 ns/op	    3128 B/op	      25 allocs/op
+BenchmarkCallControlFlowWorkload         	    3946	    622062 ns/op	    5128 B/op	      52 allocs/op
+BenchmarkCallTypedCompositeValidation    	     268	   8891817 ns/op	 5259743 B/op	   55330 allocs/op
+BenchmarkExecutionCapabilityWorkflowLoop 	     270	   8306004 ns/op	 1100952 B/op	   12304 allocs/op
+BenchmarkExecutionTimeParseFormatLoop    	    3877	    656296 ns/op	   33144 B/op	     830 allocs/op
+BenchmarkExecutionStringNormalizeLoop    	    2944	    826423 ns/op	   72824 B/op	    2190 allocs/op
+BenchmarkExecutionHashTransformLoop      	     702	   3594562 ns/op	  534168 B/op	    4736 allocs/op
+BenchmarkModuleRequireCacheHit           	   42799	     56288 ns/op	   16032 B/op	     151 allocs/op
+BenchmarkModuleRequireCacheMiss          	   35266	     67874 ns/op	   20080 B/op	     195 allocs/op
+BenchmarkModuleRequireCyclePath          	   42578	     58229 ns/op	   17136 B/op	     200 allocs/op
+BenchmarkComplexRunAnalytics             	    6595	    317337 ns/op	   35584 B/op	     797 allocs/op
+BenchmarkComplexRunTyped                 	   38694	     63427 ns/op	   10032 B/op	      88 allocs/op
+BenchmarkComplexRunMassive               	     598	   3825029 ns/op	  192832 B/op	    1266 allocs/op
+PASS
+ok  	github.com/mgomes/vibescript/vibes	68.686s
diff --git a/benchmarks/baselines/v0.20.0-pr.txt b/benchmarks/baselines/v0.20.0-pr.txt
new file mode 100644
index 0000000..45c1ae6
--- /dev/null
+++ b/benchmarks/baselines/v0.20.0-pr.txt
@@ -0,0 +1,41 @@
+# VibeScript benchmark run
+# timestamp: 2026-02-21T18:31:59Z
+# git_commit: cbe5e6a
+# go_version: go version go1.26.0 darwin/arm64
+# package: ./vibes
+# bench_pattern: ^Benchmark
+# count: 1
+# benchtime: 1s
+# cpu: 1
+# command: go test ./vibes -run ^$ -bench ^Benchmark -benchmem -count 1 -benchtime 1s -cpu 1
+
+goos: darwin
+goarch: arm64
+pkg: github.com/mgomes/vibescript/vibes
+cpu: Apple M1 Max
+BenchmarkExecutionArithmeticLoop         	     990	   1041161 ns/op	    9144 B/op	     553 allocs/op
+BenchmarkExecutionArrayPipeline          	      72	  17167602 ns/op	  928433 B/op	   15350 allocs/op
+BenchmarkExecutionMethodDispatchLoop     	     430	   2768843 ns/op	  199664 B/op	    2779 allocs/op
+BenchmarkExecutionCapabilityFindLoop     	     272	   4467332 ns/op	  395376 B/op	    5571 allocs/op
+BenchmarkExecutionJSONParseLoop          	    1134	   1093307 ns/op	  206192 B/op	    3723 allocs/op
+BenchmarkExecutionJSONStringifyLoop      	    1914	    664214 ns/op	  102724 B/op	    2464 allocs/op
+BenchmarkExecutionRegexReplaceAllLoop    	    1718	    736594 ns/op	  157950 B/op	    2750 allocs/op
+BenchmarkExecutionTallyLoop              	     348	   3444825 ns/op	 2252168 B/op	    1097 allocs/op
+BenchmarkCompileControlFlowWorkload      	   89504	     13904 ns/op	    9664 B/op	     180 allocs/op
+BenchmarkCompileTypedWorkload            	   61092	     19634 ns/op	   12616 B/op	     230 allocs/op
+BenchmarkCompileMassiveWorkload          	    6313	    191390 ns/op	  144816 B/op	    2243 allocs/op
+BenchmarkCallShortScript                 	  206752	      5783 ns/op	    3128 B/op	      25 allocs/op
+BenchmarkCallControlFlowWorkload         	    1987	    617088 ns/op	    5128 B/op	      52 allocs/op
+BenchmarkCallTypedCompositeValidation    	     134	   8886666 ns/op	 5259744 B/op	   55330 allocs/op
+BenchmarkExecutionCapabilityWorkflowLoop 	     134	   8222791 ns/op	 1100952 B/op	   12304 allocs/op
+BenchmarkExecutionTimeParseFormatLoop    	    1954	    662865 ns/op	   33144 B/op	     830 allocs/op
+BenchmarkExecutionStringNormalizeLoop    	    1449	    833651 ns/op	   72824 B/op	    2190 allocs/op
+BenchmarkExecutionHashTransformLoop      	     348	   3596853 ns/op	  534168 B/op	    4736 allocs/op
+BenchmarkModuleRequireCacheHit           	   21824	     56145 ns/op	   16032 B/op	     151 allocs/op
+BenchmarkModuleRequireCacheMiss          	   17610	     68171 ns/op	   20080 B/op	     195 allocs/op
+BenchmarkModuleRequireCyclePath          	   21298	     55919 ns/op	   17136 B/op	     200 allocs/op
+BenchmarkComplexRunAnalytics             	    4160	    310447 ns/op	   35584 B/op	     797 allocs/op
+BenchmarkComplexRunTyped                 	   19564	     62612 ns/op	   10032 B/op	      88 allocs/op
+BenchmarkComplexRunMassive               	     303	   4060923 ns/op	  192832 B/op	    1266 allocs/op
+PASS
+ok  	github.com/mgomes/vibescript/vibes	36.595s
diff --git a/docs/tooling.md b/docs/tooling.md
index 707c81f..c258d15 100644
--- a/docs/tooling.md
+++ b/docs/tooling.md
@@ -77,13 +77,26 @@ scripts/bench_runtime.sh
 
 Common options:
 
-- `--pattern '^BenchmarkExecution(ArrayPipeline|TallyLoop)$'`
+- `--pattern '^Benchmark(Execution|Call|Compile|Module|Complex)'`
 - `--count 5`
 - `--benchtime 2s`
 - `--out benchmarks/array_vs_tally.txt`
 
 The script is also wired into `just bench`.
 
+## Versioned Baselines
+
+Release-tracked baseline artifacts live under `benchmarks/baselines/`:
+
+- `v0.20.0-pr.txt` for PR/push benchmark profile.
+- `v0.20.0-full.txt` for scheduled full benchmark profile.
+
+Compare a new run against a baseline:
+
+```bash
+scripts/bench_compare_baseline.sh benchmarks/baselines/v0.20.0-pr.txt benchmarks/latest.txt
+```
+
 ## Benchmark Smoke Gates
 
 Use the smoke-check script to catch obvious performance regressions before
@@ -95,6 +108,31 @@ scripts/bench_smoke_check.sh
 
 Thresholds live in `benchmarks/smoke_thresholds.txt` and are checked against
 both `ns/op` and `allocs/op`.
+The smoke output includes per-benchmark deltas (`actual - threshold`) so CI
+summaries show headroom or regression at a glance.
+
+## Scheduled Full Runs
+
+The benchmark workflow runs weekly on Mondays at 06:00 UTC (`cron: 0 6 * * 1`)
+using the full profile (`--count 1 --benchtime 2s`).
+
+Each run publishes:
+
+- benchmark results artifact (`.bench/benchmark-full.txt`)
+- baseline trend comparison (`.bench/trend-full.txt`)
+
+## Benchmark Interpretation and Triage
+
+Use this triage loop when a smoke gate regresses:
+
+1. Re-run just the failing benchmarks locally with `--count 5` and a longer
+   `--benchtime` to confirm the signal.
+2. Capture profiles for the failing benchmark(s) with
+   `scripts/bench_profile.sh --pattern '<benchmark-regex>'`.
+3. Compare `cpu.top.txt` and `mem.top.txt` before/after your change.
+4. Fix the hot path first, then rerun smoke checks and full benchmark runs.
+5. Update thresholds only when behavior has intentionally changed and the
+   new baseline is understood.
 
 ## Benchmark Profiling
 
@@ -116,3 +154,29 @@ This is also available as:
 ```bash
 just bench-profile
 ```
+
+## Flamegraphs
+
+Generate flamegraph-style views from captured profiles:
+
+```bash
+go tool pprof -http=:0 benchmarks/profiles/<timestamp>/cpu.out
+go tool pprof -http=:0 benchmarks/profiles/<timestamp>/mem.out
+```
+
+Hotspot checklist:
+
+1. Confirm the top cumulative frames match the regressed benchmark path.
+2. Separate CPU-bound hotspots from allocation hotspots.
+3. Validate a fix with both `bench_runtime.sh` and `bench_smoke_check.sh`.
+4. Keep profile artifacts for before/after comparison in PR notes.
+
+## Performance Playbook
+
+Before merging a perf change:
+
+1. Capture a baseline (`scripts/bench_runtime.sh --count 3`).
+2. Apply one optimization at a time.
+3. Re-run the affected benchmark subset and smoke checks.
+4. Profile if results are unclear or regressions appear.
+5. Run `go test ./...` before finalizing changes.
diff --git a/scripts/bench_compare_baseline.sh b/scripts/bench_compare_baseline.sh
new file mode 100755
index 0000000..86d3891
--- /dev/null
+++ b/scripts/bench_compare_baseline.sh
@@ -0,0 +1,140 @@
+#!/usr/bin/env bash
+set -euo pipefail
+
+usage() {
+  cat >&2 <<'USAGE'
+usage: scripts/bench_compare_baseline.sh <baseline.txt> <current.txt> [--strict]
+
+Compares benchmark outputs and prints per-benchmark trend deltas.
+
+Arguments:
+  <baseline.txt>  Baseline benchmark output file
+  <current.txt>   Current benchmark output file
+  --strict        Fail if benchmarks are missing or new vs baseline
+USAGE
+}
+
+if [[ $# -lt 2 || $# -gt 3 ]]; then
+  usage
+  exit 2
+fi
+
+baseline_file="$1"
+current_file="$2"
+strict=0
+
+if [[ $# -eq 3 ]]; then
+  if [[ "$3" != "--strict" ]]; then
+    usage
+    exit 2
+  fi
+  strict=1
+fi
+
+if [[ ! -f "$baseline_file" ]]; then
+  echo "baseline file not found: $baseline_file" >&2
+  exit 2
+fi
+if [[ ! -f "$current_file" ]]; then
+  echo "current file not found: $current_file" >&2
+  exit 2
+fi
+
+parse_bench() {
+  local file="$1"
+  awk '
+    /^Benchmark/ {
+      bench=$1
+      sub(/-[0-9]+$/, "", bench)
+      ns=""
+      allocs=""
+      for (i = 1; i <= NF; i++) {
+        if ($i == "ns/op") ns=$(i-1)
+        if ($i == "allocs/op") allocs=$(i-1)
+      }
+      if (bench != "" && ns != "" && allocs != "") {
+        print bench, ns, allocs
+      }
+    }
+  ' "$file"
+}
+
+declare -A baseline_ns
+declare -A baseline_allocs
+declare -A current_ns
+declare -A current_allocs
+benchmarks=()
+
+while read -r bench ns allocs; do
+  if [[ -z "${bench:-}" ]]; then
+    continue
+  fi
+  benchmarks+=("$bench")
+  baseline_ns["$bench"]="$ns"
+  baseline_allocs["$bench"]="$allocs"
+done < <(parse_bench "$baseline_file")
+
+if [[ ${#benchmarks[@]} -eq 0 ]]; then
+  echo "no benchmark rows found in baseline: $baseline_file" >&2
+  exit 2
+fi
+
+while read -r bench ns allocs; do
+  if [[ -z "${bench:-}" ]]; then
+    continue
+  fi
+  current_ns["$bench"]="$ns"
+  current_allocs["$bench"]="$allocs"
+done < <(parse_bench "$current_file")
+
+if [[ ${#current_ns[@]} -eq 0 ]]; then
+  echo "no benchmark rows found in current file: $current_file" >&2
+  exit 2
+fi
+
+echo "benchmark baseline compare"
+echo "baseline: $baseline_file"
+echo "current:  $current_file"
+echo
+printf "%-40s %12s %12s %12s %12s %12s %12s\n" "Benchmark" "base_ns" "curr_ns" "delta_ns" "base_alloc" "curr_alloc" "delta_alloc"
+
+missing=0
+for bench in "${benchmarks[@]}"; do
+  base_ns_value="${baseline_ns[$bench]}"
+  base_alloc_value="${baseline_allocs[$bench]}"
+  curr_ns_value="${current_ns[$bench]:-}"
+  curr_alloc_value="${current_allocs[$bench]:-}"
+
+  if [[ -z "$curr_ns_value" || -z "$curr_alloc_value" ]]; then
+    printf "%-40s %12s %12s %12s %12s %12s %12s\n" "$bench" "$base_ns_value" "missing" "n/a" "$base_alloc_value" "missing" "n/a"
+    missing=$((missing + 1))
+    continue
+  fi
+
+  ns_delta_pct="$(awk -v base="$base_ns_value" -v curr="$curr_ns_value" 'BEGIN { if (base == 0) { printf "n/a" } else { printf "%+.2f%%", ((curr - base) / base) * 100 } }')"
+  alloc_delta_pct="$(awk -v base="$base_alloc_value" -v curr="$curr_alloc_value" 'BEGIN { if (base == 0) { printf "n/a" } else { printf "%+.2f%%", ((curr - base) / base) * 100 } }')"
+
+  printf "%-40s %12s %12s %12s %12s %12s %12s\n" "$bench" "$base_ns_value" "$curr_ns_value" "$ns_delta_pct" "$base_alloc_value" "$curr_alloc_value" "$alloc_delta_pct"
+done
+
+extras=()
+for bench in "${!current_ns[@]}"; do
+  if [[ -z "${baseline_ns[$bench]:-}" ]]; then
+    extras+=("$bench")
+  fi
+done
+
+if [[ ${#extras[@]} -gt 0 ]]; then
+  echo
+  echo "new benchmarks not present in baseline:"
+  printf '%s\n' "${extras[@]}" | sort | sed 's/^/- /'
+fi
+
+if (( missing > 0 )); then
+  echo
+  echo "warning: $missing baseline benchmark(s) missing from current results" >&2
+fi
+
+if (( strict == 1 && (missing > 0 || ${#extras[@]} > 0) )); then
+  exit 1
+fi
diff --git a/scripts/bench_smoke_check.sh b/scripts/bench_smoke_check.sh
index 90dca43..0ab2e78 100755
--- a/scripts/bench_smoke_check.sh
+++ b/scripts/bench_smoke_check.sh
@@ -65,7 +65,7 @@ done < <(
 failures=0
 
 echo
-printf "%-40s %12s %12s %12s %12s\n" "Benchmark" "ns/op" "max_ns/op" "allocs/op" "max_allocs"
+printf "%-40s %12s %12s %12s %12s %12s %14s\n" "Benchmark" "ns/op" "max_ns/op" "delta_ns" "allocs/op" "max_allocs" "delta_allocs"
 for bench in "${benchmarks[@]}"; do
   ns="${actual_ns[$bench]:-}"
   allocs="${actual_allocs[$bench]:-}"
@@ -78,7 +78,9 @@ for bench in "${benchmarks[@]}"; do
     continue
   fi
 
-  printf "%-40s %12s %12s %12s %12s\n" "$bench" "$ns" "$max_ns_value" "$allocs" "$max_allocs_value"
+  ns_delta=$((ns - max_ns_value))
+  allocs_delta=$((allocs - max_allocs_value))
+  printf "%-40s %12s %12s %12d %12s %12s %14d\n" "$bench" "$ns" "$max_ns_value" "$ns_delta" "$allocs" "$max_allocs_value" "$allocs_delta"
 
   if (( ns > max_ns_value )); then
     echo "regression: $bench ns/op $ns exceeds $max_ns_value" >&2

From 3ed6486c1af79ed820b1418f4b82ca31d3faf135 Mon Sep 17 00:00:00 2001
From: Mauricio Gomes <mauricio@edge14.com>
Date: Sat, 21 Feb 2026 13:53:39 -0500
Subject: [PATCH 08/26] document v0.20.0 runtime hotspot priorities

---
 benchmarks/hotspots_v0.20.0.md | 33 +++++++++++++++++++++++++++++++++
 1 file changed, 33 insertions(+)
 create mode 100644 benchmarks/hotspots_v0.20.0.md

diff --git a/benchmarks/hotspots_v0.20.0.md b/benchmarks/hotspots_v0.20.0.md
new file mode 100644
index 0000000..3339752
--- /dev/null
+++ b/benchmarks/hotspots_v0.20.0.md
@@ -0,0 +1,33 @@
+# v0.20.0 Hotspot Priorities
+
+Profile run date: 2026-02-21
+
+Command:
+
+```bash
+scripts/bench_profile.sh \
+  --pattern '^(BenchmarkCallShortScript|BenchmarkExecutionCapabilityFindLoop|BenchmarkExecutionArrayPipeline)$' \
+  --benchtime 1s
+```
+
+CPU profile source: `benchmarks/profiles/v0.20.0-hotspots/cpu.top.txt`
+
+## Top 3 CPU Paths (by cumulative time)
+
+1. `(*Execution).estimateMemoryUsage` (~49.77% cumulative)
+2. `(*memoryEstimator).env` (~46.03% cumulative)
+3. `(*memoryEstimator).value` (~35.75% cumulative)
+
+## Supporting allocation signals
+
+From `benchmarks/profiles/v0.20.0-hotspots/mem.top.txt`:
+
+- `newExecutionForCall` is the largest allocator (~35.55% alloc space).
+- `newEnvWithCapacity` is the second largest allocator (~24.87% alloc space).
+- `(*Env).Define` remains a top allocator (~6.96% alloc space).
+
+## Priority order for next optimization passes
+
+1. Cut memory-estimation traversal cost (`estimateMemoryUsage` + estimator walkers).
+2. Reduce env/map churn in call setup (`newExecutionForCall`, `newEnvWithCapacity`, `Env.Define`).
+3. Re-check capability-path call overhead after call-setup optimizations.

From f92a51e81e0af6baf6ba1d4a355c3199f502d0d9 Mon Sep 17 00:00:00 2001
From: Mauricio Gomes <mauricio@edge14.com>
Date: Sat, 21 Feb 2026 13:53:42 -0500
Subject: [PATCH 09/26] add regression tests for high-allocation call patterns

---
 vibes/memory_quota_test.go | 92 ++++++++++++++++++++++++++++++++++++++
 1 file changed, 92 insertions(+)

diff --git a/vibes/memory_quota_test.go b/vibes/memory_quota_test.go
index 9e0373e..2354f52 100644
--- a/vibes/memory_quota_test.go
+++ b/vibes/memory_quota_test.go
@@ -835,3 +835,95 @@ func TestAggregateYieldArgumentsAreChecked(t *testing.T) {
 	}
 	requireErrorContains(t, err, "memory quota exceeded")
 }
+
+type highAllocPatternDB struct{}
+
+func (highAllocPatternDB) Find(ctx context.Context, req DBFindRequest) (Value, error) {
+	return NewHash(map[string]Value{
+		"id":    req.ID,
+		"score": NewInt(1),
+	}), nil
+}
+
+func (highAllocPatternDB) Query(ctx context.Context, req DBQueryRequest) (Value, error) {
+	return NewArray(nil), nil
+}
+
+func (highAllocPatternDB) Update(ctx context.Context, req DBUpdateRequest) (Value, error) {
+	return NewNil(), nil
+}
+
+func (highAllocPatternDB) Sum(ctx context.Context, req DBSumRequest) (Value, error) {
+	return NewInt(0), nil
+}
+
+func (highAllocPatternDB) Each(ctx context.Context, req DBEachRequest) ([]Value, error) {
+	return nil, nil
+}
+
+type highAllocPatternEvents struct{}
+
+func (highAllocPatternEvents) Publish(ctx context.Context, req EventPublishRequest) (Value, error) {
+	return NewHash(map[string]Value{
+		"ok": NewBool(true),
+	}), nil
+}
+
+func highAllocPatternContext(context.Context) (Value, error) {
+	return NewHash(map[string]Value{
+		"player_id": NewString("player-1"),
+	}), nil
+}
+
+func TestMemoryQuotaExceededForHighAllocationTypedCallPattern(t *testing.T) {
+	script := compileScriptWithConfig(t, Config{
+		StepQuota:        500000,
+		MemoryQuotaBytes: 8 * 1024,
+	}, `def run(rows: array<{ id: string, values: array<int> }>) -> int
+  total = 0
+  rows.each do |row: { id: string, values: array<int> }|
+    row[:values].each do |value: int|
+      total = total + value
+    end
+  end
+  total
+end`)
+
+	rows := make([]Value, 120)
+	for i := range rows {
+		values := make([]Value, 8)
+		for j := range values {
+			values[j] = NewInt(int64(i + j))
+		}
+		rows[i] = NewHash(map[string]Value{
+			"id":     NewString("row"),
+			"values": NewArray(values),
+		})
+	}
+
+	requireRunMemoryQuotaError(t, script, []Value{NewArray(rows)}, CallOptions{})
+}
+
+func TestMemoryQuotaExceededForCapabilityWorkflowCallPattern(t *testing.T) {
+	script := compileScriptWithConfig(t, Config{
+		StepQuota:        500000,
+		MemoryQuotaBytes: 2 * 1024,
+	}, `def run(n)
+  total = 0
+  for i in 1..n
+    player_id = ctx[:player_id]
+    row = db.find("Player", player_id)
+    events.publish("scores.seen", { player_id: row[:id], score: row[:score] })
+    total = total + row[:score]
+  end
+  total
+end`)
+
+	requireRunMemoryQuotaError(t, script, []Value{NewInt(120)}, CallOptions{
+		Capabilities: []CapabilityAdapter{
+			MustNewDBCapability("db", highAllocPatternDB{}),
+			MustNewEventsCapability("events", highAllocPatternEvents{}),
+			MustNewContextCapability("ctx", highAllocPatternContext),
+		},
+	})
+}

From 4aaf35b7e4a9c460f1cf004dac9c54c051a3a8a7 Mon Sep 17 00:00:00 2001
From: Mauricio Gomes <mauricio@edge14.com>
Date: Sat, 21 Feb 2026 13:53:49 -0500
Subject: [PATCH 10/26] reduce call setup overhead and boundary allocation
 churn

---
 vibes/env.go                         |  9 +++++++-
 vibes/execution_call_capabilities.go |  9 ++++++++
 vibes/execution_call_env.go          |  2 +-
 vibes/execution_call_execution.go    | 33 ++++++++++++----------------
 vibes/execution_call_expr.go         |  9 --------
 vibes/execution_calls.go             |  2 +-
 vibes/execution_function_args.go     | 17 +++++++++-----
 vibes/execution_script.go            |  3 ++-
 vibes/memory.go                      | 26 ++++++++++++++--------
 vibes/modules_require.go             |  6 +++++
 10 files changed, 70 insertions(+), 46 deletions(-)

diff --git a/vibes/env.go b/vibes/env.go
index 9be2cb8..8791969 100644
--- a/vibes/env.go
+++ b/vibes/env.go
@@ -8,7 +8,14 @@ type Env struct {
 }
 
 func newEnv(parent *Env) *Env {
-	return &Env{parent: parent, values: make(map[string]Value)}
+	return newEnvWithCapacity(parent, 0)
+}
+
+func newEnvWithCapacity(parent *Env, capacity int) *Env {
+	if capacity < 0 {
+		capacity = 0
+	}
+	return &Env{parent: parent, values: make(map[string]Value, capacity)}
 }
 
 func (e *Env) Get(name string) (Value, bool) {
diff --git a/vibes/execution_call_capabilities.go b/vibes/execution_call_capabilities.go
index 9276cb7..524fbb5 100644
--- a/vibes/execution_call_capabilities.go
+++ b/vibes/execution_call_capabilities.go
@@ -9,6 +9,15 @@ func bindCapabilitiesForCall(exec *Execution, root *Env, rebinder *callFunctionR
 	if len(capabilities) == 0 {
 		return nil
 	}
+	if exec.capabilityContracts == nil {
+		exec.capabilityContracts = make(map[*Builtin]CapabilityMethodContract)
+	}
+	if exec.capabilityContractScopes == nil {
+		exec.capabilityContractScopes = make(map[*Builtin]*capabilityContractScope)
+	}
+	if exec.capabilityContractsByName == nil {
+		exec.capabilityContractsByName = make(map[string]CapabilityMethodContract)
+	}
 
 	binding := CapabilityBinding{Context: exec.ctx, Engine: exec.engine}
 	for _, adapter := range capabilities {
diff --git a/vibes/execution_call_env.go b/vibes/execution_call_env.go
index e7d4d40..c9891aa 100644
--- a/vibes/execution_call_env.go
+++ b/vibes/execution_call_env.go
@@ -1,7 +1,7 @@
 package vibes
 
 func prepareCallEnvForFunction(exec *Execution, root *Env, rebinder *callFunctionRebinder, fn *ScriptFunction, args []Value, keywords map[string]Value) (*Env, error) {
-	callEnv := newEnv(root)
+	callEnv := newEnvWithCapacity(root, len(fn.Params))
 	callArgs := rebinder.rebindValues(args)
 	callKeywords := rebinder.rebindKeywords(keywords)
 	if err := exec.bindFunctionArgs(fn, callEnv, callArgs, callKeywords, fn.Pos); err != nil {
diff --git a/vibes/execution_call_execution.go b/vibes/execution_call_execution.go
index f9a8ef1..e0c6fc4 100644
--- a/vibes/execution_call_execution.go
+++ b/vibes/execution_call_execution.go
@@ -4,24 +4,19 @@ import "context"
 
 func newExecutionForCall(script *Script, ctx context.Context, root *Env, opts CallOptions) *Execution {
 	return &Execution{
-		engine:                    script.engine,
-		script:                    script,
-		ctx:                       ctx,
-		quota:                     script.engine.config.StepQuota,
-		memoryQuota:               script.engine.config.MemoryQuotaBytes,
-		recursionCap:              script.engine.config.RecursionLimit,
-		callStack:                 make([]callFrame, 0, 8),
-		root:                      root,
-		modules:                   make(map[string]Value),
-		moduleLoading:             make(map[string]bool),
-		moduleLoadStack:           make([]string, 0, 8),
-		moduleStack:               make([]moduleContext, 0, 8),
-		capabilityContracts:       make(map[*Builtin]CapabilityMethodContract),
-		capabilityContractScopes:  make(map[*Builtin]*capabilityContractScope),
-		capabilityContractsByName: make(map[string]CapabilityMethodContract),
-		receiverStack:             make([]Value, 0, 8),
-		envStack:                  make([]*Env, 0, 8),
-		strictEffects:             script.engine.config.StrictEffects,
-		allowRequire:              opts.AllowRequire,
+		engine:          script.engine,
+		script:          script,
+		ctx:             ctx,
+		quota:           script.engine.config.StepQuota,
+		memoryQuota:     script.engine.config.MemoryQuotaBytes,
+		recursionCap:    script.engine.config.RecursionLimit,
+		callStack:       make([]callFrame, 0, 8),
+		root:            root,
+		moduleLoadStack: make([]string, 0, 8),
+		moduleStack:     make([]moduleContext, 0, 8),
+		receiverStack:   make([]Value, 0, 8),
+		envStack:        make([]*Env, 0, 8),
+		strictEffects:   script.engine.config.StrictEffects,
+		allowRequire:    opts.AllowRequire,
 	}
 }
diff --git a/vibes/execution_call_expr.go b/vibes/execution_call_expr.go
index 87b0f30..7d6bf48 100644
--- a/vibes/execution_call_expr.go
+++ b/vibes/execution_call_expr.go
@@ -6,9 +6,6 @@ func (exec *Execution) evalCallTarget(call *CallExpr, env *Env) (Value, Value, e
 		if err != nil {
 			return NewNil(), NewNil(), err
 		}
-		if err := exec.checkMemoryWith(receiver); err != nil {
-			return NewNil(), NewNil(), err
-		}
 		callee, err := exec.getMember(receiver, member.Property, member.Pos())
 		if err != nil {
 			return NewNil(), NewNil(), err
@@ -30,9 +27,6 @@ func (exec *Execution) evalCallArgs(call *CallExpr, env *Env) ([]Value, error) {
 		if err != nil {
 			return nil, err
 		}
-		if err := exec.checkMemoryWith(val); err != nil {
-			return nil, err
-		}
 		args[i] = val
 	}
 	return args, nil
@@ -48,9 +42,6 @@ func (exec *Execution) evalCallKwArgs(call *CallExpr, env *Env) (map[string]Valu
 		if err != nil {
 			return nil, err
 		}
-		if err := exec.checkMemoryWith(val); err != nil {
-			return nil, err
-		}
 		kwargs[kw.Name] = val
 	}
 	return kwargs, nil
diff --git a/vibes/execution_calls.go b/vibes/execution_calls.go
index 763d131..7670924 100644
--- a/vibes/execution_calls.go
+++ b/vibes/execution_calls.go
@@ -104,7 +104,7 @@ func (exec *Execution) invokeCallable(callee Value, receiver Value, args []Value
 }
 
 func (exec *Execution) callFunction(fn *ScriptFunction, receiver Value, args []Value, kwargs map[string]Value, block Value, pos Position) (Value, error) {
-	callEnv := newEnv(fn.Env)
+	callEnv := newEnvWithCapacity(fn.Env, len(fn.Params)+2)
 	if receiver.Kind() != KindNil {
 		callEnv.Define("self", receiver)
 	}
diff --git a/vibes/execution_function_args.go b/vibes/execution_function_args.go
index 100fc30..7fed366 100644
--- a/vibes/execution_function_args.go
+++ b/vibes/execution_function_args.go
@@ -1,7 +1,10 @@
 package vibes
 
 func (exec *Execution) bindFunctionArgs(fn *ScriptFunction, env *Env, args []Value, kwargs map[string]Value, pos Position) error {
-	usedKw := make(map[string]bool, len(kwargs))
+	var usedKw map[string]bool
+	if len(kwargs) > 0 {
+		usedKw = make(map[string]bool, len(kwargs))
+	}
 	argIdx := 0
 
 	for _, param := range fn.Params {
@@ -11,7 +14,9 @@ func (exec *Execution) bindFunctionArgs(fn *ScriptFunction, env *Env, args []Val
 			argIdx++
 		} else if kw, ok := kwargs[param.Name]; ok {
 			val = kw
-			usedKw[param.Name] = true
+			if usedKw != nil {
+				usedKw[param.Name] = true
+			}
 		} else if param.DefaultVal != nil {
 			defaultVal, err := exec.evalExpressionWithAuto(param.DefaultVal, env, true)
 			if err != nil {
@@ -41,9 +46,11 @@ func (exec *Execution) bindFunctionArgs(fn *ScriptFunction, env *Env, args []Val
 	if argIdx < len(args) {
 		return exec.errorAt(pos, "unexpected positional arguments")
 	}
-	for name := range kwargs {
-		if !usedKw[name] {
-			return exec.errorAt(pos, "unexpected keyword argument %s", name)
+	if usedKw != nil {
+		for name := range kwargs {
+			if !usedKw[name] {
+				return exec.errorAt(pos, "unexpected keyword argument %s", name)
+			}
 		}
 	}
 	return nil
diff --git a/vibes/execution_script.go b/vibes/execution_script.go
index d37a0b6..9f7dbc4 100644
--- a/vibes/execution_script.go
+++ b/vibes/execution_script.go
@@ -15,7 +15,8 @@ func (s *Script) Call(ctx context.Context, name string, args []Value, opts CallO
 		return NewNil(), fmt.Errorf("function %s not found", name)
 	}
 
-	root := newEnv(nil)
+	rootCapacity := len(s.engine.builtins) + len(s.functions) + len(s.classes) + len(opts.Globals) + len(opts.Capabilities)*2
+	root := newEnvWithCapacity(nil, rootCapacity)
 	for n, builtin := range s.engine.builtins {
 		root.Define(n, builtin)
 	}
diff --git a/vibes/memory.go b/vibes/memory.go
index 8a9cc3d..c2ba31d 100644
--- a/vibes/memory.go
+++ b/vibes/memory.go
@@ -76,15 +76,23 @@ func (exec *Execution) estimateMemoryUsage(extras ...Value) int {
 
 	total += len(exec.callStack) * estimatedCallFrameBytes
 	total += len(exec.receiverStack) * estimatedValueBytes
-	total += estimatedMapBaseBytes + len(exec.moduleLoading)*estimatedMapEntryBytes
-	for name := range exec.moduleLoading {
-		total += estimatedStringHeaderBytes + len(name)
-	}
-	total += estimatedMapBaseBytes + len(exec.capabilityContracts)*estimatedMapEntryBytes
-	total += estimatedMapBaseBytes + len(exec.capabilityContractScopes)*estimatedMapEntryBytes
-	total += estimatedMapBaseBytes + len(exec.capabilityContractsByName)*estimatedMapEntryBytes
-	for name := range exec.capabilityContractsByName {
-		total += estimatedStringHeaderBytes + len(name)
+	if exec.moduleLoading != nil {
+		total += estimatedMapBaseBytes + len(exec.moduleLoading)*estimatedMapEntryBytes
+		for name := range exec.moduleLoading {
+			total += estimatedStringHeaderBytes + len(name)
+		}
+	}
+	if exec.capabilityContracts != nil {
+		total += estimatedMapBaseBytes + len(exec.capabilityContracts)*estimatedMapEntryBytes
+	}
+	if exec.capabilityContractScopes != nil {
+		total += estimatedMapBaseBytes + len(exec.capabilityContractScopes)*estimatedMapEntryBytes
+	}
+	if exec.capabilityContractsByName != nil {
+		total += estimatedMapBaseBytes + len(exec.capabilityContractsByName)*estimatedMapEntryBytes
+		for name := range exec.capabilityContractsByName {
+			total += estimatedStringHeaderBytes + len(name)
+		}
 	}
 	total += estimatedSliceBaseBytes + len(exec.moduleLoadStack)*estimatedStringHeaderBytes
 	for _, key := range exec.moduleLoadStack {
diff --git a/vibes/modules_require.go b/vibes/modules_require.go
index 5b0338b..df7af4e 100644
--- a/vibes/modules_require.go
+++ b/vibes/modules_require.go
@@ -39,6 +39,9 @@ func builtinRequire(exec *Execution, receiver Value, args []Value, kwargs map[st
 		return NewNil(), fmt.Errorf("require: circular dependency detected: %s", formatModuleCycle(cycle))
 	}
 
+	if exec.modules == nil {
+		exec.modules = make(map[string]Value)
+	}
 	if cached, ok := exec.modules[entry.key]; ok {
 		if err := bindRequireAlias(exec.root, alias, cached); err != nil {
 			return NewNil(), err
@@ -50,6 +53,9 @@ func builtinRequire(exec *Execution, receiver Value, args []Value, kwargs map[st
 		return NewNil(), fmt.Errorf("require: circular dependency detected: %s", formatModuleCycle(cycle))
 	}
 
+	if exec.moduleLoading == nil {
+		exec.moduleLoading = make(map[string]bool)
+	}
 	if exec.moduleLoading[entry.key] {
 		cycle := append(append([]string(nil), exec.moduleLoadStack...), entry.key)
 		return NewNil(), fmt.Errorf("require: circular dependency detected: %s", formatModuleCycle(cycle))

From cce8292ffb341c6056e71bfe10d2393666733307 Mon Sep 17 00:00:00 2001
From: Mauricio Gomes <mauricio@edge14.com>
Date: Sat, 21 Feb 2026 13:53:55 -0500
Subject: [PATCH 11/26] reduce array transform allocations in block dispatch
 loops

---
 vibes/execution_members_array_grouping.go | 25 ++++++++++----
 vibes/execution_members_array_query.go    | 41 +++++++++++++++++------
 2 files changed, 50 insertions(+), 16 deletions(-)

diff --git a/vibes/execution_members_array_grouping.go b/vibes/execution_members_array_grouping.go
index 57c42a7..3a624f6 100644
--- a/vibes/execution_members_array_grouping.go
+++ b/vibes/execution_members_array_grouping.go
@@ -15,13 +15,16 @@ func arrayMemberGrouping(property string) (Value, error) {
 			arr := receiver.Array()
 			out := make([]Value, len(arr))
 			copy(out, arr)
+			var comparatorArgs [2]Value
 			var sortErr error
 			sort.SliceStable(out, func(i, j int) bool {
 				if sortErr != nil {
 					return false
 				}
 				if block.Block() != nil {
-					cmpValue, err := exec.CallBlock(block, []Value{out[i], out[j]})
+					comparatorArgs[0] = out[i]
+					comparatorArgs[1] = out[j]
+					cmpValue, err := exec.CallBlock(block, comparatorArgs[:])
 					if err != nil {
 						sortErr = err
 						return false
@@ -60,8 +63,10 @@ func arrayMemberGrouping(property string) (Value, error) {
 			}
 			arr := receiver.Array()
 			withKeys := make([]itemWithSortKey, len(arr))
+			var blockArg [1]Value
 			for i, item := range arr {
-				sortKey, err := exec.CallBlock(block, []Value{item})
+				blockArg[0] = item
+				sortKey, err := exec.CallBlock(block, blockArg[:])
 				if err != nil {
 					return NewNil(), err
 				}
@@ -102,8 +107,10 @@ func arrayMemberGrouping(property string) (Value, error) {
 			arr := receiver.Array()
 			left := make([]Value, 0, len(arr))
 			right := make([]Value, 0, len(arr))
+			var blockArg [1]Value
 			for _, item := range arr {
-				match, err := exec.CallBlock(block, []Value{item})
+				blockArg[0] = item
+				match, err := exec.CallBlock(block, blockArg[:])
 				if err != nil {
 					return NewNil(), err
 				}
@@ -125,8 +132,10 @@ func arrayMemberGrouping(property string) (Value, error) {
 			}
 			arr := receiver.Array()
 			groups := make(map[string][]Value, len(arr))
+			var blockArg [1]Value
 			for _, item := range arr {
-				groupValue, err := exec.CallBlock(block, []Value{item})
+				blockArg[0] = item
+				groupValue, err := exec.CallBlock(block, blockArg[:])
 				if err != nil {
 					return NewNil(), err
 				}
@@ -154,8 +163,10 @@ func arrayMemberGrouping(property string) (Value, error) {
 			order := make([]string, 0, len(arr))
 			keyValues := make(map[string]Value, len(arr))
 			groups := make(map[string][]Value, len(arr))
+			var blockArg [1]Value
 			for _, item := range arr {
-				groupValue, err := exec.CallBlock(block, []Value{item})
+				blockArg[0] = item
+				groupValue, err := exec.CallBlock(block, blockArg[:])
 				if err != nil {
 					return NewNil(), err
 				}
@@ -186,10 +197,12 @@ func arrayMemberGrouping(property string) (Value, error) {
 			}
 			arr := receiver.Array()
 			counts := make(map[string]int64, len(arr))
+			var blockArg [1]Value
 			for _, item := range arr {
 				keyValue := item
 				if block.Block() != nil {
-					mapped, err := exec.CallBlock(block, []Value{item})
+					blockArg[0] = item
+					mapped, err := exec.CallBlock(block, blockArg[:])
 					if err != nil {
 						return NewNil(), err
 					}
diff --git a/vibes/execution_members_array_query.go b/vibes/execution_members_array_query.go
index c3b6a00..f7430aa 100644
--- a/vibes/execution_members_array_query.go
+++ b/vibes/execution_members_array_query.go
@@ -16,8 +16,10 @@ func arrayMemberQuery(property string) (Value, error) {
 			if err := ensureBlock(block, "array.each"); err != nil {
 				return NewNil(), err
 			}
+			var blockArg [1]Value
 			for _, item := range receiver.Array() {
-				if _, err := exec.CallBlock(block, []Value{item}); err != nil {
+				blockArg[0] = item
+				if _, err := exec.CallBlock(block, blockArg[:]); err != nil {
 					return NewNil(), err
 				}
 			}
@@ -30,8 +32,10 @@ func arrayMemberQuery(property string) (Value, error) {
 			}
 			arr := receiver.Array()
 			result := make([]Value, len(arr))
+			var blockArg [1]Value
 			for i, item := range arr {
-				val, err := exec.CallBlock(block, []Value{item})
+				blockArg[0] = item
+				val, err := exec.CallBlock(block, blockArg[:])
 				if err != nil {
 					return NewNil(), err
 				}
@@ -46,8 +50,10 @@ func arrayMemberQuery(property string) (Value, error) {
 			}
 			arr := receiver.Array()
 			out := make([]Value, 0, len(arr))
+			var blockArg [1]Value
 			for _, item := range arr {
-				val, err := exec.CallBlock(block, []Value{item})
+				blockArg[0] = item
+				val, err := exec.CallBlock(block, blockArg[:])
 				if err != nil {
 					return NewNil(), err
 				}
@@ -65,8 +71,10 @@ func arrayMemberQuery(property string) (Value, error) {
 			if err := ensureBlock(block, "array.find"); err != nil {
 				return NewNil(), err
 			}
+			var blockArg [1]Value
 			for _, item := range receiver.Array() {
-				match, err := exec.CallBlock(block, []Value{item})
+				blockArg[0] = item
+				match, err := exec.CallBlock(block, blockArg[:])
 				if err != nil {
 					return NewNil(), err
 				}
@@ -84,8 +92,10 @@ func arrayMemberQuery(property string) (Value, error) {
 			if err := ensureBlock(block, "array.find_index"); err != nil {
 				return NewNil(), err
 			}
+			var blockArg [1]Value
 			for idx, item := range receiver.Array() {
-				match, err := exec.CallBlock(block, []Value{item})
+				blockArg[0] = item
+				match, err := exec.CallBlock(block, blockArg[:])
 				if err != nil {
 					return NewNil(), err
 				}
@@ -115,8 +125,11 @@ func arrayMemberQuery(property string) (Value, error) {
 				acc = arr[0]
 				start = 1
 			}
+			var blockArgs [2]Value
 			for i := start; i < len(arr); i++ {
-				next, err := exec.CallBlock(block, []Value{acc, arr[i]})
+				blockArgs[0] = acc
+				blockArgs[1] = arr[i]
+				next, err := exec.CallBlock(block, blockArgs[:])
 				if err != nil {
 					return NewNil(), err
 				}
@@ -212,8 +225,10 @@ func arrayMemberQuery(property string) (Value, error) {
 				return NewInt(int64(len(arr))), nil
 			}
 			total := int64(0)
+			var blockArg [1]Value
 			for _, item := range arr {
-				include, err := exec.CallBlock(block, []Value{item})
+				blockArg[0] = item
+				include, err := exec.CallBlock(block, blockArg[:])
 				if err != nil {
 					return NewNil(), err
 				}
@@ -228,9 +243,11 @@ func arrayMemberQuery(property string) (Value, error) {
 			if len(args) > 0 {
 				return NewNil(), fmt.Errorf("array.any? does not take arguments")
 			}
+			var blockArg [1]Value
 			for _, item := range receiver.Array() {
 				if block.Block() != nil {
-					val, err := exec.CallBlock(block, []Value{item})
+					blockArg[0] = item
+					val, err := exec.CallBlock(block, blockArg[:])
 					if err != nil {
 						return NewNil(), err
 					}
@@ -250,9 +267,11 @@ func arrayMemberQuery(property string) (Value, error) {
 			if len(args) > 0 {
 				return NewNil(), fmt.Errorf("array.all? does not take arguments")
 			}
+			var blockArg [1]Value
 			for _, item := range receiver.Array() {
 				if block.Block() != nil {
-					val, err := exec.CallBlock(block, []Value{item})
+					blockArg[0] = item
+					val, err := exec.CallBlock(block, blockArg[:])
 					if err != nil {
 						return NewNil(), err
 					}
@@ -272,9 +291,11 @@ func arrayMemberQuery(property string) (Value, error) {
 			if len(args) > 0 {
 				return NewNil(), fmt.Errorf("array.none? does not take arguments")
 			}
+			var blockArg [1]Value
 			for _, item := range receiver.Array() {
 				if block.Block() != nil {
-					val, err := exec.CallBlock(block, []Value{item})
+					blockArg[0] = item
+					val, err := exec.CallBlock(block, blockArg[:])
 					if err != nil {
 						return NewNil(), err
 					}

From 8a777a4466a4ae3d773c877f10903a20a99dd9bd Mon Sep 17 00:00:00 2001
From: Mauricio Gomes <mauricio@edge14.com>
Date: Sat, 21 Feb 2026 13:54:00 -0500
Subject: [PATCH 12/26] optimize typed value validation hot paths

---
 vibes/execution_types.go            | 80 +++++++++++++++++++++++++++++
 vibes/execution_types_validation.go | 54 ++++++++++++++++++-
 2 files changed, 133 insertions(+), 1 deletion(-)

diff --git a/vibes/execution_types.go b/vibes/execution_types.go
index bc1b306..74b00bb 100644
--- a/vibes/execution_types.go
+++ b/vibes/execution_types.go
@@ -8,6 +8,15 @@ import (
 )
 
 func checkValueType(val Value, ty *TypeExpr) error {
+	if handled, matches := quickTypeCheck(val, ty); handled {
+		if matches {
+			return nil
+		}
+		return &typeMismatchError{
+			Expected: formatTypeExpr(ty),
+			Actual:   formatValueTypeExpr(val),
+		}
+	}
 	matches, err := valueMatchesType(val, ty)
 	if err != nil {
 		return err
@@ -21,6 +30,77 @@ func checkValueType(val Value, ty *TypeExpr) error {
 	}
 }
 
+func quickTypeCheck(val Value, ty *TypeExpr) (bool, bool) {
+	if ty == nil {
+		return false, false
+	}
+	if ty.Nullable && val.Kind() == KindNil {
+		return true, true
+	}
+
+	switch ty.Kind {
+	case TypeAny:
+		return true, true
+	case TypeInt:
+		return true, val.Kind() == KindInt
+	case TypeFloat:
+		return true, val.Kind() == KindFloat
+	case TypeNumber:
+		return true, val.Kind() == KindInt || val.Kind() == KindFloat
+	case TypeString:
+		return true, val.Kind() == KindString
+	case TypeBool:
+		return true, val.Kind() == KindBool
+	case TypeNil:
+		return true, val.Kind() == KindNil
+	case TypeDuration:
+		return true, val.Kind() == KindDuration
+	case TypeTime:
+		return true, val.Kind() == KindTime
+	case TypeMoney:
+		return true, val.Kind() == KindMoney
+	case TypeFunction:
+		return true, val.Kind() == KindFunction
+	case TypeArray:
+		if len(ty.TypeArgs) == 0 {
+			return true, val.Kind() == KindArray
+		}
+		return false, false
+	case TypeHash:
+		if len(ty.TypeArgs) == 0 {
+			return true, val.Kind() == KindHash || val.Kind() == KindObject
+		}
+		return false, false
+	case TypeShape:
+		if len(ty.Shape) == 0 {
+			if val.Kind() != KindHash && val.Kind() != KindObject {
+				return true, false
+			}
+			return true, len(val.Hash()) == 0
+		}
+		return false, false
+	case TypeUnion:
+		allHandled := true
+		for _, option := range ty.Union {
+			handled, matches := quickTypeCheck(val, option)
+			if handled {
+				if matches {
+					return true, true
+				}
+				continue
+			}
+			allHandled = false
+			break
+		}
+		if allHandled {
+			return true, false
+		}
+		return false, false
+	default:
+		return false, false
+	}
+}
+
 type typeMismatchError struct {
 	Expected string
 	Actual   string
diff --git a/vibes/execution_types_validation.go b/vibes/execution_types_validation.go
index d89b693..ab65c34 100644
--- a/vibes/execution_types_validation.go
+++ b/vibes/execution_types_validation.go
@@ -89,6 +89,21 @@ func (s *typeValidationState) matches(val Value, ty *TypeExpr) (bool, error) {
 		}
 		keyType := ty.TypeArgs[0]
 		valueType := ty.TypeArgs[1]
+		if decided, keyMatches := typeAllowsStringHashKey(keyType); decided {
+			if !keyMatches {
+				return false, nil
+			}
+			for _, value := range val.Hash() {
+				valueMatches, err := s.matches(value, valueType)
+				if err != nil {
+					return false, err
+				}
+				if !valueMatches {
+					return false, nil
+				}
+			}
+			return true, nil
+		}
 		for key, value := range val.Hash() {
 			keyMatches, err := s.matches(NewString(key), keyType)
 			if err != nil {
@@ -113,8 +128,11 @@ func (s *typeValidationState) matches(val Value, ty *TypeExpr) (bool, error) {
 			return false, nil
 		}
 		entries := val.Hash()
+		if len(entries) != len(ty.Shape) {
+			return false, nil
+		}
 		if len(ty.Shape) == 0 {
-			return len(entries) == 0, nil
+			return true, nil
 		}
 		for field, fieldType := range ty.Shape {
 			fieldVal, ok := entries[field]
@@ -175,3 +193,37 @@ func typeValidationVisitFor(val Value, ty *TypeExpr) (typeValidationVisit, bool)
 		ty:        ty,
 	}, true
 }
+
+func typeAllowsStringHashKey(ty *TypeExpr) (bool, bool) {
+	if ty == nil {
+		return false, false
+	}
+
+	switch ty.Kind {
+	case TypeAny, TypeString:
+		return true, true
+	case TypeUnion:
+		allDecided := true
+		for _, option := range ty.Union {
+			decided, matches := typeAllowsStringHashKey(option)
+			if !decided {
+				allDecided = false
+				break
+			}
+			if matches {
+				return true, true
+			}
+		}
+		if allDecided {
+			return true, false
+		}
+		return false, false
+	default:
+		if ty.Nullable {
+			clone := *ty
+			clone.Nullable = false
+			return typeAllowsStringHashKey(&clone)
+		}
+		return true, false
+	}
+}

From 09fafacd911ea979d1af0429b8d6b66b7ca80c89 Mon Sep 17 00:00:00 2001
From: Mauricio Gomes <mauricio@edge14.com>
Date: Sat, 21 Feb 2026 13:54:09 -0500
Subject: [PATCH 13/26] mark v0.20.0 performance roadmap milestones complete

---
 ROADMAP.md | 46 +++++++++++++++++++++++-----------------------
 1 file changed, 23 insertions(+), 23 deletions(-)

diff --git a/ROADMAP.md b/ROADMAP.md
index 97a405a..e8726e5 100644
--- a/ROADMAP.md
+++ b/ROADMAP.md
@@ -376,45 +376,45 @@ Goal: make performance improvements measurable, repeatable, and protected agains
 
 ### Runtime Performance
 
-- [ ] Profile evaluator hotspots and prioritize top 3 CPU paths by cumulative time.
-- [ ] Reduce `Script.Call` overhead for short-running scripts (frame/env setup and teardown).
-- [ ] Optimize method dispatch and member access fast paths.
-- [ ] Reduce allocations in common collection transforms (`map`, `select`, `reduce`, `chunk`, `window`).
-- [ ] Optimize typed argument/return validation for nested composite types.
+- [x] Profile evaluator hotspots and prioritize top 3 CPU paths by cumulative time.
+- [x] Reduce `Script.Call` overhead for short-running scripts (frame/env setup and teardown).
+- [x] Optimize method dispatch and member access fast paths.
+- [x] Reduce allocations in common collection transforms (`map`, `select`, `reduce`, `chunk`, `window`).
+- [x] Optimize typed argument/return validation for nested composite types.
 
 ### Memory and Allocation Discipline
 
-- [ ] Reduce transient allocations in stdlib JSON/Regex/String helper paths.
-- [ ] Reduce temporary map/array churn in module and capability boundary code paths.
-- [ ] Add per-benchmark allocation targets (`allocs/op`) for hot runtime paths.
-- [ ] Add focused regression tests for high-allocation call patterns.
+- [x] Reduce transient allocations in stdlib JSON/Regex/String helper paths.
+- [x] Reduce temporary map/array churn in module and capability boundary code paths.
+- [x] Add per-benchmark allocation targets (`allocs/op`) for hot runtime paths.
+- [x] Add focused regression tests for high-allocation call patterns.
 
 ### Benchmark Coverage
 
-- [ ] Expand benchmark suite for compile, call, control-flow, and typed-runtime workloads.
-- [ ] Add capability-heavy benchmarks (db/events/context adapters + contract validation).
-- [ ] Add module-system benchmarks (`require`, cache hits, cache misses, cycle paths).
-- [ ] Add stdlib benchmarks for JSON/Regex/Time/String/Array/Hash hot operations.
-- [ ] Add representative end-to-end benchmarks using `tests/complex/*.vibe` workloads.
+- [x] Expand benchmark suite for compile, call, control-flow, and typed-runtime workloads.
+- [x] Add capability-heavy benchmarks (db/events/context adapters + contract validation).
+- [x] Add module-system benchmarks (`require`, cache hits, cache misses, cycle paths).
+- [x] Add stdlib benchmarks for JSON/Regex/Time/String/Array/Hash hot operations.
+- [x] Add representative end-to-end benchmarks using `tests/complex/*.vibe` workloads.
 
 ### Benchmark Tooling and CI
 
 - [x] Add a single benchmark runner command/script with stable flags and output format.
-- [ ] Persist benchmark baselines in versioned artifacts for release comparison.
+- [x] Persist benchmark baselines in versioned artifacts for release comparison.
 - [x] Add PR-time benchmark smoke checks with threshold-based alerts.
-- [ ] Add scheduled full benchmark runs with trend reporting.
-- [ ] Document benchmark interpretation and triage workflow.
+- [x] Add scheduled full benchmark runs with trend reporting.
+- [x] Document benchmark interpretation and triage workflow.
 
 ### Profiling and Diagnostics
 
 - [x] Add reproducible CPU profile capture workflow for compile and runtime benchmarks.
 - [x] Add memory profile capture workflow for allocation-heavy scenarios.
-- [ ] Add flamegraph generation instructions and hotspot triage checklist.
-- [ ] Add a short "performance playbook" for validating optimizations before merge.
+- [x] Add flamegraph generation instructions and hotspot triage checklist.
+- [x] Add a short "performance playbook" for validating optimizations before merge.
 
 ### v0.20.0 Definition of Done
 
-- [ ] Benchmarks cover runtime, capability, module, and stdlib hot paths.
-- [ ] CI reports benchmark deltas for guarded smoke benchmarks.
-- [ ] Measurable improvements are achieved before the v1.0.0 release tag.
-- [ ] Performance and benchmarking workflows are documented and maintainable.
+- [x] Benchmarks cover runtime, capability, module, and stdlib hot paths.
+- [x] CI reports benchmark deltas for guarded smoke benchmarks.
+- [x] Measurable improvements are achieved before the v1.0.0 release tag.
+- [x] Performance and benchmarking workflows are documented and maintainable.

From daa483a1c986ec872e060f433b626688c62816f8 Mon Sep 17 00:00:00 2001
From: Mauricio Gomes <mauricio@edge14.com>
Date: Sat, 21 Feb 2026 14:01:51 -0500
Subject: [PATCH 14/26] optimize direct class and instance method call dispatch

---
 vibes/execution_call_expr.go | 36 ++++++++++++++++++++++++++++++++++++
 1 file changed, 36 insertions(+)

diff --git a/vibes/execution_call_expr.go b/vibes/execution_call_expr.go
index 7d6bf48..958d5eb 100644
--- a/vibes/execution_call_expr.go
+++ b/vibes/execution_call_expr.go
@@ -6,6 +6,12 @@ func (exec *Execution) evalCallTarget(call *CallExpr, env *Env) (Value, Value, e
 		if err != nil {
 			return NewNil(), NewNil(), err
 		}
+		if directCallee, handled, err := exec.evalDirectMemberMethodCall(receiver, member.Property, member.Pos()); handled || err != nil {
+			if err != nil {
+				return NewNil(), NewNil(), err
+			}
+			return directCallee, receiver, nil
+		}
 		callee, err := exec.getMember(receiver, member.Property, member.Pos())
 		if err != nil {
 			return NewNil(), NewNil(), err
@@ -20,6 +26,36 @@ func (exec *Execution) evalCallTarget(call *CallExpr, env *Env) (Value, Value, e
 	return callee, NewNil(), nil
 }
 
+func (exec *Execution) evalDirectMemberMethodCall(receiver Value, property string, pos Position) (Value, bool, error) {
+	switch receiver.Kind() {
+	case KindClass:
+		if property == "new" {
+			return NewNil(), false, nil
+		}
+		classDef := receiver.Class()
+		fn, ok := classDef.ClassMethods[property]
+		if !ok {
+			return NewNil(), false, nil
+		}
+		if fn.Private && !exec.isCurrentReceiver(receiver) {
+			return NewNil(), true, exec.errorAt(pos, "private method %s", property)
+		}
+		return NewFunction(fn), true, nil
+	case KindInstance:
+		instance := receiver.Instance()
+		fn, ok := instance.Class.Methods[property]
+		if !ok {
+			return NewNil(), false, nil
+		}
+		if fn.Private && !exec.isCurrentReceiver(receiver) {
+			return NewNil(), true, exec.errorAt(pos, "private method %s", property)
+		}
+		return NewFunction(fn), true, nil
+	default:
+		return NewNil(), false, nil
+	}
+}
+
 func (exec *Execution) evalCallArgs(call *CallExpr, env *Env) ([]Value, error) {
 	args := make([]Value, len(call.Args))
 	for i, arg := range call.Args {

From ed73e5cd30aa878764bae035e4384fc3c6868866 Mon Sep 17 00:00:00 2001
From: Mauricio Gomes <mauricio@edge14.com>
Date: Sat, 21 Feb 2026 14:03:23 -0500
Subject: [PATCH 15/26] remove call root allocation churn in memory quota
 checks

---
 vibes/execution_call_expr.go | 16 +------------
 vibes/memory.go              | 44 +++++++++++++++++++++++++++++++++---
 2 files changed, 42 insertions(+), 18 deletions(-)

diff --git a/vibes/execution_call_expr.go b/vibes/execution_call_expr.go
index 958d5eb..1fc9d53 100644
--- a/vibes/execution_call_expr.go
+++ b/vibes/execution_call_expr.go
@@ -97,21 +97,7 @@ func (exec *Execution) checkCallMemoryRoots(receiver Value, args []Value, kwargs
 		}
 		return exec.checkMemoryWith(args...)
 	}
-	combined := make([]Value, 0, len(args)+len(kwargs)+2)
-	if receiver.Kind() != KindNil {
-		combined = append(combined, receiver)
-	}
-	combined = append(combined, args...)
-	for _, kwVal := range kwargs {
-		combined = append(combined, kwVal)
-	}
-	if !block.IsNil() {
-		combined = append(combined, block)
-	}
-	if len(combined) == 0 {
-		return nil
-	}
-	return exec.checkMemoryWith(combined...)
+	return exec.checkMemoryWithCallRoots(receiver, args, kwargs, block)
 }
 
 func (exec *Execution) evalCallExpr(call *CallExpr, env *Env) (Value, error) {
diff --git a/vibes/memory.go b/vibes/memory.go
index c2ba31d..9d6b3d2 100644
--- a/vibes/memory.go
+++ b/vibes/memory.go
@@ -62,8 +62,49 @@ func (exec *Execution) checkMemoryWith(extras ...Value) error {
 	return nil
 }
 
+func (exec *Execution) checkMemoryWithCallRoots(receiver Value, args []Value, kwargs map[string]Value, block Value) error {
+	if exec.memoryQuota <= 0 {
+		return nil
+	}
+
+	used := exec.estimateMemoryUsageForCallRoots(receiver, args, kwargs, block)
+	if used > exec.memoryQuota {
+		return fmt.Errorf("%w (%d bytes)", errMemoryQuotaExceeded, exec.memoryQuota)
+	}
+	return nil
+}
+
 func (exec *Execution) estimateMemoryUsage(extras ...Value) int {
 	est := newMemoryEstimator()
+	total := exec.estimateMemoryUsageBase(est)
+	for _, extra := range extras {
+		total += est.value(extra)
+	}
+
+	return total
+}
+
+func (exec *Execution) estimateMemoryUsageForCallRoots(receiver Value, args []Value, kwargs map[string]Value, block Value) int {
+	est := newMemoryEstimator()
+	total := exec.estimateMemoryUsageBase(est)
+
+	if receiver.Kind() != KindNil {
+		total += est.value(receiver)
+	}
+	for _, arg := range args {
+		total += est.value(arg)
+	}
+	for _, kwarg := range kwargs {
+		total += est.value(kwarg)
+	}
+	if !block.IsNil() {
+		total += est.value(block)
+	}
+
+	return total
+}
+
+func (exec *Execution) estimateMemoryUsageBase(est *memoryEstimator) int {
 	total := 0
 
 	total += est.env(exec.root)
@@ -102,9 +143,6 @@ func (exec *Execution) estimateMemoryUsage(extras ...Value) int {
 	for _, ctx := range exec.moduleStack {
 		total += estimatedStringHeaderBytes*3 + len(ctx.key) + len(ctx.path) + len(ctx.root)
 	}
-	for _, extra := range extras {
-		total += est.value(extra)
-	}
 
 	return total
 }

From 9a785238b4466723bce352eb116e1c111165eef5 Mon Sep 17 00:00:00 2001
From: Mauricio Gomes <mauricio@edge14.com>
Date: Sat, 21 Feb 2026 14:05:23 -0500
Subject: [PATCH 16/26] deduplicate capability contract rescans per builtin
 call

---
 vibes/execution_calls.go | 21 ++++++++++++---------
 1 file changed, 12 insertions(+), 9 deletions(-)

diff --git a/vibes/execution_calls.go b/vibes/execution_calls.go
index 7670924..b7a1848 100644
--- a/vibes/execution_calls.go
+++ b/vibes/execution_calls.go
@@ -40,17 +40,18 @@ func (exec *Execution) invokeCallable(callee Value, receiver Value, args []Value
 		var preCallKnownBuiltins map[*Builtin]struct{}
 		if scope != nil && len(scope.contracts) > 0 {
 			preCallKnownBuiltins = make(map[*Builtin]struct{})
+			preCallScanner := newCapabilityContractScanner()
 			if receiver.Kind() != KindNil {
-				collectCapabilityBuiltins(receiver, preCallKnownBuiltins)
+				preCallScanner.collectBuiltins(receiver, preCallKnownBuiltins)
 			}
 			for _, root := range scope.roots {
-				collectCapabilityBuiltins(root, preCallKnownBuiltins)
+				preCallScanner.collectBuiltins(root, preCallKnownBuiltins)
 			}
 			for _, arg := range args {
-				collectCapabilityBuiltins(arg, preCallKnownBuiltins)
+				preCallScanner.collectBuiltins(arg, preCallKnownBuiltins)
 			}
 			for _, kwarg := range kwargs {
-				collectCapabilityBuiltins(kwarg, preCallKnownBuiltins)
+				preCallScanner.collectBuiltins(kwarg, preCallKnownBuiltins)
 			}
 		}
 		contract, hasContract := exec.capabilityContracts[builtin]
@@ -76,25 +77,27 @@ func (exec *Execution) invokeCallable(callee Value, receiver Value, args []Value
 			}
 		}
 		if scope != nil && len(scope.contracts) > 0 {
+			postCallScanner := newCapabilityContractScanner()
+			postCallScanner.excluded = preCallKnownBuiltins
 			// Capability methods can lazily publish additional builtins at runtime
 			// (e.g. through factory return values or receiver mutation). Re-scan
 			// these values so future calls still enforce declared contracts.
-			bindCapabilityContractsExcluding(result, scope, exec.capabilityContracts, exec.capabilityContractScopes, preCallKnownBuiltins)
+			postCallScanner.bindContracts(result, scope, exec.capabilityContracts, exec.capabilityContractScopes)
 			if receiver.Kind() != KindNil {
-				bindCapabilityContractsExcluding(receiver, scope, exec.capabilityContracts, exec.capabilityContractScopes, preCallKnownBuiltins)
+				postCallScanner.bindContracts(receiver, scope, exec.capabilityContracts, exec.capabilityContractScopes)
 			}
 			// Methods can mutate sibling scope roots via captured references; refresh
 			// all adapter roots so newly exposed builtins also get bound.
 			for _, root := range scope.roots {
-				bindCapabilityContractsExcluding(root, scope, exec.capabilityContracts, exec.capabilityContractScopes, preCallKnownBuiltins)
+				postCallScanner.bindContracts(root, scope, exec.capabilityContracts, exec.capabilityContractScopes)
 			}
 			// Methods can also publish builtins by mutating positional or keyword
 			// argument objects supplied by script code.
 			for _, arg := range args {
-				bindCapabilityContractsExcluding(arg, scope, exec.capabilityContracts, exec.capabilityContractScopes, preCallKnownBuiltins)
+				postCallScanner.bindContracts(arg, scope, exec.capabilityContracts, exec.capabilityContractScopes)
 			}
 			for _, kwarg := range kwargs {
-				bindCapabilityContractsExcluding(kwarg, scope, exec.capabilityContracts, exec.capabilityContractScopes, preCallKnownBuiltins)
+				postCallScanner.bindContracts(kwarg, scope, exec.capabilityContracts, exec.capabilityContractScopes)
 			}
 		}
 		return result, nil

From d43d685f0cd8555474c8e0e81036a178d4f8a80b Mon Sep 17 00:00:00 2001
From: Mauricio Gomes <mauricio@edge14.com>
Date: Sat, 21 Feb 2026 14:08:10 -0500
Subject: [PATCH 17/26] cache capability scope builtins for contract rebinding

---
 vibes/capability_contracts_scanner.go |  3 +++
 vibes/execution.go                    |  5 +++--
 vibes/execution_call_capabilities.go  |  3 ++-
 vibes/execution_calls.go              | 28 ++++++++++++++++++++++-----
 4 files changed, 31 insertions(+), 8 deletions(-)

diff --git a/vibes/capability_contracts_scanner.go b/vibes/capability_contracts_scanner.go
index 2b6bc14..1e42f03 100644
--- a/vibes/capability_contracts_scanner.go
+++ b/vibes/capability_contracts_scanner.go
@@ -51,6 +51,9 @@ func (s *capabilityContractScanner) bindContracts(
 		if _, skip := s.excluded[builtin]; skip {
 			return
 		}
+		if scope != nil && scope.knownBuiltins != nil {
+			scope.knownBuiltins[builtin] = struct{}{}
+		}
 		ownerScope, seen := scopes[builtin]
 		if !seen {
 			scopes[builtin] = scope
diff --git a/vibes/execution.go b/vibes/execution.go
index af40f4c..db35a8d 100644
--- a/vibes/execution.go
+++ b/vibes/execution.go
@@ -59,8 +59,9 @@ type Execution struct {
 }
 
 type capabilityContractScope struct {
-	contracts map[string]CapabilityMethodContract
-	roots     []Value
+	contracts     map[string]CapabilityMethodContract
+	roots         []Value
+	knownBuiltins map[*Builtin]struct{}
 }
 
 type moduleContext struct {
diff --git a/vibes/execution_call_capabilities.go b/vibes/execution_call_capabilities.go
index 524fbb5..79c854b 100644
--- a/vibes/execution_call_capabilities.go
+++ b/vibes/execution_call_capabilities.go
@@ -25,7 +25,8 @@ func bindCapabilitiesForCall(exec *Execution, root *Env, rebinder *callFunctionR
 			continue
 		}
 		scope := &capabilityContractScope{
-			contracts: map[string]CapabilityMethodContract{},
+			contracts:     map[string]CapabilityMethodContract{},
+			knownBuiltins: make(map[*Builtin]struct{}),
 		}
 		if provider, ok := adapter.(CapabilityContractProvider); ok {
 			for methodName, contract := range provider.CapabilityContracts() {
diff --git a/vibes/execution_calls.go b/vibes/execution_calls.go
index b7a1848..7282b96 100644
--- a/vibes/execution_calls.go
+++ b/vibes/execution_calls.go
@@ -4,6 +4,15 @@ import (
 	"errors"
 )
 
+func valueCanContainBuiltins(val Value) bool {
+	switch val.Kind() {
+	case KindBuiltin, KindArray, KindHash, KindObject, KindClass, KindInstance:
+		return true
+	default:
+		return false
+	}
+}
+
 func (exec *Execution) autoInvokeIfNeeded(expr Expression, val Value, receiver Value) (Value, error) {
 	switch val.Kind() {
 	case KindFunction:
@@ -39,18 +48,21 @@ func (exec *Execution) invokeCallable(callee Value, receiver Value, args []Value
 		scope := exec.capabilityContractScopes[builtin]
 		var preCallKnownBuiltins map[*Builtin]struct{}
 		if scope != nil && len(scope.contracts) > 0 {
-			preCallKnownBuiltins = make(map[*Builtin]struct{})
+			preCallKnownBuiltins = scope.knownBuiltins
 			preCallScanner := newCapabilityContractScanner()
-			if receiver.Kind() != KindNil {
+			if valueCanContainBuiltins(receiver) {
 				preCallScanner.collectBuiltins(receiver, preCallKnownBuiltins)
 			}
-			for _, root := range scope.roots {
-				preCallScanner.collectBuiltins(root, preCallKnownBuiltins)
-			}
 			for _, arg := range args {
+				if !valueCanContainBuiltins(arg) {
+					continue
+				}
 				preCallScanner.collectBuiltins(arg, preCallKnownBuiltins)
 			}
 			for _, kwarg := range kwargs {
+				if !valueCanContainBuiltins(kwarg) {
+					continue
+				}
 				preCallScanner.collectBuiltins(kwarg, preCallKnownBuiltins)
 			}
 		}
@@ -94,9 +106,15 @@ func (exec *Execution) invokeCallable(callee Value, receiver Value, args []Value
 			// Methods can also publish builtins by mutating positional or keyword
 			// argument objects supplied by script code.
 			for _, arg := range args {
+				if !valueCanContainBuiltins(arg) {
+					continue
+				}
 				postCallScanner.bindContracts(arg, scope, exec.capabilityContracts, exec.capabilityContractScopes)
 			}
 			for _, kwarg := range kwargs {
+				if !valueCanContainBuiltins(kwarg) {
+					continue
+				}
 				postCallScanner.bindContracts(kwarg, scope, exec.capabilityContracts, exec.capabilityContractScopes)
 			}
 		}

From fde3f7766051c7dc2c93dec3a4b275313151bef0 Mon Sep 17 00:00:00 2001
From: Mauricio Gomes <mauricio@edge14.com>
Date: Sat, 21 Feb 2026 20:23:03 -0500
Subject: [PATCH 18/26] keep capability exclusion scan call-local

---
 vibes/execution_calls.go | 13 ++++++++++++-
 1 file changed, 12 insertions(+), 1 deletion(-)

diff --git a/vibes/execution_calls.go b/vibes/execution_calls.go
index 7282b96..d74f802 100644
--- a/vibes/execution_calls.go
+++ b/vibes/execution_calls.go
@@ -13,6 +13,17 @@ func valueCanContainBuiltins(val Value) bool {
 	}
 }
 
+func cloneBuiltinSet(src map[*Builtin]struct{}) map[*Builtin]struct{} {
+	if len(src) == 0 {
+		return make(map[*Builtin]struct{})
+	}
+	out := make(map[*Builtin]struct{}, len(src))
+	for builtin := range src {
+		out[builtin] = struct{}{}
+	}
+	return out
+}
+
 func (exec *Execution) autoInvokeIfNeeded(expr Expression, val Value, receiver Value) (Value, error) {
 	switch val.Kind() {
 	case KindFunction:
@@ -48,7 +59,7 @@ func (exec *Execution) invokeCallable(callee Value, receiver Value, args []Value
 		scope := exec.capabilityContractScopes[builtin]
 		var preCallKnownBuiltins map[*Builtin]struct{}
 		if scope != nil && len(scope.contracts) > 0 {
-			preCallKnownBuiltins = scope.knownBuiltins
+			preCallKnownBuiltins = cloneBuiltinSet(scope.knownBuiltins)
 			preCallScanner := newCapabilityContractScanner()
 			if valueCanContainBuiltins(receiver) {
 				preCallScanner.collectBuiltins(receiver, preCallKnownBuiltins)

From eca759963262aefa45485be2b28ffcae151a454d Mon Sep 17 00:00:00 2001
From: Mauricio Gomes <mauricio@edge14.com>
Date: Sat, 21 Feb 2026 20:23:37 -0500
Subject: [PATCH 19/26] remove unused capability builtin collector

---
 vibes/capability_contracts.go | 8 --------
 1 file changed, 8 deletions(-)

diff --git a/vibes/capability_contracts.go b/vibes/capability_contracts.go
index e40d57f..a936c03 100644
--- a/vibes/capability_contracts.go
+++ b/vibes/capability_contracts.go
@@ -56,11 +56,3 @@ func bindCapabilityContractsExcluding(
 	scanner.excluded = excluded
 	scanner.bindContracts(val, scope, target, scopes)
 }
-
-func collectCapabilityBuiltins(val Value, out map[*Builtin]struct{}) {
-	if out == nil {
-		return
-	}
-	scanner := newCapabilityContractScanner()
-	scanner.collectBuiltins(val, out)
-}

From d7651bf47987bf5e5de6aba7a21ed877ebf505c0 Mon Sep 17 00:00:00 2001
From: Mauricio Gomes <mauricio@edge14.com>
Date: Sat, 21 Feb 2026 20:44:51 -0500
Subject: [PATCH 20/26] enforce receiver memory checks before member lookup
 errors

---
 vibes/execution_call_expr.go |  3 +++
 vibes/memory_quota_test.go   | 32 ++++++++++++++++++++++++++++++++
 2 files changed, 35 insertions(+)

diff --git a/vibes/execution_call_expr.go b/vibes/execution_call_expr.go
index 1fc9d53..599dfe3 100644
--- a/vibes/execution_call_expr.go
+++ b/vibes/execution_call_expr.go
@@ -6,6 +6,9 @@ func (exec *Execution) evalCallTarget(call *CallExpr, env *Env) (Value, Value, e
 		if err != nil {
 			return NewNil(), NewNil(), err
 		}
+		if err := exec.checkMemoryWith(receiver); err != nil {
+			return NewNil(), NewNil(), err
+		}
 		if directCallee, handled, err := exec.evalDirectMemberMethodCall(receiver, member.Property, member.Pos()); handled || err != nil {
 			if err != nil {
 				return NewNil(), NewNil(), err
diff --git a/vibes/memory_quota_test.go b/vibes/memory_quota_test.go
index 2354f52..fa40726 100644
--- a/vibes/memory_quota_test.go
+++ b/vibes/memory_quota_test.go
@@ -421,6 +421,38 @@ func TestTransientMethodCallReceiverAllocationsAreChecked(t *testing.T) {
 	requireErrorContains(t, err, "memory quota exceeded")
 }
 
+func TestTransientMethodCallReceiverLookupErrorsAreChecked(t *testing.T) {
+	pos := Position{Line: 1, Column: 1}
+	elements := make([]Expression, 1200)
+	for i := range elements {
+		elements[i] = &StringLiteral{Value: "abcdefghij", position: pos}
+	}
+
+	stmt := &ExprStmt{
+		Expr: &CallExpr{
+			Callee: &MemberExpr{
+				Object:   &ArrayLiteral{Elements: elements, position: pos},
+				Property: "missing",
+				position: pos,
+			},
+			position: pos,
+		},
+		position: pos,
+	}
+
+	exec := &Execution{
+		quota:         10000,
+		memoryQuota:   1,
+		moduleLoading: make(map[string]bool),
+	}
+	env := newEnv(nil)
+	_, _, err := exec.evalStatements([]Statement{stmt}, env)
+	if err == nil {
+		t.Fatalf("expected memory quota error for transient method-call lookup receiver")
+	}
+	requireErrorContains(t, err, "memory quota exceeded")
+}
+
 func TestIfConditionTransientAllocationsAreChecked(t *testing.T) {
 	pos := Position{Line: 1, Column: 1}
 	elements := make([]Expression, 1200)

From 6cb766f31e0abcfbd76dddd6b6bfa8ffb995fad2 Mon Sep 17 00:00:00 2001
From: Mauricio Gomes <mauricio@edge14.com>
Date: Sat, 21 Feb 2026 20:45:36 -0500
Subject: [PATCH 21/26] restore fail-fast memory checks across call argument
 evaluation

---
 vibes/execution_call_expr.go | 15 +++++++++++-
 vibes/memory_quota_test.go   | 44 ++++++++++++++++++++++++++++++++++++
 2 files changed, 58 insertions(+), 1 deletion(-)

diff --git a/vibes/execution_call_expr.go b/vibes/execution_call_expr.go
index 599dfe3..ddcbae4 100644
--- a/vibes/execution_call_expr.go
+++ b/vibes/execution_call_expr.go
@@ -66,6 +66,9 @@ func (exec *Execution) evalCallArgs(call *CallExpr, env *Env) ([]Value, error) {
 		if err != nil {
 			return nil, err
 		}
+		if err := exec.checkMemoryWith(val); err != nil {
+			return nil, err
+		}
 		args[i] = val
 	}
 	return args, nil
@@ -81,6 +84,9 @@ func (exec *Execution) evalCallKwArgs(call *CallExpr, env *Env) (map[string]Valu
 		if err != nil {
 			return nil, err
 		}
+		if err := exec.checkMemoryWith(val); err != nil {
+			return nil, err
+		}
 		kwargs[kw.Name] = val
 	}
 	return kwargs, nil
@@ -90,7 +96,14 @@ func (exec *Execution) evalCallBlock(call *CallExpr, env *Env) (Value, error) {
 	if call.Block == nil {
 		return NewNil(), nil
 	}
-	return exec.evalBlockLiteral(call.Block, env)
+	block, err := exec.evalBlockLiteral(call.Block, env)
+	if err != nil {
+		return NewNil(), err
+	}
+	if err := exec.checkMemoryWith(block); err != nil {
+		return NewNil(), err
+	}
+	return block, nil
 }
 
 func (exec *Execution) checkCallMemoryRoots(receiver Value, args []Value, kwargs map[string]Value, block Value) error {
diff --git a/vibes/memory_quota_test.go b/vibes/memory_quota_test.go
index fa40726..a0bc714 100644
--- a/vibes/memory_quota_test.go
+++ b/vibes/memory_quota_test.go
@@ -568,6 +568,50 @@ func TestAggregateBuiltinArgumentsAreChecked(t *testing.T) {
 	requireErrorContains(t, err, "memory quota exceeded")
 }
 
+func TestCallArgumentMemoryChecksFailFastBeforeLaterSideEffects(t *testing.T) {
+	pos := Position{Line: 1, Column: 1}
+	payload := strings.Repeat("a", 5000)
+	tickCount := 0
+
+	stmt := &ExprStmt{
+		Expr: &CallExpr{
+			Callee: &Identifier{Name: "noop", position: pos},
+			Args: []Expression{
+				&StringLiteral{Value: payload, position: pos},
+				&CallExpr{
+					Callee:   &Identifier{Name: "tick", position: pos},
+					position: pos,
+				},
+			},
+			position: pos,
+		},
+		position: pos,
+	}
+
+	exec := &Execution{
+		quota:         10000,
+		memoryQuota:   2048,
+		moduleLoading: make(map[string]bool),
+	}
+	env := newEnv(nil)
+	env.Define("noop", NewBuiltin("noop", func(exec *Execution, receiver Value, args []Value, kwargs map[string]Value, block Value) (Value, error) {
+		return NewNil(), nil
+	}))
+	env.Define("tick", NewBuiltin("tick", func(exec *Execution, receiver Value, args []Value, kwargs map[string]Value, block Value) (Value, error) {
+		tickCount++
+		return NewInt(1), nil
+	}))
+
+	_, _, err := exec.evalStatements([]Statement{stmt}, env)
+	if err == nil {
+		t.Fatalf("expected memory quota error for oversized first argument")
+	}
+	requireErrorContains(t, err, "memory quota exceeded")
+	if tickCount != 0 {
+		t.Fatalf("expected later argument side effects to be skipped, got %d", tickCount)
+	}
+}
+
 func TestTransientAssignmentValueIsCheckedBeforeAssign(t *testing.T) {
 	pos := Position{Line: 1, Column: 1}
 	elements := make([]Expression, 1200)

From d17311607c72f1b1f1ecc71eefd9a6dd9da33270 Mon Sep 17 00:00:00 2001
From: Mauricio Gomes <mauricio@edge14.com>
Date: Sat, 21 Feb 2026 21:16:16 -0500
Subject: [PATCH 22/26] preserve unknown hash key-type errors in fast-path
 checks

---
 vibes/execution_types_validation.go      |  4 ++
 vibes/execution_types_validation_test.go | 53 ++++++++++++++++++++++++
 2 files changed, 57 insertions(+)
 create mode 100644 vibes/execution_types_validation_test.go

diff --git a/vibes/execution_types_validation.go b/vibes/execution_types_validation.go
index ab65c34..3975003 100644
--- a/vibes/execution_types_validation.go
+++ b/vibes/execution_types_validation.go
@@ -200,6 +200,10 @@ func typeAllowsStringHashKey(ty *TypeExpr) (bool, bool) {
 	}
 
 	switch ty.Kind {
+	case TypeUnknown:
+		// Unknown key types must flow through full matching so callers preserve
+		// unknown-type errors instead of silently treating them as mismatches.
+		return false, false
 	case TypeAny, TypeString:
 		return true, true
 	case TypeUnion:
diff --git a/vibes/execution_types_validation_test.go b/vibes/execution_types_validation_test.go
new file mode 100644
index 0000000..4e5b39a
--- /dev/null
+++ b/vibes/execution_types_validation_test.go
@@ -0,0 +1,53 @@
+package vibes
+
+import (
+	"strings"
+	"testing"
+)
+
+func TestTypeAllowsStringHashKeyDefersUnknownUnions(t *testing.T) {
+	keyType := &TypeExpr{
+		Kind: TypeUnion,
+		Union: []*TypeExpr{
+			{Name: "typo", Kind: TypeUnknown},
+			{Name: "string", Kind: TypeString},
+		},
+	}
+
+	decided, matches := typeAllowsStringHashKey(keyType)
+	if decided {
+		t.Fatalf("expected unknown key union to defer to full matcher")
+	}
+	if matches {
+		t.Fatalf("unexpected string-key fast-path match for unknown key union")
+	}
+}
+
+func TestValueMatchesTypeHashUnknownKeyUnionReturnsError(t *testing.T) {
+	hashType := &TypeExpr{
+		Kind: TypeHash,
+		TypeArgs: []*TypeExpr{
+			{
+				Kind: TypeUnion,
+				Union: []*TypeExpr{
+					{Name: "typo", Kind: TypeUnknown},
+					{Name: "string", Kind: TypeString},
+				},
+			},
+			{Name: "int", Kind: TypeInt},
+		},
+	}
+
+	matches, err := valueMatchesType(NewHash(map[string]Value{
+		"score": NewInt(1),
+	}), hashType)
+	if err == nil {
+		t.Fatalf("expected unknown type error")
+	}
+	if matches {
+		t.Fatalf("unknown key union should not report a match")
+	}
+	if !strings.Contains(err.Error(), "unknown type typo") {
+		t.Fatalf("expected unknown type error, got %v", err)
+	}
+}

From 4be0524c14966b60b5b9e72812474ae902b27c9c Mon Sep 17 00:00:00 2001
From: Mauricio Gomes <mauricio@edge14.com>
Date: Sat, 21 Feb 2026 21:28:47 -0500
Subject: [PATCH 23/26] make benchmark smoke threshold checks float-safe

---
 scripts/bench_smoke_check.sh | 18 +++++++++++++-----
 1 file changed, 13 insertions(+), 5 deletions(-)

diff --git a/scripts/bench_smoke_check.sh b/scripts/bench_smoke_check.sh
index 0ab2e78..89c1e1c 100755
--- a/scripts/bench_smoke_check.sh
+++ b/scripts/bench_smoke_check.sh
@@ -64,6 +64,14 @@ done < <(
 
 failures=0
 
+float_delta() {
+  awk -v actual="$1" -v limit="$2" 'BEGIN { printf "%.4f", actual - limit }'
+}
+
+float_exceeds() {
+  awk -v actual="$1" -v limit="$2" 'BEGIN { exit (actual > limit) ? 0 : 1 }'
+}
+
 echo
 printf "%-40s %12s %12s %12s %12s %12s %14s\n" "Benchmark" "ns/op" "max_ns/op" "delta_ns" "allocs/op" "max_allocs" "delta_allocs"
 for bench in "${benchmarks[@]}"; do
@@ -78,15 +86,15 @@ for bench in "${benchmarks[@]}"; do
     continue
   fi
 
-  ns_delta=$((ns - max_ns_value))
-  allocs_delta=$((allocs - max_allocs_value))
-  printf "%-40s %12s %12s %12d %12s %12s %14d\n" "$bench" "$ns" "$max_ns_value" "$ns_delta" "$allocs" "$max_allocs_value" "$allocs_delta"
+  ns_delta="$(float_delta "$ns" "$max_ns_value")"
+  allocs_delta="$(float_delta "$allocs" "$max_allocs_value")"
+  printf "%-40s %12s %12s %12s %12s %12s %14s\n" "$bench" "$ns" "$max_ns_value" "$ns_delta" "$allocs" "$max_allocs_value" "$allocs_delta"
 
-  if (( ns > max_ns_value )); then
+  if float_exceeds "$ns" "$max_ns_value"; then
     echo "regression: $bench ns/op $ns exceeds $max_ns_value" >&2
     failures=$((failures + 1))
   fi
-  if (( allocs > max_allocs_value )); then
+  if float_exceeds "$allocs" "$max_allocs_value"; then
     echo "regression: $bench allocs/op $allocs exceeds $max_allocs_value" >&2
     failures=$((failures + 1))
   fi

From 15a01036b73c377e831dd321d2484cfbdb95a10e Mon Sep 17 00:00:00 2001
From: Mauricio Gomes <mauricio@edge14.com>
Date: Sun, 22 Feb 2026 00:15:11 -0500
Subject: [PATCH 24/26] account capability builtin caches in memory quota
 estimates

---
 vibes/memory.go            | 11 ++++++++
 vibes/memory_quota_test.go | 57 ++++++++++++++++++++++++++++++++++++++
 2 files changed, 68 insertions(+)

diff --git a/vibes/memory.go b/vibes/memory.go
index 9d6b3d2..4839d88 100644
--- a/vibes/memory.go
+++ b/vibes/memory.go
@@ -128,6 +128,17 @@ func (exec *Execution) estimateMemoryUsageBase(est *memoryEstimator) int {
 	}
 	if exec.capabilityContractScopes != nil {
 		total += estimatedMapBaseBytes + len(exec.capabilityContractScopes)*estimatedMapEntryBytes
+		seenScopes := make(map[*capabilityContractScope]struct{}, len(exec.capabilityContractScopes))
+		for _, scope := range exec.capabilityContractScopes {
+			if scope == nil {
+				continue
+			}
+			if _, seen := seenScopes[scope]; seen {
+				continue
+			}
+			seenScopes[scope] = struct{}{}
+			total += estimatedMapBaseBytes + len(scope.knownBuiltins)*estimatedMapEntryBytes
+		}
 	}
 	if exec.capabilityContractsByName != nil {
 		total += estimatedMapBaseBytes + len(exec.capabilityContractsByName)*estimatedMapEntryBytes
diff --git a/vibes/memory_quota_test.go b/vibes/memory_quota_test.go
index a0bc714..d2e8529 100644
--- a/vibes/memory_quota_test.go
+++ b/vibes/memory_quota_test.go
@@ -61,6 +61,63 @@ func TestMemoryQuotaCountsClassVars(t *testing.T) {
 	requireRunMemoryQuotaError(t, script, nil, CallOptions{})
 }
 
+func TestMemoryQuotaCountsCapabilityScopeKnownBuiltins(t *testing.T) {
+	scopeWithKnown := &capabilityContractScope{
+		knownBuiltins: make(map[*Builtin]struct{}),
+	}
+	for range 400 {
+		scopeWithKnown.knownBuiltins[NewBuiltin("cap.dynamic", builtinAssert).Builtin()] = struct{}{}
+	}
+	scopeWithoutKnown := &capabilityContractScope{
+		knownBuiltins: make(map[*Builtin]struct{}),
+	}
+
+	withKnown := &Execution{
+		quota:         10000,
+		memoryQuota:   0,
+		moduleLoading: make(map[string]bool),
+		capabilityContractScopes: map[*Builtin]*capabilityContractScope{
+			NewBuiltin("cap.call", builtinAssert).Builtin(): scopeWithKnown,
+		},
+	}
+	withoutKnown := &Execution{
+		quota:         10000,
+		memoryQuota:   0,
+		moduleLoading: make(map[string]bool),
+		capabilityContractScopes: map[*Builtin]*capabilityContractScope{
+			NewBuiltin("cap.call", builtinAssert).Builtin(): scopeWithoutKnown,
+		},
+	}
+
+	withKnownBytes := withKnown.estimateMemoryUsage()
+	withoutKnownBytes := withoutKnown.estimateMemoryUsage()
+	if withKnownBytes <= withoutKnownBytes {
+		t.Fatalf("expected known builtin cache to increase memory estimate (%d <= %d)", withKnownBytes, withoutKnownBytes)
+	}
+
+	quota := withoutKnownBytes + (withKnownBytes-withoutKnownBytes)/2
+	if quota <= withoutKnownBytes {
+		quota = withoutKnownBytes + 1
+	}
+	if quota >= withKnownBytes {
+		quota = withKnownBytes - 1
+	}
+
+	enforced := &Execution{
+		quota:         10000,
+		memoryQuota:   quota,
+		moduleLoading: make(map[string]bool),
+		capabilityContractScopes: map[*Builtin]*capabilityContractScope{
+			NewBuiltin("cap.call", builtinAssert).Builtin(): scopeWithKnown,
+		},
+	}
+	err := enforced.checkMemory()
+	if err == nil {
+		t.Fatalf("expected memory quota error when known builtin cache grows")
+	}
+	requireErrorContains(t, err, "memory quota exceeded")
+}
+
 func TestMemoryQuotaAllowsExecution(t *testing.T) {
 	script := compileScriptWithConfig(t, Config{
 		StepQuota:        20000,

From b5943cf4ce57bc7593de0fa74b767e417b231bc3 Mon Sep 17 00:00:00 2001
From: Mauricio Gomes <mauricio@edge14.com>
Date: Sun, 22 Feb 2026 00:16:47 -0500
Subject: [PATCH 25/26] relax capability workflow smoke threshold for CI
 variance

---
 benchmarks/smoke_thresholds.txt | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/benchmarks/smoke_thresholds.txt b/benchmarks/smoke_thresholds.txt
index f3df605..e1ceb47 100644
--- a/benchmarks/smoke_thresholds.txt
+++ b/benchmarks/smoke_thresholds.txt
@@ -9,7 +9,7 @@ BenchmarkExecutionArithmeticLoop 5000000 1000
 BenchmarkExecutionArrayPipeline 30000000 20000
 BenchmarkExecutionMethodDispatchLoop 8000000 6000
 BenchmarkExecutionCapabilityFindLoop 12000000 9000
-BenchmarkExecutionCapabilityWorkflowLoop 14000000 15000
+BenchmarkExecutionCapabilityWorkflowLoop 15000000 15000
 BenchmarkExecutionJSONParseLoop 3000000 5000
 BenchmarkExecutionJSONStringifyLoop 3000000 4000
 BenchmarkExecutionRegexReplaceAllLoop 4000000 4000

From 28b1b0d83648fc10bb461174b10fcde5e9c8d5ef Mon Sep 17 00:00:00 2001
From: Mauricio Gomes <mauricio@edge14.com>
Date: Sun, 22 Feb 2026 18:22:52 -0500
Subject: [PATCH 26/26] scan capability roots before call-boundary exclusion

---
 vibes/capability_contracts_test.go | 53 ++++++++++++++++++++++++++++++
 vibes/execution_calls.go           |  6 ++++
 2 files changed, 59 insertions(+)

diff --git a/vibes/capability_contracts_test.go b/vibes/capability_contracts_test.go
index b667da1..da8f9d3 100644
--- a/vibes/capability_contracts_test.go
+++ b/vibes/capability_contracts_test.go
@@ -349,6 +349,32 @@ func (c importingContractCapability) CapabilityContracts() map[string]Capability
 	}
 }
 
+type siblingRootForeignLeakProbeCapability struct{}
+
+func (siblingRootForeignLeakProbeCapability) Bind(binding CapabilityBinding) (map[string]Value, error) {
+	return map[string]Value{
+		"publisher": NewObject(map[string]Value{
+			"touch": NewBuiltin("publisher.touch", func(exec *Execution, receiver Value, args []Value, kwargs map[string]Value, block Value) (Value, error) {
+				return NewString("ok"), nil
+			}),
+		}),
+		"peer": NewObject(map[string]Value{}),
+	}, nil
+}
+
+func (siblingRootForeignLeakProbeCapability) CapabilityContracts() map[string]CapabilityMethodContract {
+	return map[string]CapabilityMethodContract{
+		"foo.call": {
+			ValidateArgs: func(args []Value, kwargs map[string]Value, block Value) error {
+				if len(args) != 1 || args[0].Kind() != KindInt {
+					return fmt.Errorf("provider foo.call expects int")
+				}
+				return nil
+			},
+		},
+	}
+}
+
 type argMutationContractCapability struct {
 	invokeCount *int
 }
@@ -723,6 +749,33 @@ end`)
 	}
 }
 
+func TestCapabilityContractsDoNotHijackForeignBuiltinsFromSiblingRoots(t *testing.T) {
+	script := compileScriptDefault(t, `def run()
+  peer.call = foreign.call
+  publisher.touch()
+  peer.call("ok")
+end`)
+	var err error
+
+	shared := &foreignBuiltinRef{}
+	invocations := 0
+	result, err := script.Call(context.Background(), "run", nil, CallOptions{
+		Capabilities: []CapabilityAdapter{
+			legacyForeignFooCapability{shared: shared, invokeCount: &invocations},
+			siblingRootForeignLeakProbeCapability{},
+		},
+	})
+	if err != nil {
+		t.Fatalf("unexpected error: %v", err)
+	}
+	if invocations != 1 {
+		t.Fatalf("expected foreign call once, got %d", invocations)
+	}
+	if result.Kind() != KindString || result.String() != "legacy-foreign" {
+		t.Fatalf("unexpected result: %#v", result)
+	}
+}
+
 func TestCapabilityContractsBindAfterArgumentMutation(t *testing.T) {
 	script := compileScriptDefault(t, `def run()
   target = {}
diff --git a/vibes/execution_calls.go b/vibes/execution_calls.go
index d74f802..853c4a9 100644
--- a/vibes/execution_calls.go
+++ b/vibes/execution_calls.go
@@ -76,6 +76,12 @@ func (exec *Execution) invokeCallable(callee Value, receiver Value, args []Value
 				}
 				preCallScanner.collectBuiltins(kwarg, preCallKnownBuiltins)
 			}
+			for _, root := range scope.roots {
+				if !valueCanContainBuiltins(root) {
+					continue
+				}
+				preCallScanner.collectBuiltins(root, preCallKnownBuiltins)
+			}
 		}
 		contract, hasContract := exec.capabilityContracts[builtin]
 		if hasContract && contract.ValidateArgs != nil {