diff --git a/ci3/ci-metrics/app.py b/ci3/ci-metrics/app.py index c62875e7d19a..e2925d9ae3b0 100644 --- a/ci3/ci-metrics/app.py +++ b/ci3/ci-metrics/app.py @@ -6,6 +6,7 @@ import os import re import redis +import time import threading from pathlib import Path @@ -37,14 +38,30 @@ def verify_password(username, password): def _init(): - """Initialize SQLite and start background threads.""" + """Initialize SQLite, warm caches, and start background threads.""" try: db.get_db() metrics.start_test_listener(r) + metrics.start_phase_listener(r) metrics.start_ci_run_sync(r) + github_data.start_merge_queue_poller() + github_data.start_pr_dirs_worker() print("[ci-metrics] Background threads started") except Exception as e: print(f"[ci-metrics] Warning: startup failed: {e}") + # Warm billing caches so first request isn't slow + try: + from billing.gcp import _ensure_cached as _warm_gcp + _warm_gcp() + print("[ci-metrics] GCP billing cache warmed") + except Exception as e: + print(f"[ci-metrics] GCP billing warmup failed: {e}") + try: + from billing.aws import _ensure_cached as _warm_aws + _warm_aws() + print("[ci-metrics] AWS costs cache warmed") + except Exception as e: + print(f"[ci-metrics] AWS costs warmup failed: {e}") threading.Thread(target=_init, daemon=True, name='metrics-init').start() @@ -101,6 +118,74 @@ def _json(data): return Response(json.dumps(data), mimetype='application/json') +_TEN_DAYS = 10 * 24 * 3600 + + +def _cache_ttl(date_to: str) -> int: + """Return 10-day TTL for historical ranges (date_to < today), else 5 min.""" + try: + if datetime.strptime(date_to, '%Y-%m-%d').date() < datetime.now().date(): + return _TEN_DAYS + except ValueError: + pass + return 300 + + +# ---- Author mapping: git display name → GitHub username ---- + +_author_map = {} +_author_map_ts = 0 + + +def _get_author_map() -> dict: + """Build git display name → GitHub username mapping from ci_runs + pr_authors.""" + global _author_map, _author_map_ts + now = time.time() + if now - 
_author_map_ts < 3600 and _author_map: + return _author_map + rows = db.query(''' + SELECT cr.author as git_name, pa.author as github_user, COUNT(*) as c + FROM ci_runs cr + JOIN pr_authors pa ON cr.pr_number = pa.pr_number + WHERE cr.author IS NOT NULL AND cr.author != '' + AND pa.author IS NOT NULL AND pa.author != '' + GROUP BY cr.author, pa.author + ''') + name_to_gh = {} + for row in rows: + gn = row['git_name'] + gh = row['github_user'] + if gn not in name_to_gh: + name_to_gh[gn] = {} + name_to_gh[gn][gh] = name_to_gh[gn].get(gh, 0) + row['c'] + result = {} + for gn, gh_counts in name_to_gh.items(): + best = max(gh_counts, key=gh_counts.get) + result[gn] = best + result[best] = best # identity mapping for usernames used as commit_author + _author_map = result + _author_map_ts = now + return result + + +def _normalize_authors(authors_str: str) -> str: + """Normalize comma-separated git names to deduplicated GitHub usernames.""" + if not authors_str: + return '' + amap = _get_author_map() + seen = set() + result = [] + for name in authors_str.split(','): + name = name.strip() + if not name: + continue + gh = amap.get(name, name) + if gh not in seen: + seen.add(gh) + result.append(gh) + return ','.join(result) + + # ---- Namespace billing ---- @app.route('/namespace-billing') @@ -166,7 +251,7 @@ def api_ci_runs(): ts_from = int(datetime.strptime(date_from, '%Y-%m-%d').timestamp() * 1000) if date_from else None ts_to = int((datetime.strptime(date_to, '%Y-%m-%d') + timedelta(days=1)).timestamp() * 1000) if date_to else None - runs = metrics.get_ci_runs(r, ts_from, ts_to) + runs = metrics.get_ci_runs(ts_from, ts_to) if status_filter: runs = [run for run in runs if run.get('status') == status_filter] @@ -185,7 +270,7 @@ def api_ci_runs(): @auth.login_required def api_ci_stats(): ts_from = int((datetime.now() - timedelta(days=7)).timestamp() * 1000) - runs = metrics.get_ci_runs(r, ts_from) + runs = metrics.get_ci_runs(ts_from) total = len(runs) passed = sum(1 for run 
in runs if run.get('status') == 'PASSED') @@ -233,6 +318,7 @@ def api_costs_overview(): buckets[key]['aws_total'] += entry.get('aws_total', 0) buckets[key]['gcp_total'] += entry.get('gcp_total', 0) result['by_date'] = sorted(buckets.values(), key=lambda x: x['date']) + result['period'] = {'from': date_from, 'to': date_to} return _json(result) @@ -287,7 +373,7 @@ def api_costs_attribution(): ts_from = int(datetime.strptime(date_from, '%Y-%m-%d').timestamp() * 1000) ts_to = int((datetime.strptime(date_to, '%Y-%m-%d') + timedelta(days=1)).timestamp() * 1000) - runs = metrics.get_ci_runs(r, ts_from, ts_to) + runs = metrics.get_ci_runs(ts_from, ts_to) runs_with_cost = [run for run in runs if run.get('cost_usd') is not None] # Enrich merge queue runs with PR author from GitHub @@ -311,6 +397,9 @@ def api_costs_attribution(): prn = info['pr_number'] if prn and int(prn) in pr_authors: author = pr_authors[int(prn)]['author'] + # Attribute nightly / release runs to a special 'release' actor + if info['type'] in ('nightly', 'releases'): + author = 'release' inst_type = run.get('instance_type', 'unknown') vcpus = run.get('instance_vcpus') @@ -383,14 +472,17 @@ def api_costs_attribution(): instances.sort(key=lambda x: -(x['cost_usd'] or 0)) all_types = sorted(by_type.keys()) + # Pre-compute runs-per-date to avoid O(dates × instances) + runs_per_date = {} + for inst in instances: + runs_per_date[inst['date']] = runs_per_date.get(inst['date'], 0) + 1 by_date_list = [] for date in sorted(by_date_type): - entry = {'date': date, 'total': 0, 'runs': 0} + entry = {'date': date, 'total': 0, 'runs': runs_per_date.get(date, 0)} for rt in all_types: entry[rt] = round(by_date_type[date].get(rt, 0), 2) entry['total'] += by_date_type[date].get(rt, 0) entry['total'] = round(entry['total'], 2) - entry['runs'] = sum(1 for inst in instances if inst['date'] == date) by_date_list.append(entry) by_date_list = _aggregate_dates(by_date_list, granularity, @@ -405,6 +497,7 @@ def 
api_costs_attribution(): 'by_date': by_date_list, 'run_types': all_types, 'instances': instances[:500], + 'period': {'from': date_from, 'to': date_to}, 'totals': {'aws': round(total_aws, 2), 'gcp': round(gcp_total, 2), 'gcp_unattributed': round(gcp_total, 2), 'combined': round(total_aws + gcp_total, 2)}, @@ -421,7 +514,7 @@ def api_costs_runners(): ts_from = int(datetime.strptime(date_from, '%Y-%m-%d').timestamp() * 1000) ts_to = int((datetime.strptime(date_to, '%Y-%m-%d') + timedelta(days=1)).timestamp() * 1000) - runs = metrics.get_ci_runs(r, ts_from, ts_to) + runs = metrics.get_ci_runs(ts_from, ts_to) runs_with_cost = [run for run in runs if run.get('cost_usd') is not None] if dashboard: runs_with_cost = [run for run in runs_with_cost if run.get('dashboard') == dashboard] @@ -475,6 +568,7 @@ def api_costs_runners(): 'by_date': by_date, 'by_instance_type': by_instance, 'by_dashboard': by_dashboard, + 'period': {'from': date_from, 'to': date_to}, 'summary': { 'total_cost': round(total_cost, 2), 'spot_pct': round(100.0 * spot_cost / max(total_cost, 0.01), 1), @@ -493,13 +587,18 @@ def api_ci_performance(): date_to = request.args.get('to', datetime.now().strftime('%Y-%m-%d')) dashboard = request.args.get('dashboard', '') granularity = request.args.get('granularity', 'daily') + _ck = f'perf:{date_from}:{date_to}:{dashboard}:{granularity}' + if cached := db.cache_get(_ck): + return _json(cached) + _t0 = time.perf_counter() ts_from = int(datetime.strptime(date_from, '%Y-%m-%d').timestamp() * 1000) ts_to = int((datetime.strptime(date_to, '%Y-%m-%d') + timedelta(days=1)).timestamp() * 1000) - runs = metrics.get_ci_runs(r, ts_from, ts_to) + runs = metrics.get_ci_runs(ts_from, ts_to) runs = [run for run in runs if run.get('status') in ('PASSED', 'FAILED')] if dashboard: runs = [run for run in runs if run.get('dashboard') == dashboard] + _t1 = time.perf_counter() by_date_map = {} for run in runs: @@ -519,6 +618,7 @@ def api_ci_performance(): by_date = [] for date in 
sorted(by_date_map): d = by_date_map[date] + durs = sorted(d['durations']) by_date.append({ 'date': date, 'total': d['total'], @@ -526,75 +626,107 @@ def api_ci_performance(): 'failed': d['failed'], 'pass_rate': round(100.0 * d['passed'] / max(d['total'], 1), 1), 'failure_rate': round(100.0 * d['failed'] / max(d['total'], 1), 1), - 'avg_duration_mins': round(sum(d['durations']) / len(d['durations']), 1) if d['durations'] else None, + 'avg_duration_mins': round(sum(durs) / len(durs), 1) if durs else None, + 'p50_duration_mins': round(durs[len(durs) // 2], 1) if durs else None, + 'p95_duration_mins': round(durs[int(len(durs) * 0.95)], 1) if durs else None, + 'max_duration_mins': round(max(durs), 1) if durs else None, }) + _t2 = time.perf_counter() + # Merge test outcome counts from test_daily_stats before aggregation + ds_conditions = ['date >= ?', 'date <= ?'] + ds_params = [date_from, date_to] + if dashboard: + ds_conditions.append('dashboard = ?') + ds_params.append(dashboard) + ds_where = 'WHERE ' + ' AND '.join(ds_conditions) + + daily_test_counts = db.query(f''' + SELECT date, SUM(passed) as passed, SUM(failed) as failed, SUM(flaked) as flaked + FROM test_daily_stats {ds_where} + GROUP BY date + ''', ds_params) + daily_test_map = {r['date']: r for r in daily_test_counts} + for d in by_date: + tc = daily_test_map.get(d['date'], {}) + d['flake_count'] = tc.get('flaked', 0) or 0 + d['test_failure_count'] = tc.get('failed', 0) or 0 + d['test_success_count'] = tc.get('passed', 0) or 0 + by_date = _aggregate_dates(by_date, granularity, - sum_fields=['total', 'passed', 'failed'], - avg_fields=['avg_duration_mins']) + sum_fields=['total', 'passed', 'failed', + 'flake_count', 'test_failure_count', 'test_success_count'], + avg_fields=['avg_duration_mins', 'p50_duration_mins', + 'p95_duration_mins', 'max_duration_mins']) for d in by_date: d['pass_rate'] = round(100.0 * d['passed'] / max(d['total'], 1), 1) d['failure_rate'] = round(100.0 * d['failed'] / max(d['total'], 1), 
1) - # Daily flake/failure counts from test_events - if dashboard: - flake_daily = db.query(''' - SELECT substr(timestamp, 1, 10) as date, COUNT(*) as count - FROM test_events WHERE status = 'flaked' AND dashboard = ? - AND timestamp >= ? AND timestamp < ? - GROUP BY substr(timestamp, 1, 10) - ''', (dashboard, date_from, date_to + 'T23:59:59')) - fail_test_daily = db.query(''' - SELECT substr(timestamp, 1, 10) as date, COUNT(*) as count - FROM test_events WHERE status = 'failed' AND dashboard = ? - AND timestamp >= ? AND timestamp < ? - GROUP BY substr(timestamp, 1, 10) - ''', (dashboard, date_from, date_to + 'T23:59:59')) - else: - flake_daily = db.query(''' - SELECT substr(timestamp, 1, 10) as date, COUNT(*) as count - FROM test_events WHERE status = 'flaked' - AND timestamp >= ? AND timestamp < ? - GROUP BY substr(timestamp, 1, 10) - ''', (date_from, date_to + 'T23:59:59')) - fail_test_daily = db.query(''' - SELECT substr(timestamp, 1, 10) as date, COUNT(*) as count - FROM test_events WHERE status = 'failed' - AND timestamp >= ? AND timestamp < ? - GROUP BY substr(timestamp, 1, 10) - ''', (date_from, date_to + 'T23:59:59')) - flake_daily_map = {r['date']: r['count'] for r in flake_daily} - fail_test_daily_map = {r['date']: r['count'] for r in fail_test_daily} - for d in by_date: - d['flake_count'] = flake_daily_map.get(d['date'], 0) - d['test_failure_count'] = fail_test_daily_map.get(d['date'], 0) + # Duration by dashboard (pipeline) — from pre-aggregated ci_run_daily_stats + dbd_rows = db.query(''' + SELECT date, dashboard, run_count, passed, failed, + sum_duration, min_duration, max_duration, p50_duration, p95_duration + FROM ci_run_daily_stats + WHERE date >= ? AND date <= ? 
+ ORDER BY date + ''', (date_from, date_to)) + + dbd_map = {} # {dashboard: [{date, avg_duration_mins, ...}]} + for r in dbd_rows: + dbd_map.setdefault(r['dashboard'], []).append({ + 'date': r['date'], + 'avg_duration_mins': round(r['sum_duration'] / max(r['run_count'], 1), 1), + 'total_duration_mins': round(r['sum_duration'], 1), + 'p50_duration_mins': r['p50_duration'], + 'p95_duration_mins': r['p95_duration'], + 'count': r['run_count'], + }) + + duration_by_dashboard = {} + for db_name, entries in dbd_map.items(): + duration_by_dashboard[db_name] = _aggregate_dates( + entries, granularity, + sum_fields=['count', 'total_duration_mins'], + avg_fields=['avg_duration_mins', 'p50_duration_mins', 'p95_duration_mins']) - # Top flakes/failures + _t3 = time.perf_counter() + # Top flakes/failures (with affected authors — filter out empty/NULL) + _author_concat = "GROUP_CONCAT(DISTINCT CASE WHEN commit_author IS NOT NULL AND commit_author != '' THEN commit_author END)" if dashboard: - top_flakes = db.query(''' - SELECT test_cmd, COUNT(*) as count, ref_name + top_flakes = db.query(f''' + SELECT test_cmd, COUNT(*) as count, dashboard, + {_author_concat} as authors FROM test_events WHERE status='flaked' AND dashboard = ? AND timestamp >= ? AND timestamp <= ? - GROUP BY test_cmd ORDER BY count DESC LIMIT 15 + GROUP BY test_cmd ORDER BY count DESC LIMIT 20 ''', (dashboard, date_from, date_to + 'T23:59:59')) - top_failures = db.query(''' - SELECT test_cmd, COUNT(*) as count + top_failures = db.query(f''' + SELECT test_cmd, COUNT(*) as count, dashboard, + {_author_concat} as authors FROM test_events WHERE status='failed' AND dashboard = ? AND timestamp >= ? AND timestamp <= ? 
- GROUP BY test_cmd ORDER BY count DESC LIMIT 15 + GROUP BY test_cmd ORDER BY count DESC LIMIT 20 ''', (dashboard, date_from, date_to + 'T23:59:59')) else: - top_flakes = db.query(''' - SELECT test_cmd, COUNT(*) as count, ref_name + top_flakes = db.query(f''' + SELECT test_cmd, COUNT(*) as count, dashboard, + {_author_concat} as authors FROM test_events WHERE status='flaked' AND timestamp >= ? AND timestamp <= ? - GROUP BY test_cmd ORDER BY count DESC LIMIT 15 + GROUP BY test_cmd ORDER BY count DESC LIMIT 20 ''', (date_from, date_to + 'T23:59:59')) - top_failures = db.query(''' - SELECT test_cmd, COUNT(*) as count + top_failures = db.query(f''' + SELECT test_cmd, COUNT(*) as count, dashboard, + {_author_concat} as authors FROM test_events WHERE status='failed' AND timestamp >= ? AND timestamp <= ? - GROUP BY test_cmd ORDER BY count DESC LIMIT 15 + GROUP BY test_cmd ORDER BY count DESC LIMIT 20 ''', (date_from, date_to + 'T23:59:59')) + # Normalize git display names → GitHub usernames + for row in top_flakes: + row['authors'] = _normalize_authors(row.get('authors', '')) + for row in top_failures: + row['authors'] = _normalize_authors(row.get('authors', '')) + # Summary total = len(runs) passed = sum(1 for run in runs if run.get('status') == 'PASSED') @@ -606,38 +738,24 @@ def api_ci_performance(): if complete and ts: durations.append((complete - ts) / 60000.0) - if dashboard: - flake_count = db.query(''' - SELECT COUNT(*) as c FROM test_events WHERE status='flaked' AND dashboard = ? - AND timestamp >= ? AND timestamp <= ? - ''', (dashboard, date_from, date_to + 'T23:59:59')) - total_tests = db.query(''' - SELECT COUNT(*) as c FROM test_events WHERE status IN ('failed','flaked') AND dashboard = ? - AND timestamp >= ? AND timestamp <= ? - ''', (dashboard, date_from, date_to + 'T23:59:59')) - total_failures_count = db.query(''' - SELECT COUNT(*) as c FROM test_events WHERE status='failed' AND dashboard = ? - AND timestamp >= ? AND timestamp <= ? 
- ''', (dashboard, date_from, date_to + 'T23:59:59')) - else: - flake_count = db.query(''' - SELECT COUNT(*) as c FROM test_events WHERE status='flaked' AND timestamp >= ? AND timestamp <= ? - ''', (date_from, date_to + 'T23:59:59')) - total_tests = db.query(''' - SELECT COUNT(*) as c FROM test_events WHERE status IN ('failed','flaked') AND timestamp >= ? AND timestamp <= ? - ''', (date_from, date_to + 'T23:59:59')) - total_failures_count = db.query(''' - SELECT COUNT(*) as c FROM test_events WHERE status='failed' AND timestamp >= ? AND timestamp <= ? - ''', (date_from, date_to + 'T23:59:59')) - - fc = flake_count[0]['c'] if flake_count else 0 - tc = total_tests[0]['c'] if total_tests else 0 - tfc = total_failures_count[0]['c'] if total_failures_count else 0 - - return _json({ + # Test outcome summary from test_daily_stats + ds_summary = db.query(f''' + SELECT SUM(passed) as passed, SUM(failed) as failed, SUM(flaked) as flaked + FROM test_daily_stats {ds_where} + ''', ds_params) + ds_s = ds_summary[0] if ds_summary else {} + fc = ds_s.get('flaked', 0) or 0 + tfc = ds_s.get('failed', 0) or 0 + tpc = ds_s.get('passed', 0) or 0 + tc = fc + tfc + tpc + + _t4 = time.perf_counter() + _result = { 'by_date': by_date, + 'duration_by_dashboard': duration_by_dashboard, 'top_flakes': top_flakes, 'top_failures': top_failures, + 'period': {'from': date_from, 'to': date_to}, 'summary': { 'total_runs': total, 'pass_rate': round(100.0 * passed / max(total, 1), 1), @@ -646,8 +764,12 @@ def api_ci_performance(): 'flake_rate': round(100.0 * fc / max(tc, 1), 1) if tc else 0, 'total_flakes': fc, 'total_test_failures': tfc, + 'total_test_successes': tpc, }, - }) + } + print(f"[perf] ci_performance {date_from}..{date_to} | get_ci_runs={_t1-_t0:.3f}s db_queries={_t2-_t1:.3f}s agg={_t3-_t2:.3f}s top_flakes={_t4-_t3:.3f}s total={_t4-_t0:.3f}s", flush=True) + db.cache_set(_ck, _result, _cache_ttl(date_to)) + return _json(_result) # ---- GitHub integration ---- @@ -682,10 +804,19 @@ def 
api_pr_metrics(): date_from = request.args.get('from', (datetime.now() - timedelta(days=30)).strftime('%Y-%m-%d')) date_to = request.args.get('to', datetime.now().strftime('%Y-%m-%d')) author = request.args.get('author', '') + _ck = f'pr_metrics:{date_from}:{date_to}:{author}' + if cached := db.cache_get(_ck): + return _json(cached) + _t0 = time.perf_counter() ts_from = int(datetime.strptime(date_from, '%Y-%m-%d').timestamp() * 1000) ts_to = int((datetime.strptime(date_to, '%Y-%m-%d') + timedelta(days=1)).timestamp() * 1000) - ci_runs = metrics.get_ci_runs(r, ts_from, ts_to) - return _json(github_data.get_pr_metrics(date_from, date_to, author, ci_runs)) + ci_runs = metrics.get_ci_runs(ts_from, ts_to) + _t1 = time.perf_counter() + _result = github_data.get_pr_metrics(date_from, date_to, author, ci_runs) + _t2 = time.perf_counter() + print(f"[perf] pr_metrics {date_from}..{date_to} | get_ci_runs={_t1-_t0:.3f}s get_pr_metrics={_t2-_t1:.3f}s total={_t2-_t0:.3f}s", flush=True) + db.cache_set(_ck, _result, _cache_ttl(date_to)) + return _json(_result) @app.route('/api/merge-queue/stats') @@ -693,7 +824,32 @@ def api_pr_metrics(): def api_merge_queue_stats(): date_from = request.args.get('from', (datetime.now() - timedelta(days=30)).strftime('%Y-%m-%d')) date_to = request.args.get('to', datetime.now().strftime('%Y-%m-%d')) - return _json(github_data.get_merge_queue_stats(date_from, date_to)) + _ck = f'mq_stats:{date_from}:{date_to}' + if cached := db.cache_get(_ck): + return _json(cached) + _t0 = time.perf_counter() + _result = github_data.get_merge_queue_stats(date_from, date_to) + _t1 = time.perf_counter() + print(f"[perf] merge_queue_stats {date_from}..{date_to} | get_merge_queue_stats={_t1-_t0:.3f}s total={_t1-_t0:.3f}s", flush=True) + db.cache_set(_ck, _result, _cache_ttl(date_to)) + return _json(_result) + + +@app.route('/api/test-history/<test_hash>') +@auth.login_required +def api_test_history(test_hash): + """Test event history by hash — SQLite backing for Redis history_<hash> 
lists.""" + branch = request.args.get('branch', '') + limit = min(int(request.args.get('limit', 1000)), 5000) + rows = metrics.get_test_history(test_hash, branch, limit) + return _json(rows) + + +@app.route('/api/ci/runs/pr/<int:pr_number>') +@auth.login_required +def api_ci_runs_for_pr(pr_number): + limit = min(int(request.args.get('limit', 100)), 500) + return _json(metrics.get_ci_runs_for_pr(pr_number, limit)) @app.route('/api/ci/flakes-by-command') @@ -702,8 +858,38 @@ def api_flakes_by_command(): date_from = request.args.get('from', (datetime.now() - timedelta(days=30)).strftime('%Y-%m-%d')) date_to = request.args.get('to', datetime.now().strftime('%Y-%m-%d')) dashboard = request.args.get('dashboard', '') + _ck = f'flakes:{date_from}:{date_to}:{dashboard}' + _t0 = time.perf_counter() metrics.sync_failed_tests_to_sqlite(r) - return _json(metrics.get_flakes_by_command(date_from, date_to, dashboard)) + _t1 = time.perf_counter() + if cached := db.cache_get(_ck): + return _json(cached) + _result = metrics.get_flakes_by_command(date_from, date_to, dashboard) + _t2 = time.perf_counter() + print(f"[perf] flakes_by_command {date_from}..{date_to} | sync={_t1-_t0:.3f}s get_flakes={_t2-_t1:.3f}s total={_t2-_t0:.3f}s", flush=True) + db.cache_set(_ck, _result, _cache_ttl(date_to)) + return _json(_result) + + +# ---- CI Phase timing ---- + +@app.route('/api/ci/phases') +@auth.login_required +def api_ci_phases(): + """CI phase timing breakdown: avg time per phase, by date, and per run.""" + date_from = request.args.get('from', (datetime.now() - timedelta(days=30)).strftime('%Y-%m-%d')) + date_to = request.args.get('to', datetime.now().strftime('%Y-%m-%d')) + dashboard = request.args.get('dashboard', '') + run_id = request.args.get('run_id', '') + _ck = f'phases:{date_from}:{date_to}:{dashboard}:{run_id}' + if cached := db.cache_get(_ck): + return _json(cached) + _t0 = time.perf_counter() + _result = metrics.get_phases(date_from, date_to, dashboard, run_id) + _t1 = time.perf_counter() + 
print(f"[perf] ci_phases {date_from}..{date_to} | get_phases={_t1-_t0:.3f}s total={_t1-_t0:.3f}s", flush=True) + db.cache_set(_ck, _result, _cache_ttl(date_to)) + return _json(_result) # ---- Test timings ---- @@ -717,96 +903,157 @@ def api_test_timings(): dashboard = request.args.get('dashboard', '') status = request.args.get('status', '') # filter to specific status test_cmd = request.args.get('test_cmd', '') # filter to specific test - - conditions = ['duration_secs IS NOT NULL', 'duration_secs > 0', - 'timestamp >= ?', "timestamp < ? || 'T23:59:59'"] - params = [date_from, date_to] - + _ck = f'timings:{date_from}:{date_to}:{dashboard}:{status}:{test_cmd}' + _ttl = _cache_ttl(date_to) + if cached := db.cache_get(_ck): + return _json(cached) + _t0 = time.perf_counter() + + # Base WHERE for test_daily_stats + ds_conds = ['date >= ?', 'date <= ?'] + ds_params = [date_from, date_to] if dashboard: - conditions.append('dashboard = ?') - params.append(dashboard) - if status: - conditions.append('status = ?') - params.append(status) + ds_conds.append('dashboard = ?') + ds_params.append(dashboard) if test_cmd: - conditions.append('test_cmd = ?') - params.append(test_cmd) - - where = 'WHERE ' + ' AND '.join(conditions) - - # Per-test stats - by_test = db.query(f''' - SELECT test_cmd, - COUNT(*) as count, - ROUND(AVG(duration_secs), 1) as avg_secs, - ROUND(MIN(duration_secs), 1) as min_secs, - ROUND(MAX(duration_secs), 1) as max_secs, - SUM(CASE WHEN status = 'passed' THEN 1 ELSE 0 END) as passed, - SUM(CASE WHEN status = 'failed' THEN 1 ELSE 0 END) as failed, - SUM(CASE WHEN status = 'flaked' THEN 1 ELSE 0 END) as flaked, - dashboard - FROM test_events {where} - GROUP BY test_cmd - ORDER BY count DESC - LIMIT 200 - ''', params) - - # Add pass rate - for row in by_test: - total = row['passed'] + row['failed'] + row['flaked'] - row['pass_rate'] = round(100.0 * row['passed'] / max(total, 1), 1) - row['total_time_secs'] = round(row['avg_secs'] * row['count'], 0) - - # Daily 
time series (aggregate across all tests or filtered test) - by_date = db.query(f''' - SELECT substr(timestamp, 1, 10) as date, - COUNT(*) as count, - ROUND(AVG(duration_secs), 1) as avg_secs, - ROUND(MAX(duration_secs), 1) as max_secs, - SUM(CASE WHEN status = 'passed' THEN 1 ELSE 0 END) as passed, - SUM(CASE WHEN status = 'failed' THEN 1 ELSE 0 END) as failed, - SUM(CASE WHEN status = 'flaked' THEN 1 ELSE 0 END) as flaked - FROM test_events {where} - GROUP BY substr(timestamp, 1, 10) - ORDER BY date - ''', params) - - # Summary - summary_rows = db.query(f''' - SELECT COUNT(*) as count, - ROUND(AVG(duration_secs), 1) as avg_secs, - ROUND(MAX(duration_secs), 1) as max_secs, - SUM(duration_secs) as total_secs, - SUM(CASE WHEN status = 'passed' THEN 1 ELSE 0 END) as passed, - SUM(CASE WHEN status = 'failed' THEN 1 ELSE 0 END) as failed, - SUM(CASE WHEN status = 'flaked' THEN 1 ELSE 0 END) as flaked - FROM test_events {where} - ''', params) - s = summary_rows[0] if summary_rows else {} - - # Slowest individual test runs + ds_conds.append('test_cmd = ?') + ds_params.append(test_cmd) + ds_where = 'WHERE ' + ' AND '.join(ds_conds) + + if not status: + # Fast path: push GROUP BY into SQL — returns N_tests + N_dates rows, not N_tests*N_dates rows + by_test_rows = db.query(f''' + SELECT test_cmd, MAX(dashboard) as dashboard, + SUM(passed) as passed, SUM(failed) as failed, SUM(flaked) as flaked, + SUM(total_secs) as total_secs, SUM(count_timed) as count_timed, + MIN(min_secs) as min_secs, MAX(max_secs) as max_secs + FROM test_daily_stats {ds_where} + GROUP BY test_cmd + ORDER BY SUM(passed)+SUM(failed)+SUM(flaked) DESC LIMIT 500 + ''', ds_params) + _t1 = time.perf_counter() + + by_date_rows = db.query(f''' + SELECT date, + SUM(passed) as passed, SUM(failed) as failed, SUM(flaked) as flaked, + SUM(total_secs) as total_secs, SUM(count_timed) as count_timed + FROM test_daily_stats {ds_where} + GROUP BY date ORDER BY date + ''', ds_params) + _t2 = time.perf_counter() + + by_test 
= [] + for t in by_test_rows: + count = (t['passed'] or 0) + (t['failed'] or 0) + (t['flaked'] or 0) + avg_secs = round(t['total_secs'] / t['count_timed'], 1) if t['count_timed'] else None + by_test.append({ + 'test_cmd': t['test_cmd'], 'dashboard': t['dashboard'], 'count': count, + 'passed': t['passed'] or 0, 'failed': t['failed'] or 0, 'flaked': t['flaked'] or 0, + 'pass_rate': round(100.0 * (t['passed'] or 0) / max(count, 1), 1), + 'avg_secs': avg_secs, 'min_secs': t['min_secs'], 'max_secs': t['max_secs'], + 'total_time_secs': round(t['total_secs'] or 0, 0), + }) + + by_date = [] + for d in by_date_rows: + count = (d['passed'] or 0) + (d['failed'] or 0) + (d['flaked'] or 0) + avg_secs = round(d['total_secs'] / d['count_timed'], 1) if d['count_timed'] else None + by_date.append({ + 'date': d['date'], 'passed': d['passed'] or 0, + 'failed': d['failed'] or 0, 'flaked': d['flaked'] or 0, + 'count': count, 'avg_secs': avg_secs, + }) + + total_passed = sum(d['passed'] for d in by_date) + total_failed = sum(d['failed'] for d in by_date) + total_flaked = sum(d['flaked'] for d in by_date) + total_secs_all = sum(d['total_secs'] or 0 for d in by_date_rows) + count_timed_all = sum(d['count_timed'] or 0 for d in by_date_rows) + else: + # Slow fallback: status filter requires scanning test_events + te_conds = ['duration_secs IS NOT NULL', 'duration_secs > 0', + 'timestamp >= ?', "timestamp < ? 
|| 'T23:59:59'"] + te_params = [date_from, date_to] + if dashboard: + te_conds.append('dashboard = ?') + te_params.append(dashboard) + te_conds.append('status = ?') + te_params.append(status) + if test_cmd: + te_conds.append('test_cmd = ?') + te_params.append(test_cmd) + te_where = 'WHERE ' + ' AND '.join(te_conds) + + raw = db.query(f''' + SELECT test_cmd, dashboard, + COUNT(*) as count, + ROUND(AVG(duration_secs),1) as avg_secs, + ROUND(MIN(duration_secs),1) as min_secs, + ROUND(MAX(duration_secs),1) as max_secs, + SUM(duration_secs) as total_secs, + substr(timestamp,1,10) as date + FROM test_events {te_where} + GROUP BY test_cmd + ORDER BY count DESC LIMIT 200 + ''', te_params) + _t1 = time.perf_counter() + by_test = [dict(r, pass_rate=0, passed=0, failed=r['count'] if status=='failed' else 0, + flaked=r['count'] if status=='flaked' else 0, + total_time_secs=round(r['total_secs'] or 0, 0)) for r in raw] + + by_date_raw = db.query(f''' + SELECT substr(timestamp,1,10) as date, COUNT(*) as count + FROM test_events {te_where} + GROUP BY substr(timestamp,1,10) ORDER BY date + ''', te_params) + by_date = [{'date': r['date'], 'count': r['count'], 'passed': 0, + 'failed': r['count'] if status=='failed' else 0, + 'flaked': r['count'] if status=='flaked' else 0} for r in by_date_raw] + + total_passed = 0 + total_failed = sum(r['count'] for r in by_date) if status == 'failed' else 0 + total_flaked = sum(r['count'] for r in by_date) if status == 'flaked' else 0 + total_secs_all = sum(r.get('total_secs') or 0 for r in raw) + count_timed_all = sum(r['count'] for r in raw) + _t2 = time.perf_counter() + + # Slowest individual runs — uses idx_test_events_duration index + sl_conds = ['duration_secs IS NOT NULL', 'duration_secs > 0', + 'timestamp >= ?', "timestamp <= ? 
|| 'T23:59:59'"] + sl_params = [date_from, date_to] + if dashboard: + sl_conds.append('dashboard = ?') + sl_params.append(dashboard) + if test_cmd: + sl_conds.append('test_cmd = ?') + sl_params.append(test_cmd) + sl_where = 'WHERE ' + ' AND '.join(sl_conds) slowest = db.query(f''' SELECT test_cmd, status, duration_secs, dashboard, - substr(timestamp, 1, 10) as date, commit_author, log_url - FROM test_events {where} - ORDER BY duration_secs DESC - LIMIT 50 - ''', params) - - return _json({ + substr(timestamp,1,10) as date, commit_author, log_url + FROM test_events {sl_where} + ORDER BY duration_secs DESC LIMIT 50 + ''', sl_params) + _t3 = time.perf_counter() + + print(f"[perf] test_timings {date_from}..{date_to} | by_test={_t1-_t0:.3f}s by_date={_t2-_t1:.3f}s slowest={_t3-_t2:.3f}s total={_t3-_t0:.3f}s", flush=True) + _result = { 'by_test': by_test, 'by_date': by_date, 'slowest': slowest, + 'period': {'from': date_from, 'to': date_to}, 'summary': { - 'total_runs': s.get('count', 0), - 'avg_duration_secs': s.get('avg_secs'), - 'max_duration_secs': s.get('max_secs'), - 'total_compute_secs': round(s.get('total_secs', 0) or 0, 0), - 'passed': s.get('passed', 0), - 'failed': s.get('failed', 0), - 'flaked': s.get('flaked', 0), + 'total_runs': total_passed + total_failed + total_flaked, + 'avg_duration_secs': round(total_secs_all / count_timed_all, 1) if count_timed_all > 0 else None, + 'max_duration_secs': slowest[0]['duration_secs'] if slowest else None, + 'total_compute_secs': round(total_secs_all, 0), + 'passed': total_passed, + 'failed': total_failed, + 'flaked': total_flaked, }, - }) + } + db.cache_set(_ck, _result, _ttl) + return _json(_result) # ---- Dashboard views ---- @@ -844,5 +1091,59 @@ def test_timings(): return "Dashboard not found", 404 +@app.route('/ci-health-report') +@auth.login_required +def ci_health_report(): + path = Path(__file__).parent / 'views' / 'ci-health-report.html' + if path.exists(): + return path.read_text() + return "Report not found", 
404 + + +@app.route('/commits') +@auth.login_required +def commits_page(): + path = Path(__file__).parent / 'views' / 'commits.html' + return path.read_text() + + +@app.route('/api/commits') +@auth.login_required +def api_commits(): + branch = request.args.get('branch', 'next') + page = max(1, int(request.args.get('page', 1))) + per_page = min(int(request.args.get('per_page', 50)), 100) + return _json(github_data.get_recent_commits(branch, page, per_page)) + + +@app.route('/flake-prs') +@auth.login_required +def flake_prs(): + path = Path(__file__).parent / 'views' / 'flake-prs.html' + if path.exists(): + return path.read_text() + return "Page not found", 404 + + +@app.route('/api/flake-prs') +@auth.login_required +def api_flake_prs(): + rows = db.query(''' + SELECT pa.pr_number, pa.author, pa.title, pa.branch, + pa.additions, pa.deletions, pa.fetched_at, + MIN(cr.timestamp_ms) as first_seen_ms + FROM pr_authors pa + LEFT JOIN ci_runs cr ON cr.pr_number = pa.pr_number + WHERE ( + pa.title LIKE '%flake%' OR pa.title LIKE '%deflake%' + OR pa.branch LIKE '%flake%' OR pa.branch LIKE '%deflake%' + ) + GROUP BY pa.pr_number + ORDER BY pa.pr_number DESC + LIMIT 200 + ''') + return _json([dict(r) for r in rows]) + + if __name__ == '__main__': app.run(host='0.0.0.0', port=8081) diff --git a/ci3/ci-metrics/billing/aws.py b/ci3/ci-metrics/billing/aws.py index 481393d74ec3..4dc9061b37df 100644 --- a/ci3/ci-metrics/billing/aws.py +++ b/ci3/ci-metrics/billing/aws.py @@ -54,6 +54,8 @@ # Messaging 'Amazon Simple Notification Service': 'sns', 'Amazon Simple Queue Service': 'sqs', + # Savings Plans / Reserved Instances + 'Savings Plans for AWS Compute usage': 'savings_plans', # Other 'Tax': 'tax', 'AWS Support (Business)': 'support', @@ -63,6 +65,16 @@ import re +# One-time contract payments: annual Savings Plan upfronts and monthly Reserved Instance charges. +# These appear as large single-day spikes but are not operational spend. 
+_ONE_TIME_CATEGORIES = frozenset({ + 'savings_plan_1yr_annual', + 'savings_plan_3yr_annual', + 'savings_plan_1yr_annual_partial', + 'savings_plan_3yr_annual_partial', + 'reserved_instance_monthly', +}) + _cache = {'rows': [], 'ts': 0} _cache_lock = threading.Lock() _detail_cache = {'rows': [], 'ts': 0} @@ -152,7 +164,10 @@ def _fetch_aws_costs(date_from: str, date_to: str) -> list[dict]: TimePeriod={'Start': date_from, 'End': date_to}, Granularity='DAILY', Metrics=['UnblendedCost'], - GroupBy=[{'Type': 'DIMENSION', 'Key': 'SERVICE'}], + GroupBy=[ + {'Type': 'DIMENSION', 'Key': 'SERVICE'}, + {'Type': 'DIMENSION', 'Key': 'USAGE_TYPE'}, + ], ) if next_token: kwargs['NextPageToken'] = next_token @@ -163,12 +178,26 @@ def _fetch_aws_costs(date_from: str, date_to: str) -> list[dict]: date = result['TimePeriod']['Start'] for group in result['Groups']: service = group['Keys'][0] + usage_type = group['Keys'][1] if len(group['Keys']) > 1 else '' amount = float(group['Metrics']['UnblendedCost']['Amount']) if amount == 0: continue category = SERVICE_CATEGORY_MAP.get(service, 'other') + # Savings plans: ComputeSP:1yrAllUpfront, ComputeSP:3yrNoUpfront, etc. 
+ if category == 'savings_plans': + m = re.match(r'ComputeSP:(\d+yr)(\w+)', usage_type) + if m: + term = m.group(1) + payment = m.group(2) + if payment == 'NoUpfront': + category = f'savings_plan_{term}_monthly' + elif 'Upfront' in payment: + category = f'savings_plan_{term}_annual' + # EC2 reserved instances: HeavyUsage: billed monthly on 1st + elif category == 'ec2' and 'HeavyUsage:' in usage_type: + category = 'reserved_instance_monthly' if category == 'other': - print(f"[rk_aws_costs] unmapped service: {service!r} (${amount:.2f})") + print(f"[rk_aws_costs] unmapped service: {service!r} / {usage_type!r} (${amount:.2f})") rows.append({ 'date': date, 'service': service, @@ -322,26 +351,32 @@ def get_costs_overview(date_from: str, date_to: str) -> dict: for r in aws_rows: d = r['date'] if d not in by_date: - by_date[d] = {'date': d, 'aws': {}, 'gcp': {}, 'aws_total': 0, 'gcp_total': 0} + by_date[d] = {'date': d, 'aws': {}, 'gcp': {}, 'aws_total': 0, 'gcp_total': 0, 'aws_one_time': 0} cat = r['category'] by_date[d]['aws'][cat] = by_date[d]['aws'].get(cat, 0) + r['amount_usd'] by_date[d]['aws_total'] += r['amount_usd'] + if cat in _ONE_TIME_CATEGORIES: + by_date[d]['aws_one_time'] += r['amount_usd'] for d, cats in gcp_by_date.items(): if d not in by_date: - by_date[d] = {'date': d, 'aws': {}, 'gcp': {}, 'aws_total': 0, 'gcp_total': 0} + by_date[d] = {'date': d, 'aws': {}, 'gcp': {}, 'aws_total': 0, 'gcp_total': 0, 'aws_one_time': 0} by_date[d]['gcp'] = cats by_date[d]['gcp_total'] = sum(cats.values()) sorted_dates = sorted(by_date.values(), key=lambda x: x['date']) aws_total = sum(d['aws_total'] for d in sorted_dates) + aws_one_time = sum(d['aws_one_time'] for d in sorted_dates) gcp_total = sum(d['gcp_total'] for d in sorted_dates) return { 'by_date': sorted_dates, 'totals': { 'aws': round(aws_total, 2), + 'aws_operational': round(aws_total - aws_one_time, 2), + 'aws_one_time': round(aws_one_time, 2), 'gcp': round(gcp_total, 2), 'combined': round(aws_total + 
gcp_total, 2), + 'combined_operational': round(aws_total - aws_one_time + gcp_total, 2), } } diff --git a/ci3/ci-metrics/db.py b/ci3/ci-metrics/db.py index 93e970fe3a56..e19380902825 100644 --- a/ci3/ci-metrics/db.py +++ b/ci3/ci-metrics/db.py @@ -3,11 +3,14 @@ Stores test events (from Redis pub/sub) and merge queue daily stats (backfilled from GitHub API). """ +import json import os import sqlite3 import threading +import time -_DB_PATH = os.path.join(os.getenv('LOGS_DISK_PATH', '/logs-disk'), 'metrics.db') +_DB_PATH = os.getenv('METRICS_DB_PATH', + os.path.join(os.getenv('LOGS_DISK_PATH', '/logs-disk'), 'metrics.db')) _local = threading.local() SCHEMA = """ @@ -34,6 +37,7 @@ CREATE INDEX IF NOT EXISTS idx_test_events_ts ON test_events(timestamp); CREATE INDEX IF NOT EXISTS idx_test_events_cmd ON test_events(test_cmd); CREATE INDEX IF NOT EXISTS idx_test_events_dashboard ON test_events(dashboard); +CREATE INDEX IF NOT EXISTS idx_test_events_status_ts ON test_events(status, timestamp); CREATE TABLE IF NOT EXISTS merge_queue_daily ( date TEXT PRIMARY KEY, @@ -64,6 +68,84 @@ CREATE INDEX IF NOT EXISTS idx_ci_runs_ts ON ci_runs(timestamp_ms); CREATE INDEX IF NOT EXISTS idx_ci_runs_name ON ci_runs(name); CREATE INDEX IF NOT EXISTS idx_ci_runs_dashboard ON ci_runs(dashboard); + +CREATE TABLE IF NOT EXISTS test_daily_stats ( + date TEXT NOT NULL, + test_cmd TEXT NOT NULL, + dashboard TEXT NOT NULL DEFAULT '', + passed INTEGER NOT NULL DEFAULT 0, + failed INTEGER NOT NULL DEFAULT 0, + flaked INTEGER NOT NULL DEFAULT 0, + total_secs REAL NOT NULL DEFAULT 0, + count_timed INTEGER NOT NULL DEFAULT 0, + min_secs REAL, + max_secs REAL, + PRIMARY KEY (date, test_cmd, dashboard) +); +CREATE INDEX IF NOT EXISTS idx_tds_date ON test_daily_stats(date); +CREATE INDEX IF NOT EXISTS idx_tds_dashboard ON test_daily_stats(dashboard); + +CREATE TABLE IF NOT EXISTS merge_queue_snapshots ( + id INTEGER PRIMARY KEY AUTOINCREMENT, + timestamp TEXT NOT NULL, + depth INTEGER NOT NULL, + 
entries_json TEXT +); +CREATE INDEX IF NOT EXISTS idx_mqs_ts ON merge_queue_snapshots(timestamp); + +CREATE TABLE IF NOT EXISTS ci_run_daily_stats ( + date TEXT NOT NULL, + dashboard TEXT NOT NULL, + run_count INTEGER NOT NULL DEFAULT 0, + passed INTEGER NOT NULL DEFAULT 0, + failed INTEGER NOT NULL DEFAULT 0, + sum_duration REAL NOT NULL DEFAULT 0, + min_duration REAL, + max_duration REAL, + p50_duration REAL, + p95_duration REAL, + PRIMARY KEY (date, dashboard) +); +CREATE INDEX IF NOT EXISTS idx_crds_date ON ci_run_daily_stats(date); + +CREATE TABLE IF NOT EXISTS ci_phases ( + id INTEGER PRIMARY KEY AUTOINCREMENT, + phase TEXT NOT NULL, + duration_secs REAL NOT NULL, + exit_code INTEGER, + run_id TEXT, + job_id TEXT, + dashboard TEXT NOT NULL DEFAULT '', + ref_name TEXT, + commit_hash TEXT, + timestamp TEXT NOT NULL +); +CREATE INDEX IF NOT EXISTS idx_ci_phases_run ON ci_phases(run_id); +CREATE INDEX IF NOT EXISTS idx_ci_phases_ts ON ci_phases(timestamp); +CREATE INDEX IF NOT EXISTS idx_ci_phases_phase ON ci_phases(phase); + +CREATE TABLE IF NOT EXISTS pr_authors ( + pr_number INTEGER PRIMARY KEY, + author TEXT NOT NULL, + title TEXT NOT NULL DEFAULT '', + branch TEXT NOT NULL DEFAULT '', + additions INTEGER DEFAULT 0, + deletions INTEGER DEFAULT 0, + fetched_at TEXT NOT NULL +); + +CREATE TABLE IF NOT EXISTS api_cache ( + key TEXT PRIMARY KEY, + value TEXT NOT NULL, + created_at REAL NOT NULL, + ttl_secs INTEGER NOT NULL DEFAULT 300 +); + +CREATE TABLE IF NOT EXISTS pr_cache ( + key TEXT PRIMARY KEY, + value TEXT NOT NULL, + updated_at REAL NOT NULL +); """ @@ -73,6 +155,16 @@ "ALTER TABLE ci_runs ADD COLUMN job_id TEXT DEFAULT ''", "ALTER TABLE ci_runs ADD COLUMN arch TEXT DEFAULT ''", "CREATE INDEX IF NOT EXISTS idx_ci_runs_dashboard ON ci_runs(dashboard)", + "ALTER TABLE test_events ADD COLUMN test_hash TEXT", + "CREATE INDEX IF NOT EXISTS idx_test_events_hash ON test_events(test_hash)", + "ALTER TABLE merge_queue_daily ADD COLUMN avg_depth REAL", + "ALTER 
TABLE merge_queue_daily ADD COLUMN peak_depth INTEGER", + "CREATE INDEX IF NOT EXISTS idx_test_events_duration_ts ON test_events(timestamp) WHERE duration_secs IS NOT NULL AND duration_secs > 0", + "ALTER TABLE test_daily_stats ADD COLUMN total_secs REAL NOT NULL DEFAULT 0", + "ALTER TABLE test_daily_stats ADD COLUMN count_timed INTEGER NOT NULL DEFAULT 0", + "ALTER TABLE test_daily_stats ADD COLUMN min_secs REAL", + "ALTER TABLE test_daily_stats ADD COLUMN max_secs REAL", + "CREATE INDEX IF NOT EXISTS idx_test_events_duration ON test_events(duration_secs DESC) WHERE duration_secs IS NOT NULL AND duration_secs > 0", ] @@ -105,3 +197,31 @@ def execute(sql: str, params=()): conn = get_db() conn.execute(sql, params) conn.commit() + + +def cache_get(key: str): + """Return cached value (parsed JSON) if not expired, else None.""" + rows = query('SELECT value, created_at, ttl_secs FROM api_cache WHERE key = ?', (key,)) + if rows and time.time() - rows[0]['created_at'] < rows[0]['ttl_secs']: + return json.loads(rows[0]['value']) + return None + + +def cache_set(key: str, data, ttl_secs: int = 300) -> None: + """Store data as JSON in the cache with a TTL.""" + execute( + 'INSERT OR REPLACE INTO api_cache (key, value, created_at, ttl_secs) VALUES (?, ?, ?, ?)', + (key, json.dumps(data, default=str), time.time(), ttl_secs), + ) + + +def cache_invalidate_prefix(prefix: str) -> None: + """Delete all cache entries whose key starts with prefix.""" + execute('DELETE FROM api_cache WHERE key LIKE ?', (prefix + '%',)) + + +def cache_cleanup() -> None: + """Remove expired entries.""" + execute( + "DELETE FROM api_cache WHERE created_at + ttl_secs < unixepoch('now')" + ) diff --git a/ci3/ci-metrics/ec2_pricing.py b/ci3/ci-metrics/ec2_pricing.py index ace55ea4f40a..96e0561d0d70 100644 --- a/ci3/ci-metrics/ec2_pricing.py +++ b/ci3/ci-metrics/ec2_pricing.py @@ -16,12 +16,20 @@ # ---- Hardcoded fallback rates (us-east-2, USD/hr) ---- _HARDCODED_RATES = { - ('m6a.48xlarge', True): 8.31, # 
spot - ('m6a.48xlarge', False): 16.56, # on-demand - ('m6a.32xlarge', True): 5.54, - ('m6a.32xlarge', False): 11.04, + ('m6a.xlarge', True): 0.07, # spot + ('m6a.xlarge', False): 0.1728, # on-demand + ('m6a.4xlarge', True): 0.28, + ('m6a.4xlarge', False): 0.6912, + ('m6a.8xlarge', True): 0.55, + ('m6a.8xlarge', False): 1.3824, ('m6a.16xlarge', True): 2.77, ('m6a.16xlarge', False): 5.52, + ('m6a.24xlarge', True): 1.66, + ('m6a.24xlarge', False): 4.1472, + ('m6a.32xlarge', True): 5.54, + ('m6a.32xlarge', False): 11.04, + ('m6a.48xlarge', True): 8.31, + ('m6a.48xlarge', False): 16.56, ('m7a.48xlarge', True): 8.31, ('m7a.48xlarge', False): 16.56, ('m7a.16xlarge', True): 2.77, @@ -145,8 +153,19 @@ def _fetch_all_spot(instance_types: list[str]) -> dict[str, float]: # ---- Cache refresh ---- def _get_known_instance_types() -> list[str]: - """Return the set of instance types we need pricing for.""" - return sorted({itype for itype, _ in _HARDCODED_RATES}) + """Return the set of instance types we need pricing for (hardcoded + from DB).""" + types = {itype for itype, _ in _HARDCODED_RATES} + try: + import db + conn = db.get_db() + rows = conn.execute( + "SELECT DISTINCT instance_type FROM ci_runs " + "WHERE instance_type IS NOT NULL AND instance_type != '' AND instance_type != 'unknown'" + ).fetchall() + types.update(r['instance_type'] for r in rows) + except Exception: + pass + return sorted(types) def _refresh_cache(): diff --git a/ci3/ci-metrics/github_data.py b/ci3/ci-metrics/github_data.py index 8824d187cb81..9c36a708025d 100644 --- a/ci3/ci-metrics/github_data.py +++ b/ci3/ci-metrics/github_data.py @@ -1,15 +1,20 @@ """GitHub API polling with in-memory cache. -Fetches PR lifecycle, deployment runs, branch lag, and merge queue stats via `gh` CLI. +Fetches PR lifecycle, deployment runs, branch lag, and merge queue stats via +the GitHub REST API (using requests + GH_TOKEN env var). Most data cached in memory with TTL. Merge queue stats persisted to SQLite daily. 
""" import json -import subprocess +import os +import requests import threading import time from datetime import datetime, timedelta, timezone +import db as _db + REPO = 'AztecProtocol/aztec-packages' +_GH_API = 'https://api.github.com' BRANCH_PAIRS = [ ('next', 'staging-public'), @@ -25,41 +30,126 @@ _CACHE_TTL = 3600 # 1 hour _pr_cache = {'data': [], 'ts': 0} +_commits_cache: dict = {} # keyed by branch +_commits_lock = threading.Lock() _deploy_cache = {'data': [], 'ts': 0} _lag_cache = {'data': [], 'ts': 0} -_pr_author_cache = {} # {pr_number: {'author': str, 'title': str, 'branch': str}} _pr_lock = threading.Lock() _deploy_lock = threading.Lock() _lag_lock = threading.Lock() -def _gh(args: list[str]) -> str | None: +def _gh_headers() -> dict: + token = os.environ.get('GH_TOKEN') or os.environ.get('GITHUB_TOKEN', '') + h = {'Accept': 'application/vnd.github+json', 'X-GitHub-Api-Version': '2022-11-28'} + if token: + h['Authorization'] = f'Bearer {token}' + return h + + +def _github_get(path: str, paginate: bool = False) -> list | dict | None: + """GET from GitHub REST API. Returns parsed JSON (list or dict). 
+ If paginate=True, follows Link: next headers and merges array results.""" + url = f'{_GH_API}/{path}' if not path.startswith('http') else path + headers = _gh_headers() try: - result = subprocess.run( - ['gh'] + args, - capture_output=True, text=True, timeout=30 - ) - if result.returncode == 0: - return result.stdout.strip() - except (FileNotFoundError, subprocess.TimeoutExpired) as e: - print(f"[rk_github] gh error: {e}") - return None + if not paginate: + resp = requests.get(url, headers=headers, timeout=30) + if resp.status_code != 200: + print(f"[rk_github] API {resp.status_code}: {url}") + return None + return resp.json() + # Paginated: collect all pages + all_items = [] + while url: + resp = requests.get(url, headers=headers, timeout=30) + if resp.status_code != 200: + print(f"[rk_github] API {resp.status_code}: {url}") + break + data = resp.json() + if isinstance(data, list): + all_items.extend(data) + elif isinstance(data, dict): + # For endpoints like /actions/workflows/.../runs that wrap in an object + all_items.append(data) + # Follow Link: ; rel="next" + link = resp.headers.get('Link', '') + url = None + for part in link.split(','): + if 'rel="next"' in part: + url = part.split('<')[1].split('>')[0] + return all_items + except Exception as e: + print(f"[rk_github] API error: {e}") + return None + + +def _github_graphql(query: str, variables: dict = None) -> dict | None: + """Execute a GitHub GraphQL query.""" + headers = _gh_headers() + try: + resp = requests.post(f'{_GH_API}/graphql', headers=headers, + json={'query': query, 'variables': variables or {}}, + timeout=30) + if resp.status_code != 200: + print(f"[rk_github] GraphQL {resp.status_code}") + return None + data = resp.json() + if 'errors' in data: + print(f"[rk_github] GraphQL errors: {data['errors']}") + return data.get('data') + except Exception as e: + print(f"[rk_github] GraphQL error: {e}") + return None # ---- PR lifecycle ---- +_PR_GQL = ''' +query($owner: String!, $repo: String!, 
$cursor: String) { + repository(owner: $owner, name: $repo) { + pullRequests(states: MERGED, first: 100, after: $cursor, orderBy: {field: UPDATED_AT, direction: DESC}) { + pageInfo { hasNextPage endCursor } + nodes { + number + author { login } + title + createdAt + mergedAt + closedAt + baseRefName + headRefName + additions + deletions + changedFiles + isDraft + reviewDecision + labels(first: 20) { nodes { name } } + } + } + } +}''' + + def _fetch_and_process_prs() -> list[dict]: - out = _gh([ - 'pr', 'list', '--repo', REPO, '--state', 'merged', - '--limit', '500', - '--json', 'number,author,title,createdAt,mergedAt,closedAt,baseRefName,' - 'headRefName,additions,deletions,changedFiles,isDraft,reviewDecision,labels' - ]) - if not out: - return [] - try: - prs = json.loads(out) - except json.JSONDecodeError: + owner, repo = REPO.split('/') + prs = [] + cursor = None + for _ in range(5): # max 5 pages = 500 PRs + data = _github_graphql(_PR_GQL, {'owner': owner, 'repo': repo, 'cursor': cursor}) + if not data: + break + pr_data = data.get('repository', {}).get('pullRequests', {}) + nodes = pr_data.get('nodes', []) + for node in nodes: + node['author'] = (node.get('author') or {}).get('login', 'unknown') + node['labels'] = [l['name'] for l in (node.get('labels') or {}).get('nodes', [])] + prs.extend(nodes) + page_info = pr_data.get('pageInfo', {}) + if not page_info.get('hasNextPage'): + break + cursor = page_info.get('endCursor') + if not prs: return [] for pr in prs: @@ -87,9 +177,20 @@ def _fetch_and_process_prs() -> list[dict]: def _ensure_prs(): + import db as _db now = time.time() if _pr_cache['data'] and now - _pr_cache['ts'] < _CACHE_TTL: return + # Try SQLite cache before hitting GitHub + if not _pr_cache['data']: + try: + rows = _db.query("SELECT value, updated_at FROM pr_cache WHERE key = 'prs'") + if rows and now - rows[0]['updated_at'] < _CACHE_TTL: + _pr_cache['data'] = json.loads(rows[0]['value']) + _pr_cache['ts'] = rows[0]['updated_at'] + return + 
except Exception: + pass if not _pr_lock.acquire(blocking=False): return try: @@ -97,6 +198,13 @@ def _ensure_prs(): if prs: _pr_cache['data'] = prs _pr_cache['ts'] = now + try: + _db.execute( + "INSERT OR REPLACE INTO pr_cache (key, value, updated_at) VALUES ('prs', ?, ?)", + (json.dumps(prs, default=str), now), + ) + except Exception: + pass finally: _pr_lock.release() @@ -106,20 +214,14 @@ def _ensure_prs(): def _fetch_all_deploys() -> list[dict]: all_runs = [] for workflow in DEPLOY_WORKFLOWS: - out = _gh([ - 'run', 'list', '--repo', REPO, - '--workflow', workflow, '--limit', '50', - '--json', 'databaseId,status,conclusion,createdAt,updatedAt,headBranch,name' - ]) - if not out: - continue - try: - runs = json.loads(out) - except json.JSONDecodeError: + data = _github_get( + f'repos/{REPO}/actions/workflows/{workflow}/runs?per_page=50&status=completed') + if not data: continue + runs = data.get('workflow_runs', []) for run in runs: - started = run.get('createdAt', '') - completed = run.get('updatedAt') + started = run.get('created_at', '') + completed = run.get('updated_at') duration = None if started and completed: try: @@ -129,9 +231,9 @@ def _fetch_all_deploys() -> list[dict]: except (ValueError, TypeError): pass all_runs.append({ - 'run_id': str(run.get('databaseId', '')), + 'run_id': str(run.get('id', '')), 'workflow_name': workflow.replace('.yml', ''), - 'ref_name': run.get('headBranch', ''), + 'ref_name': run.get('head_branch', ''), 'status': run.get('conclusion', run.get('status', 'unknown')), 'started_at': started, 'completed_at': completed, @@ -162,26 +264,22 @@ def _fetch_branch_lag() -> list[dict]: results = [] today = datetime.now(timezone.utc).date().isoformat() for source, target in BRANCH_PAIRS: - out = _gh([ - 'api', f'repos/{REPO}/compare/{target}...{source}', - '--jq', '.ahead_by' - ]) - if not out: + data = _github_get(f'repos/{REPO}/compare/{target}...{source}') + if not data: continue try: - commits_behind = int(out) + commits_behind = 
int(data.get('ahead_by', 0)) except (ValueError, TypeError): continue days_behind = None - out2 = _gh([ - 'api', f'repos/{REPO}/compare/{target}...{source}', - '--jq', '.commits[0].commit.committer.date' - ]) - if out2: + commits = data.get('commits', []) + if commits: try: - oldest = datetime.fromisoformat(out2.replace('Z', '+00:00')) - days_behind = round((datetime.now(timezone.utc) - oldest).total_seconds() / 86400, 1) + oldest_date = commits[0].get('commit', {}).get('committer', {}).get('date', '') + if oldest_date: + oldest = datetime.fromisoformat(oldest_date.replace('Z', '+00:00')) + days_behind = round((datetime.now(timezone.utc) - oldest).total_seconds() / 86400, 1) except (ValueError, TypeError): pass @@ -291,71 +389,106 @@ def get_branch_lag(date_from: str, date_to: str) -> dict: return {'pairs': pairs} +def _cache_pr_author(pr_number: int, info: dict): + """Write PR author info to SQLite cache.""" + _db.execute(''' + INSERT OR REPLACE INTO pr_authors (pr_number, author, title, branch, additions, deletions, fetched_at) + VALUES (?, ?, ?, ?, ?, ?, ?) + ''', (pr_number, info['author'], info.get('title', ''), info.get('branch', ''), + info.get('additions', 0), info.get('deletions', 0), + datetime.now(timezone.utc).isoformat())) + + +def _get_cached_pr_author(pr_number: int) -> dict | None: + """Read PR author info from SQLite cache.""" + rows = _db.query('SELECT * FROM pr_authors WHERE pr_number = ?', (pr_number,)) + if rows: + r = rows[0] + return {'author': r['author'], 'title': r['title'], 'branch': r['branch'], + 'additions': r['additions'], 'deletions': r['deletions']} + return None + + def get_pr_author(pr_number) -> dict | None: - """Look up PR author/title by number. Results are cached permanently (PR data doesn't change).""" + """Look up PR author/title by number. 
Results cached in SQLite.""" pr_number = int(pr_number) if pr_number else None if not pr_number: return None - if pr_number in _pr_author_cache: - return _pr_author_cache[pr_number] - # Check merged PR cache first (already fetched) + # Check SQLite cache + cached = _get_cached_pr_author(pr_number) + if cached: + return cached + + # Check merged PR cache (already fetched in-memory) for pr in _pr_cache.get('data', []): if pr.get('number') == pr_number: info = {'author': pr.get('author', 'unknown'), 'title': pr.get('title', ''), 'branch': pr.get('headRefName', ''), 'additions': pr.get('additions', 0), 'deletions': pr.get('deletions', 0)} - _pr_author_cache[pr_number] = info + _cache_pr_author(pr_number, info) return info - # Fetch from GitHub API - out = _gh(['pr', 'view', str(pr_number), '--repo', REPO, - '--json', 'author,title,headRefName,additions,deletions']) - if out: + # Fetch from GitHub REST API + data = _github_get(f'repos/{REPO}/pulls/{pr_number}') + if data: try: - data = json.loads(out) - author = data.get('author', {}) - if isinstance(author, dict): - author = author.get('login', 'unknown') + author = (data.get('user') or {}).get('login', 'unknown') info = {'author': author, 'title': data.get('title', ''), - 'branch': data.get('headRefName', ''), + 'branch': (data.get('head') or {}).get('ref', ''), 'additions': data.get('additions', 0), 'deletions': data.get('deletions', 0)} - _pr_author_cache[pr_number] = info + _cache_pr_author(pr_number, info) return info - except (json.JSONDecodeError, KeyError): + except (KeyError, TypeError): pass return None def batch_get_pr_authors(pr_numbers: set) -> dict: - """Fetch authors for multiple PR numbers, using cache. Returns {pr_number: info}.""" + """Fetch authors for multiple PR numbers, using SQLite cache. 
Returns {pr_number: info}.""" result = {} - to_fetch = [] - for prn in pr_numbers: - if not prn: - continue - prn = int(prn) - if prn in _pr_author_cache: - result[prn] = _pr_author_cache[prn] - else: - to_fetch.append(prn) - - # Check merged PR cache first - for pr in _pr_cache.get('data', []): - num = pr.get('number') - if num in to_fetch: - info = {'author': pr.get('author', 'unknown'), 'title': pr.get('title', ''), - 'branch': pr.get('headRefName', ''), - 'additions': pr.get('additions', 0), 'deletions': pr.get('deletions', 0)} - _pr_author_cache[num] = info - result[num] = info - to_fetch.remove(num) - - # Fetch remaining individually (with a cap to avoid API abuse) - for prn in to_fetch[:50]: - info = get_pr_author(prn) - if info: - result[prn] = info + # Batch fetch from SQLite cache in a single query + clean = [int(prn) for prn in pr_numbers if prn] + if not clean: + return result + placeholders = ','.join('?' * len(clean)) + cached_rows = _db.query( + f'SELECT * FROM pr_authors WHERE pr_number IN ({placeholders})', clean) + cached_set = set() + for r in cached_rows: + prn = r['pr_number'] + result[prn] = {'author': r['author'], 'title': r['title'], 'branch': r['branch'], + 'additions': r['additions'], 'deletions': r['deletions']} + cached_set.add(prn) + to_fetch = [prn for prn in clean if prn not in cached_set] + + # Check merged PR cache (in-memory) + if to_fetch: + to_fetch_set = set(to_fetch) + for pr in _pr_cache.get('data', []): + num = pr.get('number') + if num in to_fetch_set: + info = {'author': pr.get('author', 'unknown'), 'title': pr.get('title', ''), + 'branch': pr.get('headRefName', ''), + 'additions': pr.get('additions', 0), 'deletions': pr.get('deletions', 0)} + _cache_pr_author(num, info) + result[num] = info + to_fetch_set.discard(num) + to_fetch = list(to_fetch_set) + + # Fetch remaining concurrently (with a cap to avoid API abuse) + if to_fetch: + from concurrent.futures import ThreadPoolExecutor, as_completed + with 
ThreadPoolExecutor(max_workers=10) as pool: + futures = {pool.submit(get_pr_author, prn): prn for prn in to_fetch[:50]} + for fut in as_completed(futures): + prn = futures[fut] + try: + info = fut.result() + if info: + result[prn] = info + except Exception: + pass return result @@ -495,33 +628,29 @@ def _median(vals): def _fetch_merge_queue_runs(date_str: str) -> dict: """Fetch merge_group workflow runs for a single date. Returns daily summary.""" - out = _gh([ - 'api', '--paginate', + pages = _github_get( f'repos/{REPO}/actions/workflows/{CI3_WORKFLOW}/runs' f'?event=merge_group&created={date_str}&per_page=100', - '--jq', '.workflow_runs[] | [.conclusion, .status] | @tsv', - ]) + paginate=True) summary = {'date': date_str, 'total': 0, 'success': 0, 'failure': 0, 'cancelled': 0, 'in_progress': 0} - if not out: + if not pages: return summary - for line in out.strip().split('\n'): - if not line.strip(): - continue - parts = line.split('\t') - conclusion = parts[0] if parts[0] else '' - status = parts[1] if len(parts) > 1 else '' - summary['total'] += 1 - if conclusion == 'success': - summary['success'] += 1 - elif conclusion == 'failure': - summary['failure'] += 1 - elif conclusion == 'cancelled': - summary['cancelled'] += 1 - elif status in ('in_progress', 'queued', 'waiting'): - summary['in_progress'] += 1 - else: - summary['failure'] += 1 # treat unknown conclusions as failures + for page in pages: + for run in (page.get('workflow_runs') or []) if isinstance(page, dict) else []: + conclusion = run.get('conclusion') or '' + status = run.get('status') or '' + summary['total'] += 1 + if conclusion == 'success': + summary['success'] += 1 + elif conclusion == 'failure': + summary['failure'] += 1 + elif conclusion == 'cancelled': + summary['cancelled'] += 1 + elif status in ('in_progress', 'queued', 'waiting'): + summary['in_progress'] += 1 + else: + summary['failure'] += 1 # treat unknown conclusions as failures return summary @@ -597,13 +726,14 @@ def 
_backfill_merge_queue(): def refresh_merge_queue_today(): - """Refresh today's (and yesterday's) merge queue stats. Called periodically.""" + """Refresh recent merge queue stats. Re-fetches the last 7 days to fix any + zero rows written during transient API failures.""" import db conn = db.get_db() - today = datetime.now(timezone.utc).date().isoformat() - yesterday = (datetime.now(timezone.utc) - timedelta(days=1)).date().isoformat() + today = datetime.now(timezone.utc).date() - for ds in [yesterday, today]: + for i in range(7): + ds = (today - timedelta(days=i)).isoformat() summary = _fetch_merge_queue_runs(ds) conn.execute( 'INSERT OR REPLACE INTO merge_queue_daily (date, total, success, failure, cancelled, in_progress) ' @@ -613,6 +743,80 @@ def refresh_merge_queue_today(): conn.commit() +_MQ_DEPTH_GQL = ''' +query($owner: String!, $repo: String!, $branch: String!) { + repository(owner: $owner, name: $repo) { + mergeQueue(branch: $branch) { + entries(first: 100) { + totalCount + nodes { position state enqueuedAt pullRequest { number title author { login } } } + } + } + } +}''' + +_MQ_BRANCH = 'next' + + +def poll_merge_queue_depth(): + """Snapshot the current merge queue depth into SQLite.""" + import db + owner, repo = REPO.split('/') + data = _github_graphql(_MQ_DEPTH_GQL, + {'owner': owner, 'repo': repo, 'branch': _MQ_BRANCH}) + if not data: + return + mq = (data.get('repository') or {}).get('mergeQueue') + if mq is None: + return + entries = mq.get('entries', {}) + depth = entries.get('totalCount', 0) + nodes = entries.get('nodes', []) + entries_json = json.dumps([{ + 'position': n.get('position'), + 'state': n.get('state'), + 'pr': (n.get('pullRequest') or {}).get('number'), + 'author': ((n.get('pullRequest') or {}).get('author') or {}).get('login'), + } for n in nodes]) if nodes else None + + now = datetime.now(timezone.utc).isoformat() + db.execute('INSERT INTO merge_queue_snapshots (timestamp, depth, entries_json) VALUES (?, ?, ?)', + (now, depth, 
entries_json)) + + +def _aggregate_depth_stats(): + """Aggregate merge_queue_snapshots into avg/peak depth on merge_queue_daily.""" + import db + conn = db.get_db() + rows = conn.execute(''' + SELECT substr(timestamp, 1, 10) as date, + ROUND(AVG(depth), 1) as avg_depth, + MAX(depth) as peak_depth + FROM merge_queue_snapshots + GROUP BY substr(timestamp, 1, 10) + ''').fetchall() + for row in rows: + conn.execute(''' + UPDATE merge_queue_daily SET avg_depth = ?, peak_depth = ? + WHERE date = ? + ''', (row['avg_depth'], row['peak_depth'], row['date'])) + conn.commit() + + +def start_merge_queue_poller(): + """Start background thread that polls merge queue depth every 5 minutes.""" + def loop(): + while True: + try: + poll_merge_queue_depth() + except Exception as e: + print(f"[rk_github] queue depth poll error: {e}") + time.sleep(300) # 5 minutes + t = threading.Thread(target=loop, daemon=True, name='mq-depth-poller') + t.start() + return t + + _mq_backfill_lock = threading.Lock() _mq_last_refresh = 0 _MQ_REFRESH_TTL = 3600 # refresh today's data every hour @@ -629,6 +833,7 @@ def ensure_merge_queue_data(): try: _backfill_merge_queue() refresh_merge_queue_today() + _aggregate_depth_stats() _mq_last_refresh = now finally: _mq_backfill_lock.release() @@ -646,7 +851,7 @@ def get_merge_queue_stats(date_from: str, date_to: str) -> dict: threading.Thread(target=ensure_merge_queue_data, daemon=True).start() rows = db.query( - 'SELECT date, total, success, failure, cancelled, in_progress ' + 'SELECT date, total, success, failure, cancelled, in_progress, avg_depth, peak_depth ' 'FROM merge_queue_daily WHERE date >= ? AND date <= ? 
ORDER BY date', (date_from, date_to)) @@ -664,3 +869,144 @@ def get_merge_queue_stats(date_from: str, date_to: str) -> dict: 'days': len([r for r in rows if r['total'] > 0]), }, } + + +import re as _re + +_COMMIT_TYPE_RE = _re.compile( + r'^(fix|feat|chore|refactor|docs|style|test|perf|ci|build|revert)(\([^)]+\))?(!)?: ' +) +_PR_NUM_RE = _re.compile(r'\(#(\d+)\)\s*$') +_MERGE_TRAIN_RE = _re.compile(r'merge-train/([^\s]+)') + + +def _parse_commit(raw: dict) -> dict: + """Normalise a GitHub REST commit object into a compact dict.""" + sha = raw.get('sha', '') + msg = raw.get('commit', {}).get('message', '') or '' + subject = msg.split('\n')[0] + c_author = raw.get('commit', {}).get('author', {}) or {} + # Prefer committer login if available (shows GitHub username not git display name) + login = (raw.get('author') or {}).get('login', '') + author = login or c_author.get('name', '') + date = c_author.get('date', '') # ISO-8601 + + # Parse conventional commit type + scope + m = _COMMIT_TYPE_RE.match(subject) + commit_type = m.group(1) if m else 'other' + breaking = bool(m and m.group(3)) + scope_raw = m.group(2) if m else '' + scope = scope_raw[1:-1] if scope_raw else '' # strip parens + + # Extract PR number from "(#NNNNN)" at end of subject + pr_m = _PR_NUM_RE.search(subject) + pr_number = int(pr_m.group(1)) if pr_m else None + clean_subject = _PR_NUM_RE.sub('', subject).rstrip() + + # Detect merge-train commits + mt_m = _MERGE_TRAIN_RE.search(subject) + merge_train = mt_m.group(1) if mt_m else None + is_merge = len(raw.get('parents', [])) > 1 + + return { + 'sha': sha, + 'subject': clean_subject, + 'type': commit_type, + 'scope': scope, + 'breaking': breaking, + 'pr': pr_number, + 'author': author, + 'date': date, + 'merge_train': merge_train, + 'is_merge': is_merge, + 'dirs': None, # populated by caller if Redis cache available + } + + +_pr_dirs_cache: dict = {} # {pr_number: [dirs]} in-memory cache (long TTL) +_pr_dirs_lock = threading.Lock() +_pr_dirs_fetch_queue: 
set = set() +_pr_dirs_worker_started = False + + +def _compute_pr_dirs(pr_number: int) -> list[str]: + """Fetch changed files for a PR and return 2-level path buckets.""" + data = _github_get(f'repos/{REPO}/pulls/{pr_number}/files?per_page=100') + if not data or not isinstance(data, list): + return [] + dirs: set[str] = set() + for f in data: + filename = f.get('filename', '') + if not filename: + continue + parts = filename.split('/') + top = parts[0] + dirs.add(top) + # For yarn-project, include 2nd level for sub-project drill-down + if top == 'yarn-project' and len(parts) > 1: + dirs.add(f'yarn-project/{parts[1]}') + return sorted(dirs) + + +def _pr_dirs_worker(): + """Background worker: drains the fetch queue, caches results.""" + while True: + time.sleep(2) + with _pr_dirs_lock: + if not _pr_dirs_fetch_queue: + continue + pr_number = _pr_dirs_fetch_queue.pop() + try: + dirs = _compute_pr_dirs(pr_number) + with _pr_dirs_lock: + _pr_dirs_cache[pr_number] = dirs + except Exception as e: + print(f'[github_data] pr_dirs fetch error for #{pr_number}: {e}') + + +def start_pr_dirs_worker(): + """Start the background PR dirs fetcher (call once at startup).""" + global _pr_dirs_worker_started + if _pr_dirs_worker_started: + return + _pr_dirs_worker_started = True + t = threading.Thread(target=_pr_dirs_worker, daemon=True, name='pr-dirs-fetcher') + t.start() + + +def get_pr_dirs(pr_number: int) -> list[str] | None: + """Return cached dirs for a PR, or None if not yet fetched (queues async fetch).""" + with _pr_dirs_lock: + if pr_number in _pr_dirs_cache: + return _pr_dirs_cache[pr_number] + _pr_dirs_fetch_queue.add(pr_number) + return None + + +def get_recent_commits(branch: str = 'next', page: int = 1, per_page: int = 50) -> list[dict]: + """Fetch a page of commits from GitHub API with 5-minute in-memory cache.""" + per_page = min(per_page, 100) + cache_key = f'{branch}:{page}:{per_page}' + now = time.time() + with _commits_lock: + cached = _commits_cache.get(cache_key) 
+ if cached and now - cached['ts'] < 300: + return cached['data'] + + data = _github_get( + f'repos/{REPO}/commits?sha={branch}&per_page={per_page}&page={page}' + ) + if not data or not isinstance(data, list): + result = [] + else: + result = [_parse_commit(raw) for raw in data] + + with _commits_lock: + _commits_cache[cache_key] = {'data': result, 'ts': now} + + # Enrich with cached dirs (non-blocking) + for c in result: + if c.get('pr'): + c['dirs'] = get_pr_dirs(c['pr']) + + return result diff --git a/ci3/ci-metrics/metrics.py b/ci3/ci-metrics/metrics.py index 5c0d1610e06b..8582ef0ad90c 100644 --- a/ci3/ci-metrics/metrics.py +++ b/ci3/ci-metrics/metrics.py @@ -1,9 +1,11 @@ -"""CI metrics: direct Redis reads + test event listener. +"""CI metrics: SQLite source of truth + Redis ingestion + test event listener. -Reads CI run data directly from Redis sorted sets on each request. +CI runs are ingested from Redis (written by log_ci_run on CI instances) and +stored in SQLite. All reads go through SQLite so enriched fields (instance_type +from CloudTrail, recalculated costs) are preserved. Test events stored in SQLite since they only arrive via pub/sub. -CI runs periodically synced from Redis to SQLite for flake correlation. """ +import hashlib import json import re import time @@ -21,6 +23,18 @@ _URL_PR_RE = re.compile(r'/pull/(\d+)') +def hash_str_orig(s: str) -> str: + """Replicate bash's `echo "$s" | git hash-object --stdin | cut -c1-16`. + + git hash-object computes SHA-1 of "blob \\0" where content + includes the trailing newline from echo. Length is byte length, not + Unicode code points. 
+ """ + content = (s + "\n").encode('utf-8') + blob = f"blob {len(content)}\0".encode('utf-8') + content + return hashlib.sha1(blob).hexdigest()[:16] + + def compute_run_cost(data: dict) -> float | None: complete = data.get('complete') ts = data.get('timestamp') @@ -31,7 +45,9 @@ def compute_run_cost(data: dict) -> float | None: is_spot = bool(data.get('spot')) rate = ec2_pricing.get_instance_rate(instance_type, is_spot) if not rate: - vcpus = data.get('instance_vcpus', 192) + vcpus = data.get('instance_vcpus') + if not vcpus: + return None # unknown instance type and no vCPU data rate = vcpus * ec2_pricing.get_fallback_vcpu_rate(is_spot) return round(hours * rate, 4) @@ -116,31 +132,37 @@ def _get_ci_runs_from_sqlite(date_from_ms=None, date_to_ms=None): return runs -def get_ci_runs(redis_conn, date_from_ms=None, date_to_ms=None): - """Read CI runs from Redis, backfilled with SQLite for data that Redis has flushed.""" - redis_runs = _get_ci_runs_from_redis(redis_conn, date_from_ms, date_to_ms) - - # Find the earliest timestamp in Redis to know what SQLite needs to fill - redis_keys = set() - redis_min_ts = float('inf') - for run in redis_runs: - ts = run.get('timestamp', 0) - redis_keys.add((run.get('dashboard', ''), ts, run.get('name', ''))) - if ts < redis_min_ts: - redis_min_ts = ts - - # If requesting data older than what Redis has, backfill from SQLite - sqlite_runs = [] - need_sqlite = (date_from_ms is not None and date_from_ms < redis_min_ts) or not redis_runs - if need_sqlite: - sqlite_to = int(redis_min_ts) if redis_runs else date_to_ms - sqlite_runs = _get_ci_runs_from_sqlite(date_from_ms, sqlite_to) - # Deduplicate: only include SQLite runs not already in Redis - sqlite_runs = [r for r in sqlite_runs - if (r.get('dashboard', ''), r.get('timestamp', 0), r.get('name', '')) - not in redis_keys] - - return sqlite_runs + redis_runs +def get_ci_runs(date_from_ms=None, date_to_ms=None): + """Read CI runs from SQLite (the source of truth). 
+ + Redis is only an ingestion pipe — sync_ci_runs_to_sqlite() copies data in. + All reads go through SQLite so enriched fields (instance_type from CloudTrail, + recalculated costs) are always reflected. + """ + return _get_ci_runs_from_sqlite(date_from_ms, date_to_ms) + + +def get_ci_runs_for_pr(pr_number: int, limit: int = 100) -> list: + """Return CI runs for a specific PR, most recent first.""" + rows = db.query( + 'SELECT * FROM ci_runs WHERE pr_number = ? ORDER BY timestamp_ms DESC LIMIT ?', + (pr_number, limit) + ) + return [{ + 'dashboard': row['dashboard'], + 'name': row['name'], + 'timestamp': row['timestamp_ms'], + 'complete': row['complete_ms'], + 'status': row['status'], + 'author': row['author'], + 'pr_number': row['pr_number'], + 'instance_type': row['instance_type'], + 'instance_vcpus': row.get('instance_vcpus'), + 'spot': bool(row['spot']), + 'cost_usd': row['cost_usd'], + 'job_id': row.get('job_id', ''), + 'arch': row.get('arch', ''), + } for row in rows] def _ts_to_date(ts_ms): @@ -149,6 +171,32 @@ def _ts_to_date(ts_ms): # ---- Test event handling (only thing needing SQLite) ---- +def _upsert_daily_stats(status: str, test_cmd: str, dashboard: str, timestamp: str, duration_secs=None): + """Increment the daily counter for a test status.""" + date = timestamp[:10] # 'YYYY-MM-DD' + col = status if status in ('passed', 'failed', 'flaked') else None + if not col: + return + d = duration_secs if duration_secs and duration_secs > 0 else None + if d: + db.execute(f''' + INSERT INTO test_daily_stats (date, test_cmd, dashboard, {col}, total_secs, count_timed, min_secs, max_secs) + VALUES (?, ?, ?, 1, ?, 1, ?, ?) 
+ ON CONFLICT(date, test_cmd, dashboard) DO UPDATE SET + {col} = {col} + 1, + total_secs = total_secs + excluded.total_secs, + count_timed = count_timed + 1, + min_secs = CASE WHEN min_secs IS NULL OR excluded.min_secs < min_secs THEN excluded.min_secs ELSE min_secs END, + max_secs = CASE WHEN max_secs IS NULL OR excluded.max_secs > max_secs THEN excluded.max_secs ELSE max_secs END + ''', (date, test_cmd, dashboard, d, d, d)) + else: + db.execute(f''' + INSERT INTO test_daily_stats (date, test_cmd, dashboard, {col}) + VALUES (?, ?, ?, 1) + ON CONFLICT(date, test_cmd, dashboard) DO UPDATE SET {col} = {col} + 1 + ''', (date, test_cmd, dashboard)) + + def _handle_test_event(channel: str, data: dict): status = channel.split(':')[-1] # Handle field name mismatches: run_test_cmd publishes 'cmd' for failed/flaked @@ -157,12 +205,19 @@ def _handle_test_event(channel: str, data: dict): log_url = data.get('log_url') or data.get('log_key') if log_url and not log_url.startswith('http'): log_url = f'http://ci.aztec-labs.com/{log_url}' + dashboard = data.get('dashboard', '') + timestamp = data.get('timestamp', datetime.now(timezone.utc).isoformat()) + test_hash = hash_str_orig(test_cmd) if test_cmd else None + + # Always update daily stats (lightweight aggregate) + _upsert_daily_stats(status, test_cmd, dashboard, timestamp, data.get('duration_secs')) + db.execute(''' INSERT INTO test_events (status, test_cmd, log_url, ref_name, commit_hash, commit_author, commit_msg, exit_code, duration_secs, is_scenario, owners, - flake_group_id, dashboard, timestamp) - VALUES (?, ?, ?, ?, ?, ?, ?, ?, ?, ?, ?, ?, ?, ?) + flake_group_id, dashboard, timestamp, test_hash) + VALUES (?, ?, ?, ?, ?, ?, ?, ?, ?, ?, ?, ?, ?, ?, ?) 
''', ( status, test_cmd, @@ -176,14 +231,15 @@ def _handle_test_event(channel: str, data: dict): 1 if data.get('is_scenario_test') else 0, json.dumps(data['owners']) if data.get('owners') else None, data.get('flake_group_id'), - data.get('dashboard', ''), - data.get('timestamp', datetime.now(timezone.utc).isoformat()), + dashboard, + timestamp, + test_hash, )) def start_test_listener(redis_conn): """Subscribe to test event channels only. Reconnects on failure.""" - channels = [b'ci:test:started', b'ci:test:passed', b'ci:test:failed', b'ci:test:flaked'] + channels = [b'ci:test:passed', b'ci:test:failed', b'ci:test:flaked'] def listener(): backoff = 1 @@ -215,6 +271,163 @@ def listener(): return t +# ---- CI Phase timing listener ---- + +def _handle_phase_event(data: dict): + """Insert a CI phase timing event into SQLite.""" + db.execute(''' + INSERT INTO ci_phases + (phase, duration_secs, exit_code, run_id, job_id, dashboard, + ref_name, commit_hash, timestamp) + VALUES (?, ?, ?, ?, ?, ?, ?, ?, ?) 
+ ''', ( + data.get('phase', ''), + data.get('duration_secs', 0), + data.get('exit_code'), + data.get('run_id', ''), + data.get('job_id', ''), + data.get('dashboard', ''), + data.get('ref_name', ''), + data.get('commit_hash', ''), + datetime.now(timezone.utc).isoformat(), + )) + + +def start_phase_listener(redis_conn): + """Subscribe to ci:phase:complete and store in ci_phases table.""" + def listener(): + backoff = 1 + while True: + try: + pubsub = redis_conn.pubsub() + pubsub.subscribe(b'ci:phase:complete') + backoff = 1 + for message in pubsub.listen(): + if message['type'] != 'message': + continue + try: + payload = message['data'] + if isinstance(payload, bytes): + payload = payload.decode() + _handle_phase_event(json.loads(payload)) + except Exception as e: + print(f"[rk_metrics] Error parsing phase event: {e}") + except Exception as e: + print(f"[rk_metrics] Phase listener error (reconnecting in {backoff}s): {e}") + time.sleep(backoff) + backoff = min(backoff * 2, 60) + + t = threading.Thread(target=listener, daemon=True, name='phase-listener') + t.start() + return t + + +def get_phases(date_from: str, date_to: str, dashboard: str = '', + run_id: str = '') -> dict: + """Query CI phase timing data for the API.""" + conditions = ['timestamp >= ?', 'timestamp < ?'] + params: list = [date_from, date_to + 'T23:59:59'] + if dashboard: + conditions.append('dashboard = ?') + params.append(dashboard) + if run_id: + conditions.append('run_id = ?') + params.append(run_id) + where = 'WHERE ' + ' AND '.join(conditions) + + # Aggregate by phase name + by_phase = db.query(f''' + SELECT phase, + COUNT(*) as count, + ROUND(AVG(duration_secs), 1) as avg_secs, + ROUND(MIN(duration_secs), 1) as min_secs, + ROUND(MAX(duration_secs), 1) as max_secs, + ROUND(SUM(duration_secs), 0) as total_secs + FROM ci_phases {where} + GROUP BY phase + ORDER BY total_secs DESC + ''', params) + + # Aggregate by date: avg duration per phase per day + date_rows = db.query(f''' + SELECT 
substr(timestamp, 1, 10) as date, phase, + ROUND(AVG(duration_secs), 1) as avg_secs, + COUNT(*) as count + FROM ci_phases {where} + GROUP BY date, phase + ORDER BY date + ''', params) + by_date: dict[str, dict] = {} + for row in date_rows: + d = row['date'] + if d not in by_date: + by_date[d] = {'date': d, 'phases': {}} + by_date[d]['phases'][row['phase']] = row['avg_secs'] + + # Recent individual runs with their phases + recent_runs = db.query(f''' + SELECT run_id, job_id, dashboard, ref_name, commit_hash, + phase, duration_secs, exit_code, timestamp + FROM ci_phases {where} + ORDER BY timestamp DESC + LIMIT 500 + ''', params) + runs_map: dict[str, dict] = {} + for row in recent_runs: + rid = row['run_id'] or row['timestamp'] + if rid not in runs_map: + runs_map[rid] = { + 'run_id': row['run_id'], 'job_id': row['job_id'], + 'dashboard': row['dashboard'], 'ref_name': row['ref_name'], + 'commit_hash': row['commit_hash'], 'phases': [], + } + runs_map[rid]['phases'].append({ + 'phase': row['phase'], + 'duration_secs': row['duration_secs'], + 'exit_code': row['exit_code'], + }) + + # Aggregate by dashboard: P95 duration per phase per pipeline. + # Step 1: sum durations within each (dashboard, phase, run_id) — multiple machines + # running the same phase in one run are summed, not counted separately. + # Step 2: compute P95 across run_ids in Python. 
+ per_run_rows = db.query(f''' + SELECT dashboard, phase, run_id, + ROUND(SUM(duration_secs), 3) as run_total + FROM ci_phases {where} + AND dashboard != '' + AND run_id != '' + GROUP BY dashboard, phase, run_id + ''', params) + + import math + from collections import defaultdict + run_totals: dict[tuple, list] = defaultdict(list) + for row in per_run_rows: + run_totals[(row['dashboard'], row['phase'])].append(row['run_total']) + + by_dashboard: dict[str, dict] = {} + for (dash, phase), totals in sorted(run_totals.items()): + totals_s = sorted(totals) + n = len(totals_s) + p95_idx = min(math.ceil(0.95 * n) - 1, n - 1) + p95 = round(totals_s[p95_idx], 1) + if dash not in by_dashboard: + by_dashboard[dash] = {'dashboard': dash, 'phases': {}, 'total_secs': 0, 'count': 0} + by_dashboard[dash]['phases'][phase] = p95 + by_dashboard[dash]['total_secs'] += sum(totals_s) + by_dashboard[dash]['count'] = max(by_dashboard[dash]['count'], n) + for d in by_dashboard.values(): + d['total_secs'] = round(d['total_secs'], 1) + + return { + 'by_phase': by_phase, + 'by_date': list(by_date.values()), + 'by_dashboard': list(by_dashboard.values()), + 'recent_runs': list(runs_map.values())[:50], + } + + # ---- Sync failed_tests_{section} lists from Redis into SQLite ---- _ANSI_STRIP = re.compile(r'\x1b\[[^m]*m|\x1b\]8;;[^\x07]*\x07') @@ -326,18 +539,18 @@ def sync_failed_tests_to_sqlite(redis_conn): _failed_tests_sync_ts = now conn = db.get_db() - # Track existing entries to avoid duplicates: log_url for entries that have one, - # (test_cmd, timestamp, dashboard) composite key for entries without log_url + # Track existing failed/flaked entries to avoid duplicates (this sync only + # processes failed/flaked from Redis lists, so no need to scan passed rows). 
existing_urls = {row['log_url'] for row in conn.execute( - "SELECT DISTINCT log_url FROM test_events WHERE log_url IS NOT NULL" + "SELECT DISTINCT log_url FROM test_events WHERE log_url IS NOT NULL AND status IN ('failed', 'flaked')" ).fetchall()} existing_keys = {(row['test_cmd'], row['timestamp'], row['dashboard']) for row in conn.execute( - "SELECT test_cmd, timestamp, dashboard FROM test_events WHERE log_url IS NULL" + "SELECT test_cmd, timestamp, dashboard FROM test_events WHERE log_url IS NULL AND status IN ('failed', 'flaked')" ).fetchall()} total = 0 - for section in SECTIONS: - key = f'failed_tests_{section}' + for section in SECTIONS + ['']: + key = f'failed_tests_{section}' if section else 'failed_tests' try: entries = redis_conn.lrange(key, 0, -1) except Exception as e: @@ -363,21 +576,27 @@ def sync_failed_tests_to_sqlite(redis_conn): INSERT INTO test_events (status, test_cmd, log_url, ref_name, commit_author, commit_msg, duration_secs, flake_group_id, dashboard, - timestamp) - VALUES (?, ?, ?, ?, ?, ?, ?, ?, ?, ?) + timestamp, test_hash) + VALUES (?, ?, ?, ?, ?, ?, ?, ?, ?, ?, ?) 
''', ( parsed['status'], parsed['test_cmd'], parsed['log_url'], parsed['ref_name'], parsed['commit_author'], parsed['commit_msg'], parsed['duration_secs'], parsed['flake_group_id'], parsed['dashboard'], parsed['timestamp'], + hash_str_orig(parsed['test_cmd']) if parsed['test_cmd'] else None, )) + _upsert_daily_stats( + parsed['status'], parsed['test_cmd'], + parsed['dashboard'], parsed['timestamp']) total += 1 except Exception as e: print(f"[rk_metrics] Error inserting test event: {e}") conn.commit() if total: print(f"[rk_metrics] Synced {total} test events from Redis lists") + db.cache_invalidate_prefix('flakes:') + db.cache_invalidate_prefix('timings:') # ---- Seed loading ---- @@ -437,15 +656,16 @@ def _load_seed_data(): events = data['test_events'] for ev in events: try: + te_cmd = ev.get('test_cmd', '') conn.execute(''' INSERT OR IGNORE INTO test_events (status, test_cmd, log_url, ref_name, commit_hash, commit_author, commit_msg, exit_code, duration_secs, is_scenario, owners, - flake_group_id, dashboard, timestamp) - VALUES (?, ?, ?, ?, ?, ?, ?, ?, ?, ?, ?, ?, ?, ?) + flake_group_id, dashboard, timestamp, test_hash) + VALUES (?, ?, ?, ?, ?, ?, ?, ?, ?, ?, ?, ?, ?, ?, ?) ''', ( ev.get('status', ''), - ev.get('test_cmd', ''), + te_cmd, ev.get('log_url'), ev.get('ref_name', ''), ev.get('commit_hash'), @@ -458,6 +678,7 @@ def _load_seed_data(): ev.get('flake_group_id'), ev.get('dashboard', ''), ev.get('timestamp', ''), + hash_str_orig(te_cmd) if te_cmd else None, )) except Exception: continue @@ -472,14 +693,19 @@ def _load_seed_data(): def sync_ci_runs_to_sqlite(redis_conn): - """Sync all CI runs from Redis into SQLite for persistence.""" + """Ingest CI runs from Redis into SQLite. + + Redis is the ingestion pipe (log_ci_run writes there from CI instances). + SQLite is the source of truth. Fields enriched post-ingestion (instance_type, + cost_usd from CloudTrail resolution) are preserved — only overwritten if + Redis has a non-empty value. 
+ """ global _ci_sync_ts now = time.time() if now - _ci_sync_ts < _CI_SYNC_TTL: return _ci_sync_ts = now - # Sync everything Redis has (not just 30 days) runs = _get_ci_runs_from_redis(redis_conn) now_iso = datetime.now(timezone.utc).isoformat() @@ -488,11 +714,32 @@ def sync_ci_runs_to_sqlite(redis_conn): for run in runs: try: conn.execute(''' - INSERT OR REPLACE INTO ci_runs + INSERT INTO ci_runs (dashboard, name, timestamp_ms, complete_ms, status, author, pr_number, instance_type, instance_vcpus, spot, cost_usd, job_id, arch, synced_at) VALUES (?, ?, ?, ?, ?, ?, ?, ?, ?, ?, ?, ?, ?, ?) + ON CONFLICT(dashboard, timestamp_ms, name) DO UPDATE SET + complete_ms = excluded.complete_ms, + status = excluded.status, + author = excluded.author, + pr_number = excluded.pr_number, + instance_vcpus = excluded.instance_vcpus, + spot = excluded.spot, + job_id = excluded.job_id, + arch = excluded.arch, + synced_at = excluded.synced_at, + -- Preserve enriched fields: only overwrite if Redis has real data + instance_type = CASE + WHEN excluded.instance_type IS NOT NULL AND excluded.instance_type != '' + THEN excluded.instance_type + ELSE ci_runs.instance_type + END, + cost_usd = CASE + WHEN excluded.instance_type IS NOT NULL AND excluded.instance_type != '' + THEN excluded.cost_usd + ELSE ci_runs.cost_usd + END ''', ( run.get('dashboard', ''), run.get('name', ''), @@ -514,17 +761,372 @@ def sync_ci_runs_to_sqlite(redis_conn): print(f"[rk_metrics] Error syncing run: {e}") conn.commit() print(f"[rk_metrics] Synced {count} CI runs to SQLite") + db.cache_invalidate_prefix('perf:') + + +def _backfill_daily_stats(): + """Populate test_daily_stats from existing test_events rows. + + Uses INSERT OR IGNORE to fill gaps without overwriting data from the + real-time listener. Safe to call repeatedly — skips dates/tests that + already have rows. 
+ """ + conn = db.get_db() + cur = conn.execute(''' + INSERT OR IGNORE INTO test_daily_stats (date, test_cmd, dashboard, passed, failed, flaked) + SELECT substr(timestamp, 1, 10) as date, test_cmd, dashboard, + SUM(CASE WHEN status = 'passed' THEN 1 ELSE 0 END), + SUM(CASE WHEN status = 'failed' THEN 1 ELSE 0 END), + SUM(CASE WHEN status = 'flaked' THEN 1 ELSE 0 END) + FROM test_events + GROUP BY substr(timestamp, 1, 10), test_cmd, dashboard + ''') + conn.commit() + if cur.rowcount and cur.rowcount > 0: + print(f"[rk_metrics] Backfilled {cur.rowcount} daily stat rows from test_events") + + +def _materialize_ci_run_daily_stats(): + """Recompute ci_run_daily_stats from ci_runs. + + Replaces all rows — safe to call repeatedly. Stores pre-aggregated + duration percentiles so the API doesn't need to scan raw rows. + """ + conn = db.get_db() + # Fetch raw daily durations grouped by date + dashboard + rows = conn.execute(''' + SELECT + strftime('%Y-%m-%d', timestamp_ms / 1000, 'unixepoch') AS date, + dashboard, + (complete_ms - timestamp_ms) / 60000.0 AS dur_mins + FROM ci_runs + WHERE status IN ('PASSED', 'FAILED') + AND complete_ms IS NOT NULL AND complete_ms > timestamp_ms + ''').fetchall() + + # Group durations: {(date, dashboard): [dur_mins, ...]} + groups = {} + for r in rows: + key = (r['date'], r['dashboard']) + groups.setdefault(key, {'passed': 0, 'failed': 0, 'durs': []}) + groups[key]['durs'].append(r['dur_mins']) + + # Also count pass/fail per group + status_rows = conn.execute(''' + SELECT + strftime('%Y-%m-%d', timestamp_ms / 1000, 'unixepoch') AS date, + dashboard, status, COUNT(*) as cnt + FROM ci_runs + WHERE status IN ('PASSED', 'FAILED') + GROUP BY date, dashboard, status + ''').fetchall() + for r in status_rows: + key = (r['date'], r['dashboard']) + if key not in groups: + groups[key] = {'passed': 0, 'failed': 0, 'durs': []} + if r['status'] == 'PASSED': + groups[key]['passed'] = r['cnt'] + else: + groups[key]['failed'] = r['cnt'] + + 
conn.execute('DELETE FROM ci_run_daily_stats') + inserted = 0 + for (date, dashboard), g in groups.items(): + durs = sorted(g['durs']) + n = len(durs) + conn.execute(''' + INSERT INTO ci_run_daily_stats + (date, dashboard, run_count, passed, failed, + sum_duration, min_duration, max_duration, p50_duration, p95_duration) + VALUES (?, ?, ?, ?, ?, ?, ?, ?, ?, ?) + ''', ( + date, dashboard, g['passed'] + g['failed'], + g['passed'], g['failed'], + round(sum(durs), 2) if durs else 0, + round(min(durs), 1) if durs else None, + round(max(durs), 1) if durs else None, + round(durs[n // 2], 1) if durs else None, + round(durs[int(n * 0.95)], 1) if durs else None, + )) + inserted += 1 + conn.commit() + print(f"[rk_metrics] Materialized {inserted} ci_run_daily_stats rows") + + +def _backfill_test_hashes(): + """Populate test_hash for existing test_events rows that are missing it.""" + conn = db.get_db() + rows = conn.execute( + "SELECT DISTINCT test_cmd FROM test_events WHERE test_hash IS NULL AND test_cmd != ''" + ).fetchall() + if not rows: + return + for row in rows: + cmd = row['test_cmd'] + h = hash_str_orig(cmd) + conn.execute( + "UPDATE test_events SET test_hash = ? WHERE test_cmd = ? 
AND test_hash IS NULL", + (h, cmd)) + conn.commit() + print(f"[rk_metrics] Backfilled test_hash for {len(rows)} distinct test commands") + + +# ---- CloudTrail instance type resolution ---- + +_ct_resolve_ts = 0 +_CT_RESOLVE_TTL = 6 * 3600 # 6 hours + + +def _fetch_cloudtrail_daily(ct, event_name, start_time, end_time, max_per_day=10000): + """Fetch CloudTrail events in daily chunks to avoid the 5000-event global limit.""" + events = [] + day = start_time.replace(hour=0, minute=0, second=0, microsecond=0) + while day < end_time: + day_end = min(day + timedelta(days=1), end_time) + kwargs = { + 'LookupAttributes': [ + {'AttributeKey': 'EventName', 'AttributeValue': event_name}, + ], + 'StartTime': day, + 'EndTime': day_end, + 'MaxResults': 50, + } + while True: + resp = ct.lookup_events(**kwargs) + events.extend(resp.get('Events', [])) + token = resp.get('NextToken') + if not token or len(events) >= max_per_day: + break + kwargs['NextToken'] = token + day += timedelta(days=1) + return events + + +# Name tag format: _[_] +_NAME_TAG_RE = re.compile(r'^(.+)_(amd64|arm64)(?:_.*)?$') + + +def _normalize_branch_name(name): + """Normalize a branch name the same way bootstrap_ec2 does for the EC2 Name tag.""" + m = re.match(r'^gh-readonly-queue/[^/]+/pr-(\d+)', name) + if m: + return f'pr-{m.group(1)}' + name = re.sub(r'\s*\(queue\)$', '', name) + return re.sub(r'[^a-zA-Z0-9-]', '_', name[:50]) + + +def resolve_unknown_instance_types(): + """Query CloudTrail for RunInstances + CreateTags events to resolve unknown instance types. + + Strategy: + 1. Fetch RunInstances events (daily chunks) → instance_id → instance_type + launch_time + 2. Fetch CreateTags events (daily chunks) → instance_id → {Name, Group, Dashboard, ...} + Tags are accumulated across multiple events then filtered to Group=build-instance. + 3. Join by instance_id, then match to ci_runs by normalized branch name + arch + time window. 
+ """ + global _ct_resolve_ts + now = time.time() + if now - _ct_resolve_ts < _CT_RESOLVE_TTL: + return + _ct_resolve_ts = now + + conn = db.get_db() + unknown_runs = conn.execute(''' + SELECT dashboard, name, timestamp_ms, complete_ms, instance_vcpus, spot, + cost_usd, arch, pr_number + FROM ci_runs + WHERE (instance_type IS NULL OR instance_type = '' OR instance_type = 'unknown') + AND timestamp_ms > ? + ''', (int((time.time() - 90 * 86400) * 1000),)).fetchall() + + if not unknown_runs: + return + + try: + import boto3 + except ImportError: + return + + try: + ct = boto3.client('cloudtrail', region_name='us-east-2') + start_time = datetime.fromtimestamp( + min(r['timestamp_ms'] for r in unknown_runs) / 1000 - 300, tz=timezone.utc) + end_time = datetime.now(timezone.utc) + + # Step 1: Fetch RunInstances events in daily chunks → instance_id → type + launch time + run_events = _fetch_cloudtrail_daily(ct, 'RunInstances', start_time, end_time) + instance_types = {} + instance_launch_times = {} + for event in run_events: + try: + detail = json.loads(event.get('CloudTrailEvent', '{}')) + itype = detail.get('requestParameters', {}).get('instanceType', '') + items = (detail.get('responseElements') or {}).get('instancesSet', {}).get('items', []) + for item in items: + iid = item.get('instanceId', '') + item_type = item.get('instanceType', '') or itype + if iid and item_type: + instance_types[iid] = item_type + instance_launch_times[iid] = int(event['EventTime'].timestamp() * 1000) + except Exception: + continue + + if not instance_types: + print("[rk_metrics] CloudTrail: no RunInstances events found") + return + + # Step 2: Fetch CreateTags events in daily chunks. + # Accumulate ALL tags per instance first, then filter to build instances. + # This handles the case where Name, Group, and Dashboard are set in separate + # create-tags API calls (aws_request_instance_type lines 97, 126, 127). 
+ tag_events = _fetch_cloudtrail_daily(ct, 'CreateTags', start_time, end_time) + all_instance_tags = {} + for event in tag_events: + try: + detail = json.loads(event.get('CloudTrailEvent', '{}')) + req = detail.get('requestParameters', {}) + resources = req.get('resourcesSet', {}).get('items', []) + tags = req.get('tagSet', {}).get('items', []) + tag_dict = {t.get('key', ''): t.get('value', '') for t in tags} + for res in resources: + rid = res.get('resourceId', '') + if rid.startswith('i-'): + if rid not in all_instance_tags: + all_instance_tags[rid] = {} + all_instance_tags[rid].update(tag_dict) + except Exception: + continue + + # Filter to build instances + instance_tags = { + iid: tags for iid, tags in all_instance_tags.items() + if tags.get('Group') == 'build-instance' + } + + # Step 3: Join RunInstances + CreateTags by instance_id + instances = [] + for iid, itype in instance_types.items(): + tags = instance_tags.get(iid, {}) + if not tags.get('Name'): + continue + instances.append({ + 'instance_type': itype, + 'launch_ms': instance_launch_times.get(iid, 0), + 'dashboard': tags.get('Dashboard', ''), + 'name_tag': tags.get('Name', ''), + }) + + # Build index: normalized branch name → [instances] + tag_index = {} + for inst in instances: + m = _NAME_TAG_RE.match(inst['name_tag']) + if m: + tag_index.setdefault(m.group(1), []).append(inst) + else: + tag_index.setdefault(inst['name_tag'], []).append(inst) + + # Step 4: Match unknown runs to instances + updated = 0 + for run in unknown_runs: + run_name = run['name'] + run_arch = run['arch'] or '' + run_ts = run['timestamp_ms'] + run_dashboard = run['dashboard'] + + expected_name = _normalize_branch_name(run_name) + candidates = tag_index.get(expected_name, []) + + best = None + for inst in candidates: + # Verify arch matches + if run_arch: + m = _NAME_TAG_RE.match(inst['name_tag']) + if m and m.group(2) != run_arch: + continue + + # Verify dashboard matches (if tag present) + if inst['dashboard'] and 
inst['dashboard'] != run_dashboard: + continue + + # CI run starts after instance launch; allow up to 90 min (instance lifetime) + delta = run_ts - inst['launch_ms'] + if delta < -60_000 or delta > 5400_000: + continue + + # Prefer most recently launched instance before the run + if delta >= 0 and (best is None or inst['launch_ms'] > best['launch_ms']): + best = inst + elif best is None and abs(delta) < 60_000: + best = inst + + if best: + itype = best['instance_type'] + is_spot = bool(run['spot']) + rate = ec2_pricing.get_instance_rate(itype, is_spot) + new_cost = run['cost_usd'] + if rate and run['complete_ms'] and run['timestamp_ms']: + hours = (run['complete_ms'] - run['timestamp_ms']) / 3_600_000 + new_cost = round(hours * rate, 4) + conn.execute(''' + UPDATE ci_runs SET instance_type = ?, cost_usd = ? + WHERE dashboard = ? AND timestamp_ms = ? AND name = ? + ''', (itype, new_cost, run['dashboard'], run['timestamp_ms'], run['name'])) + updated += 1 + + conn.commit() + if updated: + print(f"[rk_metrics] CloudTrail: resolved {updated}/{len(unknown_runs)} unknown instance types") + else: + print(f"[rk_metrics] CloudTrail: {len(instances)} instances, " + f"0/{len(unknown_runs)} matched") + except Exception as e: + print(f"[rk_metrics] CloudTrail resolution failed: {e}") + + +def recalculate_all_costs(): + """Recalculate cost_usd for all ci_runs based on current instance_type and pricing.""" + conn = db.get_db() + runs = conn.execute(''' + SELECT dashboard, name, timestamp_ms, complete_ms, instance_type, + instance_vcpus, spot, cost_usd + FROM ci_runs + WHERE complete_ms IS NOT NULL AND complete_ms > 0 + ''').fetchall() + updated = 0 + for run in runs: + cost = compute_run_cost({ + 'complete': run['complete_ms'], + 'timestamp': run['timestamp_ms'], + 'instance_type': run['instance_type'] or 'unknown', + 'spot': run['spot'], + 'instance_vcpus': run['instance_vcpus'], + }) + if cost is not None and cost != run['cost_usd']: + conn.execute(''' + UPDATE ci_runs SET 
cost_usd = ? + WHERE dashboard = ? AND timestamp_ms = ? AND name = ? + ''', (cost, run['dashboard'], run['timestamp_ms'], run['name'])) + updated += 1 + conn.commit() + print(f"[rk_metrics] Recalculated costs: {updated}/{len(runs)} changed") + return updated def start_ci_run_sync(redis_conn): """Start periodic CI run + test event sync thread.""" _load_seed_data() + _backfill_daily_stats() + _backfill_test_hashes() + _materialize_ci_run_daily_stats() def loop(): while True: try: sync_ci_runs_to_sqlite(redis_conn) sync_failed_tests_to_sqlite(redis_conn) + resolve_unknown_instance_types() + _materialize_ci_run_daily_stats() + db.cache_cleanup() except Exception as e: print(f"[rk_metrics] sync error: {e}") time.sleep(600) # check every 10 min (TTL gates actual work) @@ -600,3 +1202,21 @@ def get_flakes_by_command(date_from, date_to, dashboard=''): 'total_failures': sum(failures_by_command.values()), }, } + + +def get_test_history(test_hash: str, branch: str = '', limit: int = 1000) -> list[dict]: + """Get test event history by test_hash, matching Redis history_{hash}[_{branch}] lists.""" + conditions = ['test_hash = ?'] + params: list = [test_hash] + if branch: + conditions.append('ref_name = ?') + params.append(branch) + where = 'WHERE ' + ' AND '.join(conditions) + params.append(limit) + return db.query(f''' + SELECT status, test_cmd, log_url, ref_name, commit_author, + commit_msg, duration_secs, dashboard, timestamp + FROM test_events {where} + ORDER BY timestamp DESC + LIMIT ? 
+ ''', params) diff --git a/ci3/ci-metrics/requirements.txt b/ci3/ci-metrics/requirements.txt index d6516263133f..310ecadf230a 100644 --- a/ci3/ci-metrics/requirements.txt +++ b/ci3/ci-metrics/requirements.txt @@ -6,3 +6,4 @@ Flask-HTTPAuth requests google-cloud-bigquery boto3 +pytest diff --git a/ci3/ci-metrics/rk.py b/ci3/ci-metrics/rk.py new file mode 100644 index 000000000000..d099b92dbbd7 --- /dev/null +++ b/ci3/ci-metrics/rk.py @@ -0,0 +1 @@ +from app import app diff --git a/ci3/ci-metrics/test_cache.py b/ci3/ci-metrics/test_cache.py new file mode 100644 index 000000000000..5538a3810958 --- /dev/null +++ b/ci3/ci-metrics/test_cache.py @@ -0,0 +1,154 @@ +"""Automated performance tests: SQLite response cache makes 1-year ci-insights fast. + +Usage: + pip install pytest + METRICS_DB_PATH=/tmp/t.db DASHBOARD_PASSWORD=test REDIS_HOST=invalid pytest test_cache.py -v + +All 18 parametrised tests should pass. Cold requests may take several seconds; +warm (cached) requests must be < 100 ms each. 
+""" +import base64 +import json +import os +import tempfile +import time +from datetime import date, timedelta + +# Set env vars BEFORE importing the app so db path and Redis host are fixed +_db_path = tempfile.mktemp(suffix='.db') +os.environ.setdefault('METRICS_DB_PATH', _db_path) +os.environ.setdefault('DASHBOARD_PASSWORD', 'test') +os.environ.setdefault('REDIS_HOST', 'invalid') # causes Redis errors, swallowed silently + +import pytest + +# Import app after env vars are set; background threads start but Redis fails gracefully +from app import app +import db + +# Basic-auth header for 'test:test' +_AUTH = {'Authorization': 'Basic ' + base64.b64encode(b'test:test').decode()} + +YEAR_FROM = '2025-02-24' +YEAR_TO = '2026-02-24' + +ENDPOINTS = [ + f'/api/ci/performance?from={YEAR_FROM}&to={YEAR_TO}&granularity=daily', + f'/api/ci/phases?from={YEAR_FROM}&to={YEAR_TO}', + f'/api/ci/flakes-by-command?from={YEAR_FROM}&to={YEAR_TO}', + f'/api/tests/timings?from={YEAR_FROM}&to={YEAR_TO}', + f'/api/merge-queue/stats?from={YEAR_FROM}&to={YEAR_TO}', + f'/api/prs/metrics?from={YEAR_FROM}&to={YEAR_TO}', +] + + +def _seed(): + """Insert one year of synthetic data covering all 6 ci-insights endpoints.""" + conn = db.get_db() + dashboards = ['next', 'prs', 'master'] + start = date(2025, 2, 24) + end = date(2026, 2, 24) + ts_base = int(time.mktime(start.timetuple())) * 1000 + ms_per_day = 86_400_000 + + for i, day in enumerate( + start + timedelta(days=n) for n in range((end - start).days + 1) + ): + ds = day.isoformat() + ts = ts_base + i * ms_per_day + + # merge_queue_daily — one row per day + conn.execute( + 'INSERT OR IGNORE INTO merge_queue_daily (date, total, success, failure) VALUES (?,10,8,2)', + (ds,), + ) + + for dash in dashboards: + # ci_runs — 5 per pipeline per day + for j in range(5): + conn.execute( + '''INSERT OR IGNORE INTO ci_runs + (dashboard, name, timestamp_ms, complete_ms, status, author, synced_at) + VALUES (?,?,?,?,?,?,?)''', + ( + dash, 
f'run-{i}-{dash}-{j}', + ts + j * 60_000, + ts + j * 60_000 + 3_600_000, + 'PASSED' if j % 5 != 0 else 'FAILED', + 'ci-bot', ds, + ), + ) + + # test_daily_stats + conn.execute( + '''INSERT OR IGNORE INTO test_daily_stats + (date, test_cmd, dashboard, passed, failed, flaked) VALUES (?,?,?,80,5,2)''', + (ds, f'test_{dash}', dash), + ) + + # test_events — 3 per pipeline per day (one flaked for flakes endpoint) + for j in range(3): + conn.execute( + '''INSERT OR IGNORE INTO test_events + (status, test_cmd, ref_name, dashboard, timestamp, duration_secs) + VALUES (?,?,?,?,?,?)''', + ( + 'passed' if j < 2 else 'flaked', + f'test_{dash}', + 'main', dash, + f'{ds}T12:00:0{j}', + 30.0 + j, + ), + ) + + # ci_phases — build + test phases per pipeline per day + for phase in ('build', 'test'): + conn.execute( + '''INSERT OR IGNORE INTO ci_phases + (phase, duration_secs, dashboard, timestamp) VALUES (?,?,?,?)''', + (phase, 1200.0, dash, f'{ds}T12:00:00'), + ) + + conn.commit() + + +@pytest.fixture(scope='session', autouse=True) +def seeded_db(): + _seed() + + +@pytest.fixture(scope='session') +def client(): + app.config['TESTING'] = True + with app.test_client() as c: + yield c + + +@pytest.mark.parametrize('url', ENDPOINTS) +def test_cold_returns_valid_json(client, url): + """First request computes from SQLite and returns valid JSON.""" + r = client.get(url, headers=_AUTH) + assert r.status_code == 200, f'HTTP {r.status_code}: {r.data[:200]}' + data = json.loads(r.data) + assert data # non-empty response + + +@pytest.mark.parametrize('url', ENDPOINTS) +def test_warm_hit_under_100ms(client, url): + """Second request is served from cache and completes in < 100 ms.""" + # Ensure cold request ran (order not guaranteed across parametrised tests) + client.get(url, headers=_AUTH) + # Warm request — must hit cache + t0 = time.perf_counter() + r = client.get(url, headers=_AUTH) + elapsed_ms = (time.perf_counter() - t0) * 1000 + assert r.status_code == 200 + assert elapsed_ms < 100, 
f'{url}: cache hit took {elapsed_ms:.1f} ms (limit 100 ms)' + + +@pytest.mark.parametrize('url', ENDPOINTS) +def test_cached_response_matches_original(client, url): + """Cached response is byte-for-byte identical to the original.""" + r1 = client.get(url, headers=_AUTH) + r2 = client.get(url, headers=_AUTH) + assert r1.data == r2.data diff --git a/ci3/ci-metrics/test_cloudtrail.py b/ci3/ci-metrics/test_cloudtrail.py new file mode 100644 index 000000000000..8acd71925cec --- /dev/null +++ b/ci3/ci-metrics/test_cloudtrail.py @@ -0,0 +1,302 @@ +#!/usr/bin/env python3 +"""Test CloudTrail instance type resolution against real data + SQLite. + +Usage: + python3 test_cloudtrail.py /path/to/metrics.db --dry-run # preview matches + python3 test_cloudtrail.py /path/to/metrics.db # apply updates + python3 test_cloudtrail.py --days 7 --dry-run # only last 7 days +""" +import json +import os +import re +import sqlite3 +import sys +from datetime import datetime, timedelta, timezone + +try: + import boto3 +except ImportError: + print("ERROR: boto3 not installed") + sys.exit(1) + +DB_PATH = os.getenv('METRICS_DB_PATH', + os.path.join(os.getenv('LOGS_DISK_PATH', '/logs-disk'), 'metrics.db')) +for arg in sys.argv[1:]: + if not arg.startswith('-') and os.path.exists(arg): + DB_PATH = arg + break + +dry_run = '--dry-run' in sys.argv +days_back = 90 +for i, arg in enumerate(sys.argv): + if arg == '--days' and i + 1 < len(sys.argv): + days_back = int(sys.argv[i + 1]) + +ct = boto3.client('cloudtrail', region_name='us-east-2') + + +def fetch_events(event_name, start, end, max_events=10000): + events = [] + kwargs = { + 'LookupAttributes': [{'AttributeKey': 'EventName', 'AttributeValue': event_name}], + 'StartTime': start, 'EndTime': end, 'MaxResults': 50, + } + while True: + resp = ct.lookup_events(**kwargs) + events.extend(resp.get('Events', [])) + token = resp.get('NextToken') + if not token or len(events) >= max_events: + break + kwargs['NextToken'] = token + return events + + +def 
normalize_branch_name(name): + """Normalize a branch name the same way bootstrap_ec2 does for the EC2 Name tag.""" + # Strip merge queue prefix: gh-readonly-queue/next/pr-123-... → pr-123 + m = re.match(r'^gh-readonly-queue/[^/]+/pr-(\d+)', name) + if m: + return f'pr-{m.group(1)}' + # Strip " (queue)" suffix from log_ci_run simplified names + name = re.sub(r'\s*\(queue\)$', '', name) + # Same as: echo -n "$REF_NAME" | head -c 50 | tr -c 'a-zA-Z0-9-' '_' + return re.sub(r'[^a-zA-Z0-9-]', '_', name[:50]) + + +# ---- Step 1: Fetch RunInstances events in daily chunks ---- +end_time = datetime.now(timezone.utc) +start_time = end_time - timedelta(days=days_back) + +print(f"Fetching RunInstances events in daily chunks ({start_time.date()} to {end_time.date()})...") +instance_types = {} # instance_id → instance_type +instance_times = {} # instance_id → launch_time_ms +total_run_events = 0 + +day_start = start_time.replace(hour=0, minute=0, second=0, microsecond=0) +while day_start < end_time: + day_end = min(day_start + timedelta(days=1), end_time) + events = fetch_events('RunInstances', day_start, day_end) + total_run_events += len(events) + + for event in events: + try: + detail = json.loads(event.get('CloudTrailEvent', '{}')) + itype = detail.get('requestParameters', {}).get('instanceType', '') + items = (detail.get('responseElements') or {}).get('instancesSet', {}).get('items', []) + for item in items: + iid = item.get('instanceId', '') + item_type = item.get('instanceType', '') or itype + if iid and item_type: + instance_types[iid] = item_type + instance_times[iid] = int(event['EventTime'].timestamp() * 1000) + except Exception: + continue + + day_start = day_start + timedelta(days=1) + sys.stdout.write(f"\r {day_start.strftime('%Y-%m-%d')}: {total_run_events} events, {len(instance_types)} instances") + sys.stdout.flush() + +print(f"\n Total: {total_run_events} RunInstances events, {len(instance_types)} unique instances") + +if not instance_types: + print("No 
RunInstances data. Exiting.") + sys.exit(1) + +# ---- Step 2: Fetch CreateTags events in daily chunks ---- +# NOTE: Tags are applied to CI instances in multiple create-tags calls: +# 1. aws_request_instance_type line 97: Name + Group + GithubActor + CICommand + Dashboard (all at once) +# 2. aws_request_instance_type line 126: Name only (redundant, after SSH) +# 3. aws_request_instance_type line 127: Group only (redundant, after SSH) +# CloudTrail sometimes misses event #1, so we must accumulate tags from ALL events +# for each instance, then filter to build instances afterwards. +print(f"\nFetching CreateTags events in daily chunks...") +all_instance_tags = {} # instance_id → accumulated tags (unfiltered) +total_tag_events = 0 + +day_start = start_time.replace(hour=0, minute=0, second=0, microsecond=0) +while day_start < end_time: + day_end = min(day_start + timedelta(days=1), end_time) + events = fetch_events('CreateTags', day_start, day_end) + total_tag_events += len(events) + + for event in events: + try: + detail = json.loads(event.get('CloudTrailEvent', '{}')) + req = detail.get('requestParameters', {}) + resources = req.get('resourcesSet', {}).get('items', []) + tags = req.get('tagSet', {}).get('items', []) + tag_dict = {t.get('key', ''): t.get('value', '') for t in tags} + for res in resources: + rid = res.get('resourceId', '') + if rid.startswith('i-'): + if rid not in all_instance_tags: + all_instance_tags[rid] = {} + all_instance_tags[rid].update(tag_dict) + except Exception: + continue + + day_start = day_start + timedelta(days=1) + sys.stdout.write(f"\r {day_start.strftime('%Y-%m-%d')}: {total_tag_events} events, {len(all_instance_tags)} instances") + sys.stdout.flush() + +# Filter to build instances (those with Group=build-instance tag) +instance_tags = { + iid: tags for iid, tags in all_instance_tags.items() + if tags.get('Group') == 'build-instance' +} +print(f"\n Total: {total_tag_events} CreateTags events, {len(all_instance_tags)} total instances, 
{len(instance_tags)} build instances") + +# ---- Step 3: Join RunInstances + CreateTags by instance_id ---- +instances = [] +joined_count = 0 +for iid, itype in instance_types.items(): + tags = instance_tags.get(iid, {}) + has_tags = bool(tags.get('Name')) + if has_tags: + joined_count += 1 + instances.append({ + 'instance_id': iid, + 'instance_type': itype, + 'launch_ms': instance_times.get(iid, 0), + 'dashboard': tags.get('Dashboard', ''), + 'name_tag': tags.get('Name', ''), + 'actor': tags.get('GithubActor', ''), + }) + +print(f"\n Joined: {len(instances)} total RunInstances, {joined_count} with Name tag from CreateTags") +print(f" CreateTags instances NOT in RunInstances: {len(instance_tags) - joined_count}") + +# Show type distribution +type_counts = {} +for inst in instances: + if inst['name_tag']: + type_counts[inst['instance_type']] = type_counts.get(inst['instance_type'], 0) + 1 +print(f"\n Instance types (from joined data):") +for t, c in sorted(type_counts.items(), key=lambda x: -x[1]): + print(f" {t}: {c}") + +# ---- Step 4: Load SQLite and match ---- +if not os.path.exists(DB_PATH): + print(f"\nNo database at {DB_PATH}. Exiting after CloudTrail summary.") + sys.exit(0) + +conn = sqlite3.connect(DB_PATH) +conn.row_factory = sqlite3.Row + +cutoff_ms = int((datetime.now(timezone.utc) - timedelta(days=days_back)).timestamp() * 1000) +unknown_runs = conn.execute(''' + SELECT dashboard, name, timestamp_ms, complete_ms, instance_vcpus, spot, + cost_usd, arch, pr_number + FROM ci_runs + WHERE (instance_type IS NULL OR instance_type = '' OR instance_type = 'unknown') + AND timestamp_ms > ? 
+''', (cutoff_ms,)).fetchall() +print(f"\n{len(unknown_runs)} unknown ci_runs in last {days_back} days") + +# Build lookup: normalized_name → [instances] for fast matching +# Name tag format: _[_] +# Examples: +# next_amd64 → branch=next +# merge-train_spartan_amd64_17 → branch=merge-train_spartan +# pr-20419_arm64_a1-fast → branch=pr-20419 +# cl_all_in_makefile_arm64_a1-fast → branch=cl_all_in_makefile +_NAME_TAG_RE = re.compile(r'^(.+)_(amd64|arm64)(?:_.*)?$') +tag_index = {} +for inst in instances: + if inst['name_tag']: + m = _NAME_TAG_RE.match(inst['name_tag']) + if m: + branch = m.group(1) + tag_index.setdefault(branch, []).append(inst) + else: + # No arch suffix found — use name as-is + tag_index.setdefault(inst['name_tag'], []).append(inst) + +updated = 0 +unmatched_dashboards = {} +matches = [] +for run in unknown_runs: + run_name = run['name'] + run_arch = run['arch'] or '' + run_ts = run['timestamp_ms'] + run_dashboard = run['dashboard'] + + # Compute expected EC2 instance name (same as bootstrap_ec2) + expected_name = normalize_branch_name(run_name) + + # Look up by normalized name + candidates = tag_index.get(expected_name, []) + + best = None + best_delta = float('inf') + for inst in candidates: + # Verify arch matches — Name tag format: branch_[_postfix] + if run_arch: + m = _NAME_TAG_RE.match(inst['name_tag']) + if m and m.group(2) != run_arch: + continue + # Verify dashboard matches (if tag present) + if inst['dashboard'] and inst['dashboard'] != run_dashboard: + continue + # CI run should start AFTER instance launch. Instance runs multiple steps + # over its ~90-minute lifetime (default shutdown timer). 
+ delta = run_ts - inst['launch_ms'] + if delta < -60_000: # run shouldn't start >1 min before launch + continue + if delta > 5400_000: # 90 min max lifetime + continue + # Prefer the most recently launched instance (closest launch BEFORE run) + if delta >= 0 and (best is None or inst['launch_ms'] > best['launch_ms']): + best_delta = delta + best = inst + elif best is None and abs(delta) < 60_000: + # Allow small negative delta (clock skew) + best_delta = abs(delta) + best = inst + + if best: + matches.append({ + 'dashboard': run_dashboard, + 'name': run_name, + 'timestamp_ms': run_ts, + 'new_type': best['instance_type'], + 'delta_s': round(best_delta / 1000), + 'tag': best['name_tag'], + 'iid': best['instance_id'], + }) + if not dry_run: + conn.execute(''' + UPDATE ci_runs SET instance_type = ? + WHERE dashboard = ? AND timestamp_ms = ? AND name = ? + ''', (best['instance_type'], run_dashboard, run_ts, run_name)) + updated += 1 + else: + unmatched_dashboards[run_dashboard] = unmatched_dashboards.get(run_dashboard, 0) + 1 + +if not dry_run and updated: + conn.commit() + +print(f"\n{'Would resolve' if dry_run else 'Resolved'} {updated}/{len(unknown_runs)} unknown instance types") + +if matches: + print(f"\nSample matches:") + for m in matches[:30]: + print(f" [{m['dashboard']:6s}] {m['name']:45s} -> {m['new_type']:15s} " + f"(dt={m['delta_s']:4d}s, tag={m['tag']}, id={m['iid']})") + if len(matches) > 30: + print(f" ... 
and {len(matches) - 30} more") + + # Summary by type + type_counts = {} + for m in matches: + type_counts[m['new_type']] = type_counts.get(m['new_type'], 0) + 1 + print(f"\nResolved types:") + for t, c in sorted(type_counts.items(), key=lambda x: -x[1]): + print(f" {t}: {c}") + +if unmatched_dashboards: + print(f"\nUnmatched by dashboard:") + for d, c in sorted(unmatched_dashboards.items(), key=lambda x: -x[1]): + print(f" {d}: {c}") + +conn.close() diff --git a/ci3/ci-metrics/views/ci-health-report.html b/ci3/ci-metrics/views/ci-health-report.html new file mode 100644 index 000000000000..e23b0165116e --- /dev/null +++ b/ci3/ci-metrics/views/ci-health-report.html @@ -0,0 +1,999 @@ + + + + + +Aztec CI Health Report + + + + + +
+ + +
+
aztec-packages · Jan 21 – Feb 23, 2026
+

CI Health Report

+
34-day view · spend · flake · pipeline health · actions
+
+
$6,107
AWS CI EC2 (34d · metrics.db)
+
$22,738
AWS operational total (34d · Cost Explorer, ex-tax, ex-contract)
+
$9,972
GCP compute (30d · 31 namespaces)
+
63.5%
merge queue success (712 attempts)
+
92.3%
next pipeline pass rate
+
33.6 min
next P50 · +8% in 3 weeks
+
+
source: ci.aztec-labs.com metrics.db + BigQuery · 5,136 tracked runs · Jan 21–Feb 23, 2026
+
+ + +
+
§1 spend · overview
+

$6,107 AWS CI EC2 in 34 days — network is the cost hotspot at 30% of spend, 18.4% spot

+
Jan 21–Feb 23 · metrics.db cost_usd · CI pipelines only (GCP on next slide)
+
+
+
+
+
+
+
network pipeline
+
$5.03/run avg
+
523 runs · only 15.5% spot · $2,632 total = 37% of all CI spend
+
+
+
prs pipeline
+
$0.72/run avg
+
1,864 runs · 94.4% spot · $1,340 total · most cost-efficient pipeline
+
+
Network spot rate 15.5% vs 87–99% everywhere else. Spot costs ~86% less than on-demand. Network pipeline is the single largest AWS cost lever.
+
+
+
+ + +
+
§1 spend · full picture
+

$16K/month total: $9K dev/testing across both clouds, $6K always-on production

+
AWS CI EC2 $6,107 (34d · metrics.db) · AWS operational $22,738 (34d · Cost Explorer, ex-tax, ex-contract) · GCP $9,972 (30d)
+
+
+
+
+
+
+
+
+
+
GCP production clusters
+
$6,379/mo
+
testnet $997 · next-net $859 · mainnet $816 · staging $792 · fisherman $334. Always-on regardless of CI activity.
+
+
$6,107 = CI run EC2 tracked in metrics.db — what we directly pay per CI job. Gap to $16,221 total EC2 bill = always-on infra (NAT, VPC, bastion, EFS) not tagged as CI runs. $22,738 = full AWS operational (Cost Explorer, 34d): EC2 $16,221 + CloudFront $1,829 + EC2-Other $2,177 + ElastiCache $637 + misc $1,874. Excluded: $17,520 annual Savings Plan commitment (one-time contract) + $6,172 tax → $46,430 total AWS bill. GCP: $2,129 CI namespaces + $6,379 prod clusters (always-on, CI-independent).
+
+
+
+ + +
+
§1 spend · weekly trend
+

W04 network anomaly: $999 in one week — Feb 14 instance change cut it 91%

+
Stacked weekly CI spend by pipeline · m6a.48xlarge eliminated from network CI Feb 14, replaced by m6a.4xlarge
+
+
+
+
+
+
+
W04 network (m6a.48xlarge, on-demand)
+
$9.79/run
+
192 vCPUs, on-demand pricing. Long-failing jobs during p2p/epoch instability. $999 in one week.
+
+
+
W07 network (m6a.4xlarge)
+
$0.85/run
+
$94 total for the week. Network tests no longer run on the 192-vCPU on-demand beast.
+
+
W07 total: $988 vs W06 peak $1,947. 49% weekly reduction driven by eliminating m6a.48xlarge from network tests. kind tests also moved to spot this period.
+
+
+
+ + +
+
§1 spend · spot discipline
+

Network pipeline: 15.5% spot — every other pipeline runs 87–99% spot

+
Spot instances cost ~86% less than on-demand at equivalent capacity. The gap is isolated to network.
+
+
+
+
+
+
Network at 15.5% spot: 442 of 523 runs were on-demand. At prs pipeline spot rates (94.4%) the network bill drops from $2,632 to ~$370. ~$2,200/month opportunity.
+
GCP spot migration: $1,397/month in 0%-spot namespaces (eth-mainnet, sepolia, monitoring). Ops complexity — preemption handling for archive nodes. See §4.
+
kind tests moved to spot (done). Network pipeline is the next highest-ROI action on AWS.
+
+
+
+ + +
+
§2 flake · weekly pattern
+

One cluster drove every spike — p2p/epoch cleared completely in W07

+
Jan 14–Feb 23 · stacked: p2p/epoch (orange) · other flakes (blue) · hard fails (red)
+
+
+
+
+
+
+
p2p/epoch cluster (W02–W06)
+
2,034 events
+
56 distinct tests · all classified as flakes (0 hard fails) · 747 events in W06 → 2 in W07
+
+
W06 (Feb 9): 515 hard fails — highest of any week. Three high-risk PRs merged same day (see slide 8).
+
W08 (Feb 23, partial): 36 events, 0 p2p/epoch. Too early to call — partial week, low volume.
+
+
+
+ + +
+
§2 flake · anatomy
+

2,034 labeled events across 56 tests — and 1,912 unlabeled failures behind them

+
The e2e-p2p-epoch-flakes cluster is tagged. Everything else is anonymous.
+
+
+
+
+
+
+
e2e-p2p-epoch-flakes · 2,034 events · 56 tests · 0 hard fails
+

Known cluster. All events classified as flakes — timing-driven, not code bugs. Cleared in W07 after Santiago PRs #20351 (mbps test fix) and #20462 (remove hardcoded 10s timeout), plus ludamad #20613 (CI parallelism). Root cause: PXE using latest (not checkpointed) block across distributed epoch transitions. Will recur.

+
+
+
Unlabeled · 1,912 events · 938 distinct tests · merge queue failures
+

These are failures in the merge queue (next pipeline). In the queue, any failure blocks a PR — whether it's a real bug, infrastructure noise, or a timing race. 938 distinct failing tests with no cluster assignment and no assigned owner. This is the long tail of test rot that grows with every feature sprint.

+
+
The labeled cluster cleared. The unlabeled tail didn't. 938 distinct failing tests is residual risk that accumulates without active maintenance.
+
+
+
+ + +
+
§2 flake · signal quality
+

New flakes keep appearing — the floor doesn't clear, and 4 grinds didn't catch W04

+
0.12% overall flake rate (6,632 flakes / 5.5M test runs) — low headline, lumpy reality
+
+
+
W04: the gate failed
+
+
valid_epoch_pruned_slash: 0 events W03 → 346 events W04
+

This test passed the 4-run deflake gate and was merged. In its first full week in CI it produced 346 fail/flake events — 33% of the entire W04 spike. Similarly, tx_proposal_collector (180 events) and inactivity_slash_with_consequence (74 events) debuted in W04 with immediate instability. All passed the gate.

+
+
+
team-alpha now running 10 grinds
+

A stricter informal standard adopted by one team. Not yet universal policy. Reduces risk of introducing flaky tests but increases CI time per new test by 2.5×. Proposal: targeted deflake — instrument tests for determinism before setting a grind count. Outstanding from offsite.

+
+
+
+
W07: new regressions after p2p fix
+
+
profile_gates.test.ts (12 events) + compile.test.ts (11 events)
+

Both appeared for the first time in W07 — the same week the p2p cluster cleared. CLI-layer tests, hash-prefixed job context. Not present in W06. New regressions introduced during the W07 fix sprint, or surface area exposed once p2p noise was removed.

+
+
+
~7% of CI run failures are genuine code bugs
+

Most failures are infrastructure noise (nightly 61% quick-fail) or p2p timing (labeled cluster). Merge-queue failures often behave like flakes regardless of their root cause — they block PRs that may be perfectly correct. New failing tests appear every week; old ones aren't fully removed.

+
+
+
+
+ + +
+
§2 flake · PR correlation
+

What caused the spikes — and who fixed them

+
Attribution via ci_runs × pr_authors. Santiago Palladino: 18+ fix PRs in 6 weeks.
+
+
+
spike causes
+
+ +
+
W02 — Jan 13 · 2,072 flakes
+
spalladino refactors (e2e setup, archiver, test setup). Changed patterns exposing latent timing races across p2p/epoch simultaneously. Tipping point for existing instability.
+
+
+
+ +
+
W04 — Jan 26 · 935 flakes
+
PhilWindle added cross-chain mbps e2e tests without pre-deflaking. valid_epoch_pruned_slash: 0→346 events. tx_proposal_collector: 180 events. inactivity_slash_with_consequence: 74 events. All absent the prior week.
+
+
+
+ +
+
W06 — Feb 9 · 850 flakes + 515 hard fails (worst week)
+
Three high-risk PRs same day: #20047 peer scoring (15:27, mrzeszutko), #20241 max checkpoints→32 (11:21), #20257 hash constants (14:38, LeilaWang). Spanning p2p + epoch config + consensus hashes — the exact subsystems where all flakes live.
+
+
+
+
+
fixes that worked
+
+ +
+
W03 — Jan 23 · −57% · root fix
+
spalladino: checkpointed chain tip for PXE. PXE was using latest (not checkpointed) block, causing epoch boundary races. 6 of 7 CI runs passed cleanly. Most impactful single fix of the period.
+
+
+
+ +
+
W05 — Feb 3–5 · −33%
+
spalladino #20088 slasher multi-block handling. PhilWindle #20140 deflake discv5. 20+ CI runs over 2 days before clean merge.
+
+
+
+ +
+
W07 — Feb 10–17 · −65% · p2p cluster cleared
+
spalladino #20351 fix mbps chain test (p2p_client 311→0 flakes). #20462 remove hardcoded 10s timeout. ludamad #20613 CI parallelism — insufficient workers caused timeout cascades misclassified as flakes.
+
+
+
+
+
Pattern: every spike triggered by new unstable tests or multi-subsystem config changes without pre-deflaking. Will recur without structural change.
+
+ + +
+
§2 flake · maintenance cost
+

30 fix/deflake PRs in 34 days — nearly one per day of ongoing maintenance overhead

+
PRs with "fix/flake/deflake" in title or branch · Jan 14–Feb 23 · engineers patching unstable tests continuously
+
+
+
recent (Feb)
+
+
#20636spypsy · Feb 18
+
#20609alexghr · Feb 17
+
#20439ludamad · Feb 12
+
#20335spypsy · Feb 10
+
#20330ludamad · Feb 10
+
#19322charlielye · Feb 10
+
#20246mverzilli · Feb 6
+
#20243mverzilli · Feb 6
+
#20240mverzilli · Feb 6
+
#20215ludamad · Feb 5
+
#20160mverzilli · Feb 4
+
#20095suyash67 · Feb 4
+
#20140PhilWindle · Feb 3
+
#20131alexghr · Feb 3
+
#20119alexghr · Feb 3
+
#20115danielntmd · Feb 2
+
+
+
+
earlier (Jan)
+
+
#20090mralj · Jan 30
+
#20070mralj · Jan 30
+
#20068mralj · Jan 30
+
#20040mralj · Jan 29
+
#20024spalladino · Jan 28
+
#20004spalladino · Jan 28
+
#19952ludamad · Jan 26
+
#19910spalladino · Jan 23
+
#19782alexghr · Jan 21
+
#19767spalladino · Jan 20
+
#19705PhilWindle · Jan 19
+
#19618alexghr · Jan 15
+
#19588spalladino · Jan 15
+
#19580PhilWindle · Jan 14
+
+
+
+
+
deflake maintenance rate
+
30
+
PRs in 34 days = 0.88/day. 8 distinct contributors. spalladino (6), alexghr (5), ludamad (4), mverzilli (4), mralj (4), PhilWindle (3).
+
+
This is the hidden cost of test rot — not paid in dollars but in senior engineer hours. Each deflake PR is an interrupt to feature work.
+
+
+
+ + +
+
§3 health · pass rates
+

next at 92% — nightly and network stuck at 58%, different failure modes

+
Jan 21–Feb 23 · ci_run_daily_stats · 4,870 total runs across 5 pipelines
+
+
+
+
+
+
+
nightly (573 runs)
+
58.1%
+
61% of failures complete in under 5 min — single job, crashes at startup before tests run. Environment instability, not code.
+
+
+
network (450 runs)
+
58.0%
+
9.5% quick-fail, 87.9min avg fail duration. Network runs often partially pass — a FAIL may have completed 80% of its test suite before one test times out.
+
+
Nightly failures are environment crashes (startup), not code regressions. Network failures are long-running timeouts — pass rate understates how much actually succeeds.
+
+
+
+ + +
+
§3 health · failure anatomy
+

61% of nightly failures complete in under 5 minutes — infra crashes, not code

+
Quick-fail proxy: FAILED runs completing in <5 min. Heuristic — some short unit tests legitimately fail fast.
+
+
+
+
+
+
nightly: 60.8% quick-fail (avg 5.2min to failure). Single job type (next), bailing at startup. The pipeline is crashing on environment setup — likely a Docker pull, secret mount, or k8s scheduling failure — before any test code runs.
+
prs: 30.3% quick-fail (168 of 555 failures). 1 in 3 PR CI failures is infrastructure, not the engineer's code. Significant developer friction that inflates apparent failure rates.
+
next: 9.0% quick-fail — next failures are mostly genuine test failures. The highest-signal pipeline for code quality.
+
+
+
+ + +
+
§3 health · build time
+

next P50 +8% in 3 weeks — P95 up 22%, tail latency accelerating

+
W05=Feb 2 · W06=Feb 9 · W07=Feb 16 · individual ci_runs PASSED records · exact percentiles
+
+
+
+
+
+
+
P95 growth (3 weeks)
+
+22%
+
45.3min (W05) → 55.1min (W07). At this rate: P95 exceeds 70min by May.
+
+
+
P50 growth (3 weeks)
+
+8%
+
31.0min (W05) → 33.6min (W07). Compounded across 1,100+ next runs/month.
+
+
W08 early data (Feb 23, 10 runs only): P50=32.9, P95=34.5. Too small a sample to conclude. No identified root cause for the growth trend.
+
+
+
+ + +
+
§3 health · merge queue
+

63.5% merge queue success — W04 bottomed at 57.6%, W07 still only 59.5%

+
712 total attempts · 452 successes · 251 failures · Jan 21–Feb 23
+
+
+
+
+
+
+
34-day success rate
+
63.5%
+
1 in 3 merge attempts needs a retry. Target for a healthy queue: 85%+.
+
+
W07 (59.5%) is worse than W06 (69.6%) despite the p2p fix. Hard test failures replaced flakes as merge blockers — the queue improved in one dimension and degraded in another.
+
W04 worst week: 91 failures out of 217 attempts (57.6%). Coincided with the p2p/epoch spike and the new unstable test introductions.
+
+
+
+ + +
+
§3 health · scheduling patterns
+

Tuesday 72% vs Thursday 82% — the Monday queue effect is measurable

+
Jan 21–Feb 23 · all pipelines · 4,870 runs · 9.5pp spread between worst and best weekday
+
+
+
+
+
+
Mon/Tue dip: PRs accumulate over the weekend and all enter the merge queue simultaneously Monday morning. Pipeline contention drives higher failure rates. By Thursday the queue has cleared and pass rates recover.
+
9.5pp spread (Tue 72.3% → Thu 81.8%). Thursday–Friday is measurably safer for large feature merges. Batch rollouts on Monday are higher risk.
+
+
+
+ + +
+
§4 GCP · optimization
+

$1,397/month in 0%-spot namespaces — ops complexity vs savings is the open question

+
Five GCP namespaces running 100% on-demand at 86% spot discount foregone · Jan 21–Feb 20
+
+
+
+
+
+
+
Monthly savings potential
+
$1,397/mo
+
eth-mainnet + sepolia ($800) · monitoring ($599). At 86% spot discount, matching cluster-wide spot rate.
+
+
eth-mainnet and sepolia: Ethereum archive nodes, 80% memory utilization. Spot preemption means re-syncing from chain tip. Engineering cost to handle graceful preemption needs evaluation.
+
metrics + public-telemetry: Prometheus/Grafana. Spot-tolerant with PVC persistence — a platform ops task, not a code change. Lower risk than archive nodes.
+
+
+
+ + +
+
§5 actions · done
+

Three improvements landed in February

+
Concrete changes with measured impact on cost and flake counts.
+
+
+
cost — instance type
+
+
m6a.48xlarge → m6a.4xlarge (Feb 14)
+

The 192-vCPU on-demand instance running network tests is gone. At W04's failure rate it cost $9.79/run and $999 in a single week. m6a.4xlarge costs $0.85/run. W07 network spend: $94 vs W04's $999. 91% per-run cost reduction. Network tests no longer run on an oversized on-demand machine. Done.

+
+
+
kind tests moved to spot
+

kind test runs moved from on-demand to spot instances. ~86% cost reduction on affected runs. Done.

+
+
+
+
flake — p2p/epoch cleared
+
+
e2e-p2p-epoch-flakes: 2,034 → ~0 events
+

The cluster that drove every spike since Jan 6 cleared in W07. Two p2p/epoch events in W07 vs 747 in W06. W08: zero p2p events so far.

+
+
+
Santiago Palladino: 18+ fix PRs (Jan–Feb)
+

#19914 checkpointed PXE chain tip (root fix), #20088 slasher multi-block, #20351 mbps chain test (311→0 flakes), #20462 remove hardcoded 10s timeout. ludamad #20613 CI parallelism fix.

+
+
+
+
open — not yet resolved
+
+
p2p cluster root cause
+

Cleared via targeted fixes, not architectural resolution. PXE epoch boundary races and test isolation issues remain. Will recur when new p2p/epoch features merge. No assigned owner for permanent fix.

+
+
+
Build time creep unresolved
+

next P50 +8%, P95 +22% in 3 weeks. No identified cause. At current rate P95 exceeds 70 min by May.

+
+
+
+
+ + +
+
§5 actions · in progress
+

The deflake gate exists — but W04 proved 4 grinds isn't enough for epoch/slashing tests

+
Outstanding from offsite: reassess deflake strategy. team-alpha already at 10 grinds.
+
+
+
current state
+
+
4-run deflake gate (universal, always existed)
+

All new e2e tests must pass 4 consecutive CI runs before merging. Has been standard for some time. Cost: ~$11 in deflake CI spend over 34 days — not a cost constraint.

+
+
+
W04 evidence: the gate failed
+

valid_epoch_pruned_slash passed 4 grinds and produced 346 events in its first week. tx_proposal_collector (180 events) and inactivity_slash_with_consequence (74 events) debuted similarly. The gate is not filtering unstable epoch/slashing tests adequately.

+
+
+
team-alpha: 10 grinds
+

Informal higher standard on one team. Not yet universal. Reduces risk but increases CI wait time by 2.5× per new test.

+
+
+
+
options
+
+
Option A: raise blanket gate to 10 grinds
+

Universal. Simple to enforce. team-alpha already doing this. Tradeoff: 2.5× CI cost per new e2e test; developers wait longer before merge. Not evidence-based — fast-passing tests still get 10 runs.

+ A-533 · set up hard grinding tests in spartan merge train +
+
+
Option B: targeted deflake (proposed)
+

Analyze test pass rate distribution over N runs. Flag tests above a variance threshold. Grind count becomes adaptive: stable tests get 4, timing-sensitive tests get 20+. More surgical, higher tooling cost to implement.

+
+
+
Decision needed from offsite follow-up
+

Who owns the deflake gate upgrade? What is the target flake rate threshold before a test is considered acceptable for CI merge?

+
+
+
+
+ + +
+
§5 actions · open questions
+

Three questions for discussion

+
Not answered here — require team input, owner assignment, or cost-benefit analysis.
+
+
+
deflake strategy
+
+
Targeted deflake vs blanket grinds?
+

team-alpha doing 10 grinds — should this become universal? Or build adaptive tooling that sets the grind count per-test based on variance? Who owns the implementation and the policy?

+ A-533 +
+
Evidence: W04 proved 4 isn't enough for epoch/slashing tests. 10 is pragmatic but not evidence-based. Targeted deflake is surgical but requires tooling investment.
+
+
+
GCP spot migration
+
+
$1,397/month savings — worth the ops complexity?
+

eth-mainnet and sepolia archive nodes: spot preemption means re-syncing from chain tip. metrics and public-telemetry: lower risk, Prometheus/Grafana with PVC persistence. What's the engineering cost to make each namespace preemption-safe?

+
+
AWS network pipeline spot migration (~$2,200/mo) is likely the easier, higher-ROI first step — no archive node complexity.
+
+
+
p2p/epoch ownership
+
+
Who owns the cluster to permanent resolution?
+

The cluster cleared through 18+ targeted fix PRs. Root cause — PXE epoch boundary races, test isolation, distributed timing — is not architecturally resolved. Next p2p feature merge will likely trigger another spike without a named owner and explicit SLO.

+
+
Without assignment: the next spike will be diagnosed reactively, same as this one. Expected recurrence: within 1–2 major p2p feature merges.
+
+
+
+ +
+ +
1 / 19
+ + + + + diff --git a/ci3/ci-metrics/views/ci-insights.html b/ci3/ci-metrics/views/ci-insights.html index 533b6bfb62cd..bb483af6f1d9 100644 --- a/ci3/ci-metrics/views/ci-insights.html +++ b/ci3/ci-metrics/views/ci-insights.html @@ -22,6 +22,15 @@ .msg { color:#888; padding:8px 0; } .msg.err { color:#f85149; } + /* Tabs */ + .tabs { display:flex; gap:0; margin:12px 0 0 0; } + .tab { background:#111; border:1px solid #333; border-bottom:none; color:#888; + font-family:monospace; font-size:13px; padding:6px 16px; cursor:pointer; } + .tab:hover { color:#ccc; } + .tab.active { background:#0a0a0a; color:#fff; border-color:#58a6ff; border-bottom:1px solid #0a0a0a; position:relative; z-index:1; } + .tab-content { display:none; border:1px solid #333; border-top:1px solid #333; padding:12px; background:#0a0a0a; margin-top:-1px; } + .tab-content.active { display:block; } + /* KPI strip */ .kpi-strip { display:flex; gap:12px; margin:16px 0; flex-wrap:wrap; } .kpi { background:#0a0a0a; border:1px solid #222; padding:12px 16px; flex:1; min-width:180px; max-height:120px; overflow:hidden; } @@ -53,23 +62,41 @@ .amt { font-variant-numeric:tabular-nums; text-align:right; } th.amt { text-align:right; } .detail-scroll { max-height:500px; overflow:auto; } + .detail-table { width:100%; border-collapse:collapse; font-size:12px; } + .detail-table th { text-align:left; padding:4px 6px; border-bottom:1px solid #333; color:#888; white-space:nowrap; position:sticky; top:0; background:#0a0a0a; } + .detail-table td { padding:4px 6px; border-bottom:1px solid #111; white-space:nowrap; } + .detail-table .amt { text-align:right; font-variant-numeric:tabular-nums; } + .detail-table th.amt { text-align:right; } + .stats { margin:12px 0; color:#888; } + .stats span { color:#ccc; } + /* Test details */ + .cmd { max-width:500px; overflow:hidden; text-overflow:ellipsis; white-space:nowrap; } + .pass { color:#3fb950; } + .fail { color:#f85149; } + .flake { color:#d29922; } -

ci insights

+

ci insights

- + + - + + + + | @@ -82,71 +109,205 @@

ci insights

- - -
-
daily ci spend
--
-
cost / merge
--
-
mq success rate
--
-
flakes / day
--
-
prs merged / day
--
+
+
Overview
+
Attribution
- -
-
-

daily ci cost + 7-day rolling cost per merge

-
+ +
+ -
-

merge queue: daily outcomes + success rate

-
+ +
+
mq success rate
--
+
flakes / day
--
+
prs merged / day
--
+
avg mq duration
--
-
-

flakes + test failures per day

-
+ +
+
+

merge queue: daily outcomes + success rate

+
+
+
+

test outcomes per day

+
+
+
+

ci run duration by pipeline (avg mins)

+
+
+
+

total ci time by pipeline (hours)

+
+
+
+

P95 build time by pipeline & phase (secs)

+
+
+
+ +
+
+
top flaky tests
+
+ + + +
testflakesaffected
+
+
+
+
top failing tests
+
+ + + +
testfailuresaffected
+
+
-
- -
flakes by pipeline
-
- - - -
+
flakes by pipeline
+
+ + + +
+
+ + +
+
+ test details + | + + + + +
+
+
+
+
+
+

avg duration by day

+
+
+
+

test run count by day

+
+
+
+

tests by duration

+
+ + + + + + + + + + + + + + + + +
test commandrunsavg (s)min (s)max (s)total (h)pass %passedfailedflaked
+
+

slowest individual runs

+
+ + + + + + + + + + + + + +
test commandduration (s)statusdateauthorpipelinelog
+
- -
author ci profile
-
- - - -
+ +
+
+ +
+
+
+

ci cost by run type (time series)

+
+
+
+

cost by user (AWS + GCP)

+
+
+
+

cost by run type

+
+
+
+ +
author ci profile
+
+ + + +
+
+ +
instances
+
+ + + +
+
- + diff --git a/ci3/ci-metrics/views/commits.html b/ci3/ci-metrics/views/commits.html new file mode 100644 index 000000000000..03143adff905 --- /dev/null +++ b/ci3/ci-metrics/views/commits.html @@ -0,0 +1,345 @@ + + + + + Commits — aztec-packages + + + + + +

commits — next

+ +
+ + + + + + + + + + +
+ +
Loading…
+ + + + + + diff --git a/ci3/ci-metrics/views/cost-overview.html b/ci3/ci-metrics/views/cost-overview.html index 53424a2d2d70..da8d73e0b7f8 100644 --- a/ci3/ci-metrics/views/cost-overview.html +++ b/ci3/ci-metrics/views/cost-overview.html @@ -71,17 +71,23 @@ -

cost overview

+

cost overview

- - + + + + + + | @@ -98,7 +104,6 @@

cost overview

Overview
Resource Details
-
CI Attribution
@@ -136,35 +141,6 @@

aws vs gcp split

-
-
- -
-
-
-

ci cost by run type (time series)

-
-
-
-

cost by user (AWS + GCP)

-
-
-
-

cost by run type

-
-
-
-

instances

-
- - - -
-
-
+ + diff --git a/ci3/ci-metrics/views/test-timings.html b/ci3/ci-metrics/views/test-timings.html index 0bf6c7213bd6..63cc54bb3690 100644 --- a/ci3/ci-metrics/views/test-timings.html +++ b/ci3/ci-metrics/views/test-timings.html @@ -1,289 +1,7 @@ - - - ACI - Test Timings - - +Redirecting... - - -

test timings

- -
- - - - - | - - - | - - - | - - -
- -
loading...
- -
- -
-
-

avg duration by day

-
-
-
-

test run count by day

-
-
-
- -

tests by duration

-
- - - - - - - - - - - - - - - - -
test commandrunsavg (s)min (s)max (s)total (h)pass %passedfailedflaked
-
- -

slowest individual runs

-
- - - - - - - - - - - - - -
test commandduration (s)statusdateauthorpipelinelog
-
- - - + diff --git a/ci3/dashboard/Dockerfile b/ci3/dashboard/Dockerfile index 2da7805ffa83..cd2e5b1f9b1d 100644 --- a/ci3/dashboard/Dockerfile +++ b/ci3/dashboard/Dockerfile @@ -24,4 +24,4 @@ RUN pip install --no-cache-dir -r ci-metrics/requirements.txt RUN git config --global --add safe.directory /aztec-packages COPY . . EXPOSE 8080 8081 -CMD ["gunicorn", "-w", "100", "-b", "0.0.0.0:8080", "rk:app"] +CMD ["gunicorn", "-w", "50", "-b", "0.0.0.0:8080", "rk:app"] diff --git a/ci3/dashboard/requirements.txt b/ci3/dashboard/requirements.txt index 9c1526f5b7a8..f3e1e9c53c08 100644 --- a/ci3/dashboard/requirements.txt +++ b/ci3/dashboard/requirements.txt @@ -5,3 +5,4 @@ ansi2html Flask-Compress requests Flask-HTTPAuth +boto3 diff --git a/ci3/dashboard/rk.py b/ci3/dashboard/rk.py index aedf35a824e2..12b9a414077f 100644 --- a/ci3/dashboard/rk.py +++ b/ci3/dashboard/rk.py @@ -1,6 +1,8 @@ from flask import Flask, render_template_string, request, Response, redirect from flask_compress import Compress from flask_httpauth import HTTPBasicAuth +import boto3 +from botocore.exceptions import ClientError import gzip import json import os @@ -9,6 +11,7 @@ import shlex import subprocess import threading +import time as _time import uuid from ansi2html import Ansi2HTMLConverter from pathlib import Path @@ -19,6 +22,10 @@ hyperlink, r, get_section_data, get_list_as_string ) LOGS_DISK_PATH = os.getenv('LOGS_DISK_PATH', '/logs-disk') +S3_LOGS_BUCKET = os.getenv('S3_LOGS_BUCKET', 'aztec-ci-artifacts') +S3_LOGS_PREFIX = os.getenv('S3_LOGS_PREFIX', 'logs') + +_s3 = boto3.client('s3', region_name='us-east-2') DASHBOARD_PASSWORD = os.getenv('DASHBOARD_PASSWORD', 'password') CI_METRICS_PORT = int(os.getenv('CI_METRICS_PORT', '8081')) CI_METRICS_URL = os.getenv('CI_METRICS_URL', f'http://localhost:{CI_METRICS_PORT}') @@ -27,37 +34,47 @@ Compress(app) auth = HTTPBasicAuth() -# Start the ci-metrics server as a subprocess -# Check sibling dir (repo layout) then subdirectory (Docker layout) +# 
Start the ci-metrics server as a subprocess (once across all workers). +# Uses a file lock so only the first gunicorn worker to import this module +# actually spawns the process; the rest skip silently. +import fcntl +import signal + _ci_metrics_dir = os.path.join(os.path.dirname(os.path.abspath(__file__)), '..', 'ci-metrics') if not os.path.isdir(_ci_metrics_dir): _ci_metrics_dir = os.path.join(os.path.dirname(os.path.abspath(__file__)), 'ci-metrics') if os.path.isdir(_ci_metrics_dir): - # Kill any stale process on the port (e.g. leftover from previous reload) - import signal + _lock_path = f'/tmp/ci-metrics-{CI_METRICS_PORT}.lock' try: - out = subprocess.check_output( - ['lsof', '-ti', f':{CI_METRICS_PORT}'], stderr=subprocess.DEVNULL, text=True) - for pid in out.strip().split('\n'): - if pid: - os.kill(int(pid), signal.SIGTERM) - import time; time.sleep(0.5) - except (subprocess.CalledProcessError, OSError): + _lock_fd = open(_lock_path, 'w') + fcntl.flock(_lock_fd, fcntl.LOCK_EX | fcntl.LOCK_NB) + # We hold the lock — kill stale process and spawn fresh one + try: + out = subprocess.check_output( + ['lsof', '-ti', f':{CI_METRICS_PORT}'], stderr=subprocess.DEVNULL, text=True) + for pid in out.strip().split('\n'): + if pid: + os.kill(int(pid), signal.SIGTERM) + _time.sleep(0.5) + except (subprocess.CalledProcessError, OSError): + pass + _ci_metrics_env = {**os.environ, 'CI_METRICS_PORT': str(CI_METRICS_PORT)} + subprocess.Popen( + ['gunicorn', '-w', '1', '-b', f'0.0.0.0:{CI_METRICS_PORT}', + '--timeout', '120', 'app:app'], + cwd=_ci_metrics_dir, + env=_ci_metrics_env, + ) + print(f"[rk.py] ci-metrics server started on port {CI_METRICS_PORT}") + # Hold the lock until this process exits so other workers skip + except OSError: + # Another worker already holds the lock — nothing to do pass - _ci_metrics_env = {**os.environ, 'CI_METRICS_PORT': str(CI_METRICS_PORT)} - subprocess.Popen( - ['gunicorn', '-w', '4', '-b', f'0.0.0.0:{CI_METRICS_PORT}', '--timeout', '120', 
'app:app'], - cwd=_ci_metrics_dir, - env=_ci_metrics_env, - ) - print(f"[rk.py] ci-metrics server started on port {CI_METRICS_PORT}") def read_from_disk(key): - """Read log from disk as fallback when Redis key not found.""" + """Read log from disk.""" try: - # Use first 4 chars as subdirectory prefix = key[:4] - log_file = f"/logs-disk/{prefix}/{key}.log.gz" log_file = f"{LOGS_DISK_PATH}/{prefix}/{key}.log.gz" if os.path.exists(log_file): with gzip.open(log_file, 'rb') as f: @@ -66,6 +83,20 @@ def read_from_disk(key): print(f"Error reading from disk: {e}") return None +def read_from_s3(key): + """Read log from S3 (fallback when Redis and disk both miss).""" + try: + prefix = key[:4] + s3_key = f"{S3_LOGS_PREFIX}/{prefix}/{key}.log.gz" + obj = _s3.get_object(Bucket=S3_LOGS_BUCKET, Key=s3_key) + return gzip.decompress(obj['Body'].read()).decode('utf-8', errors='replace') + except ClientError as e: + if e.response['Error']['Code'] != 'NoSuchKey': + print(f"S3 error reading {key}: {e}") + except Exception as e: + print(f"Error reading from S3: {e}") + return None + def read_breakdown_from_disk(runtime, flow_name, sha): """Read benchmark breakdown JSON from disk.""" try: @@ -178,7 +209,6 @@ def root() -> str: f"{hyperlink('/cost-overview', 'cost overview (AWS + GCP)')}\n" f"{hyperlink('/namespace-billing', 'namespace billing')}\n" f"{hyperlink('/ci-insights', 'ci insights')}\n" - f"{hyperlink('/test-timings', 'test timings')}\n" f"{RESET}" ) @@ -528,32 +558,32 @@ def make_options(param_name, options, current_value, suffix=''): _proxy_session = requests.Session() _HOP_BY_HOP = frozenset([ 'connection', 'keep-alive', 'proxy-authenticate', 'proxy-authorization', - 'te', 'trailers', 'transfer-encoding', 'upgrade', 'content-length', - # `requests` auto-decompresses gzip responses, so Content-Encoding is - # stale — strip it so the browser doesn't try to decompress plain content. - # Flask-Compress on rkapp handles browser compression. 
- 'content-encoding', + 'te', 'trailers', 'transfer-encoding', 'upgrade', ]) -# Don't forward Accept-Encoding — let `requests` negotiate with ci-metrics -# (it adds its own and auto-decompresses). -_STRIP_REQUEST_HEADERS = frozenset(['host', 'accept-encoding']) +_STRIP_REQUEST_HEADERS = frozenset(['host']) def _proxy(path): - """Forward request to ci-metrics, streaming the response back.""" + """Forward request to ci-metrics, streaming the response back. + + Passes the browser's Accept-Encoding through to ci-metrics so it + compresses directly for the browser. We stream the raw (still + compressed) bytes back without decompression. + """ url = f'{CI_METRICS_URL}/{path.lstrip("/")}' try: + fwd_headers = {k: v for k, v in request.headers if k.lower() not in _STRIP_REQUEST_HEADERS} resp = _proxy_session.request( method=request.method, url=url, params=request.args, data=request.get_data(), - headers={k: v for k, v in request.headers if k.lower() not in _STRIP_REQUEST_HEADERS}, + headers=fwd_headers, stream=True, - timeout=60, + timeout=180, ) - # Strip hop-by-hop headers + # Stream raw bytes (skip requests auto-decompression) headers = {k: v for k, v in resp.headers.items() if k.lower() not in _HOP_BY_HOP} - return Response(resp.iter_content(chunk_size=8192), + return Response(resp.raw.stream(8192), status=resp.status_code, headers=headers) except Exception as e: return Response(json.dumps({'error': f'ci-metrics unavailable: {e}'}), @@ -564,10 +594,13 @@ def _proxy(path): @app.route('/ci-insights') @app.route('/cost-overview') @app.route('/test-timings') +@app.route('/ci-health-report') +@app.route('/flake-prs') @auth.login_required def proxy_dashboard(): return _proxy(request.path) + @app.route('/api/', methods=['GET', 'POST', 'PUT', 'DELETE']) @auth.login_required def proxy_api(path): @@ -583,11 +616,13 @@ def get_value(key): value = r.get(key) if value is None: - # Try disk fallback value = read_from_disk(key) - if value is None: - value = "Key not found" - else: + 
if value is None: + value = read_from_s3(key) + if value is None: + value = "Key not found" + elif isinstance(value, bytes): + # Redis returns raw bytes — decompress if gzip. try: if value.startswith(b"\x1f\x8b"): value = gzip.decompress(value).decode()