vercel
diff --git a/.github/scripts/aggregate-benchmarks.js b/.github/scripts/aggregate-benchmarks.js
Lines changed: 70 additions & 10 deletions
diff --git a/.github/scripts/aggregate-e2e-results.js b/.github/scripts/aggregate-e2e-results.js
Lines changed: 58 additions & 31 deletions
@@ -7,11 +7,15 @@ const path = require('path');
 const args = process.argv.slice(2);
 let resultsDir = '.';
 let baselineDir = null;
+let runUrl = '';
 
 for (let i = 0; i < args.length; i++) {
   if (args[i] === '--baseline' && args[i + 1]) {
     baselineDir = args[i + 1];
     i++;
+  } else if (args[i] === '--run-url' && args[i + 1]) {
+    runUrl = args[i + 1];
+    i++;
   } else if (!args[i].startsWith('--')) {
     resultsDir = args[i];
   }
@@ -127,6 +131,16 @@ function loadTimingData(benchmarkFile) {
   return null;
 }
 
+// Build the Vercel observability URL for a workflow run; returns null when vercelMetadata, runId, teamSlug, or projectSlug is missing
+function getObservabilityUrl(vercelMetadata, runId) {
+  if (!vercelMetadata || !runId) return null;
+  const { teamSlug, projectSlug, environment } = vercelMetadata;
+  if (!teamSlug || !projectSlug) return null;
+  // Only an explicit 'production' environment is kept; any other (or missing) value falls back to 'preview'
+  const env = environment === 'production' ? 'production' : 'preview';
+  return `https://vercel.com/${teamSlug}/${projectSlug}/observability/workflows/runs/${runId}?environment=${env}`;
+}
+
 // Collect all benchmark data
 function collectBenchmarkData(resultFiles) {
   // Structure: { [benchmarkName]: { [app]: { [backend]: { wallTime, workflowTime, overhead, min, max, samples, firstByteTime } } } }
@@ -162,13 +176,29 @@ function collectBenchmarkData(resultFiles) {
             // Get workflow timing if available
             let workflowTimeMs = null;
             let firstByteTimeMs = null;
+            let lastRunId = null;
+            let observabilityUrl = null;
             if (timings?.summary?.[benchName]) {
               workflowTimeMs = timings.summary[benchName].avgExecutionTimeMs;
               // Get TTFB for stream benchmarks
               if (timings.summary[benchName].avgFirstByteTimeMs !== undefined) {
                 firstByteTimeMs = timings.summary[benchName].avgFirstByteTimeMs;
               }
             }
+            // Get the last runId for observability link (Vercel only)
+            if (timings?.timings?.[benchName]?.length > 0) {
+              const lastTiming =
+                timings.timings[benchName][
+                  timings.timings[benchName].length - 1
+                ];
+              lastRunId = lastTiming?.runId;
+              if (timings?.vercel && lastRunId) {
+                observabilityUrl = getObservabilityUrl(
+                  timings.vercel,
+                  lastRunId
+                );
+              }
+            }
 
             data[benchName][app][backend] = {
               wallTime: bench.mean,
@@ -179,6 +209,8 @@ function collectBenchmarkData(resultFiles) {
               max: bench.max,
               samples: bench.sampleCount,
               firstByteTime: firstByteTimeMs,
+              runId: lastRunId,
+              observabilityUrl: observabilityUrl,
             };
           }
         }
@@ -378,6 +410,18 @@ function renderBenchmarkTable(
     }
   }
   console.log('');
+
+  // Collect and render observability links for Vercel world
+  const observabilityLinks = dataPoints
+    .filter((dp) => dp.metrics?.observabilityUrl && dp.backend === 'vercel')
+    .map((dp) => {
+      const frameworkInfo = frameworkConfig[dp.app] || { label: dp.app };
+      return `[${frameworkInfo.label}](${dp.metrics.observabilityUrl})`;
+    });
+
+  if (observabilityLinks.length > 0) {
+    console.log(`_🔍 Observability: ${observabilityLinks.join(' | ')}_\n`);
+  }
 }
 
 // Render the comparison tables
@@ -419,7 +463,8 @@ function renderComparison(data, baselineData) {
   const renderBenchmarkWithEnvironments = (benchName, benchData, isStream) => {
     const baselineBenchData = baselineData?.[benchName] || null;
 
-    console.log(`## ${benchName}\n`);
+    console.log(`<details>`);
+    console.log(`<summary><strong>${benchName}</strong></summary>\n`);
 
     // Render Local Development table
     if (localDevBackends.length > 0) {
@@ -448,6 +493,8 @@ function renderComparison(data, baselineData) {
         { showHeading: false }
       );
     }
+
+    console.log('</details>\n');
   };
 
   // Render regular benchmarks
@@ -457,15 +504,16 @@ function renderComparison(data, baselineData) {
 
   // Render stream benchmarks in a separate section
   if (streamBenchmarks.length > 0) {
-    console.log('---\n');
-    console.log('## Stream Benchmarks\n');
+    console.log('<details>');
     console.log(
-      '_Stream benchmarks include Time to First Byte (TTFB) metrics._\n'
+      '<summary><strong>Stream Benchmarks</strong> <em>(includes TTFB metrics)</em></summary>\n'
     );
 
     for (const [benchName, benchData] of streamBenchmarks) {
       renderBenchmarkWithEnvironments(benchName, benchData, true);
     }
+
+    console.log('</details>\n');
   }
 
   // Summary: Count wins per framework (within each world) and per world (within each framework)
@@ -541,8 +589,11 @@ function renderComparison(data, baselineData) {
   }
 
   // Summary: Best framework per world (by wins)
-  console.log('---\n');
-  console.log('## Summary: Fastest Framework by World\n');
+  console.log('### Summary\n');
+  console.log('<details>');
+  console.log(
+    '<summary><strong>Fastest Framework by World</strong></summary>\n'
+  );
   console.log(`_Winner determined by most benchmark wins_\n`);
   console.log('| World | 🥇 Fastest Framework | Wins |');
   console.log('|:------|:---------------------|-----:|');
@@ -579,10 +630,13 @@ function renderComparison(data, baselineData) {
       );
     }
   }
-  console.log('');
+  console.log('\n</details>\n');
 
   // Summary: Best world per framework (by wins)
-  console.log('## Summary: Fastest World by Framework\n');
+  console.log('<details>');
+  console.log(
+    '<summary><strong>Fastest World by Framework</strong></summary>\n'
+  );
   console.log(`_Winner determined by most benchmark wins_\n`);
   console.log('| Framework | 🥇 Fastest World | Wins |');
   console.log('|:----------|:-----------------|-----:|');
@@ -615,11 +669,11 @@ function renderComparison(data, baselineData) {
       );
     }
   }
-  console.log('');
+  console.log('\n</details>\n');
 
   // Legend
   console.log('<details>');
-  console.log('<summary>Column Definitions</summary>\n');
+  console.log('<summary><strong>Column Definitions</strong></summary>\n');
   console.log(
     '- **Workflow Time**: Runtime reported by workflow (completedAt - createdAt) - *primary metric*'
   );
@@ -646,6 +700,12 @@ function renderComparison(data, baselineData) {
     }
   }
   console.log('</details>');
+
+  // Add link to workflow run
+  if (runUrl) {
+    console.log('\n---');
+    console.log(`📋 [View full workflow run](${runUrl})`);
+  }
 }
 
 // Main
 
@@ -8,6 +8,7 @@ const args = process.argv.slice(2);
 let resultsDir = '.';
 let jobName = 'E2E Tests';
 let mode = 'single'; // 'single' for step summary, 'aggregate' for PR comment
+let runUrl = '';
 
 for (let i = 0; i < args.length; i++) {
   if (args[i] === '--job-name' && args[i + 1]) {
@@ -16,6 +17,9 @@ for (let i = 0; i < args.length; i++) {
   } else if (args[i] === '--mode' && args[i + 1]) {
     mode = args[i + 1];
     i++;
+  } else if (args[i] === '--run-url' && args[i + 1]) {
+    runUrl = args[i + 1];
+    i++;
   } else if (!args[i].startsWith('--')) {
     resultsDir = args[i];
   }
@@ -106,6 +110,7 @@ function parseJobInfo(filename) {
           'sveltekit',
           'hono',
           'express',
+          'fastify',
           'astro',
           'example',
           'turso',
@@ -211,14 +216,9 @@ function aggregateByCategory(files) {
 function renderSingleJobSummary(summary) {
   const total =
     summary.totalPassed + summary.totalFailed + summary.totalSkipped;
-  const statusEmoji =
-    summary.totalFailed > 0 ? '❌' : summary.totalSkipped > 0 ? '⚠️' : '✅';
+  const statusEmoji = summary.totalFailed > 0 ? '❌' : '✅';
   const statusText =
-    summary.totalFailed > 0
-      ? 'Some tests failed'
-      : summary.totalSkipped > 0
-        ? 'All tests passed (some skipped)'
-        : 'All tests passed';
+    summary.totalFailed > 0 ? 'Some tests failed' : 'All tests passed';
 
   console.log(`## ${statusEmoji} ${jobName}\n`);
   console.log(`**Status:** ${statusText}\n`);
@@ -259,8 +259,7 @@ function renderSingleJobSummary(summary) {
     console.log('| File | Passed | Failed | Skipped |');
     console.log('|:-----|-------:|-------:|--------:|');
     for (const result of summary.fileResults) {
-      const fileStatus =
-        result.failed > 0 ? '❌' : result.skipped > 0 ? '⚠️' : '✅';
+      const fileStatus = result.failed > 0 ? '❌' : '✅';
       console.log(
         `| ${fileStatus} ${result.file} | ${result.passed} | ${result.failed} | ${result.skipped} |`
       );
@@ -297,18 +296,9 @@ function renderAggregatedSummary(categories, overallSummary) {
     overallSummary.totalPassed +
     overallSummary.totalFailed +
     overallSummary.totalSkipped;
-  const statusEmoji =
-    overallSummary.totalFailed > 0
-      ? '❌'
-      : overallSummary.totalSkipped > 0
-        ? '⚠️'
-        : '✅';
+  const statusEmoji = overallSummary.totalFailed > 0 ? '❌' : '✅';
   const statusText =
-    overallSummary.totalFailed > 0
-      ? 'Some tests failed'
-      : overallSummary.totalSkipped > 0
-        ? 'All tests passed (some skipped)'
-        : 'All tests passed';
+    overallSummary.totalFailed > 0 ? 'Some tests failed' : 'All tests passed';
 
   console.log('<!-- e2e-test-results -->');
   console.log(`## 🧪 E2E Test Results\n`);
@@ -328,7 +318,7 @@ function renderAggregatedSummary(categories, overallSummary) {
 
   for (const [catName, cat] of sortedCategories) {
     const catTotal = cat.passed + cat.failed + cat.skipped;
-    const catStatus = cat.failed > 0 ? '❌' : cat.skipped > 0 ? '⚠️' : '✅';
+    const catStatus = cat.failed > 0 ? '❌' : '✅';
     const displayName = categoryNames[catName] || catName;
     console.log(
       `| ${catStatus} ${displayName} | ${cat.passed} | ${cat.failed} | ${cat.skipped} | ${catTotal} |`
@@ -340,21 +330,52 @@ function renderAggregatedSummary(categories, overallSummary) {
   );
   console.log('');
 
-  // Failed tests section
+  // Failed tests section - grouped by category and app
   if (overallSummary.allFailedTests.length > 0) {
     console.log('### ❌ Failed Tests\n');
+
+    // Group failed tests by category, then by app
+    const failedByCategory = new Map();
     for (const test of overallSummary.allFailedTests) {
-      const catDisplay = categoryNames[test.category] || test.category;
+      if (!failedByCategory.has(test.category)) {
+        failedByCategory.set(test.category, new Map());
+      }
+      const catMap = failedByCategory.get(test.category);
+      if (!catMap.has(test.app)) {
+        catMap.set(test.app, []);
+      }
+      catMap.get(test.app).push(test);
+    }
+
+    // Sort categories by defined order
+    const sortedFailedCategories = Array.from(failedByCategory.entries()).sort(
+      ([a], [b]) =>
+        (categoryOrder.indexOf(a) === -1 ? 999 : categoryOrder.indexOf(a)) -
+        (categoryOrder.indexOf(b) === -1 ? 999 : categoryOrder.indexOf(b))
+    );
+
+    for (const [catName, appsMap] of sortedFailedCategories) {
+      const catDisplay = categoryNames[catName] || catName;
+      const catFailedCount = Array.from(appsMap.values()).reduce(
+        (sum, tests) => sum + tests.length,
+        0
+      );
+
       console.log(`<details>`);
       console.log(
-        `<summary>${test.app} (${catDisplay}): ${test.name}</summary>\n`
+        `<summary>${catDisplay} (${catFailedCount} failed)</summary>\n`
       );
-      console.log(`**File:** \`${test.file}\`\n`);
-      if (test.message) {
-        console.log('```');
-        console.log(test.message);
-        console.log('```');
+
+      for (const [appName, tests] of appsMap.entries()) {
+        console.log(`**${appName}** (${tests.length} failed):\n`);
+        for (const test of tests) {
+          // Extract just the test name without "e2e " prefix if present
+          const testName = test.name.replace(/^e2e\s+/, '');
+          console.log(`- \`${testName}\``);
+        }
+        console.log('');
       }
+
       console.log('</details>\n');
     }
   }
@@ -363,21 +384,27 @@ function renderAggregatedSummary(categories, overallSummary) {
   console.log('### Details by Category\n');
 
   for (const [catName, cat] of sortedCategories) {
-    const catStatus = cat.failed > 0 ? '❌' : cat.skipped > 0 ? '⚠️' : '✅';
+    const catStatus = cat.failed > 0 ? '❌' : '✅';
     const displayName = categoryNames[catName] || catName;
 
     console.log(`<details>`);
     console.log(`<summary>${catStatus} ${displayName}</summary>\n`);
     console.log('| App | Passed | Failed | Skipped |');
     console.log('|:----|-------:|-------:|--------:|');
     for (const app of cat.apps) {
-      const appStatus = app.failed > 0 ? '❌' : app.skipped > 0 ? '⚠️' : '✅';
+      const appStatus = app.failed > 0 ? '❌' : '✅';
       console.log(
         `| ${appStatus} ${app.name} | ${app.passed} | ${app.failed} | ${app.skipped} |`
       );
     }
     console.log('</details>\n');
   }
+
+  // Add link to workflow run
+  if (runUrl) {
+    console.log('---');
+    console.log(`📋 [View full workflow run](${runUrl})`);
+  }
 }
 
 // Main