vercel
diff --git a/.github/scripts/aggregate-benchmarks.js b/.github/scripts/aggregate-benchmarks.js
Lines changed: 17 additions & 3 deletions
diff --git a/.github/scripts/aggregate-e2e-results.js b/.github/scripts/aggregate-e2e-results.js
Lines changed: 76 additions & 3 deletions
diff --git a/.github/workflows/benchmarks.yml b/.github/workflows/benchmarks.yml
Lines changed: 22 additions & 2 deletions
diff --git a/.github/workflows/tests.yml b/.github/workflows/tests.yml
Lines changed: 37 additions & 3 deletions
@@ -176,6 +176,7 @@ function collectBenchmarkData(resultFiles) {
             // Get workflow timing if available
             let workflowTimeMs = null;
             let firstByteTimeMs = null;
+            let slurpTimeMs = null;
             let lastRunId = null;
             let observabilityUrl = null;
             if (timings?.summary?.[benchName]) {
@@ -184,6 +185,10 @@ function collectBenchmarkData(resultFiles) {
               if (timings.summary[benchName].avgFirstByteTimeMs !== undefined) {
                 firstByteTimeMs = timings.summary[benchName].avgFirstByteTimeMs;
               }
+              // Get slurp time for stream benchmarks (time from first byte to completion)
+              if (timings.summary[benchName].avgSlurpTimeMs !== undefined) {
+                slurpTimeMs = timings.summary[benchName].avgSlurpTimeMs;
+              }
             }
             // Get the last runId for observability link (Vercel only)
             if (timings?.timings?.[benchName]?.length > 0) {
@@ -209,6 +214,7 @@ function collectBenchmarkData(resultFiles) {
               max: bench.max,
               samples: bench.sampleCount,
               firstByteTime: firstByteTimeMs,
+              slurpTime: slurpTimeMs,
               runId: lastRunId,
               observabilityUrl: observabilityUrl,
             };
@@ -329,10 +335,10 @@ function renderBenchmarkTable(
   // Render table - different columns for stream vs regular benchmarks
   if (isStream) {
     console.log(
-      '| World | Framework | Workflow Time | TTFB | Wall Time | Overhead | Samples | vs Fastest |'
+      '| World | Framework | Workflow Time | TTFB | Slurp | Wall Time | Overhead | Samples | vs Fastest |'
     );
     console.log(
-      '|:------|:----------|--------------:|-----:|----------:|---------:|--------:|-----------:|'
+      '|:------|:----------|--------------:|-----:|------:|----------:|---------:|--------:|-----------:|'
     );
   } else {
     console.log(
@@ -391,6 +397,11 @@ function renderBenchmarkTable(
       baseline?.firstByteTime
     );
 
+    // Format slurp time with delta for stream benchmarks (time from first byte to completion)
+    const slurpSec =
+      metrics.slurpTime !== null ? formatSec(metrics.slurpTime) : '-';
+    const slurpDelta = formatDelta(metrics.slurpTime, baseline?.slurpTime);
+
     // Format samples count
     const samplesCount = metrics.samples ?? '-';
 
@@ -401,7 +412,7 @@ function renderBenchmarkTable(
 
     if (isStream) {
       console.log(
-        `| ${worldInfo.emoji} ${worldInfo.label} | ${medal}${frameworkInfo.label} | ${workflowTimeSec}s${workflowDelta} | ${firstByteSec}s${ttfbDelta} | ${wallTimeSec}s${wallDelta} | ${overheadSec}s | ${samplesCount} | ${factor} |`
+        `| ${worldInfo.emoji} ${worldInfo.label} | ${medal}${frameworkInfo.label} | ${workflowTimeSec}s${workflowDelta} | ${firstByteSec}s${ttfbDelta} | ${slurpSec}s${slurpDelta} | ${wallTimeSec}s${wallDelta} | ${overheadSec}s | ${samplesCount} | ${factor} |`
       );
     } else {
       console.log(
@@ -680,6 +691,9 @@ function renderComparison(data, baselineData) {
   console.log(
     '- **TTFB**: Time to First Byte - time from workflow start until first stream byte received (stream benchmarks only)'
   );
+  console.log(
+    '- **Slurp**: Time from first byte to complete stream consumption (stream benchmarks only)'
+  );
   console.log(
     '- **Wall Time**: Total testbench time (trigger workflow + poll for result)'
   );
 
@@ -36,6 +36,7 @@ function findResultFiles(dir) {
         files.push(...findResultFiles(fullPath));
       } else if (
         entry.name.startsWith('e2e-') &&
+        !entry.name.startsWith('e2e-metadata-') &&
         entry.name.endsWith('.json')
       ) {
         files.push(fullPath);
@@ -47,6 +48,67 @@ function findResultFiles(dir) {
   return files;
 }
 
+/**
+ * Recursively collect the paths of all e2e metadata JSON files under `dir`.
+ *
+ * A file qualifies when its name starts with `e2e-metadata-` and ends with
+ * `.json`. Subdirectories are searched through a recursive call, and every
+ * returned path is `dir` joined with the entry names leading to the file.
+ *
+ * @param {string} dir - Directory to search.
+ * @returns {string[]} Paths of the matching files; whatever was collected
+ *   before a read error (possibly nothing) when `dir` cannot be listed.
+ */
+function findMetadataFiles(dir) {
+  const files = [];
+  try {
+    const entries = fs.readdirSync(dir, { withFileTypes: true });
+    for (const entry of entries) {
+      const fullPath = path.join(dir, entry.name);
+      if (entry.isDirectory()) {
+        files.push(...findMetadataFiles(fullPath));
+      } else if (
+        entry.name.startsWith('e2e-metadata-') &&
+        entry.name.endsWith('.json')
+      ) {
+        files.push(fullPath);
+      }
+    }
+  } catch (e) {
+    // Best effort: the directory doesn't exist or can't be read, so the error is ignored
+  }
+  return files;
+}
+
+/**
+ * Load e2e metadata files found under `dir` into a Map keyed by app name.
+ *
+ * Each file returned by `findMetadataFiles(dir)` is read as UTF-8 and parsed
+ * as JSON. The parsed object is stored only when the file's basename matches
+ * `e2e-metadata-{app}-vercel` and the object has a truthy `vercel` property.
+ * If several files yield the same app name, the one processed last wins.
+ *
+ * @param {string} dir - Root directory to search for metadata files.
+ * @returns {Map<string, object>} Parsed metadata objects keyed by app name;
+ *   empty when no file qualifies.
+ */
+function loadMetadata(dir) {
+  const metadata = new Map(); // app -> { runIds, vercel }
+  const metadataFiles = findMetadataFiles(dir);
+
+  for (const file of metadataFiles) {
+    try {
+      const content = JSON.parse(fs.readFileSync(file, 'utf-8'));
+      // Extract app name from filename: e2e-metadata-{app}-vercel.json (the capture group is the app name)
+      const basename = path.basename(file, '.json');
+      const match = basename.match(/^e2e-metadata-(.+)-vercel$/);
+      if (match && content.vercel) {
+        const appName = match[1];
+        metadata.set(appName, content);
+      }
+    } catch (e) {
+      // Skip invalid metadata files: a read or JSON parse error drops only this file
+    }
+  }
+
+  return metadata;
+}
+
+/**
+ * Build the Vercel observability URL for one test's workflow run.
+ *
+ * Returns `null` when any required piece is missing: no metadata entry for
+ * `appName`, no `vercel` object on that entry, an empty `teamSlug` or
+ * `projectSlug`, or no `runIds` element whose `testName` strictly equals
+ * `testName`.
+ *
+ * @param {Map<string, object>} metadata - Metadata keyed by app name; only
+ *   `.get(appName)` is used here.
+ * @param {string} appName - Key to look up in `metadata`.
+ * @param {string} testName - Test name compared against `runIds[].testName`.
+ * @returns {string|null} URL of the run, or `null` when it cannot be built.
+ */
+function getObservabilityUrl(metadata, appName, testName) {
+  const appMetadata = metadata.get(appName);
+  if (!appMetadata || !appMetadata.vercel) return null;
+
+  const { vercel, runIds } = appMetadata;
+  if (!vercel.teamSlug || !vercel.projectSlug) return null;
+
+  // Find the runId for this test: first entry with an exactly matching testName (runIds may be absent)
+  const runInfo = runIds?.find((r) => r.testName === testName);
+  if (!runInfo) return null;
+
+  const env = vercel.environment === 'production' ? 'production' : 'preview';
+  return `https://vercel.com/${vercel.teamSlug}/${vercel.projectSlug}/observability/workflows/runs/${runInfo.runId}?environment=${env}`;
+}
+
 // Parse vitest JSON output
 function parseVitestResults(file) {
   try {
@@ -291,7 +353,7 @@ const categoryOrder = [
 ];
 
 // Render aggregated PR comment summary
-function renderAggregatedSummary(categories, overallSummary) {
+function renderAggregatedSummary(categories, overallSummary, metadata) {
   const total =
     overallSummary.totalPassed +
     overallSummary.totalFailed +
@@ -371,7 +433,17 @@ function renderAggregatedSummary(categories, overallSummary) {
         for (const test of tests) {
           // Extract just the test name without "e2e " prefix if present
           const testName = test.name.replace(/^e2e\s+/, '');
-          console.log(`- \`${testName}\``);
+          // Add observability link for vercel-prod tests
+          if (catName === 'vercel-prod') {
+            const obsUrl = getObservabilityUrl(metadata, appName, test.name);
+            if (obsUrl) {
+              console.log(`- \`${testName}\` ([🔍 observability](${obsUrl}))`);
+            } else {
+              console.log(`- \`${testName}\``);
+            }
+          } else {
+            console.log(`- \`${testName}\``);
+          }
         }
         console.log('');
       }
@@ -425,7 +497,8 @@ if (resultFiles.length === 0) {
 
 if (mode === 'aggregate') {
   const { categories, overallSummary } = aggregateByCategory(resultFiles);
-  renderAggregatedSummary(categories, overallSummary);
+  const metadata = loadMetadata(resultsDir);
+  renderAggregatedSummary(categories, overallSummary, metadata);
 
   // Exit with non-zero if any tests failed
   if (overallSummary.totalFailed > 0) {
 
@@ -495,12 +495,19 @@ jobs:
           echo "vercel=$VERCEL_STATUS" >> $GITHUB_OUTPUT
           echo "community=$COMMUNITY_STATUS" >> $GITHUB_OUTPUT
 
-          if [[ "$LOCAL_STATUS" == "failure" || "$POSTGRES_STATUS" == "failure" || "$VERCEL_STATUS" == "failure" || "$COMMUNITY_STATUS" == "failure" ]]; then
+          # Community world failures are warnings, not errors
+          if [[ "$LOCAL_STATUS" == "failure" || "$POSTGRES_STATUS" == "failure" || "$VERCEL_STATUS" == "failure" ]]; then
             echo "has_failures=true" >> $GITHUB_OUTPUT
           else
             echo "has_failures=false" >> $GITHUB_OUTPUT
           fi
 
+          if [[ "$COMMUNITY_STATUS" == "failure" ]]; then
+            echo "has_warnings=true" >> $GITHUB_OUTPUT
+          else
+            echo "has_warnings=false" >> $GITHUB_OUTPUT
+          fi
+
       - name: Update PR comment with results
         if: github.event_name == 'pull_request'
         uses: marocchino/sticky-pull-request-comment@v2
@@ -517,10 +524,23 @@ jobs:
           message: |
 
             ---
-            ⚠️ **Some benchmark jobs failed:**
+            ❌ **Some benchmark jobs failed:**
             - Local: ${{ needs.benchmark-local.result }}
             - Postgres: ${{ needs.benchmark-postgres.result }}
             - Vercel: ${{ needs.benchmark-vercel.result }}
+
+            Check the [workflow run](${{ github.server_url }}/${{ github.repository }}/actions/runs/${{ github.run_id }}) for details.
+
+      - name: Append community warning to PR comment
+        if: github.event_name == 'pull_request' && steps.check-status.outputs.has_warnings == 'true'
+        uses: marocchino/sticky-pull-request-comment@v2
+        with:
+          header: benchmark-results
+          append: true
+          message: |
+
+            ---
+            ⚠️ **Community world benchmarks failed** (non-blocking):
             - Community Worlds: ${{ needs.benchmark-community.result }}
 
             Check the [workflow run](${{ github.server_url }}/${{ github.repository }}/actions/runs/${{ github.run_id }}) for details.
 
@@ -181,26 +181,37 @@ jobs:
         app:
           - name: "example"
             project-id: "prj_xWq20Dd860HHAfzMjK2Mb6TPVxMa"
+            project-slug: "example-workflow"
           - name: "nextjs-turbopack"
             project-id: "prj_yjkM7UdHliv8bfxZ1sMJQf1pMpdi"
+            project-slug: "example-nextjs-workflow-turbopack"
           - name: "nextjs-webpack"
             project-id: "prj_avRPBF3eWjh6iDNQgmhH4VOg27h0"
+            project-slug: "example-nextjs-workflow-webpack"
           - name: "nitro"
             project-id: "prj_e7DZirYdLrQKXNrlxg7KmA6ABx8r"
+            project-slug: "workbench-nitro-workflow"
           - name: "vite"
             project-id: "prj_uLIcNZNDmETulAvj5h0IcDHi5432"
+            project-slug: "workbench-vite-workflow"
           - name: "nuxt"
             project-id: "prj_oTgiz3SGX2fpZuM6E0P38Ts8de6d"
+            project-slug: "workbench-nuxt-workflow"
           - name: "sveltekit"
             project-id: "prj_MqnBLm71ceXGSnm3Fs8i8gBnI23G"
+            project-slug: "workbench-sveltekit-workflow"
           - name: "hono"
             project-id: "prj_p0GIEsfl53L7IwVbosPvi9rPSOYW"
+            project-slug: "workbench-hono-workflow"
           - name: "express"
             project-id: "prj_cCZjpBy92VRbKHHbarDMhOHtkuIr"
+            project-slug: "workbench-express-workflow"
           - name: "fastify"
             project-id: "prj_5Yap0VDQ633v998iqQ3L3aQ25Cck"
+            project-slug: "workbench-fastify-workflow"
           - name: "astro"
             project-id: "prj_YDAXj3K8LM0hgejuIMhioz2yLgTI"
+            project-slug: "workbench-astro-workflow"
     env:
       TURBO_TOKEN: ${{ secrets.TURBO_TOKEN }}
       TURBO_TEAM: ${{ vars.TURBO_TEAM }}
@@ -236,6 +247,7 @@ jobs:
           WORKFLOW_VERCEL_AUTH_TOKEN: ${{ secrets.VERCEL_LABS_TOKEN }}
           WORKFLOW_VERCEL_TEAM: "team_nO2mCG4W8IxPIeKoSsqwAxxB"
           WORKFLOW_VERCEL_PROJECT: ${{ matrix.app.project-id }}
+          WORKFLOW_VERCEL_PROJECT_SLUG: ${{ matrix.app.project-slug }}
 
       - name: Generate E2E summary
         if: always()
@@ -246,7 +258,9 @@ jobs:
         uses: actions/upload-artifact@v4
         with:
           name: e2e-results-vercel-prod-${{ matrix.app.name }}
-          path: e2e-vercel-prod-${{ matrix.app.name }}.json
+          path: |
+            e2e-vercel-prod-${{ matrix.app.name }}.json
+            e2e-metadata-${{ matrix.app.name }}-vercel.json
           retention-days: 7
           if-no-files-found: ignore
 
@@ -621,12 +635,19 @@ jobs:
           echo "windows=$WINDOWS_STATUS" >> $GITHUB_OUTPUT
           echo "community=$COMMUNITY_STATUS" >> $GITHUB_OUTPUT
 
-          if [[ "$VERCEL_STATUS" == "failure" || "$LOCAL_DEV_STATUS" == "failure" || "$LOCAL_PROD_STATUS" == "failure" || "$POSTGRES_STATUS" == "failure" || "$WINDOWS_STATUS" == "failure" || "$COMMUNITY_STATUS" == "failure" ]]; then
+          # Community world failures are warnings, not errors
+          if [[ "$VERCEL_STATUS" == "failure" || "$LOCAL_DEV_STATUS" == "failure" || "$LOCAL_PROD_STATUS" == "failure" || "$POSTGRES_STATUS" == "failure" || "$WINDOWS_STATUS" == "failure" ]]; then
             echo "has_failures=true" >> $GITHUB_OUTPUT
           else
             echo "has_failures=false" >> $GITHUB_OUTPUT
           fi
 
+          if [[ "$COMMUNITY_STATUS" == "failure" ]]; then
+            echo "has_warnings=true" >> $GITHUB_OUTPUT
+          else
+            echo "has_warnings=false" >> $GITHUB_OUTPUT
+          fi
+
       - name: Update PR comment with results
         if: github.event_name == 'pull_request'
         uses: marocchino/sticky-pull-request-comment@v2
@@ -643,12 +664,25 @@ jobs:
           message: |
 
             ---
-            ⚠️ **Some E2E test jobs failed:**
+            ❌ **Some E2E test jobs failed:**
             - Vercel Prod: ${{ needs.e2e-vercel-prod.result }}
             - Local Dev: ${{ needs.e2e-local-dev.result }}
             - Local Prod: ${{ needs.e2e-local-prod.result }}
             - Local Postgres: ${{ needs.e2e-local-postgres.result }}
             - Windows: ${{ needs.e2e-windows.result }}
+
+            Check the [workflow run](${{ github.server_url }}/${{ github.repository }}/actions/runs/${{ github.run_id }}) for details.
+
+      - name: Append community warning to PR comment
+        if: github.event_name == 'pull_request' && steps.check-status.outputs.has_warnings == 'true'
+        uses: marocchino/sticky-pull-request-comment@v2
+        with:
+          header: e2e-test-results
+          append: true
+          message: |
+
+            ---
+            ⚠️ **Community world tests failed** (non-blocking):
             - Community Worlds: ${{ needs.e2e-community.result }}
 
             Check the [workflow run](${{ github.server_url }}/${{ github.repository }}/actions/runs/${{ github.run_id }}) for details.