fix: rewrite parser with correct sitespeed.io v39 JSON paths

Most metric paths were wrong (the LCP, visualMetrics and long-task paths were
already correct). They are now corrected based on the browsertimeAggregator.js
and axeAggregator.js sources:

- pageTimings (page load, front-end/back-end time, DOM timings) live at
  statistics.pageTimings.*, not statistics.timings.pageTimings.*
- FCP is statistics.paintTiming['first-contentful-paint'].median
- CLS is statistics.pageinfo.cumulativeLayoutShift.median
- TBT, max potential FID and the long-task count/duration are under
  statistics.cpu.longTasks.*
- Axe data is in axe.pageSummary.json (violations.*.median), not
  in the browsertime file under accessibility.summary.*
- sustainable pageSummary has co2PerPageView.median, co2FirstParty.median and
  co2ThirdParty.median (there is no totalCO2 at the per-URL level, so co2_total
  reuses co2PerPageView)

Co-Authored-By: Claude Sonnet 4.6 <noreply@anthropic.com>
This commit is contained in:
2026-04-07 10:23:48 +02:00
parent ea70d34d7f
commit 500f69efcc

185
parser.js
View File

@@ -2,12 +2,11 @@ import { readdir, readFile } from 'fs/promises';
import { join } from 'path';
/**
* Walk the outputFolder looking for the pageSummary JSON files
* produced by sitespeed.io. The structure is:
* outputFolder/pages/<hostname>/<urlpath>/<plugin>.pageSummary.json
* Recursively find all *.pageSummary.json files under outputFolder.
* sitespeed.io v39 writes them into:
* pages/<hostname>/<urlpath>/data/<plugin>.pageSummary.json
*/
async function findPageSummaries(outputFolder) {
const pagesDir = join(outputFolder, 'pages');
const summaries = {};
async function walk(dir) {
@@ -29,7 +28,7 @@ async function findPageSummaries(outputFolder) {
}
}
await walk(pagesDir);
await walk(outputFolder);
return summaries;
}
@@ -38,6 +37,7 @@ async function readJson(filePath) {
return JSON.parse(raw);
}
// Safe deep-get: safe(obj, 'a', 'b', 'c') === obj?.a?.b?.c
function safe(obj, ...path) {
let cur = obj;
for (const key of path) {
@@ -47,8 +47,9 @@ function safe(obj, ...path) {
return cur ?? null;
}
function median(obj) {
return safe(obj, 'median') ?? safe(obj, 'mean') ?? null;
// Read the `median` field of an aggregated stats object
// ({ median, min, max, ... }) through the safe() deep-get helper.
// Returns exactly what safe(obj, 'median') returns.
function med(obj) {
  const medianValue = safe(obj, 'median');
  return medianValue;
}
export async function parseResults(outputFolder, _url) {
@@ -56,119 +57,121 @@ export async function parseResults(outputFolder, _url) {
const metrics = {};
// ─── browsertime.pageSummary ───────────────────────────────────────────────
// All aggregated values live under `statistics.*`
// Key layout (from browsertimeAggregator.js):
// statistics.timings.largestContentfulPaint — LCP renderTime
// statistics.timings.fullyLoaded
// statistics.pageTimings.* — pageLoadTime, backEndTime, etc.
// statistics.paintTiming.* — 'first-contentful-paint', etc.
// statistics.pageinfo.cumulativeLayoutShift — CLS
// statistics.visualMetrics.* — SpeedIndex, FirstVisualChange, etc.
// statistics.cpu.longTasks.* — totalBlockingTime, tasks, etc.
const btFiles = summaries['browsertime'] || [];
if (btFiles.length > 0) {
const bt = await readJson(btFiles[0]);
const stats = safe(bt, 'statistics');
const timings = safe(stats, 'timings');
const pageTimings = safe(timings, 'pageTimings');
const userTimings = safe(timings, 'userTimings');
const visualMetrics = safe(stats, 'visualMetrics');
const cpu = safe(stats, 'cpu');
const axe = safe(bt, 'accessibility', 'summary');
const s = safe(bt, 'statistics');
// Core Web Vitals / timings
if (timings) {
metrics.ttfb = median(safe(timings, 'timeToFirstByte'));
metrics.fcp = median(safe(timings, 'firstContentfulPaint'));
metrics.lcp = median(safe(timings, 'largestContentfulPaint'));
metrics.cls = median(safe(timings, 'cumulativeLayoutShift'));
metrics.tbt = median(safe(timings, 'totalBlockingTime'));
metrics.max_potential_fid = median(safe(timings, 'maxPotentialFID'));
}
if (s) {
// Core Web Vitals
metrics.lcp = med(safe(s, 'timings', 'largestContentfulPaint'));
metrics.fcp = med(safe(s, 'paintTiming', 'first-contentful-paint'));
metrics.cls = med(safe(s, 'pageinfo', 'cumulativeLayoutShift'));
metrics.tbt = med(safe(s, 'cpu', 'longTasks', 'totalBlockingTime'));
metrics.ttfb = med(safe(s, 'pageTimings', 'backEndTime'));
metrics.max_potential_fid = med(safe(s, 'cpu', 'longTasks', 'maxPotentialFid'));
if (pageTimings) {
metrics.page_load_time = median(safe(pageTimings, 'pageLoadTime'));
metrics.fully_loaded = median(safe(pageTimings, 'fullyLoaded'));
metrics.dom_content_loaded = median(safe(pageTimings, 'domContentLoadedEventEnd'));
metrics.dom_interactive = median(safe(pageTimings, 'domInteractive'));
metrics.front_end_time = median(safe(pageTimings, 'frontEndTime'));
metrics.back_end_time = median(safe(pageTimings, 'backEndTime'));
metrics.time_to_first_byte = median(safe(pageTimings, 'timeToFirstByte'))
?? metrics.ttfb;
}
// Navigation timings (pageTimings keys come from browsertime's pageTimings object)
metrics.page_load_time = med(safe(s, 'pageTimings', 'pageLoadTime'));
metrics.fully_loaded = med(safe(s, 'timings', 'fullyLoaded'));
metrics.dom_content_loaded = med(safe(s, 'pageTimings', 'domContentLoadedTime'));
metrics.dom_interactive = med(safe(s, 'pageTimings', 'domInteractiveTime'));
metrics.front_end_time = med(safe(s, 'pageTimings', 'frontEndTime'));
metrics.back_end_time = med(safe(s, 'pageTimings', 'backEndTime'));
metrics.time_to_first_byte = metrics.ttfb;
if (visualMetrics) {
metrics.speed_index = median(safe(visualMetrics, 'SpeedIndex'));
metrics.first_visual_change = median(safe(visualMetrics, 'FirstVisualChange'));
metrics.last_visual_change = median(safe(visualMetrics, 'LastVisualChange'));
metrics.visual_complete_85 = median(safe(visualMetrics, 'VisualComplete85'));
metrics.perceptual_speed_index = median(safe(visualMetrics, 'PerceptualSpeedIndex'));
}
// Visual metrics (from sitespeed-scroll-server / ffmpeg video analysis)
metrics.speed_index = med(safe(s, 'visualMetrics', 'SpeedIndex'));
metrics.first_visual_change = med(safe(s, 'visualMetrics', 'FirstVisualChange'));
metrics.last_visual_change = med(safe(s, 'visualMetrics', 'LastVisualChange'));
metrics.visual_complete_85 = med(safe(s, 'visualMetrics', 'VisualComplete85'));
metrics.perceptual_speed_index = med(safe(s, 'visualMetrics', 'PerceptualSpeedIndex'));
// CPU / Long Tasks
if (cpu) {
metrics.long_tasks_count = median(safe(cpu, 'longTasks', 'tasks'));
metrics.long_tasks_duration = median(safe(cpu, 'longTasks', 'totalDuration'));
}
// Axe accessibility
if (axe) {
metrics.axe_critical = safe(axe, 'critical') ?? 0;
metrics.axe_serious = safe(axe, 'serious') ?? 0;
metrics.axe_moderate = safe(axe, 'moderate') ?? 0;
metrics.axe_minor = safe(axe, 'minor') ?? 0;
metrics.long_tasks_count = med(safe(s, 'cpu', 'longTasks', 'tasks'));
metrics.long_tasks_duration = med(safe(s, 'cpu', 'longTasks', 'totalDuration'));
}
}
// ─── coach.pageSummary ─────────────────────────────────────────────────────
// ─── axe.pageSummary ─────────────────────────────────────────────────────
// Produced by AxeAggregator.summarizeStats():
// { violations: { critical: {median,…}, serious, moderate, minor }, … }
const axeFiles = summaries['axe'] || [];
if (axeFiles.length > 0) {
const axe = await readJson(axeFiles[0]);
metrics.axe_critical = med(safe(axe, 'violations', 'critical')) ?? 0;
metrics.axe_serious = med(safe(axe, 'violations', 'serious')) ?? 0;
metrics.axe_moderate = med(safe(axe, 'violations', 'moderate')) ?? 0;
metrics.axe_minor = med(safe(axe, 'violations', 'minor')) ?? 0;
}
// ─── coach.pageSummary ────────────────────────────────────────────────────
// Coach sends the median-run's full coach result: { advice: { score, performance, … } }
const coachFiles = summaries['coach'] || [];
if (coachFiles.length > 0) {
const coach = await readJson(coachFiles[0]);
const advice = safe(coach, 'advice');
if (advice) {
metrics.score_overall = safe(advice, 'score') ?? safe(advice, 'overall', 'score');
metrics.score_performance = safe(advice, 'performance', 'score');
metrics.score_accessibility = safe(advice, 'accessibility', 'score');
metrics.score_bestpractice = safe(advice, 'bestpractice', 'score');
metrics.score_privacy = safe(advice, 'privacy', 'score');
}
metrics.score_overall = safe(coach, 'advice', 'score');
metrics.score_performance = safe(coach, 'advice', 'performance', 'score');
metrics.score_accessibility = safe(coach, 'advice', 'accessibility', 'score');
metrics.score_bestpractice = safe(coach, 'advice', 'bestpractice', 'score');
metrics.score_privacy = safe(coach, 'advice', 'privacy', 'score');
}
// ─── pagexray.pageSummary ─────────────────────────────────────────────────
// ─── pagexray.pageSummary ─────────────────────────────────────────────────
// Sent as pageSummary[0] with `.statistics` added by the aggregator.
// Use statistics.*.median when available; fall back to direct property.
const xrayFiles = summaries['pagexray'] || [];
if (xrayFiles.length > 0) {
const xray = await readJson(xrayFiles[0]);
// pagexray has multiple runs — use the first or median-like object
const page = Array.isArray(xray) ? xray[0] : xray;
const ct = safe(page, 'contentTypes');
const xs = safe(xray, 'statistics');
if (ct) {
metrics.transfer_total = safe(page, 'transferSize');
metrics.requests_total = safe(page, 'requests');
metrics.transfer_html = safe(ct, 'html', 'transferSize');
metrics.transfer_js = safe(ct, 'javascript', 'transferSize');
metrics.transfer_css = safe(ct, 'css', 'transferSize');
metrics.transfer_image = safe(ct, 'image', 'transferSize');
metrics.transfer_font = safe(ct, 'font', 'transferSize');
metrics.requests_js = safe(ct, 'javascript', 'requests');
metrics.requests_css = safe(ct, 'css', 'requests');
metrics.requests_image = safe(ct, 'image', 'requests');
metrics.requests_font = safe(ct, 'font', 'requests');
function xv(statPath, directPath) {
// Try statistics.X.median first, then direct property
const fromStats = med(safe(xs, ...statPath));
if (fromStats !== null) return fromStats;
return safe(xray, ...directPath);
}
const tp = safe(page, 'thirdParty');
if (tp) {
metrics.third_party_requests = safe(tp, 'requests');
metrics.third_party_transfer = safe(tp, 'transferSize');
}
metrics.transfer_total = xv(['transferSize'], ['transferSize']);
metrics.requests_total = xv(['requests'], ['requests']);
metrics.transfer_html = xv(['contentTypes', 'html', 'transferSize'], ['contentTypes', 'html', 'transferSize']);
metrics.transfer_js = xv(['contentTypes', 'javascript', 'transferSize'], ['contentTypes', 'javascript', 'transferSize']);
metrics.transfer_css = xv(['contentTypes', 'css', 'transferSize'], ['contentTypes', 'css', 'transferSize']);
metrics.transfer_image = xv(['contentTypes', 'image', 'transferSize'], ['contentTypes', 'image', 'transferSize']);
metrics.transfer_font = xv(['contentTypes', 'font', 'transferSize'], ['contentTypes', 'font', 'transferSize']);
metrics.requests_js = xv(['contentTypes', 'javascript', 'requests'], ['contentTypes', 'javascript', 'requests']);
metrics.requests_css = xv(['contentTypes', 'css', 'requests'], ['contentTypes', 'css', 'requests']);
metrics.requests_image = xv(['contentTypes', 'image', 'requests'], ['contentTypes', 'image', 'requests']);
metrics.requests_font = xv(['contentTypes', 'font', 'requests'], ['contentTypes', 'font', 'requests']);
metrics.third_party_transfer = xv(['thirdParty', 'transferSize'], ['thirdParty', 'transferSize']);
metrics.third_party_requests = xv(['thirdParty', 'requests'], ['thirdParty', 'requests']);
}
// ─── sustainable.pageSummary ──────────────────────────────────────────────
// ─── sustainable.pageSummary ──────────────────────────────────────────────
// Aggregator stores per-URL stats:
// { co2PerPageView: {median,…}, co2FirstParty: {median,…}, co2ThirdParty: {median,…} }
const sustainFiles = summaries['sustainable'] || [];
if (sustainFiles.length > 0) {
const sust = await readJson(sustainFiles[0]);
metrics.co2_per_page_view = safe(sust, 'co2PerPageView')
?? safe(sust, 'statistics', 'co2PerPageView', 'median');
metrics.co2_total = safe(sust, 'totalCO2')
?? safe(sust, 'statistics', 'totalCO2', 'median');
metrics.co2_first_party = safe(sust, 'firstParty', 'co2')
?? safe(sust, 'statistics', 'firstParty', 'co2', 'median');
metrics.co2_third_party = safe(sust, 'thirdParty', 'co2')
?? safe(sust, 'statistics', 'thirdParty', 'co2', 'median');
metrics.co2_per_page_view = med(safe(sust, 'co2PerPageView'));
metrics.co2_total = med(safe(sust, 'co2PerPageView')); // totalCO2 not in per-URL summary
metrics.co2_first_party = med(safe(sust, 'co2FirstParty'));
metrics.co2_third_party = med(safe(sust, 'co2ThirdParty'));
}
// Remove null values to avoid overwriting real DB values with NULL
// Strip nulls so we don't overwrite good DB values with NULL
return Object.fromEntries(
Object.entries(metrics).filter(([, v]) => v !== null && v !== undefined)
);