Files
greptimedb/.github/scripts/query-regression-summary.py
discord9 c44f8da646 feat: add query regression perf harness (#8406)
* feat: add query regression perf harness

Signed-off-by: discord9 <discord9@163.com>

* feat: extend query regression cases

Signed-off-by: discord9 <discord9@163.com>

* ci: harden query regression workflows

Signed-off-by: discord9 <discord9@163.com>

* fix: address query regression review comments

Signed-off-by: discord9 <discord9@163.com>

* ci: limit query regression PR triggers

Signed-off-by: discord9 <discord9@163.com>

* ci: run full query regression case set

Signed-off-by: discord9 <discord9@163.com>

* refactor: model query regression scenarios

Signed-off-by: discord9 <discord9@163.com>

* fix: avoid unenforced query regression thresholds

Signed-off-by: discord9 <discord9@163.com>

---------

Signed-off-by: discord9 <discord9@163.com>
2026-07-03 09:09:01 +00:00

225 lines
8.2 KiB
Python

#!/usr/bin/env python3
# Copyright 2023 Greptime Team
#
# Licensed under the Apache License, Version 2.0 (the "License");
# you may not use this file except in compliance with the License.
# You may obtain a copy of the License at
#
# http://www.apache.org/licenses/LICENSE-2.0
#
# Unless required by applicable law or agreed to in writing, software
# distributed under the License is distributed on an "AS IS" BASIS,
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
# See the License for the specific language governing permissions and
# limitations under the License.
"""Format tests/perf query regression JSON reports as GitHub Markdown."""
from __future__ import annotations
import argparse
import json
from pathlib import Path
from typing import Any
def fmt_ms(value: Any) -> str:
if value is None:
return "N/A"
try:
return f"{float(value):.2f}"
except (TypeError, ValueError):
return "N/A"
def esc(value: Any) -> str:
text = "N/A" if value is None else str(value)
return text.replace("|", "\\|").replace("\n", " ")
def status_emoji(status: str | None) -> str:
return {"ok": "", "measured": "", "failed": "", "planned": "📝", "fixture-ready": "🧪"}.get(
status or "", "⚠️"
)
def measurement_map(target: dict[str, Any]) -> dict[str, dict[str, Any]]:
return {m.get("name") or f"query-{i}": m for i, m in enumerate(target.get("measurements", []))}
def regression_pct(base: Any, candidate: Any) -> str:
try:
b = float(base)
c = float(candidate)
except (TypeError, ValueError):
return "N/A"
if b == 0:
return "N/A"
return f"{(c - b) / b * 100:+.1f}%"
def threshold_status(thresholds: list[dict[str, Any]], query: str) -> str:
hits = [t for t in thresholds if t.get("query") == query]
if not hits:
return "N/A"
return ", ".join(f"{t.get('threshold')}: {t.get('status')}" for t in hits)
def target_table(targets: list[dict[str, Any]]) -> str:
rows = ["| Target | Status | Validation errors | Region | Datanode data home |", "| --- | --- | ---: | --- | --- |"]
for target in targets:
errors = len(target.get("validation_errors") or [])
discovered = target.get("discovered") or {}
if isinstance(discovered, list):
region = ", ".join(str(item.get("region_id")) for item in discovered)
else:
region = discovered.get("region_id")
rows.append(
"| {name} | {status} {raw} | {errors} | {region} | `{data}` |".format(
name=esc(target.get("name")),
status=status_emoji(target.get("status")),
raw=esc(target.get("status")),
errors=errors,
region=esc(region),
data=esc(target.get("datanode_data_home") or target.get("data_dir")),
)
)
return "\n".join(rows)
def comparison_table(targets: list[dict[str, Any]], thresholds: list[dict[str, Any]]) -> str:
if len(targets) < 2:
return "No base/candidate measurements found."
base = measurement_map(targets[0])
candidate = measurement_map(targets[1])
names = sorted(set(base) | set(candidate))
rows = [
"| Query | Base median ms | Base p95 ms | Candidate median ms | Candidate p95 ms | Regression | Threshold |",
"| --- | ---: | ---: | ---: | ---: | ---: | --- |",
]
for name in names:
bm = base.get(name, {})
cm = candidate.get(name, {})
rows.append(
"| {q} | {bm} | {bp} | {cm} | {cp} | {reg} | {th} |".format(
q=esc(name),
bm=fmt_ms(bm.get("latency_ms_median")),
bp=fmt_ms(bm.get("latency_ms_p95")),
cm=fmt_ms(cm.get("latency_ms_median")),
cp=fmt_ms(cm.get("latency_ms_p95")),
reg=regression_pct(bm.get("latency_ms_median"), cm.get("latency_ms_median")),
th=esc(threshold_status(thresholds, name)),
)
)
return "\n".join(rows)
def build_markdown(
report: dict[str, Any],
report_path: Path,
run_url: str | None,
case_name: str | None,
base_ref: str | None,
candidate_ref: str | None,
) -> str:
status = report.get("status", "missing")
case = report.get("case") or {}
title_case = case_name or case.get("name") or report_path.name
lines = [f"## {status_emoji(status)} Query regression report: `{esc(title_case)}`", ""]
lines.append(f"- **Status:** `{esc(status)}`")
lines.append(f"- **Case path:** `{esc(report.get('case_path'))}`")
lines.append(f"- **Query mode:** `{esc(report.get('query_mode'))}`")
if base_ref:
lines.append(f"- **Base ref:** `{esc(base_ref)}`")
if candidate_ref:
lines.append(f"- **Candidate ref:** `{esc(candidate_ref)}`")
if run_url:
lines.append(f"- **Workflow run:** {run_url}")
if report.get("error"):
lines.append(f"- **Error:** `{esc(report.get('error'))}`")
lines.append("- **Artifacts:** query-regression-work logs, fixture metadata, and JSON report are uploaded with this run.")
targets = report.get("targets") or []
lines.extend(["", "### Targets", "", target_table(targets)])
lines.extend(["", "### Query comparison", "", comparison_table(targets, report.get("thresholds") or [])])
not_enforced = [t for t in report.get("thresholds") or [] if t.get("status") == "not_enforced"]
if not_enforced:
lines.extend(["", "### Not enforced thresholds", ""])
for item in not_enforced:
lines.append(f"- `{esc(item.get('query'))}` / `{esc(item.get('threshold'))}`: {esc(item.get('reason'))}")
return "\n".join(lines) + "\n"
def build_combined_markdown(
reports: list[tuple[Path, dict[str, Any]]],
run_url: str | None,
case_name: str | None,
base_ref: str | None,
candidate_ref: str | None,
) -> str:
if len(reports) == 1:
path, report = reports[0]
return build_markdown(report, path, run_url, case_name, base_ref, candidate_ref)
overall = "failed" if any(report.get("status") != "ok" for _, report in reports) else "ok"
lines = [f"## {status_emoji(overall)} Query regression report: `{esc(case_name or 'multiple cases')}`", ""]
lines.append(f"- **Status:** `{esc(overall)}`")
if base_ref:
lines.append(f"- **Base ref:** `{esc(base_ref)}`")
if candidate_ref:
lines.append(f"- **Candidate ref:** `{esc(candidate_ref)}`")
if run_url:
lines.append(f"- **Workflow run:** {run_url}")
lines.append("- **Artifacts:** query-regression-work logs, fixture metadata, and JSON reports are uploaded with this run.")
lines.extend(["", "### Cases", "", "| Case | Status | Report |", "| --- | --- | --- |"])
for path, report in reports:
case = report.get("case") or {}
name = case.get("name") or path.parent.name
status = report.get("status", "missing")
lines.append(f"| `{esc(name)}` | {status_emoji(status)} `{esc(status)}` | `{esc(path)}` |")
for path, report in reports:
case = report.get("case") or {}
name = case.get("name") or path.parent.name
lines.extend(["", "---", ""])
lines.append(build_markdown(report, path, None, name, None, None).rstrip())
return "\n".join(lines) + "\n"
def main() -> int:
parser = argparse.ArgumentParser()
parser.add_argument("--report", required=True, type=Path, action="append")
parser.add_argument("--run-url")
parser.add_argument("--case-name")
parser.add_argument("--base-ref")
parser.add_argument("--candidate-ref")
parser.add_argument("--output", type=Path)
args = parser.parse_args()
reports = []
for report_path in args.report:
if report_path.exists():
report = json.loads(report_path.read_text())
else:
report = {"status": "failed", "error": f"report not found: {report_path}", "targets": []}
reports.append((report_path, report))
markdown = build_combined_markdown(
reports,
args.run_url,
args.case_name,
args.base_ref,
args.candidate_ref,
)
if args.output:
args.output.write_text(markdown)
else:
print(markdown, end="")
return 0
if __name__ == "__main__":
raise SystemExit(main())