Refactor custom benchmark report script to improve HTML generation and structure

This commit is contained in:
Palash Tyagi 2025-05-07 00:08:39 +01:00
parent 34809656f6
commit 498f822672

View File

@ -25,7 +25,17 @@ ESTIMATES_PATH_BASE = Path("base") / "estimates.json"
REPORT_HTML_RELATIVE_PATH = Path("report") / "index.html" REPORT_HTML_RELATIVE_PATH = Path("report") / "index.html"
def load_criterion_reports(criterion_root_dir: Path) -> Dict[str, Dict[str, Dict[str, Any]]]: def get_default_criterion_report_path() -> Path:
"""
Returns the default path for the Criterion benchmark report.
This is typically 'target/criterion'.
"""
return Path("target") / "criterion" / "report" / "index.html"
def load_criterion_reports(
criterion_root_dir: Path,
) -> Dict[str, Dict[str, Dict[str, Any]]]:
""" """
Loads Criterion benchmark results from a specified directory and finds HTML paths. Loads Criterion benchmark results from a specified directory and finds HTML paths.
@ -50,58 +60,51 @@ def load_criterion_reports(criterion_root_dir: Path) -> Dict[str, Dict[str, Dict
print(f"Scanning for benchmark reports in: {criterion_root_dir}") print(f"Scanning for benchmark reports in: {criterion_root_dir}")
for item in criterion_root_dir.iterdir(): for item in criterion_root_dir.iterdir():
# We are only interested in directories matching the pattern
if not item.is_dir(): if not item.is_dir():
continue continue
match = DIR_PATTERN.match(item.name) match = DIR_PATTERN.match(item.name)
if not match: if not match:
# print(f"Skipping directory (name doesn't match pattern): {item.name}")
continue continue
test_name = match.group(1).strip() test_name = match.group(1).strip()
size = match.group(2).strip() size = match.group(2).strip()
benchmark_dir_name = item.name # Store the original directory name benchmark_dir_name = item.name
benchmark_dir_path = item # The Path object to the benchmark dir benchmark_dir_path = item
json_path: Optional[Path] = None json_path: Optional[Path] = None
# Look for the estimates JSON file (prefer 'new', fallback to 'base')
if (benchmark_dir_path / ESTIMATES_PATH_NEW).is_file(): if (benchmark_dir_path / ESTIMATES_PATH_NEW).is_file():
json_path = benchmark_dir_path / ESTIMATES_PATH_NEW json_path = benchmark_dir_path / ESTIMATES_PATH_NEW
elif (benchmark_dir_path / ESTIMATES_PATH_BASE).is_file(): elif (benchmark_dir_path / ESTIMATES_PATH_BASE).is_file():
json_path = benchmark_dir_path / ESTIMATES_PATH_BASE json_path = benchmark_dir_path / ESTIMATES_PATH_BASE
# The HTML report is at a fixed location relative to the benchmark directory
html_path = benchmark_dir_path / REPORT_HTML_RELATIVE_PATH html_path = benchmark_dir_path / REPORT_HTML_RELATIVE_PATH
if json_path is None or not json_path.is_file(): if json_path is None or not json_path.is_file():
print( print(
f"Warning: Could not find estimates JSON in {benchmark_dir_path}. Skipping benchmark size '{test_name} ({size})'.", f"Warning: Could not find estimates JSON in {benchmark_dir_path}. Skipping benchmark size '{test_name} ({size})'.",
file=sys.stderr, file=sys.stderr,
) )
continue # Skip if no JSON data continue
if not html_path.is_file(): if not html_path.is_file():
print( print(
f"Warning: Could not find HTML report at expected location {html_path}. Skipping benchmark size '{test_name} ({size})'.", f"Warning: Could not find HTML report at expected location {html_path}. Skipping benchmark size '{test_name} ({size})'.",
file=sys.stderr, file=sys.stderr,
) )
continue # Skip if no HTML report continue
# Try loading the JSON data
try: try:
with json_path.open("r", encoding="utf-8") as f: with json_path.open("r", encoding="utf-8") as f:
json_data = json.load(f) json_data = json.load(f)
# Store both the JSON data and the relative path to the HTML report
results[test_name][size] = { results[test_name][size] = {
'json': json_data, "json": json_data,
# The path from the criterion root to the specific benchmark's report/index.html "html_path_relative_to_criterion_root": str(
'html_path_relative_to_criterion_root': str(Path(benchmark_dir_name) / REPORT_HTML_RELATIVE_PATH).replace('\\', '/') # Ensure forward slashes Path(benchmark_dir_name) / REPORT_HTML_RELATIVE_PATH
).replace("\\", "/"),
} }
# print(f" Loaded: {test_name} ({size}) from {json_path}, html: {html_path}")
except json.JSONDecodeError: except json.JSONDecodeError:
print(f"Error: Failed to decode JSON from {json_path}", file=sys.stderr) print(f"Error: Failed to decode JSON from {json_path}", file=sys.stderr)
except IOError as e: except IOError as e:
@ -112,7 +115,6 @@ def load_criterion_reports(criterion_root_dir: Path) -> Dict[str, Dict[str, Dict
file=sys.stderr, file=sys.stderr,
) )
# Convert defaultdict back to regular dict for cleaner output (optional)
return dict(results) return dict(results)
@ -130,118 +132,215 @@ def format_nanoseconds(ns: float) -> str:
return f"{ns / 1_000_000_000:.2f} s" return f"{ns / 1_000_000_000:.2f} s"
def generate_html_table_with_links(results: Dict[str, Dict[str, Dict[str, Any]]], html_base_path: str) -> str: def generate_html_table_with_links(
results: Dict[str, Dict[str, Dict[str, Any]]], html_base_path: str
) -> str:
""" """
Generates an HTML table from benchmark results, with cells linking to reports. Generates a full HTML page with a styled table from benchmark results.
Args:
results: The nested dictionary loaded by load_criterion_reports,
including 'json' data and 'html_path_relative_to_criterion_root'.
html_base_path: The base URL path where the 'target/criterion' directory
is hosted on the static site, relative to the output HTML file.
e.g., '../target/criterion/'
Returns:
A string containing the full HTML table.
""" """
css_styles = """
<style>
body {
font-family: -apple-system, BlinkMacSystemFont, "Segoe UI", Roboto, Helvetica, Arial, sans-serif, "Apple Color Emoji", "Segoe UI Emoji", "Segoe UI Symbol";
line-height: 1.6;
margin: 0;
padding: 20px;
background-color: #f4f7f6;
color: #333;
}
.container {
max-width: 1200px;
margin: 20px auto;
padding: 20px;
background-color: #fff;
box-shadow: 0 0 15px rgba(0,0,0,0.1);
border-radius: 8px;
}
h1 {
color: #2c3e50;
text-align: center;
margin-bottom: 10px;
}
p.subtitle {
text-align: center;
margin-bottom: 8px;
color: #555;
font-size: 0.95em;
}
p.note {
text-align: center;
margin-bottom: 25px;
color: #777;
font-size: 0.85em;
}
.benchmark-table {
width: 100%;
border-collapse: collapse;
margin-top: 25px;
box-shadow: 0 2px 8px rgba(0,0,0,0.05);
}
.benchmark-table th, .benchmark-table td {
border: 1px solid #dfe6e9; /* Lighter border */
padding: 12px 15px;
}
.benchmark-table th {
background-color: #3498db; /* Primary blue */
color: #ffffff;
font-weight: 600; /* Slightly bolder */
text-transform: uppercase;
letter-spacing: 0.05em;
text-align: center; /* Center align headers */
}
.benchmark-table td {
text-align: right; /* Default for data cells (times) */
}
.benchmark-table td:first-child { /* Benchmark Name column */
font-weight: 500;
color: #2d3436;
text-align: left; /* Left align benchmark names */
}
.benchmark-table tbody tr:nth-child(even) {
background-color: #f8f9fa; /* Very light grey for even rows */
}
.benchmark-table tbody tr:hover {
background-color: #e9ecef; /* Slightly darker on hover */
}
.benchmark-table a {
color: #2980b9; /* Link blue */
text-decoration: none;
font-weight: 500;
}
.benchmark-table a:hover {
text-decoration: underline;
color: #1c5a81; /* Darker blue on hover */
}
.no-results {
text-align: center;
font-size: 1.2em;
color: #7f8c8d;
margin-top: 30px;
}
</style>
"""
html_doc_start = f"""<!DOCTYPE html>
<html lang="en">
<head>
<meta charset="UTF-8">
<meta name="viewport" content="width=device-width, initial-scale=1.0">
<title>Criterion Benchmark Results</title>
{css_styles}
</head>
<body>
<div class="container">
<h1 id="criterion-benchmark-results">Criterion Benchmark Results</h1>
"""
html_doc_end = """
</div>
</body>
</html>"""
if not results: if not results:
return "<p>No benchmark results found or loaded.</p>" return f"""{html_doc_start}
<p class="no-results">No benchmark results found or loaded.</p>
{html_doc_end}"""
# Get all unique sizes (columns) and test names (rows) all_sizes = sorted(
# Using ordered dictionaries to maintain insertion order from loading, then sorting keys list(set(size for test_data in results.values() for size in test_data.keys()))
# Or simply sort the keys after extraction: )
all_sizes = sorted(list(set(size for test_data in results.values() for size in test_data.keys())))
all_test_names = sorted(list(results.keys())) all_test_names = sorted(list(results.keys()))
html_string = """ table_content = """
<meta charset="utf-8"> <p class="subtitle">Each cell links to the detailed Criterion.rs report for that specific benchmark size.</p>
<h1 id="criterion-benchmark-results">Criterion Benchmark Results</h1> <p class="note">Note: Values shown are the midpoint of the mean confidence interval, formatted for readability.</p>
<p>Each cell links to the detailed Criterion report for that specific benchmark size.</p> <p class="note"><a href="report/index.html">[Switch to the standard Criterion.rs report]</a></p>
<p>Note: Values shown are the midpoint of the mean confidence interval, formatted for readability.</p> <table class="benchmark-table">
<table class="table table-striped" border="1" justify="center">
<thead> <thead>
<tr> <tr>
<th>Benchmark Name</th> <th>Benchmark Name</th>
""" """
# Add size headers
for size in all_sizes: for size in all_sizes:
html_string += f"<th>{html.escape(size)}</th>\n" table_content += f"<th>{html.escape(size)}</th>\n"
html_string += """ table_content += """
</tr> </tr>
</thead> </thead>
<tbody> <tbody>
""" """
# Add data rows
for test_name in all_test_names: for test_name in all_test_names:
html_string += f"<tr>\n" table_content += f"<tr>\n"
html_string += f" <td>{html.escape(test_name)}</td>\n" table_content += f" <td>{html.escape(test_name)}</td>\n"
# Iterate through all possible sizes to ensure columns align
for size in all_sizes: for size in all_sizes:
cell_data = results.get(test_name, {}).get(size) cell_data = results.get(test_name, {}).get(size)
mean_value = pd.NA # Default value mean_value = pd.NA
full_report_url = "#" # Default link to self or dummy full_report_url = "#"
if cell_data and 'json' in cell_data and 'html_path_relative_to_criterion_root' in cell_data: if (
cell_data
and "json" in cell_data
and "html_path_relative_to_criterion_root" in cell_data
):
try: try:
# Extract mean from JSON mean_data = cell_data["json"].get("mean")
mean_data = cell_data['json'].get("mean")
if mean_data and "confidence_interval" in mean_data: if mean_data and "confidence_interval" in mean_data:
ci = mean_data["confidence_interval"] ci = mean_data["confidence_interval"]
if "lower_bound" in ci and "upper_bound" in ci: if "lower_bound" in ci and "upper_bound" in ci:
lower, upper = ci["lower_bound"], ci["upper_bound"] lower, upper = ci["lower_bound"], ci["upper_bound"]
if isinstance(lower, (int, float)) and isinstance(upper, (int, float)): if isinstance(lower, (int, float)) and isinstance(
upper, (int, float)
):
mean_value = (lower + upper) / 2.0 mean_value = (lower + upper) / 2.0
else: else:
print(f"Warning: Non-numeric bounds for {test_name} ({size}).", file=sys.stderr) print(
f"Warning: Non-numeric bounds for {test_name} ({size}).",
file=sys.stderr,
)
else: else:
print(f"Warning: Missing confidence_interval bounds for {test_name} ({size}).", file=sys.stderr) print(
f"Warning: Missing confidence_interval bounds for {test_name} ({size}).",
file=sys.stderr,
)
else: else:
print(f"Warning: Missing 'mean' data for {test_name} ({size}).", file=sys.stderr) print(
f"Warning: Missing 'mean' data for {test_name} ({size}).",
# Construct the full relative URL file=sys.stderr,
relative_report_path = cell_data['html_path_relative_to_criterion_root'] )
full_report_url = f"{html_base_path}{relative_report_path}"
# Ensure forward slashes and resolve potential double slashes if html_base_path ends in /
full_report_url = str(Path(full_report_url)).replace('\\', '/')
relative_report_path = cell_data[
"html_path_relative_to_criterion_root"
]
joined_path = Path(html_base_path) / relative_report_path
full_report_url = str(joined_path).replace("\\", "/")
except Exception as e: except Exception as e:
print(f"Error processing cell data for {test_name} ({size}): {e}", file=sys.stderr) print(
# Keep mean_value as NA and URL as '#' f"Error processing cell data for {test_name} ({size}): {e}",
file=sys.stderr,
)
# Format the mean value for display
formatted_mean = format_nanoseconds(mean_value) formatted_mean = format_nanoseconds(mean_value)
# Create the link cell
# Only make it a link if a valid report path was found
if full_report_url and full_report_url != "#": if full_report_url and full_report_url != "#":
html_string += f' <td><a href="{html.escape(full_report_url)}">{html.escape(formatted_mean)}</a></td>\n' table_content += f' <td><a href="{html.escape(full_report_url)}">{html.escape(formatted_mean)}</a></td>\n'
else: else:
# Display value without a link if no report path table_content += f" <td>{html.escape(formatted_mean)}</td>\n"
html_string += f' <td>{html.escape(formatted_mean)}</td>\n' table_content += "</tr>\n"
table_content += """
html_string += f"</tr>\n"
html_string += """
</tbody> </tbody>
</table> </table>
""" """
return f"{html_doc_start}{table_content}{html_doc_end}"
return html_string
if __name__ == "__main__": if __name__ == "__main__":
DEFAULT_CRITERION_PATH = "target/criterion" DEFAULT_CRITERION_PATH = "target/criterion"
# Default relative path from benchmark_results.html to the criterion root on the hosted site DEFAULT_OUTPUT_FILE = "./target/criterion/index.html"
# Assumes benchmark_results.html is in .../doc/<branch-slug>/benchmarks/ DEFAULT_HTML_BASE_PATH = ""
# And target/criterion is copied to .../doc/<branch-slug>/target/criterion/
# So the path from benchmarks/ to target/criterion/ is ../target/criterion/
DEFAULT_HTML_BASE_PATH = "../target/criterion/"
parser = argparse.ArgumentParser( parser = argparse.ArgumentParser(
description="Load Criterion benchmark results from JSON files and generate an HTML table with links to reports." description="Load Criterion benchmark results from JSON files and generate an HTML table with links to reports."
@ -250,51 +349,65 @@ if __name__ == "__main__":
"--criterion-dir", "--criterion-dir",
type=str, type=str,
default=DEFAULT_CRITERION_PATH, default=DEFAULT_CRITERION_PATH,
help=f"Path to the main 'target/criterion' directory (default: {DEFAULT_CRITERION_PATH}) on the runner.", help=f"Path to the main 'target/criterion' directory (default: {DEFAULT_CRITERION_PATH}) containing benchmark data.",
) )
parser.add_argument( parser.add_argument(
"--html-base-path", "--html-base-path",
type=str, type=str,
default=DEFAULT_HTML_BASE_PATH, default=DEFAULT_HTML_BASE_PATH,
help=f"Relative URL path from the output HTML file to the hosted 'target/criterion' directory (default: {DEFAULT_HTML_BASE_PATH}).", help=(
f"Prefix for HTML links to individual benchmark reports. "
f"This is prepended to each report's relative path (e.g., 'benchmark_name/report/index.html'). "
f"If the main output HTML (default: '{DEFAULT_OUTPUT_FILE}') is in the 'target/criterion/' directory, "
f"this should typically be empty (default: '{DEFAULT_HTML_BASE_PATH}'). "
),
) )
parser.add_argument( parser.add_argument(
"--output-file", "--output-file",
type=str, type=str,
default="benchmark_results.html", default=DEFAULT_OUTPUT_FILE,
help="Name of the output HTML file (default: benchmark_results.html)." help=f"Path to save the generated HTML summary report (default: {DEFAULT_OUTPUT_FILE}).",
) )
args = parser.parse_args() args = parser.parse_args()
criterion_path = Path(args.criterion_dir) criterion_path = Path(args.criterion_dir)
output_file_path = Path(args.output_file)
try:
output_file_path.parent.mkdir(parents=True, exist_ok=True)
except OSError as e:
print(
f"Error: Could not create output directory {output_file_path.parent}: {e}",
file=sys.stderr,
)
sys.exit(1)
all_results = load_criterion_reports(criterion_path) all_results = load_criterion_reports(criterion_path)
# Generate HTML output regardless of whether results were found (handles "no results" page)
html_output = generate_html_table_with_links(all_results, args.html_base_path)
if not all_results: if not all_results:
print("\nNo benchmark results found or loaded.") print("\nNo benchmark results found or loaded.")
# Still create an empty file or a file with an error message # Fallthrough to write the "no results" page generated by generate_html_table_with_links
try: else:
with open(args.output_file, "w", encoding="utf-8") as f:
f.write("<h1>Criterion Benchmark Results</h1><p>No benchmark results found or loaded.</p>")
print(f"Created empty/error HTML file: {args.output_file}")
except IOError as e:
print(f"Error creating empty/error HTML file {args.output_file}: {e}", file=sys.stderr)
sys.exit(1) # Indicate failure if no data was loaded successfully
print("\nSuccessfully loaded benchmark results.") print("\nSuccessfully loaded benchmark results.")
# pprint(all_results) # Uncomment for debugging # pprint(all_results) # Uncomment for debugging
print(f"Generating HTML table with links using base path: {args.html_base_path}") print(
html_output = generate_html_table_with_links(all_results, args.html_base_path) f"Generating HTML report with links using HTML base path: '{args.html_base_path}'"
)
try: try:
with open(args.output_file, "w", encoding="utf-8") as f: with output_file_path.open("w", encoding="utf-8") as f:
f.write(html_output) f.write(html_output)
print(f"\nSuccessfully wrote HTML table to {args.output_file}") print(f"\nSuccessfully wrote HTML report to {output_file_path}")
sys.exit(0) # Exit successfully if not all_results:
sys.exit(1) # Exit with error code if no results, though file is created
sys.exit(0)
except IOError as e: except IOError as e:
print(f"Error writing HTML output to {args.output_file}: {e}", file=sys.stderr) print(f"Error writing HTML output to {output_file_path}: {e}", file=sys.stderr)
sys.exit(1) sys.exit(1)
except Exception as e: except Exception as e:
print(f"An unexpected error occurred while writing HTML: {e}", file=sys.stderr) print(f"An unexpected error occurred while writing HTML: {e}", file=sys.stderr)