Skip to content

Instantly share code, notes, and snippets.

@Tomcat-42
Created May 4, 2024 13:12
Show Gist options
  • Save Tomcat-42/78b5929cafbbf9fac0617bfee8f90bf5 to your computer and use it in GitHub Desktop.
Save Tomcat-42/78b5929cafbbf9fac0617bfee8f90bf5 to your computer and use it in GitHub Desktop.
#!/usr/bin/env python
"""This script performs Welch's t-test on a JSON export file with two
benchmark results to test whether or not the two distributions are
the same."""
import argparse
import json
import sys
from scipy import stats
# Significance level below which the two benchmarks are reported as different.
SIGNIFICANCE_THRESHOLD = 0.05


def build_report(results, threshold=SIGNIFICANCE_THRESHOLD):
    """Return the textual Welch's t-test report for two benchmark results.

    Args:
        results: Sequence of exactly two mappings, each providing a
            "command" entry (printed as-is) and a "times" entry (the sample
            handed to the t-test; presumably per-run timings -- confirm
            against the tool that produced the export).
        threshold: p-value below which the benchmarks are reported as
            different.

    Returns:
        The multi-line report as a single string without a trailing newline.

    Raises:
        ValueError: If ``results`` does not contain exactly two entries.
        KeyError: If an entry lacks "command" or "times".
    """
    # Unpacking enforces the "exactly two" contract for direct callers.
    first, second = results

    # equal_var=False selects Welch's t-test, which does not assume that both
    # samples share the same variance.
    t, p = stats.ttest_ind(first["times"], second["times"], equal_var=False)

    # NOTE(review): if scipy yields a NaN p-value (e.g. degenerate samples),
    # ``p < threshold`` is False and the "almost the same" verdict is printed.
    if p < threshold:
        verdict = "There is a difference between the two benchmarks (p < {}).".format(
            threshold
        )
    else:
        verdict = "The two benchmarks are almost the same (p >= {}).".format(
            threshold
        )

    lines = [
        "Command 1: {}".format(first["command"]),
        "Command 2: {}".format(second["command"]),
        "",
        "t = {:.3}, p = {:.3}".format(t, p),
        "",
        verdict,
    ]
    return "\n".join(lines)


def main(argv=None):
    """Parse the command line, load the JSON export and print the report.

    Args:
        argv: Argument list to parse; ``None`` makes argparse use
            ``sys.argv[1:]``.

    Exits with status 1 when the file does not contain exactly two
    benchmarks.
    """
    parser = argparse.ArgumentParser(description=__doc__)
    parser.add_argument("file", help="JSON file with two benchmark results")
    args = parser.parse_args(argv)

    # JSON text is UTF-8; do not depend on the platform's locale encoding.
    with open(args.file, encoding="utf-8") as f:
        results = json.load(f)["results"]

    if len(results) != 2:
        # Diagnostics belong on stderr so stdout only ever carries the report.
        print(
            "The input file has to contain exactly two benchmarks",
            file=sys.stderr,
        )
        sys.exit(1)

    print(build_report(results))


if __name__ == "__main__":
    main()
Sign up for free to join this conversation on GitHub. Already have an account? Sign in to comment