mirror of
https://github.com/pytorch/pytorch.git
synced 2025-10-24 15:44:58 +08:00
Summary: This is basically a reborn version of https://github.com/pytorch/pytorch/issues/45254 . Ref: https://github.com/pytorch/pytorch/issues/42919 Pull Request resolved: https://github.com/pytorch/pytorch/pull/48077 Reviewed By: ngimel Differential Revision: D25687042 Pulled By: bugra fbshipit-source-id: 05f20a6f3c5212f73d0b1505b493b720e6cf74e5
82 lines
2.5 KiB
Python
82 lines
2.5 KiB
Python
#!/usr/bin/env python3
|
|
#
|
|
# Computes difference between measurements produced by ./benchmark.py.
|
|
#
|
|
|
|
import argparse
|
|
import json
|
|
|
|
import numpy as np
|
|
|
|
|
|
def load(path):
|
|
with open(path, 'r') as f:
|
|
return json.load(f)
|
|
|
|
|
|
def main():
|
|
parser = argparse.ArgumentParser(description='PyTorch distributed benchmark diff')
|
|
parser.add_argument("file", nargs=2)
|
|
args = parser.parse_args()
|
|
|
|
if len(args.file) != 2:
|
|
raise RuntimeError("Must specify 2 files to diff")
|
|
|
|
ja = load(args.file[0])
|
|
jb = load(args.file[1])
|
|
|
|
keys = (set(ja.keys()) | set(jb.keys())) - set(["benchmark_results"])
|
|
print("{:20s} {:>20s} {:>20s}".format("", "baseline", "test"))
|
|
print("{:20s} {:>20s} {:>20s}".format("", "-" * 20, "-" * 20))
|
|
for key in sorted(keys):
|
|
va = str(ja.get(key, "-"))
|
|
vb = str(jb.get(key, "-"))
|
|
print("{:20s} {:>20s} vs {:>20s}".format(key + ":", va, vb))
|
|
print("")
|
|
|
|
ba = ja["benchmark_results"]
|
|
bb = jb["benchmark_results"]
|
|
for ra, rb in zip(ba, bb):
|
|
if ra["model"] != rb["model"]:
|
|
continue
|
|
if ra["batch_size"] != rb["batch_size"]:
|
|
continue
|
|
|
|
model = ra["model"]
|
|
batch_size = int(ra["batch_size"])
|
|
name = "{} with batch size {}".format(model, batch_size)
|
|
print("Benchmark: {}".format(name))
|
|
|
|
# Print header
|
|
print("")
|
|
print("{:>10s}".format(""), end='') # noqa: E999
|
|
for _ in [75, 95]:
|
|
print("{:>16s}{:>10s}{:>10s}".format("sec/iter", "ex/sec", "diff"), end='') # noqa: E999
|
|
print("")
|
|
|
|
# Print measurements
|
|
for (i, (xa, xb)) in enumerate(zip(ra["result"], rb["result"])):
|
|
# Ignore round without ddp
|
|
if i == 0:
|
|
continue
|
|
# Sanity check: ignore if number of ranks is not equal
|
|
if len(xa["ranks"]) != len(xb["ranks"]):
|
|
continue
|
|
|
|
ngpus = len(xa["ranks"])
|
|
ma = sorted(xa["measurements"])
|
|
mb = sorted(xb["measurements"])
|
|
print("{:>4d} GPUs:".format(ngpus), end='') # noqa: E999
|
|
for p in [75, 95]:
|
|
va = np.percentile(ma, p)
|
|
vb = np.percentile(mb, p)
|
|
# We're measuring time, so lower is better (hence the negation)
|
|
delta = -100 * ((vb - va) / va)
|
|
print(" p{:02d}: {:8.3f}s {:7d}/s {:+8.1f}%".format(p, vb, int(batch_size / vb), delta), end='') # noqa: E999
|
|
print("")
|
|
print("")
|
|
|
|
|
|
if __name__ == '__main__':
|
|
main()
|