pytorch/benchmarks/dynamo/check_graph_breaks.py
Will Constable 218eeacacd Check dynamo graph-breaks in CI (#96346)
- add graph-breaks baselines
- add check_graph_breaks script (message users on regress or improvement)
- hook up test.sh for existing accuracy job

Refactor graph-break CI check

Take steps toward merging checker with existing check flow,
consider merging it all the way inside the bench runner.

csvs
Pull Request resolved: https://github.com/pytorch/pytorch/pull/96346
Approved by: https://github.com/ezyang
2023-03-14 03:39:36 +00:00

84 lines
2.3 KiB
Python

import argparse
import sys
import textwrap
import pandas as pd
def get_field(csv, model_name: str, field: str, typ=float):
    """Return one cell of a benchmark results table, converted with ``typ``.

    Args:
        csv: Table indexed with ``.loc`` that has a ``"name"`` column
            (``main`` passes the result of ``pd.read_csv``).
        model_name: Value to look up in the ``"name"`` column.
        field: Name of the column whose value is returned.
        typ: Callable applied to the scalar cell value (defaults to ``float``).

    Returns:
        ``typ(value)`` for the single row whose ``"name"`` equals ``model_name``.

    Raises:
        KeyError: No row has ``name == model_name``.
        ValueError: More than one row has ``name == model_name``.
    """
    matches = csv.loc[csv["name"] == model_name, field]
    if len(matches) == 0:
        raise KeyError(f"model {model_name!r} not found in 'name' column")
    if len(matches) > 1:
        raise ValueError(
            f"model {model_name!r} appears {len(matches)} times in 'name' column"
        )
    # Convert the scalar, not the one-element Series: calling int()/float() on
    # a Series is deprecated in recent pandas and fails opaquely when empty.
    return typ(matches.iloc[0])
def check_graph_breaks(actual_csv, expected_csv, expected_filename):
    """Compare per-model graph-break counts against a baseline table.

    Every model in ``actual_csv["name"]`` is classified and one status record
    is printed per model:

    * ``PASS``     - same number of graph breaks as the baseline
    * ``FAIL``     - more graph breaks than the baseline
    * ``IMPROVED`` - fewer graph breaks than the baseline
    * ``MISSING``  - the model has no row in the baseline at all

    Args:
        actual_csv: Table with ``"name"`` and ``"graph_breaks"`` columns
            holding the measured results.
        expected_csv: Table with the same columns holding the baseline.
        expected_filename: Baseline file name; only interpolated into the
            message telling the user which file to update.

    Returns:
        A ``(needs_attention, msg)`` tuple. ``needs_attention`` is a list that
        is non-empty (truthy) when any model failed, improved, or has no
        baseline, and empty otherwise. ``msg`` is the human-readable summary,
        or ``""`` when everything passed.
    """
    failed = []
    improved = []
    missing = []

    # Checked up front so that a model absent from the baseline is reported
    # with the others instead of aborting the whole check inside get_field.
    baseline_names = set(expected_csv["name"])

    for model in actual_csv["name"]:
        graph_breaks = get_field(actual_csv, model, "graph_breaks", typ=int)

        if model not in baseline_names:
            expected_graph_breaks = None
            status = "MISSING"
            missing.append(model)
        else:
            expected_graph_breaks = get_field(
                expected_csv, model, "graph_breaks", typ=int
            )
            if graph_breaks == expected_graph_breaks:
                status = "PASS"
            elif graph_breaks > expected_graph_breaks:
                status = "FAIL"
                failed.append(model)
            else:
                status = "IMPROVED"
                improved.append(model)

        print(
            f"\n{model:34}:\n"
            f"graph_breaks={graph_breaks},\n"
            f"expected_graph_breaks={expected_graph_breaks},\n"
            f"{status}\n"
        )

    msg = ""
    if failed or improved or missing:
        if failed:
            msg += textwrap.dedent(
                f"""
                Error: {len(failed)} models have new dynamo graph breaks:
                {' '.join(failed)}
                """
            )
        if improved:
            msg += textwrap.dedent(
                f"""
                Improvement: {len(improved)} models have fixed dynamo graph breaks:
                {' '.join(improved)}
                """
            )
        if missing:
            msg += textwrap.dedent(
                f"""
                Missing: {len(missing)} models have no expected graph breaks baseline:
                {' '.join(missing)}
                """
            )
        msg += textwrap.dedent(
            f"""
            If this change is expected, you can update `{expected_filename}` to reflect the new baseline.
            This can either be done manually, or by downloading artifacts from your PR CI job.
            (Search artifacts files for test-reports-test-inductor_torchbench, _timm, _huggingface)
            """
        )
    # Any non-empty category must yield a truthy first element so the caller
    # exits non-zero; the concrete list returned is the first non-empty one.
    return failed or improved or missing, msg
def main():
    """Command-line entry point.

    Reads the CSV files given by the required ``--actual`` and ``--expected``
    options, runs ``check_graph_breaks`` on them, and when that reports a
    truthy first result prints the returned message and exits with status 1.
    """
    arg_parser = argparse.ArgumentParser()
    for flag in ("--actual", "--expected"):
        arg_parser.add_argument(flag, type=str, required=True)
    options = arg_parser.parse_args()

    actual_table = pd.read_csv(options.actual)
    expected_table = pd.read_csv(options.expected)

    needs_attention, report = check_graph_breaks(
        actual_table, expected_table, options.expected
    )
    if not needs_attention:
        return

    print(report)
    sys.exit(1)


# Run the check only when executed as a script, not when imported.
if __name__ == "__main__":
    main()