Files
pytorch/tools/stats/sccache_stats_to_benchmark_format.py
PyTorch MergeBot 99f2491af9 Revert "Use absolute path path.resolve() -> path.absolute() (#129409)"
This reverts commit 45411d1fc9a2b6d2f891b6ab0ae16409719e09fc.

Reverted https://github.com/pytorch/pytorch/pull/129409 on behalf of https://github.com/jeanschmidt due to Breaking internal CI, @albanD please help get this PR merged ([comment](https://github.com/pytorch/pytorch/pull/129409#issuecomment-2571316444))
2025-01-04 14:17:20 +00:00

64 lines
1.8 KiB
Python

import glob
import json
import os
from pathlib import Path
from typing import Any, Dict
REPO_ROOT = Path(__file__).resolve().parent.parent.parent
def flatten_data(d: Dict[str, Any]) -> Dict[str, Any]:
# Flatten the sccache stats data from a possibly nested dictionary to a flat
# dictionary. For example, the input:
# {
# "cache": {
# "hit": 1,
# "miss": 2,
# },
# }
# will be transformed to:
# {
# "cache_hit": 1,
# "cache_miss": 2,
# }
flat_data = {}
for key, value in d.items():
if isinstance(value, dict):
for k, v in flatten_data(value).items():
flat_data[f"{key}_{k}"] = v
else:
flat_data[key] = value
return flat_data
def main() -> None:
records = []
for file in glob.glob(str(REPO_ROOT / "sccache-stats-*.json")):
with open(file) as f:
data = json.load(f)
# I don't know what sccache info will be most useful yet, and the
# sccache json has a decent number of keys, so just flatten the data
# and store all of it
records.append(
{
"benchmark": {
"name": "sccache_stats",
},
"metric": {
"name": "sccache_stats",
"benchmark_values": [int(os.environ.get("BUILD_TIME") or 0)],
"extra_info": flatten_data(data),
},
}
)
output_file = REPO_ROOT / "test" / "test-reports" / "sccache-stats.json"
os.makedirs(output_file.parent, exist_ok=True)
with open(output_file, "w") as f:
json.dump(records, f)
if __name__ == "__main__":
main()