mirror of
https://github.com/pytorch/pytorch.git
synced 2025-10-20 12:54:11 +08:00
* Automatically applies ruff rule 401. Turns loops into equivalent list comprehensions which are faster and do not leak the scope of the loop variables. * list comprehensions not only often have better typing, but are 50+% faster than for loops on overhead. They also preserve length information etc and are better for the interpreter to optimize. * Manually went back and made mypy happy after the change. * Also fixed style lints in files covered by flake8 but not by pyfmt Pull Request resolved: https://github.com/pytorch/pytorch/pull/140980 Approved by: https://github.com/justinchuby, https://github.com/malfet
67 lines
1.9 KiB
Python
67 lines
1.9 KiB
Python
# mypy: allow-untyped-defs
|
|
import os.path
|
|
from glob import glob
|
|
from typing import cast
|
|
|
|
import torch
|
|
from torch.types import Storage
|
|
|
|
|
|
# Record name (relative to the package root) that holds the package's
# serialization id; DirectoryReader.serialization_id() looks it up.
__serialization_id_record_name__ = ".data/serialization_id"
|
|
|
|
|
|
# Needed because get_storage_from_record returns a tensor!? -- presumably
# callers then call ``.storage()`` on the result, so a bare storage is
# wrapped in an object offering that one method.
class _HasStorage:
    """Minimal holder exposing a wrapped storage through ``storage()``."""

    def __init__(self, storage):
        # Kept as-is; no copying or validation is performed.
        self._storage = storage

    def storage(self):
        """Return the exact object that was passed to the constructor."""
        return self._storage
|
|
|
|
|
|
class DirectoryReader:
    """
    Reader that lets PackageImporter work on a package that has been unzipped
    into a directory. Its methods copy the behavior of the internal
    PyTorchFileReader class (which is used for accessing packages in all
    other cases).

    N.B.: ScriptObjects are not depickleable or accessible via this
    DirectoryReader class, because ScriptObjects require an actual
    PyTorchFileReader instance.
    """

    def __init__(self, directory):
        # Root of the unzipped package; every record name is resolved
        # relative to this path.
        self.directory = directory

    def get_record(self, name):
        """Read the file ``<directory>/<name>`` and return its raw bytes."""
        record_path = f"{self.directory}/{name}"
        with open(record_path, "rb") as stream:
            contents = stream.read()
        return contents

    def get_storage_from_record(self, name, numel, dtype):
        """
        Build a storage from the file ``<directory>/<name>``.

        The byte length requested is ``numel`` times the element size of
        ``dtype``. The resulting storage is returned wrapped in a
        ``_HasStorage`` object rather than bare.
        """
        record_path = f"{self.directory}/{name}"
        byte_count = torch._utils._element_size(dtype) * numel
        # The cast only informs the type checker; at runtime this is
        # torch.UntypedStorage itself.
        storage_cls = cast(Storage, torch.UntypedStorage)
        loaded = storage_cls.from_file(filename=record_path, nbytes=byte_count)
        return _HasStorage(loaded)

    def has_record(self, path):
        """Return True when ``path`` under the directory is a regular file."""
        return os.path.isfile(os.path.join(self.directory, path))

    def get_all_records(self):
        """
        List every non-directory path found by a recursive glob of the
        directory, with the leading ``<directory>/`` prefix sliced off.
        """
        matches = glob(f"{self.directory}/**", recursive=True)
        return [
            # +1 also drops the separator that follows the directory name.
            match[len(self.directory) + 1 :]
            for match in matches
            if not os.path.isdir(match)
        ]

    def serialization_id(self):
        """
        Return the contents of the serialization-id record, or ``""`` when
        the package has no such record.

        Note the asymmetry: a present record comes back as ``bytes`` (it is
        read via ``get_record``), while the fallback is an empty ``str``.
        """
        if not self.has_record(__serialization_id_record_name__):
            return ""
        return self.get_record(__serialization_id_record_name__)
|