[codemod][lint][fbcode/c*] Enable BLACK by default

Test Plan: manual inspection & sandcastle

Reviewed By: zertosh

Differential Revision: D30279364

fbshipit-source-id: c1ed77dfe43a3bde358f92737cd5535ae5d13c9a
Author: Zsolt Dollenstein
Date: 2021-08-12 10:56:55 -07:00
Committed by: Facebook GitHub Bot
Parent: aac3c7bd06
Commit: b004307252
188 changed files with 56875 additions and 28744 deletions
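
For context on the kind of rewrite this codemod applies, below is a minimal sketch of invoking the Black formatter through its Python API on a one-line snippet; the sample input string and the use of default Mode() settings are illustrative assumptions, not taken from this commit:

import black

# Illustrative input: single-quoted source, as in the pre-codemod files.
src = "HAS_SHM_FILES = os.path.isdir('/dev/shm')\n"

# black.Mode() holds Black's defaults (88-column lines, double-quote
# string normalization); format_str returns the reformatted source.
formatted = black.format_str(src, mode=black.Mode())
print(formatted)  # HAS_SHM_FILES = os.path.isdir("/dev/shm")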


@@ -1,10 +1,10 @@
import contextlib
import copy
import gc
import os
import sys
import time
import unittest
import copy
from sys import platform
import torch
@@ -12,18 +12,26 @@ import torch.cuda
import torch.multiprocessing as mp
import torch.utils.hooks
from torch.nn import Parameter
from torch.testing._internal.common_utils import (TestCase, run_tests, IS_WINDOWS, NO_MULTIPROCESSING_SPAWN, TEST_WITH_ASAN,
load_tests, slowTest, TEST_WITH_TSAN)
from torch.testing._internal.common_utils import (
TestCase,
run_tests,
IS_WINDOWS,
NO_MULTIPROCESSING_SPAWN,
TEST_WITH_ASAN,
load_tests,
slowTest,
TEST_WITH_TSAN,
)
# load_tests from common_utils is used to automatically filter tests for
# sharding on sandcastle. This line silences flake warnings
load_tests = load_tests
TEST_REPEATS = 30
HAS_SHM_FILES = os.path.isdir('/dev/shm')
TEST_CUDA_IPC = torch.cuda.is_available() and \
sys.platform != 'darwin' and \
sys.platform != 'win32'
HAS_SHM_FILES = os.path.isdir("/dev/shm")
TEST_CUDA_IPC = (
torch.cuda.is_available() and sys.platform != "darwin" and sys.platform != "win32"
)
TEST_MULTIGPU = TEST_CUDA_IPC and torch.cuda.device_count() > 1
@@ -41,7 +49,7 @@ def _test_cuda_ipc_deadlock_actor(queue, iterations):
for i in range(iterations):
if not queue.empty():
queue.get()
time.sleep(.01)
time.sleep(0.01)
def _test_cuda_ipc_deadlock_learner(queue, iterations):
@@ -49,7 +57,7 @@ def _test_cuda_ipc_deadlock_learner(queue, iterations):
for i in range(iterations):
if not queue.full():
queue.put(copy.deepcopy(net.state_dict()))
time.sleep(.01)
time.sleep(0.01)
def simple_fill(queue, event):
@@ -98,8 +106,14 @@ def sum_tensors(inq, outq):
with torch.cuda.device(1):
tensors = inq.get()
for tensor in tensors:
outq.put((tensor.sum().item(), tensor.get_device(),
tensor.numel(), tensor.storage().size()))
outq.put(
(
tensor.sum().item(),
tensor.get_device(),
tensor.numel(),
tensor.storage().size(),
)
)
def queue_get_exception(inqueue, outqueue):
@@ -109,7 +123,7 @@ def queue_get_exception(inqueue, outqueue):
except Exception as e:
outqueue.put(e)
else:
outqueue.put('no exception')
outqueue.put("no exception")
# Multiply by two in a separate stream
@@ -139,7 +153,7 @@ def autograd_sharing(queue, ready, master_modified, device, is_parameter):
ready.set()
master_modified.wait()
expected_var = torch.arange(1., 26, device=device).view(5, 5)
expected_var = torch.arange(1.0, 26, device=device).view(5, 5)
expected_var[0, 0] = 1000
is_ok = var.data.equal(expected_var)
var.data[:] = torch.ones(5, 5, device=device)
@@ -165,14 +179,16 @@ def mixed_type_producer(queue, event):
event.wait()
event.clear()
def simple_autograd_function(a=1):
torch.rand(3).requires_grad_(True).mean().backward()
return a ** 2
@contextlib.contextmanager
def fs_sharing():
prev_strategy = mp.get_sharing_strategy()
mp.set_sharing_strategy('file_system')
mp.set_sharing_strategy("file_system")
try:
yield
finally:
@@ -180,7 +196,6 @@ def fs_sharing():
class leak_checker(object):
def __init__(self, test_case):
self.checked_pids = [os.getpid()]
self.test_case = test_case
@@ -218,30 +233,32 @@ class leak_checker(object):
if not HAS_SHM_FILES:
return False
result = self._has_shm_files()
if result and mp.get_sharing_strategy() == 'file_system' and wait:
if result and mp.get_sharing_strategy() == "file_system" and wait:
time.sleep(0.5)
return self._has_shm_files()
return result
def _has_shm_files(self):
gc.collect()
names = ['torch_' + str(pid) for pid in self.checked_pids]
for filename in os.listdir('/dev/shm'):
names = ["torch_" + str(pid) for pid in self.checked_pids]
for filename in os.listdir("/dev/shm"):
for name in names:
if filename.startswith(name):
return True
return False
@unittest.skipIf(TEST_WITH_TSAN, "TSAN is not fork-safe since we're forking in a multi-threaded environment")
@unittest.skipIf(
TEST_WITH_TSAN,
"TSAN is not fork-safe since we're forking in a multi-threaded environment",
)
class TestMultiprocessing(TestCase):
def tearDown(self):
# This will keep tests isolated from each-other
if torch.cuda.is_available():
torch.cuda.ipc_collect()
def _test_sharing(self, ctx=mp, device='cpu', dtype=torch.float, repeat=1):
def _test_sharing(self, ctx=mp, device="cpu", dtype=torch.float, repeat=1):
def test_fill():
x = torch.zeros(5, 5).to(device, dtype)
q = ctx.Queue()
@@ -320,22 +337,32 @@ class TestMultiprocessing(TestCase):
for _ in range(repeat):
do_test()
@unittest.skipIf(platform == 'darwin', "file descriptor strategy is not supported on macOS")
@unittest.skipIf(TEST_WITH_ASAN,
"seems to hang with ASAN, see https://github.com/pytorch/pytorch/issues/5326")
@unittest.skipIf(
platform == "darwin", "file descriptor strategy is not supported on macOS"
)
@unittest.skipIf(
TEST_WITH_ASAN,
"seems to hang with ASAN, see https://github.com/pytorch/pytorch/issues/5326",
)
def test_fd_sharing(self):
self._test_sharing(repeat=TEST_REPEATS)
@unittest.skipIf(platform == 'darwin', "file descriptor strategy is not supported on macOS")
@unittest.skipIf(
platform == "darwin", "file descriptor strategy is not supported on macOS"
)
def test_fd_preserve_sharing(self):
self._test_preserve_sharing(repeat=TEST_REPEATS)
@unittest.skipIf(platform == 'darwin', "file descriptor strategy is not supported on macOS")
@unittest.skipIf(
platform == "darwin", "file descriptor strategy is not supported on macOS"
)
def test_fd_pool(self):
self._test_pool(repeat=TEST_REPEATS)
@unittest.skipIf(TEST_WITH_ASAN,
"seems to hang with ASAN, see https://github.com/pytorch/pytorch/issues/5326")
@unittest.skipIf(
TEST_WITH_ASAN,
"seems to hang with ASAN, see https://github.com/pytorch/pytorch/issues/5326",
)
def test_fs_sharing(self):
with fs_sharing():
self._test_sharing(repeat=TEST_REPEATS)
@@ -375,53 +402,67 @@ class TestMultiprocessing(TestCase):
@unittest.skipIf(IS_WINDOWS, "Test needs to use fork multiprocessing")
def test_autograd_errors(self):
ctx = mp.get_context('fork')
ctx = mp.get_context("fork")
simple_autograd_function()
with self.assertRaisesRegex(RuntimeError, r'Unable to handle autograd'):
with self.assertRaisesRegex(RuntimeError, r"Unable to handle autograd"):
with ctx.Pool(3) as pool:
pool.map(simple_autograd_function, [1, 2, 3])
@unittest.skipIf(NO_MULTIPROCESSING_SPAWN, "Test needs to use spawn multiprocessing")
@unittest.skipIf(
NO_MULTIPROCESSING_SPAWN, "Test needs to use spawn multiprocessing"
)
def test_autograd_fine_with_spawn(self):
ctx = mp.get_context('spawn')
ctx = mp.get_context("spawn")
simple_autograd_function()
with ctx.Pool(3) as pool:
pool.map(simple_autograd_function, [1, 2, 3])
@unittest.skipIf(NO_MULTIPROCESSING_SPAWN, "Disabled for environments that \
don't support multiprocessing with spawn start method")
@unittest.skipIf(not TEST_CUDA_IPC, 'CUDA IPC not available')
@unittest.skipIf(
NO_MULTIPROCESSING_SPAWN,
"Disabled for environments that \
don't support multiprocessing with spawn start method",
)
@unittest.skipIf(not TEST_CUDA_IPC, "CUDA IPC not available")
def test_cuda_simple(self):
torch.cuda.FloatTensor([1]) # initialize CUDA outside of leak checker
self._test_sharing(mp.get_context('spawn'), 'cuda', torch.float)
self._test_sharing(mp.get_context("spawn"), "cuda", torch.float)
@unittest.skipIf(NO_MULTIPROCESSING_SPAWN, "Disabled for environments that \
don't support multiprocessing with spawn start method")
@unittest.skipIf(not TEST_CUDA_IPC, 'CUDA IPC not available')
@unittest.skipIf(
NO_MULTIPROCESSING_SPAWN,
"Disabled for environments that \
don't support multiprocessing with spawn start method",
)
@unittest.skipIf(not TEST_CUDA_IPC, "CUDA IPC not available")
def test_cuda_memory_allocation(self):
ctx = mp.get_context('spawn')
ctx = mp.get_context("spawn")
q = ctx.Queue()
e = ctx.Event()
p = ctx.Process(target=send_and_delete_tensors, args=(q, e, 'cuda', torch.int, 5))
p = ctx.Process(
target=send_and_delete_tensors, args=(q, e, "cuda", torch.int, 5)
)
p.start()
t = []
for _ in range(5):
t.append(q.get())
# TODO(#38095): Replace assertEqualIgnoreType. See issue #38095
self.assertEqualIgnoreType(t[0], torch.full([5], 0.))
self.assertEqualIgnoreType(t[0], torch.full([5], 0.0))
del t
e.set()
p.join(1)
@unittest.skipIf(NO_MULTIPROCESSING_SPAWN, "Disabled for environments that \
don't support multiprocessing with spawn start method")
@unittest.skipIf(not TEST_CUDA_IPC, 'CUDA IPC not available')
@unittest.skipIf(
NO_MULTIPROCESSING_SPAWN,
"Disabled for environments that \
don't support multiprocessing with spawn start method",
)
@unittest.skipIf(not TEST_CUDA_IPC, "CUDA IPC not available")
def test_cuda_ipc_deadlock(self):
ctx = mp.get_context('spawn')
ctx = mp.get_context("spawn")
queue = ctx.Queue(1)
processes = dict(
a=ctx.Process(target=_test_cuda_ipc_deadlock_actor, args=(queue, 100)),
l=ctx.Process(target=_test_cuda_ipc_deadlock_learner, args=(queue, 100)))
l=ctx.Process(target=_test_cuda_ipc_deadlock_learner, args=(queue, 100)),
)
for p in processes.values():
p.start()
@@ -432,22 +473,30 @@ class TestMultiprocessing(TestCase):
for p in processes.values():
self.assertFalse(p.is_alive())
@slowTest
@unittest.skipIf(NO_MULTIPROCESSING_SPAWN, "Disabled for environments that \
don't support multiprocessing with spawn start method")
@unittest.skipIf(not TEST_CUDA_IPC, 'CUDA IPC not available')
@unittest.skipIf(
NO_MULTIPROCESSING_SPAWN,
"Disabled for environments that \
don't support multiprocessing with spawn start method",
)
@unittest.skipIf(not TEST_CUDA_IPC, "CUDA IPC not available")
def test_cuda_send_many(self, name=None, size=5, count=100000):
ctx = mp.get_context('spawn')
ctx = mp.get_context("spawn")
q1 = ctx.Queue()
q2 = ctx.Queue()
q3 = ctx.Queue()
e1 = ctx.Event()
e2 = ctx.Event()
e3 = ctx.Event()
p1 = ctx.Process(target=send_and_delete_tensors, args=(q1, e1, 'cuda', torch.long, count, size))
p1 = ctx.Process(
target=send_and_delete_tensors,
args=(q1, e1, "cuda", torch.long, count, size),
)
p2 = ctx.Process(target=receive_and_send, args=(q1, q2, e2, count))
p3 = ctx.Process(target=receive_and_send_sum, args=(q2, q3, e3, 'cuda', torch.long, count, size))
p3 = ctx.Process(
target=receive_and_send_sum,
args=(q2, q3, e3, "cuda", torch.long, count, size),
)
p1.start()
p2.start()
p3.start()
@@ -461,18 +510,21 @@ class TestMultiprocessing(TestCase):
p2.join(1)
p3.join(1)
@unittest.skipIf(NO_MULTIPROCESSING_SPAWN, "Disabled for environments that \
don't support multiprocessing with spawn start method")
@unittest.skipIf(not TEST_CUDA_IPC, 'CUDA IPC not available')
@unittest.skipIf(not TEST_MULTIGPU, 'found only 1 GPU')
@unittest.skipIf(
NO_MULTIPROCESSING_SPAWN,
"Disabled for environments that \
don't support multiprocessing with spawn start method",
)
@unittest.skipIf(not TEST_CUDA_IPC, "CUDA IPC not available")
@unittest.skipIf(not TEST_MULTIGPU, "found only 1 GPU")
def test_cuda_small_tensors(self):
# Check multiple small tensors which will likely use the same
# underlying cached allocation
ctx = mp.get_context('spawn')
ctx = mp.get_context("spawn")
tensors = []
for i in range(5):
device = i % 2
tensors += [torch.arange(i * 5., (i + 1) * 5).cuda(device)]
tensors += [torch.arange(i * 5.0, (i + 1) * 5).cuda(device)]
inq = ctx.Queue()
outq = ctx.Queue()
@@ -487,7 +539,7 @@ class TestMultiprocessing(TestCase):
for i, _tensor in enumerate(tensors):
v, device, tensor_size, storage_size = results[i]
self.assertEqual(v, torch.arange(i * 5., (i + 1) * 5).sum())
self.assertEqual(v, torch.arange(i * 5.0, (i + 1) * 5).sum())
self.assertEqual(device, i % 2)
self.assertEqual(tensor_size, 5)
@@ -508,8 +560,8 @@ class TestMultiprocessing(TestCase):
# memory 'file' for performance reason
torch.cuda.ipc_collect()
@unittest.skipIf(IS_WINDOWS, 'not applicable to Windows (only fails with fork)')
@unittest.skipIf(not torch.cuda.is_available(), 'CUDA not available')
@unittest.skipIf(IS_WINDOWS, "not applicable to Windows (only fails with fork)")
@unittest.skipIf(not torch.cuda.is_available(), "CUDA not available")
def test_cuda_bad_call(self):
# Initialize CUDA
t = torch.zeros(5, 5).cuda().cpu()
@@ -521,10 +573,11 @@ class TestMultiprocessing(TestCase):
p.join()
self.assertIsInstance(outq.get(), RuntimeError)
@unittest.skipIf(IS_WINDOWS, 'not applicable to Windows (only fails with fork)')
@unittest.skipIf(not torch.cuda.is_available(), 'CUDA not available')
@unittest.skipIf(IS_WINDOWS, "not applicable to Windows (only fails with fork)")
@unittest.skipIf(not torch.cuda.is_available(), "CUDA not available")
def test_wrong_cuda_fork(self):
stderr = TestCase.runWithPytorchAPIUsageStderr("""\
stderr = TestCase.runWithPytorchAPIUsageStderr(
"""\
import torch
from torch.multiprocessing import Process
def run(rank):
@@ -540,14 +593,18 @@ if __name__ == "__main__":
processes.append(p)
for p in processes:
p.join()
""")
"""
)
self.assertRegex(stderr, "Cannot re-initialize CUDA in forked subprocess.")
@unittest.skipIf(NO_MULTIPROCESSING_SPAWN, "Disabled for environments that \
don't support multiprocessing with spawn start method")
@unittest.skipIf(not TEST_CUDA_IPC, 'CUDA IPC not available')
@unittest.skipIf(
NO_MULTIPROCESSING_SPAWN,
"Disabled for environments that \
don't support multiprocessing with spawn start method",
)
@unittest.skipIf(not TEST_CUDA_IPC, "CUDA IPC not available")
def test_event(self):
ctx = mp.get_context('spawn')
ctx = mp.get_context("spawn")
queue = ctx.Queue()
ready = ctx.Event()
done = ctx.Event()
@@ -576,19 +633,23 @@ if __name__ == "__main__":
event.synchronize()
c2p.put(1) # notify parent synchronization is done
@unittest.skipIf(NO_MULTIPROCESSING_SPAWN, "Disabled for environments that \
don't support multiprocessing with spawn start method")
@unittest.skipIf(not TEST_CUDA_IPC, 'CUDA IPC not available')
@unittest.skipIf(
NO_MULTIPROCESSING_SPAWN,
"Disabled for environments that \
don't support multiprocessing with spawn start method",
)
@unittest.skipIf(not TEST_CUDA_IPC, "CUDA IPC not available")
def test_event_multiprocess(self):
event = torch.cuda.Event(enable_timing=False, interprocess=True)
self.assertTrue(event.query())
ctx = mp.get_context('spawn')
ctx = mp.get_context("spawn")
p2c = ctx.SimpleQueue()
c2p = ctx.SimpleQueue()
p = ctx.Process(
target=TestMultiprocessing._test_event_multiprocess_child,
args=(event, p2c, c2p))
args=(event, p2c, c2p),
)
p.start()
c2p.get() # wait for until child process is ready
@@ -601,13 +662,16 @@ if __name__ == "__main__":
self.assertTrue(event.query())
p.join()
@unittest.skipIf(NO_MULTIPROCESSING_SPAWN, "Disabled for environments that \
don't support multiprocessing with spawn start method")
@unittest.skipIf(not TEST_CUDA_IPC, 'CUDA IPC not available')
@unittest.skipIf(not TEST_MULTIGPU, 'found only 1 GPU')
@unittest.skipIf(
NO_MULTIPROCESSING_SPAWN,
"Disabled for environments that \
don't support multiprocessing with spawn start method",
)
@unittest.skipIf(not TEST_CUDA_IPC, "CUDA IPC not available")
@unittest.skipIf(not TEST_MULTIGPU, "found only 1 GPU")
def test_event_handle_multi_gpu(self):
d0 = torch.device('cuda:0')
d1 = torch.device('cuda:1')
d0 = torch.device("cuda:0")
d1 = torch.device("cuda:1")
with torch.cuda.device(d0):
e0 = torch.cuda.Event(enable_timing=False, interprocess=True)
@@ -634,19 +698,23 @@ if __name__ == "__main__":
c2p.put(1)  # notify synchronization is done in child
p2c.get() # wait for parent to finish before destructing child event
@unittest.skipIf(NO_MULTIPROCESSING_SPAWN, "Disabled for environments that \
don't support multiprocessing with spawn start method")
@unittest.skipIf(not TEST_CUDA_IPC, 'CUDA IPC not available')
@unittest.skipIf(
NO_MULTIPROCESSING_SPAWN,
"Disabled for environments that \
don't support multiprocessing with spawn start method",
)
@unittest.skipIf(not TEST_CUDA_IPC, "CUDA IPC not available")
def test_event_handle_importer(self):
e0 = torch.cuda.Event(enable_timing=False, interprocess=True)
self.assertTrue(e0.query())
ctx = mp.get_context('spawn')
ctx = mp.get_context("spawn")
p2c = ctx.SimpleQueue()
c2p = ctx.SimpleQueue()
p = ctx.Process(
target=TestMultiprocessing._test_event_handle_importer_consumer,
args=(e0.ipc_handle(), p2c, c2p))
args=(e0.ipc_handle(), p2c, c2p),
)
p.start()
c2p.get() # wait for child to become ready
@@ -664,8 +732,7 @@ if __name__ == "__main__":
def _test_event_handle_exporter_consumer(handle, p2c, c2p):
stream = torch.cuda.Stream()
with torch.cuda.stream(stream):
e1 = torch.cuda.Event.from_ipc_handle(
torch.cuda.current_device(), handle)
e1 = torch.cuda.Event.from_ipc_handle(torch.cuda.current_device(), handle)
torch.cuda._sleep(50000000) # spin for about 50 ms
e1.record()
c2p.put(0)
@@ -673,18 +740,22 @@ if __name__ == "__main__":
# destructing e1
p2c.get()
@unittest.skipIf(NO_MULTIPROCESSING_SPAWN, "Disabled for environments that \
don't support multiprocessing with spawn start method")
@unittest.skipIf(not TEST_CUDA_IPC, 'CUDA IPC not available')
@unittest.skipIf(
NO_MULTIPROCESSING_SPAWN,
"Disabled for environments that \
don't support multiprocessing with spawn start method",
)
@unittest.skipIf(not TEST_CUDA_IPC, "CUDA IPC not available")
def test_event_handle_exporter(self):
e0 = torch.cuda.Event(enable_timing=False, interprocess=True)
ctx = mp.get_context('spawn')
ctx = mp.get_context("spawn")
p2c = ctx.SimpleQueue()
c2p = ctx.SimpleQueue()
p = ctx.Process(
target=TestMultiprocessing._test_event_handle_exporter_consumer,
args=(e0.ipc_handle(), p2c, c2p))
args=(e0.ipc_handle(), p2c, c2p),
)
p.start()
# wait for event in child process is recorded
c2p.get()
@@ -703,21 +774,24 @@ if __name__ == "__main__":
self.assertEqual(out, empty)
def test_empty_tensor_sharing(self):
self._test_empty_tensor_sharing(torch.float32, torch.device('cpu'))
self._test_empty_tensor_sharing(torch.int64, torch.device('cpu'))
self._test_empty_tensor_sharing(torch.float32, torch.device("cpu"))
self._test_empty_tensor_sharing(torch.int64, torch.device("cpu"))
@unittest.skipIf(not torch.cuda.is_available(), 'CUDA not available')
@unittest.skipIf(not torch.cuda.is_available(), "CUDA not available")
def test_empty_tensor_sharing_cuda(self):
self._test_empty_tensor_sharing(torch.float32, torch.device('cuda'))
self._test_empty_tensor_sharing(torch.int64, torch.device('cuda'))
self._test_empty_tensor_sharing(torch.float32, torch.device("cuda"))
self._test_empty_tensor_sharing(torch.int64, torch.device("cuda"))
def _test_autograd_sharing(self, var, ctx=mp, is_parameter=False):
device = 'cuda' if var.is_cuda else 'cpu'
device = "cuda" if var.is_cuda else "cpu"
ready = ctx.Event()
master_modified = ctx.Event()
queue = ctx.Queue()
p = ctx.Process(target=autograd_sharing, args=(queue, ready, master_modified, device, is_parameter))
p = ctx.Process(
target=autograd_sharing,
args=(queue, ready, master_modified, device, is_parameter),
)
p.daemon = True
p.start()
@@ -770,24 +844,29 @@ if __name__ == "__main__":
def test_variable_sharing(self):
for requires_grad in [True, False]:
var = torch.arange(1., 26).view(5, 5).requires_grad_(requires_grad)
var = torch.arange(1.0, 26).view(5, 5).requires_grad_(requires_grad)
self._test_autograd_sharing(var)
# See https://github.com/pytorch/pytorch/issues/14997
@unittest.skipIf(TEST_WITH_ASAN,
"non-deterministically hangs with ASAN")
@unittest.skipIf(TEST_WITH_ASAN, "non-deterministically hangs with ASAN")
def test_leaf_variable_sharing(self):
devices = ['cpu']
devices = ["cpu"]
if torch.cuda.is_available() and not NO_MULTIPROCESSING_SPAWN and TEST_CUDA_IPC:
devices.append('cuda')
devices.append("cuda")
for device in devices:
for requires_grad in [True, False]:
var = torch.arange(1., 26, device=device).view(5, 5).requires_grad_(requires_grad)
var = (
torch.arange(1.0, 26, device=device)
.view(5, 5)
.requires_grad_(requires_grad)
)
self.assertTrue(var.is_leaf)
ctx = mp.get_context('spawn') if device == 'cuda' else mp
ctx = mp.get_context("spawn") if device == "cuda" else mp
ready = ctx.Event()
queue = ctx.Queue()
p = ctx.Process(target=requires_grad_variable_sharing, args=(queue, ready))
p = ctx.Process(
target=requires_grad_variable_sharing, args=(queue, ready)
)
p.daemon = True
p.start()
queue.put(var)
@@ -796,65 +875,86 @@ if __name__ == "__main__":
self.assertTrue(worker_requires_grad == requires_grad)
def test_non_leaf_variable_sharing(self):
devices = ['cpu'] if not torch.cuda.is_available() else ['cpu', 'cuda']
devices = ["cpu"] if not torch.cuda.is_available() else ["cpu", "cuda"]
for device in devices:
var0 = torch.arange(1., 26, device=device).view(5, 5).requires_grad_(True)
var0 = torch.arange(1.0, 26, device=device).view(5, 5).requires_grad_(True)
var = var0 * 2
# Don't use a regular Queue; it uses a background thread (which
# means we can't catch the exceptions)
queue = mp.SimpleQueue()
self.assertRaisesRegex(RuntimeError, r'requires_grad', lambda: queue.put(var))
self.assertRaisesRegex(
RuntimeError, r"requires_grad", lambda: queue.put(var)
)
@unittest.skipIf(NO_MULTIPROCESSING_SPAWN, "Disabled for environments that \
don't support multiprocessing with spawn start method")
@unittest.skipIf(not TEST_CUDA_IPC, 'CUDA IPC not available')
@unittest.skipIf(
NO_MULTIPROCESSING_SPAWN,
"Disabled for environments that \
don't support multiprocessing with spawn start method",
)
@unittest.skipIf(not TEST_CUDA_IPC, "CUDA IPC not available")
def test_cuda_variable_sharing(self):
for requires_grad in [True, False]:
var = torch.arange(1., 26, device='cuda').view(5, 5).requires_grad_(requires_grad)
self._test_autograd_sharing(var, mp.get_context('spawn'))
var = (
torch.arange(1.0, 26, device="cuda")
.view(5, 5)
.requires_grad_(requires_grad)
)
self._test_autograd_sharing(var, mp.get_context("spawn"))
@unittest.skipIf(NO_MULTIPROCESSING_SPAWN, "Disabled for environments that \
don't support multiprocessing with spawn start method")
@unittest.skipIf(not TEST_CUDA_IPC, 'CUDA IPC not available')
@unittest.skipIf(
NO_MULTIPROCESSING_SPAWN,
"Disabled for environments that \
don't support multiprocessing with spawn start method",
)
@unittest.skipIf(not TEST_CUDA_IPC, "CUDA IPC not available")
def test_mixed_types_cuda_sharing(self):
self._test_mixed_types_cuda_sharing(mp.get_context('spawn'))
self._test_mixed_types_cuda_sharing(mp.get_context("spawn"))
def test_parameter_sharing(self):
param = Parameter(torch.arange(1., 26).view(5, 5))
param = Parameter(torch.arange(1.0, 26).view(5, 5))
self._test_autograd_sharing(param, is_parameter=True)
@unittest.skipIf(NO_MULTIPROCESSING_SPAWN, "Disabled for environments that \
don't support multiprocessing with spawn start method")
@unittest.skipIf(not TEST_CUDA_IPC, 'CUDA IPC not available')
@unittest.skipIf(
NO_MULTIPROCESSING_SPAWN,
"Disabled for environments that \
don't support multiprocessing with spawn start method",
)
@unittest.skipIf(not TEST_CUDA_IPC, "CUDA IPC not available")
def test_cuda_parameter_sharing(self):
param = Parameter(torch.arange(1., 26, device='cuda').view(5, 5))
self._test_autograd_sharing(param, mp.get_context('spawn'), is_parameter=True)
param = Parameter(torch.arange(1.0, 26, device="cuda").view(5, 5))
self._test_autograd_sharing(param, mp.get_context("spawn"), is_parameter=True)
@unittest.skipIf(NO_MULTIPROCESSING_SPAWN, "Disabled for environments that \
don't support multiprocessing with spawn start method")
@unittest.skipIf(
NO_MULTIPROCESSING_SPAWN,
"Disabled for environments that \
don't support multiprocessing with spawn start method",
)
def test_integer_parameter_serialization_cpu(self):
self._test_integer_parameter_serialization(device='cpu')
self._test_integer_parameter_serialization(device="cpu")
@unittest.skipIf(NO_MULTIPROCESSING_SPAWN, "Disabled for environments that \
don't support multiprocessing with spawn start method")
@unittest.skipIf(not TEST_CUDA_IPC, 'CUDA IPC not available')
@unittest.skipIf(
NO_MULTIPROCESSING_SPAWN,
"Disabled for environments that \
don't support multiprocessing with spawn start method",
)
@unittest.skipIf(not TEST_CUDA_IPC, "CUDA IPC not available")
def test_integer_parameter_serialization_cuda(self):
self._test_integer_parameter_serialization(device='cuda')
self._test_integer_parameter_serialization(device="cuda")
def _test_integer_parameter_serialization(self, device):
param = torch.nn.Parameter(
torch.tensor(0, dtype=torch.int64, device=device),
requires_grad=False
torch.tensor(0, dtype=torch.int64, device=device), requires_grad=False
)
ctx = mp.get_context('spawn')
ctx = mp.get_context("spawn")
p = ctx.Process(target=integer_parameter_serialization, args=(param,))
p.start()
p.join()
self.assertEqual(
0, p.exitcode,
msg=f'Failed to serialize successfully for "{device}" device!'
0,
p.exitcode,
msg=f'Failed to serialize successfully for "{device}" device!',
)
def test_empty_shared(self):
@@ -867,7 +967,9 @@ if __name__ == "__main__":
t.share_memory_()
self.assertTrue(t.is_shared())
@unittest.skipIf(platform == 'darwin', "file descriptor strategy is not supported on macOS")
@unittest.skipIf(
platform == "darwin", "file descriptor strategy is not supported on macOS"
)
def test_is_shared(self):
self._test_is_shared()
@@ -875,11 +977,11 @@ if __name__ == "__main__":
with fs_sharing():
self._test_is_shared()
@unittest.skipIf(not torch.cuda.is_available(), 'CUDA not available')
@unittest.skipIf(not torch.cuda.is_available(), "CUDA not available")
def test_is_shared_cuda(self):
t = torch.randn(5, 5).cuda()
self.assertTrue(t.is_shared())
if __name__ == '__main__':
if __name__ == "__main__":
run_tests()