pytorch

mirror of https://github.com/pytorch/pytorch.git synced 2025-10-20 21:14:14 +08:00

Files

drisspg 3c6efd1380 Add cutedsl template support to compile (#160108 )

## Summary
Still figuring out what writing a template should actually look like, but this lands a lot of the base infra.

<img width="1267" height="262" alt="Screenshot 2025-08-16 at 10 22 12 PM" src="https://github.com/user-attachments/assets/229f8bfa-0cb4-4fb1-8530-f535e569d350" />

Test code:

```Python
#!/usr/bin/env python3
"""
Fixed CuteDSL template test with proper def_kernel usage.
"""

import torch
import torch._inductor.config as config
from torch._inductor.lowering import lowerings
from torch._inductor.ir import TensorBox
from torch._inductor.select_algorithm import autotune_select_algorithm
from torch._inductor.codegen.cutedsl import CuteDSLTemplate

def create_fixed_cutedsl_template():
    """Assemble and return the ``fixed_add`` CuteDSL template.

    The template source is the concatenation of three raw-string fragments:
    a ``@cute.kernel`` that writes ``gA + gB`` into ``gC`` element by element,
    a ``@cute.jit`` wrapper that launches that kernel with 256 threads per
    block, and the ``def_kernel`` entry point that wraps its tensors with
    ``from_dlpack`` before invoking the wrapper.
    """

    # Fragment 1: imports used by the generated module plus the device kernel.
    device_kernel_src = r"""
import torch
import cutlass
import cutlass.cute as cute
from cutlass.cute.runtime import from_dlpack

@cute.kernel
def {{kernel_name}}_kernel(gA: cute.Tensor, gB: cute.Tensor, gC: cute.Tensor):
    # Get thread and block indices
    tidx, _, _ = cute.arch.thread_idx()
    bidx, _, _ = cute.arch.block_idx()
    bdim, _, _ = cute.arch.block_dim()

    thread_idx = bidx * bdim + tidx
    m, n = gA.shape

    if thread_idx < m * n:
        mi = thread_idx // n
        ni = thread_idx % n

        if mi < m and ni < n:
            a_val = gA[mi, ni]
            b_val = gB[mi, ni]
            result = a_val + b_val
            gC[mi, ni] = a_val + b_val
"""

    # Fragment 2: the JIT wrapper that computes the launch shape itself.
    jit_wrapper_src = r"""
@cute.jit
def {{kernel_name}}_jit(mA: cute.Tensor, mB: cute.Tensor, mC: cute.Tensor):
    m, n = mA.shape
    total_threads = m * n
    threads_per_block = 256
    num_blocks = (total_threads + threads_per_block - 1) // threads_per_block

    kernel = {{kernel_name}}_kernel(mA, mB, mC)
    kernel.launch(
        grid=[num_blocks, 1, 1],
        block=[threads_per_block, 1, 1]
    )
"""

    # Fragment 3: the entry point emitted through the def_kernel template hook.
    entry_point_src = r"""
{{def_kernel("input_a", "input_b", "output_c")}}
    cute_a = from_dlpack(input_a, assumed_align=16)
    cute_b = from_dlpack(input_b, assumed_align=16)
    cute_c = from_dlpack(output_c, assumed_align=16)

    # Launch kernel
    {{kernel_name}}_jit(cute_a, cute_b, cute_c)

    return output_c
"""

    def cutedsl_grid(M, N, meta):
        # Grid callback handed to the template: it ignores its arguments and
        # always reports a one-element grid.
        return (1,)

    # The fragments are simply glued together in order to form the source.
    return CuteDSLTemplate(
        name="fixed_add",
        grid=cutedsl_grid,
        source="".join((device_kernel_src, jit_wrapper_src, entry_point_src)),
    )

def fixed_cutedsl_lowering(a: TensorBox, b: TensorBox) -> TensorBox:
    """Lower ``a + b`` through the CuteDSL template, with a default fallback.

    A fresh template is built and asked to append a choice for the two
    inputs. When that yields at least one choice and no error, the result of
    ``autotune_select_algorithm`` over those choices is returned; otherwise
    the call is forwarded to the lowering currently registered for
    ``aten.add.Tensor``.

    NOTE(review): the template is rebuilt on every call under the same name
    ("fixed_add") -- confirm ``CuteDSLTemplate`` tolerates repeated
    construction before using this for graphs with more than one add.
    """
    print(f"[FIXED] CuteDSL lowering: {a.get_size()} + {b.get_size()}")

    choices = []
    error = create_fixed_cutedsl_template().maybe_append_choice(
        choices,
        input_nodes=[a.data, b.data],
        layout=a.get_layout()
    )

    # Happy path first: the template produced something and reported no error.
    if not error and choices:
        print(f"[FIXED] Using CuteDSL with {len(choices)} choices")
        return autotune_select_algorithm(
            "fixed_cutedsl_add",
            choices,
            [a, b],
            a.get_layout(),
        )

    # Otherwise defer to whatever lowering is registered for aten.add.Tensor.
    print(f"[FIXED] Falling back: {error}")
    return lowerings[torch.ops.aten.add.Tensor](a, b)

def test_fixed_cutedsl():
    """Run an end-to-end check of the CuteDSL add lowering.

    Temporarily installs ``fixed_cutedsl_lowering`` as the lowering for
    ``aten.add.Tensor``, compiles a trivial ``x + y`` function with the
    inductor backend, and compares the compiled result with eager addition.
    The previous ``lowerings`` entry is restored in all cases.

    Returns:
        bool: ``True`` when the compiled result matches the eager result
        within ``atol=1e-5``; ``False`` on a mismatch or when any exception
        is raised (the traceback is printed instead of being propagated).
    """
    print("=" * 50)
    print("Fixed CuteDSL Template Test")
    print("=" * 50)

    # Remember the current entry (None if absent) so it can be put back.
    original = lowerings.get(torch.ops.aten.add.Tensor, None)

    try:
        lowerings[torch.ops.aten.add.Tensor] = fixed_cutedsl_lowering

        def test_add(x, y):
            return x + y

        device = "cuda" if torch.cuda.is_available() else "cpu"
        x = torch.randn(128, 4, device=device, dtype=torch.float32)
        y = torch.randn(128, 4, device=device, dtype=torch.float32)

        print(f"[FIXED] Testing with {x.shape} tensors on {device}")

        compiled_fn = torch.compile(test_add, backend="inductor")
        result = compiled_fn(x, y)

        # Verify correctness against the eager computation.
        expected = x + y
        if torch.allclose(result, expected, atol=1e-5):
            print("✅ [FIXED] Results match!")
            return True
        else:
            print("❌ [FIXED] Results don't match!")
            return False

    except Exception as e:
        # Top-level boundary of the script: report the failure and return
        # False so the caller can print a summary.
        print(f"❌ [FIXED] Failed: {e}")
        import traceback
        traceback.print_exc()
        return False

    finally:
        # Compare against the None sentinel explicitly: "no previous entry"
        # is signalled by None, not by the entry's truthiness.
        if original is not None:
            lowerings[torch.ops.aten.add.Tensor] = original
        else:
            lowerings.pop(torch.ops.aten.add.Tensor, None)

if __name__ == "__main__":
    # Script entry point: run the check once and print a one-line verdict.
    success = test_fixed_cutedsl()
    if success:
        print("🎉 Fixed test completed!")
    else:
        print("💥 Fixed test failed!")

```

Pull Request resolved: https://github.com/pytorch/pytorch/pull/160108
Approved by: https://github.com/mlazos

2025-08-18 04:37:15 +00:00

ao/sparsity

[BE][3/6] fix typos in test/ (#157637 )

2025-07-17 12:08:33 +00:00

autograd

Fix unused Python variables in test/[a-d]* (#134665 )

2024-12-13 22:13:12 +00:00

backends/xeon

…

benchmark_utils

[BE][3/6] fix typos in test/ (#157637 )

2025-07-17 12:08:33 +00:00

bottleneck_test

Fix unused Python variables in test/[a-d]* (#134665 )

2024-12-13 22:13:12 +00:00

compiled_autograd_skips

[ca] skip on some PYTORCH_TEST_WITH_DYNAMO=1 autograd tests (#156374 )

2025-06-21 18:33:38 +00:00

cpp

[nativert] oss subgraph rewriter (#160780 )

2025-08-18 04:25:05 +00:00

cpp_api_parity

[BE][PYFMT] migrate PYFMT for test/[a-h]*/ to ruff format (#144555 )

2025-06-24 04:53:54 +00:00

cpp_extensions

Add getCurrentDeviceIndex to torch::stable::accelerator (#160453 )

2025-08-13 23:42:24 +00:00

custom_backend

[Cmake] Make PyTorch buildable by CMake-4.x (#150203 )

2025-03-29 01:39:13 +00:00

custom_operator

Using the latest torch.library.register_fake API instead of torch.library.impl_abstract (#158839 )

2025-07-25 02:37:30 +00:00

distributed

port 2 distributed pipeline test files for Intel GPU (#159140 )

2025-08-15 18:29:50 +00:00

distributions

[BE] fix remaining flake8 v7 warnings (#159044 )

2025-07-25 02:56:34 +00:00

dynamo

[PGO] add extra read/write keys (#160715 )

2025-08-18 01:41:08 +00:00

dynamo_expected_failures

[collections.abc] Ensure that binop calls works with UserDefinedObjects (#159865 )

2025-08-16 20:44:40 +00:00

dynamo_skips

[Test Fix] Delete dynamo skipfile for OpenMP test_one_thread (#160562 )

2025-08-14 20:55:59 +00:00

error_messages

…

expect

[cuDNN][SDPA] cuDNN SDPA refactor/cleanup, nested tensor backward, test priority bump for sm90, sm100 (#149282 )

2025-08-08 22:22:48 +00:00

export

Introduce OpInfo test for testing export on fake device (#160694 )

2025-08-15 07:26:28 +00:00

forward_backward_compatibility

Fused RMSNorm implementation (#153666 )

2025-07-22 22:25:44 +00:00

functorch

Remove guard_size_oblivious from default contiguity python check, and add aten.sym_is_contiguous. (#159197 )

2025-08-16 09:15:58 +00:00

Separate provenance tracking to different levels (#160383 )

2025-08-15 04:59:35 +00:00

higher_order_ops

[hop][exc] make UncapturedHigherOrderOpError print user code and avoid re-raise (#159296 )

2025-08-11 22:48:10 +00:00

inductor

Add cutedsl template support to compile (#160108 )

2025-08-18 04:37:15 +00:00

inductor_expected_failures

[dynamo] Support Tensor subclass that has dynamic attributes or calls Parameter.__torch_function__ (#149482 )

2025-04-02 20:56:43 +00:00

inductor_skips

[BE] Remove test_ops from FIXME_inductor_dont_reset_dynamo (#145307 )

2025-01-27 18:12:39 +00:00

jit

[TorchScript] thread-safe ErrorReport::CallStack (#160386 )

2025-08-12 21:59:04 +00:00

jit_hooks

[Cmake] Make PyTorch buildable by CMake-4.x (#150203 )

2025-03-29 01:39:13 +00:00

lazy

[BE][PYFMT] migrate PYFMT for test/[i-z]*/ to ruff format (#144556 )

2025-07-29 03:26:09 +00:00

mobile

[BE][PYFMT] migrate PYFMT for test/[i-z]*/ to ruff format (#144556 )

2025-07-29 03:26:09 +00:00

[cuDNN][64-bit indexing] update conv depthwise 64bit indexing dispatch condition to match native kernel (#156140 )

2025-08-12 18:07:41 +00:00

onnx

[ONNX] Default to dynamo export (#159646 )

2025-08-16 04:48:58 +00:00

optim

[BE][PYFMT] migrate PYFMT for {torch,test}/{nn,optim}/** to ruff format (#144548 )

2025-06-14 11:27:04 +00:00

package

[Torch Package] Make get names of OrderedImporters support fallback to importers (#155743 )

2025-08-06 02:26:10 +00:00

profiler

[Profiler] Fix unexpected C return events (#159574 )

2025-08-07 01:17:55 +00:00

quantization

Revert "unskipped mobilenet_v3 quantization and mobilenet_v2 quantization plus tests from https://github.com/pytorch/pytorch/issues/125438 (#157786 )"

2025-08-07 13:09:33 +00:00

scripts

[BE][PYFMT] migrate PYFMT for test/[i-z]*/ to ruff format (#144556 )

2025-07-29 03:26:09 +00:00

strobelight/examples

Enable strobelight profiling specific compile frame ids using COMPILE_STROBELIGHT_FRAME_FILTER (#147549 )

2025-02-22 03:44:53 +00:00

test_img

…

torch_np

[BE][PYFMT] migrate PYFMT for test/[i-z]*/ to ruff format (#144556 )

2025-07-29 03:26:09 +00:00

typing

More testing of Python arithmetic operators between tensors and scalars (see 157266) (#157632 )

2025-07-05 17:48:27 +00:00

xpu

Enable _int_mm on Intel GPU (#157769 )

2025-08-02 05:16:01 +00:00

_test_bazel.py

…

allowlist_for_publicAPI.json

remove guard_or_x from allowlist_for_publicAPI (#159181 )

2025-07-26 01:22:17 +00:00

bench_mps_ops.py

[BE] Remove macos-13 guard from bench_mps_ops (#159732 )

2025-08-03 20:53:58 +00:00

conftest.py

[CI][run_test] Fix rerun logic for failing at exit (#155853 )

2025-06-17 17:51:40 +00:00

create_dummy_torchscript_model.py

…

HowToWriteTestsUsingFileCheck.md

…

linear.py

…

load_torchscript_model.py

Flip default on weights_only (#137602 )

2024-11-04 18:30:29 +00:00

minioptest_failures_dict.json

…

mkl_verbose.py

…

mkldnn_verbose.py

…

pytest_shard_custom.py

…

run_doctests.sh

…

run_test.py

Actually run the einops tests in CI (#159776 )

2025-08-07 15:23:06 +00:00

simulate_nccl_errors.py

[BE]: Update ruff to 0.11.8 (#153249 )

2025-05-12 18:30:52 +00:00

slow_tests.json

Update slow tests (#158222 )

2025-08-11 12:00:13 +00:00

test_accelerator.py

Add UT for torch.accelerator memory-related API (#155200 )

2025-08-08 17:41:22 +00:00

test_ao_sparsity.py

Add __main__ guards to ao tests (#154612 )

2025-06-10 18:33:09 +00:00

test_appending_byte_serializer.py

Check integrity of bytes in AppendingByteSerializer (#152139 )

2025-04-26 18:10:58 +00:00

test_autocast.py

Enable TemporaryFileName tests on Windows (#146311 )

2025-02-07 06:06:18 +00:00

test_autograd_fallback.py

Fix TestAutogradFallback flaky tests under Dynamo: migrate to lib._destroy() (#159443 )

2025-07-30 19:30:55 +00:00

test_autograd.py

Add ownership token when needed on GradientEdge (#160098 )

2025-08-12 20:14:18 +00:00

test_autoload.py

…

test_binary_ufuncs.py

[BE][2/6] fix typos in test/ (test/test_*.py) (#157636 )

2025-07-09 11:02:23 +00:00

test_bundled_images.py

Add __main__ guards to tests (#154716 )

2025-06-04 14:38:13 +00:00

test_bundled_inputs.py

[4/N] Apply py39 ruff and pyupgrade fixes (#143257 )

2025-01-04 10:47:51 +00:00

test_ci_sanity_check_fail.py

…

test_comparison_utils.py

[export] Add device and dtype fields to assert_tensor_metadata (#141071 )

2024-11-22 20:54:55 +00:00

test_compile_benchmark_util.py

…

test_complex.py

…

test_content_store.py

torch.utils._content_store: fix error in hash_storage on XPU (#147785 )

2025-02-26 23:57:59 +00:00

test_cpp_api_parity.py

Revert "Stop parsing command line arguments every time common_utils is imported. (#156703 )"

2025-08-04 20:37:39 +00:00

test_cpp_extensions_aot.py

[build] modernize build-frontend: python setup.py develop/install -> [uv ]pip install --no-build-isolation [-e ]. (#156027 )

2025-07-09 11:24:27 +00:00

test_cpp_extensions_jit.py

[CI] Fixes CI for CUDA Version > 12.9 (#157385 )

2025-07-19 06:51:57 +00:00

test_cpp_extensions_mtia_backend.py

Revert "Generalize poison fork logic for each device backend (#144664 )"

2025-04-10 21:02:14 +00:00

test_cpp_extensions_stream_and_event.py

[Easy] Add more check for elapsedTime of torch.xxx.Event and torch.Event (#151404 )

2025-04-25 20:15:04 +00:00

test_cuda_expandable_segments.py

Revert "Use absolute path path.resolve() -> path.absolute() (#129409 )"

2025-01-04 14:17:20 +00:00

test_cuda_multigpu.py

[BE][2/6] fix typos in test/ (test/test_*.py) (#157636 )

2025-07-09 11:02:23 +00:00

test_cuda_nvml_based_avail.py

[BE][2/6] fix typos in test/ (test/test_*.py) (#157636 )

2025-07-09 11:02:23 +00:00

test_cuda_primary_ctx.py

[BE][2/6] fix typos in test/ (test/test_*.py) (#157636 )

2025-07-09 11:02:23 +00:00

test_cuda_sanitizer.py

[4/N] Apply py39 ruff and pyupgrade fixes (#143257 )

2025-01-04 10:47:51 +00:00

test_cuda_trace.py

Fix unused Python variables in test/[e-z]* (#136964 )

2024-12-18 23:02:30 +00:00

test_cuda.py

Add UT for torch.accelerator memory-related API (#155200 )

2025-08-08 17:41:22 +00:00

test_custom_ops.py

Add utility to get computed kernel in torch.library (#158393 )

2025-08-13 21:00:59 +00:00

test_dataloader.py

skip XPU for dataloader CPU only unit test (#159811 )

2025-08-05 03:44:01 +00:00

test_datapipe.py

[BE][2/6] fix typos in test/ (test/test_*.py) (#157636 )

2025-07-09 11:02:23 +00:00

test_decomp.py

Fix full_like decomposition to preserve strides (#158898 )

2025-07-25 20:21:36 +00:00

test_determination.py

…

test_dispatch.py

Typo fixes for "overridden" in comments and function names (#155944 )

2025-06-14 03:37:38 +00:00

test_dlpack.py

[Testing] Add MPS to NATIVE_DEVICES (#153835 )

2025-08-05 18:57:35 +00:00

test_dynamic_shapes.py

Fix get_free_symbol_uses for several nodes (#160314 )

2025-08-13 12:28:29 +00:00

test_expanded_weights.py

Revert "Stop parsing command line arguments every time common_utils is imported. (#156703 )"

2025-08-04 20:37:39 +00:00

test_extension_utils.py

Move privateuse1 test out of test_utils and make them serial (#145380 )

2025-01-23 00:31:39 +00:00

test_fake_tensor.py

[MTIA] Allow users who know what they are doing to ignore all device mismatches in tracing and take a preferred device. (#159931 )

2025-08-07 22:37:15 +00:00

test_file_check.py

Fix unused Python variables in test/[e-z]* (#136964 )

2024-12-18 23:02:30 +00:00

test_flop_counter.py

PYFMT lint grandfathered files 1 (#154261 )

2025-05-25 17:36:14 +00:00

test_foreach.py

Fix requires_cuda to requires_cuda_and_triton (#160222 )

2025-08-10 07:05:52 +00:00

test_function_schema.py

Fix unused Python variables in test/[e-z]* (#136964 )

2024-12-18 23:02:30 +00:00

test_functional_autograd_benchmark.py

Enable Windows tests (#146666 )

2025-02-08 00:55:20 +00:00

test_functional_optim.py

[4/N] Apply py39 ruff and pyupgrade fixes (#143257 )

2025-01-04 10:47:51 +00:00

test_functionalization_of_rng_ops.py

[BE][2/6] fix typos in test/ (test/test_*.py) (#157636 )

2025-07-09 11:02:23 +00:00

test_functionalization.py

[BE][2/6] fix typos in test/ (test/test_*.py) (#157636 )

2025-07-09 11:02:23 +00:00

test_futures.py

…

test_fx_experimental.py

[fx] fix split_module with symint (#160093 )

2025-08-13 05:50:15 +00:00

test_fx_passes.py

[BE][2/6] fix typos in test/ (test/test_*.py) (#157636 )

2025-07-09 11:02:23 +00:00

test_fx_reinplace_pass.py

[dynamic shapes] avoid unnecessary slices (#157528 )

2025-07-10 06:34:46 +00:00

test_fx.py

Extend torch function support to ALL arguments, not just scalar type (but not insides of list) (#145089 )

2025-08-07 23:43:53 +00:00

test_hop_infra.py

Support torch.compile rng selective activation checkpointing with cudagraph (#146878 )

2025-02-28 00:47:03 +00:00

test_hub.py

Add __main__ guards to tests (#154716 )

2025-06-04 14:38:13 +00:00

test_import_stats.py

…

test_indexing.py

[Testing] Add MPS to NATIVE_DEVICES (#153835 )

2025-08-05 18:57:35 +00:00

test_itt.py

…

test_jit_autocast.py

Revert "Stop parsing command line arguments every time common_utils is imported. (#156703 )"

2025-08-04 20:37:39 +00:00

test_jit_disabled.py

…

test_jit_fuser_legacy.py

Revert "Stop parsing command line arguments every time common_utils is imported. (#156703 )"

2025-08-04 20:37:39 +00:00

test_jit_fuser_te.py

Remove tensorexpr tests (#158928 )

2025-08-09 02:21:22 +00:00

test_jit_fuser.py

Revert "Stop parsing command line arguments every time common_utils is imported. (#156703 )"

2025-08-04 20:37:39 +00:00

test_jit_legacy.py

Revert "Stop parsing command line arguments every time common_utils is imported. (#156703 )"

2025-08-04 20:37:39 +00:00

test_jit_llga_fuser.py

Fix unused Python variables in test/[e-z]* (#136964 )

2024-12-18 23:02:30 +00:00

test_jit_profiling.py

…

test_jit_simple.py

…

test_jit_string.py

PEP585 update - test (#145176 )

2025-01-22 04:48:28 +00:00

test_jit.py

Revert "Stop parsing command line arguments every time common_utils is imported. (#156703 )"

2025-08-04 20:37:39 +00:00

test_jiterator.py

Fix unused Python variables in test/[e-z]* (#136964 )

2024-12-18 23:02:30 +00:00

test_kernel_launch_checks.py

…

test_legacy_vmap.py

[BE][2/6] fix typos in test/ (test/test_*.py) (#157636 )

2025-07-09 11:02:23 +00:00

test_license.py

[BE][2/6] fix typos in test/ (test/test_*.py) (#157636 )

2025-07-09 11:02:23 +00:00

test_linalg.py

Revert "unskipped mobilenet_v3 quantization and mobilenet_v2 quantization plus tests from https://github.com/pytorch/pytorch/issues/125438 (#157786 )"

2025-08-07 13:09:33 +00:00

test_logging.py

…

test_masked.py

[BE][2/6] fix typos in test/ (test/test_*.py) (#157636 )

2025-07-09 11:02:23 +00:00

test_maskedtensor.py

Fix MaskedTensor to device ignored mask (#151205 )

2025-07-21 21:44:49 +00:00

test_matmul_cuda.py

Fix grouped MM load along K when TMA loads are not used (#159485 )

2025-07-31 17:58:02 +00:00

test_meta.py

[BE][2/6] fix typos in test/ (test/test_*.py) (#157636 )

2025-07-09 11:02:23 +00:00

test_metal.py

Fix unused Python variables in test/[e-z]* (#136964 )

2024-12-18 23:02:30 +00:00

test_mkl_verbose.py

…

test_mkldnn_fusion.py

[4/N] Apply py39 ruff and pyupgrade fixes (#143257 )

2025-01-04 10:47:51 +00:00

test_mkldnn_verbose.py

…

test_mkldnn.py

Enable TF32 as fp32 internal precision for matmul/linear/conv (#157520 )

2025-07-17 08:57:34 +00:00

test_mobile_optimizer.py

Fix unused Python variables in test/[e-z]* (#136964 )

2024-12-18 23:02:30 +00:00

test_model_exports_to_core_aten.py

[Codemod][AddExplicitStrictExportForTrainingInferenceArg] caffe2/ (#149595 )

2025-04-03 23:50:13 +00:00

test_module_tracker.py

Fix unused Python variables in test/[e-z]* (#136964 )

2024-12-18 23:02:30 +00:00

test_modules.py

Disable slow gradcheck for nn.Transformer ModuleInfo (#145531 )

2025-01-25 00:58:03 +00:00

test_monitor.py

Fix unused Python variables in test/[e-z]* (#136964 )

2024-12-18 23:02:30 +00:00

test_mps.py

[MPS] Add grid_sampler_3d for MPS (#160541 )

2025-08-15 16:19:25 +00:00

test_multiprocessing_spawn.py

Test multiprocessing spawn timing fix (#160672 )

2025-08-15 00:11:55 +00:00

test_multiprocessing.py

Revert "[CI] Use setup-python from for Mac tests (#155698 )"

2025-06-12 14:42:32 +00:00

test_namedtensor.py

Fix unused Python variables in test/[e-z]* (#136964 )

2024-12-18 23:02:30 +00:00

test_namedtuple_return_api.py

…

test_native_functions.py

[4/N] Apply py39 ruff and pyupgrade fixes (#143257 )

2025-01-04 10:47:51 +00:00

test_native_mha.py

[ROCm] Update to AOTriton 0.8b (#140172 )

2024-12-06 21:45:18 +00:00

test_nestedtensor.py

[cuDNN][SDPA] cuDNN SDPA refactor/cleanup, nested tensor backward, test priority bump for sm90, sm100 (#149282 )

2025-08-08 22:22:48 +00:00

test_nn.py

[MPS] Add grid_sampler_3d for MPS (#160541 )

2025-08-15 16:19:25 +00:00

test_nnapi.py

[4/N] Apply py39 ruff and pyupgrade fixes (#143257 )

2025-01-04 10:47:51 +00:00

test_numa_binding.py

[ez] Make NUMA signpost parameters JSON serializable (#160710 )

2025-08-15 16:52:43 +00:00

test_numba_integration.py

Fix broken URLs (#152237 )

2025-04-27 09:56:42 +00:00

test_numpy_interop.py

Throw invalid_argument instead of RuntimeError when parameters exceed… (#158267 )

2025-07-25 23:49:46 +00:00

test_openmp.py

Fix unused Python variables in test/[e-z]* (#136964 )

2024-12-18 23:02:30 +00:00

test_openreg.py

[OpenReg] move fallback tests into test_openreg.py (#158441 )

2025-07-25 02:39:41 +00:00

test_ops_fwd_gradients.py

…

test_ops_gradients.py

Enable more nightly tests on s390x (#148452 )

2025-03-18 16:09:39 +00:00

test_ops_jit.py

[BE][2/6] fix typos in test/ (test/test_*.py) (#157636 )

2025-07-09 11:02:23 +00:00

test_ops.py

Relax unclaimed successes in dtype op tests when running under TEST_WITH_DYNAMO/TEST_WITH_INDUCTOR (#159976 )

2025-08-07 02:38:45 +00:00

test_optim.py

Fix test/test_optim.py error message. (#153076 )

2025-05-07 22:46:05 +00:00

test_out_dtype_op.py

[Codemod][AddExplicitStrictExportArg] caffe2/test (#143688 )

2024-12-27 07:58:44 +00:00

test_overrides.py

[BE][2/6] fix typos in test/ (test/test_*.py) (#157636 )

2025-07-09 11:02:23 +00:00

test_package.py

…

test_per_overload_api.py

[BE][2/6] fix typos in test/ (test/test_*.py) (#157636 )

2025-07-09 11:02:23 +00:00

test_prims.py

Fix unused Python variables in test/[e-z]* (#136964 )

2024-12-18 23:02:30 +00:00

test_proxy_tensor.py

[attempt 2] Compute contiguity symbolically to avoid dde, and introduce c++ sym_is_contiguous (#157472 )

2025-07-02 23:12:29 +00:00

test_pruning_op.py

…

test_public_bindings.py

[BE][2/6] fix typos in test/ (test/test_*.py) (#157636 )

2025-07-09 11:02:23 +00:00

test_python_dispatch.py

Remove guard_size_oblivious from default contiguity python check, and add aten.sym_is_contiguous. (#159197 )

2025-08-16 09:15:58 +00:00

test_pytree.py

Preserve Enum types during torch.export serialization and deserialization (#154821 )

2025-06-08 17:30:31 +00:00

test_quantization.py

Remove pytorch quant docs since we are moving to torchao (#157766 )

2025-07-11 03:21:47 +00:00

test_reductions.py

[BE][2/6] fix typos in test/ (test/test_*.py) (#157636 )

2025-07-09 11:02:23 +00:00

test_rename_privateuse1_to_existing_device.py

[Device] Add support for PrivateUse1 device type in parse_type function (#157609 )

2025-07-17 01:27:44 +00:00

test_scatter_gather_ops.py

[BE][2/6] fix typos in test/ (test/test_*.py) (#157636 )

2025-07-09 11:02:23 +00:00

test_schema_check.py

[inductor] slow test some Windows UTs. (#160267 )

2025-08-10 18:35:42 +00:00

test_segment_reductions.py

[BE][2/6] fix typos in test/ (test/test_*.py) (#157636 )

2025-07-09 11:02:23 +00:00

test_serialization.py

added class or module info for functions blocked by weight-only load (#159935 )

2025-08-12 20:52:25 +00:00

test_set_default_mobile_cpu_allocator.py

…

test_shape_ops.py

[Quant] flip: throw runtime error for QUInt4x2 and QUInt2x4 input (#147430 )

2025-02-25 03:47:40 +00:00

test_show_pickle.py

…

test_sort_and_select.py

Add dtype checks in meta dispatch for various ordering ops (#159556 )

2025-08-14 17:06:27 +00:00

test_sparse_csr.py

[BE] remove torch deploy - conditionals (#158288 )

2025-07-29 17:40:49 +00:00

test_sparse_semi_structured.py

[BE] fix remaining flake8 v7 warnings (#159044 )

2025-07-25 02:56:34 +00:00

test_sparse.py

[ROCm] Support large inputs for coalesceValuesKernel (#158281 )

2025-08-14 15:09:16 +00:00

test_spectral_ops.py

fix numpy compatibility for 2d small list indices (#154806 )

2025-06-04 01:58:52 +00:00

test_stateless.py

[BE][2/6] fix typos in test/ (test/test_*.py) (#157636 )

2025-07-09 11:02:23 +00:00

test_static_runtime.py

[4/N] Apply py39 ruff and pyupgrade fixes (#143257 )

2025-01-04 10:47:51 +00:00

test_subclass.py

Fix unused Python variables in test/[e-z]* (#136964 )

2024-12-18 23:02:30 +00:00

test_sympy_utils.py

[BE][2/6] fix typos in test/ (test/test_*.py) (#157636 )

2025-07-09 11:02:23 +00:00

test_tensor_creation_ops.py

[BE][2/6] fix typos in test/ (test/test_*.py) (#157636 )

2025-07-09 11:02:23 +00:00

test_tensorboard.py

Fix test_tensorboard when started w/o tensorboard package (#154709 )

2025-05-30 19:18:43 +00:00

test_tensorexpr_pybind.py

…

test_tensorexpr.py

[BE][2/6] fix typos in test/ (test/test_*.py) (#157636 )

2025-07-09 11:02:23 +00:00

test_testing.py

Fix XPU CI UT test_circular_dependencies (#158189 )

2025-07-13 09:30:57 +00:00

test_throughput_benchmark.py

Fix Throughputbenchmark issue (#144669 )

2025-01-26 03:37:20 +00:00

test_torch.py

[inductor] slow test some Windows UTs. (#160267 )

2025-08-10 18:35:42 +00:00

test_transformers_privateuse1.py

Refactor and Improve the OpenReg Module (#158090 )

2025-07-15 08:10:05 +00:00

test_transformers.py

[Intel GPU] Support SDPA backend selection and priority setting on XPU (#159464 )

2025-08-14 08:55:31 +00:00

test_type_hints.py

Revert "Use absolute path path.resolve() -> path.absolute() (#129409 )"

2025-01-04 14:17:20 +00:00

test_type_info.py

…

test_type_promotion.py

[BE] Raise ValueError from torch.cat meta func (#158249 )

2025-07-20 23:49:18 +00:00

test_typing.py

[BE][2/6] fix typos in test/ (test/test_*.py) (#157636 )

2025-07-09 11:02:23 +00:00

test_unary_ufuncs.py

[inductor] slow test some Windows UTs. (#160267 )

2025-08-10 18:35:42 +00:00

test_utils_config_module.py

Add check that envvar configs are boolean (#145454 )

2025-02-05 19:40:10 +00:00

test_utils_filelock.py

filelock: Make waitcounter variant to use (#139816 )

2024-12-12 01:18:34 +00:00

test_utils.py

[docs] Decorator to create a deprecation warning (#155127 )

2025-06-25 18:09:04 +00:00

test_view_ops.py

unify broadcast_shapes functions and avoid duplicates (#160251 )

2025-08-16 00:54:32 +00:00

test_vulkan.py

Fix unused Python variables in test/[e-z]* (#136964 )

2024-12-18 23:02:30 +00:00

test_weak.py

[BE][2/6] fix typos in test/ (test/test_*.py) (#157636 )

2025-07-09 11:02:23 +00:00

test_xnnpack_integration.py

[BE][Ez]: ISC001 Auto concatenate implicit one line strings (#146408 )

2025-02-04 19:07:04 +00:00

test_xpu.py

Generalize support of background thread in pinned allocator (#160505 )

2025-08-14 02:22:39 +00:00