Change nvcc arch flags for sm100 (#148774)

### Summary
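- Addresses this review comment: https://github.com/pytorch/pytorch/pull/148274#discussion_r1984944012
- The `-gencode;arch=compute_100a,code=sm_100a` flags are now appended to `ROWWISE_SCALED_MM_FILE_COMPILE_FLAGS` whenever the existing arch flags match `compute_100` (a pattern that also covers `compute_100a`), instead of only when they match `compute_100a`.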

### Test plan
- Verified that building from source with B200 GPUs succeeds
- Verified via a benchmarking script that the B200 Tensor Cores are still being utilized properly

Pull Request resolved: https://github.com/pytorch/pytorch/pull/148774
Approved by: https://github.com/Skylion007
This commit is contained in:
Daniel Vega-Myhre
2025-03-08 19:05:51 +00:00
committed by PyTorch MergeBot
parent 7ffadff286
commit 148eb735ee

View File

@@ -92,7 +92,7 @@ if(INTERN_BUILD_ATEN_OPS)
 if(EXISTING_ARCH_FLAGS MATCHES ".*compute_90.*")
 list(APPEND ROWWISE_SCALED_MM_FILE_COMPILE_FLAGS "-gencode;arch=compute_90a,code=sm_90a")
 endif()
-if(EXISTING_ARCH_FLAGS MATCHES ".*compute_100a.*")
+if(EXISTING_ARCH_FLAGS MATCHES ".*compute_100.*")
 list(APPEND ROWWISE_SCALED_MM_FILE_COMPILE_FLAGS "-gencode;arch=compute_100a,code=sm_100a")
 endif()
 endif()