mirror of
https://github.com/pytorch/pytorch.git
synced 2025-10-20 21:14:14 +08:00
Change nvcc arch flags for sm100 (#148774)
### Summary
- Addresses this review comment: https://github.com/pytorch/pytorch/pull/148274#discussion_r1984944012

### Test plan
- Verified that building from source with B200s is successful
- Verified that B200 tensor cores are still being utilized properly via a benchmarking script

Pull Request resolved: https://github.com/pytorch/pytorch/pull/148774
Approved by: https://github.com/Skylion007
This commit is contained in:
committed by
PyTorch MergeBot
parent
7ffadff286
commit
148eb735ee
@@ -92,7 +92,7 @@ if(INTERN_BUILD_ATEN_OPS)
|
||||
if(EXISTING_ARCH_FLAGS MATCHES ".*compute_90.*")
|
||||
list(APPEND ROWWISE_SCALED_MM_FILE_COMPILE_FLAGS "-gencode;arch=compute_90a,code=sm_90a")
|
||||
endif()
|
||||
-if(EXISTING_ARCH_FLAGS MATCHES ".*compute_100a.*")
|
||||
+if(EXISTING_ARCH_FLAGS MATCHES ".*compute_100.*")
|
||||
list(APPEND ROWWISE_SCALED_MM_FILE_COMPILE_FLAGS "-gencode;arch=compute_100a,code=sm_100a")
|
||||
endif()
|
||||
endif()
|
||||
|
Reference in New Issue
Block a user