[ROCm] Add cast to kFloat in amax calculation (#123872)

Adds the necessary cast to kFloat that was missed in the previous amax PR.

Pull Request resolved: https://github.com/pytorch/pytorch/pull/123872
Approved by: https://github.com/drisspg
2025-10-20 21:14:14 +08:00 · 2024-04-12 15:38:41 +00:00
parent b024c0c2ef
commit 2cb3301f80
1 changed files with 1 additions and 1 deletions
--- a/aten/src/ATen/native/cuda/Blas.cpp
+++ b/aten/src/ATen/native/cuda/Blas.cpp
@@ -912,7 +912,7 @@ _scaled_mm_out_cuda(const Tensor& mat1, const Tensor& mat2,

 #if defined(USE_ROCM) && ROCM_VERSION >= 60000
  // rocm's hipblaslt does not yet support amax, so calculate separately
-  amax = at::max(at::abs(out));
+  amax = at::max(at::abs(out.to(kFloat)));
 #endif

  return {out, amax};