This is an automated email from the ASF dual-hosted git repository.

masahi pushed a commit to branch unity
in repository https://gitbox.apache.org/repos/asf/tvm.git

commit 1fda9ad03ee19bc450454b05f8d25182394ec856
Author: Masahiro Masuda <masahi...@gmail.com>
AuthorDate: Wed Nov 29 10:20:38 2023 +0000

    fix fp32 accum not getting enabled
---
 src/runtime/contrib/cublas/cublas.cc | 8 ++++----
 1 file changed, 4 insertions(+), 4 deletions(-)

diff --git a/src/runtime/contrib/cublas/cublas.cc b/src/runtime/contrib/cublas/cublas.cc
index f4b28d29a8..b5aed23767 100644
--- a/src/runtime/contrib/cublas/cublas.cc
+++ b/src/runtime/contrib/cublas/cublas.cc
@@ -165,10 +165,10 @@ void CallCublasLt(cublasLtHandle_t hdl, cudaStream_t stream, const DLTensor* A,
   if (TypeMatch(C->dtype, kDLFloat, 16)) {
     // Disable fp16 accum to align with PT
     c_type = CUDA_R_16F;
-    compute_type = CUBLAS_COMPUTE_16F;
-    scale_type = CUDA_R_16F;
-    alpha = &one_fp16;
-    beta = &zero_fp16;
+    // compute_type = CUBLAS_COMPUTE_16F;
+    // scale_type = CUDA_R_16F;
+    // alpha = &one_fp16;
+    // beta = &zero_fp16;
   } else if (TypeMatch(C->dtype, kDLInt, 32)) {
     c_type = CUDA_R_32I;
     compute_type = CUBLAS_COMPUTE_32I;

Reply via email to