This is an automated email from the ASF dual-hosted git repository. masahi pushed a commit to branch unity in repository https://gitbox.apache.org/repos/asf/tvm.git
commit 1fda9ad03ee19bc450454b05f8d25182394ec856
Author: Masahiro Masuda <masahi...@gmail.com>
AuthorDate: Wed Nov 29 10:20:38 2023 +0000

    fix fp32 accum not getting enabled
---
 src/runtime/contrib/cublas/cublas.cc | 8 ++++----
 1 file changed, 4 insertions(+), 4 deletions(-)

diff --git a/src/runtime/contrib/cublas/cublas.cc b/src/runtime/contrib/cublas/cublas.cc
index f4b28d29a8..b5aed23767 100644
--- a/src/runtime/contrib/cublas/cublas.cc
+++ b/src/runtime/contrib/cublas/cublas.cc
@@ -165,10 +165,10 @@ void CallCublasLt(cublasLtHandle_t hdl, cudaStream_t stream, const DLTensor* A,
   if (TypeMatch(C->dtype, kDLFloat, 16)) {
     // Disable fp16 accum to align with PT
     c_type = CUDA_R_16F;
-    compute_type = CUBLAS_COMPUTE_16F;
-    scale_type = CUDA_R_16F;
-    alpha = &one_fp16;
-    beta = &zero_fp16;
+    // compute_type = CUBLAS_COMPUTE_16F;
+    // scale_type = CUDA_R_16F;
+    // alpha = &one_fp16;
+    // beta = &zero_fp16;
   } else if (TypeMatch(C->dtype, kDLInt, 32)) {
     c_type = CUDA_R_32I;
     compute_type = CUBLAS_COMPUTE_32I;