This is an automated email from the ASF dual-hosted git repository.
tqchen pushed a commit to branch main
in repository https://gitbox.apache.org/repos/asf/tvm.git
The following commit(s) were added to refs/heads/main by this push:
new 21c12fb124 [Bugfix][Cutlass] fix cutlass instantiate attention template bugs (#17229)
21c12fb124 is described below
commit 21c12fb1243a79df2aea8b83956c6b0b914cf4a5
Author: senlyu163 <[email protected]>
AuthorDate: Sat Aug 3 20:45:36 2024 +0800
[Bugfix][Cutlass] fix cutlass instantiate attention template bugs (#17229)
[Bugfix][Cutlass] fix cutlass attention template
---
python/tvm/contrib/cutlass/attention_operation.py | 2 +-
1 file changed, 1 insertion(+), 1 deletion(-)
diff --git a/python/tvm/contrib/cutlass/attention_operation.py b/python/tvm/contrib/cutlass/attention_operation.py
index 518778ec52..69298453cb 100644
--- a/python/tvm/contrib/cutlass/attention_operation.py
+++ b/python/tvm/contrib/cutlass/attention_operation.py
@@ -111,7 +111,7 @@ def instantiate_attention_template(attrs):
if (accumulator_buf_size <= ${workspace}->shape[0]) {
p.output_accum_ptr = static_cast<float*>(${workspace}->data);
} else {
- accumulator_buf_size = true;
+ accumulator_buf_allocated = true;
cudaMalloc(
&p.output_accum_ptr,
accumulator_buf_size