FrozenGene commented on a change in pull request #7132:
URL: https://github.com/apache/tvm/pull/7132#discussion_r546625280
##########
File path: src/auto_scheduler/search_task.cc
##########
@@ -90,6 +90,22 @@ HardwareParams
HardwareParamsNode::GetDefaultHardwareParams(const Target& target
int max_vthread_extent = warp_size / 4;
return HardwareParams(-1, 16, 64, max_shared_memory_per_block,
max_local_memory_per_block,
max_threads_per_block, max_vthread_extent,
warp_size);
+ } else if (target->kind->device_type == kDLOpenCL) {
+ if (target->GetAttr<String>("device", "") == "mali") {
+ // We cannot query the device API for these attributes as we do for CUDA,
+ // because a Mali target is normally on a remote machine
+ int max_shared_memory_per_block = 32768;
+ int max_local_memory_per_block = INT32_MAX; // skip the check on local
memory
+ int max_threads_per_block = 256;
+ int warp_size = 1;
+ int max_vthread_extent = 1;
+ return HardwareParams(-1, 16, 64, max_shared_memory_per_block,
max_local_memory_per_block,
+ max_threads_per_block, max_vthread_extent,
warp_size);
Review comment:
These are the default target parameters for Mali. I will describe how to obtain
these parameters and pass them to `SearchTask` in the Mali tutorial.
----------------------------------------------------------------
This is an automated message from the Apache Git Service.
To respond to the message, please log on to GitHub and use the
URL above to go to the specific comment.
For queries about this service, please contact Infrastructure at:
[email protected]