Merge branch 'develop' into amoeba-gpu

This commit is contained in:
Trung Nguyen
2022-12-14 13:16:41 -06:00
4848 changed files with 102983 additions and 44974 deletions

View File

@@ -473,8 +473,7 @@ void BaseThreeT::compile_kernels(UCL_Device &dev, const void *pair_str,
mx_subgroup_sz = std::min(mx_subgroup_sz, k_three_center_noev.max_subgroup_size(_block_size));
mx_subgroup_sz = std::min(mx_subgroup_sz, k_three_end_noev.max_subgroup_size(_block_size));
#endif
-if (_threads_per_atom > mx_subgroup_sz)
-_threads_per_atom = mx_subgroup_sz;
+if (_threads_per_atom > (int)mx_subgroup_sz) _threads_per_atom = mx_subgroup_sz;
device->set_simd_size(mx_subgroup_sz);
}
#endif