diff --git a/opencl/init.go b/opencl/init.go index 4b8a945..59f05fd 100644 --- a/opencl/init.go +++ b/opencl/init.go @@ -226,6 +226,7 @@ func Init(gpu int) { ClMaxWGNum = ClCUnits ClTotalPE = ClWGSize[2] * ClCUnits if GPUVend == 1 { // Nvidia + ClTotalPE *= 2 if ClMaxWGSize > ClTotalPE { ClMaxWGNum = 1 ClMaxWGSize = ClTotalPE diff --git a/opencl64/init.go b/opencl64/init.go index a42d18a..2ba2e88 100644 --- a/opencl64/init.go +++ b/opencl64/init.go @@ -229,6 +229,7 @@ func Init(gpu int) { ClMaxWGNum = ClCUnits ClTotalPE = ClWGSize[2] * ClCUnits if GPUVend == 1 { // Nvidia + ClTotalPE *= 2 if ClMaxWGSize > ClTotalPE { ClMaxWGNum = 1 ClMaxWGSize = ClTotalPE