From 3852a35e388dfb12115a476a041000a9d0375521 Mon Sep 17 00:00:00 2001 From: William F Godoy Date: Mon, 1 Jul 2024 16:33:32 -0400 Subject: [PATCH] Reorder AMDGPU gridsize --- ext/JACCAMDGPU/JACCAMDGPU.jl | 4 ++-- 1 file changed, 2 insertions(+), 2 deletions(-) diff --git a/ext/JACCAMDGPU/JACCAMDGPU.jl b/ext/JACCAMDGPU/JACCAMDGPU.jl index e65116b..66b0559 100644 --- a/ext/JACCAMDGPU/JACCAMDGPU.jl +++ b/ext/JACCAMDGPU/JACCAMDGPU.jl @@ -33,9 +33,9 @@ function JACC.parallel_for( (L, M, N)::Tuple{I, I, I}, f::F, x...) where { I <: Integer, F <: Function} numThreads = 32 - Lthreads = min(L, numThreads) + Lthreads = 1 Mthreads = min(M, numThreads) - Nthreads = 1 + Nthreads = min(N, numThreads) Lblocks = ceil(Int, L / Lthreads) Mblocks = ceil(Int, M / Mthreads) Nblocks = ceil(Int, N / Nthreads)