Skip to content

Commit

Permalink
#5 Consistent veclen across functions.
Browse files Browse the repository at this point in the history
Should be placed in a configuration somewhere, so that if it's updated, it's applied across.
  • Loading branch information
carljohnsen committed Sep 10, 2024
1 parent 656865a commit 8c90bdf
Showing 1 changed file with 3 additions and 3 deletions.
6 changes: 3 additions & 3 deletions src/lib/cpp/gpu/diffusion.cc
Original file line number Diff line number Diff line change
Expand Up @@ -122,7 +122,7 @@ namespace gpu {
// Assumes that the x dimension is a multiple of veclen.
constexpr int32_t
worklen = 1,
veclen = 64,
veclen = 32,
max_k = 32,
sqvec = max_k*veclen;
const int32_t
Expand Down Expand Up @@ -175,7 +175,7 @@ namespace gpu {
// Assumes that the x dimension is a multiple of veclen.
constexpr int32_t
worklen = 1,
veclen = 64,
veclen = 32,
max_k = 32,
sqvec = max_k*veclen;
const int32_t
Expand Down Expand Up @@ -726,7 +726,7 @@ namespace gpu {
}

void diffusion_out_of_core(uint8_t *__restrict__ voxels, const shape_t &total_shape, const shape_t &global_shape, const float *__restrict__ kernel, const int64_t kernel_size, const int64_t repititions, uint16_t *__restrict__ output) {
constexpr int32_t veclen = 64; // TODO
constexpr int32_t veclen = 32; // TODO
const shape_t
total_shape_padded = {total_shape.z, total_shape.y, (total_shape.x + veclen - 1) / veclen * veclen},
global_shape_padded = {global_shape.z+kernel_size-1, global_shape.y, (global_shape.x + veclen - 1) / veclen * veclen};
Expand Down

0 comments on commit 8c90bdf

Please sign in to comment.