Skip to content

Commit

Permalink
Increase max local size of blas-3d batched kernels to 256
Browse files Browse the repository at this point in the history
  • Loading branch information
maddyscientist committed Nov 20, 2024
1 parent 6383489 commit d3f3482
Showing 1 changed file with 3 additions and 2 deletions.
5 changes: 3 additions & 2 deletions include/kernels/blas_3d.cuh
Original file line number Diff line number Diff line change
Expand Up @@ -5,6 +5,7 @@
#include <fast_intdiv.h>
#include <quda_matrix.h>
#include <matrix_field.h>
+ #include <constant_kernel_arg.h>
#include <kernel.h>

namespace quda
Expand Down Expand Up @@ -118,7 +119,7 @@ namespace quda
// Create a typename F for the ColorSpinorFields
typedef typename colorspinor_mapper<Float, nSpin, nColor, spin_project, spinor_direct_load, disable_ghost>::type F;

- static constexpr int MAX_ORTHO_DIM = 128;
+ static constexpr int MAX_ORTHO_DIM = 256;
real a[MAX_ORTHO_DIM];
const F x;
real b[MAX_ORTHO_DIM];
Expand Down Expand Up @@ -173,7 +174,7 @@ namespace quda
// Create a typename F for the ColorSpinorFields
typedef typename colorspinor_mapper<Float, nSpin, nColor, spin_project, spinor_direct_load, disable_ghost>::type F;

- static constexpr int MAX_ORTHO_DIM = 64;
+ static constexpr int MAX_ORTHO_DIM = 256;
complex<real> a[MAX_ORTHO_DIM];
const F x;
complex<real> b[MAX_ORTHO_DIM];
Expand Down

0 comments on commit d3f3482

Please sign in to comment.