Skip to content

Commit

Permalink
Fix SHUF_BLOCKSIZE value
Browse files Browse the repository at this point in the history
  • Loading branch information
0cc4m committed Jun 13, 2023
1 parent 82fa31f commit a09cf75
Showing 1 changed file with 7 additions and 0 deletions.
7 changes: 7 additions & 0 deletions exllama_ext/cuda_func/column_remap.cu
Original file line number Diff line number Diff line change
@@ -1,7 +1,14 @@
#include "column_remap.cuh"
#include "../util.cuh"

// Block-size constants for the column remap code in this file.
// NOTE(review): presumably consumed as launch/tile dimensions by
// column_remap_kernel -- confirm against the launch site.
const int SHUF_BLOCKSIZE_Y = 16;

// The X size is 1024 everywhere except ROCm builds (USE_ROCM defined), which
// use 256: with 1024 the kernel was observed to crash on ROCm with
// "Memory access fault by GPU node-1 (Agent handle: 0x012345678912) on
// address 0x012345678912. Reason: Page not present or supervisor privilege."
#if !defined(USE_ROCM)
const int SHUF_BLOCKSIZE_X = 1024;
#else
const int SHUF_BLOCKSIZE_X = 256;
#endif

__global__ void column_remap_kernel
Expand Down

0 comments on commit a09cf75

Please sign in to comment.