Skip to content

Commit

Permalink
Merge remote-tracking branch 'quarticcat/master' into master2
Browse files Browse the repository at this point in the history
# Conflicts:
#	exllama_ext/cuda_func/q4_matmul.cu
  • Loading branch information
turboderp committed Sep 8, 2023
2 parents 93dbb26 + 8e37f2d commit b12acc6
Showing 1 changed file with 2 additions and 2 deletions.
4 changes: 2 additions & 2 deletions exllama_ext/cuda_func/q4_matmul.cu
Original file line number Diff line number Diff line change
Expand Up @@ -8,10 +8,10 @@
#include "../hip_compat.cuh"
#endif

-const int THREADS_X = 128; // Block size and thread count along columns in w and out
+const int THREADS_X = 32; // Block size and thread count along columns in w and out
const int THREADS_Y = 1; // Block size and thread count along rows in x and out

-const int GROUP_STEP = 128; // Assumed group size when block_size_z % groupsize != 0
+const int GROUP_STEP = 32; // Assumed group size when block_size_z % groupsize != 0

typedef void (*fp_q4_matmul_kernel)
(
Expand Down

0 comments on commit b12acc6

Please sign in to comment.