Skip to content

Commit ba10833

Browse files
Add comment for GGML_CUDA_DMMV_BLOCK_Y
1 parent 7ec5b63 commit ba10833

File tree

1 file changed

+3
-1
lines changed

1 file changed

+3
-1
lines changed

ggml-cuda.cu

+3 -1
Original file line numberDiff line numberDiff line change
@@ -84,7 +84,9 @@ typedef struct {
 static_assert(sizeof(block_q8_0) == sizeof(float) + QK8_0, "wrong q8_0 block size/padding");
 
 #define CUDA_DEQUANTIZE_BLOCK_SIZE 256
-#define GGML_CUDA_DMMV_BLOCK_X 32 // dmmv = dequantize_mul_mat_vec
+// dmmv = dequantize_mul_mat_vec
+#define GGML_CUDA_DMMV_BLOCK_X 32
+// #define GGML_CUDA_DMMV_BLOCK_Y 1 // This is defined by make/cmake
 
 static __device__ void dequantize_q4_0(const void * vx, const int ib, const int iqs, float & v0, float & v1){
     const block_q4_0 * x = (const block_q4_0 *) vx;

0 commit comments

Comments
 (0)