Skip to content

Commit

Permalink
Add comment for GGML_CUDA_DMMV_BLOCK_Y
Browse files (browse the repository at this point in the history)
  • Loading branch information
JohannesGaessler committed May 20, 2023
1 parent 7ec5b63 commit ba10833
Showing 1 changed file with 3 additions and 1 deletion.
4 changes: 3 additions & 1 deletion ggml-cuda.cu
Original file line number | Diff line number | Diff line change
Expand Up @@ -84,7 +84,9 @@ typedef struct {
static_assert(sizeof(block_q8_0) == sizeof(float) + QK8_0, "wrong q8_0 block size/padding");

#define CUDA_DEQUANTIZE_BLOCK_SIZE 256
-#define GGML_CUDA_DMMV_BLOCK_X 32 // dmmv = dequantize_mul_mat_vec
+// dmmv = dequantize_mul_mat_vec
+#define GGML_CUDA_DMMV_BLOCK_X 32
+// #define GGML_CUDA_DMMV_BLOCK_Y 1 // This is defined by make/cmake

static __device__ void dequantize_q4_0(const void * vx, const int ib, const int iqs, float & v0, float & v1){
const block_q4_0 * x = (const block_q4_0 *) vx;
Expand Down

0 comments on commit ba10833

Please sign in to comment.