mirror of
https://git.datalinker.icu/vllm-project/vllm.git
synced 2026-06-07 23:02:15 +08:00
Missing comment explaining VDR variable in GGUF kernels (#13290)
This commit is contained in:
parent
31aa045c11
commit
1cdc88614a
@@ -37,6 +37,8 @@ static __device__ __forceinline__ int get_int_from_uint8_aligned(const uint8_t *
|
|||||||
return *((const int *) (x8 + sizeof(int) * i32)); // assume at least 4 byte alignment
|
return *((const int *) (x8 + sizeof(int) * i32)); // assume at least 4 byte alignment
|
||||||
}
|
}
|
||||||
|
|
||||||
|
// VDR = vec dot ratio, how many contiguous integers each thread processes when the vec dot kernel is called
|
||||||
|
// MMVQ = mul_mat_vec_q, MMQ = mul_mat_q
|
||||||
|
|
||||||
#define VDR_Q4_0_Q8_1_MMVQ 2
|
#define VDR_Q4_0_Q8_1_MMVQ 2
|
||||||
#define VDR_Q4_0_Q8_1_MMQ 4
|
#define VDR_Q4_0_Q8_1_MMQ 4
|
||||||
|
|||||||
Loading…
x
Reference in New Issue
Block a user