|
common.cuh
|
cuda : try to fix __hgt2_mask
|
2024-04-23 09:18:55 +03:00 |
|
convert.cuh
|
llama : add Command R Plus support (#6491)
|
2024-04-09 11:16:13 +03:00 |
|
dmmv.cu
|
llama : add Command R Plus support (#6491)
|
2024-04-09 11:16:13 +03:00 |
|
dmmv.cuh
|
sync : ggml (#6351)
|
2024-03-29 17:45:46 +02:00 |
|
fattn.cu
|
cuda : "constexpr dim3" -> "const dim3"
|
2024-04-22 20:31:23 +03:00 |
|
fattn.cuh
|
cuda : fix build
|
2024-03-27 10:31:52 +02:00 |
|
mmvq.cu
|
IQ1_M: 1.75 bpw quantization (#6302)
|
2024-03-26 15:21:27 +01:00 |
|
quantize.cu
|
llama : add Command R Plus support (#6491)
|
2024-04-09 11:16:13 +03:00 |
|
quantize.cuh
|
llama : add Command R Plus support (#6491)
|
2024-04-09 11:16:13 +03:00 |
|
softmax.cu
|
ggml : ggml_soft_max support F16/F32 mask/pos
|
2024-04-22 14:53:11 +03:00 |
|
vecdotq.cuh
|
IQ1_M: 1.75 bpw quantization (#6302)
|
2024-03-26 15:21:27 +01:00 |