mirror of
https://github.com/ggml-org/llama.cpp.git
synced 2025-10-29 08:41:22 +00:00
CUDA: fix compilation on CC 6.0 (#16091)
This commit is contained in:
@@ -35,7 +35,6 @@ static int fattn_tile_get_kq_stride_host(const int D, const int ncols, const int
|
|||||||
switch (D) {
|
switch (D) {
|
||||||
case 64:
|
case 64:
|
||||||
case 128:
|
case 128:
|
||||||
return 128;
|
|
||||||
case 256:
|
case 256:
|
||||||
return ncols <= 16 ? 128 : 64;
|
return ncols <= 16 ? 128 : 64;
|
||||||
default:
|
default:
|
||||||
@@ -86,7 +85,6 @@ static constexpr __device__ int fattn_tile_get_kq_stride_device(int D, int ncols
|
|||||||
switch (D) {
|
switch (D) {
|
||||||
case 64:
|
case 64:
|
||||||
case 128:
|
case 128:
|
||||||
return 128;
|
|
||||||
case 256:
|
case 256:
|
||||||
return ncols <= 16 ? 128 : 64;
|
return ncols <= 16 ? 128 : 64;
|
||||||
default:
|
default:
|
||||||
|
|||||||
Reference in New Issue
Block a user