mirror of
https://github.com/ggml-org/llama.cpp.git
synced 2025-11-04 09:32:00 +00:00
remove compile flag
This commit is contained in:
@@ -504,10 +504,6 @@ static struct ggml_backend_metal_context * ggml_metal_init(ggml_backend_dev_t de
|
|||||||
// dictionary of preprocessor macros
|
// dictionary of preprocessor macros
|
||||||
NSMutableDictionary * prep = [NSMutableDictionary dictionary];
|
NSMutableDictionary * prep = [NSMutableDictionary dictionary];
|
||||||
|
|
||||||
#if defined(GGML_METAL_FORCE_FATTN_PREC_F16)
|
|
||||||
[prep setObject:@"1" forKey:@"GGML_METAL_FORCE_FATTN_PREC_F16"];
|
|
||||||
#endif
|
|
||||||
|
|
||||||
MTLCompileOptions * options = [MTLCompileOptions new];
|
MTLCompileOptions * options = [MTLCompileOptions new];
|
||||||
options.preprocessorMacros = prep;
|
options.preprocessorMacros = prep;
|
||||||
|
|
||||||
@@ -558,11 +554,6 @@ static struct ggml_backend_metal_context * ggml_metal_init(ggml_backend_dev_t de
|
|||||||
}
|
}
|
||||||
}
|
}
|
||||||
|
|
||||||
#if defined(GGML_METAL_FORCE_FATTN_PREC_F16)
|
|
||||||
GGML_LOG_INFO("%s: GGML_METAL_FORCE_FATTN_PREC_F16 = yes\n", __func__);
|
|
||||||
#else
|
|
||||||
GGML_LOG_INFO("%s: GGML_METAL_FORCE_FATTN_PREC_F16 = no\n", __func__);
|
|
||||||
#endif
|
|
||||||
GGML_LOG_INFO("%s: simdgroup reduction = %s\n", __func__, ctx_dev->has_simdgroup_reduction ? "true" : "false");
|
GGML_LOG_INFO("%s: simdgroup reduction = %s\n", __func__, ctx_dev->has_simdgroup_reduction ? "true" : "false");
|
||||||
GGML_LOG_INFO("%s: simdgroup matrix mul. = %s\n", __func__, ctx_dev->has_simdgroup_mm ? "true" : "false");
|
GGML_LOG_INFO("%s: simdgroup matrix mul. = %s\n", __func__, ctx_dev->has_simdgroup_mm ? "true" : "false");
|
||||||
GGML_LOG_INFO("%s: bfloat = %s\n", __func__, ctx_dev->has_bfloat ? "true" : "false");
|
GGML_LOG_INFO("%s: bfloat = %s\n", __func__, ctx_dev->has_bfloat ? "true" : "false");
|
||||||
|
|||||||
@@ -3021,9 +3021,11 @@ kernel void kernel_flash_attn_ext(
|
|||||||
}
|
}
|
||||||
|
|
||||||
// cast qk_t -> s_t
|
// cast qk_t -> s_t
|
||||||
s8x8_t mqks(1.0f);
|
//s8x8_t mqks(1.0f);
|
||||||
simdgroup_multiply(mqks, mqk, mqks);
|
//simdgroup_multiply(mqks, mqk, mqks);
|
||||||
simdgroup_store(mqks, ss + 8*cc, TS, 0, false);
|
//simdgroup_store(mqks, ss + 8*cc, TS, 0, false);
|
||||||
|
|
||||||
|
simdgroup_store(mqk, ss + 8*cc, TS, 0, false);
|
||||||
}
|
}
|
||||||
}
|
}
|
||||||
|
|
||||||
|
|||||||
Reference in New Issue
Block a user