Mirror of https://github.com/ggml-org/llama.cpp.git (synced 2025-11-04 09:32:00 +00:00)
			
		
		
		
	remove compile flag
This commit is contained in:
@@ -504,10 +504,6 @@ static struct ggml_backend_metal_context * ggml_metal_init(ggml_backend_dev_t de
                 // dictionary of preprocessor macros
                 NSMutableDictionary * prep = [NSMutableDictionary dictionary];
 
-#if defined(GGML_METAL_FORCE_FATTN_PREC_F16)
-                [prep setObject:@"1" forKey:@"GGML_METAL_FORCE_FATTN_PREC_F16"];
-#endif
-
                 MTLCompileOptions * options = [MTLCompileOptions new];
                 options.preprocessorMacros = prep;
 
@@ -558,11 +554,6 @@ static struct ggml_backend_metal_context * ggml_metal_init(ggml_backend_dev_t de
         }
     }
 
-#if defined(GGML_METAL_FORCE_FATTN_PREC_F16)
-    GGML_LOG_INFO("%s: GGML_METAL_FORCE_FATTN_PREC_F16  = yes\n", __func__);
-#else
-    GGML_LOG_INFO("%s: GGML_METAL_FORCE_FATTN_PREC_F16  = no\n",  __func__);
-#endif
     GGML_LOG_INFO("%s: simdgroup reduction   = %s\n", __func__, ctx_dev->has_simdgroup_reduction     ? "true" : "false");
     GGML_LOG_INFO("%s: simdgroup matrix mul. = %s\n", __func__, ctx_dev->has_simdgroup_mm            ? "true" : "false");
     GGML_LOG_INFO("%s: bfloat                = %s\n", __func__, ctx_dev->has_bfloat                  ? "true" : "false");
@@ -3021,9 +3021,11 @@ kernel void kernel_flash_attn_ext(
                     }
 
                     // cast qk_t -> s_t
-                    s8x8_t mqks(1.0f);
-                    simdgroup_multiply(mqks, mqk, mqks);
-                    simdgroup_store(mqks, ss + 8*cc, TS, 0, false);
+                    //s8x8_t mqks(1.0f);
+                    //simdgroup_multiply(mqks, mqk, mqks);
+                    //simdgroup_store(mqks, ss + 8*cc, TS, 0, false);
+
+                    simdgroup_store(mqk, ss + 8*cc, TS, 0, false);
                 }
             }
 
		Reference in New Issue
	
	Block a user