mirror of
				https://github.com/ggml-org/llama.cpp.git
				synced 2025-11-03 09:22:01 +00:00 
			
		
		
		
	CUDA: fix CUDART_VERSION checks (#11821)
This commit is contained in:
		@@ -165,11 +165,11 @@ static const char * cu_get_error_str(CUresult err) {
 | 
			
		||||
#define CU_CHECK(err) CUDA_CHECK_GEN(err, CUDA_SUCCESS, cu_get_error_str)
 | 
			
		||||
#endif
 | 
			
		||||
 | 
			
		||||
#if CUDART_VERSION >= 11100 || defined(GGML_USE_MUSA)
 | 
			
		||||
#if CUDART_VERSION >= 11010 || defined(GGML_USE_MUSA)
 | 
			
		||||
#define GGML_CUDA_ASSUME(x) __builtin_assume(x)
 | 
			
		||||
#else
 | 
			
		||||
#define GGML_CUDA_ASSUME(x)
 | 
			
		||||
#endif // CUDART_VERSION >= 11100
 | 
			
		||||
#endif // CUDART_VERSION >= 11010
 | 
			
		||||
 | 
			
		||||
#ifdef GGML_CUDA_F16
 | 
			
		||||
typedef half dfloat; // dequantize float
 | 
			
		||||
 
 | 
			
		||||
		Reference in New Issue
	
	Block a user