mirror of
				https://github.com/ggml-org/llama.cpp.git
				synced 2025-10-30 08:42:00 +00:00 
			
		
		
		
	Fix NVCC version in Makefile; replace __halves2half2 with make_half2
This commit is contained in:
		
							
								
								
									
										1
									
								
								Makefile
									
									
									
									
									
								
							
							
						
						
									
										1
									
								
								Makefile
									
									
									
									
									
								
							| @@ -176,6 +176,7 @@ ifdef LLAMA_CUDA | |||||||
| 	OBJS      += ggml-cuda.o | 	OBJS      += ggml-cuda.o | ||||||
| 	NVCC      = nvcc | 	NVCC      = nvcc | ||||||
| 	NVCCFLAGS = --forward-unknown-to-host-compiler | 	NVCCFLAGS = --forward-unknown-to-host-compiler | ||||||
|  | 	NVCCV 	  := $(shell $(NVCC) --version | tail -n 1) | ||||||
| ifdef LLAMA_DEBUG | ifdef LLAMA_DEBUG | ||||||
| 	NVCCFLAGS += -lineinfo | 	NVCCFLAGS += -lineinfo | ||||||
| endif # LLAMA_DEBUG | endif # LLAMA_DEBUG | ||||||
|   | |||||||
| @@ -14,7 +14,7 @@ template<> struct vec2_t_impl<float>  { typedef float2 type; }; | |||||||
| template<typename T> using vec2_t = typename vec2_t_impl<T>::type; | template<typename T> using vec2_t = typename vec2_t_impl<T>::type; | ||||||
|  |  | ||||||
| template<typename T> inline __host__ __device__ vec2_t<T> make_vec2_t(const T & x, const T & y); | template<typename T> inline __host__ __device__ vec2_t<T> make_vec2_t(const T & x, const T & y); | ||||||
| template<> inline __host__ __device__ vec2_t<half>  make_vec2_t(const  half & x, const  half & y) { return __halves2half2(x, y); } | template<> inline __host__ __device__ vec2_t<half>  make_vec2_t(const  half & x, const  half & y) { return make_half2 (x, y); } | ||||||
| template<> inline __host__ __device__ vec2_t<float> make_vec2_t(const float & x, const float & y) { return make_float2(x, y); } | template<> inline __host__ __device__ vec2_t<float> make_vec2_t(const float & x, const float & y) { return make_float2(x, y); } | ||||||
|  |  | ||||||
| // the cuda headers define operators for half2, but not for float2 | // the cuda headers define operators for half2, but not for float2 | ||||||
|   | |||||||
		Reference in New Issue
	
	Block a user
	 slaren
					slaren