mirror of
				https://github.com/ggml-org/llama.cpp.git
				synced 2025-10-31 08:51:55 +00:00 
			
		
		
		
	added missing CUDA_CHECKs
This commit is contained in:
		| @@ -2440,12 +2440,11 @@ GGML_CALL static enum ggml_status ggml_backend_cuda_graph_compute(ggml_backend_t | |||||||
|     // kernel parameters which need to be updated in the graph for each token |     // kernel parameters which need to be updated in the graph for each token | ||||||
|     void* ggmlCudaCpyFn = nullptr; |     void* ggmlCudaCpyFn = nullptr; | ||||||
|  |  | ||||||
|  |  | ||||||
|     if(cudaGraph.count==0){         |     if(cudaGraph.count==0){         | ||||||
|         cudaDeviceProp prop; |         cudaDeviceProp prop; | ||||||
|         int device; |         int device; | ||||||
|         cudaGetDevice(&device); |         CUDA_CHECK(cudaGetDevice(&device)); | ||||||
|         cudaGetDeviceProperties(&prop, device); |         CUDA_CHECK(cudaGetDeviceProperties(&prop, device)); | ||||||
|         if (prop.major < 8){ |         if (prop.major < 8){ | ||||||
|             cudaGraph.disableDueToGpuArch=true; |             cudaGraph.disableDueToGpuArch=true; | ||||||
|         } |         } | ||||||
|   | |||||||
		Reference in New Issue
	
	Block a user
	 Alan Gray
					Alan Gray