mirror of
				https://github.com/ggml-org/llama.cpp.git
				synced 2025-10-30 08:42:00 +00:00 
			
		
		
		
	added missing CUDA_CHECKs
This commit is contained in:
		| @@ -2440,12 +2440,11 @@ GGML_CALL static enum ggml_status ggml_backend_cuda_graph_compute(ggml_backend_t | ||||
|     // kernel parameters which need to be updated in the graph for each token | ||||
|     void* ggmlCudaCpyFn = nullptr; | ||||
|  | ||||
|  | ||||
|     if(cudaGraph.count==0){         | ||||
|         cudaDeviceProp prop; | ||||
|         int device; | ||||
|         cudaGetDevice(&device); | ||||
|         cudaGetDeviceProperties(&prop, device); | ||||
|         CUDA_CHECK(cudaGetDevice(&device)); | ||||
|         CUDA_CHECK(cudaGetDeviceProperties(&prop, device)); | ||||
|         if (prop.major < 8){ | ||||
|             cudaGraph.disableDueToGpuArch=true; | ||||
|         } | ||||
|   | ||||
		Reference in New Issue
	
	Block a user
	 Alan Gray
					Alan Gray