mirror of
				https://github.com/ggml-org/llama.cpp.git
				synced 2025-10-31 08:51:55 +00:00 
			
		
		
		
	cuda : fix device sync on buffer clear (#14033)
This commit is contained in:
@@ -615,9 +615,8 @@ static void ggml_backend_cuda_buffer_clear(ggml_backend_buffer_t buffer, uint8_t
     ggml_backend_cuda_buffer_context * ctx = (ggml_backend_cuda_buffer_context *)buffer->context;
 
     ggml_cuda_set_device(ctx->device);
-    CUDA_CHECK(cudaDeviceSynchronize());
-    CUDA_CHECK(cudaMemset(ctx->dev_ptr, value, buffer->size));
-    CUDA_CHECK(cudaDeviceSynchronize());
+    CUDA_CHECK(cudaMemsetAsync(ctx->dev_ptr, value, buffer->size, cudaStreamPerThread));
+    CUDA_CHECK(cudaStreamSynchronize(cudaStreamPerThread));
 }
 
 static const ggml_backend_buffer_i ggml_backend_cuda_buffer_interface = {
		Reference in New Issue
	
	Block a user
	 Diego Devesa
					Diego Devesa