mirror of
				https://github.com/ggml-org/llama.cpp.git
				synced 2025-10-31 08:51:55 +00:00 
			
		
		
		
	CUDA: fix DEBUG_CUDA_MALLOC (#5729)
This commit is contained in:
@@ -8079,8 +8079,8 @@ static void * ggml_cuda_pool_malloc_leg(int device, size_t size, size_t * actual
     *actual_size = look_ahead_size;
     g_cuda_pool_size[device] += look_ahead_size;
 #ifdef DEBUG_CUDA_MALLOC
-    fprintf(stderr, "%s[%d]: %d buffers, max_size = %u MB, pool_size = %u MB, requested %u MB\n", __func__, id, nnz,
-            (uint32_t)(max_size/1024/1024), (uint32_t)(g_cuda_pool_size[id]/1024/1024), (uint32_t)(size/1024/1024));
+    fprintf(stderr, "%s[%d]: %d buffers, max_size = %u MB, pool_size = %u MB, requested %u MB\n", __func__, device, nnz,
+            (uint32_t)(max_size/1024/1024), (uint32_t)(g_cuda_pool_size[device]/1024/1024), (uint32_t)(size/1024/1024));
 #endif
     return ptr;
 }
@@ -8166,7 +8166,7 @@ static void * ggml_cuda_pool_malloc_vmm(int device, size_t size, size_t * actual
     g_cuda_pool_used[device] += size;
 
 #ifdef DEBUG_CUDA_MALLOC
-    printf("cuda pool[%d]: allocated %llu bytes at %llx [%s]\n", id, (unsigned long long) size, ptr);
+    printf("cuda pool[%d]: allocated %llu bytes at %llx\n", device, (unsigned long long) size, ptr);
 #endif
 
     return ptr;
@@ -8176,7 +8176,7 @@ static void ggml_cuda_pool_free_vmm(int device, void * ptr, size_t size) {
     scoped_spin_lock lock(g_cuda_pool_lock);
 
 #ifdef DEBUG_CUDA_MALLOC
-    printf("cuda pool[%d]: freed %llu bytes at %llx\n", id, (unsigned long long) size, ptr);
+    printf("cuda pool[%d]: freed %llu bytes at %llx\n", device, (unsigned long long) size, ptr);
 #endif
 
     g_cuda_pool_used[device] -= size;
|   | |||||||
		Reference in New Issue
	
	Block a user
	 Johannes Gäßler
					Johannes Gäßler