mirror of
				https://github.com/ggml-org/llama.cpp.git
				synced 2025-10-30 08:42:00 +00:00 
			
		
		
		
	Store layers in VRAM
This commit is contained in:
		| @@ -14,6 +14,8 @@ void   ggml_cuda_mul_mat(const struct ggml_tensor * src0, const struct ggml_tens | ||||
| void * ggml_cuda_host_malloc(size_t size); | ||||
| void   ggml_cuda_host_free(void * ptr); | ||||
|  | ||||
| void ggml_cuda_transform_tensor(struct ggml_tensor * tensor); | ||||
|  | ||||
| #ifdef  __cplusplus | ||||
| } | ||||
| #endif | ||||
|   | ||||
		Reference in New Issue
	
	Block a user
	 JohannesGaessler
					JohannesGaessler