mirror of
				https://github.com/ggml-org/llama.cpp.git
				synced 2025-10-31 08:51:55 +00:00 
			
		
		
		
	Increase 3B scratch buffers. (#1698)
The previous 128 MB scratch buffer size for the 3B model was too optimistic, so it is raised to 256 MB. Unfortunately, the required size is not computed dynamically.
This commit is contained in:
		| @@ -63,7 +63,7 @@ static const size_t MB = 1024*1024; | |||||||
| static const std::map<e_model, size_t> & MEM_REQ_SCRATCH0() | static const std::map<e_model, size_t> & MEM_REQ_SCRATCH0() | ||||||
| { | { | ||||||
|     static std::map<e_model, size_t> k_sizes = { |     static std::map<e_model, size_t> k_sizes = { | ||||||
|         { MODEL_3B,    128ull * MB }, |         { MODEL_3B,    256ull * MB }, | ||||||
|         { MODEL_7B,    512ull * MB }, |         { MODEL_7B,    512ull * MB }, | ||||||
|         { MODEL_13B,   512ull * MB }, |         { MODEL_13B,   512ull * MB }, | ||||||
|         { MODEL_30B,   512ull * MB }, |         { MODEL_30B,   512ull * MB }, | ||||||
| @@ -75,7 +75,7 @@ static const std::map<e_model, size_t> & MEM_REQ_SCRATCH0() | |||||||
| static const std::map<e_model, size_t> & MEM_REQ_SCRATCH1() | static const std::map<e_model, size_t> & MEM_REQ_SCRATCH1() | ||||||
| { | { | ||||||
|     static std::map<e_model, size_t> k_sizes = { |     static std::map<e_model, size_t> k_sizes = { | ||||||
|         { MODEL_3B,    128ull * MB }, |         { MODEL_3B,    256ull * MB }, | ||||||
|         { MODEL_7B,    512ull * MB }, |         { MODEL_7B,    512ull * MB }, | ||||||
|         { MODEL_13B,   512ull * MB }, |         { MODEL_13B,   512ull * MB }, | ||||||
|         { MODEL_30B,   512ull * MB }, |         { MODEL_30B,   512ull * MB }, | ||||||
|   | |||||||
		Reference in New Issue
	
	Block a user
	 Henri Vasserman
					Henri Vasserman