mirror of
				https://github.com/ggml-org/llama.cpp.git
				synced 2025-10-30 08:42:00 +00:00 
			
		
		
		
	server : return error on too large embedding input (#7389)
This commit is contained in:
		| @@ -1981,8 +1981,7 @@ struct server_context { | ||||
|                                 slot.state = SLOT_STATE_PROCESSING; | ||||
|                                 slot.command = SLOT_COMMAND_NONE; | ||||
|                                 slot.release(); | ||||
|-                                slot.print_timings(); | ||||
|-                                send_final_response(slot); | ||||
|+                                send_error(slot, "input is too large to process. increase the physical batch size", ERROR_TYPE_SERVER); | ||||
|                                 continue; | ||||
|                             } | ||||
|                         } else { | ||||
|   | ||||
		Reference in New Issue
	
	Block a user
	 Georgi Gerganov
					Georgi Gerganov