mirror of
				https://github.com/ggml-org/llama.cpp.git
				synced 2025-10-31 08:51:55 +00:00 
			
		
		
		
	| @@ -2703,8 +2703,8 @@ int main(int argc, char ** argv) { | |||||||
|     }; |     }; | ||||||
|  |  | ||||||
|     const auto handle_completions_generic = [&ctx_server, &res_error, &res_ok](server_task_inf_type inf_type, json & data, httplib::Response & res) { |     const auto handle_completions_generic = [&ctx_server, &res_error, &res_ok](server_task_inf_type inf_type, json & data, httplib::Response & res) { | ||||||
|         if (ctx_server.params.embedding || ctx_server.params.reranking) { |         if (ctx_server.params.embedding) { | ||||||
|             res_error(res, format_error_response("This server does not support completions. Start it without `--embeddings` or `--reranking`", ERROR_TYPE_NOT_SUPPORTED)); |             res_error(res, format_error_response("This server does not support completions. Start it without `--embeddings`", ERROR_TYPE_NOT_SUPPORTED)); | ||||||
|             return; |             return; | ||||||
|         } |         } | ||||||
|  |  | ||||||
| @@ -2809,8 +2809,8 @@ int main(int argc, char ** argv) { | |||||||
|  |  | ||||||
|     // TODO: maybe merge this function with "handle_completions_generic" |     // TODO: maybe merge this function with "handle_completions_generic" | ||||||
|     const auto handle_chat_completions = [&ctx_server, &params, &res_error, &res_ok, verbose](const httplib::Request & req, httplib::Response & res) { |     const auto handle_chat_completions = [&ctx_server, &params, &res_error, &res_ok, verbose](const httplib::Request & req, httplib::Response & res) { | ||||||
|         if (ctx_server.params.embedding || ctx_server.params.reranking) { |         if (ctx_server.params.embedding) { | ||||||
|             res_error(res, format_error_response("This server does not support completions. Start it without `--embeddings` or `--reranking`", ERROR_TYPE_NOT_SUPPORTED)); |             res_error(res, format_error_response("This server does not support completions. Start it without `--embeddings`", ERROR_TYPE_NOT_SUPPORTED)); | ||||||
|             return; |             return; | ||||||
|         } |         } | ||||||
|  |  | ||||||
| @@ -2935,11 +2935,6 @@ int main(int argc, char ** argv) { | |||||||
|     }; |     }; | ||||||
|  |  | ||||||
|     const auto handle_embeddings = [&ctx_server, &res_error, &res_ok](const httplib::Request & req, httplib::Response & res) { |     const auto handle_embeddings = [&ctx_server, &res_error, &res_ok](const httplib::Request & req, httplib::Response & res) { | ||||||
|         // TODO: somehow clean up this checks in the future |  | ||||||
|         if (!ctx_server.params.embedding || ctx_server.params.reranking) { |  | ||||||
|             res_error(res, format_error_response("This server does not support embeddings. Start it with `--embeddings` and without `--reranking`", ERROR_TYPE_NOT_SUPPORTED)); |  | ||||||
|             return; |  | ||||||
|         } |  | ||||||
|         const json body = json::parse(req.body); |         const json body = json::parse(req.body); | ||||||
|         bool is_openai = false; |         bool is_openai = false; | ||||||
|  |  | ||||||
| @@ -2991,10 +2986,11 @@ int main(int argc, char ** argv) { | |||||||
|     }; |     }; | ||||||
|  |  | ||||||
|     const auto handle_rerank = [&ctx_server, &res_error, &res_ok](const httplib::Request & req, httplib::Response & res) { |     const auto handle_rerank = [&ctx_server, &res_error, &res_ok](const httplib::Request & req, httplib::Response & res) { | ||||||
|         if (!ctx_server.params.reranking) { |         if (!ctx_server.params.reranking || ctx_server.params.embedding) { | ||||||
|             res_error(res, format_error_response("This server does not support reranking. Start it with `--reranking`", ERROR_TYPE_NOT_SUPPORTED)); |             res_error(res, format_error_response("This server does not support reranking. Start it with `--reranking` and without `--embedding`", ERROR_TYPE_NOT_SUPPORTED)); | ||||||
|             return; |             return; | ||||||
|         } |         } | ||||||
|  |  | ||||||
|         const json body = json::parse(req.body); |         const json body = json::parse(req.body); | ||||||
|  |  | ||||||
|         // TODO: implement |         // TODO: implement | ||||||
|   | |||||||
		Reference in New Issue
	
	Block a user
	 Georgi Gerganov
					Georgi Gerganov