Mirror of https://github.com/ggml-org/llama.cpp.git (synced 2025-10-31 08:51:55 +00:00)
			
		
		
		
	cvector: better prompt handling, add "mean vector" method (#8069)
* remove completions file
* fix inverted vector
* add mean method
* code style
* remove inverted pca hotfix
This commit is contained in:
		| @@ -1263,11 +1263,6 @@ bool gpt_params_find_arg(int argc, char ** argv, const std::string & arg, gpt_pa | ||||
|         return true; | ||||
|     } | ||||
|     // cvector params | ||||
|     if (arg == "--completions-file") { | ||||
|         CHECK_ARG | ||||
|         params.cvector_completions_file = argv[i]; | ||||
|         return true; | ||||
|     } | ||||
|     if (arg == "--positive-file") { | ||||
|         CHECK_ARG | ||||
|         params.cvector_positive_file = argv[i]; | ||||
| @@ -1278,11 +1273,6 @@ bool gpt_params_find_arg(int argc, char ** argv, const std::string & arg, gpt_pa | ||||
|         params.cvector_negative_file = argv[i]; | ||||
|         return true; | ||||
|     } | ||||
|     if (arg == "--completions") { | ||||
|         CHECK_ARG | ||||
|         params.n_completions = std::stoi(argv[i]); | ||||
|         return true; | ||||
|     } | ||||
|     if (arg == "--pca-batch") { | ||||
|         CHECK_ARG | ||||
|         params.n_pca_batch = std::stoi(argv[i]); | ||||
| @@ -1293,6 +1283,14 @@ bool gpt_params_find_arg(int argc, char ** argv, const std::string & arg, gpt_pa | ||||
|         params.n_pca_iterations = std::stoi(argv[i]); | ||||
|         return true; | ||||
|     } | ||||
|     if (arg == "--method") { | ||||
|         CHECK_ARG | ||||
|         std::string value(argv[i]); | ||||
|         /**/ if (value == "pca") { params.cvector_dimre_method = DIMRE_METHOD_PCA; } | ||||
|         else if (value == "mean") { params.cvector_dimre_method = DIMRE_METHOD_MEAN; } | ||||
|         else { invalid_param = true; } | ||||
|         return true; | ||||
|     } | ||||
| #ifndef LOG_DISABLE_LOGS | ||||
|     // Parse args for logging parameters | ||||
|     if (log_param_single_parse(argv[i])) { | ||||
| @@ -1626,11 +1624,9 @@ void gpt_params_print_usage(int /*argc*/, char ** argv, const gpt_params & param | ||||
|     options.push_back({ "cvector",     "-o,    --output FNAME",         "output file (default: '%s')", params.cvector_outfile.c_str() }); | ||||
|     options.push_back({ "cvector",     "       --positive-file FNAME",  "positive prompts file, one prompt per line (default: '%s')", params.cvector_positive_file.c_str() }); | ||||
|     options.push_back({ "cvector",     "       --negative-file FNAME",  "negative prompts file, one prompt per line (default: '%s')", params.cvector_negative_file.c_str() }); | ||||
|     options.push_back({ "cvector",     "       --completions-file FNAME", | ||||
|                                                                         "completions file (default: '%s')", params.cvector_completions_file.c_str() }); | ||||
|     options.push_back({ "cvector",     "       --completions N",        "number of lines of completions file to use (default: %d)", params.n_completions }); | ||||
|     options.push_back({ "cvector",     "       --pca-batch N",          "batch size used for PCA. Larger batch runs faster, but uses more memory (default: %d)", params.n_pca_batch }); | ||||
|     options.push_back({ "cvector",     "       --pca-iter N",           "number of iterations used for PCA (default: %d)", params.n_pca_iterations }); | ||||
|     options.push_back({ "cvector",     "       --method {pca,mean}",    "dimensionality reduction method to be used (default: pca)" }); | ||||
|  | ||||
|     printf("usage: %s [options]\n", argv[0]); | ||||
|  | ||||
|   | ||||
		Reference in New Issue
	
	Block a user
	 Xuan Son Nguyen
					Xuan Son Nguyen