mirror of
				https://github.com/ggml-org/llama.cpp.git
				synced 2025-10-27 08:21:30 +00:00 
			
		
		
		
	 64e7b47c69
			
		
	
	64e7b47c69
	
	
	
		
			
			* add `retrieval` example * add README * minor fixes * cast filepos on print * remove use of variable sized array * store similarities in separate vector * print error on insufficient batch size * fix error message printing * assign n_batch value to n_ubatch * fix param definitions * define retrieval-only parameters in retrieval.cpp * fix `--context-file` option to be provided multiple times for multiple files * use vector for `query_emb` * add usage description in README * fix merge conflict * fix usage printing * remove seed setting * fix lint * increase file read buffer size * retrieval : minor --------- Co-authored-by: Georgi Gerganov <ggerganov@gmail.com>
		
			
				
	
	
		
			106 lines
		
	
	
		
			1.0 KiB
		
	
	
	
		
			Plaintext
		
	
	
	
	
	
			
		
		
	
	
			106 lines
		
	
	
		
			1.0 KiB
		
	
	
	
		
			Plaintext
		
	
	
	
	
	
| *.o
 | |
| *.a
 | |
| *.so
 | |
| *.gguf
 | |
| *.bin
 | |
| *.exe
 | |
| *.dll
 | |
| *.log
 | |
| *.gcov
 | |
| *.gcno
 | |
| *.gcda
 | |
| *.dot
 | |
| *.bat
 | |
| *.tmp
 | |
| *.metallib
 | |
| *.etag
 | |
| *.lastModified
 | |
| .DS_Store
 | |
| .build/
 | |
| .cache/
 | |
| .ccls-cache/
 | |
| .direnv/
 | |
| .envrc
 | |
| .swiftpm
 | |
| .venv
 | |
| .clang-tidy
 | |
| .vs/
 | |
| .vscode/
 | |
| .idea/
 | |
| 
 | |
| ggml-metal-embed.metal
 | |
| 
 | |
| lcov-report/
 | |
| gcovr-report/
 | |
| 
 | |
| build*
 | |
| cmake-build-*
 | |
| out/
 | |
| tmp/
 | |
| 
 | |
| models/*
 | |
| models-mnt
 | |
| 
 | |
| /Pipfile
 | |
| /baby-llama
 | |
| /beam-search
 | |
| /benchmark-matmult
 | |
| /convert-llama2c-to-ggml
 | |
| /embd-input-test
 | |
| /embedding
 | |
| /gguf
 | |
| /gguf-llama-simple
 | |
| /gguf-split
 | |
| /gritlm
 | |
| /imatrix
 | |
| /infill
 | |
| /libllama.so
 | |
| /llama-bench
 | |
| /llava-cli
 | |
| /lookahead
 | |
| /lookup
 | |
| /lookup-create
 | |
| /lookup-merge
 | |
| /lookup-stats
 | |
| /main
 | |
| /metal
 | |
| /passkey
 | |
| /perplexity
 | |
| /q8dot
 | |
| /quantize
 | |
| /quantize-stats
 | |
| /result
 | |
| /save-load-state
 | |
| /server
 | |
| /simple
 | |
| /batched
 | |
| /batched-bench
 | |
| /export-lora
 | |
| /finetune
 | |
| /retrieval
 | |
| /speculative
 | |
| /parallel
 | |
| /train-text-from-scratch
 | |
| /tokenize
 | |
| /vdot
 | |
| /common/build-info.cpp
 | |
| arm_neon.h
 | |
| compile_commands.json
 | |
| CMakeSettings.json
 | |
| 
 | |
| __pycache__
 | |
| dist
 | |
| 
 | |
| zig-out/
 | |
| zig-cache/
 | |
| 
 | |
| ppl-*.txt
 | |
| qnt-*.txt
 | |
| perf-*.txt
 | |
| 
 | |
| examples/jeopardy/results.txt
 | |
| 
 | |
| poetry.lock
 | |
| poetry.toml
 | |
| nppBackup
 |