mirror of
				https://github.com/ggml-org/llama.cpp.git
				synced 2025-10-27 08:21:30 +00:00 
			
		
		
		
	 7082d24cec
			
		
	
	7082d24cec
	
	
	
		
			
			* initial commit, going through initializations
			* main loop finished, starting to debug
			* BUG: generates gibberish/repeating tokens after a while
			* kv_cache management
			* Added colors to distinguish drafted tokens (--color). Updated README
			* lookup : fix token positions in the draft batch
			* lookup : use n_draft from CLI params
			* lookup : final touches
			---------
			Co-authored-by: Leon Ericsson <leon.ericsson@icloud.com>
			Co-authored-by: Georgi Gerganov <ggerganov@gmail.com>
		
			
				
	
	
		
			106 lines
		
	
	
		
			1.2 KiB
		
	
	
	
		
			Plaintext
		
	
	
	
	
	
			
		
		
	
	
			106 lines
		
	
	
		
			1.2 KiB
		
	
	
	
		
			Plaintext
		
	
	
	
	
	
| *.o
 | |
| *.a
 | |
| *.so
 | |
| *.gguf
 | |
| *.bin
 | |
| *.exe
 | |
| *.dll
 | |
| *.log
 | |
| *.gcov
 | |
| *.gcno
 | |
| *.gcda
 | |
| *.dot
 | |
| *.bat
 | |
| *.metallib
 | |
| .DS_Store
 | |
| .build/
 | |
| .cache/
 | |
| .ccls-cache/
 | |
| .direnv/
 | |
| .envrc
 | |
| .swiftpm
 | |
| .venv
 | |
| .clang-tidy
 | |
| .vs/
 | |
| .vscode/
 | |
| 
 | |
| lcov-report/
 | |
| gcovr-report/
 | |
| 
 | |
| build*/
 | |
| out/
 | |
| tmp/
 | |
| 
 | |
| models/*
 | |
| models-mnt
 | |
| 
 | |
| /Pipfile
 | |
| /baby-llama
 | |
| /beam-search
 | |
| /benchmark-matmult
 | |
| /convert-llama2c-to-ggml
 | |
| /embd-input-test
 | |
| /embedding
 | |
| /gguf
 | |
| /gguf-llama-simple
 | |
| /infill
 | |
| /libllama.so
 | |
| /llama-bench
 | |
| /llava-cli
 | |
| /lookahead
 | |
| /lookup
 | |
| /main
 | |
| /metal
 | |
| /perplexity
 | |
| /q8dot
 | |
| /quantize
 | |
| /quantize-stats
 | |
| /result
 | |
| /save-load-state
 | |
| /server
 | |
| /simple
 | |
| /batched
 | |
| /batched-bench
 | |
| /export-lora
 | |
| /finetune
 | |
| /speculative
 | |
| /parallel
 | |
| /train-text-from-scratch
 | |
| /tokenize
 | |
| /vdot
 | |
| /common/build-info.cpp
 | |
| arm_neon.h
 | |
| compile_commands.json
 | |
| CMakeSettings.json
 | |
| 
 | |
| __pycache__
 | |
| dist
 | |
| 
 | |
| zig-out/
 | |
| zig-cache/
 | |
| 
 | |
| ppl-*.txt
 | |
| qnt-*.txt
 | |
| perf-*.txt
 | |
| 
 | |
| examples/jeopardy/results.txt
 | |
| 
 | |
| poetry.lock
 | |
| poetry.toml
 | |
| 
 | |
| # Test binaries
 | |
| /tests/test-grammar-parser
 | |
| /tests/test-llama-grammar
 | |
| /tests/test-double-float
 | |
| /tests/test-grad0
 | |
| /tests/test-opt
 | |
| /tests/test-quantize-fns
 | |
| /tests/test-quantize-perf
 | |
| /tests/test-sampling
 | |
| /tests/test-tokenizer-0-llama
 | |
| /tests/test-tokenizer-0-falcon
 | |
| /tests/test-tokenizer-1-llama
 | |
| /tests/test-tokenizer-1-bpe
 | |
| /tests/test-rope
 | |
| /tests/test-backend-ops
 |