mirror of
				https://github.com/ggml-org/llama.cpp.git
				synced 2025-10-31 08:51:55 +00:00 
			
		
		
		
	mtmd-helper : bug fix to token batching in mtmd (#13650)
* Update mtmd-helper.cpp

* Update tools/mtmd/mtmd-helper.cpp

Co-authored-by: Xuan-Son Nguyen <thichthat@gmail.com>

---------

Co-authored-by: Xuan-Son Nguyen <thichthat@gmail.com>
This commit is contained in:
		| @@ -231,12 +231,14 @@ int32_t mtmd_helper_eval_chunk_single(mtmd_context * ctx, | ||||
|         while (i < n_tokens) { // split into batches | ||||
|             text_batch.n_tokens = 0; // clear the batch | ||||
|             for (; i < n_tokens && text_batch.n_tokens < n_batch; i++) { | ||||
|                 int32_t j = text_batch.n_tokens; | ||||
|                 text_batch.token   [j]    = tokens[i]; | ||||
|                 text_batch.pos     [j]    = n_past++; | ||||
|                 text_batch.n_seq_id[j]    = 1; | ||||
|                 text_batch.seq_id  [j][0] = seq_id; | ||||
|                 text_batch.logits  [j]    = false; | ||||
|  | ||||
|                 text_batch.n_tokens++; | ||||
|                 text_batch.token   [i]    = tokens[i]; | ||||
|                 text_batch.pos     [i]    = n_past++; | ||||
|                 text_batch.n_seq_id[i]    = 1; | ||||
|                 text_batch.seq_id  [i][0] = seq_id; | ||||
|                 text_batch.logits  [i]    = false; | ||||
|             } | ||||
|             bool is_last_token = (i == n_tokens); | ||||
|             if (logits_last && is_last_token) { | ||||
|   | ||||
		Reference in New Issue
	
	Block a user
	 l3utterfly
					l3utterfly