mirror of
				https://github.com/ggml-org/llama.cpp.git
				synced 2025-10-30 08:42:00 +00:00 
			
		
		
		
	vulkan: fix compile warnings (#10731)
This commit is contained in:
		| @@ -427,7 +427,7 @@ static_assert(sizeof(vk_op_unary_push_constants) <= 128, "sizeof(vk_op_unary_pus | |||||||
| // and a shift: | // and a shift: | ||||||
| // | // | ||||||
| // n/d = (mulhi(n, mp) + n) >> L; | // n/d = (mulhi(n, mp) + n) >> L; | ||||||
| void init_fastdiv_values(uint32_t d, uint32_t &mp, uint32_t &L) | static void init_fastdiv_values(uint32_t d, uint32_t &mp, uint32_t &L) | ||||||
| { | { | ||||||
|     // compute L = ceil(log2(d)); |     // compute L = ceil(log2(d)); | ||||||
|     L = 0; |     L = 0; | ||||||
| @@ -439,6 +439,7 @@ void init_fastdiv_values(uint32_t d, uint32_t &mp, uint32_t &L) | |||||||
| } | } | ||||||
|  |  | ||||||
| template <typename T> void init_pushconst_fastdiv(T &p) { | template <typename T> void init_pushconst_fastdiv(T &p) { | ||||||
|  |     GGML_UNUSED(p); | ||||||
|     static_assert(!std::is_const<T>::value, "unexpected type"); |     static_assert(!std::is_const<T>::value, "unexpected type"); | ||||||
| } | } | ||||||
|  |  | ||||||
| @@ -3417,7 +3418,7 @@ static uint32_t ggml_vk_guess_split_k(ggml_backend_vk_context * ctx, int m, int | |||||||
|     return split_k; |     return split_k; | ||||||
| } | } | ||||||
|  |  | ||||||
| static vk_pipeline ggml_vk_guess_matmul_pipeline(ggml_backend_vk_context * ctx, vk_matmul_pipeline& mmp, int m, int n, bool aligned, ggml_type type_a) { | static vk_pipeline ggml_vk_guess_matmul_pipeline(ggml_backend_vk_context * ctx, vk_matmul_pipeline& mmp, int m, int n, bool aligned) { | ||||||
|     VK_LOG_DEBUG("ggml_vk_guess_matmul_pipeline(" << m << ", " << n << ", " << aligned << ")"); |     VK_LOG_DEBUG("ggml_vk_guess_matmul_pipeline(" << m << ", " << n << ", " << aligned << ")"); | ||||||
|  |  | ||||||
|     if (ctx->device->coopmat2) { |     if (ctx->device->coopmat2) { | ||||||
| @@ -3439,9 +3440,9 @@ static vk_pipeline ggml_vk_guess_matmul_pipeline(ggml_backend_vk_context * ctx, | |||||||
|     return aligned ? mmp->a_l : mmp->l; |     return aligned ? mmp->a_l : mmp->l; | ||||||
| } | } | ||||||
|  |  | ||||||
| static uint32_t ggml_vk_guess_matmul_pipeline_align(ggml_backend_vk_context * ctx, vk_matmul_pipeline& mmp, int m, int n, ggml_type type_a) { | static uint32_t ggml_vk_guess_matmul_pipeline_align(ggml_backend_vk_context * ctx, vk_matmul_pipeline& mmp, int m, int n) { | ||||||
|     VK_LOG_DEBUG("ggml_vk_guess_matmul_pipeline_align(" << m << ", " << n << ")"); |     VK_LOG_DEBUG("ggml_vk_guess_matmul_pipeline_align(" << m << ", " << n << ")"); | ||||||
|     return ggml_vk_guess_matmul_pipeline(ctx, mmp, m, n, true, type_a)->align; |     return ggml_vk_guess_matmul_pipeline(ctx, mmp, m, n, true)->align; | ||||||
| } | } | ||||||
|  |  | ||||||
| static void ggml_vk_matmul( | static void ggml_vk_matmul( | ||||||
| @@ -3571,6 +3572,7 @@ static void ggml_vk_cpy_to_contiguous(ggml_backend_vk_context * ctx, vk_context& | |||||||
|         (uint32_t)tensor->ne[0], (uint32_t)tensor->ne[1], (uint32_t)tensor->ne[2], (uint32_t)tensor->ne[3],                       1                   , (uint32_t)tensor->ne[0]                   , (uint32_t)(tensor->ne[0] * tensor->ne[1]) , (uint32_t)(tensor->ne[0] * tensor->ne[1] * tensor->ne[2]), |         (uint32_t)tensor->ne[0], (uint32_t)tensor->ne[1], (uint32_t)tensor->ne[2], (uint32_t)tensor->ne[3],                       1                   , (uint32_t)tensor->ne[0]                   , (uint32_t)(tensor->ne[0] * tensor->ne[1]) , (uint32_t)(tensor->ne[0] * tensor->ne[1] * tensor->ne[2]), | ||||||
|         0, |         0, | ||||||
|         0.0f, 0.0f, |         0.0f, 0.0f, | ||||||
|  |         0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, | ||||||
|     }; |     }; | ||||||
|     init_pushconst_fastdiv(pc); |     init_pushconst_fastdiv(pc); | ||||||
|     ggml_vk_sync_buffers(subctx); |     ggml_vk_sync_buffers(subctx); | ||||||
| @@ -3644,10 +3646,10 @@ static void ggml_vk_mul_mat_q_f16(ggml_backend_vk_context * ctx, vk_context& sub | |||||||
|     const int y_ne = ne11 * ne10; |     const int y_ne = ne11 * ne10; | ||||||
|     const int d_ne = ne11 * ne01; |     const int d_ne = ne11 * ne01; | ||||||
|  |  | ||||||
|     const uint32_t kpad = ggml_vk_align_size(ne10, ggml_vk_guess_matmul_pipeline_align(ctx, mmp, ne01, ne11, src0->type)); |     const uint32_t kpad = ggml_vk_align_size(ne10, ggml_vk_guess_matmul_pipeline_align(ctx, mmp, ne01, ne11)); | ||||||
|     const bool aligned = ne10 == kpad && ne01 > 8 && ne11 > 8; |     const bool aligned = ne10 == kpad && ne01 > 8 && ne11 > 8; | ||||||
|  |  | ||||||
|     vk_pipeline pipeline = ggml_vk_guess_matmul_pipeline(ctx, mmp, ne01, ne11, aligned, src0->type); |     vk_pipeline pipeline = ggml_vk_guess_matmul_pipeline(ctx, mmp, ne01, ne11, aligned); | ||||||
|  |  | ||||||
|     const uint32_t split_k = ggml_vk_guess_split_k(ctx, ne01, ne11, ne10, pipeline); |     const uint32_t split_k = ggml_vk_guess_split_k(ctx, ne01, ne11, ne10, pipeline); | ||||||
|  |  | ||||||
| @@ -5351,7 +5353,8 @@ static void ggml_vk_scale(ggml_backend_vk_context * ctx, vk_context& subctx, con | |||||||
|         (uint32_t)src0->ne[0], (uint32_t)src0->ne[1], (uint32_t)src0->ne[2], (uint32_t)src0->ne[3], (uint32_t)src0->nb[0] / src0_type_size, (uint32_t)src0->nb[1] / src0_type_size, (uint32_t)src0->nb[2] / src0_type_size, (uint32_t)src0->nb[3] / src0_type_size, |         (uint32_t)src0->ne[0], (uint32_t)src0->ne[1], (uint32_t)src0->ne[2], (uint32_t)src0->ne[3], (uint32_t)src0->nb[0] / src0_type_size, (uint32_t)src0->nb[1] / src0_type_size, (uint32_t)src0->nb[2] / src0_type_size, (uint32_t)src0->nb[3] / src0_type_size, | ||||||
|         (uint32_t) dst->ne[0], (uint32_t) dst->ne[1], (uint32_t) dst->ne[2], (uint32_t) dst->ne[3], (uint32_t) dst->nb[0] /  dst_type_size, (uint32_t) dst->nb[1] /  dst_type_size, (uint32_t) dst->nb[2] /  dst_type_size, (uint32_t) dst->nb[3] /  dst_type_size, |         (uint32_t) dst->ne[0], (uint32_t) dst->ne[1], (uint32_t) dst->ne[2], (uint32_t) dst->ne[3], (uint32_t) dst->nb[0] /  dst_type_size, (uint32_t) dst->nb[1] /  dst_type_size, (uint32_t) dst->nb[2] /  dst_type_size, (uint32_t) dst->nb[3] /  dst_type_size, | ||||||
|         0, |         0, | ||||||
|         op_params[0], 0.0f |         op_params[0], 0.0f, | ||||||
|  |         0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, | ||||||
|     }, dryrun); |     }, dryrun); | ||||||
| } | } | ||||||
|  |  | ||||||
| @@ -5365,6 +5368,7 @@ static void ggml_vk_sqr(ggml_backend_vk_context * ctx, vk_context& subctx, const | |||||||
|         (uint32_t) dst->ne[0], (uint32_t) dst->ne[1], (uint32_t) dst->ne[2], (uint32_t) dst->ne[3], (uint32_t) dst->nb[0] /  dst_type_size, (uint32_t) dst->nb[1] /  dst_type_size, (uint32_t) dst->nb[2] /  dst_type_size, (uint32_t) dst->nb[3] /  dst_type_size, |         (uint32_t) dst->ne[0], (uint32_t) dst->ne[1], (uint32_t) dst->ne[2], (uint32_t) dst->ne[3], (uint32_t) dst->nb[0] /  dst_type_size, (uint32_t) dst->nb[1] /  dst_type_size, (uint32_t) dst->nb[2] /  dst_type_size, (uint32_t) dst->nb[3] /  dst_type_size, | ||||||
|         0, |         0, | ||||||
|         0.0f, 0.0f, |         0.0f, 0.0f, | ||||||
|  |         0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, | ||||||
|     }, dryrun); |     }, dryrun); | ||||||
| } | } | ||||||
|  |  | ||||||
| @@ -5378,6 +5382,7 @@ static void ggml_vk_sin(ggml_backend_vk_context * ctx, vk_context& subctx, const | |||||||
|         (uint32_t) dst->ne[0], (uint32_t) dst->ne[1], (uint32_t) dst->ne[2], (uint32_t) dst->ne[3], (uint32_t) dst->nb[0] /  dst_type_size, (uint32_t) dst->nb[1] /  dst_type_size, (uint32_t) dst->nb[2] /  dst_type_size, (uint32_t) dst->nb[3] /  dst_type_size, |         (uint32_t) dst->ne[0], (uint32_t) dst->ne[1], (uint32_t) dst->ne[2], (uint32_t) dst->ne[3], (uint32_t) dst->nb[0] /  dst_type_size, (uint32_t) dst->nb[1] /  dst_type_size, (uint32_t) dst->nb[2] /  dst_type_size, (uint32_t) dst->nb[3] /  dst_type_size, | ||||||
|         0, |         0, | ||||||
|         0.0f, 0.0f, |         0.0f, 0.0f, | ||||||
|  |         0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, | ||||||
|     }, dryrun); |     }, dryrun); | ||||||
| } | } | ||||||
|  |  | ||||||
| @@ -5391,6 +5396,7 @@ static void ggml_vk_cos(ggml_backend_vk_context * ctx, vk_context& subctx, const | |||||||
|         (uint32_t) dst->ne[0], (uint32_t) dst->ne[1], (uint32_t) dst->ne[2], (uint32_t) dst->ne[3], (uint32_t) dst->nb[0] /  dst_type_size, (uint32_t) dst->nb[1] /  dst_type_size, (uint32_t) dst->nb[2] /  dst_type_size, (uint32_t) dst->nb[3] /  dst_type_size, |         (uint32_t) dst->ne[0], (uint32_t) dst->ne[1], (uint32_t) dst->ne[2], (uint32_t) dst->ne[3], (uint32_t) dst->nb[0] /  dst_type_size, (uint32_t) dst->nb[1] /  dst_type_size, (uint32_t) dst->nb[2] /  dst_type_size, (uint32_t) dst->nb[3] /  dst_type_size, | ||||||
|         0, |         0, | ||||||
|         0.0f, 0.0f, |         0.0f, 0.0f, | ||||||
|  |         0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, | ||||||
|     }, dryrun); |     }, dryrun); | ||||||
| } | } | ||||||
|  |  | ||||||
| @@ -5405,6 +5411,7 @@ static void ggml_vk_clamp(ggml_backend_vk_context * ctx, vk_context& subctx, con | |||||||
|         (uint32_t) dst->ne[0], (uint32_t) dst->ne[1], (uint32_t) dst->ne[2], (uint32_t) dst->ne[3], (uint32_t) dst->nb[0] /  dst_type_size, (uint32_t) dst->nb[1] /  dst_type_size, (uint32_t) dst->nb[2] /  dst_type_size, (uint32_t) dst->nb[3] /  dst_type_size, |         (uint32_t) dst->ne[0], (uint32_t) dst->ne[1], (uint32_t) dst->ne[2], (uint32_t) dst->ne[3], (uint32_t) dst->nb[0] /  dst_type_size, (uint32_t) dst->nb[1] /  dst_type_size, (uint32_t) dst->nb[2] /  dst_type_size, (uint32_t) dst->nb[3] /  dst_type_size, | ||||||
|         0, |         0, | ||||||
|         op_params[0], op_params[1], |         op_params[0], op_params[1], | ||||||
|  |         0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, | ||||||
|     }, dryrun); |     }, dryrun); | ||||||
| } | } | ||||||
|  |  | ||||||
| @@ -5418,6 +5425,7 @@ static void ggml_vk_pad(ggml_backend_vk_context * ctx, vk_context& subctx, const | |||||||
|         (uint32_t) dst->ne[0], (uint32_t) dst->ne[1], (uint32_t) dst->ne[2], (uint32_t) dst->ne[3], (uint32_t) dst->nb[0] /  dst_type_size, (uint32_t) dst->nb[1] /  dst_type_size, (uint32_t) dst->nb[2] /  dst_type_size, (uint32_t) dst->nb[3] /  dst_type_size, |         (uint32_t) dst->ne[0], (uint32_t) dst->ne[1], (uint32_t) dst->ne[2], (uint32_t) dst->ne[3], (uint32_t) dst->nb[0] /  dst_type_size, (uint32_t) dst->nb[1] /  dst_type_size, (uint32_t) dst->nb[2] /  dst_type_size, (uint32_t) dst->nb[3] /  dst_type_size, | ||||||
|         0, |         0, | ||||||
|         0.0f, 0.0f, |         0.0f, 0.0f, | ||||||
|  |         0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, | ||||||
|     }, dryrun); |     }, dryrun); | ||||||
| } | } | ||||||
|  |  | ||||||
| @@ -5431,6 +5439,7 @@ static void ggml_vk_repeat(ggml_backend_vk_context * ctx, vk_context& subctx, co | |||||||
|         (uint32_t) dst->ne[0], (uint32_t) dst->ne[1], (uint32_t) dst->ne[2], (uint32_t) dst->ne[3], (uint32_t) dst->nb[0] /  dst_type_size, (uint32_t) dst->nb[1] /  dst_type_size, (uint32_t) dst->nb[2] /  dst_type_size, (uint32_t) dst->nb[3] /  dst_type_size, |         (uint32_t) dst->ne[0], (uint32_t) dst->ne[1], (uint32_t) dst->ne[2], (uint32_t) dst->ne[3], (uint32_t) dst->nb[0] /  dst_type_size, (uint32_t) dst->nb[1] /  dst_type_size, (uint32_t) dst->nb[2] /  dst_type_size, (uint32_t) dst->nb[3] /  dst_type_size, | ||||||
|         0, |         0, | ||||||
|         0.0f, 0.0f, |         0.0f, 0.0f, | ||||||
|  |         0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, | ||||||
|     }, dryrun); |     }, dryrun); | ||||||
| } | } | ||||||
|  |  | ||||||
| @@ -5445,6 +5454,7 @@ static void ggml_vk_cpy(ggml_backend_vk_context * ctx, vk_context& subctx, const | |||||||
|         (uint32_t) dst->ne[0], (uint32_t) dst->ne[1], (uint32_t) dst->ne[2], (uint32_t) dst->ne[3], (uint32_t) dst->nb[0] /  dst_type_size, (uint32_t) dst->nb[1] /  dst_type_size, (uint32_t) dst->nb[2] /  dst_type_size, (uint32_t) dst->nb[3] /  dst_type_size, |         (uint32_t) dst->ne[0], (uint32_t) dst->ne[1], (uint32_t) dst->ne[2], (uint32_t) dst->ne[3], (uint32_t) dst->nb[0] /  dst_type_size, (uint32_t) dst->nb[1] /  dst_type_size, (uint32_t) dst->nb[2] /  dst_type_size, (uint32_t) dst->nb[3] /  dst_type_size, | ||||||
|         d_offset, |         d_offset, | ||||||
|         0.0f, 0.0f, |         0.0f, 0.0f, | ||||||
|  |         0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, | ||||||
|     }, dryrun); |     }, dryrun); | ||||||
| } | } | ||||||
|  |  | ||||||
|   | |||||||
		Reference in New Issue
	
	Block a user