mirror of
				https://github.com/ggml-org/llama.cpp.git
				synced 2025-11-04 09:32:00 +00:00 
			
		
		
		
	SYCL: Reduce most of the compiler warnings (#10748)
* Try to reduce some unused and typecast warnings * Reduce compiler warnings step 2 * add a newline at the end of the file * Initialize nreduce as size_t * [SYCL] Remove pragma directives from mmq.cpp * SYCL: mmq add condition to prevent blocks_per_tile_x_row variable from becoming 0 * SYCL softmax: Initialize nreduce as size_t * ggml-sycl.cpp: fix some trailing whitespace * SYCL: remove the unused variables instead of commenting them out * SYCL pool2d kernel: set NAN for invalid pooling op * SYCL gemm.hpp: remove pragma directives * SYCL gemm.hpp: use const cast to properly support dnnl::memory * SYCL: wkv6 remove a comment * SYCL: clean comments step 2 * SYCL: clean comments and variables step 3 * SYCL: Use GGML_UNUSED for unused variables * SYCL: remove extra empty lines and a comment * Remove TODO * cleanup spaces * add a stdout for unsupported op * use sycl printf over fprintf * remove prints for CI * SYCL ggml-sycl: pool2D use sycl::nan and remove if-else block --------- Co-authored-by: Abhilash Majumder <30946547+abhilash1910@users.noreply.github.com>
This commit is contained in:
		@@ -753,11 +753,7 @@ static void mul_mat_vec_iq2_xs_q8_1_sycl(const void *vx, const void *vy,
 | 
			
		||||
    const sycl::range<3> block_nums(1, 1, block_num_y);
 | 
			
		||||
    const sycl::range<3> block_dims(1, GGML_SYCL_MMV_Y, QK_WARP_SIZE);
 | 
			
		||||
    {
 | 
			
		||||
 | 
			
		||||
        stream->submit([&](sycl::handler &cgh) {
 | 
			
		||||
            auto iq2xs_grid_ptr_ct1 = &iq2xs_grid[0];
 | 
			
		||||
            auto ksigns64_ptr_ct1 = &ksigns64[0];
 | 
			
		||||
 | 
			
		||||
        stream->submit([&](sycl::handler & cgh) {
 | 
			
		||||
            cgh.parallel_for(
 | 
			
		||||
                sycl::nd_range<3>(block_nums * block_dims, block_dims),
 | 
			
		||||
                [=](sycl::nd_item<3> item_ct1)
 | 
			
		||||
@@ -780,9 +776,6 @@ static void mul_mat_vec_iq2_s_q8_1_sycl(const void *vx, const void *vy,
 | 
			
		||||
    {
 | 
			
		||||
 | 
			
		||||
        stream->submit([&](sycl::handler &cgh) {
 | 
			
		||||
            auto iq2xs_grid_ptr_ct1 = &iq2xs_grid[0];
 | 
			
		||||
            auto ksigns64_ptr_ct1 = &ksigns64[0];
 | 
			
		||||
 | 
			
		||||
            cgh.parallel_for(
 | 
			
		||||
                sycl::nd_range<3>(block_nums * block_dims, block_dims),
 | 
			
		||||
                [=](sycl::nd_item<3> item_ct1)
 | 
			
		||||
@@ -805,9 +798,6 @@ static void mul_mat_vec_iq3_xxs_q8_1_sycl(const void *vx, const void *vy,
 | 
			
		||||
    {
 | 
			
		||||
 | 
			
		||||
        stream->submit([&](sycl::handler &cgh) {
 | 
			
		||||
            auto iq3xxs_grid_ptr_ct1 = &iq3xxs_grid[0];
 | 
			
		||||
            auto ksigns64_ptr_ct1 = &ksigns64[0];
 | 
			
		||||
 | 
			
		||||
            cgh.parallel_for(
 | 
			
		||||
                sycl::nd_range<3>(block_nums * block_dims, block_dims),
 | 
			
		||||
                [=](sycl::nd_item<3> item_ct1)
 | 
			
		||||
@@ -830,8 +820,6 @@ static void mul_mat_vec_iq3_s_q8_1_sycl(const void *vx, const void *vy,
 | 
			
		||||
    {
 | 
			
		||||
 | 
			
		||||
        stream->submit([&](sycl::handler &cgh) {
 | 
			
		||||
            auto iq3s_grid_ptr_ct1 = &iq3s_grid[0];
 | 
			
		||||
 | 
			
		||||
            cgh.parallel_for(
 | 
			
		||||
                sycl::nd_range<3>(block_nums * block_dims, block_dims),
 | 
			
		||||
                [=](sycl::nd_item<3> item_ct1)
 | 
			
		||||
@@ -854,9 +842,6 @@ static void mul_mat_vec_iq1_s_q8_1_sycl(const void *vx, const void *vy,
 | 
			
		||||
    {
 | 
			
		||||
 | 
			
		||||
        stream->submit([&](sycl::handler &cgh) {
 | 
			
		||||
            auto iq1s_grid_ptr_ct1 = &iq1s_grid_gpu[0];
 | 
			
		||||
            auto ksigns64_ptr_ct1 = &ksigns64[0];
 | 
			
		||||
 | 
			
		||||
            cgh.parallel_for(
 | 
			
		||||
                sycl::nd_range<3>(block_nums * block_dims, block_dims),
 | 
			
		||||
                [=](sycl::nd_item<3> item_ct1)
 | 
			
		||||
@@ -954,7 +939,7 @@ void ggml_sycl_op_mul_mat_vec_q(
 | 
			
		||||
    const size_t q8_1_bs = QK8_1;
 | 
			
		||||
    // the main device has a larger memory buffer to hold the results from all GPUs
 | 
			
		||||
    // nrows_dst == nrows of the matrix that the kernel writes into
 | 
			
		||||
    const int64_t nrows_dst = id == ctx.device ? ne00 : row_diff;
 | 
			
		||||
 | 
			
		||||
    for (int i = 0; i < src1_ncols; i++)
 | 
			
		||||
    {
 | 
			
		||||
        const size_t src1_ddq_i_offset = i * src1_padded_col_size * q8_1_ts / q8_1_bs;
 | 
			
		||||
@@ -1023,7 +1008,8 @@ void ggml_sycl_op_mul_mat_vec_q(
 | 
			
		||||
            break;
 | 
			
		||||
        }
 | 
			
		||||
    }
 | 
			
		||||
    (void) src1;
 | 
			
		||||
    (void) dst;
 | 
			
		||||
    (void) src1_ddf_i;
 | 
			
		||||
    GGML_UNUSED(src1);
 | 
			
		||||
    GGML_UNUSED(dst);
 | 
			
		||||
    GGML_UNUSED(src1_ddf_i);
 | 
			
		||||
    GGML_UNUSED(ctx);
 | 
			
		||||
}
 | 
			
		||||
 
 | 
			
		||||
		Reference in New Issue
	
	Block a user