intel-gpu-llm-diagnosis/repos/patch/phase2-sycl-kernel/0003-tune-dmmv-xy-common-hpp.patch

diff --git a/ggml/src/ggml-sycl/common.hpp b/ggml/src/ggml-sycl/common.hpp
index fd84c91..dd5cf1a 100644
--- a/ggml/src/ggml-sycl/common.hpp
+++ b/ggml/src/ggml-sycl/common.hpp
@@ -103,10 +103,10 @@ extern int g_ggml_sycl_enable_flash_attention;

 // dmmv = dequantize_mul_mat_vec
 #ifndef GGML_SYCL_DMMV_X
-#define GGML_SYCL_DMMV_X 32
+#define GGML_SYCL_DMMV_X 64
 #endif
 #ifndef GGML_SYCL_MMV_Y
-#define GGML_SYCL_MMV_Y 1
+#define GGML_SYCL_MMV_Y 2
 #endif

 typedef sycl::queue *queue_ptr;