1 files changed, 76 insertions, 0 deletions
diff --git a/llama.cpp/ggml/src/ggml-sycl/presets.hpp b/llama.cpp/ggml/src/ggml-sycl/presets.hpp
new file mode 100644
index 0000000..b651737
--- /dev/null
+++ b/llama.cpp/ggml/src/ggml-sycl/presets.hpp
@@ -0,0 +1,76 @@
+//
+// MIT license
+// Copyright (C) 2024 Intel Corporation
+// SPDX-License-Identifier: MIT
+//
+//
+// Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
+// See https://llvm.org/LICENSE.txt for license information.
+// SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
+//
+#ifndef GGML_SYCL_PRESETS_HPP // include guard; closed by the last #endif of this header
+#define GGML_SYCL_PRESETS_HPP
+#define GGML_SYCL_MAX_STREAMS       8 // NOTE(review): presumably an upper bound on streams - confirm against users
+#define GGML_SYCL_MAX_BUFFERS       256 // NOTE(review): presumably an upper bound on buffers - confirm against users
+#define WARP_SIZE GGML_SYCL_WARP_SIZE // alias; GGML_SYCL_WARP_SIZE is not defined in this header and must come from elsewhere
+#define MATRIX_ROW_PADDING 512 // last row of quant. matrices is a multiple of this to avoid out-of-bounds memory accesses
+#define SYCL_GELU_BLOCK_SIZE 256 // first of the SYCL_*_BLOCK_SIZE presets: all are 256 except CPY, ALIBI and DIAG_MASK_INF (32)
+#define SYCL_SILU_BLOCK_SIZE 256
+#define SYCL_TANH_BLOCK_SIZE 256
+#define SYCL_RELU_BLOCK_SIZE 256
+#define SYCL_HARDSIGMOID_BLOCK_SIZE 256
+#define SYCL_HARDSWISH_BLOCK_SIZE 256
+#define SYCL_EXP_BLOCK_SIZE 256
+#define SYCL_NEG_BLOCK_SIZE 256
+#define SYCL_SIGMOID_BLOCK_SIZE 256
+#define SYCL_SQRT_BLOCK_SIZE 256
+#define SYCL_SIN_BLOCK_SIZE 256
+#define SYCL_SQR_BLOCK_SIZE 256
+#define SYCL_SET_BLOCK_SIZE 256
+#define SYCL_CPY_BLOCK_SIZE 32 // one of the three 32-valued presets
+#define SYCL_SCALE_BLOCK_SIZE 256
+#define SYCL_CLAMP_BLOCK_SIZE 256
+#define SYCL_ROPE_BLOCK_SIZE 256
+#define SYCL_ALIBI_BLOCK_SIZE 32 // one of the three 32-valued presets
+#define SYCL_DIAG_MASK_INF_BLOCK_SIZE 32 // one of the three 32-valued presets
+#define SYCL_QUANTIZE_BLOCK_SIZE 256
+#define SYCL_DEQUANTIZE_BLOCK_SIZE 256
+#define SYCL_GET_ROWS_BLOCK_SIZE 256
+#define SYCL_UPSCALE_BLOCK_SIZE 256
+#define SYCL_CONCAT_BLOCK_SIZE 256
+#define SYCL_PAD_BLOCK_SIZE 256
+#define SYCL_ACC_BLOCK_SIZE 256
+#define SYCL_IM2COL_BLOCK_SIZE 256
+#define SYCL_POOL2D_BLOCK_SIZE 256
+#define SYCL_ARGMAX_BLOCK_SIZE 256
+#define SYCL_CONV_TRANPOSE_1D_BLOCK_SIZE 256 // NOTE(review): "TRANPOSE" looks like a misspelling of "TRANSPOSE"; a rename must update every user of this macro
+#define SYCL_TIMESTEP_EMBEDDING_BLOCK_SIZE 256
+#define SYCL_ARANGE_BLOCK_SIZE 256
+// dmmv = dequantize_mul_mat_vec
+#ifndef GGML_SYCL_DMMV_X // a value defined before this header is included (e.g. with -D) is kept
+#define GGML_SYCL_DMMV_X 32 // fallback default
+#endif
+#ifndef GGML_SYCL_MMV_Y // same override pattern as GGML_SYCL_DMMV_X
+#define GGML_SYCL_MMV_Y 1 // fallback default
+#endif
+#ifndef K_QUANTS_PER_ITERATION
+#define K_QUANTS_PER_ITERATION 2 // fallback default; already satisfies the 1-or-2 constraint checked in the #else branch
+#else // the macro was defined before this header was included: validate it at compile time
+static_assert(K_QUANTS_PER_ITERATION == 1 || K_QUANTS_PER_ITERATION == 2, "K_QUANTS_PER_ITERATION must be 1 or 2");
+#endif
+#ifndef GGML_SYCL_PEER_MAX_BATCH_SIZE // overridable: only defined here when not already set
+#define GGML_SYCL_PEER_MAX_BATCH_SIZE 128
+#endif // GGML_SYCL_PEER_MAX_BATCH_SIZE
+#define MUL_MAT_SRC1_COL_STRIDE 128 // no #ifndef guard, unlike the overridable macros in this header
+#define QK_WARP_SIZE 32 // literal value; separate from the WARP_SIZE alias defined earlier in this header
+#endif // GGML_SYCL_PRESETS_HPP

diff --git a/llama.cpp/ggml/src/ggml-sycl/presets.hpp b/llama.cpp/ggml/src/ggml-sycl/presets.hpp new file mode 100644 index 0000000..b651737 --- /dev/null +++ b/llama.cpp/ggml/src/ggml-sycl/presets.hpp
@@ -0,0 +1,76 @@
	1	//
	2	// MIT license
	3	// Copyright (C) 2024 Intel Corporation
	4	// SPDX-License-Identifier: MIT
	5	//
	6
	7	//
	8	// Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
	9	// See https://llvm.org/LICENSE.txt for license information.
	10	// SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
	11	//
	12
	13	#ifndef GGML_SYCL_PRESETS_HPP // include guard; closed by the last #endif of this header
	14	#define GGML_SYCL_PRESETS_HPP
	15
	16	#define GGML_SYCL_MAX_STREAMS 8 // NOTE(review): presumably an upper bound on streams - confirm against users
	17	#define GGML_SYCL_MAX_BUFFERS 256 // NOTE(review): presumably an upper bound on buffers - confirm against users
	18
	19	#define WARP_SIZE GGML_SYCL_WARP_SIZE // alias; GGML_SYCL_WARP_SIZE is not defined in this header and must come from elsewhere
	20	#define MATRIX_ROW_PADDING 512 // last row of quant. matrices is a multiple of this to avoid out-of-bounds memory accesses
	21
	22	#define SYCL_GELU_BLOCK_SIZE 256 // first of the SYCL_*_BLOCK_SIZE presets: all are 256 except CPY, ALIBI and DIAG_MASK_INF (32)
	23	#define SYCL_SILU_BLOCK_SIZE 256
	24	#define SYCL_TANH_BLOCK_SIZE 256
	25	#define SYCL_RELU_BLOCK_SIZE 256
	26	#define SYCL_HARDSIGMOID_BLOCK_SIZE 256
	27	#define SYCL_HARDSWISH_BLOCK_SIZE 256
	28	#define SYCL_EXP_BLOCK_SIZE 256
	29	#define SYCL_NEG_BLOCK_SIZE 256
	30	#define SYCL_SIGMOID_BLOCK_SIZE 256
	31	#define SYCL_SQRT_BLOCK_SIZE 256
	32	#define SYCL_SIN_BLOCK_SIZE 256
	33	#define SYCL_SQR_BLOCK_SIZE 256
	34	#define SYCL_SET_BLOCK_SIZE 256
	35	#define SYCL_CPY_BLOCK_SIZE 32 // one of the three 32-valued presets
	36	#define SYCL_SCALE_BLOCK_SIZE 256
	37	#define SYCL_CLAMP_BLOCK_SIZE 256
	38	#define SYCL_ROPE_BLOCK_SIZE 256
	39	#define SYCL_ALIBI_BLOCK_SIZE 32 // one of the three 32-valued presets
	40	#define SYCL_DIAG_MASK_INF_BLOCK_SIZE 32 // one of the three 32-valued presets
	41	#define SYCL_QUANTIZE_BLOCK_SIZE 256
	42	#define SYCL_DEQUANTIZE_BLOCK_SIZE 256
	43	#define SYCL_GET_ROWS_BLOCK_SIZE 256
	44	#define SYCL_UPSCALE_BLOCK_SIZE 256
	45	#define SYCL_CONCAT_BLOCK_SIZE 256
	46	#define SYCL_PAD_BLOCK_SIZE 256
	47	#define SYCL_ACC_BLOCK_SIZE 256
	48	#define SYCL_IM2COL_BLOCK_SIZE 256
	49	#define SYCL_POOL2D_BLOCK_SIZE 256
	50	#define SYCL_ARGMAX_BLOCK_SIZE 256
	51	#define SYCL_CONV_TRANPOSE_1D_BLOCK_SIZE 256 // NOTE(review): "TRANPOSE" looks like a misspelling of "TRANSPOSE"; a rename must update every user of this macro
	52	#define SYCL_TIMESTEP_EMBEDDING_BLOCK_SIZE 256
	53	#define SYCL_ARANGE_BLOCK_SIZE 256
	54
	55	// dmmv = dequantize_mul_mat_vec
	56	#ifndef GGML_SYCL_DMMV_X // a value defined before this header is included (e.g. with -D) is kept
	57	#define GGML_SYCL_DMMV_X 32 // fallback default
	58	#endif
	59	#ifndef GGML_SYCL_MMV_Y // same override pattern as GGML_SYCL_DMMV_X
	60	#define GGML_SYCL_MMV_Y 1 // fallback default
	61	#endif
	62
	63	#ifndef K_QUANTS_PER_ITERATION
	64	#define K_QUANTS_PER_ITERATION 2 // fallback default; already satisfies the 1-or-2 constraint checked in the #else branch
	65	#else // the macro was defined before this header was included: validate it at compile time
	66	static_assert(K_QUANTS_PER_ITERATION == 1 || K_QUANTS_PER_ITERATION == 2, "K_QUANTS_PER_ITERATION must be 1 or 2");
	67	#endif
	68
	69	#ifndef GGML_SYCL_PEER_MAX_BATCH_SIZE // overridable: only defined here when not already set
	70	#define GGML_SYCL_PEER_MAX_BATCH_SIZE 128
	71	#endif // GGML_SYCL_PEER_MAX_BATCH_SIZE
	72
	73	#define MUL_MAT_SRC1_COL_STRIDE 128 // no #ifndef guard, unlike the overridable macros in this header
	74
	75	#define QK_WARP_SIZE 32 // literal value; separate from the WARP_SIZE alias defined earlier in this header
	76	#endif // GGML_SYCL_PRESETS_HPP