// Provenance (recovered from a cgit patch view; kept for reference):
//   From b333b06772c89d96aacb5490d6a219fba7c09cc6 Mon Sep 17 00:00:00 2001
//   From: Mitja Felicijan
//   Date: Thu, 12 Feb 2026 20:57:17 +0100
//   Subject: Engage!
//   ---
//   llama.cpp/ggml/src/ggml-cpu/spacemit/ime_kernels.h | 26 ++++++++++++++++++++++
//   1 file changed, 26 insertions(+)
//   create mode 100644 llama.cpp/ggml/src/ggml-cpu/spacemit/ime_kernels.h
//   diff --git a/llama.cpp/ggml/src/ggml-cpu/spacemit/ime_kernels.h
//              b/llama.cpp/ggml/src/ggml-cpu/spacemit/ime_kernels.h
//   new file mode 100644, index 0000000..7570634, hunk @@ -0,0 +1,26 @@
//   cgit v1.2.3
//
// Declarations of the kernels in namespace sqnbitgemm_spacemit_ime::ime1.
// Only prototypes are visible in this header; the definitions live elsewhere.

#pragma once

#include <cstddef>  // size_t, std::byte

namespace sqnbitgemm_spacemit_ime {
namespace ime1 {

// GEMM kernel entry point.
// NOTE(review): the name suggests int8 activations (A) multiplied by 4-bit
// quantized weights (B) -- confirm against the implementation.
//
// Parameters (meanings below are inferred from names only -- TODO confirm):
//   blk_len        presumably the quantization block length
//   quant_a_ptr    opaque bytes of the quantized A operand (read-only)
//   quant_b_data   opaque bytes of the quantized B operand (read-only)
//   quant_b_scale  float scales associated with B (read-only)
//   quant_b_zp     opaque bytes, presumably B zero points (read-only)
//   c_ptr          float output buffer (written by the kernel, presumably)
//   count_m/n/k    presumably the problem extents along M, N and K
//   block_count_k  presumably the number of blocks along K
//   ldc            presumably the leading dimension (row stride) of C
//   bias           float bias values (read-only); whether it may be null is
//                  not visible from this header
//   scale_stride   presumably the stride between entries of quant_b_scale
//
// Returns a size_t; its meaning is not established by this declaration
// (NOTE(review): possibly the number of rows processed -- verify).
size_t gemm_kernel_i8i4(size_t            blk_len,
                        const std::byte * quant_a_ptr,
                        const std::byte * quant_b_data,
                        const float *     quant_b_scale,
                        const std::byte * quant_b_zp,
                        float *           c_ptr,
                        size_t            count_m,
                        size_t            count_n,
                        size_t            count_k,
                        size_t            block_count_k,
                        size_t            ldc,
                        const float *     bias,
                        const size_t      scale_stride);

// Takes float input `a_ptr` with `count_k` as its length-like argument and an
// opaque byte output buffer `quant_a_ptr`.
// NOTE(review): presumably quantizes one row of A to int8 in blocks of
// `blk_len`; required output buffer size is not visible here -- confirm.
void quantize_a_row_i8(size_t blk_len, const float * a_ptr, size_t count_k, std::byte * quant_a_ptr);

// Same signature as quantize_a_row_i8.
// NOTE(review): presumably the four-rows-at-a-time variant; the input/output
// layout for the four rows is not visible here -- confirm.
void quantize_a_4row_i8(size_t blk_len, const float * a_ptr, size_t count_k, std::byte * quant_a_ptr);

}  // namespace ime1
}  // namespace sqnbitgemm_spacemit_ime