ggml : fix arm repack build (whisper/0)

author Georgi Gerganov <redacted>

Sat, 13 Dec 2025 06:04:09 +0000 (08:04 +0200)

committer Georgi Gerganov <redacted>

Sun, 14 Dec 2025 06:33:51 +0000 (08:33 +0200)
author Georgi Gerganov <redacted>
Sat, 13 Dec 2025 06:04:09 +0000 (08:04 +0200)
committer Georgi Gerganov <redacted>
Sun, 14 Dec 2025 06:33:51 +0000 (08:33 +0200)
diff --git a/ggml/src/ggml-cpu/arch/arm/repack.cpp b/ggml/src/ggml-cpu/arch/arm/repack.cpp
index 683ed8d2df1c397084381583feeabbcc2a79d882..fc62f1b86e331f099c4846bf54f9066d6d37b637 100644
--- a/ggml/src/ggml-cpu/arch/arm/repack.cpp
+++ b/ggml/src/ggml-cpu/arch/arm/repack.cpp
@@ -24,6 +24,7 @@
  
  #define UNUSED GGML_UNUSED
  
+#if defined(__aarch64__) && defined(__ARM_NEON) && defined(__ARM_FEATURE_MATMUL_INT8)
  static inline void decode_q4_Kx8_scales_mins(const uint8_t * scales_in,
                                               int16x8_t *     out_mins,
                                               int8_t *        out_scales) {
@@ -46,6 +47,7 @@ static inline void decode_q4_Kx8_scales_mins(const uint8_t * scales_in,
      scales_u32[1] = (sm[2] & kmask2) | (((sm[0] >> 6) & kmask3) << 4);
      memcpy(out_scales, scales_u32, 8);
  }
+#endif
  
  void ggml_quantize_mat_q8_0_4x4(const float * GGML_RESTRICT x, void * GGML_RESTRICT vy, int64_t k) {
      assert(QK8_0 == 32);
author	Georgi Gerganov <redacted>
	Sat, 13 Dec 2025 06:04:09 +0000 (08:04 +0200)
committer	Georgi Gerganov <redacted>
	Sun, 14 Dec 2025 06:33:51 +0000 (08:33 +0200)