cpu : add FLOOR, CEIL, ROUND and TRUNC unary operators (llama/16083)

author safranowith <redacted>

Wed, 15 Oct 2025 19:24:51 +0000 (22:24 +0300)

committer Georgi Gerganov <redacted>

Tue, 21 Oct 2025 15:14:33 +0000 (18:14 +0300)
author safranowith <redacted>
Wed, 15 Oct 2025 19:24:51 +0000 (22:24 +0300)
committer Georgi Gerganov <redacted>
Tue, 21 Oct 2025 15:14:33 +0000 (18:14 +0300)
diff --git a/include/ggml.h b/include/ggml.h

index 60c6b63d05978fa2a2c457d8db8e79371040c0f3..d948b00cc7f3048258b358ff32410d2e20204fb6 100644 (file)
--- a/include/ggml.h
+++ b/include/ggml.h
@@ -577,6 +577,10 @@ extern "C" {
          GGML_UNARY_OP_EXP,
          GGML_UNARY_OP_GELU_ERF,
          GGML_UNARY_OP_XIELU,
+        GGML_UNARY_OP_FLOOR,
+        GGML_UNARY_OP_CEIL,
+        GGML_UNARY_OP_ROUND,
+        GGML_UNARY_OP_TRUNC,
  
          GGML_UNARY_OP_COUNT,
      };
@@ -1151,6 +1155,46 @@ extern "C" {
              struct ggml_context * ctx,
              struct ggml_tensor  * a);
  
+    GGML_API struct ggml_tensor * ggml_floor(
+            struct ggml_context * ctx,
+            struct ggml_tensor  * a);
+
+    GGML_API struct ggml_tensor * ggml_floor_inplace(
+            struct ggml_context * ctx,
+            struct ggml_tensor  * a);
+
+    GGML_API struct ggml_tensor * ggml_ceil(
+            struct ggml_context * ctx,
+            struct ggml_tensor  * a);
+
+    GGML_API struct ggml_tensor * ggml_ceil_inplace(
+            struct ggml_context * ctx,
+            struct ggml_tensor  * a);
+
+    GGML_API struct ggml_tensor * ggml_round(
+            struct ggml_context * ctx,
+            struct ggml_tensor  * a);
+
+    GGML_API struct ggml_tensor * ggml_round_inplace(
+            struct ggml_context * ctx,
+            struct ggml_tensor  * a);
+
+     /**
+     * Truncates the fractional part of each element in the tensor (towards zero).
+     * For example: trunc(3.7) = 3.0, trunc(-2.9) = -2.0
+     * Similar to std::trunc in C/C++.
+     */
+
+    GGML_API struct ggml_tensor * ggml_trunc(
+            struct ggml_context * ctx,
+            struct ggml_tensor  * a);
+
+    GGML_API struct ggml_tensor * ggml_trunc_inplace(
+            struct ggml_context * ctx,
+            struct ggml_tensor  * a);
+
+
+
      // xIELU activation function
      // x = x * (c_a(alpha_n) + c_b(alpha_p, beta) * sigmoid(beta * x)) + eps * (x > 0)
      // where c_a = softplus and c_b(a, b) = softplus(a) + b are constraining functions
diff --git a/src/ggml-cpu/ggml-cpu.c b/src/ggml-cpu/ggml-cpu.c

index ba2a36d99912871efe05f2a5ea22592c16fc9a67..29c870600ba93b022c860de4f5596fdedb4d0793 100644 (file)
--- a/src/ggml-cpu/ggml-cpu.c
+++ b/src/ggml-cpu/ggml-cpu.c
@@ -2184,6 +2184,10 @@ static int ggml_get_n_tasks(struct ggml_tensor * node, int n_threads) {
                  case GGML_UNARY_OP_HARDSWISH:
                  case GGML_UNARY_OP_HARDSIGMOID:
                  case GGML_UNARY_OP_EXP:
+                case GGML_UNARY_OP_FLOOR:
+                case GGML_UNARY_OP_CEIL:
+                case GGML_UNARY_OP_ROUND:
+                case GGML_UNARY_OP_TRUNC:
                      {
                          n_tasks = 1;
                      } break;
diff --git a/src/ggml-cpu/ops.cpp b/src/ggml-cpu/ops.cpp

index 1c43865ff65fcff2677c50b9981b24672f1ea396..b52f0f8472cfe1db2ee687caf599ab09fe0375c1 100644 (file)
--- a/src/ggml-cpu/ops.cpp
+++ b/src/ggml-cpu/ops.cpp
@@ -8993,6 +8993,22 @@ void ggml_compute_forward_unary(
              {
                  ggml_compute_forward_exp(params, dst);
              } break;
+        case GGML_UNARY_OP_FLOOR:
+            {
+                ggml_compute_forward_floor(params, dst);
+            } break;
+        case GGML_UNARY_OP_CEIL:
+            {
+                ggml_compute_forward_ceil(params, dst);
+            } break;
+        case GGML_UNARY_OP_ROUND:
+            {
+                ggml_compute_forward_round(params, dst);
+            } break;
+        case GGML_UNARY_OP_TRUNC:
+            {
+                ggml_compute_forward_trunc(params, dst);
+            } break;
          case GGML_UNARY_OP_XIELU:
              {
                  ggml_compute_forward_xielu(params, dst);
diff --git a/src/ggml-cpu/unary-ops.cpp b/src/ggml-cpu/unary-ops.cpp

index cf1a4615d042cd27001f3e3450cd3aa47c22ce53..a047537b34f78ffabb9cb62cb3bff1cc642f8036 100644 (file)
--- a/src/ggml-cpu/unary-ops.cpp
+++ b/src/ggml-cpu/unary-ops.cpp
@@ -73,6 +73,22 @@ static inline float op_log(float x) {
      return logf(x);
  }
  
+static inline float op_floor(float x) {
+    return floorf(x);
+}
+
+static inline float op_ceil(float x) {
+    return ceilf(x);
+}
+
+static inline float op_round(float x) {
+    return roundf(x);
+}
+
+static inline float op_trunc(float x) {
+    return truncf(x);
+}
+
  template <float (*op)(float), typename src0_t, typename dst_t>
  static inline void vec_unary_op(int64_t n, dst_t * y, const src0_t * x) {
      constexpr auto src0_to_f32 = type_conversion_table<src0_t>::to_f32;
@@ -274,6 +290,22 @@ void ggml_compute_forward_log(const ggml_compute_params * params, ggml_tensor *
      unary_op<op_log>(params, dst);
  }
  
+void ggml_compute_forward_floor(const ggml_compute_params * params, ggml_tensor * dst) {
+    unary_op<op_floor>(params, dst);
+}
+
+void ggml_compute_forward_ceil(const ggml_compute_params * params, ggml_tensor * dst) {
+    unary_op<op_ceil>(params, dst);
+}
+
+void ggml_compute_forward_round(const ggml_compute_params * params, ggml_tensor * dst) {
+    unary_op<op_round>(params, dst);
+}
+
+void ggml_compute_forward_trunc(const ggml_compute_params * params, ggml_tensor * dst) {
+    unary_op<op_trunc>(params, dst);
+}
+
  void ggml_compute_forward_xielu(const ggml_compute_params * params, ggml_tensor * dst) {
      const float alpha_n = ggml_get_op_params_f32(dst, 1);
      const float alpha_p = ggml_get_op_params_f32(dst, 2);
diff --git a/src/ggml-cpu/unary-ops.h b/src/ggml-cpu/unary-ops.h

index 697c1e0da0ace50739973cd1bc91e430273bff7d..fa45d9f0e636fc5890432bc73d27ed563c434186 100644 (file)
--- a/src/ggml-cpu/unary-ops.h
+++ b/src/ggml-cpu/unary-ops.h
@@ -22,6 +22,10 @@ void ggml_compute_forward_sqrt(const struct ggml_compute_params * params, struct
  void ggml_compute_forward_sin(const struct ggml_compute_params * params, struct ggml_tensor * dst);
  void ggml_compute_forward_cos(const struct ggml_compute_params * params, struct ggml_tensor * dst);
  void ggml_compute_forward_log(const struct ggml_compute_params * params, struct ggml_tensor * dst);
+void ggml_compute_forward_floor(const struct ggml_compute_params * params, struct ggml_tensor * dst);
+void ggml_compute_forward_ceil(const struct ggml_compute_params * params, struct ggml_tensor * dst);
+void ggml_compute_forward_round(const struct ggml_compute_params * params, struct ggml_tensor * dst);
+void ggml_compute_forward_trunc(const struct ggml_compute_params * params, struct ggml_tensor * dst);
  void ggml_compute_forward_xielu(const struct ggml_compute_params * params, struct ggml_tensor * dst);
  
  #ifdef __cplusplus
diff --git a/src/ggml.c b/src/ggml.c

index 2bce1375ba3c089a458090e62e6df3cb9d7f69be..86f1c31afd7a6254e4b9013ca80cd6010ac0e267 100644 (file)
--- a/src/ggml.c
+++ b/src/ggml.c
@@ -1144,9 +1144,13 @@ static const char * GGML_UNARY_OP_NAME[GGML_UNARY_OP_COUNT] = {
      "EXP",
      "GELU_ERF",
      "XIELU",
+    "FLOOR",
+    "CEIL",
+    "ROUND",
+    "TRUNC",
  };
  
-static_assert(GGML_UNARY_OP_COUNT == 16, "GGML_UNARY_OP_COUNT != 16");
+static_assert(GGML_UNARY_OP_COUNT == 20, "GGML_UNARY_OP_COUNT != 20");
  
  static const char * GGML_GLU_OP_NAME[GGML_GLU_OP_COUNT] = {
      "REGLU",
@@ -2749,6 +2753,62 @@ static struct ggml_tensor * ggml_glu_impl(
      return result;
  }
  
+// ggml_floor
+
+struct ggml_tensor * ggml_floor(
+        struct ggml_context * ctx,
+        struct ggml_tensor  * a) {
+    return ggml_unary(ctx, a, GGML_UNARY_OP_FLOOR);
+}
+
+struct ggml_tensor * ggml_floor_inplace(
+        struct ggml_context * ctx,
+        struct ggml_tensor  * a) {
+    return ggml_unary_inplace(ctx, a, GGML_UNARY_OP_FLOOR);
+}
+
+// ggml_ceil
+
+struct ggml_tensor * ggml_ceil(
+        struct ggml_context * ctx,
+        struct ggml_tensor  * a) {
+    return ggml_unary(ctx, a, GGML_UNARY_OP_CEIL);
+}
+
+struct ggml_tensor * ggml_ceil_inplace(
+        struct ggml_context * ctx,
+        struct ggml_tensor  * a) {
+    return ggml_unary_inplace(ctx, a, GGML_UNARY_OP_CEIL);
+}
+
+//ggml_round
+
+struct ggml_tensor * ggml_round(
+        struct ggml_context * ctx,
+        struct ggml_tensor  * a) {
+    return ggml_unary(ctx, a, GGML_UNARY_OP_ROUND);
+}
+
+struct ggml_tensor * ggml_round_inplace(
+        struct ggml_context * ctx,
+        struct ggml_tensor  * a) {
+    return ggml_unary_inplace(ctx, a, GGML_UNARY_OP_ROUND);
+}
+
+//ggml_trunc
+
+struct ggml_tensor * ggml_trunc(
+        struct ggml_context * ctx,
+        struct ggml_tensor  * a) {
+    return ggml_unary(ctx, a, GGML_UNARY_OP_TRUNC);
+}
+
+struct ggml_tensor * ggml_trunc_inplace(
+        struct ggml_context * ctx,
+        struct ggml_tensor  * a) {
+    return ggml_unary_inplace(ctx, a, GGML_UNARY_OP_TRUNC);
+}
+
  struct ggml_tensor * ggml_glu(
          struct ggml_context * ctx,
          struct ggml_tensor  * a,
author	safranowith <redacted>
	Wed, 15 Oct 2025 19:24:51 +0000 (22:24 +0300)
committer	Georgi Gerganov <redacted>
	Tue, 21 Oct 2025 15:14:33 +0000 (18:14 +0300)
include/ggml.h		patch \| blob \| history
src/ggml-cpu/ggml-cpu.c		patch \| blob \| history
src/ggml-cpu/ops.cpp		patch \| blob \| history
src/ggml-cpu/unary-ops.cpp		patch \| blob \| history
src/ggml-cpu/unary-ops.h		patch \| blob \| history
src/ggml.c		patch \| blob \| history