#include "common.h"
#include "log.h"
-// Change JSON_ASSERT from assert() to GGML_ASSERT:
-#define JSON_ASSERT GGML_ASSERT
-#include "json.hpp"
#include "llama.h"
#include <algorithm>
#pragma warning(disable: 4244 4267) // possible loss of data
#endif
-using json = nlohmann::ordered_json;
-
//
// CPU utils
//
return result;
}
-
-template <>
-json common_grammar_trigger::to_json() const {
- json out {
- {"type", (int) type},
- {"value", value},
- };
- if (type == COMMON_GRAMMAR_TRIGGER_TYPE_TOKEN) {
- out["token"] = (int) token;
- }
- return out;
-}
-
-template <>
-common_grammar_trigger common_grammar_trigger::from_json(const json & in) {
- common_grammar_trigger out;
- out.type = (common_grammar_trigger_type) in.at("type").get<int>();
- out.value = in.at("value").get<std::string>();
- if (out.type == COMMON_GRAMMAR_TRIGGER_TYPE_TOKEN) {
- out.token = (llama_token) in.at("token").get<int>();
- }
- return out;
-}
common_grammar_trigger_type type;
std::string value;
llama_token token = LLAMA_TOKEN_NULL;
-
- // T can only be nlohmann::ordered_json
- template <class T> T to_json() const;
- template <class T> static common_grammar_trigger from_json(const T & in);
};
// sampling parameters
auto grammar_triggers = json::array();
for (const auto & trigger : sampling.grammar_triggers) {
- grammar_triggers.push_back(trigger.to_json<json>());
+ server_grammar_trigger ct(std::move(trigger));
+ grammar_triggers.push_back(ct.to_json());
}
return json {
const auto grammar_triggers = data.find("grammar_triggers");
if (grammar_triggers != data.end()) {
for (const auto & t : *grammar_triggers) {
- auto ct = common_grammar_trigger::from_json(t);
- if (ct.type == COMMON_GRAMMAR_TRIGGER_TYPE_WORD) {
- const auto & word = ct.value;
+ server_grammar_trigger ct(t);
+ if (ct.value.type == COMMON_GRAMMAR_TRIGGER_TYPE_WORD) {
+ const auto & word = ct.value.value;
auto ids = common_tokenize(vocab, word, /* add_special= */ false, /* parse_special= */ true);
if (ids.size() == 1) {
auto token = ids[0];
params.sampling.grammar_triggers.push_back({COMMON_GRAMMAR_TRIGGER_TYPE_WORD, word});
}
} else {
- params.sampling.grammar_triggers.push_back(ct);
+ params.sampling.grammar_triggers.push_back(std::move(ct.value));
}
}
}
const static std::string build_info("b" + std::to_string(LLAMA_BUILD_NUMBER) + "-" + LLAMA_COMMIT);
+// thin wrapper around common_grammar_trigger with (de)serialization functions
+// (the serialization format: {"type": <int>, "value": <string>[, "token": <int>]})
+struct server_grammar_trigger {
+ // the wrapped trigger; all (de)serialization reads/writes go through this member
+ common_grammar_trigger value;
+
+ server_grammar_trigger() = default;
+ // wrap an existing trigger (copies it)
+ server_grammar_trigger(const common_grammar_trigger & value) : value(value) {}
+ // deserialize from JSON; uses json::at(), so this throws (nlohmann
+ // json::out_of_range / type_error) if "type"/"value" are missing or mistyped
+ server_grammar_trigger(const json & in) {
+ value.type = (common_grammar_trigger_type) in.at("type").get<int>();
+ value.value = in.at("value").get<std::string>();
+ // "token" is only present/meaningful for token-type triggers
+ if (value.type == COMMON_GRAMMAR_TRIGGER_TYPE_TOKEN) {
+ value.token = (llama_token) in.at("token").get<int>();
+ }
+ }
+
+ // serialize to JSON; the enum type and the token id are widened to int so the
+ // output stays plain JSON numbers — from_json above applies the inverse casts
+ json to_json() const {
+ json out {
+ {"type", (int) value.type},
+ {"value", value.value},
+ };
+ // mirror the constructor: emit "token" only for token-type triggers
+ if (value.type == COMMON_GRAMMAR_TRIGGER_TYPE_TOKEN) {
+ out["token"] = (int) value.token;
+ }
+ return out;
+ }
+};
+
//
// tokenizer and input processing utils
//
llama_params["grammar_lazy"] = chat_params.grammar_lazy;
auto grammar_triggers = json::array();
for (const auto & trigger : chat_params.grammar_triggers) {
- grammar_triggers.push_back(trigger.to_json<json>());
+ server_grammar_trigger ct(trigger);
+ grammar_triggers.push_back(ct.to_json());
}
llama_params["grammar_triggers"] = grammar_triggers;
llama_params["preserved_tokens"] = chat_params.preserved_tokens;