llama-bench : fix RPC indication (#7936)

author Radoslav Gerganov <redacted>
Fri, 14 Jun 2024 13:47:41 +0000 (16:47 +0300)
committer GitHub <redacted>
Fri, 14 Jun 2024 13:47:41 +0000 (16:47 +0300)
diff --git a/examples/llama-bench/llama-bench.cpp b/examples/llama-bench/llama-bench.cpp

index 61dd1d71ab5e9fe300221729874e4f60754c4d94..d641a9f12b3887b180b00afa762f9f9b7511de3e 100644 (file)
--- a/examples/llama-bench/llama-bench.cpp
+++ b/examples/llama-bench/llama-bench.cpp
@@ -714,7 +714,6 @@ struct test {
      static const bool kompute;
      static const bool metal;
      static const bool sycl;
-    static const bool rpc;
      static const bool gpu_blas;
      static const bool blas;
      static const std::string cpu_info;
@@ -726,6 +725,7 @@ struct test {
      int n_batch;
      int n_ubatch;
      int n_threads;
+    bool has_rpc;
      ggml_type type_k;
      ggml_type type_v;
      int n_gpu_layers;
@@ -751,6 +751,7 @@ struct test {
          n_batch = inst.n_batch;
          n_ubatch = inst.n_ubatch;
          n_threads = inst.n_threads;
+        has_rpc = !inst.rpc_servers.empty();
          type_k = inst.type_k;
          type_v = inst.type_v;
          n_gpu_layers = inst.n_gpu_layers;
@@ -810,9 +811,6 @@ struct test {
          if (sycl) {
              return GGML_SYCL_NAME;
          }
-        if (rpc) {
-            return "RPC";
-        }
          if (gpu_blas) {
              return "GPU BLAS";
          }
@@ -882,7 +880,7 @@ struct test {
          std::vector<std::string> values = {
              build_commit, std::to_string(build_number),
              std::to_string(cuda), std::to_string(vulkan), std::to_string(vulkan),
-            std::to_string(metal), std::to_string(sycl), std::to_string(rpc), std::to_string(gpu_blas), std::to_string(blas),
+            std::to_string(metal), std::to_string(sycl), std::to_string(has_rpc), std::to_string(gpu_blas), std::to_string(blas),
              cpu_info, gpu_info,
              model_filename, model_type, std::to_string(model_size), std::to_string(model_n_params),
              std::to_string(n_batch), std::to_string(n_ubatch),
@@ -916,7 +914,6 @@ const bool        test::metal        = !!ggml_cpu_has_metal();
  const bool        test::gpu_blas     = !!ggml_cpu_has_gpublas();
  const bool        test::blas         = !!ggml_cpu_has_blas();
  const bool        test::sycl         = !!ggml_cpu_has_sycl();
-const bool        test::rpc          = !!ggml_cpu_has_rpc();
  const std::string test::cpu_info     = get_cpu_info();
  const std::string test::gpu_info     = get_gpu_info();
  
@@ -1182,6 +1179,9 @@ struct markdown_printer : public printer {
                  value = buf;
              } else if (field == "backend") {
                  value = test::get_backend();
+                if (t.has_rpc) {
+                    value += "+RPC";
+                }
              } else if (field == "test") {
                  if (t.n_prompt > 0 && t.n_gen == 0) {
                      snprintf(buf, sizeof(buf), "pp%d", t.n_prompt);
author	Radoslav Gerganov <redacted>
	Fri, 14 Jun 2024 13:47:41 +0000 (16:47 +0300)
committer	GitHub <redacted>
	Fri, 14 Jun 2024 13:47:41 +0000 (16:47 +0300)