common : add support for cpu_get_num_physical_cores() on Windows (#8771)

author Liu Jia <redacted>

Fri, 16 Aug 2024 06:23:12 +0000 (14:23 +0800)

committer GitHub <redacted>

Fri, 16 Aug 2024 06:23:12 +0000 (09:23 +0300)
author Liu Jia <redacted>
Fri, 16 Aug 2024 06:23:12 +0000 (14:23 +0800)
committer GitHub <redacted>
Fri, 16 Aug 2024 06:23:12 +0000 (09:23 +0300)
diff --git a/common/common.cpp b/common/common.cpp

index ce46e65ae2834df99d22a64bfebe5e3703026350..382d585a5e6f900a1eb72fbd3abab2809b73d19f 100644 (file)
--- a/common/common.cpp
+++ b/common/common.cpp
@@ -110,8 +110,34 @@ int32_t cpu_get_num_physical_cores() {
      if (result == 0) {
          return num_physical_cores;
      }
-#elif defined(_WIN32)
-    //TODO: Implement
+#elif defined(_WIN32) && (_WIN32_WINNT >= 0x0601) && !defined(__MINGW64__) // windows 7 and later
+    // TODO: windows + arm64 + mingw64
+    unsigned int n_threads_win = std::thread::hardware_concurrency();
+    unsigned int default_threads = n_threads_win > 0 ? (n_threads_win <= 4 ? n_threads_win : n_threads_win / 2) : 4;
+
+    DWORD buffer_size = 0;
+    if (!GetLogicalProcessorInformationEx(RelationProcessorCore, nullptr, &buffer_size)) {
+        if (GetLastError() != ERROR_INSUFFICIENT_BUFFER) {
+            return default_threads;
+        }
+    }
+
+    std::vector<char> buffer(buffer_size);
+    if (!GetLogicalProcessorInformationEx(RelationProcessorCore, reinterpret_cast<PSYSTEM_LOGICAL_PROCESSOR_INFORMATION_EX>(buffer.data()), &buffer_size)) {
+        return default_threads;
+    }
+
+    int32_t num_physical_cores = 0;
+    PSYSTEM_LOGICAL_PROCESSOR_INFORMATION_EX info = reinterpret_cast<PSYSTEM_LOGICAL_PROCESSOR_INFORMATION_EX>(buffer.data());
+    while (buffer_size > 0) {
+        if (info->Relationship == RelationProcessorCore) {
+            num_physical_cores += info->Processor.GroupCount;
+        }
+        buffer_size -= info->Size;
+        info = reinterpret_cast<PSYSTEM_LOGICAL_PROCESSOR_INFORMATION_EX>(reinterpret_cast<char*>(info) + info->Size);
+    }
+
+    return num_physical_cores > 0 ? num_physical_cores : default_threads;
  #endif
      unsigned int n_threads = std::thread::hardware_concurrency();
      return n_threads > 0 ? (n_threads <= 4 ? n_threads : n_threads / 2) : 4;
@@ -1727,7 +1753,13 @@ std::string gpt_params_get_system_info(const gpt_params & params) {
      if (params.n_threads_batch != -1) {
          os << " (n_threads_batch = " << params.n_threads_batch << ")";
      }
+#if defined(_WIN32) && (_WIN32_WINNT >= 0x0601) && !defined(__MINGW64__) // windows 7 and later
+    // TODO: windows + arm64 + mingw64
+    DWORD logicalProcessorCount = GetActiveProcessorCount(ALL_PROCESSOR_GROUPS);
+    os << " / " << logicalProcessorCount << " | " << llama_print_system_info();
+#else
      os << " / " << std::thread::hardware_concurrency() << " | " << llama_print_system_info();
+#endif
  
      return os.str();
  }
author	Liu Jia <redacted>
	Fri, 16 Aug 2024 06:23:12 +0000 (14:23 +0800)
committer	GitHub <redacted>
	Fri, 16 Aug 2024 06:23:12 +0000 (09:23 +0300)