server : correct signal handler (#11795)

author Xuan-Son Nguyen <redacted>

Mon, 10 Feb 2025 17:03:28 +0000 (18:03 +0100)

committer GitHub <redacted>

Mon, 10 Feb 2025 17:03:28 +0000 (18:03 +0100)
author Xuan-Son Nguyen <redacted>
Mon, 10 Feb 2025 17:03:28 +0000 (18:03 +0100)
committer GitHub <redacted>
Mon, 10 Feb 2025 17:03:28 +0000 (18:03 +0100)
diff --git a/examples/server/server.cpp b/examples/server/server.cpp

index 0718806c89407ab97116f602a74f26e7e9b57d6a..5da3e187f740aac54cc4d7c93fef15d4a7194f94 100644 (file)
--- a/examples/server/server.cpp
+++ b/examples/server/server.cpp
@@ -1600,6 +1600,10 @@ struct server_queue {
  
              while (true) {
                  std::unique_lock<std::mutex> lock(mutex_tasks);
+                if (!running) {
+                    QUE_DBG("%s", "terminate\n");
+                    return;
+                }
                  if (queue_tasks.empty()) {
                      lock.unlock();
                      break;
@@ -1620,11 +1624,11 @@ struct server_queue {
              QUE_DBG("%s", "waiting for new tasks\n");
              {
                  std::unique_lock<std::mutex> lock(mutex_tasks);
+                if (!running) {
+                    QUE_DBG("%s", "terminate\n");
+                    return;
+                }
                  if (queue_tasks.empty()) {
-                    if (!running) {
-                        QUE_DBG("%s", "terminate\n");
-                        return;
-                    }
                      condition_tasks.wait(lock, [&]{
                          return (!queue_tasks.empty() || !running);
                      });
@@ -4430,6 +4434,7 @@ int main(int argc, char ** argv) {
  
      // clean up function, to be called before exit
      auto clean_up = [&svr]() {
+        SRV_INF("%s: cleaning up before exit...\n", __func__);
          svr->stop();
          llama_backend_free();
      };
@@ -4446,10 +4451,6 @@ int main(int argc, char ** argv) {
      }
  
      if (!was_bound) {
-        //LOG_ERROR("couldn't bind HTTP server socket", {
-        //    {"hostname", params.hostname},
-        //    {"port", params.port},
-        //});
          LOG_ERR("%s: couldn't bind HTTP server socket, hostname: %s, port: %d\n", __func__, params.hostname.c_str(), params.port);
          clean_up();
          return 1;
@@ -4466,7 +4467,7 @@ int main(int argc, char ** argv) {
  
      if (!ctx_server.load_model(params)) {
          clean_up();
-        t.join();
+        // t.join(); // FIXME: see below
          LOG_ERR("%s: exiting due to model loading error\n", __func__);
          return 1;
      }
@@ -4490,13 +4491,10 @@ int main(int argc, char ** argv) {
      });
  
      shutdown_handler = [&](int) {
+        // this will unblock start_loop()
          ctx_server.queue_tasks.terminate();
      };
  
-    LOG_INF("%s: server is listening on http://%s:%d - starting the main loop\n", __func__, params.hostname.c_str(), params.port);
-
-    ctx_server.queue_tasks.start_loop();
-
  #if defined (__unix__) || (defined (__APPLE__) && defined (__MACH__))
      struct sigaction sigint_action;
      sigint_action.sa_handler = signal_handler;
@@ -4511,8 +4509,13 @@ int main(int argc, char ** argv) {
      SetConsoleCtrlHandler(reinterpret_cast<PHANDLER_ROUTINE>(console_ctrl_handler), true);
  #endif
  
+    LOG_INF("%s: server is listening on http://%s:%d - starting the main loop\n", __func__, params.hostname.c_str(), params.port);
+
+    // this call blocks the main thread until queue_tasks.terminate() is called
+    ctx_server.queue_tasks.start_loop();
+
      clean_up();
-    t.join();
+    // t.join(); // FIXME: http thread may stuck if there is an on-going request. we don't need to care about this for now as the HTTP connection will already be closed at this point, but it's better to fix this
  
      return 0;
  }
author	Xuan-Son Nguyen <redacted>
	Mon, 10 Feb 2025 17:03:28 +0000 (18:03 +0100)
committer	GitHub <redacted>
	Mon, 10 Feb 2025 17:03:28 +0000 (18:03 +0100)