git.djapps.eu Git - pkg/ggml/sources/llama.cpp/commitdiff
server bench: fix bench not waiting for model load (#7284)
author: Johannes Gäßler <redacted>
Wed, 15 May 2024 06:44:16 +0000 (08:44 +0200)
committer: GitHub <redacted>
Wed, 15 May 2024 06:44:16 +0000 (08:44 +0200)
examples/server/bench/bench.py

index 86c5de101445c162c6150b25c73fbde1255afe0a..25ac29c4c7145d8609c95b8515191330cadb1bcf 100644 (file)
@@ -293,13 +293,14 @@ def start_server_background(args):
 
 
 def is_server_listening(server_fqdn, server_port):
-    with closing(socket.socket(socket.AF_INET, socket.SOCK_STREAM)) as sock:
-        result = sock.connect_ex((server_fqdn, server_port))
-        _is_server_listening = result == 0
-        if _is_server_listening:
-            print(f"server is listening on {server_fqdn}:{server_port}...")
-        return _is_server_listening
-
+    try:
+        url = f"{server_fqdn}:{server_port}/health"
+        if not url.startswith("http://"):
+            url = f"http://{url}"
+        result = requests.get(url)
+        return result.status_code == 200
+    except Exception:
+        return False
 
 def escape_metric_name(metric_name):
     return re.sub('[^A-Z0-9]', '_', metric_name.upper())