server: tests - slow inference causes timeout on the CI (#5715)

author Pierrick Hymbert <redacted>

Sun, 25 Feb 2024 21:48:33 +0000 (22:48 +0100)

committer GitHub <redacted>

Sun, 25 Feb 2024 21:48:33 +0000 (22:48 +0100)
author Pierrick Hymbert <redacted>
Sun, 25 Feb 2024 21:48:33 +0000 (22:48 +0100)
committer GitHub <redacted>
Sun, 25 Feb 2024 21:48:33 +0000 (22:48 +0100)
diff --git a/common/sampling.cpp b/common/sampling.cpp

index de4331a1182d6aaf39e5873f46b5d8ace97eea9f..e67096bea693262d0b4a5d244c37d52d48ae5453 100644 (file)
--- a/common/sampling.cpp
+++ b/common/sampling.cpp
@@ -266,7 +266,7 @@ static llama_token llama_sampling_sample_impl(
              //    }
              //}
  
-            LOG("sampled token: %5d: '%s'\n", id, llama_token_to_piece(ctx_main, id).c_str());
+            //LOG("sampled token: %5d: '%s'\n", id, llama_token_to_piece(ctx_main, id).c_str());
          }
      }
  
diff --git a/examples/server/tests/features/steps/steps.py b/examples/server/tests/features/steps/steps.py

index 8e4babf204f8ac7654406be3b755f8a5559971c3..ad87fcb820aa8f856d8ad9467b3599de32745970 100644 (file)
--- a/examples/server/tests/features/steps/steps.py
+++ b/examples/server/tests/features/steps/steps.py
@@ -699,6 +699,8 @@ async def wait_for_health_status(context,
      if context.debug:
          print(f"Starting checking for health for expected_health_status={expected_health_status}")
      timeout = 3  # seconds
+    if expected_health_status == 'ok':
+        timeout = 10 # CI slow inference
      interval = 0.5
      counter = 0
      async with aiohttp.ClientSession() as session:
@@ -736,7 +738,7 @@ async def wait_for_health_status(context,
                          if n_completions > 0:
                              return
  
-                assert False, 'timeout exceeded'
+                assert False, f'{expected_health_status} timeout exceeded {counter}s>={timeout}'
  
  
  def assert_embeddings(embeddings):
author	Pierrick Hymbert <redacted>
	Sun, 25 Feb 2024 21:48:33 +0000 (22:48 +0100)
committer	GitHub <redacted>
	Sun, 25 Feb 2024 21:48:33 +0000 (22:48 +0100)
common/sampling.cpp		patch | blob | history
examples/server/tests/features/steps/steps.py		patch | blob | history