if (is_processing()) {
SLT_INF(*this, "stop processing: n_past = %d, truncated = %d\n", n_past, truncated);
+ t_last_used = ggml_time_us();
t_token_generation = (ggml_time_us() - t_start_generation) / 1e3;
state = SLOT_STATE_IDLE;
callback_on_release(id);
// find the slot that has at least n% prompt similarity
if (ret == nullptr && slot_prompt_similarity != 0.0f) {
- int max_lcs_len = 0;
+ int lcs_len = 0;
float similarity = 0;
for (server_slot & slot : slots) {
}
// length of the Longest Common Subsequence between the current slot's prompt and the input prompt
- int lcs_len = longest_common_subsequence(slot.cache_tokens, task.prompt_tokens);
+ int cur_lcs_len = longest_common_subsequence(slot.cache_tokens, task.prompt_tokens);
// fraction of the common subsequence length compared to the current slot's prompt length
- similarity = static_cast<float>(lcs_len) / static_cast<int>(slot.cache_tokens.size());
+ float cur_similarity = static_cast<float>(cur_lcs_len) / static_cast<int>(slot.cache_tokens.size());
// select the current slot if the criteria match
- if (lcs_len > max_lcs_len && similarity > slot_prompt_similarity) {
- max_lcs_len = lcs_len;
+ if (cur_lcs_len > lcs_len && cur_similarity > slot_prompt_similarity) {
+ lcs_len = cur_lcs_len;
+ similarity = cur_similarity;
ret = &slot;
}
}
if (ret != nullptr) {
- SLT_DBG(*ret, "selected slot by lcs similarity, max_lcs_len = %d, similarity = %f\n", max_lcs_len, similarity);
+ SLT_DBG(*ret, "selected slot by lcs similarity, lcs_len = %d, similarity = %f\n", lcs_len, similarity);
}
}
}
// get the lengths of the input sequences
- int a_len = a.size();
- int b_len = b.size();
+ size_t a_len = a.size();
+ size_t b_len = b.size();
// initialize the maximum length of the longest common subsequence (LCS)
- int max_length = 0;
+ size_t max_length = 0;
// use two rows instead of a 2D matrix to optimize space
- std::vector<int> prev_row(b_len + 1, 0);
- std::vector<int> curr_row(b_len + 1, 0);
+ std::vector<size_t> prev_row(b_len + 1, 0);
+ std::vector<size_t> curr_row(b_len + 1, 0);
// iterate through the elements of a
- for (int i = 1; i <= a_len; i++) {
+ for (size_t i = 1; i <= a_len; i++) {
// iterate through the elements of b
- for (int j = 1; j <= b_len; j++) {
+ for (size_t j = 1; j <= b_len; j++) {
// if elements at the current positions match
if (a[i - 1] == b[j - 1]) {
// if it's the first element of either sequences, set LCS length to 1