Skip to content

Commit f088b6a

Browse files
authored
server : adjust prompt similarity thold + add logs (#15913)
ggml-ci
1 parent 304ac56 commit f088b6a

File tree

2 files changed

+3
-3
lines changed

2 files changed

+3
-3
lines changed

common/common.h

Lines changed: 1 addition & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -452,7 +452,7 @@ struct common_params {
452452

453453
std::string slot_save_path;
454454

455-
float slot_prompt_similarity = 0.5f;
455+
float slot_prompt_similarity = 0.1f;
456456

457457
// batched-bench params
458458
bool is_pp_shared = false;

tools/server/server.cpp

Lines changed: 2 additions & 2 deletions
Original file line number | Diff line number | Diff line change
@@ -2372,7 +2372,7 @@ struct server_context {
23722372
}
23732373

23742374
if (ret != nullptr) {
2375-
SLT_DBG(*ret, "selected slot by lcs similarity, lcs_len = %d, similarity = %f\n", lcs_len, similarity);
2375+
SLT_INF(*ret, "selected slot by lcs similarity, lcs_len = %d, similarity = %.3f (> %.3f thold)\n", lcs_len, similarity, slot_prompt_similarity);
23762376
}
23772377
}
23782378

@@ -2394,7 +2394,7 @@ struct server_context {
23942394
}
23952395

23962396
if (ret != nullptr) {
2397-
SLT_DBG(*ret, "selected slot by lru, t_last = %" PRId64 "\n", t_last);
2397+
SLT_INF(*ret, "selected slot by LRU, t_last = %" PRId64 "\n", t_last);
23982398
}
23992399
}
24002400

0 commit comments

Comments
 (0)