server : fix LRU check (#14079)

ggml-ci
This commit is contained in:
Georgi Gerganov 2025-06-09 12:57:58 +03:00 committed by GitHub
parent b460d16ae8
commit 87d34b381d
No known key found for this signature in database
GPG key ID: B5690EEEBB952194

View file

@@ -2142,7 +2142,8 @@ struct server_context {
// find the slot that has been least recently used // find the slot that has been least recently used
if (ret == nullptr) { if (ret == nullptr) {
int64_t t_last = ggml_time_us(); int64_t t_last = -1;
for (server_slot & slot : slots) { for (server_slot & slot : slots) {
// skip the slot if it is not available // skip the slot if it is not available
if (slot.is_processing()) { if (slot.is_processing()) {
@@ -2150,7 +2151,7 @@ struct server_context {
} }
// select the current slot if the criteria match // select the current slot if the criteria match
if (slot.t_last_used < t_last) { if (!ret || slot.t_last_used <= t_last) {
t_last = slot.t_last_used; t_last = slot.t_last_used;
ret = &slot; ret = &slot;
} }