Skip to content

Commit 105e2f3

Browse files
committed
fix use-after-free
1 parent 937b064 commit 105e2f3

1 file changed

Lines changed: 3 additions & 6 deletions

File tree

tools/server/server-context.cpp

Lines changed: 3 additions & 6 deletions
Original file line number | Diff line number | Diff line change
@@ -809,14 +809,11 @@ struct server_context_impl {
809 809   batch = llama_batch_init(std::max(n_batch, params_base.n_parallel), 0, 1);
810 810   }
811 811
812     - if (is_resume) {
813     - return true;
    812 + // preserve metric state across resumes
    813 + if (!is_resume) {
    814 + metrics.init();
814 815   }
815 816
816     - // everything below this line is only for fresh model load
817     -
818     - metrics.init();
819     -
820 817   if (params_base.cache_ram_mib != 0) {
821 818   if (params_base.cache_ram_mib < 0) {
822 819   SRV_WRN("prompt cache is enabled, size limit: %s\n", "no limit");

0 commit comments

Comments
 (0)