Skip to content

Commit f8d561e

Browse files
llama-fit-params: fix step size for last device (ggml-org#18415)
1 parent e59efe6 commit f8d561e

1 file changed

Lines changed: 3 additions & 0 deletions

File tree

src/llama.cpp

Lines changed: 3 additions & 0 deletions
Original file line number | Diff line number | Diff line change
@@ -512,6 +512,9 @@ static void llama_params_fit_impl(
512 512
if (mem_high[id] > targets[id]) {
513 513
assert(ngl_per_device_high[id].n_layer > ngl_per_device[id].n_layer);
514 514
uint32_t delta = ngl_per_device_high[id].n_layer - ngl_per_device[id].n_layer;
515 +
if (hp_nex > 0 && size_t(id) == nd - 1) {
516 +
delta--;
517 +
}
515 518
LLAMA_LOG_DEBUG("%s: start filling device %" PRIu32 ", delta=%" PRIu32 "\n", __func__, id, delta);
516 519
while (delta > 1) {
517 520
uint32_t step_size = int64_t(delta) * (targets[id] - mem[id]) / (mem_high[id] - mem[id]);

0 commit comments

Comments
 (0)