Skip to content

Commit 79a37ec

Browse files
committed
Avoid mlock of offloaded tensors.
1 parent 05c2f76 commit 79a37ec

File tree

1 file changed

+6
-5
lines changed

1 file changed

+6
-5
lines changed

llama.cpp

+6 -5
Original file line number | Diff line number | Diff line change
@@ -715,8 +715,12 @@ struct llama_model_loader {
715715
load_data_for(lt);
716716
switch(lt.ggml_tensor->backend) {
717717
case GGML_BACKEND_CPU:
718-
lt.ggml_tensor->data = lt.data;
719-
break;
718+
lt.ggml_tensor->data = lt.data;
719+
if (use_mmap && lmlock)
720+
{
721+
lmlock->grow_to(done_size);
722+
}
723+
break;
720724
#ifdef GGML_USE_CUBLAS
721725
case GGML_BACKEND_CUDA:
722726
ggml_cuda_load_data(lt.data, lt.ggml_tensor);
@@ -731,9 +735,6 @@ struct llama_model_loader {
731735
continue;
732736
}
733737
done_size += lt.size;
734-
if (use_mmap && lmlock) {
735-
lmlock->grow_to(done_size);
736-
}
737738
}
738739
}
739740

0 commit comments

Comments
 (0)