Add --threads flag for llama.cpp

This commit is contained in:
oobabooga 2023-03-31 21:18:05 -03:00
parent eeafd60713
commit 2c52310642
3 changed files with 57 additions and 35 deletions

View file

@@ -1,5 +1,8 @@
import multiprocessing
import llamacpp
from modules import shared
from modules.callbacks import Iteratorize
@@ -29,6 +32,7 @@ class LlamaCppModel:
def from_pretrained(self, path):
params = llamacpp.InferenceParams()
params.path_model = str(path)
params.n_threads = shared.args.threads or multiprocessing.cpu_count() // 2
_model = llamacpp.LlamaInference(params)