Add CUDA wheels for llama-cpp-python by jllllll
This commit is contained in:
parent
05f4cc63c8
commit
4b19b74e6c
3 changed files with 19 additions and 7 deletions
|
@@ -9,12 +9,17 @@ https://abetlen.github.io/llama-cpp-python/
|
|||
import re
|
||||
from functools import partial
|
||||
|
||||
from llama_cpp import Llama, LlamaCache, LogitsProcessorList
|
||||
import torch
|
||||
|
||||
from modules import shared
|
||||
from modules.callbacks import Iteratorize
|
||||
from modules.logging_colors import logger
|
||||
|
||||
# Select the llama-cpp-python backend at import time: prefer the CUDA wheel
# (llama_cpp_cuda) when a GPU is visible, otherwise fall back to the CPU
# package. Both packages export the same public names (Llama, LlamaCache,
# LogitsProcessorList), so the rest of this module is backend-agnostic.
if torch.cuda.is_available():
    from llama_cpp_cuda import Llama, LlamaCache, LogitsProcessorList
else:
    from llama_cpp import Llama, LlamaCache, LogitsProcessorList
|
||||
|
||||
|
||||
def ban_eos_logits_processor(eos_token, input_ids, logits):
    """Forbid the EOS token during sampling.

    Sets the score of ``eos_token`` to ``-inf`` in the ``logits`` array
    (in-place mutation), so the sampler can never select end-of-sequence —
    used to force generation to keep going. Intended to be bound with
    ``functools.partial(ban_eos_logits_processor, eos_token)`` and passed
    to a ``LogitsProcessorList``.

    NOTE(review): the scraped diff is truncated right after the assignment
    below. llama-cpp-python's LogitsProcessor protocol expects the
    processor to return the (modified) logits, so a trailing
    ``return logits`` presumably follows in the full file — confirm
    against the complete source before relying on this view.
    """
    logits[eos_token] = -float('inf')
|
||||
|
|
Loading…
Add table
Add a link
Reference in a new issue