Make colab functional for llama.cpp
- Download only Q4_K_M for GGUF repositories by default
- Use maximum n-gpu-layers by default
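The second bullet is presumably implemented in the other changed file (the Colab notebook side, not shown in the hunk below). For context, a minimal sketch of what "maximum n-gpu-layers" means when loading a GGUF model through the llama-cpp-python binding; the model path is illustrative:

from llama_cpp import Llama

# n_gpu_layers=-1 asks llama.cpp to offload every layer to the GPU;
# any value >= the model's layer count has the same effect.
llm = Llama(
    model_path='models/llama-2-7b.Q4_K_M.gguf',  # illustrative path
    n_gpu_layers=-1,
)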
parent 994502d41b
commit 613feca23b
2 changed files with 6 additions and 1 deletion
@@ -128,6 +128,11 @@ class ModelDownloader:
                 if classifications[i] in ['pytorch', 'pt']:
                     links.pop(i)
 
+        if has_gguf and specific_file is None:
+            for i in range(len(classifications) - 1, -1, -1):
+                if 'q4_k_m' not in links[i].lower():
+                    links.pop(i)
+
         is_llamacpp = has_gguf and specific_file is not None
         return links, sha256, is_lora, is_llamacpp
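For reference, a standalone sketch of the Q4_K_M filter added above. The link list here is illustrative; in ModelDownloader, links is built from the repository's file listing at runtime:

# Keep only the Q4_K_M quantization when a GGUF repo is downloaded
# without a specific file being requested.
links = [
    'llama-2-7b.Q2_K.gguf',
    'llama-2-7b.Q4_K_M.gguf',
    'llama-2-7b.Q8_0.gguf',
]
has_gguf = True
specific_file = None

if has_gguf and specific_file is None:
    # Iterate in reverse so pop(i) does not shift unvisited indices.
    for i in range(len(links) - 1, -1, -1):
        if 'q4_k_m' not in links[i].lower():
            links.pop(i)

print(links)  # ['llama-2-7b.Q4_K_M.gguf']

Iterating backwards makes the in-place pop safe; a forward loop would skip the element that slides into a removed slot.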