AutoGPTQ: Add --disable_exllamav2 flag (Mixtral CPU offloading needs this)

2023-12-15 06:46:13 -08:00 · 2023-12-15 06:46:13 -08:00 · 3bbf6c601d
commit 3bbf6c601d
parent 7de10f4c8e
7 changed files with 16 additions and 4 deletions
--- a/modules/loaders.py
+++ b/modules/loaders.py
@@ -25,6 +25,7 @@ loaders_and_params = OrderedDict({
        'rope_freq_base',
        'compress_pos_emb',
        'disable_exllama',
+        'disable_exllamav2',
        'transformers_info'
    ],
    'llama.cpp': [
@@ -94,6 +95,7 @@ loaders_and_params = OrderedDict({
        'groupsize',
        'desc_act',
        'disable_exllama',
+        'disable_exllamav2',
        'gpu_memory',
        'cpu_memory',
        'cpu',