AutoAWQ: initial support (#3999)

2023-10-05 16:19:18 +00:00 · 2023-10-05 16:19:18 +00:00 · cc632c3f33
commit cc632c3f33
parent 3f56151f03
8 changed files with 75 additions and 3 deletions
--- a/modules/models_settings.py
+++ b/modules/models_settings.py
@@ -107,10 +107,14 @@ def infer_loader(model_name, model_settings):
        loader = None
    elif (path_to_model / 'quantize_config.json').exists() or ('wbits' in model_settings and type(model_settings['wbits']) is int and model_settings['wbits'] > 0):
        loader = 'AutoGPTQ'
+    elif (path_to_model / 'quant_config.json').exists():
+        loader = 'AutoAWQ'
    elif len(list(path_to_model.glob('*.gguf'))) > 0:
        loader = 'llama.cpp'
    elif re.match(r'.*\.gguf', model_name.lower()):
        loader = 'llama.cpp'
+    elif re.match(r'.*-awq', model_name.lower()):
+        loader = 'AutoAWQ'
    elif re.match(r'.*rwkv.*\.pth', model_name.lower()):
        loader = 'RWKV'
    elif re.match(r'.*exl2', model_name.lower()):