Implement CFG for ExLlama_HF (#3666)

2023-08-24 16:27:36 -03:00 · 2023-08-24 16:27:36 -03:00 · d6934bc7bc
commit d6934bc7bc
parent 2b675533f7
8 changed files with 122 additions and 26 deletions
--- a/modules/models_settings.py
+++ b/modules/models_settings.py
@ -91,8 +91,8 @@ def apply_model_settings_to_state(model, state):
        if 'wbits' in model_settings and type(model_settings['wbits']) is int and model_settings['wbits'] > 0:
            loader = 'AutoGPTQ'

-        # If the user is using an alternative GPTQ loader, let them keep using it
-        if not (loader == 'AutoGPTQ' and state['loader'] in ['GPTQ-for-LLaMa', 'ExLlama', 'ExLlama_HF']):
+        # If the user is using an alternative loader for the same model type, let them keep using it
+        if not (loader == 'AutoGPTQ' and state['loader'] in ['GPTQ-for-LLaMa', 'ExLlama', 'ExLlama_HF']) and not (loader == 'llama.cpp' and state['loader'] in ['llamacpp_HF', 'ctransformers']):
            state['loader'] = loader

    for k in model_settings: