Clear cache while switching LoRAs

2023-03-23 21:56:26 -03:00 · 2023-03-23 21:56:26 -03:00 · bf22d16ebc
commit bf22d16ebc
parent 4578e88ffd
3 changed files with 13 additions and 24 deletions
--- a/modules/LoRA.py
+++ b/modules/LoRA.py
@ -2,19 +2,22 @@ from pathlib import Path

 import modules.shared as shared
 from modules.models import load_model
+from modules.text_generation import clear_torch_cache


+def reload_model():
+    shared.model = shared.tokenizer = None
+    clear_torch_cache()
+    shared.model, shared.tokenizer = load_model(shared.model_name)
+
 def add_lora_to_model(lora_name):

    from peft import PeftModel

-    # Is there a more efficient way of returning to the base model?
-    if lora_name == "None":
-        print("Reloading the model to remove the LoRA...")
-        shared.model, shared.tokenizer = load_model(shared.model_name)
-    else:
+    reload_model()
+
+    if lora_name != "None":
        print(f"Adding the LoRA {lora_name} to the model...")
-        
        params = {}
        if not shared.args.cpu:
            params['dtype'] = shared.model.dtype
--- a/modules/callbacks.py
+++ b/modules/callbacks.py
@ -1,11 +1,10 @@
-import gc
 from queue import Queue
 from threading import Thread

 import torch
 import transformers

-import modules.shared as shared
+from modules.text_generation import clear_torch_cache


 # Copied from https://github.com/PygmalionAI/gradio-ui/
@ -90,8 +89,3 @@ class Iteratorize:
    def __exit__(self, exc_type, exc_val, exc_tb):
        self.stop_now = True
        clear_torch_cache()
-
-def clear_torch_cache():
-    gc.collect()
-    if not shared.args.cpu:
-        torch.cuda.empty_cache()