add checkpoint cache option to UI for faster model switching

switching time reduced from ~1500ms to ~280ms
2022-10-13 23:00:38 -06:00 · 2022-10-13 23:00:38 -06:00 · e21f01f645
commit e21f01f645
parent 494afccbc1
2 changed files with 33 additions and 22 deletions
--- a/modules/sd_models.py
+++ b/modules/sd_models.py
@@ -1,4 +1,4 @@
-import glob
+import collections
 import os.path
 import sys
 from collections import namedtuple
@@ -15,6 +15,7 @@ model_path = os.path.abspath(os.path.join(models_path, model_dir))

 CheckpointInfo = namedtuple("CheckpointInfo", ['filename', 'title', 'hash', 'model_name', 'config'])
 checkpoints_list = {}
+checkpoints_loaded = collections.OrderedDict()

 try:
    # this silences the annoying "Some weights of the model checkpoint were not used when initializing..." message at start.
@@ -132,6 +133,7 @@ def load_model_weights(model, checkpoint_info):
    checkpoint_file = checkpoint_info.filename
    sd_model_hash = checkpoint_info.hash

+    if checkpoint_info not in checkpoints_loaded:
        print(f"Loading weights [{sd_model_hash}] from {checkpoint_file}")

        pl_sd = torch.load(checkpoint_file, map_location="cpu")
@@ -139,7 +141,6 @@ def load_model_weights(model, checkpoint_info):
            print(f"Global Step: {pl_sd['global_step']}")

        sd = get_state_dict_from_checkpoint(pl_sd)
-
        model.load_state_dict(sd, strict=False)

        if shared.cmd_opts.opt_channelslast:
@@ -165,6 +166,14 @@ def load_model_weights(model, checkpoint_info):

        model.first_stage_model.to(devices.dtype_vae)

+        checkpoints_loaded[checkpoint_info] = model.state_dict().copy()
+        while len(checkpoints_loaded) > shared.opts.sd_checkpoint_cache:
+            checkpoints_loaded.popitem(last=False)  # LRU
+    else:
+        print(f"Loading weights [{sd_model_hash}] from cache")
+        checkpoints_loaded.move_to_end(checkpoint_info)
+        model.load_state_dict(checkpoints_loaded[checkpoint_info])
+
    model.sd_model_hash = sd_model_hash
    model.sd_model_checkpoint = checkpoint_file
    model.sd_checkpoint_info = checkpoint_info
@@ -202,6 +211,7 @@ def reload_model_weights(sd_model, info=None):
        return

    if sd_model.sd_checkpoint_info.config != checkpoint_info.config:
+        checkpoints_loaded.clear()
        shared.sd_model = load_model()
        return shared.sd_model

--- a/modules/shared.py
+++ b/modules/shared.py
@@ -238,6 +238,7 @@ options_templates.update(options_section(('training', "Training"), {

 options_templates.update(options_section(('sd', "Stable Diffusion"), {
    "sd_model_checkpoint": OptionInfo(None, "Stable Diffusion checkpoint", gr.Dropdown, lambda: {"choices": modules.sd_models.checkpoint_tiles()}, refresh=sd_models.list_models),
+    "sd_checkpoint_cache": OptionInfo(0, "Checkpoints to cache in RAM", gr.Slider, {"minimum": 0, "maximum": 10, "step": 1}),
    "sd_hypernetwork": OptionInfo("None", "Hypernetwork", gr.Dropdown, lambda: {"choices": ["None"] + [x for x in hypernetworks.keys()]}, refresh=reload_hypernetworks),
    "sd_hypernetwork_strength": OptionInfo(1.0, "Hypernetwork strength", gr.Slider, {"minimum": 0.0, "maximum": 1.0, "step": 0.001}),
    "img2img_color_correction": OptionInfo(False, "Apply color correction to img2img results to match original colors."),