2
0

sd_vae.py 6.6 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216
  1. import torch
  2. import safetensors.torch
  3. import os
  4. import collections
  5. from collections import namedtuple
  6. from modules import paths, shared, devices, script_callbacks, sd_models
  7. import glob
  8. from copy import deepcopy
  9. vae_path = os.path.abspath(os.path.join(paths.models_path, "VAE"))
  10. vae_ignore_keys = {"model_ema.decay", "model_ema.num_updates"}
  11. vae_dict = {}
  12. base_vae = None
  13. loaded_vae_file = None
  14. checkpoint_info = None
  15. checkpoints_loaded = collections.OrderedDict()
  16. def get_base_vae(model):
  17. if base_vae is not None and checkpoint_info == model.sd_checkpoint_info and model:
  18. return base_vae
  19. return None
  20. def store_base_vae(model):
  21. global base_vae, checkpoint_info
  22. if checkpoint_info != model.sd_checkpoint_info:
  23. assert not loaded_vae_file, "Trying to store non-base VAE!"
  24. base_vae = deepcopy(model.first_stage_model.state_dict())
  25. checkpoint_info = model.sd_checkpoint_info
  26. def delete_base_vae():
  27. global base_vae, checkpoint_info
  28. base_vae = None
  29. checkpoint_info = None
  30. def restore_base_vae(model):
  31. global loaded_vae_file
  32. if base_vae is not None and checkpoint_info == model.sd_checkpoint_info:
  33. print("Restoring base VAE")
  34. _load_vae_dict(model, base_vae)
  35. loaded_vae_file = None
  36. delete_base_vae()
  37. def get_filename(filepath):
  38. return os.path.basename(filepath)
  39. def refresh_vae_list():
  40. vae_dict.clear()
  41. paths = [
  42. os.path.join(sd_models.model_path, '**/*.vae.ckpt'),
  43. os.path.join(sd_models.model_path, '**/*.vae.pt'),
  44. os.path.join(sd_models.model_path, '**/*.vae.safetensors'),
  45. os.path.join(vae_path, '**/*.ckpt'),
  46. os.path.join(vae_path, '**/*.pt'),
  47. os.path.join(vae_path, '**/*.safetensors'),
  48. ]
  49. if shared.cmd_opts.ckpt_dir is not None and os.path.isdir(shared.cmd_opts.ckpt_dir):
  50. paths += [
  51. os.path.join(shared.cmd_opts.ckpt_dir, '**/*.vae.ckpt'),
  52. os.path.join(shared.cmd_opts.ckpt_dir, '**/*.vae.pt'),
  53. os.path.join(shared.cmd_opts.ckpt_dir, '**/*.vae.safetensors'),
  54. ]
  55. if shared.cmd_opts.vae_dir is not None and os.path.isdir(shared.cmd_opts.vae_dir):
  56. paths += [
  57. os.path.join(shared.cmd_opts.vae_dir, '**/*.ckpt'),
  58. os.path.join(shared.cmd_opts.vae_dir, '**/*.pt'),
  59. os.path.join(shared.cmd_opts.vae_dir, '**/*.safetensors'),
  60. ]
  61. candidates = []
  62. for path in paths:
  63. candidates += glob.iglob(path, recursive=True)
  64. for filepath in candidates:
  65. name = get_filename(filepath)
  66. vae_dict[name] = filepath
  67. def find_vae_near_checkpoint(checkpoint_file):
  68. checkpoint_path = os.path.splitext(checkpoint_file)[0]
  69. for vae_location in [checkpoint_path + ".vae.pt", checkpoint_path + ".vae.ckpt", checkpoint_path + ".vae.safetensors"]:
  70. if os.path.isfile(vae_location):
  71. return vae_location
  72. return None
  73. def resolve_vae(checkpoint_file):
  74. if shared.cmd_opts.vae_path is not None:
  75. return shared.cmd_opts.vae_path, 'from commandline argument'
  76. is_automatic = shared.opts.sd_vae in {"Automatic", "auto"} # "auto" for people with old config
  77. vae_near_checkpoint = find_vae_near_checkpoint(checkpoint_file)
  78. if vae_near_checkpoint is not None and (shared.opts.sd_vae_as_default or is_automatic):
  79. return vae_near_checkpoint, 'found near the checkpoint'
  80. if shared.opts.sd_vae == "None":
  81. return None, None
  82. vae_from_options = vae_dict.get(shared.opts.sd_vae, None)
  83. if vae_from_options is not None:
  84. return vae_from_options, 'specified in settings'
  85. if not is_automatic:
  86. print(f"Couldn't find VAE named {shared.opts.sd_vae}; using None instead")
  87. return None, None
  88. def load_vae_dict(filename, map_location):
  89. vae_ckpt = sd_models.read_state_dict(filename, map_location=map_location)
  90. vae_dict_1 = {k: v for k, v in vae_ckpt.items() if k[0:4] != "loss" and k not in vae_ignore_keys}
  91. return vae_dict_1
  92. def load_vae(model, vae_file=None, vae_source="from unknown source"):
  93. global vae_dict, loaded_vae_file
  94. # save_settings = False
  95. cache_enabled = shared.opts.sd_vae_checkpoint_cache > 0
  96. if vae_file:
  97. if cache_enabled and vae_file in checkpoints_loaded:
  98. # use vae checkpoint cache
  99. print(f"Loading VAE weights {vae_source}: cached {get_filename(vae_file)}")
  100. store_base_vae(model)
  101. _load_vae_dict(model, checkpoints_loaded[vae_file])
  102. else:
  103. assert os.path.isfile(vae_file), f"VAE {vae_source} doesn't exist: {vae_file}"
  104. print(f"Loading VAE weights {vae_source}: {vae_file}")
  105. store_base_vae(model)
  106. vae_dict_1 = load_vae_dict(vae_file, map_location=shared.weight_load_location)
  107. _load_vae_dict(model, vae_dict_1)
  108. if cache_enabled:
  109. # cache newly loaded vae
  110. checkpoints_loaded[vae_file] = vae_dict_1.copy()
  111. # clean up cache if limit is reached
  112. if cache_enabled:
  113. while len(checkpoints_loaded) > shared.opts.sd_vae_checkpoint_cache + 1: # we need to count the current model
  114. checkpoints_loaded.popitem(last=False) # LRU
  115. # If vae used is not in dict, update it
  116. # It will be removed on refresh though
  117. vae_opt = get_filename(vae_file)
  118. if vae_opt not in vae_dict:
  119. vae_dict[vae_opt] = vae_file
  120. elif loaded_vae_file:
  121. restore_base_vae(model)
  122. loaded_vae_file = vae_file
  123. # don't call this from outside
  124. def _load_vae_dict(model, vae_dict_1):
  125. model.first_stage_model.load_state_dict(vae_dict_1)
  126. model.first_stage_model.to(devices.dtype_vae)
  127. def clear_loaded_vae():
  128. global loaded_vae_file
  129. loaded_vae_file = None
  130. unspecified = object()
  131. def reload_vae_weights(sd_model=None, vae_file=unspecified):
  132. from modules import lowvram, devices, sd_hijack
  133. if not sd_model:
  134. sd_model = shared.sd_model
  135. checkpoint_info = sd_model.sd_checkpoint_info
  136. checkpoint_file = checkpoint_info.filename
  137. if vae_file == unspecified:
  138. vae_file, vae_source = resolve_vae(checkpoint_file)
  139. else:
  140. vae_source = "from function argument"
  141. if loaded_vae_file == vae_file:
  142. return
  143. if shared.cmd_opts.lowvram or shared.cmd_opts.medvram:
  144. lowvram.send_everything_to_cpu()
  145. else:
  146. sd_model.to(devices.cpu)
  147. sd_hijack.model_hijack.undo_hijack(sd_model)
  148. load_vae(sd_model, vae_file, vae_source)
  149. sd_hijack.model_hijack.hijack(sd_model)
  150. script_callbacks.model_loaded_callback(sd_model)
  151. if not shared.cmd_opts.lowvram and not shared.cmd_opts.medvram:
  152. sd_model.to(devices.device)
  153. print("VAE weights loaded.")
  154. return sd_model