import os import glob from copy import deepcopy import torch from modules import shared, paths, devices, script_callbacks, sd_models vae_ignore_keys = {"model_ema.decay", "model_ema.num_updates"} vae_dict = {} base_vae = None loaded_vae_file = None checkpoint_info = None vae_path = os.path.abspath(os.path.join(paths.models_path, 'VAE')) def get_base_vae(model): if base_vae is not None and checkpoint_info == model.sd_checkpoint_info and model: return base_vae return None def store_base_vae(model): global base_vae, checkpoint_info # pylint: disable=global-statement if checkpoint_info != model.sd_checkpoint_info: assert not loaded_vae_file, "Trying to store non-base VAE!" base_vae = deepcopy(model.first_stage_model.state_dict()) checkpoint_info = model.sd_checkpoint_info def delete_base_vae(): global base_vae, checkpoint_info # pylint: disable=global-statement base_vae = None checkpoint_info = None def restore_base_vae(model): global loaded_vae_file # pylint: disable=global-statement if base_vae is not None and checkpoint_info == model.sd_checkpoint_info: shared.log.info("Restoring base VAE") _load_vae_dict(model, base_vae) loaded_vae_file = None delete_base_vae() def get_filename(filepath): if filepath.endswith(".json"): return os.path.basename(os.path.dirname(filepath)) else: return os.path.basename(filepath) def refresh_vae_list(): global vae_path # pylint: disable=global-statement vae_path = shared.opts.vae_dir vae_dict.clear() vae_paths = [] if not shared.native: if sd_models.model_path is not None and os.path.isdir(sd_models.model_path): vae_paths += [ os.path.join(sd_models.model_path, 'VAE', '**/*.vae.ckpt'), os.path.join(sd_models.model_path, 'VAE', '**/*.vae.pt'), os.path.join(sd_models.model_path, 'VAE', '**/*.vae.safetensors'), ] if shared.opts.ckpt_dir is not None and os.path.isdir(shared.opts.ckpt_dir): vae_paths += [ os.path.join(shared.opts.ckpt_dir, '**/*.vae.ckpt'), os.path.join(shared.opts.ckpt_dir, '**/*.vae.pt'), os.path.join(shared.opts.ckpt_dir, '**/*.vae.safetensors'), ] if shared.opts.vae_dir is not None and os.path.isdir(shared.opts.vae_dir): vae_paths += [ os.path.join(shared.opts.vae_dir, '**/*.ckpt'), os.path.join(shared.opts.vae_dir, '**/*.pt'), os.path.join(shared.opts.vae_dir, '**/*.safetensors'), ] elif shared.native: if sd_models.model_path is not None and os.path.isdir(sd_models.model_path): vae_paths += [os.path.join(sd_models.model_path, 'VAE', '**/*.vae.safetensors')] if shared.opts.ckpt_dir is not None and os.path.isdir(shared.opts.ckpt_dir): vae_paths += [os.path.join(shared.opts.ckpt_dir, '**/*.vae.safetensors')] if shared.opts.vae_dir is not None and os.path.isdir(shared.opts.vae_dir): vae_paths += [os.path.join(shared.opts.vae_dir, '**/*.safetensors')] vae_paths += [ os.path.join(sd_models.model_path, 'VAE', '**/*.json'), os.path.join(shared.opts.vae_dir, '**/*.json'), ] candidates = [] for path in vae_paths: candidates += glob.iglob(path, recursive=True) candidates = [os.path.abspath(path) for path in candidates] for filepath in candidates: name = get_filename(filepath) if name == 'VAE': continue if not shared.native: vae_dict[name] = filepath else: if filepath.endswith(".json"): vae_dict[name] = os.path.dirname(filepath) else: vae_dict[name] = filepath shared.log.info(f'Available VAEs: path="{vae_path}" items={len(vae_dict)}') return vae_dict def find_vae_near_checkpoint(checkpoint_file): checkpoint_path = os.path.splitext(checkpoint_file)[0] for vae_location in [f"{checkpoint_path}.vae.pt", f"{checkpoint_path}.vae.ckpt", f"{checkpoint_path}.vae.safetensors"]: if os.path.isfile(vae_location): return vae_location return None def resolve_vae(checkpoint_file): if shared.opts.sd_vae == 'TAESD': return None, None if shared.cmd_opts.vae is not None: # 1st return shared.cmd_opts.vae, 'forced' if shared.opts.sd_vae == "None": # 2nd return None, None vae_near_checkpoint = find_vae_near_checkpoint(checkpoint_file) if vae_near_checkpoint is not None: # 3rd return vae_near_checkpoint, 'near-checkpoint' if shared.opts.sd_vae == "Automatic": # 4th basename = os.path.splitext(os.path.basename(checkpoint_file))[0] if vae_dict.get(basename, None) is not None: return vae_dict[basename], 'automatic' else: vae_from_options = vae_dict.get(shared.opts.sd_vae, None) # 5th if vae_from_options is not None: return vae_from_options, 'settings' vae_from_options = vae_dict.get(shared.opts.sd_vae + '.safetensors', None) # 6th if vae_from_options is not None: return vae_from_options, 'settings' shared.log.warning(f"VAE not found: {shared.opts.sd_vae}") return None, None def load_vae_dict(filename): vae_ckpt = sd_models.read_state_dict(filename) vae_dict_1 = {k: v for k, v in vae_ckpt.items() if k[0:4] != "loss" and k not in vae_ignore_keys} return vae_dict_1 def load_vae(model, vae_file=None, vae_source="unknown-source"): global loaded_vae_file # pylint: disable=global-statement if vae_file: try: if not os.path.isfile(vae_file): shared.log.error(f"VAE not found: model={vae_file} source={vae_source}") return store_base_vae(model) vae_dict_1 = load_vae_dict(vae_file) _load_vae_dict(model, vae_dict_1) except Exception as e: shared.log.error(f"Loading VAE failed: model={vae_file} source={vae_source} {e}") restore_base_vae(model) vae_opt = get_filename(vae_file) if vae_opt not in vae_dict: vae_dict[vae_opt] = vae_file elif loaded_vae_file: restore_base_vae(model) loaded_vae_file = vae_file def apply_vae_config(model_file, vae_file, sd_model): def get_vae_config(): config_file = os.path.join(paths.sd_configs_path, os.path.splitext(os.path.basename(model_file))[0] + '_vae.json') if config_file is not None and os.path.exists(config_file): return shared.readfile(config_file) config_file = os.path.join(paths.sd_configs_path, os.path.splitext(os.path.basename(vae_file))[0] + '.json') if vae_file else None if config_file is not None and os.path.exists(config_file): return shared.readfile(config_file) config_file = os.path.join(paths.sd_configs_path, shared.sd_model_type, 'vae', 'config.json') if config_file is not None and os.path.exists(config_file): return shared.readfile(config_file) return {} if hasattr(sd_model, 'vae') and hasattr(sd_model.vae, 'config'): config = get_vae_config() for k, v in config.items(): if k in sd_model.vae.config and not k.startswith('_'): sd_model.vae.config[k] = v def load_vae_diffusers(model_file, vae_file=None, vae_source="unknown-source"): if vae_file is None: return None if not os.path.exists(vae_file): shared.log.error(f'VAE not found: model{vae_file}') return None shared.log.info(f"Loading VAE: model={vae_file} source={vae_source}") diffusers_load_config = { "low_cpu_mem_usage": False, "torch_dtype": devices.dtype_vae, "use_safetensors": True, } if shared.opts.diffusers_vae_load_variant == 'default': if devices.dtype_vae == torch.float16: diffusers_load_config['variant'] = 'fp16' elif shared.opts.diffusers_vae_load_variant == 'fp32': pass else: diffusers_load_config['variant'] = shared.opts.diffusers_vae_load_variant if shared.opts.diffusers_vae_upcast != 'default': diffusers_load_config['force_upcast'] = True if shared.opts.diffusers_vae_upcast == 'true' else False shared.log.debug(f'Diffusers VAE load config: {diffusers_load_config}') try: import diffusers if os.path.isfile(vae_file): _pipeline, model_type = sd_models.detect_pipeline(model_file, 'vae') diffusers_load_config = { "config_file": paths.sd_default_config if model_type != 'Stable Diffusion XL' else os.path.join(paths.sd_configs_path, 'sd_xl_base.yaml')} if os.path.getsize(vae_file) > 1310944880: vae = diffusers.ConsistencyDecoderVAE.from_pretrained('openai/consistency-decoder', **diffusers_load_config) # consistency decoder does not have from single file, so we'll just download it once more else: vae = diffusers.AutoencoderKL.from_single_file(vae_file, **diffusers_load_config) if getattr(vae.config, 'scaling_factor', 0) == 0.18125 and shared.sd_model_type == 'sdxl': vae.config.scaling_factor = 0.13025 shared.log.debug('Diffusers VAE: fix scaling factor') vae = vae.to(devices.dtype_vae) else: if 'consistency-decoder' in vae_file: vae = diffusers.ConsistencyDecoderVAE.from_pretrained(vae_file, **diffusers_load_config) else: vae = diffusers.AutoencoderKL.from_pretrained(vae_file, **diffusers_load_config) global loaded_vae_file # pylint: disable=global-statement loaded_vae_file = os.path.basename(vae_file) # shared.log.debug(f'Diffusers VAE config: {vae.config}') return vae except Exception as e: shared.log.error(f"Loading VAE failed: model={vae_file} {e}") return None # don't call this from outside def _load_vae_dict(model, vae_dict_1): model.first_stage_model.load_state_dict(vae_dict_1) model.first_stage_model.to(devices.dtype_vae) def clear_loaded_vae(): global loaded_vae_file # pylint: disable=global-statement loaded_vae_file = None unspecified = object() def reload_vae_weights(sd_model=None, vae_file=unspecified): from modules import lowvram, sd_hijack if not sd_model: sd_model = shared.sd_model if sd_model is None: return None global checkpoint_info # pylint: disable=global-statement checkpoint_info = sd_model.sd_checkpoint_info checkpoint_file = checkpoint_info.filename if vae_file == unspecified: vae_file, vae_source = resolve_vae(checkpoint_file) else: vae_source = "function-argument" if vae_file is None or vae_file == 'None': if hasattr(sd_model, 'original_vae'): sd_models.set_diffuser_options(sd_model, vae=sd_model.original_vae, op='vae') shared.log.info("VAE restored") return None if loaded_vae_file == vae_file: return None if not shared.native and (shared.cmd_opts.lowvram or shared.cmd_opts.medvram): lowvram.send_everything_to_cpu() # else: # sd_models.move_model(sd_model, devices.cpu) if not shared.native: sd_hijack.model_hijack.undo_hijack(sd_model) if shared.cmd_opts.rollback_vae and devices.dtype_vae == torch.bfloat16: devices.dtype_vae = torch.float16 load_vae(sd_model, vae_file, vae_source) sd_hijack.model_hijack.hijack(sd_model) script_callbacks.model_loaded_callback(sd_model) if vae_file is not None: shared.log.info(f"VAE weights loaded: {vae_file}") else: if hasattr(sd_model, "vae") and hasattr(sd_model, "sd_checkpoint_info"): vae = load_vae_diffusers(sd_model.sd_checkpoint_info.filename, vae_file, vae_source) if vae is not None: if not hasattr(sd_model, 'original_vae'): sd_model.original_vae = sd_model.vae sd_models.move_model(sd_model.original_vae, devices.cpu) sd_models.set_diffuser_options(sd_model, vae=vae, op='vae') apply_vae_config(sd_model.sd_checkpoint_info.filename, vae_file, sd_model) if not shared.cmd_opts.lowvram and not shared.cmd_opts.medvram: sd_models.move_model(sd_model, devices.device) return sd_model