load models to VRAM when using --lowram param

Load models to VRAM instead of RAM (for machines that have more VRAM than RAM, such as the free Google Colab server).
2022-10-13 02:07:49 +08:00 · 2022-10-13 02:07:49 +08:00 · 4a216ded43
commit 4a216ded43
parent a8eeb2b7ad
1 changed files with 13 additions and 2 deletions
--- a/modules/sd_models.py
+++ b/modules/sd_models.py
@@ -134,7 +134,12 @@ def load_model_weights(model, checkpoint_info):
    print(f"Loading weights [{sd_model_hash}] from {checkpoint_file}")
-    pl_sd = torch.load(checkpoint_file, map_location="cpu")
+    if shared.cmd_opts.lowram:
        print("Load to VRAM if GPU is available (low RAM)")
        pl_sd = torch.load(checkpoint_file)
    else:
        pl_sd = torch.load(checkpoint_file, map_location="cpu")
    if "global_step" in pl_sd:
        print(f"Global Step: {pl_sd['global_step']}")
@@ -158,7 +163,13 @@ def load_model_weights(model, checkpoint_info):
    if os.path.exists(vae_file):
        print(f"Loading VAE weights from: {vae_file}")
-        vae_ckpt = torch.load(vae_file, map_location="cpu")
+
        if shared.cmd_opts.lowram:
            print("Load to VRAM if GPU is available (low RAM)")
            vae_ckpt = torch.load(vae_file)
        else:
            vae_ckpt = torch.load(vae_file, map_location="cpu")
        vae_dict = {k: v for k, v in vae_ckpt["state_dict"].items() if k[0:4] != "loss"}
        model.first_stage_model.load_state_dict(vae_dict)