diff options
Diffstat (limited to 'modules')
-rw-r--r-- | modules/cmd_args.py | 4 | ||||
-rw-r--r-- | modules/sd_models.py | 8 |
2 files changed, 12 insertions, 0 deletions
diff --git a/modules/cmd_args.py b/modules/cmd_args.py index 81c0b82a..4314f97b 100644 --- a/modules/cmd_args.py +++ b/modules/cmd_args.py @@ -101,3 +101,7 @@ parser.add_argument("--no-gradio-queue", action='store_true', help="Disables gra parser.add_argument("--skip-version-check", action='store_true', help="Do not check versions of torch and xformers")
parser.add_argument("--no-hashing", action='store_true', help="disable sha256 hashing of checkpoints to help loading performance", default=False)
parser.add_argument("--no-download-sd-model", action='store_true', help="don't download SD1.5 model even if no model is found in --ckpt-dir", default=False)
+
+# token merging / tomesd
+parser.add_argument("--token-merging", action='store_true', help="Provides generation speedup by merging redundant tokens. (compatible with --xformers)", default=False)
+parser.add_argument("--token-merging-ratio", type=float, help="Adjusts ratio of merged to untouched tokens. Range: (0.0-1.0], Defaults to 0.5", default=0.5)
diff --git a/modules/sd_models.py b/modules/sd_models.py index 6ea874df..0b74aa0f 100644 --- a/modules/sd_models.py +++ b/modules/sd_models.py @@ -9,6 +9,7 @@ from omegaconf import OmegaConf from os import mkdir
from urllib import request
import ldm.modules.midas as midas
+import tomesd
from ldm.util import instantiate_from_config
@@ -430,6 +431,13 @@ def load_model(checkpoint_info=None, already_loaded_state_dict=None, time_taken_ try:
with sd_disable_initialization.DisableInitialization(disable_clip=clip_is_included_into_sd):
sd_model = instantiate_from_config(sd_config.model)
+
+ if shared.cmd_opts.token_merging:
+ ratio = shared.cmd_opts.token_merging_ratio
+
+ tomesd.apply_patch(sd_model, ratio=ratio)
+ print(f"Model accelerated using {(ratio * 100)}% token merging via tomesd.")
+ timer.record("token merging")
except Exception as e:
pass
|