Added shuffeling to prompts

2026-01-26 16:39:47 +00:00 · 2023-08-19 07:57:30 -06:00
parent 90eedb78bf
commit c6675e2801
4 changed files with 59 additions and 6 deletions
--- a/config/examples/train_slider.example.yml
+++ b/config/examples/train_slider.example.yml
@@ -184,6 +184,10 @@ config:
            # if you are doing more than one target it may be good to set less important ones
            # to a lower number like 0.1 so they don't outweigh the primary target
            weight: 1.0
            # shuffle the prompts split by the comma. We will run every combination randomly
            # this will make the LoRA more robust. You probably want this on unless prompt order
            # is important for some reason
            shuffle: true
        # anchors are prompts that we will try to hold on to while training the slider
--- a/jobs/process/TrainSliderProcess.py
+++ b/jobs/process/TrainSliderProcess.py
@@ -86,6 +86,9 @@ class TrainSliderProcess(BaseSDTrainProcess):
            # remove duplicates
            prompts_to_cache = list(dict.fromkeys(prompts_to_cache))
            # trim to max steps if max steps is lower than prompt count
            prompts_to_cache = prompts_to_cache[:self.train_config.steps]
            # encode them
            cache = encode_prompts_to_cache(
                prompt_list=prompts_to_cache,
--- a/toolkit/config_modules.py
+++ b/toolkit/config_modules.py
@@ -4,6 +4,7 @@ from typing import List, Optional
 import random
 class SaveConfig:
    def __init__(self, **kwargs):
        self.save_every: int = kwargs.get('save_every', 1000)
@@ -93,6 +94,7 @@ class SliderTargetConfig:
        self.negative: str = kwargs.get('negative', '')
        self.multiplier: float = kwargs.get('multiplier', 1.0)
        self.weight: float = kwargs.get('weight', 1.0)
        self.shuffle: bool = kwargs.get('shuffle', False)
 class SliderConfigAnchors:
@@ -105,8 +107,6 @@ class SliderConfigAnchors:
 class SliderConfig:
    def __init__(self, **kwargs):
        targets = kwargs.get('targets', [])
        targets = [SliderTargetConfig(**target) for target in targets]
        self.targets: List[SliderTargetConfig] = targets
        anchors = kwargs.get('anchors', [])
        anchors = [SliderConfigAnchors(**anchor) for anchor in anchors]
        self.anchors: List[SliderConfigAnchors] = anchors
@@ -115,6 +115,18 @@ class SliderConfig:
        self.prompt_tensors: str = kwargs.get('prompt_tensors', None)
        self.batch_full_slide: bool = kwargs.get('batch_full_slide', True)
        # expand targets if shuffling
        from toolkit.prompt_utils import get_slider_target_permutations
        self.targets: List[SliderTargetConfig] = []
        targets = [SliderTargetConfig(**target) for target in targets]
        # do permutations if shuffle is true
        for target in targets:
            if target.shuffle:
                target_permutations = get_slider_target_permutations(target)
                self.targets = self.targets + target_permutations
            else:
                self.targets.append(target)
 class GenerateImageConfig:
    def __init__(
--- a/toolkit/prompt_utils.py
+++ b/toolkit/prompt_utils.py
@@ -7,6 +7,10 @@ from tqdm import tqdm
 from toolkit.stable_diffusion_model import PromptEmbeds
 from toolkit.train_tools import get_torch_dtype
 import itertools
 if TYPE_CHECKING:
    from toolkit.config_modules import SliderTargetConfig
 class ACTION_TYPES_SLIDER:
@@ -226,6 +230,40 @@ def split_anchors(concatenated: EncodedAnchor, num_anchors: int = 4) -> List[Enc
    return anchors
 def get_permutations(s):
    # Split the string by comma
    phrases = [phrase.strip() for phrase in s.split(',')]
    # remove empty strings
    phrases = [phrase for phrase in phrases if len(phrase) > 0]
    # Get all permutations
    permutations = list(itertools.permutations(phrases))
    # Convert the tuples back to comma separated strings
    return [', '.join(permutation) for permutation in permutations]
 def get_slider_target_permutations(target: 'SliderTargetConfig') -> List['SliderTargetConfig']:
    from toolkit.config_modules import SliderTargetConfig
    pos_permutations = get_permutations(target.positive)
    neg_permutations = get_permutations(target.negative)
    permutations = []
    for pos, neg in itertools.product(pos_permutations, neg_permutations):
        permutations.append(
            SliderTargetConfig(
                target_class=target.target_class,
                positive=pos,
                negative=neg,
                multiplier=target.multiplier,
                weight=target.weight
            )
        )
    return permutations
 if TYPE_CHECKING:
    from toolkit.stable_diffusion_model import StableDiffusion
@@ -291,10 +329,6 @@ def encode_prompts_to_cache(
    return cache
 if TYPE_CHECKING:
    from toolkit.config_modules import SliderTargetConfig
@torch.no_grad()
 def build_prompt_pair_batch_from_cache(
        cache: PromptEmbedsCache,