add multiple enhancements

- ability to cycle through models and dimensions
- process automatically through invokeai
- create an .md file to display the grid results
Lincoln Stein 2023-02-28 15:10:20 -05:00
parent 2a179799d8
commit 4c61f3a514
2 changed files with 311 additions and 99 deletions

scripts/dynamic_prompts.py (new executable file, 311 lines)

@@ -0,0 +1,311 @@
#!/usr/bin/env python
"""
Simple script to generate a file of InvokeAI prompts and settings
that scan across steps and other parameters.
"""
import re
import pydoc
import shutil
import sys
import argparse
from subprocess import Popen, PIPE
from itertools import product
from io import TextIOBase
from pathlib import Path
from typing import Iterable, List
from omegaconf import OmegaConf, dictconfig, listconfig

def expand_prompts(
    template_file: Path,
    run_invoke: bool = False,
    invoke_model: str = None,
    invoke_outdir: Path = None,
):
    '''
    :param template_file: A YAML file containing templated prompts and args
    :param run_invoke: A boolean which if True will pass expanded prompts to the invokeai CLI
    :param invoke_model: Name of the model to load when run_invoke is true; otherwise uses default
    :param invoke_outdir: Directory for outputs when run_invoke is true; otherwise uses default
    '''
    conf = OmegaConf.load(template_file)
    process = None
    try:
        if run_invoke:
            invokeai_args = [shutil.which('invokeai')]
            if invoke_model:
                invokeai_args.extend(('--model', invoke_model))
            if invoke_outdir:
                invokeai_args.extend(('--outdir', invoke_outdir))
            print(f'Calling invokeai with arguments {invokeai_args}', file=sys.stderr)
            process = Popen(invokeai_args, stdin=PIPE, text=True)
            with process.stdin as fh:
                _do_expand(conf, file=fh)
            process.wait()
        else:
            _do_expand(conf)
    except KeyboardInterrupt:
        # only kill the subprocess if one was actually launched
        if process:
            process.kill()
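
# Usage sketch (the template file name and output directory below are
# hypothetical): expand a template and pipe every generated prompt
# straight into a fresh invokeai process.
#
#   expand_prompts(
#       template_file=Path("my_template.yaml"),
#       run_invoke=True,
#       invoke_outdir=Path("/tmp/outputs"),
#   )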

def main():
    parser = argparse.ArgumentParser(
        description=HELP,
    )
    parser.add_argument(
        'template_file',
        type=Path,
        nargs='?',
        help='path to a template file; use --example to generate an example file'
    )
    parser.add_argument(
        '--example',
        action='store_true',
        default=False,
        help=f'Print an example template file. Use "{sys.argv[0]} --example > example.yaml" to save output to a file'
    )
    parser.add_argument(
        '--instructions',
        '-i',
        dest='instructions',
        action='store_true',
        default=False,
        help='Print verbose instructions.'
    )
    parser.add_argument(
        '--invoke',
        action='store_true',
        help='Execute invokeai using specified optional --model and --outdir'
    )
    parser.add_argument(
        '--model',
        help='Feed the generated prompts to the invokeai CLI using the indicated model. Will be overridden by a model: section in the template file.'
    )
    parser.add_argument(
        '--outdir',
        type=Path,
        help='Write images and log into the indicated directory'
    )
    opt = parser.parse_args()

    if opt.example:
        print(EXAMPLE_TEMPLATE_FILE)
        sys.exit(0)

    if opt.instructions:
        pydoc.pager(INSTRUCTIONS)
        sys.exit(0)

    if not opt.template_file:
        parser.print_help()
        sys.exit(-1)

    expand_prompts(
        template_file=opt.template_file,
        run_invoke=opt.invoke,
        invoke_model=opt.model,
        invoke_outdir=opt.outdir,
    )
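
# Typical command lines, following the options defined above (assuming the
# script is on your PATH; the output locations are illustrative):
#
#   dynamic_prompts.py --example > example.yaml
#   dynamic_prompts.py example.yaml > prompts.txt
#   dynamic_prompts.py --invoke --outdir=/tmp/outputs example.yaml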

def _do_expand(conf: OmegaConf, file: TextIOBase = sys.stdout):
    # fall back to [None] so the cross product still works when the template
    # has no model: section; the !switch line is skipped in that case
    models = expand_values(conf.get("model")) or [None]
    steps = expand_values(conf.get("steps")) or [30]
    cfgs = expand_values(conf.get("cfg")) or [7.5]
    samplers = expand_values(conf.get("sampler")) or ["ddim"]
    seeds = expand_values(conf.get("seed")) or [0]
    prompts = expand_prompt(conf.get("prompt")) or ["banana sushi"]
    # expand_prompt passes plain strings and lists through unchanged, so it
    # works for WIDTHxHEIGHT dimension strings as well
    dimensions = expand_prompt(conf.get("dimensions")) or ['512x512']
    cross_product = product(*[models, seeds, prompts, samplers, cfgs, steps, dimensions])
    previous_model = None
    for p in cross_product:
        (model, seed, prompt, sampler, cfg, step, dimension) = tuple(p)
        (width, height) = dimension.split('x')
        if model and previous_model != model:
            previous_model = model
            print(f'!switch {model}', file=file)
        print(f'"{prompt}" -S{seed} -A{sampler} -C{cfg} -s{step} -W{width} -H{height}', file=file)

def expand_prompt(
    stanza: str | dict | listconfig.ListConfig | dictconfig.DictConfig,
) -> list | range:
    if not stanza:
        return None
    if isinstance(stanza, listconfig.ListConfig):
        return stanza
    if isinstance(stanza, str):
        return [stanza]
    if not isinstance(stanza, dictconfig.DictConfig):
        raise ValueError(f"Unrecognized template: {stanza}")
    if not (template := stanza.get("template")):
        raise KeyError('"prompt" section must contain a "template" definition')
    fragment_labels = re.findall("{([^{}]+?)}", template)
    if len(fragment_labels) == 0:
        return [template]
    fragments = [[{x: y} for y in stanza.get(x)] for x in fragment_labels]
    dicts = merge(product(*fragments))
    return [template.format(**x) for x in dicts]
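
# For example, an OmegaConf mapping equivalent to
#
#   template: a {subject} in the style of {style}
#   subject: [meadow, storm]
#   style: [renoir]
#
# expands to ["a meadow in the style of renoir",
#             "a storm in the style of renoir"]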

def merge(dicts: Iterable) -> List[dict]:
    result = list()
    for x in dicts:
        to_merge = dict()
        for item in x:
            to_merge = to_merge | item
        result.append(to_merge)
    return result
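
# merge() flattens each tuple of single-key dicts that product() yields
# into one dict, e.g.
#
#   merge([({"style": "renoir"}, {"subject": "meadow"})])
#   -> [{"style": "renoir", "subject": "meadow"}]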

def expand_values(stanza: str | dict | listconfig.ListConfig) -> list | range:
    if not stanza:
        return None
    if isinstance(stanza, listconfig.ListConfig):
        return stanza
    elif match := re.match(r"^(\d+);(\d+)(;(\d+))?", str(stanza)):
        # default the step to 1 before converting: int(match.group(4)) would
        # raise TypeError when the optional ";step" part is omitted
        return range(int(match.group(1)), 1 + int(match.group(2)), int(match.group(4) or 1))
    else:
        return [stanza]
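
# Examples of the three cases handled above:
#
#   expand_values("30;50;10")   -> range(30, 51, 10), i.e. 30, 40, 50
#   expand_values("k_lms")      -> ["k_lms"]
#   expand_values(a YAML list)  -> the list unchanged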

HELP = """
This script takes a prompt template file that contains multiple
alternative values for the prompt and its generation arguments (such
as steps). It then expands out the prompts using all combinations of
arguments and either prints them to the terminal's standard output, or
feeds the prompts directly to the invokeai command-line interface.

Call this script again with --instructions (-i) for verbose instructions.
"""

INSTRUCTIONS = f"""
== INTRODUCTION ==
This script takes a prompt template file that contains multiple
alternative values for the prompt and its generation arguments (such
as steps). It then expands out the prompts using all combinations of
arguments and either prints them to the terminal's standard output, or
feeds the prompts directly to the invokeai command-line interface.

If the optional --invoke argument is provided, then the generated
prompts will be fed directly to invokeai for image generation. You
will likely want to add the --outdir option in order to save the image
files to their own folder.

   {sys.argv[0]} --invoke --outdir=/tmp/outputs my_template.yaml

If --invoke isn't specified, the expanded prompts will be printed to
standard output. You can capture them to a file for inspection and
editing this way:

   {sys.argv[0]} my_template.yaml > prompts.txt

And then feed them to invokeai this way:

   invokeai --outdir=/tmp/outputs < prompts.txt

Note that after invokeai finishes processing the list of prompts, the
output directory will contain a markdown file named `log.md`
containing annotated images. You can open this file using an e-book
reader such as the cross-platform Calibre eBook reader
(https://calibre-ebook.com/).

== FORMAT OF THE TEMPLATES FILE ==
This will generate an example template file that you can get
started with:

   {sys.argv[0]} --example > example.yaml

An excerpt from the top of this file looks like this:

   model:
     - stable-diffusion-1.5
     - stable-diffusion-2.1-base
   steps: 30;50;1  # start steps at 30 and go up to 50, incrementing by 1 each time
   seed: 50        # fixed constant, seed=50
   cfg:            # list of CFG values to try
     - 7
     - 8
     - 12
   prompt: a walk in the park  # constant value

In more detail, the template file can have any of the
following sections:
   - model:
   - dimensions:
   - steps:
   - seed:
   - cfg:
   - sampler:
   - prompt:

- Each section can have a constant value such as this:
     steps: 50

- Or a range of numeric values in the format:
     steps: <start>;<stop>;<step>  (note semicolon, not colon!)

- Or a list of values in the format:
     - value1
     - value2
     - value3

The "prompt:" section is special. It can accept a constant value:

   prompt: a walk in the woods in the style of donatello

Or it can accept a list of prompts:

   prompt:
     - a walk in the woods
     - a walk on the beach

Or it can accept a templated list of prompts. These allow you to
define a series of phrases, each of which is a list. You then combine
them together into a prompt template in this way:

   prompt:
     style:
       - greg rutkowski
       - gustav klimt
       - renoir
       - donatello
     subject:
       - sunny meadow in the mountains
       - gathering storm in the mountains
     template: a {{subject}} in the style of {{style}}

In the example above, the phrase names "style" and "subject" are
examples only. You can use whatever you like. However, the "template:"
field is required. The output will be:

   "a sunny meadow in the mountains in the style of greg rutkowski"
   "a sunny meadow in the mountains in the style of gustav klimt"
   ...
   "a gathering storm in the mountains in the style of donatello"
"""

EXAMPLE_TEMPLATE_FILE = """
model: stable-diffusion-1.5
steps: 30;50;10
seed: 50
dimensions: 512x512
cfg:
  - 7
  - 12
sampler:
  - k_euler_a
  - k_lms
prompt:
  style:
    - greg rutkowski
    - gustav klimt
  location:
    - the mountains
    - a desert
  object:
    - luxurious dwelling
    - crude tent
  template: a {object} in {location}, in the style of {style}
"""

if __name__ == "__main__":
    main()

generate_param_scan.py (deleted file)

@@ -1,99 +0,0 @@
#!/usr/bin/env python
'''
Simple script to generate a file of InvokeAI prompts and settings
that scan across steps and other parameters.
'''
from omegaconf import OmegaConf, listconfig
import re
import sys

INSTRUCTIONS = '''
To use, create a file named "template.yaml" (or similar) formatted like this:

>>> cut here <<<
steps: "30:50:1"
seed: 50
cfg:
  - 7
  - 8
  - 12
sampler:
  - ddim
  - k_lms
prompt:
  - a sunny meadow in the mountains
  - a gathering storm in the mountains
>>> cut here <<<

Create sections named "steps", "seed", "cfg", "sampler" and "prompt".

- Each section can have a constant value such as this:
     steps: 50

- Or a range of numeric values in the format:
     steps: "<start>:<stop>:<step>"

- Or a list of values in the format:
     - value1
     - value2
     - value3

Be careful to: 1) put quotation marks around numeric ranges; 2) put a
space between the "-" and the value in a list of values; and 3) use spaces,
not tabs, at the beginnings of indented lines.

When you run this script, capture the output into a text file like this:

    python generate_param_scan.py template.yaml > output_prompts.txt

"output_prompts.txt" will now contain an expansion of all the list
values you provided. You can examine it in a text editor such as
Notepad.

Now start the CLI, and feed the expanded prompt file to it using the
"!replay" command:

    !replay output_prompts.txt

Alternatively, you can directly feed the output of this script
by issuing a command like this from the developer's console:

    python generate_param_scan.py template.yaml | invokeai

You can use the web interface to view the resulting images and their
metadata.
'''

def main():
    if len(sys.argv) < 2:
        print(f'Usage: {__file__} template_file.yaml')
        print('Outputs a series of prompts expanded from the provided template.')
        print(INSTRUCTIONS)
        sys.exit(-1)

    conf_file = sys.argv[1]
    conf = OmegaConf.load(conf_file)
    steps = expand_values(conf.get('steps')) or [30]
    cfg = expand_values(conf.get('cfg')) or [7.5]
    sampler = expand_values(conf.get('sampler')) or ['ddim']
    prompt = expand_values(conf.get('prompt')) or ['banana sushi']
    seed = expand_values(conf.get('seed'))
    for seed in seed:
        for p in prompt:
            for s in sampler:
                for c in cfg:
                    for step in steps:
                        print(f'"{p}" -s{step} {f"-S{seed}" if seed else ""} -A{s} -C{c}')

def expand_values(stanza: str | dict | listconfig.ListConfig) -> list | range:
    if not stanza:
        return None
    if isinstance(stanza, listconfig.ListConfig):
        return stanza
    elif match := re.match('^(\d+):(\d+)(:(\d+))?', str(stanza)):
        return range(int(match.group(1)), int(match.group(2)), int(match.group(4)) or 1)
    else:
        return [stanza]

if __name__ == '__main__':
    main()