InvokeAI/ldm/invoke/pngwriter.py

"""
Two helper classes for dealing with PNG images and their path names.
PngWriter -- Converts Images generated by T2I into PNGs, finds
             appropriate names for them, and writes prompt metadata
             into the PNG.

Exports function retrieve_metadata(path)
"""
import os
import re
import json
from PIL import PngImagePlugin, Image

# -------------------image generation utils-----


class PngWriter:
    '''
    Writes images into a single output directory as PNG files, embedding
    the prompt (and optional metadata) as PNG text chunks, and hands out
    numeric filename prefixes that are not yet used in that directory.
    '''

    # Filenames of interest look like "<digits>.<anything>.png"; the leading
    # digits are the numeric prefix. Raw string avoids invalid-escape warnings.
    _PREFIX_PATTERN = re.compile(r'^(\d+)\..*\.png')

    def __init__(self, outdir):
        '''
        Remember outdir as the target directory, creating it (and any
        missing parents) if it does not already exist.
        '''
        self.outdir = outdir
        os.makedirs(outdir, exist_ok=True)

    # gives the next unique prefix in outdir
    def unique_prefix(self):
        '''
        Returns the next unused numeric prefix in outdir as a string,
        zero-padded to at least six digits (e.g. "000001" for a directory
        with no matching files).
        '''
        # Compare prefixes numerically. A lexicographic sort ranks
        # "999999" above "1000000" and would hand out a prefix that is
        # already in use once prefixes differ in length.
        highest = 0
        for filename in os.listdir(self.outdir):
            found = self._PREFIX_PATTERN.match(filename)
            if found:
                highest = max(highest, int(found.group(1)))
        return f'{highest + 1:06}'

    # saves image named _image_ to outdir/name, writing metadata from prompt
    # returns full path of output
    def save_image_and_prompt_to_png(self, image, dream_prompt, name, metadata=None, compress_level=6):
        '''
        Saves image as a PNG at outdir/name and returns that full path.

        image          -- object whose save() accepts PNG keyword options
                          (presumably a PIL Image; confirm against callers)
        dream_prompt   -- string stored in the "Dream" text chunk
        name           -- filename, joined onto outdir
        metadata       -- optional JSON-serializable object stored in the
                          "sd-metadata" text chunk; skipped when falsy
        compress_level -- passed through to image.save()
        '''
        path = os.path.join(self.outdir, name)
        info = PngImagePlugin.PngInfo()
        info.add_text('Dream', dream_prompt)
        if metadata:
            info.add_text('sd-metadata', json.dumps(metadata))
        image.save(path, 'PNG', pnginfo=info, compress_level=compress_level)
        return path

    def retrieve_metadata(self,img_basename):
        '''
        Given a PNG filename stored in outdir, returns the "sd-metadata"
        metadata stored there, as a dict
        '''
        path = os.path.join(self.outdir,img_basename)
        # Delegates to the module-level retrieve_metadata(), which returns
        # both the "sd-metadata" and "Dream" entries; only the former is
        # handed back here.
        all_metadata = retrieve_metadata(path)
        return all_metadata['sd-metadata']

def retrieve_metadata(img_path):
    '''
    Given a path to an image, returns a dict with two entries:

    "sd-metadata" -- the JSON-decoded content of the image's "sd-metadata"
                     text chunk, or an empty dict when it is absent
    "Dream"       -- the content of the "Dream" text chunk, or an empty
                     string when it is absent

    Raises whatever json.loads() raises if the stored "sd-metadata" text
    is not valid JSON.
    '''
    # Open as a context manager so the underlying file handle is released
    # as soon as the text chunks have been read.
    with Image.open(img_path) as im:
        if hasattr(im, 'text'):
            md = im.text.get('sd-metadata', '{}')
            dream_prompt = im.text.get('Dream', '')
        else:
            # When trying to retrieve metadata from images without a 'text' payload, such as JPG images.
            md = '{}'
            dream_prompt = ''
    return {'sd-metadata': json.loads(md), 'Dream': dream_prompt}

def write_metadata(img_path:str, meta:dict):
    '''
    Re-saves the image at img_path in place as a PNG whose "sd-metadata"
    text chunk holds the JSON encoding of meta.

    Only the "sd-metadata" chunk is added to the PngInfo passed to save();
    no other text chunk (such as "Dream") is added here.
    '''
    # Context manager guarantees the source file handle is released even if
    # saving fails.
    with Image.open(img_path) as im:
        # Pull the pixel data into memory before the same path is
        # overwritten by save().
        im.load()
        info = PngImagePlugin.PngInfo()
        info.add_text('sd-metadata', json.dumps(meta))
        im.save(img_path,'PNG',pnginfo=info)

class PromptFormatter:
    """Render a prompt and its switches as a single command-line style string."""

    def __init__(self, t2i, opt):
        """Keep the generator object (t2i) and the per-request options (opt)."""
        self.t2i = t2i
        self.opt = opt

    # note: the t2i object should provide all these values.
    # there should be no need to or against opt values
    def normalize_prompt(self):
        """Normalize the prompt and switches

        Returns the quoted prompt followed by space-separated switches.
        For steps, width, height, cfg_scale and sampler_name the value in
        opt wins when it is truthy; otherwise the value from t2i is used.
        The remaining switches are emitted only when their option is set.
        """
        generator, args = self.t2i, self.opt

        # Always-present switches, in their fixed output order.
        parts = [
            f'"{args.prompt}"',
            f'-s{args.steps or generator.steps}',
            f'-W{args.width or generator.width}',
            f'-H{args.height or generator.height}',
            f'-C{args.cfg_scale or generator.cfg_scale}',
            f'-A{args.sampler_name or generator.sampler_name}',
        ]
        # TODO: put model name into the t2i object, then emit
        #       f'--model{t2i.model_name}' here.

        # Optional switches, appended only when requested.
        if args.seamless or generator.seamless:
            parts.append('--seamless')
        if args.init_img:
            parts.append(f'-I{args.init_img}')
        if args.fit:
            parts.append('--fit')
        if args.strength and args.init_img is not None:
            parts.append(f'-f{args.strength or generator.strength}')
        if args.gfpgan_strength:
            parts.append(f'-G{args.gfpgan_strength}')
        if args.upscale:
            upscale_values = ' '.join(map(str, args.upscale))
            parts.append(f'-U {upscale_values}')
        if args.variation_amount > 0:
            parts.append(f'-v{args.variation_amount}')
        if args.with_variations:
            pairs = [f'{seed}:{weight}' for seed, weight in args.with_variations]
            parts.append('-V' + ','.join(pairs))
        return ' '.join(parts)
prettified all the code using "blue" at the urging of @tildebyte 2022-08-26 07:15:42 +00:00			`"""`
moved dream utilities into their own subfolder 2022-08-26 02:49:15 +00:00			`Two helper classes for dealing with PNG images and their path names.`
			`PngWriter -- Converts Images generated by T2I into PNGs, finds`
			`appropriate names for them, and writes prompt metadata`
move make_grid into image_utils 2022-08-31 04:36:38 +00:00			`into the PNG.`
implementation of RFC #266 (#587) * Feature complete for #266 with exception of several small deviations: 1. initial image and model weight hashes use full sha256 hash rather than first 8 digits 2. Initialization parameters for post-processing steps not provided 3. Uses top-level "images" tags for both a single image and a grid of images. This change was suggested in a comment. * Added scripts/sd_metadata.py to retrieve and print metadata from PNG files * New ldm.dream.args.Args class is a namespace like object which holds all defaults and can be modified during exection to hold current settings. * Modified dream.py and server.py to accommodate Args class. 2022-09-16 17:09:04 +00:00
			`Exports function retrieve_metadata(path)`
prettified all the code using "blue" at the urging of @tildebyte 2022-08-26 07:15:42 +00:00			`"""`
first draft at big refactoring; will be broken 2022-08-24 21:52:34 +00:00			`import os`
code is reorganized and mostly functional. Grid needs to be brought back online, as well as naming of img2img variants (currently the variants get written but not logged) 2022-08-24 23:47:59 +00:00			`import re`
implementation of RFC #266 (#587) * Feature complete for #266 with exception of several small deviations: 1. initial image and model weight hashes use full sha256 hash rather than first 8 digits 2. Initialization parameters for post-processing steps not provided 3. Uses top-level "images" tags for both a single image and a grid of images. This change was suggested in a comment. * Added scripts/sd_metadata.py to retrieve and print metadata from PNG files * New ldm.dream.args.Args class is a namespace like object which holds all defaults and can be modified during exection to hold current settings. * Modified dream.py and server.py to accommodate Args class. 2022-09-16 17:09:04 +00:00			`import json`
			`from PIL import PngImagePlugin, Image`
first draft at big refactoring; will be broken 2022-08-24 21:52:34 +00:00
mostly back to full functionality; just missing grid generation code 2022-08-25 04:42:37 +00:00			`# -------------------image generation utils-----`
Optimize and Improve GFPGAN and Real-ESRGAN Pipeline 2022-08-28 20:14:29 +00:00

mostly back to full functionality; just missing grid generation code 2022-08-25 04:42:37 +00:00			`class PngWriter:`
refactor pngwriter 2022-08-31 04:21:04 +00:00			`def __init__(self, outdir):`
prettified all the code using "blue" at the urging of @tildebyte 2022-08-26 07:15:42 +00:00			`self.outdir = outdir`
mostly back to full functionality; just missing grid generation code 2022-08-25 04:42:37 +00:00			`os.makedirs(outdir, exist_ok=True)`

refactor pngwriter 2022-08-31 04:21:04 +00:00			`# gives the next unique prefix in outdir`
			`def unique_prefix(self):`
			`# sort reverse alphabetically until we find max+1`
			`dirlist = sorted(os.listdir(self.outdir), reverse=True)`
			`# find the first filename that matches our pattern or return 000000.0.png`
			`existing_name = next(`
			`(f for f in dirlist if re.match('^(\d+)\..*\.png', f)),`
			`'0000000.0.png',`
			`)`
			`basecount = int(existing_name.split('.', 1)[0]) + 1`
			`return f'{basecount:06}'`
mostly back to full functionality; just missing grid generation code 2022-08-25 04:42:37 +00:00
refactor pngwriter 2022-08-31 04:21:04 +00:00			`# saves image named _image_ to outdir/name, writing metadata from prompt`
			`# returns full path of output`
add option to CLI and pngwriter that allows user to set PNG compression level - In CLI: the argument is --png_compression <0..9> (-z<0..9>) - In API, pass `compress_level` to PngWriter.save_image_and_prompt_to_png() Compression ranges from 0 (no compression) to 9 (maximum compression). Default value is 6 (as specified by Pillow package). This addresses an issue first raised in #652. 2022-10-16 15:50:59 +00:00			`def save_image_and_prompt_to_png(self, image, dream_prompt, name, metadata=None, compress_level=6):`
refactor pngwriter 2022-08-31 04:21:04 +00:00			`path = os.path.join(self.outdir, name)`
mostly back to full functionality; just missing grid generation code 2022-08-25 04:42:37 +00:00			`info = PngImagePlugin.PngInfo()`
implementation of RFC #266 (#587) * Feature complete for #266 with exception of several small deviations: 1. initial image and model weight hashes use full sha256 hash rather than first 8 digits 2. Initialization parameters for post-processing steps not provided 3. Uses top-level "images" tags for both a single image and a grid of images. This change was suggested in a comment. * Added scripts/sd_metadata.py to retrieve and print metadata from PNG files * New ldm.dream.args.Args class is a namespace like object which holds all defaults and can be modified during exection to hold current settings. * Modified dream.py and server.py to accommodate Args class. 2022-09-16 17:09:04 +00:00			`info.add_text('Dream', dream_prompt)`
add outcrop postprocessor 2022-10-03 18:39:58 +00:00			`if metadata:`
fix a few more metadata bugs - facetool and upscale arguments now written into metadata - cleaned up handling of !fetch command 2022-10-21 21:45:15 +00:00			`info.add_text('sd-metadata', json.dumps(metadata))`
add option to CLI and pngwriter that allows user to set PNG compression level - In CLI: the argument is --png_compression <0..9> (-z<0..9>) - In API, pass `compress_level` to PngWriter.save_image_and_prompt_to_png() Compression ranges from 0 (no compression) to 9 (maximum compression). Default value is 6 (as specified by Pillow package). This addresses an issue first raised in #652. 2022-10-16 15:50:59 +00:00			`image.save(path, 'PNG', pnginfo=info, compress_level=compress_level)`
refactor pngwriter 2022-08-31 04:21:04 +00:00			`return path`
feature complete; looks like ready for merge 2022-08-25 21:26:48 +00:00
implementation of RFC #266 (#587) * Feature complete for #266 with exception of several small deviations: 1. initial image and model weight hashes use full sha256 hash rather than first 8 digits 2. Initialization parameters for post-processing steps not provided 3. Uses top-level "images" tags for both a single image and a grid of images. This change was suggested in a comment. * Added scripts/sd_metadata.py to retrieve and print metadata from PNG files * New ldm.dream.args.Args class is a namespace like object which holds all defaults and can be modified during exection to hold current settings. * Modified dream.py and server.py to accommodate Args class. 2022-09-16 17:09:04 +00:00			`def retrieve_metadata(self,img_basename):`
			`'''`
			`Given a PNG filename stored in outdir, returns the "sd-metadata"`
			`metadata stored there, as a dict`
			`'''`
			`path = os.path.join(self.outdir,img_basename)`
Fixes metadata related to new args 2022-09-16 20:16:16 +00:00			`all_metadata = retrieve_metadata(path)`
			`return all_metadata['sd-metadata']`
implementation of RFC #266 (#587) * Feature complete for #266 with exception of several small deviations: 1. initial image and model weight hashes use full sha256 hash rather than first 8 digits 2. Initialization parameters for post-processing steps not provided 3. Uses top-level "images" tags for both a single image and a grid of images. This change was suggested in a comment. * Added scripts/sd_metadata.py to retrieve and print metadata from PNG files * New ldm.dream.args.Args class is a namespace like object which holds all defaults and can be modified during exection to hold current settings. * Modified dream.py and server.py to accommodate Args class. 2022-09-16 17:09:04 +00:00
			`def retrieve_metadata(img_path):`
			`'''`
			`Given a path to a PNG image, returns the "sd-metadata"`
			`metadata stored there, as a dict`
			`'''`
			`im = Image.open(img_path)`
correct bug when trying to enhance JPG images (#1928) This fix was authored by @mebelz and is reissued here to base it on `main`. 2022-12-11 18:48:47 +00:00			`if hasattr(im, 'text'):`
			`md = im.text.get('sd-metadata', '{}')`
			`dream_prompt = im.text.get('Dream', '')`
			`else:`
			`# When trying to retrieve metadata from images without a 'text' payload, such as JPG images.`
			`md = '{}'`
			`dream_prompt = ''`
Fixes metadata related to new args 2022-09-16 20:16:16 +00:00			`return {'sd-metadata': json.loads(md), 'Dream': dream_prompt}`
prettified all the code using "blue" at the urging of @tildebyte 2022-08-26 07:15:42 +00:00
add outcrop postprocessor 2022-10-03 18:39:58 +00:00			`def write_metadata(img_path:str, meta:dict):`
			`im = Image.open(img_path)`
			`info = PngImagePlugin.PngInfo()`
			`info.add_text('sd-metadata', json.dumps(meta))`
			`im.save(img_path,'PNG',pnginfo=info)`
Add back old `dream.py` as `legacy_api.py` This commit "reverts" the new API changes by extracting the old functionality into new files. The work is based on the commit `803a51d5adca7e6e28491fc414fd3937bee7cb79` PngWriter regained PromptFormatter as old server used that. `server_legacy.py` is the old server that `dream.py` used. Finally `legacy_api.py` is what `dream.py` used to be at the mentioned commit. One manually run test has been added in order to be able to test compatibility with the old API, currently just testing that the API endpoint works the same way + the image hash is the same as it used to be before. 2022-10-12 18:05:55 +00:00
			`class PromptFormatter:`
			`def __init__(self, t2i, opt):`
			`self.t2i = t2i`
			`self.opt = opt`

			`# note: the t2i object should provide all these values.`
			`# there should be no need to or against opt values`
			`def normalize_prompt(self):`
			`"""Normalize the prompt and switches"""`
			`t2i = self.t2i`
			`opt = self.opt`

			`switches = list()`
			`switches.append(f'"{opt.prompt}"')`
			`switches.append(f'-s{opt.steps or t2i.steps}')`
			`switches.append(f'-W{opt.width or t2i.width}')`
			`switches.append(f'-H{opt.height or t2i.height}')`
			`switches.append(f'-C{opt.cfg_scale or t2i.cfg_scale}')`
			`switches.append(f'-A{opt.sampler_name or t2i.sampler_name}')`
			`# to do: put model name into the t2i object`
			`# switches.append(f'--model{t2i.model_name}')`
			`if opt.seamless or t2i.seamless:`
			`switches.append(f'--seamless')`
			`if opt.init_img:`
			`switches.append(f'-I{opt.init_img}')`
			`if opt.fit:`
			`switches.append(f'--fit')`
			`if opt.strength and opt.init_img is not None:`
			`switches.append(f'-f{opt.strength or t2i.strength}')`
			`if opt.gfpgan_strength:`
			`switches.append(f'-G{opt.gfpgan_strength}')`
			`if opt.upscale:`
			`switches.append(f'-U {" ".join([str(u) for u in opt.upscale])}')`
			`if opt.variation_amount > 0:`
			`switches.append(f'-v{opt.variation_amount}')`
			`if opt.with_variations:`
			`formatted_variations = ','.join(f'{seed}:{weight}' for seed, weight in opt.with_variations)`
			`switches.append(f'-V{formatted_variations}')`
			`return ' '.join(switches)`