from logging import getLogger
from os import path
from typing import Dict, Optional, Tuple

import onnx
import torch
from diffusers import AutoencoderKL, StableDiffusionXLPipeline
from onnx.shape_inference import infer_shapes_path
from onnxruntime.transformers.float16 import convert_float_to_float16
from optimum.exporters.onnx import main_export

from ...constants import ONNX_MODEL
from ..client import fetch_model
from ..utils import RESOLVE_FORMATS, ConversionContext, check_ext

logger = getLogger(__name__)


@torch.no_grad()
def convert_diffusion_diffusers_xl(
    conversion: ConversionContext,
    model: Dict,
    format: Optional[str],
) -> Tuple[bool, str]:
    """
    From https://github.com/huggingface/diffusers/blob/main/scripts/convert_stable_diffusion_checkpoint_to_onnx.py
    """
    name = str(model.get("name")).strip()
    source = model.get("source")
    replace_vae = model.get("vae", None)
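    # export device and torch dtype come from the conversion context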
    device = conversion.training_device
    dtype = conversion.torch_dtype()
    logger.debug("using Torch dtype %s for pipeline", dtype)

    dest_path = path.join(conversion.model_path, name)
    model_index = path.join(dest_path, "model_index.json")
    model_hash = path.join(dest_path, "hash.txt")

    # diffusers go into a directory rather than .onnx file
    logger.info(
        "converting Stable Diffusion XL model %s: %s -> %s/", name, source, dest_path
    )

    if path.exists(dest_path) and path.exists(model_index):
        logger.info("ONNX model already exists, skipping conversion")
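        # backfill the hash file if it is missing from an existing conversion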
        if "hash" in model and not path.exists(model_hash):
            logger.info("ONNX model does not have hash file, adding one")
            with open(model_hash, "w") as f:
                f.write(model["hash"])

        return (False, dest_path)
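    # fetch the source model into the local cache before loading it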
    cache_path = fetch_model(conversion, name, model["source"], format=format)

    # safetensors -> diffusers directory with torch models
    temp_path = path.join(conversion.cache_path, f"{name}-torch")
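    # single-file safetensors checkpoints load with from_single_file, everything else as a diffusers directory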
    if format == "safetensors":
        pipeline = StableDiffusionXLPipeline.from_single_file(
            cache_path, use_safetensors=True
        )
    else:
        pipeline = StableDiffusionXLPipeline.from_pretrained(cache_path)
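    # optionally replace the VAE, from a single tensor file or a pretrained path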
    if replace_vae is not None:
        vae_path = path.join(conversion.model_path, replace_vae)
        vae_file = check_ext(vae_path, RESOLVE_FORMATS)
        if vae_file[0]:
            logger.debug("loading VAE from single tensor file: %s", vae_path)
            pipeline.vae = AutoencoderKL.from_single_file(vae_path)
        else:
            logger.debug("loading pretrained VAE from path: %s", replace_vae)
            pipeline.vae = AutoencoderKL.from_pretrained(replace_vae)
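    # reuse the cached torch export if it exists, otherwise save the pipeline to disk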
    if path.exists(temp_path):
        logger.debug("torch model already exists for %s: %s", source, temp_path)
    else:
        logger.debug("exporting torch model for %s: %s", source, temp_path)
        pipeline.save_pretrained(temp_path)

    # directory -> onnx using optimum exporters
    main_export(
        temp_path,
        output=dest_path,
        task="stable-diffusion-xl",
        device=device,
        fp16=conversion.has_optimization(
            "torch-fp16"
        ),  # optimum's fp16 mode only works on CUDA or ROCm
        framework="pt",
    )
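    # record the source hash alongside the converted model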
    if "hash" in model:
        logger.debug("adding hash file to ONNX model")
        with open(model_hash, "w") as f:
            f.write(model["hash"])
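    # when half precision is requested, convert the exported UNet weights to fp16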
    if conversion.half:
        unet_path = path.join(dest_path, "unet", ONNX_MODEL)
        infer_shapes_path(unet_path)
        unet = onnx.load(unet_path)
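        # keep graph inputs/outputs and attention ops in fp32 to limit fp16 precision loss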
        opt_model = convert_float_to_float16(
            unet,
            disable_shape_infer=True,
            force_fp16_initializers=True,
            keep_io_types=True,
            op_block_list=["Attention", "MultiHeadAttention"],
        )
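        # save the fp16 UNet with its weights in a single external data file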
        onnx.save_model(
            opt_model,
            unet_path,
            save_as_external_data=True,
            all_tensors_to_one_file=True,
            location="weights.pb",
        )
    return False, dest_path