fix(api): avoid loading encoder twice when using LoRAs and inversions together

2023-03-18 13:39:35 -05:00 · 2023-03-18 13:39:35 -05:00 · af326a784f
parent 9f9b73b780
commit af326a784f
1 changed file with 9 additions and 7 deletions
--- a/api/onnx_web/diffusers/load.py
+++ b/api/onnx_web/diffusers/load.py
@@ -236,15 +236,17 @@ def load_pipeline(
                list(zip(inversion_models, inversion_weights, inversion_names)),
            )
            # should be pretty small and should not need external data
            components["text_encoder"] = OnnxRuntimeModel(
                OnnxRuntimeModel.load_model(
                    text_encoder.SerializeToString(),
                    provider=device.ort_provider(),
                )
            )
            components["tokenizer"] = tokenizer
            # should be pretty small and should not need external data
            if loras is None or len(loras) == 0:
                components["text_encoder"] = OnnxRuntimeModel(
                    OnnxRuntimeModel.load_model(
                        text_encoder.SerializeToString(),
                        provider=device.ort_provider(),
                    )
                )
        # test LoRA blending
        if loras is not None and len(loras) > 0:
            lora_names, lora_weights = zip(*loras)