feat(api): add prompt filter stage using GPT2 models
This commit is contained in:
parent
acd9168b32
commit
bc2eeb8503
|
@ -20,6 +20,7 @@ from .source_noise import SourceNoiseStage
|
|||
from .source_s3 import SourceS3Stage
|
||||
from .source_txt2img import SourceTxt2ImgStage
|
||||
from .source_url import SourceURLStage
|
||||
from .text_prompt import TextPromptStage
|
||||
from .upscale_bsrgan import UpscaleBSRGANStage
|
||||
from .upscale_highres import UpscaleHighresStage
|
||||
from .upscale_outpaint import UpscaleOutpaintStage
|
||||
|
@ -52,6 +53,7 @@ CHAIN_STAGES = {
|
|||
"source-s3": SourceS3Stage,
|
||||
"source-txt2img": SourceTxt2ImgStage,
|
||||
"source-url": SourceURLStage,
|
||||
"text-prompt": TextPromptStage,
|
||||
"upscale-bsrgan": UpscaleBSRGANStage,
|
||||
"upscale-highres": UpscaleHighresStage,
|
||||
"upscale-outpaint": UpscaleOutpaintStage,
|
||||
|
|
|
@ -0,0 +1,47 @@
|
|||
from logging import getLogger
|
||||
from random import randint
|
||||
from typing import Optional
|
||||
|
||||
from transformers import pipeline
|
||||
|
||||
from ..params import ImageParams, SizeChart, StageParams
|
||||
from ..server import ServerContext
|
||||
from ..worker import ProgressCallback, WorkerContext
|
||||
from .base import BaseStage
|
||||
from .result import StageResult
|
||||
|
||||
logger = getLogger(__name__)
|
||||
|
||||
|
||||
class TextPromptStage(BaseStage):
    """Chain stage that expands the image prompt using a GPT-2 text-generation model.

    Runs a Hugging Face text-generation pipeline on ``params.prompt`` and
    replaces it in place with the generated text. The image sources are
    passed through unchanged.
    """

    # This stage operates on the prompt text, not on image tiles, so it
    # never needs to be tiled.
    max_tile = SizeChart.max

    def run(
        self,
        worker: WorkerContext,
        server: ServerContext,
        stage: StageParams,
        params: ImageParams,
        sources: StageResult,
        *,
        callback: Optional[ProgressCallback] = None,
        prompt_model: str = "Gustavosta/MagicPrompt-Stable-Diffusion",
        **kwargs,
    ) -> StageResult:
        """Generate an expanded prompt from ``params.prompt``.

        Args:
            prompt_model: Hugging Face model id used for the
                text-generation pipeline.

        Returns:
            The incoming ``sources`` unchanged; only ``params.prompt``
            is mutated as a side effect.
        """
        # Pipeline objects do not implement `.to(...)` (the original
        # `gpt2_pipe.to("cuda")` raises AttributeError); the device must be
        # passed to `pipeline()` itself. Probe for CUDA and fall back to CPU
        # (-1) instead of crashing on CPU-only hosts.
        try:
            import torch

            device = 0 if torch.cuda.is_available() else -1
        except ImportError:
            device = -1

        gpt2_pipe = pipeline(
            "text-generation",
            model=prompt_model,
            tokenizer="gpt2",
            device=device,
        )

        # `prompt_input` rather than `input`: avoid shadowing the builtin.
        prompt_input = params.prompt
        # Random headroom keeps the generated prompts varied between runs.
        max_length = len(prompt_input) + randint(60, 90)
        logger.debug(
            "generating new prompt with max length of %d from input prompt: %s",
            max_length,
            prompt_input,
        )

        result = gpt2_pipe(prompt_input, max_length=max_length, num_return_sequences=1)
        prompt = result[0]["generated_text"].strip()
        logger.debug("replacing prompt with: %s", prompt)

        # Mutate the shared params so downstream stages see the new prompt.
        params.prompt = prompt
        return sources
|
Loading…
Reference in New Issue