from io import BytesIO from logging import getLogger from typing import List, Optional from boto3 import Session from PIL import Image from ..params import ImageParams, StageParams from ..server import ServerContext from ..worker import WorkerContext from .stage import BaseStage logger = getLogger(__name__) class SourceS3Stage(BaseStage): def run( self, _job: WorkerContext, _server: ServerContext, _stage: StageParams, _params: ImageParams, _sources: List[Image.Image], *, source_keys: List[str], bucket: str, endpoint_url: Optional[str] = None, profile_name: Optional[str] = None, **kwargs, ) -> List[Image.Image]: session = Session(profile_name=profile_name) s3 = session.client("s3", endpoint_url=endpoint_url) outputs = [] for key in source_keys: try: logger.info("loading image from s3://%s/%s", bucket, key) data = BytesIO() s3.download_fileobj(bucket, key, data) data.seek(0) outputs.append(Image.open(data)) except Exception: logger.exception("error loading image from S3") return outputs