From 8193d18c7c64affb27221f0ffeadab44867a8030 Mon Sep 17 00:00:00 2001 From: Ettore Di Giacinto Date: Wed, 20 Aug 2025 10:18:55 +0200 Subject: [PATCH] feat(img2img): Add support to Qwen Image Edit (#6113) Signed-off-by: Ettore Di Giacinto --- backend/python/diffusers/backend.py | 5 ++++- gallery/index.yaml | 20 ++++++++++++++++++++ 2 files changed, 24 insertions(+), 1 deletion(-) diff --git a/backend/python/diffusers/backend.py b/backend/python/diffusers/backend.py index 17a71694a..185838209 100755 --- a/backend/python/diffusers/backend.py +++ b/backend/python/diffusers/backend.py @@ -18,7 +18,7 @@ import backend_pb2_grpc import grpc from diffusers import SanaPipeline, StableDiffusion3Pipeline, StableDiffusionXLPipeline, StableDiffusionDepth2ImgPipeline, DPMSolverMultistepScheduler, StableDiffusionPipeline, DiffusionPipeline, \ - EulerAncestralDiscreteScheduler, FluxPipeline, FluxTransformer2DModel + EulerAncestralDiscreteScheduler, FluxPipeline, FluxTransformer2DModel, QwenImageEditPipeline from diffusers import StableDiffusionImg2ImgPipeline, AutoPipelineForText2Image, ControlNetModel, StableVideoDiffusionPipeline, Lumina2Text2ImgPipeline from diffusers.pipelines.stable_diffusion import safety_checker from diffusers.utils import load_image, export_to_video @@ -263,6 +263,9 @@ class BackendServicer(backend_pb2_grpc.BackendServicer): elif request.PipelineType == "DiffusionPipeline": self.pipe = DiffusionPipeline.from_pretrained(request.Model, torch_dtype=torchType) + elif request.PipelineType == "QwenImageEditPipeline": + self.pipe = QwenImageEditPipeline.from_pretrained(request.Model, + torch_dtype=torchType) elif request.PipelineType == "VideoDiffusionPipeline": self.txt2vid = True self.pipe = DiffusionPipeline.from_pretrained(request.Model, diff --git a/gallery/index.yaml b/gallery/index.yaml index 7f64f0f02..2da4ca063 100644 --- a/gallery/index.yaml +++ b/gallery/index.yaml @@ -127,6 +127,26 @@ - text-to-image description: | We are thrilled to release Qwen-Image, an image generation foundation model in the Qwen series that achieves significant advances in complex text rendering and precise image editing. Experiments show strong general capabilities in both image generation and editing, with exceptional performance in text rendering, especially for Chinese. +- !!merge <<: *qwenimage + name: "qwen-image-edit" + url: "github:mudler/LocalAI/gallery/qwen-image.yaml@master" + urls: + - https://huggingface.co/Qwen/Qwen-Image-Edit + icon: https://qianwen-res.oss-cn-beijing.aliyuncs.com/Qwen-Image/qwen_image_logo.png + license: apache-2.0 + tags: + - qwen-image + - gpu + - image-to-image + description: | + Qwen-Image-Edit is a model for image editing, which is based on Qwen-Image. + overrides: + parameters: + model: Qwen/Qwen-Image-Edit + diffusers: + cuda: true + pipeline_type: QwenImageEditPipeline + enable_parameters: num_inference_steps,image - &gptoss name: "gpt-oss-20b" url: "github:mudler/LocalAI/gallery/harmony.yaml@master"