
Commit 75ad392

QwenImageEdit support
1 parent 8945371 commit 75ad392

File tree

10 files changed: +276 -80 lines


TensorStack.Python/Common/PipelineOptions.cs

Lines changed: 2 additions & 1 deletion

@@ -1,4 +1,5 @@
 using System.Collections.Generic;
+using TensorStack.Common.Tensor;

 namespace TensorStack.Python.Common
 {
@@ -21,6 +22,6 @@ public record PipelineOptions
         public SchedulerType Scheduler { get; set; }
         public SchedulerType[] Schedulers { get; set; }
         public List<LoraOptions> LoraOptions { get; set; }
-
+        public ImageTensor ImageInput { get; set; }
     }
 }

TensorStack.Python/Common/ProcessType.cs

Lines changed: 2 additions & 1 deletion

@@ -3,6 +3,7 @@
     public enum ProcessType
     {
         TextToImage = 0,
-        ImageToImage = 1
+        ImageToImage = 1,
+        ImageEdit = 2
     }
 }

TensorStack.Python/Config/EnvironmentConfig.cs

Lines changed: 81 additions & 0 deletions

@@ -6,5 +6,86 @@ public record EnvironmentConfig
         public string Environment { get; set; }
         public string[] Requirements { get; set; }
         public string Directory { get; set; }
+
+
+        public readonly static EnvironmentConfig DefaultCPU = new()
+        {
+            Environment = "default-cpu",
+            Directory = "PythonRuntime",
+            Requirements =
+            [
+                "torchvision==0.22.0",
+
+                // Default Packages
+                "typing",
+                "wheel",
+                "transformers",
+                "accelerate",
+                "diffusers",
+                "protobuf",
+                "sentencepiece",
+                "pillow",
+                "ftfy",
+                "scipy",
+                "peft",
+                "pillow"
+            ]
+        };
+
+
+        public readonly static EnvironmentConfig DefaultCUDA = new()
+        {
+            Environment = "default-cuda",
+            Directory = "PythonRuntime",
+            Requirements =
+            [
+                "--extra-index-url https://download.pytorch.org/whl/cu118",
+                "torchvision==0.22.0+cu118",
+
+                // Default Packages
+                "typing",
+                "wheel",
+                "transformers",
+                "accelerate",
+                "diffusers",
+                "protobuf",
+                "sentencepiece",
+                "pillow",
+                "ftfy",
+                "scipy",
+                "peft",
+                "pillow"
+            ]
+        };
+
+
+        public readonly static EnvironmentConfig DefaultROCM = new()
+        {
+            Environment = "default-rocm",
+            Directory = "PythonRuntime",
+            Requirements =
+            [
+                "https://repo.radeon.com/rocm/windows/rocm-rel-7.1.1/rocm_sdk_core-0.1.dev0-py3-none-win_amd64.whl",
+                "https://repo.radeon.com/rocm/windows/rocm-rel-7.1.1/rocm_sdk_devel-0.1.dev0-py3-none-win_amd64.whl",
+                "https://repo.radeon.com/rocm/windows/rocm-rel-7.1.1/rocm_sdk_libraries_custom-0.1.dev0-py3-none-win_amd64.whl",
+                "https://repo.radeon.com/rocm/windows/rocm-rel-7.1.1/rocm-0.1.dev0.tar.gz",
+                "https://repo.radeon.com/rocm/windows/rocm-rel-7.1.1/torch-2.9.0+rocmsdk20251116-cp312-cp312-win_amd64.whl",
+                "https://repo.radeon.com/rocm/windows/rocm-rel-7.1.1/torchvision-0.24.0+rocmsdk20251116-cp312-cp312-win_amd64.whl",
+
+                // Default Packages
+                "typing",
+                "wheel",
+                "transformers",
+                "accelerate",
+                "diffusers",
+                "protobuf",
+                "sentencepiece",
+                "pillow",
+                "ftfy",
+                "scipy",
+                "peft",
+                "pillow"
+            ]
+        };
     }
 }
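For orientation: each Requirements array is a flat list of pip arguments, so entries that carry a flag plus a value (the --extra-index-url line, for example) have to be split on whitespace before they reach pip. A minimal Python sketch of that consumption, assuming the list is handed through unchanged; this install helper is hypothetical and not part of the commit:

import subprocess
import sys

# A subset of EnvironmentConfig.DefaultCUDA's Requirements, copied from above.
requirements = [
    "--extra-index-url https://download.pytorch.org/whl/cu118",
    "torchvision==0.22.0+cu118",
    "transformers",
    "diffusers",
]

# Flag entries contain a space ("--extra-index-url <url>") and must be
# split into separate argv items before being handed to pip.
args = [part for entry in requirements for part in entry.split(" ", 1)]

# Install into the current interpreter's environment.
subprocess.run([sys.executable, "-m", "pip", "install", *args], check=True)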

TensorStack.Python/Pipelines/ChromaPipeline.py

Lines changed: 2 additions & 2 deletions

@@ -7,7 +7,7 @@
 from collections.abc import Buffer
 from typing import Coroutine, Dict, Sequence, List, Tuple, Optional
 from diffusers import ChromaPipeline, ChromaImg2ImgPipeline
-from tensorstack.utils import MemoryStdout, create_scheduler, getDataType, createTensor
+from tensorstack.utils import MemoryStdout, create_scheduler, getDataType, imageFromInput
 sys.stderr = MemoryStdout()

 # Globals
@@ -150,7 +150,7 @@ def generate(
         )[0]
     elif _processType == "ImageToImage":
         output = _pipeline(
-            image = createTensor(inputData, inputShape, device=_pipeline.device, dtype=_pipeline.dtype),
+            image = imageFromInput(inputData, inputShape),
             strength = strength,
             prompt = prompt,
             negative_prompt = negativePrompt,

TensorStack.Python/Pipelines/QwenImagePipeline.py

Lines changed: 26 additions & 3 deletions

@@ -6,8 +6,8 @@
 from threading import Event
 from collections.abc import Buffer
 from typing import Coroutine, Dict, Sequence, List, Tuple, Optional
-from diffusers import QwenImagePipeline, QwenImageImg2ImgPipeline
-from tensorstack.utils import MemoryStdout, create_scheduler, getDataType, createTensor
+from diffusers import QwenImagePipeline, QwenImageImg2ImgPipeline, QwenImageEditPipeline
+from tensorstack.utils import MemoryStdout, create_scheduler, getDataType, imageFromInput
 sys.stderr = MemoryStdout()

 # Globals
@@ -56,6 +56,14 @@ def load(
             token = secureToken,
             variant=variant
         )
+    elif _processType == "ImageEdit":
+        _pipeline = QwenImageEditPipeline.from_pretrained(
+            modelName,
+            torch_dtype=torch_dtype,
+            cache_dir = cacheDir,
+            token = secureToken,
+            variant=variant
+        )

     #Lora Adapters
     if loraAdapters is not None:
@@ -151,7 +159,7 @@ def generate(
         )[0]
     elif _processType == "ImageToImage":
         output = _pipeline(
-            image = createTensor(inputData, inputShape, device=_pipeline.device, dtype=_pipeline.dtype),
+            image = imageFromInput(inputData, inputShape),
             strength = strength,
             prompt = prompt,
             negative_prompt = negativePrompt,
@@ -165,6 +173,21 @@ def generate(
             callback_on_step_end = _progress_callback,
             callback_on_step_end_tensor_inputs = ["latents"]
         )[0]
+    elif _processType == "ImageEdit":
+        output = _pipeline(
+            image = imageFromInput(inputData, inputShape),
+            prompt = prompt,
+            negative_prompt = negativePrompt,
+            height = height,
+            width = width,
+            generator = _generator.manual_seed(seed),
+            true_cfg_scale = guidanceScale,
+            guidance_scale = guidanceScale2,
+            num_inference_steps = steps,
+            output_type = "np",
+            callback_on_step_end = _progress_callback,
+            callback_on_step_end_tensor_inputs = ["latents"]
+        )[0]

     # (Batch, Channel, Height, Width)
     output = output.transpose(0, 3, 1, 2)
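The new ImageEdit branches are thin wrappers around diffusers' QwenImageEditPipeline, which takes a reference image plus an edit instruction and drives classifier-free guidance through true_cfg_scale (mapped from guidanceScale above). A standalone sketch of the same call pattern; the model id, prompt, and file names are illustrative placeholders, not values from this commit:

import torch
from PIL import Image
from diffusers import QwenImageEditPipeline

# Placeholder model id; the pipeline above receives modelName at runtime.
pipe = QwenImageEditPipeline.from_pretrained(
    "Qwen/Qwen-Image-Edit", torch_dtype=torch.bfloat16
).to("cuda")

source = Image.open("input.png").convert("RGB")  # any RGB input image
edited = pipe(
    image = source,
    prompt = "replace the sky with a sunset",  # hypothetical edit instruction
    true_cfg_scale = 4.0,                      # guidanceScale in generate()
    num_inference_steps = 50,                  # steps in generate()
    generator = torch.Generator("cuda").manual_seed(0),
).images[0]
edited.save("edited.png")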

TensorStack.Python/Pipelines/WanPipeline.py

Lines changed: 2 additions & 2 deletions

@@ -7,7 +7,7 @@
 from collections.abc import Buffer
 from typing import Coroutine, Dict, Sequence, List, Tuple, Optional
 from diffusers import WanPipeline, WanImageToVideoPipeline, UniPCMultistepScheduler
-from tensorstack.utils import MemoryStdout, create_scheduler, getDataType, createTensor
+from tensorstack.utils import MemoryStdout, create_scheduler, getDataType, tensorFromInput
 sys.stderr = MemoryStdout()

 # Globals
@@ -152,7 +152,7 @@ def generate(
         )[0]
     elif _processType == "ImageToImage":
         max_area = height * width
-        image = createTensor(inputData, inputShape, device=_pipeline.device, dtype=_pipeline.dtype)
+        image = tensorFromInput(inputData, inputShape, device=_pipeline.device, dtype=_pipeline.dtype)
         image = resize_tensor(image, max_area, _pipeline)
         output = _pipeline(
             image = image,
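Note the asymmetry this commit introduces: the image pipelines now decode the input buffer to a PIL image via imageFromInput, while WanPipeline keeps the tensor path, with createTensor merely renamed to tensorFromInput and its output still placed on the pipeline's device and dtype. A quick sketch of the tensor path with synthetic data; shape and values are illustrative:

import torch
from tensorstack.utils import tensorFromInput

# Synthetic (B, C, H, W) buffer, flattened as it arrives from the host side.
shape = (1, 3, 480, 832)
data = torch.rand(shape).flatten().tolist()

# Unlike imageFromInput, this returns a torch.Tensor on the requested
# device/dtype and preserves the full batch.
t = tensorFromInput(data, shape, device="cpu", dtype=torch.float32)
print(t.shape)  # torch.Size([1, 3, 480, 832])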

TensorStack.Python/Pipelines/ZImagePipeline.py

Lines changed: 2 additions & 2 deletions

@@ -7,7 +7,7 @@
 from collections.abc import Buffer
 from typing import Coroutine, Dict, Sequence, List, Tuple, Optional
 from diffusers import ZImagePipeline, ZImageImg2ImgPipeline
-from tensorstack.utils import MemoryStdout, create_scheduler, getDataType, createTensor
+from tensorstack.utils import MemoryStdout, create_scheduler, getDataType, imageFromInput
 sys.stderr = MemoryStdout()

 # Globals
@@ -150,7 +150,7 @@ def generate(
         )[0]
     elif _processType == "ImageToImage":
         output = _pipeline(
-            image = createTensor(inputData, inputShape, device=_pipeline.device, dtype=_pipeline.dtype),
+            image = imageFromInput(inputData, inputShape),
             strength = strength,
             prompt = prompt,
             negative_prompt = negativePrompt,

TensorStack.Python/Python/lib/tensorstack/utils.py

Lines changed: 19 additions & 1 deletion

@@ -1,4 +1,5 @@
 import torch
+from PIL import Image
 from typing import Sequence, Optional
 import numpy as np
 import threading
@@ -80,7 +81,7 @@ def getDataType(dtype: str):
     return torch.float


-def createTensor(
+def tensorFromInput(
     inputData: Optional[Sequence[float]],
     inputShape: Optional[Sequence[int]],
     *,
@@ -112,6 +113,23 @@ def createTensor(
     return torch.from_numpy(np_array).to(device=device, dtype=dtype)


+def imageFromInput(
+    inputData: Optional[Sequence[float]],
+    inputShape: Optional[Sequence[int]],
+) -> Optional[Image.Image]:
+
+    if not inputData or not inputShape:
+        return None
+
+    t = torch.tensor(inputData, dtype=torch.float32)
+    t = t.view(*inputShape)
+    t = t[0]
+    t = (t + 1) / 2
+    t = t.permute(1, 2, 0)
+    t = (t.clamp(0, 1) * 255).to(torch.uint8)
+    return Image.fromarray(t.numpy())
+
+
 class MemoryStdout:
     def __init__(self, callback=None):
         self.callback = callback
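imageFromInput expects a flat float buffer scaled to [-1, 1] with an NCHW shape, keeps only the first image of the batch (t[0]), and returns None when either argument is empty. A round-trip sketch with synthetic data; the sizes are arbitrary:

import torch
from tensorstack.utils import imageFromInput

# One 3x64x64 image in [-1, 1], flattened to a plain Python list,
# mirroring how inputData/inputShape arrive from the host process.
shape = (1, 3, 64, 64)
data = (torch.rand(shape) * 2 - 1).flatten().tolist()

img = imageFromInput(data, shape)
print(img.size, img.mode)  # (64, 64) RGB

# Missing input short-circuits to None instead of raising.
assert imageFromInput(None, None) is None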
