Inpaint Legacy process started

saddam213 · saddam213 · commit e31a85dabdbc · 2023-10-17T23:40:05.000+13:00
diff --git a/OnnxStack.StableDiffusion/Diffusers/InpaintLegacyDiffuser.cs b/OnnxStack.StableDiffusion/Diffusers/InpaintLegacyDiffuser.cs
@@ -0,0 +1,216 @@
+﻿using Microsoft.ML.OnnxRuntime;
+using Microsoft.ML.OnnxRuntime.Tensors;
+using OnnxStack.Core.Config;
+using OnnxStack.Core.Services;
+using OnnxStack.StableDiffusion.Common;
+using OnnxStack.StableDiffusion.Config;
+using OnnxStack.StableDiffusion.Diffusers;
+using OnnxStack.StableDiffusion.Helpers;
+using SixLabors.ImageSharp;
+using SixLabors.ImageSharp.Processing;
+using SixLabors.ImageSharp.Processing.Processors.Transforms;
+using System;
+using System.Collections.Generic;
+using System.Linq;
+using System.Threading;
+using System.Threading.Tasks;
+
+namespace OnnxStack.StableDiffusion.Services
+{
+    public sealed class InpaintLegacyDiffuser : DiffuserBase
+    {
+        /// <summary>
+        /// Initializes a new instance of the <see cref="InpaintLegacyDiffuser"/> class.
+        /// </summary>
+        /// <param name="configuration">The configuration.</param>
+        /// <param name="onnxModelService">The onnx model service.</param>
+        public InpaintLegacyDiffuser(IOnnxModelService onnxModelService, IPromptService promptService)
+            : base(onnxModelService, promptService)
+        {
+        }
+
+        public override async Task<DenseTensor<float>> DiffuseAsync(PromptOptions promptOptions, SchedulerOptions schedulerOptions, Action<int, int> progress = null, CancellationToken cancellationToken = default)
+        {
+            // Create random seed if none was set
+            schedulerOptions.Seed = schedulerOptions.Seed > 0 ? schedulerOptions.Seed : Random.Shared.Next();
+
+            // Get Scheduler
+            using (var scheduler = GetScheduler(promptOptions, schedulerOptions))
+            {
+                // Process prompts
+                var promptEmbeddings = await _promptService.CreatePromptAsync(promptOptions.Prompt, promptOptions.NegativePrompt);
+
+                // Get timesteps
+                var timesteps = GetTimesteps(promptOptions, schedulerOptions, scheduler);
+
+                // Create latent sample
+                var latentsOriginal = PrepareLatents(promptOptions, schedulerOptions, scheduler, timesteps);
+
+                // Create masks sample
+                var maskImage = PrepareMask(promptOptions, schedulerOptions);
+
+                // Generate some noise
+                var noise = scheduler.CreateRandomSample(latentsOriginal.Dimensions);
+
+                // Add noise to original latent
+                var latents = scheduler.AddNoise(latentsOriginal, noise, timesteps);
+
+                // Loop though the timesteps
+                var step = 0;
+                foreach (var timestep in timesteps)
+                {
+                    cancellationToken.ThrowIfCancellationRequested();
+
+                    // Create input tensor.
+                    var inputTensor = scheduler.ScaleInput(latents.Duplicate(schedulerOptions.GetScaledDimension(2)), timestep);
+
+                    // Create Input Parameters
+                    var inputNames = _onnxModelService.GetInputNames(OnnxModelType.Unet);
+                    var inputParameters = CreateInputParameters(
+                         NamedOnnxValue.CreateFromTensor(inputNames[0], inputTensor),
+                         NamedOnnxValue.CreateFromTensor(inputNames[1], new DenseTensor<long>(new long[] { timestep }, new int[] { 1 })),
+                         NamedOnnxValue.CreateFromTensor(inputNames[2], promptEmbeddings));
+
+                    // Run Inference
+                    using (var inferResult = await _onnxModelService.RunInferenceAsync(OnnxModelType.Unet, inputParameters))
+                    {
+                        var noisePred = inferResult.FirstElementAs<DenseTensor<float>>();
+
+                        // Perform guidance
+                        if (schedulerOptions.GuidanceScale > 1.0f)
+                        {
+                            var (noisePredUncond, noisePredText) = noisePred.SplitTensor(schedulerOptions.GetScaledDimension());
+                            noisePred = noisePredUncond.PerformGuidance(noisePredText, schedulerOptions.GuidanceScale);
+                        }
+
+                        // Scheduler Step
+                        var steplatents = scheduler.Step(noisePred, timestep, latents);
+
+                        // Add noise to original latent
+                        var initLatentsProper = scheduler.AddNoise(latentsOriginal, noise, new[] { timestep });
+
+                        // Apply mask and combine 
+                        latents = ApplyMaskedLatents(steplatents, initLatentsProper, maskImage);
+
+                        ImageHelpers.TensorToImageDebug(latents, $@"D:\Debug\Latent{step}.png");
+                    }
+
+                    progress?.Invoke(++step, timesteps.Count);
+                }
+
+                // Decode Latents
+                return await DecodeLatents(schedulerOptions, latents);
+            }
+        }
+
+
+        /// <summary>
+        /// Gets the timesteps.
+        /// </summary>
+        /// <param name="prompt">The prompt.</param>
+        /// <param name="options">The options.</param>
+        /// <param name="scheduler">The scheduler.</param>
+        /// <returns></returns>
+        protected override IReadOnlyList<int> GetTimesteps(PromptOptions prompt, SchedulerOptions options, IScheduler scheduler)
+        {
+            var inittimestep = Math.Min((int)(options.InferenceSteps * options.Strength), options.InferenceSteps);
+            var start = Math.Max(options.InferenceSteps - inittimestep, 0);
+            return scheduler.Timesteps.Skip(start).ToList();
+        }
+
+
+        /// <summary>
+        /// Prepares the latents for inference.
+        /// </summary>
+        /// <param name="prompt">The prompt.</param>
+        /// <param name="options">The options.</param>
+        /// <param name="scheduler">The scheduler.</param>
+        /// <returns></returns>
+        protected override DenseTensor<float> PrepareLatents(PromptOptions prompt, SchedulerOptions options, IScheduler scheduler, IReadOnlyList<int> timesteps)
+        {
+            // Image input, decode, add noise, return as latent 0
+            var imageTensor = prompt.InputImage.ToDenseTensor(new[] { 1, 3, options.Width, options.Height });
+            var inputNames = _onnxModelService.GetInputNames(OnnxModelType.VaeEncoder);
+            var inputParameters = CreateInputParameters(NamedOnnxValue.CreateFromTensor(inputNames[0], imageTensor));
+            using (var inferResult = _onnxModelService.RunInference(OnnxModelType.VaeEncoder, inputParameters))
+            {
+                var sample = inferResult.FirstElementAs<DenseTensor<float>>();
+                var noisySample = sample
+                    .AddTensors(scheduler.CreateRandomSample(sample.Dimensions, options.InitialNoiseLevel))
+                    .MultipleTensorByFloat(_configuration.ScaleFactor);
+                return noisySample;
+            }
+        }
+
+
+        /// <summary>
+        /// Prepares the mask.
+        /// </summary>
+        /// <param name="promptOptions">The prompt options.</param>
+        /// <param name="schedulerOptions">The scheduler options.</param>
+        /// <returns></returns>
+        private DenseTensor<float> PrepareMask(PromptOptions promptOptions, SchedulerOptions schedulerOptions)
+        {
+            using (var mask = promptOptions.InputImageMask.ToImage())
+            {
+                // Prepare the mask
+                int width = schedulerOptions.GetScaledWidth();
+                int height = schedulerOptions.GetScaledHeight();
+                mask.Mutate(x => x.Grayscale());
+                mask.Mutate(x => x.Resize(new Size(width, height), KnownResamplers.NearestNeighbor, true));
+                var maskTensor = new DenseTensor<float>(new[] { 1, 4, width, height });
+                mask.ProcessPixelRows(img =>
+                {
+                    for (int x = 0; x < width; x++)
+                    {
+                        for (int y = 0; y < height; y++)
+                        {
+                            var pixelSpan = img.GetRowSpan(y);
+                            var value = (float)pixelSpan[x].A / 255.0f;
+
+                            //TODO: mask = 1 - mask  # repaint white, keep black
+                            maskTensor[0, 0, y, x] = 0f;
+                            maskTensor[0, 1, y, x] = 0f; // Needed for shape only
+                            maskTensor[0, 2, y, x] = 0f; // Needed for shape only
+                            maskTensor[0, 3, y, x] = 0f; // Needed for shape only
+                        }
+                    }
+                });
+                return maskTensor;
+            }
+        }
+
+
+        /// <summary>
+        /// Applies the masked latents.
+        /// </summary>
+        /// <param name="latents">The latents.</param>
+        /// <param name="initLatentsProper">The initialize latents proper.</param>
+        /// <param name="mask">The mask.</param>
+        /// <returns></returns>
+        private DenseTensor<float> ApplyMaskedLatents(DenseTensor<float> latents, DenseTensor<float> initLatentsProper, DenseTensor<float> mask)
+        {
+            var result = new DenseTensor<float>(latents.Dimensions);
+            for (int batch = 0; batch < latents.Dimensions[0]; batch++)
+            {
+                for (int channel = 0; channel < latents.Dimensions[1]; channel++)
+                {
+                    for (int height = 0; height < latents.Dimensions[2]; height++)
+                    {
+                        for (int width = 0; width < latents.Dimensions[3]; width++)
+                        {
+                            float maskValue = mask[batch, 0, height, width];
+                            float latentsValue = latents[batch, channel, height, width];
+                            float initLatentsProperValue = initLatentsProper[batch, channel, height, width];
+
+                            //TODO: Apply the logic to compute the result based on the mask
+                            float newValue = (initLatentsProperValue * maskValue) + (latentsValue * (1f - maskValue));
+                            result[batch, channel, height, width] = newValue;
+                        }
+                    }
+                }
+            }
+            return result;
+        }
+    }
+}
diff --git a/OnnxStack.StableDiffusion/Helpers/TensorHelper.cs b/OnnxStack.StableDiffusion/Helpers/TensorHelper.cs
@@ -280,6 +280,62 @@ public static DenseTensor<float> Abs(this DenseTensor<float> tensor)
         }
 
 
+        /// <summary>
+        /// Multiplies the specified tensor.
+        /// </summary>
+        /// <param name="tensor1">The tensor1.</param>
+        /// <param name="tensor2">The tensor2.</param>
+        /// <returns></returns>
+        public static DenseTensor<float> Multiply(this DenseTensor<float> tensor1, DenseTensor<float> tensor2)
+        {
+            var result = new DenseTensor<float>(tensor1.Dimensions);
+            for (int batch = 0; batch < tensor1.Dimensions[0]; batch++)
+            {
+                for (int channel = 0; channel < tensor1.Dimensions[1]; channel++)
+                {
+                    for (int height = 0; height < tensor1.Dimensions[2]; height++)
+                    {
+                        for (int width = 0; width < tensor1.Dimensions[3]; width++)
+                        {
+                            var value1 = tensor1[batch, channel, height, width];
+                            var value2 = tensor2[batch, channel, height, width];
+                            result[batch, channel, height, width] = value1 * value2;
+                        }
+                    }
+                }
+            }
+            return result;
+        }
+
+
+        /// <summary>
+        /// Divides the specified tensor.
+        /// </summary>
+        /// <param name="tensor1">The tensor1.</param>
+        /// <param name="tensor2">The tensor2.</param>
+        /// <returns></returns>
+        public static DenseTensor<float> Divide(this DenseTensor<float> tensor1, DenseTensor<float> tensor2)
+        {
+            var result = new DenseTensor<float>(tensor1.Dimensions);
+            for (int batch = 0; batch < tensor1.Dimensions[0]; batch++)
+            {
+                for (int channel = 0; channel < tensor1.Dimensions[1]; channel++)
+                {
+                    for (int height = 0; height < tensor1.Dimensions[2]; height++)
+                    {
+                        for (int width = 0; width < tensor1.Dimensions[3]; width++)
+                        {
+                            var value1 = tensor1[batch, channel, height, width];
+                            var value2 = tensor2[batch, channel, height, width];
+                            result[batch, channel, height, width] = value1 / value2;
+                        }
+                    }
+                }
+            }
+            return result;
+        }
+
+
         /// <summary>
         /// Generate a random Tensor from a normal distribution with mean 0 and variance 1
         /// </summary>
diff --git a/OnnxStack.StableDiffusion/Services/DiffuserService.cs b/OnnxStack.StableDiffusion/Services/DiffuserService.cs
@@ -15,6 +15,7 @@ public sealed class DiffuserService : IDiffuserService
         private readonly IDiffuser _textDiffuser;
         private readonly IDiffuser _imageDiffuser;
         private readonly IDiffuser _inpaintDiffuser;
+        private readonly IDiffuser _inpaintLegacyDiffuser;
 
         /// <summary>
         /// Initializes a new instance of the <see cref="DiffuserService"/> class.
@@ -26,6 +27,7 @@ public DiffuserService(IOnnxModelService onnxModelService, IPromptService prompt
             _textDiffuser = new TextDiffuser(onnxModelService, promptService);
             _imageDiffuser = new ImageDiffuser(onnxModelService, promptService);
             _inpaintDiffuser = new InpaintDiffuser(onnxModelService, promptService);
+            _inpaintLegacyDiffuser = new InpaintLegacyDiffuser(onnxModelService, promptService);
         }
 
 
@@ -41,7 +43,7 @@ public async Task<DenseTensor<float>> RunAsync(PromptOptions promptOptions, Sche
             {
                 ProcessType.TextToImage => await _textDiffuser.DiffuseAsync(promptOptions, schedulerOptions, progress, cancellationToken),
                 ProcessType.ImageToImage => await _imageDiffuser.DiffuseAsync(promptOptions, schedulerOptions, progress, cancellationToken),
-                ProcessType.ImageInpaint => await _inpaintDiffuser.DiffuseAsync(promptOptions, schedulerOptions, progress, cancellationToken),
+                ProcessType.ImageInpaint => await _inpaintLegacyDiffuser.DiffuseAsync(promptOptions, schedulerOptions, progress, cancellationToken),
                 _ => throw new NotImplementedException()
             };
         }
diff --git a/OnnxStack.WebUI/wwwroot/js/stableDiffusionImageInpaint.js b/OnnxStack.WebUI/wwwroot/js/stableDiffusionImageInpaint.js
@@ -320,7 +320,7 @@ const stableDiffusionImageInpaint = () => {
 
 
     // Map UI Events/Functions
-    $(".image2image-control").hide();
+    //$(".image2image-control").hide();
     buttonCancel.on("click", cancelDiffusion);
     buttonClear.on("click", clearHistory);
     buttonExecute.on("click", async () => { await executeDiffusion(); });