LCM ImageToImage support

saddam213 · saddam213 · commit 86d719556833 · 2023-11-03T08:23:36.000+13:00
diff --git a/OnnxStack.StableDiffusion/Diffusers/LatentConsistency/ImageDiffuser.cs b/OnnxStack.StableDiffusion/Diffusers/LatentConsistency/ImageDiffuser.cs
@@ -0,0 +1,74 @@
+﻿using Microsoft.ML.OnnxRuntime;
+using Microsoft.ML.OnnxRuntime.Tensors;
+using OnnxStack.Core.Config;
+using OnnxStack.Core.Services;
+using OnnxStack.StableDiffusion.Common;
+using OnnxStack.StableDiffusion.Config;
+using OnnxStack.StableDiffusion.Helpers;
+using SixLabors.ImageSharp;
+using System;
+using System.Collections.Generic;
+using System.Linq;
+
+
+namespace OnnxStack.StableDiffusion.Diffusers.LatentConsistency
+{
+    public sealed class ImageDiffuser : TextDiffuser // Image-to-image diffuser in the LatentConsistency namespace; overrides TextDiffuser's timestep selection and latent preparation.
+    {
+        /// <summary>
+        /// Initializes a new instance of the <see cref="ImageDiffuser"/> class.
+        /// </summary>
+        /// <param name="onnxModelService">The onnx model service.</param>
+        /// <param name="promptService">The prompt service.</param>
+        public ImageDiffuser(IOnnxModelService onnxModelService, IPromptService promptService)
+            : base(onnxModelService, promptService)
+        {
+        }
+
+
+        /// <summary>
+        /// Gets the scheduler timesteps to run, skipping the leading steps according to the Strength option.
+        /// </summary>
+        /// <param name="prompt">The prompt (not read by this override).</param>
+        /// <param name="options">The options; InferenceSteps and Strength determine how many steps are skipped.</param>
+        /// <param name="scheduler">The scheduler whose Timesteps are narrowed.</param>
+        /// <returns>The scheduler timesteps remaining after the skipped leading steps.</returns>
+        protected override IReadOnlyList<int> GetTimesteps(PromptOptions prompt, SchedulerOptions options, IScheduler scheduler)
+        {
+            // Image2Image: narrow the step range by Strength, i.e. keep only the last (int)(InferenceSteps * Strength) timesteps
+            var inittimestep = Math.Min((int)(options.InferenceSteps * options.Strength), options.InferenceSteps);
+            var start = Math.Max(options.InferenceSteps - inittimestep, 0);
+            return scheduler.Timesteps.Skip(start).ToList();
+        }
+
+
+        /// <summary>
+        /// Encodes the input image with the VAE encoder of <paramref name="model"/>, scales it and adds scheduler noise for <paramref name="timesteps"/>.
+        /// </summary>
+        /// <param name="prompt">The prompt; supplies InputImage and BatchCount.</param>
+        /// <param name="options">The options; supplies Width, Height and InitialNoiseLevel.</param>
+        /// <param name="scheduler">The scheduler used to create the random samples and to add the noise.</param>
+        /// <returns>The noised latent; passed through <c>Repeat(prompt.BatchCount)</c> when BatchCount is greater than one.</returns>
+        protected override DenseTensor<float> PrepareLatents(IModelOptions model, PromptOptions prompt, SchedulerOptions options, IScheduler scheduler, IReadOnlyList<int> timesteps)
+        {
+            // Encode the input image with the VAE encoder, add noise, and return the result as the starting latent
+            var imageTensor = prompt.InputImage.ToDenseTensor(new[] { 1, 3, options.Width, options.Height }); // NOTE(review): dims are given as Width, Height; confirm the order ToDenseTensor and the encoder expect (NCHW would be Height, Width)
+            var inputNames = _onnxModelService.GetInputNames(model, OnnxModelType.VaeEncoder);
+            var inputParameters = CreateInputParameters(NamedOnnxValue.CreateFromTensor(inputNames[0], imageTensor));
+            using (var inferResult = _onnxModelService.RunInference(model, OnnxModelType.VaeEncoder, inputParameters))
+            {
+                var sample = inferResult.FirstElementAs<DenseTensor<float>>();
+                var scaledSample = sample // the random sample (InitialNoiseLevel) is added before multiplying by the model scale factor
+                    .Add(scheduler.CreateRandomSample(sample.Dimensions, options.InitialNoiseLevel))
+                    .MultiplyBy(model.ScaleFactor);
+
+                var noisySample = scheduler.AddNoise(scaledSample, scheduler.CreateRandomSample(scaledSample.Dimensions), timesteps);
+                if (prompt.BatchCount > 1)
+                    return noisySample.Repeat(prompt.BatchCount);
+
+                return noisySample;
+            }
+        }
+
+    }
+}
diff --git a/OnnxStack.StableDiffusion/Diffusers/LatentConsistency/TextDiffuser.cs b/OnnxStack.StableDiffusion/Diffusers/LatentConsistency/TextDiffuser.cs
@@ -5,8 +5,6 @@
 using OnnxStack.StableDiffusion.Common;
 using OnnxStack.StableDiffusion.Config;
 using OnnxStack.StableDiffusion.Enums;
-using OnnxStack.StableDiffusion.Helpers;
-using OnnxStack.StableDiffusion.Schedulers;
 using OnnxStack.StableDiffusion.Schedulers.LatentConsistency;
 using System;
 using System.Collections.Generic;
@@ -16,7 +14,7 @@
 
 namespace OnnxStack.StableDiffusion.Diffusers.LatentConsistency
 {
-    public sealed class TextDiffuser : DiffuserBase
+    public class TextDiffuser : DiffuserBase
     {
         /// <summary>
         /// Initializes a new instance of the <see cref="TextDiffuser"/> class.
diff --git a/OnnxStack.StableDiffusion/Pipelines/LatentConsistency.cs b/OnnxStack.StableDiffusion/Pipelines/LatentConsistency.cs
@@ -17,7 +17,8 @@ public LatentConsistencyPipeline(IOnnxModelService onnxModelService, IPromptServ
         {
             var diffusers = new Dictionary<DiffuserType, IDiffuser>
             {
-               { DiffuserType.TextToImage, new TextDiffuser(onnxModelService, promptService) }
+               { DiffuserType.TextToImage, new TextDiffuser(onnxModelService, promptService) },
+               { DiffuserType.ImageToImage, new ImageDiffuser(onnxModelService, promptService) }
             };
             _pipelineType = DiffuserPipelineType.LatentConsistency;
             _diffusers = new ConcurrentDictionary<DiffuserType, IDiffuser>(diffusers);
diff --git a/OnnxStack.StableDiffusion/Schedulers/LatentConsistency/LCMScheduler.cs b/OnnxStack.StableDiffusion/Schedulers/LatentConsistency/LCMScheduler.cs
@@ -197,7 +197,7 @@ public override DenseTensor<float> AddNoise(DenseTensor<float> originalSamples,
         public (float cSkip, float cOut) GetBoundaryConditionScalings(float timestep)
         {
             //self.sigma_data = 0.5  # Default: 0.5
-            var sigmaData = 0.1f;
+            var sigmaData = 0.5f;
 
             float c = MathF.Pow(timestep / 0.1f, 2f) + MathF.Pow(sigmaData, 2f);
             float cSkip = MathF.Pow(sigmaData, 2f) / c;

Original file line number	Diff line number	Diff line change
`@@ -17,7 +17,8 @@ public LatentConsistencyPipeline(IOnnxModelService onnxModelService, IPromptServ`
`17`	`17`	`{`
`18`	`18`	`var diffusers = new Dictionary<DiffuserType, IDiffuser>`
`19`	`19`	`{`
`20`		`- { DiffuserType.TextToImage, new TextDiffuser(onnxModelService, promptService) }`
	`20`	`+ { DiffuserType.TextToImage, new TextDiffuser(onnxModelService, promptService) },`
	`21`	`+ { DiffuserType.ImageToImage, new ImageDiffuser(onnxModelService, promptService) }`
`21`	`22`	`};`
`22`	`23`	`_pipelineType = DiffuserPipelineType.LatentConsistency;`
`23`	`24`	`_diffusers = new ConcurrentDictionary<DiffuserType, IDiffuser>(diffusers);`
Original file line number	Diff line number	Diff line change
`@@ -197,7 +197,7 @@ public override DenseTensor<float> AddNoise(DenseTensor<float> originalSamples,`
`197`	`197`	`public (float cSkip, float cOut) GetBoundaryConditionScalings(float timestep)`
`198`	`198`	`{`
`199`	`199`	`//self.sigma_data = 0.5 # Default: 0.5`
`200`		`- var sigmaData = 0.1f;`
	`200`	`+ var sigmaData = 0.5f;`
`201`	`201`
`202`	`202`	`float c = MathF.Pow(timestep / 0.1f, 2f) + MathF.Pow(sigmaData, 2f);`
`203`	`203`	`float cSkip = MathF.Pow(sigmaData, 2f) / c;`