KDPM2 Scheduler

saddam213 · saddam213 · commit ca2b6bd6160d · 2023-10-29T18:56:43.000+13:00
diff --git a/OnnxStack.StableDiffusion/Diffusers/DiffuserBase.cs b/OnnxStack.StableDiffusion/Diffusers/DiffuserBase.cs
@@ -283,6 +283,7 @@ protected static IScheduler GetScheduler(PromptOptions prompt, SchedulerOptions
                 SchedulerType.EulerAncestral => new EulerAncestralScheduler(options),
                 SchedulerType.DDPM => new DDPMScheduler(options),
                 SchedulerType.DDIM => new DDIMScheduler(options),
+                SchedulerType.KDPM2 => new KDPM2Scheduler(options),
                 _ => default
             };
         }
diff --git a/OnnxStack.StableDiffusion/Enums/SchedulerType.cs b/OnnxStack.StableDiffusion/Enums/SchedulerType.cs
@@ -17,6 +17,9 @@ public enum SchedulerType
         DDPM = 3,
 
         [Display(Name = "DDIM")]
-        DDIM = 4
+        DDIM = 4,
+
+        [Display(Name = "KDPM2")]
+        KDPM2 = 5
     }
 }
diff --git a/OnnxStack.StableDiffusion/Schedulers/DDPMScheduler.cs b/OnnxStack.StableDiffusion/Schedulers/DDPMScheduler.cs
@@ -1,9 +1,5 @@
 ﻿using Microsoft.ML.OnnxRuntime.Tensors;
 using NumSharp;
-using OnnxStack.Core;
-using OnnxStack.StableDiffusion.Config;
-using OnnxStack.StableDiffusion.Enums;
-using OnnxStack.StableDiffusion.Helpers;
 using OnnxStack.StableDiffusion.Config;
 using OnnxStack.StableDiffusion.Enums;
 using OnnxStack.StableDiffusion.Helpers;
diff --git a/OnnxStack.StableDiffusion/Schedulers/KDPM2Scheduler.cs b/OnnxStack.StableDiffusion/Schedulers/KDPM2Scheduler.cs
@@ -0,0 +1,248 @@
+﻿using Microsoft.ML.OnnxRuntime.Tensors;
+using NumSharp;
+using OnnxStack.StableDiffusion.Config;
+using OnnxStack.StableDiffusion.Enums;
+using OnnxStack.StableDiffusion.Helpers;
+using System;
+using System.Collections.Generic;
+using System.Linq;
+
+namespace OnnxStack.StableDiffusion.Schedulers
+{
+    internal class KDPM2Scheduler : SchedulerBase
+    {
+        private int _stepIndex;
+        private float[] _sigmas;
+        private float[] _sigmasInterpol;
+        private float[] _alphasCumProd;
+        private DenseTensor<float> _sample;
+
+        /// <summary>
+        /// Initializes a new instance of the <see cref="KDPM2Scheduler"/> class
+        /// with a default-constructed <see cref="SchedulerOptions"/>.
+        /// </summary>
+        public KDPM2Scheduler() : this(new SchedulerOptions()) { }
+
+        /// <summary>
+        /// Initializes a new instance of the <see cref="KDPM2Scheduler"/> class.
+        /// The options are handed straight to the base class constructor.
+        /// </summary>
+        /// <param name="options">The scheduler options.</param>
+        public KDPM2Scheduler(SchedulerOptions options) : base(options) { }
+
+
+        /// <summary>
+        /// Resets the step state and rebuilds the sigma table from the beta schedule.
+        /// </summary>
+        protected override void Initialize()
+        {
+            _stepIndex = 0;
+            _sample = null;
+
+            // Cumulative product of (1 - beta) in one pass; same left-to-right multiply order as before.
+            var runningProduct = 1.0f;
+            _alphasCumProd = GetBetaSchedule()
+                .Select(beta => runningProduct *= 1.0f - beta)
+                .ToArray();
+            // sigma = sqrt((1 - alphaCumProd) / alphaCumProd)
+            _sigmas = _alphasCumProd
+               .Select(alpha_prod => (float)Math.Sqrt((1 - alpha_prod) / alpha_prod))
+               .ToArray();
+
+            var initNoiseSigma = GetInitNoiseSigma(_sigmas);
+            SetInitNoiseSigma(initNoiseSigma);
+        }
+
+
+        /// <summary>
+        /// Builds the interleaved timestep list and replaces <c>_sigmas</c> / <c>_sigmasInterpol</c> with their interleaved forms.
+        /// </summary>
+        /// <returns>The interpolated and base timesteps combined, cast to <see cref="int"/> and sorted in descending order.</returns>
+        protected override int[] SetTimesteps()
+        {
+            // Copy the sigma table; its log is still needed after _sigmas is overwritten further down
+            var sigmas = _sigmas.ToArray();
+            var timesteps = GetTimesteps();
+            var logSigmas = np.log(sigmas).ToArray<float>();
+            var range = np.arange(0, (float)_sigmas.Length).ToArray<float>();
+            sigmas = Interpolate(timesteps, range, _sigmas);
+
+            if (Options.UseKarrasSigmas)
+            {
+                sigmas = ConvertToKarras(sigmas);
+                timesteps = SigmaToTimestep(sigmas, logSigmas);
+            }
+
+            // Log-space midpoints between neighbouring sigmas (see InterpolateSigmas)
+            var sigmasInterpol = InterpolateSigmas(sigmas);
+
+            _sigmas = Interleave(sigmas);
+            _sigmasInterpol = Interleave(sigmasInterpol);
+
+            var timestepsInterpol = SigmaToTimestep(sigmasInterpol, logSigmas);
+            var interleavedTimesteps = timestepsInterpol
+                .Concat(timesteps)
+                .Select(x => (int)x)
+                .OrderByDescending(x => x)
+                .ToArray();
+            return interleavedTimesteps;
+        }
+
+
+        /// <summary>
+        /// Divides the sample by sqrt(sigma^2 + 1), using the base sigma when no first-pass sample is stored and the interpolated sigma otherwise.
+        /// </summary>
+        /// <param name="sample">The sample.</param>
+        /// <param name="timestep">The timestep (not read here; sigma is looked up by the internal step index).</param>
+        /// <returns>The result of dividing <paramref name="sample"/> by the scale factor.</returns>
+        public override DenseTensor<float> ScaleInput(DenseTensor<float> sample, int timestep)
+        {
+            var sigma = _sample is null
+                ? _sigmas[_stepIndex]
+                : _sigmasInterpol[_stepIndex];
+
+            sigma = (float)Math.Sqrt(Math.Pow(sigma, 2) + 1);
+            return sample.DivideTensorByFloat(sigma);
+        }
+
+
+        /// <summary>
+        /// Processes an inference step for the specified model output.
+        /// </summary>
+        /// <param name="modelOutput">The model output.</param>
+        /// <param name="timestep">The timestep (not read by this method).</param>
+        /// <param name="sample">The sample.</param>
+        /// <param name="order">The order (not read by this method).</param>
+        /// <returns>The sample advanced by <c>derivative * dt</c>.</returns>
+        /// <remarks>Passes alternate: when no sample is stored the input is saved and stepped to the interpolated sigma; otherwise the saved sample is restored,
+        /// stepped to the next sigma, and the stored copy cleared. Prediction types other than Epsilon and VariablePrediction use the model output as the predicted original sample.</remarks>
+        public override DenseTensor<float> Step(DenseTensor<float> modelOutput, int timestep, DenseTensor<float> sample, int order = 4)
+        {
+            float sigma;
+            float sigmaInterpol;
+            float sigmaNext;
+            bool isFirstPass = _sample is null;
+            if (isFirstPass)
+            {
+                sigma = _sigmas[_stepIndex];
+                sigmaInterpol = _sigmasInterpol[_stepIndex + 1];
+                sigmaNext = _sigmas[_stepIndex + 1];
+            }
+            else
+            {
+                sigma = _sigmas[_stepIndex - 1];
+                sigmaInterpol = _sigmasInterpol[_stepIndex];
+                sigmaNext = _sigmas[_stepIndex];
+            }
+
+            // Only gamma = 0 is currently supported, so sigmaHat is equal to sigma.
+            float gamma = 0f;
+            float sigmaHat = sigma * (gamma + 1f);
+            var sigmaInput = isFirstPass ? sigmaHat : sigmaInterpol;
+            DenseTensor<float> predOriginalSample;
+            if (Options.PredictionType == PredictionType.Epsilon)
+            {
+                predOriginalSample = sample.SubtractTensors(modelOutput.MultipleTensorByFloat(sigmaInput));
+            }
+            else if (Options.PredictionType == PredictionType.VariablePrediction)
+            {
+                var sigmaSqrt = (float)Math.Sqrt(sigmaInput * sigmaInput + 1f);
+                predOriginalSample = sample.DivideTensorByFloat(sigmaSqrt)
+                    .AddTensors(modelOutput.MultipleTensorByFloat(-sigmaInput / sigmaSqrt));
+            }
+            else
+            {
+                predOriginalSample = modelOutput.ToDenseTensor();
+            }
+
+
+            float dt;
+            DenseTensor<float> derivative;
+            if (isFirstPass)
+            {
+                dt = sigmaInterpol - sigmaHat;
+                derivative = sample
+                    .SubtractTensors(predOriginalSample)
+                    .DivideTensorByFloat(sigmaHat);
+                _sample = sample.ToDenseTensor();
+            }
+            else
+            {
+                dt = sigmaNext - sigmaHat;
+                derivative = sample
+                    .SubtractTensors(predOriginalSample)
+                    .DivideTensorByFloat(sigmaInterpol);
+                sample = _sample;
+                _sample = null;
+            }
+
+            _stepIndex += 1;
+            return sample.AddTensors(derivative.MultipleTensorByFloat(dt));
+        }
+
+
+        /// <summary>
+        /// Adds noise to the sample, scaled by the sigma at the current step index.
+        /// </summary>
+        /// <param name="originalSamples">The original samples.</param>
+        /// <param name="noise">The noise.</param>
+        /// <param name="timesteps">The timesteps (not read here).</param>
+        /// <returns><paramref name="noise"/> multiplied by sigma, plus <paramref name="originalSamples"/>.</returns>
+        public override DenseTensor<float> AddNoise(DenseTensor<float> originalSamples, DenseTensor<float> noise, IReadOnlyList<int> timesteps)
+        {
+            var sigma = _sigmas[_stepIndex];
+            return noise
+                .MultipleTensorByFloat(sigma)
+                .AddTensors(originalSamples);
+        }
+
+
+        /// <summary>
+        /// Interpolates the sigmas: entry i is the geometric mean of sigmas[i - 1] and sigmas[i], with entry 0 wrapping around to the last sigma.
+        /// </summary>
+        /// <param name="sigmas">The sigmas.</param>
+        /// <returns>An array with the same length as <paramref name="sigmas"/>.</returns>
+        public float[] InterpolateSigmas(float[] sigmas)
+        {
+            var rolledLogSigmas = sigmas
+                .Append(0f) // only extends the sequence by one; the appended value itself is never read
+                .Select((value, index) => (float)Math.Log(sigmas[(index + sigmas.Length - 1) % sigmas.Length])) // log of the previous sigma, wrapping at index 0
+                .ToArray();
+
+            var lerpSigmas = new float[rolledLogSigmas.Length - 1];
+            for (int i = 0; i < rolledLogSigmas.Length - 1; i++)
+            {
+                lerpSigmas[i] = (float)Math.Exp(rolledLogSigmas[i] + 0.5f * (rolledLogSigmas[i + 1] - rolledLogSigmas[i])); // midpoint in log space
+            }
+            return lerpSigmas;
+        }
+
+
+        /// <summary>
+        /// Interleaves the specified sigmas: the first element once, every later element twice, then the last element once more.
+        /// </summary>
+        /// <param name="sigmas">The sigmas.</param>
+        /// <returns>An array of length <c>2 * sigmas.Length</c>.</returns>
+        private float[] Interleave(float[] sigmas)
+        {
+            var first = sigmas.First();
+            var last = sigmas.Last();
+            return sigmas.Skip(1)
+                .SelectMany(value => new[] { value, value })
+                .Prepend(first)
+                .Append(last)
+                .ToArray();
+        }
+
+
+        /// <summary>
+        /// Clears the cached cumulative alpha products and forwards to the base implementation.
+        /// </summary>
+        /// <param name="disposing">Passed through unchanged to <c>base.Dispose</c>; not inspected by this override.</param>
+        protected override void Dispose(bool disposing)
+        {
+            _alphasCumProd = null;
+            base.Dispose(disposing);
+        }
+    }
+}
diff --git a/OnnxStack.StableDiffusion/Schedulers/SchedulerBase.cs b/OnnxStack.StableDiffusion/Schedulers/SchedulerBase.cs
@@ -276,7 +276,7 @@ protected float[] GetBetasForAlphaBar()
         protected float[] Interpolate(float[] timesteps, float[] range, float[] sigmas)
         {
             // Create an output array with the same shape as timesteps
-            var result = new float[timesteps.Length + 1];
+            var result = new float[timesteps.Length];
 
             // Loop over each element of timesteps
             for (int i = 0; i < timesteps.Length; i++)

Original file line number	Diff line number	Diff line change
`@@ -283,6 +283,7 @@ protected static IScheduler GetScheduler(PromptOptions prompt, SchedulerOptions`
`283`	`283`	`SchedulerType.EulerAncestral => new EulerAncestralScheduler(options),`
`284`	`284`	`SchedulerType.DDPM => new DDPMScheduler(options),`
`285`	`285`	`SchedulerType.DDIM => new DDIMScheduler(options),`
	`286`	`+ SchedulerType.KDPM2 => new KDPM2Scheduler(options),`
`286`	`287`	`_ => default`
`287`	`288`	`};`
`288`	`289`	`}`
Original file line number	Diff line number	Diff line change
`@@ -17,6 +17,9 @@ public enum SchedulerType`
`17`	`17`	`DDPM = 3,`
`18`	`18`
`19`	`19`	`[Display(Name = "DDIM")]`
`20`		`- DDIM = 4`
	`20`	`+ DDIM = 4,`
	`21`	`+`
	`22`	`+ [Display(Name = "KDPM2")]`
	`23`	`+ KDPM2 = 5`
`21`	`24`	`}`
`22`	`25`	`}`
Original file line number	Diff line number	Diff line change
`@@ -276,7 +276,7 @@ protected float[] GetBetasForAlphaBar()`
`276`	`276`	`protected float[] Interpolate(float[] timesteps, float[] range, float[] sigmas)`
`277`	`277`	`{`
`278`	`278`	`// Create an output array with the same shape as timesteps`
`279`		`- var result = new float[timesteps.Length + 1];`
	`279`	`+ var result = new float[timesteps.Length];`
`280`	`280`
`281`	`281`	`// Loop over each element of timesteps`
`282`	`282`	`for (int i = 0; i < timesteps.Length; i++)`