LCM Scheduler prototype

saddam213 · saddam213 · commit 87bcdb8adba2 · 2023-11-02T14:28:22.000+13:00
diff --git a/OnnxStack.StableDiffusion/Schedulers/LCMScheduler.cs b/OnnxStack.StableDiffusion/Schedulers/LCMScheduler.cs
@@ -0,0 +1,216 @@
+﻿using Microsoft.ML.OnnxRuntime.Tensors;
+using OnnxStack.StableDiffusion.Config;
+using OnnxStack.StableDiffusion.Enums;
+using OnnxStack.StableDiffusion.Helpers;
+using System;
+using System.Collections.Generic;
+using System.Linq;
+
+namespace OnnxStack.StableDiffusion.Schedulers
+{
+    /// <summary>
+    /// Scheduler for Latent Consistency Models (https://arxiv.org/abs/2310.04378).
+    /// </summary>
+    internal class LCMScheduler : SchedulerBase
+    {
+        // Cumulative product of (1 - beta) over the beta schedule, indexed by timestep.
+        private float[] _alphasCumProd;
+
+        // Cumulative alpha used by Step when the previous timestep is negative.
+        private float _finalAlphaCumprod;
+
+        // Length of the origin timestep schedule that SetTimesteps samples from.
+        private int _originalInferenceSteps;
+
+        /// <summary>
+        /// Initializes a new instance of the <see cref="LCMScheduler"/> class using default <see cref="SchedulerOptions"/>.
+        /// </summary>
+        public LCMScheduler() : this(new SchedulerOptions()) { }
+
+        /// <summary>
+        /// Initializes a new instance of the <see cref="LCMScheduler"/> class.
+        /// </summary>
+        /// <param name="options">The scheduler options.</param>
+        public LCMScheduler(SchedulerOptions options) : base(options) { }
+
+
+        /// <summary>
+        /// Initializes this instance: builds the cumulative alpha table from the beta schedule,
+        /// records the origin schedule length and sets the initial noise sigma to 1.
+        /// </summary>
+        protected override void Initialize()
+        {
+            // alpha_t = 1 - beta_t for every entry of the beta schedule (materialized once).
+            var alphas = GetBetaSchedule()
+                .Select(beta => 1.0f - beta)
+                .ToArray();
+
+            // Running product in a single pass; the multiplication order matches a
+            // left-to-right product of each prefix, so the values are unchanged.
+            var alphasCumProd = new float[alphas.Length];
+            var runningProduct = 1.0f;
+            for (var i = 0; i < alphas.Length; i++)
+            {
+                runningProduct *= alphas[i];
+                alphasCumProd[i] = runningProduct;
+            }
+            _alphasCumProd = alphasCumProd;
+
+            // When true the final cumulative alpha is 1; otherwise the first table entry is used.
+            bool setAlphaToOne = true;
+            _finalAlphaCumprod = setAlphaToOne
+                ? 1.0f
+                : _alphasCumProd.First();
+
+            // The number of steps used to generate the linearly-spaced origin timestep schedule, from which
+            // `InferenceSteps` evenly spaced timesteps are taken to form the final timestep schedule.
+            // Here it is taken from Options.InferenceSteps, so both schedules start with the same length.
+            _originalInferenceSteps = Options.InferenceSteps;
+
+            SetInitNoiseSigma(1.0f);
+        }
+
+
+        /// <summary>
+        /// Sets the timesteps.
+        /// </summary>
+        /// <returns>The selected timesteps in descending order; empty when no inference steps are requested.</returns>
+        protected override int[] SetTimesteps()
+        {
+            // LCM Timesteps Setting
+            // Currently, only linear spacing is supported.
+            var timeIncrement = (float)Options.TrainTimesteps / _originalInferenceSteps;
+
+            // LCM Training Steps Schedule
+            var lcmOriginTimesteps = Enumerable.Range(1, _originalInferenceSteps)
+                .Select(x => x * timeIncrement - 1f)
+                .ToArray();
+
+            // Nothing to schedule; this also keeps the integer division below from dividing by zero.
+            if (Options.InferenceSteps <= 0)
+            {
+                return Array.Empty<int>();
+            }
+
+            // Whole-number stride between picked origin timesteps. A fractional stride compared with
+            // `index % stride == 0` would match almost no index and return too few timesteps.
+            var skippingStep = Math.Max(1, lcmOriginTimesteps.Length / Options.InferenceSteps);
+
+            // LCM Inference Steps Schedule
+            // NOTE(review): selection starts at the low end of the origin schedule; the diffusers
+            // reference appears to walk it from the high end - confirm which is intended.
+            return lcmOriginTimesteps
+                .Where((t, index) => index % skippingStep == 0)
+                .Take(Options.InferenceSteps)
+                .Select(x => (int)x)
+                .OrderByDescending(x => x)
+                .ToArray();
+        }
+
+
+        /// <summary>
+        /// Scales the input. This scheduler applies no scaling.
+        /// </summary>
+        /// <param name="sample">The sample.</param>
+        /// <param name="timestep">The timestep (not used).</param>
+        /// <returns>The <paramref name="sample"/> instance, unchanged.</returns>
+        public override DenseTensor<float> ScaleInput(DenseTensor<float> sample, int timestep)
+        {
+            return sample;
+        }
+
+
+        /// <summary>
+        /// Processes a inference step for the specified model output.
+        /// </summary>
+        /// <param name="modelOutput">The model output.</param>
+        /// <param name="timestep">The timestep; used as an index into the cumulative alpha table.</param>
+        /// <param name="sample">The sample.</param>
+        /// <param name="order">The order (not used by this scheduler).</param>
+        /// <returns>The denoised sample, re-noised to the previous timestep when more than one timestep is scheduled.</returns>
+        /// <exception cref="NotSupportedException">The configured prediction type is not handled.</exception>
+        public override DenseTensor<float> Step(DenseTensor<float> modelOutput, int timestep, DenseTensor<float> sample, int order = 4)
+        {
+            // Latent Consistency Models paper https://arxiv.org/abs/2310.04378
+
+            int currentTimestep = timestep;
+
+            // 1. get previous step value
+            int previousTimestep = GetPreviousTimestep(currentTimestep);
+
+            // 2. compute alphas, betas
+            float alphaProdT = _alphasCumProd[currentTimestep];
+            float alphaProdTPrev = previousTimestep >= 0 ? _alphasCumProd[previousTimestep] : _finalAlphaCumprod;
+            float betaProdT = 1f - alphaProdT;
+            float betaProdTPrev = 1f - alphaProdTPrev;
+            float sqrtAlphaProdT = MathF.Sqrt(alphaProdT);
+            float sqrtBetaProdT = MathF.Sqrt(betaProdT);
+
+            // 3. Get scalings for boundary conditions
+            (float cSkip, float cOut) = GetBoundaryConditionScalings(currentTimestep);
+
+
+            // 4. compute predicted original sample from predicted noise also called "predicted x_0" of formula (15) from https://arxiv.org/pdf/2006.11239.pdf
+            DenseTensor<float> predOriginalSample;
+            switch (Options.PredictionType)
+            {
+                case PredictionType.Epsilon:
+                    // x_0 = (sample - sqrt(beta_t) * output) / sqrt(alpha_t)
+                    predOriginalSample = sample
+                        .SubtractTensors(modelOutput.MultipleTensorByFloat(sqrtBetaProdT))
+                        .DivideTensorByFloat(sqrtAlphaProdT);
+                    break;
+
+                case PredictionType.Sample:
+                    // The model output already is the predicted x_0.
+                    predOriginalSample = modelOutput;
+                    break;
+
+                case PredictionType.VariablePrediction:
+                    // x_0 = sqrt(alpha_t) * sample - sqrt(beta_t) * output
+                    predOriginalSample = sample
+                        .MultipleTensorByFloat(sqrtAlphaProdT)
+                        .SubtractTensors(modelOutput.MultipleTensorByFloat(sqrtBetaProdT));
+                    break;
+
+                default:
+                    // Fail with a clear message instead of a NullReferenceException further down.
+                    throw new NotSupportedException($"Prediction type '{Options.PredictionType}' is not supported by {nameof(LCMScheduler)}.");
+            }
+
+
+            // 5. Clip or threshold "predicted x_0"
+            // TODO: OnnxStack does not yet support Threshold and Clipping
+
+
+            // 6. Denoise model output using boundary conditions
+            var denoised = sample
+                .MultipleTensorByFloat(cSkip)
+                .AddTensors(predOriginalSample.MultipleTensorByFloat(cOut));
+
+
+            // 7. Sample and inject noise z ~ N(0, I) for MultiStep Inference
+            if (Timesteps.Count <= 1)
+            {
+                // Single-step inference: the denoised sample is returned as is.
+                return denoised;
+            }
+
+            return CreateRandomSample(modelOutput.Dimensions)
+                .MultipleTensorByFloat(MathF.Sqrt(betaProdTPrev))
+                .AddTensors(denoised.MultipleTensorByFloat(MathF.Sqrt(alphaProdTPrev)));
+        }
+
+
+        /// <summary>
+        /// Adds noise to the sample.
+        /// </summary>
+        /// <param name="originalSamples">The original samples.</param>
+        /// <param name="noise">The noise.</param>
+        /// <param name="timesteps">The timesteps; only the first entry is used.</param>
+        /// <returns>sqrt(alphaProd) * originalSamples + sqrt(1 - alphaProd) * noise.</returns>
+        public override DenseTensor<float> AddNoise(DenseTensor<float> originalSamples, DenseTensor<float> noise, IReadOnlyList<int> timesteps)
+        {
+            // Ref: https://github.com/huggingface/diffusers/blob/main/src/diffusers/schedulers/scheduling_ddpm.py#L456
+            int timestep = timesteps[0];
+            float alphaProd = _alphasCumProd[timestep];
+            float sqrtAlpha = MathF.Sqrt(alphaProd);
+            float sqrtOneMinusAlpha = MathF.Sqrt(1.0f - alphaProd);
+
+            return noise
+                .MultipleTensorByFloat(sqrtOneMinusAlpha)
+                .AddTensors(originalSamples.MultipleTensorByFloat(sqrtAlpha));
+        }
+
+
+        /// <summary>
+        /// Gets the boundary condition scalings.
+        /// </summary>
+        /// <param name="timestep">The timestep.</param>
+        /// <returns>
+        /// <c>cSkip</c>, the weight applied to the current sample, and <c>cOut</c>, the weight applied
+        /// to the predicted original sample.
+        /// </returns>
+        public (float cSkip, float cOut) GetBoundaryConditionScalings(float timestep)
+        {
+            // self.sigma_data = 0.5  # Default: 0.5
+            const float sigmaData = 0.5f;
+
+            float scaledTimestep = timestep / 0.1f;
+            float sigmaDataSquared = sigmaData * sigmaData;
+            float denominator = scaledTimestep * scaledTimestep + sigmaDataSquared;
+
+            // c_skip = sigma_data^2 / ((t / 0.1)^2 + sigma_data^2)
+            float cSkip = sigmaDataSquared / denominator;
+
+            // c_out = (t / 0.1) / sqrt((t / 0.1)^2 + sigma_data^2)
+            // The trailing "** 0.5" of the reference formula is a square root of the denominator,
+            // not a multiplication by one half.
+            float cOut = scaledTimestep / MathF.Sqrt(denominator);
+
+            return (cSkip, cOut);
+        }
+
+
+        /// <summary>
+        /// Releases unmanaged and - optionally - managed resources.
+        /// </summary>
+        /// <param name="disposing"><c>true</c> to release both managed and unmanaged resources; <c>false</c> to release only unmanaged resources.</param>
+        protected override void Dispose(bool disposing)
+        {
+            // Drop the cumulative alpha table before delegating to the base implementation.
+            _alphasCumProd = null;
+            base.Dispose(disposing);
+        }
+    }
+}