@@ -5,6 +5,16 @@ enum LlamaError: Error {
55 case couldNotInitializeContext
66}
77
/// User-tunable knobs that configure a llama.cpp context and its sampler chain.
///
/// Instances are passed across the `LlamaContext` actor boundary (in `create_context`
/// and `updateSampler`), so the type is declared `Sendable`; every stored property is
/// a simple value type, making the conformance trivially correct.
struct LlamaRuntimeOptions: Sendable {
    /// Context window size (n_ctx), in tokens; also used as a floor for batch capacity.
    var contextLength: Int32
    /// Layers to offload to the GPU; negative values leave the library default untouched.
    var nGpuLayers: Int32
    /// RNG seed for the dist sampler; 0 is remapped to `UInt32.max` before use.
    var seed: UInt32
    /// Sampling temperature; clamped to be non-negative before use.
    var temperature: Float
    /// Nucleus (top-p) threshold; clamped into [0, 1] before use.
    var topP: Float
    /// Top-k cutoff; values <= 0 disable the top-k sampler entirely.
    var topK: Int32
    /// Whether flash attention is enabled on the context params.
    var flashAttention: Bool
}
17+
/// Marks `batch` as empty so its buffers can be reused for the next decode pass.
/// Only the token count is reset; the underlying allocations are left in place.
func llama_batch_clear(_ batch: inout llama_batch) {
    batch.n_tokens = 0
}
@@ -25,9 +35,10 @@ actor LlamaContext {
    // Opaque llama.cpp handles owned by this actor; released in deinit.
    private var model: OpaquePointer
    private var context: OpaquePointer
    private var vocab: OpaquePointer
    // Sampler chain; optional so it can be torn down and rebuilt when options change.
    private var sampling: UnsafeMutablePointer<llama_sampler>?
    // Reusable batch allocated once in init (llama_batch_init) and freed in deinit.
    private var batch: llama_batch
    // Token buffer — presumably the tokenized prompt; tokenization is not shown in this view.
    private var tokens_list: [llama_token]
    // Last options applied; consulted whenever the sampler chain is rebuilt.
    private var runtimeOptions: LlamaRuntimeOptions
    var is_done: Bool = false
3243
3344 /// This variable is used to store temporarily invalid cchars
@@ -38,34 +49,80 @@ actor LlamaContext {
3849
    // Running count of decode steps — TODO confirm against the decode loop (not visible here).
    var n_decode: Int32 = 0
4051
41- init ( model: OpaquePointer , context: OpaquePointer ) {
52+ init ( model: OpaquePointer , context: OpaquePointer , options : LlamaRuntimeOptions ) {
4253 self . model = model
4354 self . context = context
4455 self . tokens_list = [ ]
45- self . batch = llama_batch_init ( 512 , 0 , 1 )
56+ self . batch = llama_batch_init ( max ( Int32 ( 512 ) , options . contextLength ) , 0 , 1 )
4657 self . temporary_invalid_cchars = [ ]
47- let sparams = llama_sampler_chain_default_params ( )
48- self . sampling = llama_sampler_chain_init ( sparams)
49- llama_sampler_chain_add ( self . sampling, llama_sampler_init_temp ( 0.4 ) )
50- llama_sampler_chain_add ( self . sampling, llama_sampler_init_dist ( 1234 ) )
58+ self . runtimeOptions = options
59+ self . n_len = options. contextLength
5160 vocab = llama_model_get_vocab ( model)
61+
62+ let chainParams = llama_sampler_chain_default_params ( )
63+ let initialChain = llama_sampler_chain_init ( chainParams)
64+
65+ if options. topK > 0 {
66+ llama_sampler_chain_add ( initialChain, llama_sampler_init_top_k ( options. topK) )
67+ }
68+
69+ let clampedTopP = max ( 0.0 , min ( Double ( options. topP) , 1.0 ) )
70+ llama_sampler_chain_add ( initialChain, llama_sampler_init_top_p ( Float ( clampedTopP) , 1 ) )
71+
72+ let clampedTemp = max ( 0.0 , Double ( options. temperature) )
73+ llama_sampler_chain_add ( initialChain, llama_sampler_init_temp ( Float ( clampedTemp) ) )
74+
75+ let seed = options. seed == 0 ? UInt32 . max : options. seed
76+ llama_sampler_chain_add ( initialChain, llama_sampler_init_dist ( seed) )
77+
78+ sampling = initialChain
5279 }
5380
5481 deinit {
55- llama_sampler_free ( sampling)
82+ if let sampling {
83+ llama_sampler_free ( sampling)
84+ }
5685 llama_batch_free ( batch)
5786 llama_model_free ( model)
5887 llama_free ( context)
5988 llama_backend_free ( )
6089 }
6190
62- static func create_context( path: String ) throws -> LlamaContext {
91+ private func rebuildSamplerChain( ) {
92+ let chainParams = llama_sampler_chain_default_params ( )
93+ let newChain = llama_sampler_chain_init ( chainParams)
94+
95+ if runtimeOptions. topK > 0 {
96+ llama_sampler_chain_add ( newChain, llama_sampler_init_top_k ( runtimeOptions. topK) )
97+ }
98+
99+ let clampedTopP = max ( 0.0 , min ( runtimeOptions. topP, 1.0 ) )
100+ llama_sampler_chain_add ( newChain, llama_sampler_init_top_p ( clampedTopP, 1 ) )
101+
102+ let clampedTemp = max ( 0.0 , Double ( runtimeOptions. temperature) )
103+ llama_sampler_chain_add ( newChain, llama_sampler_init_temp ( Float ( clampedTemp) ) )
104+
105+ let seed = runtimeOptions. seed == 0 ? UInt32 . max : runtimeOptions. seed
106+ llama_sampler_chain_add ( newChain, llama_sampler_init_dist ( seed) )
107+
108+ if let sampling {
109+ llama_sampler_free ( sampling)
110+ }
111+
112+ sampling = newChain
113+ }
114+
115+ static func create_context( path: String , options: LlamaRuntimeOptions ) throws -> LlamaContext {
63116 llama_backend_init ( )
64117 var model_params = llama_model_default_params ( )
65118
66119#if targetEnvironment(simulator)
67120 model_params. n_gpu_layers = 0
68121 print ( " Running on simulator, force use n_gpu_layers = 0 " )
122+ #else
123+ if options. nGpuLayers >= 0 {
124+ model_params. n_gpu_layers = options. nGpuLayers
125+ }
69126#endif
70127 let model = llama_model_load_from_file ( path, model_params)
71128 guard let model else {
@@ -77,17 +134,24 @@ actor LlamaContext {
77134 print ( " Using \( n_threads) threads " )
78135
79136 var ctx_params = llama_context_default_params ( )
80- ctx_params. n_ctx = 2048
137+ ctx_params. n_ctx = UInt32 ( options . contextLength )
81138 ctx_params. n_threads = Int32 ( n_threads)
82139 ctx_params. n_threads_batch = Int32 ( n_threads)
140+ ctx_params. flash_attn_type = options. flashAttention ? LLAMA_FLASH_ATTN_TYPE_ENABLED : LLAMA_FLASH_ATTN_TYPE_DISABLED
83141
84142 let context = llama_init_from_model ( model, ctx_params)
85143 guard let context else {
86144 print ( " Could not load context! " )
87145 throw LlamaError . couldNotInitializeContext
88146 }
89147
90- return LlamaContext ( model: model, context: context)
148+ return LlamaContext ( model: model, context: context, options: options)
149+ }
150+
151+ func updateSampler( options: LlamaRuntimeOptions ) {
152+ runtimeOptions = options
153+ n_len = options. contextLength
154+ rebuildSamplerChain ( )
91155 }
92156
93157 func model_info( ) -> String {
@@ -151,6 +215,10 @@ actor LlamaContext {
151215 func completion_loop( ) -> String {
152216 var new_token_id : llama_token = 0
153217
218+ guard let sampling else {
219+ return " "
220+ }
221+
154222 new_token_id = llama_sampler_sample ( sampling, context, batch. n_tokens - 1 )
155223
156224 if llama_vocab_is_eog ( vocab, new_token_id) || n_cur == n_len {
0 commit comments