
Commit d6ed1f3

Merge branch 'master' of https://github.com/pytorch/ios-demo-app

2 parents fc3c40e + e709095

19 files changed, +177 −26 lines

ImageSegmentation/ImageSegmentation.xcodeproj/project.pbxproj
Lines changed: 4 additions & 4 deletions

@@ -8,6 +8,7 @@

 /* Begin PBXBuildFile section */
 2655CA6425454E6E006AD893 /* UIImageHelper.mm in Sources */ = {isa = PBXBuildFile; fileRef = 2655CA6225454E6E006AD893 /* UIImageHelper.mm */; };
+2658DBFB26EC059F00AA0F61 /* deeplabv3_scripted.pt in Resources */ = {isa = PBXBuildFile; fileRef = 2658DBFA26EC059F00AA0F61 /* deeplabv3_scripted.pt */; };
 265BAFE8253A6A6800467AC4 /* AppDelegate.swift in Sources */ = {isa = PBXBuildFile; fileRef = 265BAFE7253A6A6800467AC4 /* AppDelegate.swift */; };
 265BAFEA253A6A6800467AC4 /* SceneDelegate.swift in Sources */ = {isa = PBXBuildFile; fileRef = 265BAFE9253A6A6800467AC4 /* SceneDelegate.swift */; };
 265BAFEC253A6A6800467AC4 /* ViewController.swift in Sources */ = {isa = PBXBuildFile; fileRef = 265BAFEB253A6A6800467AC4 /* ViewController.swift */; };

@@ -18,12 +19,12 @@
 265BB00E253A6E0E00467AC4 /* UIImage+Helper.swift in Sources */ = {isa = PBXBuildFile; fileRef = 265BB00D253A6E0E00467AC4 /* UIImage+Helper.swift */; };
 265BB017253A7F0500467AC4 /* TorchModule.mm in Sources */ = {isa = PBXBuildFile; fileRef = 265BB015253A7F0500467AC4 /* TorchModule.mm */; };
 265F9A6F2551CB3700B8F2EC /* dog.jpg in Resources */ = {isa = PBXBuildFile; fileRef = 265F9A6E2551CB3700B8F2EC /* dog.jpg */; };
-266A451D267974C300548578 /* deeplabv3_scripted.ptl in Resources */ = {isa = PBXBuildFile; fileRef = 266A451C267974C300548578 /* deeplabv3_scripted.ptl */; };
 /* End PBXBuildFile section */

 /* Begin PBXFileReference section */
 2655CA6225454E6E006AD893 /* UIImageHelper.mm */ = {isa = PBXFileReference; fileEncoding = 4; lastKnownFileType = sourcecode.cpp.objcpp; path = UIImageHelper.mm; sourceTree = "<group>"; };
 2655CA6325454E6E006AD893 /* UIImageHelper.h */ = {isa = PBXFileReference; fileEncoding = 4; lastKnownFileType = sourcecode.c.h; path = UIImageHelper.h; sourceTree = "<group>"; };
+2658DBFA26EC059F00AA0F61 /* deeplabv3_scripted.pt */ = {isa = PBXFileReference; lastKnownFileType = file; path = deeplabv3_scripted.pt; sourceTree = "<group>"; };
 265BAFE4253A6A6800467AC4 /* ImageSegmentation.app */ = {isa = PBXFileReference; explicitFileType = wrapper.application; includeInIndex = 0; path = ImageSegmentation.app; sourceTree = BUILT_PRODUCTS_DIR; };
 265BAFE7253A6A6800467AC4 /* AppDelegate.swift */ = {isa = PBXFileReference; lastKnownFileType = sourcecode.swift; path = AppDelegate.swift; sourceTree = "<group>"; };
 265BAFE9253A6A6800467AC4 /* SceneDelegate.swift */ = {isa = PBXFileReference; lastKnownFileType = sourcecode.swift; path = SceneDelegate.swift; sourceTree = "<group>"; };

@@ -38,7 +39,6 @@
 265BB015253A7F0500467AC4 /* TorchModule.mm */ = {isa = PBXFileReference; fileEncoding = 4; lastKnownFileType = sourcecode.cpp.objcpp; path = TorchModule.mm; sourceTree = "<group>"; };
 265BB016253A7F0500467AC4 /* TorchModule.h */ = {isa = PBXFileReference; fileEncoding = 4; lastKnownFileType = sourcecode.c.h; path = TorchModule.h; sourceTree = "<group>"; };
 265F9A6E2551CB3700B8F2EC /* dog.jpg */ = {isa = PBXFileReference; lastKnownFileType = image.jpeg; path = dog.jpg; sourceTree = "<group>"; };
-266A451C267974C300548578 /* deeplabv3_scripted.ptl */ = {isa = PBXFileReference; lastKnownFileType = file; path = deeplabv3_scripted.ptl; sourceTree = "<group>"; };
 /* End PBXFileReference section */

 /* Begin PBXFrameworksBuildPhase section */

@@ -92,7 +92,7 @@
 265BB015253A7F0500467AC4 /* TorchModule.mm */,
 265BB00D253A6E0E00467AC4 /* UIImage+Helper.swift */,
 265BAFFF253A6B1200467AC4 /* ImageSegmentation-Bridging-Header.h */,
-266A451C267974C300548578 /* deeplabv3_scripted.ptl */,
+2658DBFA26EC059F00AA0F61 /* deeplabv3_scripted.pt */,
 265BB007253A6B9600467AC4 /* deeplab.jpg */,
 265F9A6E2551CB3700B8F2EC /* dog.jpg */,
 );

@@ -161,8 +161,8 @@
 265BAFF4253A6A6900467AC4 /* LaunchScreen.storyboard in Resources */,
 265BB008253A6B9600467AC4 /* deeplab.jpg in Resources */,
 265BAFF1253A6A6900467AC4 /* Assets.xcassets in Resources */,
+2658DBFB26EC059F00AA0F61 /* deeplabv3_scripted.pt in Resources */,
 265BAFEF253A6A6800467AC4 /* Main.storyboard in Resources */,
-266A451D267974C300548578 /* deeplabv3_scripted.ptl in Resources */,
 );
 runOnlyForDeploymentPostprocessing = 0;
 };

ImageSegmentation/ImageSegmentation/TorchModule.mm
Lines changed: 4 additions & 3 deletions

@@ -8,18 +8,19 @@
 #import "UIImageHelper.h"
 #import <CoreImage/CoreImage.h>
 #import <ImageIO/ImageIO.h>
-#import <Libtorch-Lite/Libtorch-Lite.h>
+#import <Libtorch/Libtorch.h>

 @implementation TorchModule {
 @protected
-  torch::jit::mobile::Module _impl;
+  torch::jit::script::Module _impl;
 }

 - (nullable instancetype)initWithFileAtPath:(NSString*)filePath {
   self = [super init];
   if (self) {
     try {
-      _impl = torch::jit::_load_for_mobile(filePath.UTF8String);
+      _impl = torch::jit::load(filePath.UTF8String);
+      _impl.eval();
     } catch (const std::exception& exception) {
       NSLog(@"%s", exception.what());
       return nil;
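
The change above swaps the Lite/Mobile Interpreter loading API for the Full JIT one. For readers who want to sanity-check the two model formats outside the app, here is a minimal Python sketch of the matching Python-side APIs; the file paths and the input size are illustrative assumptions, and both files are expected to come from the `deeplabv3.py` export script below:

```
import torch
from torch.jit.mobile import _load_for_lite_interpreter

# Full JIT model: the Python counterpart of torch::jit::load above
full_jit = torch.jit.load("ImageSegmentation/deeplabv3_scripted.pt")
full_jit.eval()

# Lite/Mobile Interpreter model: the counterpart of torch::jit::_load_for_mobile
lite = _load_for_lite_interpreter("ImageSegmentation/deeplabv3_scripted.ptl")

# Both variants should segment an identical input identically
x = torch.rand(1, 3, 250, 250)
with torch.no_grad():
    out_full = full_jit(x)["out"]
    out_lite = lite(x)["out"]
print(torch.allclose(out_full, out_lite))  # expected: True
```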

ImageSegmentation/ImageSegmentation/ViewController.swift
Lines changed: 1 addition & 1 deletion

@@ -10,7 +10,7 @@ class ViewController: UIViewController {

   private lazy var module: TorchModule = {
     if let filePath = Bundle.main.path(forResource:
-      "deeplabv3_scripted", ofType: "ptl"),
+      "deeplabv3_scripted", ofType: "pt"),
       let module = TorchModule(fileAtPath: filePath) {
       return module
     } else {

ImageSegmentation/Podfile
Lines changed: 1 addition & 1 deletion

@@ -6,5 +6,5 @@ target 'ImageSegmentation' do
   use_frameworks!

   # Pods for ImageSegmentation
-  pod 'LibTorch-Lite', '~>1.9.0'
+  pod 'LibTorch', '~>1.9.0'
 end

ImageSegmentation/README.md
Lines changed: 38 additions & 8 deletions

@@ -2,13 +2,13 @@

 ## Introduction

-This repo offers a Python script that converts the [PyTorch DeepLabV3 model](https://pytorch.org/hub/pytorch_vision_deeplabv3_resnet101) to the Mobile Interpreter version and an iOS app that uses the model to segment images.
+This repo offers a Python script that converts the [PyTorch DeepLabV3 model](https://pytorch.org/hub/pytorch_vision_deeplabv3_resnet101) to both the Full JIT and the Lite/Mobile Interpreter versions, and an iOS app that uses the Full JIT model to segment images. Steps for preparing the Lite model and making the code changes in the Xcode project to use it are also provided.

 ## Prerequisites

 * PyTorch 1.9 and torchvision 0.10 (Optional)
 * Python 3.8 or above (Optional)
-* iOS Cocoapods LibTorch-Lite 1.9.0 and LibTorchvision 0.10.0
+* iOS Cocoapods LibTorch 1.9.0 or LibTorch-Lite 1.9.0
 * Xcode 12.4 or later

 ## Quick Start

@@ -17,25 +17,25 @@ To Test Run the Image Segmentation iOS App, follow the steps below:

 ### 1. Prepare the Model

-If you don't have the PyTorch environment set up to run the script below to generate the model file, you can download it to the `ios-demo-app/ImageSegmentation` folder using the link [here](https://pytorch-mobile-demo-apps.s3.us-east-2.amazonaws.com/deeplabv3_scripted.ptl).
+If you don't have the PyTorch environment set up to run the script below to generate the Full JIT model file, you can download it to the `ios-demo-app/ImageSegmentation` folder using the link [here](https://pytorch-mobile-demo-apps.s3.us-east-2.amazonaws.com/deeplabv3_scripted.pt).

-Open a Mac Terminal, first install PyTorch 1.9 and torchvision 0.10 using command like `pip install torch torchvision`, then run the following commands:
+Open a Terminal, first install PyTorch 1.9 and torchvision 0.10 using a command like `pip install torch torchvision`, then run the following commands:

 ```
 git clone https://github.com/pytorch/ios-demo-app
 cd ios-demo-app/ImageSegmentation
 python deeplabv3.py
 ```

-The Python script `deeplabv3.py` is used to generate the Lite Interpreter model file `deeplabv3_scripted.ptl` to be used in iOS.
+The Python script `deeplabv3.py` generates both the Full JIT and the Lite Interpreter model files, `deeplabv3_scripted.pt` and `deeplabv3_scripted.ptl`, to be used in iOS.

-### 2. Use LibTorch-Lite
+### 2. Use LibTorch

-Run the commands below (note the `Podfile` uses `pod 'LibTorch-Lite', '~>1.9.0'`):
+Run the commands below (note the `Podfile` uses `pod 'LibTorch', '~>1.9.0'`):

 ```
 pod install
-open ImageSegmentation.xcworkspace/
+open ImageSegmentation.xcworkspace
 ```

 ### 3. Run the app

@@ -46,6 +46,36 @@ Select an iOS simulator or device on Xcode to run the app. The example image and

 Note that the `resized` method in `UIImage+Helper.swift` is used to speed up the model inference, but a smaller size may cause the result to be less accurate.

+## Using the Lite/Mobile Interpreter Model
+
+All the other iOS demo apps have been converted to use the new Mobile Interpreter model. This Image Segmentation demo app is the exception: it illustrates how to convert a demo using a Full JIT model to one using the Mobile Interpreter model, in 3 simple steps.
+
+### 1. Prepare the Lite model
+
+If you don't have the PyTorch environment set up to run the script `deeplabv3.py` to generate the Mobile Interpreter model file, you can download it to the `ios-demo-app/ImageSegmentation` folder using the link [here](https://pytorch-mobile-demo-apps.s3.us-east-2.amazonaws.com/deeplabv3_scripted.ptl). Otherwise, just run `python deeplabv3.py` to generate the model yourself.
+
+Note that to save a model in the Mobile Interpreter format, simply call `_save_for_lite_interpreter`, as shown at the end of `deeplabv3.py`:
+```
+optimized_model.save("ImageSegmentation/deeplabv3_scripted.pt")
+optimized_model._save_for_lite_interpreter("ImageSegmentation/deeplabv3_scripted.ptl")
+```
+
+### 2. Modify the Podfile
+
+If you already went through the previous section and have the demo using the Full JIT model up and running, close Xcode, go to the `ios-demo-app/ImageSegmentation` directory, and run `pod deintegrate` first.
+
+In `Podfile`, change `pod 'LibTorch', '~>1.9.0'` to `pod 'LibTorch-Lite', '~>1.9.0'`.
+
+Then run `pod install` and `open ImageSegmentation.xcworkspace`. Don't forget to drag and drop the `deeplabv3_scripted.ptl` file from step 1 into the project.
+
+### 3. Change the iOS code
+
+In `TorchModule.mm`, first change `#import <Libtorch/Libtorch.h>` to `#import <Libtorch-Lite/Libtorch-Lite.h>`, then change `torch::jit::script::Module _impl;` to `torch::jit::mobile::Module _impl;`, and `_impl = torch::jit::load(filePath.UTF8String);` to `_impl = torch::jit::_load_for_mobile(filePath.UTF8String);`.
+
+Finally, in `ViewController.swift`, change `ofType: "pt"` in `Bundle.main.path(forResource: "deeplabv3_scripted", ofType: "pt")` to `ofType: "ptl"`.
+
+Now you can build and run the app using the Lite/Mobile Interpreter model.
+
 ## Tutorial

 Read the tutorial [here](https://pytorch.org/tutorials/beginner/deeplabv3_on_ios.html) for detailed step-by-step instructions of how to prepare and run the [PyTorch DeepLabV3 model](https://pytorch.org/hub/pytorch_vision_deeplabv3_resnet101) on iOS, as well as practical tips on how to successfully use a pre-trained PyTorch model on iOS and avoid common pitfalls.

ImageSegmentation/deeplabv3.py
Lines changed: 1 addition & 0 deletions

@@ -6,4 +6,5 @@

 scripted_module = torch.jit.script(model)
 optimized_model = optimize_for_mobile(scripted_module)
+optimized_model.save("ImageSegmentation/deeplabv3_scripted.pt")
 optimized_model._save_for_lite_interpreter("ImageSegmentation/deeplabv3_scripted.ptl")
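
The hunk shows only the tail of the export script. For context, a minimal sketch of the whole flow is below; the model-loading lines are an assumption based on the DeepLabV3 variant linked in the README, while the last four lines match the script as committed:

```
import torch
from torch.utils.mobile_optimizer import optimize_for_mobile

# Assumed model source: the torchvision DeepLabV3-ResNet101 linked in the README
model = torch.hub.load('pytorch/vision:v0.10.0', 'deeplabv3_resnet101', pretrained=True)
model.eval()

scripted_module = torch.jit.script(model)               # TorchScript via scripting
optimized_model = optimize_for_mobile(scripted_module)  # apply mobile-friendly passes
optimized_model.save("ImageSegmentation/deeplabv3_scripted.pt")                          # Full JIT
optimized_model._save_for_lite_interpreter("ImageSegmentation/deeplabv3_scripted.ptl")   # Lite
```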

ObjectDetection/ObjectDetection.xcodeproj/project.pbxproj
Lines changed: 16 additions & 0 deletions

@@ -7,6 +7,10 @@
 objects = {

 /* Begin PBXBuildFile section */
+2669BE16270FA65200806A63 /* aicook2.jpg in Resources */ = {isa = PBXBuildFile; fileRef = 2669BE11270FA61000806A63 /* aicook2.jpg */; };
+2669BE18270FA65200806A63 /* aicook.txt in Resources */ = {isa = PBXBuildFile; fileRef = 2669BE13270FA62F00806A63 /* aicook.txt */; };
+2669BE19270FA65200806A63 /* aicook1.jpg in Resources */ = {isa = PBXBuildFile; fileRef = 2669BE14270FA63D00806A63 /* aicook1.jpg */; };
+2669BE1A270FA65200806A63 /* aicook3.jpg in Resources */ = {isa = PBXBuildFile; fileRef = 2669BE15270FA65200806A63 /* aicook3.jpg */; };
 266E87232563120D00CF5151 /* classes.txt in Resources */ = {isa = PBXBuildFile; fileRef = 266E87222563120D00CF5151 /* classes.txt */; };
 266E8746256350C000CF5151 /* CameraController.swift in Sources */ = {isa = PBXBuildFile; fileRef = 266E8742256350C000CF5151 /* CameraController.swift */; };
 266E8747256350C000CF5151 /* CVPixelBuffer+Helper.swift in Sources */ = {isa = PBXBuildFile; fileRef = 266E8743256350C000CF5151 /* CVPixelBuffer+Helper.swift */; };

@@ -29,6 +33,10 @@
 /* End PBXBuildFile section */

 /* Begin PBXFileReference section */
+2669BE11270FA61000806A63 /* aicook2.jpg */ = {isa = PBXFileReference; lastKnownFileType = image.jpeg; path = aicook2.jpg; sourceTree = "<group>"; };
+2669BE13270FA62F00806A63 /* aicook.txt */ = {isa = PBXFileReference; fileEncoding = 4; lastKnownFileType = text; path = aicook.txt; sourceTree = "<group>"; };
+2669BE14270FA63D00806A63 /* aicook1.jpg */ = {isa = PBXFileReference; lastKnownFileType = image.jpeg; path = aicook1.jpg; sourceTree = "<group>"; };
+2669BE15270FA65200806A63 /* aicook3.jpg */ = {isa = PBXFileReference; lastKnownFileType = image.jpeg; path = aicook3.jpg; sourceTree = "<group>"; };
 266E87222563120D00CF5151 /* classes.txt */ = {isa = PBXFileReference; fileEncoding = 4; lastKnownFileType = text; path = classes.txt; sourceTree = "<group>"; };
 266E8742256350C000CF5151 /* CameraController.swift */ = {isa = PBXFileReference; fileEncoding = 4; lastKnownFileType = sourcecode.swift; path = CameraController.swift; sourceTree = "<group>"; };
 266E8743256350C000CF5151 /* CVPixelBuffer+Helper.swift */ = {isa = PBXFileReference; fileEncoding = 4; lastKnownFileType = sourcecode.swift; path = "CVPixelBuffer+Helper.swift"; sourceTree = "<group>"; };

@@ -109,6 +117,10 @@
 269E7487255CC69400B1D6CA /* test1.png */,
 269E748B255CC6D100B1D6CA /* test2.jpg */,
 269E748A255CC6D100B1D6CA /* test3.png */,
+2669BE13270FA62F00806A63 /* aicook.txt */,
+2669BE14270FA63D00806A63 /* aicook1.jpg */,
+2669BE11270FA61000806A63 /* aicook2.jpg */,
+2669BE15270FA65200806A63 /* aicook3.jpg */,
 266E87222563120D00CF5151 /* classes.txt */,
 26A8C11326E17F8100F4A58D /* yolov5s.torchscript.ptl */,
 );

@@ -201,12 +213,16 @@
 buildActionMask = 2147483647;
 files = (
 269E747E255CC56400B1D6CA /* LaunchScreen.storyboard in Resources */,
+2669BE18270FA65200806A63 /* aicook.txt in Resources */,
 26A8C11426E17F8100F4A58D /* yolov5s.torchscript.ptl in Resources */,
 266E87232563120D00CF5151 /* classes.txt in Resources */,
 269E747B255CC56400B1D6CA /* Assets.xcassets in Resources */,
+2669BE19270FA65200806A63 /* aicook1.jpg in Resources */,
 269E748D255CC6D100B1D6CA /* test2.jpg in Resources */,
+2669BE16270FA65200806A63 /* aicook2.jpg in Resources */,
 269E7488255CC69400B1D6CA /* test1.png in Resources */,
 269E7479255CC56200B1D6CA /* Main.storyboard in Resources */,
+2669BE1A270FA65200806A63 /* aicook3.jpg in Resources */,
 269E748C255CC6D100B1D6CA /* test3.png in Resources */,
 );
 runOnlyForDeploymentPostprocessing = 0;

ObjectDetection/ObjectDetection/Inference/InferenceModule.mm
Lines changed: 1 addition & 1 deletion

@@ -32,7 +32,7 @@ - (nullable instancetype)initWithFileAtPath:(NSString*)filePath {

 - (NSArray<NSNumber*>*)detectImage:(void*)imageBuffer {
   try {
-    at::Tensor tensor = torch::from_blob(imageBuffer, { 1, 3, input_width, input_height }, at::kFloat);
+    at::Tensor tensor = torch::from_blob(imageBuffer, { 1, 3, input_height, input_width }, at::kFloat);

     c10::InferenceMode guard;
     CFTimeInterval startTime = CACurrentMediaTime();
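
This ordering fix matters because PyTorch vision models take NCHW input (batch, channels, height, width). The demo's input happens to be square (640×640 in `PrePostProcessor.swift`), so the old order was a latent bug; with a non-square frame the tensor would silently misread the buffer. A small Python illustration, using a hypothetical non-square size:

```
import torch

input_width, input_height = 640, 480  # hypothetical non-square frame
buffer = torch.arange(3 * input_height * input_width, dtype=torch.float32)

fixed = buffer.reshape(1, 3, input_height, input_width)    # { 1, 3, H, W }: the corrected order
swapped = buffer.reshape(1, 3, input_width, input_height)  # { 1, 3, W, H }: the old order
print(fixed.shape)    # torch.Size([1, 3, 480, 640])
print(swapped.shape)  # torch.Size([1, 3, 640, 480]); rows and columns are misread
```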

ObjectDetection/ObjectDetection/Utils/PrePostProcessor.swift
Lines changed: 2 additions & 2 deletions

@@ -17,7 +17,7 @@ class PrePostProcessor : NSObject {
 static let inputWidth = 640
 static let inputHeight = 640

-// model output is of size 25200*85
+// model output is of size 25200*(num_of_class+5)
 static let outputRow = 25200 // as decided by the YOLOv5 model for input image of size 640*640
 static let outputColumn = 85 // left, top, right, bottom, score and 80 class probability
 static let threshold : Float = 0.35 // score above which a detection is generated

@@ -111,7 +111,7 @@ class PrePostProcessor : NSObject {

 let rect = CGRect(x: startX+ivScaleX*left, y: startY+top*ivScaleY, width: ivScaleX*(right-left), height: ivScaleY*(bottom-top))

-let prediction = Prediction(classIndex: cls, score: Float(truncating: outputs[i*85+4]), rect: rect)
+let prediction = Prediction(classIndex: cls, score: Float(truncating: outputs[i*outputColumn+4]), rect: rect)
 predictions.append(prediction)
 }
 }
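
These two changes generalize the decoder from the hard-coded 85-column COCO layout to any (num_of_class+5)-column layout, such as the 30-class aicook model added in this commit. For reference, a small Python sketch of where 25200 and 85 come from; the three-anchors-per-cell figure is an assumption about the standard YOLOv5 detection head:

```
input_width = input_height = 640
anchors_per_cell = 3  # assumed standard YOLOv5 head
strides = (8, 16, 32)

output_row = sum((input_width // s) * (input_height // s) * anchors_per_cell
                 for s in strides)
print(output_row)  # 25200, matching outputRow

num_classes = 80        # the COCO model shipped with the demo
print(num_classes + 5)  # 85 columns per row; the score sits at index 4
```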
aicook.txt (new file)
Lines changed: 30 additions & 0 deletions

@@ -0,0 +1,30 @@
+apple
+banana
+beef
+blueberries
+bread
+butter
+carrot
+cheese
+chicken
+chicken_breast
+chocolate
+corn
+eggs
+flour
+goat_cheese
+green_beans
+ground_beef
+ham
+heavy_cream
+lime
+milk
+mushrooms
+onion
+potato
+shrimp
+spinach
+strawberries
+sugar
+sweet_potato
+tomato
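
For a model trained on these classes, `outputColumn` becomes 30 + 5 = 35 rather than 85. Below is a hypothetical Python helper that derives the value from the class list; the file path is an assumption about where the file sits relative to the working directory:

```
# Hypothetical helper; adjust the path to wherever aicook.txt lives
with open("aicook.txt") as f:
    classes = [line.strip() for line in f if line.strip()]

print(len(classes))      # 30 ingredient classes
print(len(classes) + 5)  # 35, the (num_of_class+5) columns per output row
```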
