huggingface · Jun 14, 2023
diff --git a/‎Diffusion-macOS/Capabilities.swift
+10 b/‎Diffusion-macOS/Capabilities.swift
+10
diff --git a/‎Diffusion.xcodeproj/project.pbxproj
+30-12 b/‎Diffusion.xcodeproj/project.pbxproj
+30-12
diff --git a/‎Diffusion.xcodeproj/project.xcworkspace/xcshareddata/swiftpm/Package.resolved
+1-1 b/‎Diffusion.xcodeproj/project.xcworkspace/xcshareddata/swiftpm/Package.resolved
+1-1
diff --git a/‎Diffusion/DiffusionApp.swift
+9 b/‎Diffusion/DiffusionApp.swift
+9
diff --git a/‎Diffusion/Downloader.swift
+13-3 b/‎Diffusion/Downloader.swift
+13-3
diff --git a/‎Diffusion/ModelInfo.swift
+92-18 b/‎Diffusion/ModelInfo.swift
+92-18
@@ -9,6 +9,16 @@
 import Foundation
 
 let runningOnMac = true
+let deviceHas6GBOrMore = true  // Constant on this target: no physical-memory check is made here
+
+let deviceSupportsQuantization = {  // The trailing `()` calls the closure, so the constant stores the resulting Bool
+    if #available(macOS 14, *) {  // true on macOS 14 or later
+        true
+    } else {
+        false  // Earlier macOS versions: ModelInfo.MODELS then omits the palettized entries
+    }
+}()
+
 
 #if canImport(MLCompute)
 import MLCompute
 
@@ -8,7 +8,8 @@
 
 /* Begin PBXBuildFile section */
 		EB067F872992E561004D1AD9 /* HelpContent.swift in Sources */ = {isa = PBXBuildFile; fileRef = EB067F862992E561004D1AD9 /* HelpContent.swift */; };
-		EB33A51D2954D89F00B16357 /* StableDiffusion in Frameworks */ = {isa = PBXBuildFile; productRef = EB33A51C2954D89F00B16357 /* StableDiffusion */; };
+		EB25B3D62A3A2DC4000E25A1 /* StableDiffusion in Frameworks */ = {isa = PBXBuildFile; productRef = EB25B3D52A3A2DC4000E25A1 /* StableDiffusion */; };
+		EB25B3D82A3A2DD5000E25A1 /* StableDiffusion in Frameworks */ = {isa = PBXBuildFile; productRef = EB25B3D72A3A2DD5000E25A1 /* StableDiffusion */; };
 		EB560F0429A3C20800C0F8B8 /* Capabilities.swift in Sources */ = {isa = PBXBuildFile; fileRef = EB560F0329A3C20800C0F8B8 /* Capabilities.swift */; };
 		EBB5BA5329425BEE003A2A5B /* PipelineLoader.swift in Sources */ = {isa = PBXBuildFile; fileRef = EBB5BA5229425BEE003A2A5B /* PipelineLoader.swift */; };
 		EBB5BA5829425E17003A2A5B /* Path in Frameworks */ = {isa = PBXBuildFile; productRef = EBB5BA5729425E17003A2A5B /* Path */; };
@@ -18,7 +19,6 @@
 		EBDD7DAB29731F7500C1C4B2 /* PipelineLoader.swift in Sources */ = {isa = PBXBuildFile; fileRef = EBB5BA5229425BEE003A2A5B /* PipelineLoader.swift */; };
 		EBDD7DAD29731FB300C1C4B2 /* Path in Frameworks */ = {isa = PBXBuildFile; productRef = EBDD7DAC29731FB300C1C4B2 /* Path */; };
 		EBDD7DAF29731FB300C1C4B2 /* ZIPFoundation in Frameworks */ = {isa = PBXBuildFile; productRef = EBDD7DAE29731FB300C1C4B2 /* ZIPFoundation */; };
-		EBDD7DB129731FB300C1C4B2 /* StableDiffusion in Frameworks */ = {isa = PBXBuildFile; productRef = EBDD7DB029731FB300C1C4B2 /* StableDiffusion */; };
 		EBDD7DB32973200200C1C4B2 /* Utils.swift in Sources */ = {isa = PBXBuildFile; fileRef = EBDD7DB22973200200C1C4B2 /* Utils.swift */; };
 		EBDD7DB42973200200C1C4B2 /* Utils.swift in Sources */ = {isa = PBXBuildFile; fileRef = EBDD7DB22973200200C1C4B2 /* Utils.swift */; };
 		EBDD7DB52973201800C1C4B2 /* ModelInfo.swift in Sources */ = {isa = PBXBuildFile; fileRef = EBE3FF4B295E1EFE00E921AA /* ModelInfo.swift */; };
@@ -105,7 +105,7 @@
 			buildActionMask = 2147483647;
 			files = (
 				EBB5BA5829425E17003A2A5B /* Path in Frameworks */,
-				EB33A51D2954D89F00B16357 /* StableDiffusion in Frameworks */,
+				EB25B3D62A3A2DC4000E25A1 /* StableDiffusion in Frameworks */,
 				EBB5BA5D294504DE003A2A5B /* ZIPFoundation in Frameworks */,
 			);
 			runOnlyForDeploymentPostprocessing = 0;
@@ -129,7 +129,7 @@
 			buildActionMask = 2147483647;
 			files = (
 				F155203C297118E700DC009B /* CompactSlider in Frameworks */,
-				EBDD7DB129731FB300C1C4B2 /* StableDiffusion in Frameworks */,
+				EB25B3D82A3A2DD5000E25A1 /* StableDiffusion in Frameworks */,
 				EBDD7DAD29731FB300C1C4B2 /* Path in Frameworks */,
 				EBDD7DAF29731FB300C1C4B2 /* ZIPFoundation in Frameworks */,
 			);
@@ -280,12 +280,13 @@
 			buildRules = (
 			);
 			dependencies = (
+				EBF61AB32A2F976600482CF3 /* PBXTargetDependency */,
 			);
 			name = Diffusion;
 			packageProductDependencies = (
 				EBB5BA5729425E17003A2A5B /* Path */,
 				EBB5BA5C294504DE003A2A5B /* ZIPFoundation */,
-				EB33A51C2954D89F00B16357 /* StableDiffusion */,
+				EB25B3D52A3A2DC4000E25A1 /* StableDiffusion */,
 			);
 			productName = Diffusion;
 			productReference = EBE755C5293E37DD00806B32 /* Diffusion.app */;
@@ -339,13 +340,14 @@
 			buildRules = (
 			);
 			dependencies = (
+				EB0199492A31FEAF00B133E2 /* PBXTargetDependency */,
 			);
 			name = "Diffusion-macOS";
 			packageProductDependencies = (
 				F155203B297118E700DC009B /* CompactSlider */,
 				EBDD7DAC29731FB300C1C4B2 /* Path */,
 				EBDD7DAE29731FB300C1C4B2 /* ZIPFoundation */,
-				EBDD7DB029731FB300C1C4B2 /* StableDiffusion */,
+				EB25B3D72A3A2DD5000E25A1 /* StableDiffusion */,
 			);
 			productName = "Diffusion-macOS";
 			productReference = F15520212971093300DC009B /* Diffusers.app */;
@@ -389,8 +391,8 @@
 			packageReferences = (
 				EBB5BA5629425E17003A2A5B /* XCRemoteSwiftPackageReference "Path.swift" */,
 				EBB5BA5B294504DE003A2A5B /* XCRemoteSwiftPackageReference "ZIPFoundation" */,
-				EB33A51B2954D89F00B16357 /* XCRemoteSwiftPackageReference "ml-stable-diffusion" */,
 				F155203A297118E600DC009B /* XCRemoteSwiftPackageReference "CompactSlider" */,
+				EB25B3D42A3A2DC4000E25A1 /* XCRemoteSwiftPackageReference "ml-stable-diffusion" */,
 			);
 			productRefGroup = EBE755C6293E37DD00806B32 /* Products */;
 			projectDirPath = "";
@@ -517,6 +519,10 @@
 /* End PBXSourcesBuildPhase section */
 
 /* Begin PBXTargetDependency section */
+		EB0199492A31FEAF00B133E2 /* PBXTargetDependency */ = {
+			isa = PBXTargetDependency;
+			productRef = EB0199482A31FEAF00B133E2 /* StableDiffusion */;
+		};
 		EBE755D8293E37DE00806B32 /* PBXTargetDependency */ = {
 			isa = PBXTargetDependency;
 			target = EBE755C4293E37DD00806B32 /* Diffusion */;
@@ -527,6 +533,10 @@
 			target = EBE755C4293E37DD00806B32 /* Diffusion */;
 			targetProxy = EBE755E1293E37DE00806B32 /* PBXContainerItemProxy */;
 		};
+		EBF61AB32A2F976600482CF3 /* PBXTargetDependency */ = {
+			isa = PBXTargetDependency;
+			productRef = EBF61AB22A2F976600482CF3 /* StableDiffusion */;
+		};
 /* End PBXTargetDependency section */
 
 /* Begin XCBuildConfiguration section */
@@ -915,7 +925,7 @@
 /* End XCConfigurationList section */
 
 /* Begin XCRemoteSwiftPackageReference section */
-		EB33A51B2954D89F00B16357 /* XCRemoteSwiftPackageReference "ml-stable-diffusion" */ = {
+		EB25B3D42A3A2DC4000E25A1 /* XCRemoteSwiftPackageReference "ml-stable-diffusion" */ = {
 			isa = XCRemoteSwiftPackageReference;
 			repositoryURL = "https://github.com/apple/ml-stable-diffusion";
 			requirement = {
@@ -950,9 +960,18 @@
 /* End XCRemoteSwiftPackageReference section */
 
 /* Begin XCSwiftPackageProductDependency section */
-		EB33A51C2954D89F00B16357 /* StableDiffusion */ = {
+		EB0199482A31FEAF00B133E2 /* StableDiffusion */ = {
+			isa = XCSwiftPackageProductDependency;
+			productName = StableDiffusion;
+		};
+		EB25B3D52A3A2DC4000E25A1 /* StableDiffusion */ = {
+			isa = XCSwiftPackageProductDependency;
+			package = EB25B3D42A3A2DC4000E25A1 /* XCRemoteSwiftPackageReference "ml-stable-diffusion" */;
+			productName = StableDiffusion;
+		};
+		EB25B3D72A3A2DD5000E25A1 /* StableDiffusion */ = {
 			isa = XCSwiftPackageProductDependency;
-			package = EB33A51B2954D89F00B16357 /* XCRemoteSwiftPackageReference "ml-stable-diffusion" */;
+			package = EB25B3D42A3A2DC4000E25A1 /* XCRemoteSwiftPackageReference "ml-stable-diffusion" */;
 			productName = StableDiffusion;
 		};
 		EBB5BA5729425E17003A2A5B /* Path */ = {
@@ -975,9 +994,8 @@
 			package = EBB5BA5B294504DE003A2A5B /* XCRemoteSwiftPackageReference "ZIPFoundation" */;
 			productName = ZIPFoundation;
 		};
-		EBDD7DB029731FB300C1C4B2 /* StableDiffusion */ = {
+		EBF61AB22A2F976600482CF3 /* StableDiffusion */ = {
 			isa = XCSwiftPackageProductDependency;
-			package = EB33A51B2954D89F00B16357 /* XCRemoteSwiftPackageReference "ml-stable-diffusion" */;
 			productName = StableDiffusion;
 		};
 		F155203B297118E700DC009B /* CompactSlider */ = {
 
@@ -15,7 +15,7 @@
       "location" : "https://github.com/apple/ml-stable-diffusion",
       "state" : {
         "branch" : "main",
-        "revision" : "fb1fa01c9d30e9b2e02a8b7ed35d905e272a0262"
+        "revision" : "48f07f24891155a14c51dd835bba7371bdf32d0e"
       }
     },
     {
 
@@ -18,3 +18,12 @@ struct DiffusionApp: App {
 }
 
 let runningOnMac = ProcessInfo.processInfo.isMacCatalystApp
+let deviceHas6GBOrMore = ProcessInfo.processInfo.physicalMemory > 5924000000   // Threshold is set below a nominal 6 GB because different devices report different amounts, so this is approximate
+
+let deviceSupportsQuantization = {  // The trailing `()` calls the closure, so the constant stores the resulting Bool
+    if #available(iOS 17, *) {  // true on iOS 17 or later
+        true
+    } else {
+        false  // Earlier iOS versions: ModelInfo.MODELS then omits the palettized entries
+    }
+}()
@@ -25,7 +25,7 @@ class Downloader: NSObject, ObservableObject {
 
     private var urlSession: URLSession? = nil
 
-    init(from url: URL, to destination: URL) {
+    init(from url: URL, to destination: URL, using authToken: String? = nil) {
         self.destination = destination
         super.init()
 
@@ -40,7 +40,13 @@ class Downloader: NSObject, ObservableObject {
                 return
             }
             print("Starting download of \(url)")
-            self.urlSession?.downloadTask(with: url).resume()
+            
+            var request = URLRequest(url: url)
+            if let authToken = authToken {
+                request.setValue("Bearer \(authToken)", forHTTPHeaderField: "Authorization")
+            }
+
+            self.urlSession?.downloadTask(with: request).resume()
         }
     }
 
@@ -91,9 +97,13 @@ extension Downloader: URLSessionDelegate, URLSessionDownloadDelegate {
         }
     }
 
-    func urlSession(_: URLSession, task: URLSessionTask, didCompleteWithError error: Error?) {
+    func urlSession(_ session: URLSession, task: URLSessionTask, didCompleteWithError error: Error?) {  // Task-completion callback: records a reported error, otherwise logs the HTTP status
         if let error = error {
             downloadState.value = .failed(error)
+        } else if let response = task.response as? HTTPURLResponse {  // Reached only when no error was reported and the response is HTTP
+            print("HTTP response status code: \(response.statusCode)")  // NOTE(review): the status is only printed; downloadState is not updated here for non-success codes (e.g. a rejected auth token) - confirm this is handled elsewhere
+//            let headers = response.allHeaderFields
+//            print("HTTP response headers: \(headers)")
         }
     }
 }
@@ -11,6 +11,7 @@ import CoreML
 enum AttentionVariant: String {
     case original
     case splitEinsum
+    case splitEinsumV2  // ModelInfo.modelURL(for:) maps this case to splitAttentionV2Suffix
 }
 
 extension AttentionVariant {
@@ -30,15 +31,34 @@ struct ModelInfo {
     /// Suffix of the archive containing the SPLIT_EINSUM attention variant. Usually something like "split_einsum_compiled"
     let splitAttentionSuffix: String
 
+    /// Suffix of the archive containing the SPLIT_EINSUM_V2 attention variant. Usually something like "split_einsum_v2_compiled"
+    let splitAttentionV2Suffix: String
+    
     /// Whether the archive contains the VAE Encoder (for image to image tasks). Not yet in use.
     let supportsEncoder: Bool
-        
-    init(modelId: String, modelVersion: String, originalAttentionSuffix: String = "original_compiled", splitAttentionSuffix: String = "split_einsum_compiled", supportsEncoder: Bool = false) {
+    
+    /// Is attention v2 supported? (Ideally, we should know by looking at the repo contents)
+    let supportsAttentionV2: Bool
+    
+    /// Are weights quantized? This is only used to decide whether to use `reduceMemory`
+    let quantized: Bool
+    
+    // TODO: refactor all these properties
+    init(modelId: String, modelVersion: String,  // Memberwise-style initializer; everything after modelVersion has a default
+         originalAttentionSuffix: String = "original_compiled",
+         splitAttentionSuffix: String = "split_einsum_compiled",
+         splitAttentionV2Suffix: String = "split_einsum_v2_compiled",  // Archive suffix used for the .splitEinsumV2 variant
+         supportsEncoder: Bool = false,
+         supportsAttentionV2: Bool = false,  // Defaults to false, so callers that omit it never select .splitEinsumV2
+         quantized: Bool = false) {  // Defaults to false, so callers that omit it are treated as non-quantized
         self.modelId = modelId
         self.modelVersion = modelVersion
         self.originalAttentionSuffix = originalAttentionSuffix
         self.splitAttentionSuffix = splitAttentionSuffix
+        self.splitAttentionV2Suffix = splitAttentionV2Suffix
         self.supportsEncoder = supportsEncoder
+        self.supportsAttentionV2 = supportsAttentionV2
+        self.quantized = quantized
     }
 }
 
@@ -56,7 +76,10 @@ extension ModelInfo {
 
     static var defaultComputeUnits: MLComputeUnits { defaultAttention.defaultComputeUnits }
 
-    var bestAttention: AttentionVariant { ModelInfo.defaultAttention }
+    var bestAttention: AttentionVariant {  // Attention variant to use for this particular model
+        if !runningOnMac && supportsAttentionV2 { return .splitEinsumV2 }  // V2 is chosen only when not running on Mac and the model is flagged as supporting it
+        return ModelInfo.defaultAttention  // Otherwise fall back to the type-level default
+    }
     var defaultComputeUnits: MLComputeUnits { bestAttention.defaultComputeUnits }
 
     func modelURL(for variant: AttentionVariant) -> URL {
@@ -65,6 +88,7 @@ extension ModelInfo {
         switch variant {
         case .original: suffix = originalAttentionSuffix
         case .splitEinsum: suffix = splitAttentionSuffix
+        case .splitEinsumV2: suffix = splitAttentionV2Suffix
         }
         let repo = modelId.split(separator: "/").last!
         return URL(string: "https://huggingface.co/\(modelId)/resolve/main/\(repo)_\(suffix).zip")!
@@ -73,47 +97,97 @@ extension ModelInfo {
     /// Best variant for the current platform.
     /// Currently using `split_einsum` for iOS and simple performance heuristics for macOS.
     var bestURL: URL { modelURL(for: bestAttention) }
-        
+    
     var reduceMemory: Bool {
-        return !runningOnMac
+        // Enabled whenever not running on Mac, except for a quantized model on a device with 6 GB or more
+        if runningOnMac { return false }  // Never enabled when running on Mac
+        return !(quantized && deviceHas6GBOrMore)  // Disabled only when BOTH hold; a quantized model on a smaller device still gets reduceMemory
     }
 }
 
 extension ModelInfo {
-    // TODO: repo does not exist yet
     static let v14Base = ModelInfo(
         modelId: "pcuenq/coreml-stable-diffusion-1-4",
-        modelVersion: "CompVis/stable-diffusion-v1-4"
+        modelVersion: "CompVis SD 1.4"  // ModelInfo.from(modelVersion:) matches on this exact string
+    )
+
+    static let v14Palettized = ModelInfo(  // Entry for the "-palettized" repo; listed in MODELS only when deviceSupportsQuantization is true
+        modelId: "apple/coreml-stable-diffusion-1-4-palettized",
+        modelVersion: "CompVis SD 1.4 [6 bit]",
+        supportsEncoder: true,
+        supportsAttentionV2: true,  // Makes bestAttention return .splitEinsumV2 when runningOnMac is false
+        quantized: true  // Read by reduceMemory together with deviceHas6GBOrMore
     )
 
     static let v15Base = ModelInfo(
         modelId: "pcuenq/coreml-stable-diffusion-v1-5",
-        modelVersion: "runwayml/stable-diffusion-v1-5"
+        modelVersion: "RunwayML SD 1.5"  // ModelInfo.from(modelVersion:) matches on this exact string
+    )
+    
+    static let v15Palettized = ModelInfo(  // Entry for the "-palettized" repo; listed in MODELS only when deviceSupportsQuantization is true
+        modelId: "apple/coreml-stable-diffusion-v1-5-palettized",
+        modelVersion: "RunwayML SD 1.5 [6 bit]",
+        supportsEncoder: true,
+        supportsAttentionV2: true,  // Makes bestAttention return .splitEinsumV2 when runningOnMac is false
+        quantized: true  // Read by reduceMemory together with deviceHas6GBOrMore
     )
 
     static let v2Base = ModelInfo(
         modelId: "pcuenq/coreml-stable-diffusion-2-base",
-        modelVersion: "stabilityai/stable-diffusion-2-base"
+        modelVersion: "StabilityAI SD 2.0",  // ModelInfo.from(modelVersion:) matches on this exact string
+        supportsEncoder: true  // This change also turns the encoder flag on for the base 2.0 entry
+    )
+    
+    static let v2Palettized = ModelInfo(  // Entry for the "-palettized" repo; listed in MODELS only when deviceSupportsQuantization is true
+        modelId: "apple/coreml-stable-diffusion-2-base-palettized",
+        modelVersion: "StabilityAI SD 2.0 [6 bit]",
+        supportsEncoder: true,
+        supportsAttentionV2: true,  // Makes bestAttention return .splitEinsumV2 when runningOnMac is false
+        quantized: true  // Read by reduceMemory together with deviceHas6GBOrMore
     )
 
     static let v21Base = ModelInfo(
         modelId: "pcuenq/coreml-stable-diffusion-2-1-base",
-        modelVersion: "stabilityai/stable-diffusion-2-1-base",
+        modelVersion: "StabilityAI SD 2.1",  // ModelInfo.from(modelVersion:) matches on this exact string
         supportsEncoder: true
     )
 
+    static let v21Palettized = ModelInfo(  // Entry for the "-palettized" repo; listed in MODELS only when deviceSupportsQuantization is true
+        modelId: "apple/coreml-stable-diffusion-2-1-base-palettized",
+        modelVersion: "StabilityAI SD 2.1 [6 bit]",
+        supportsEncoder: true,
+        supportsAttentionV2: true,  // Makes bestAttention return .splitEinsumV2 when runningOnMac is false
+        quantized: true  // Read by reduceMemory together with deviceHas6GBOrMore
+    )
+        
     static let ofaSmall = ModelInfo(
         modelId: "pcuenq/coreml-small-stable-diffusion-v0",
         modelVersion: "OFA-Sys/small-stable-diffusion-v0"
     )
-
-    static let MODELS = [
-        ModelInfo.v14Base,
-        ModelInfo.v15Base,
-        ModelInfo.v2Base,
-        ModelInfo.v21Base,
-        ModelInfo.ofaSmall
-    ]
+    
+    static let MODELS: [ModelInfo] = {  // Built by a closure that is called immediately; the list depends on deviceSupportsQuantization
+        if deviceSupportsQuantization {  // Quantization available: each base model is followed by its palettized entry
+            return [
+                ModelInfo.v14Base,
+                ModelInfo.v14Palettized,
+                ModelInfo.v15Base,
+                ModelInfo.v15Palettized,
+                ModelInfo.v2Base,
+                ModelInfo.v2Palettized,
+                ModelInfo.v21Base,
+                ModelInfo.v21Palettized,
+                ModelInfo.ofaSmall  // No palettized counterpart is declared for this entry
+            ]
+        } else {  // No quantization support: same five entries as the previous fixed list
+            return [
+                ModelInfo.v14Base,
+                ModelInfo.v15Base,
+                ModelInfo.v2Base,
+                ModelInfo.v21Base,
+                ModelInfo.ofaSmall
+            ]
+        }
+    }()
 
     static func from(modelVersion: String) -> ModelInfo? {
         ModelInfo.MODELS.first(where: {$0.modelVersion == modelVersion})
Original file line number	Diff line number	Diff line change
`@@ -15,7 +15,7 @@`
`15`	`15`	`"location" : "https://github.com/apple/ml-stable-diffusion",`
`16`	`16`	`"state" : {`
`17`	`17`	`"branch" : "main",`
`18`		`- "revision" : "fb1fa01c9d30e9b2e02a8b7ed35d905e272a0262"`
	`18`	`+ "revision" : "48f07f24891155a14c51dd835bba7371bdf32d0e"`
`19`	`19`	`}`
`20`	`20`	`},`
`21`	`21`	`{`
Original file line number	Diff line number	Diff line change
`@@ -25,7 +25,7 @@ class Downloader: NSObject, ObservableObject {`
`25`	`25`
`26`	`26`	`private var urlSession: URLSession? = nil`
`27`	`27`
`28`		`- init(from url: URL, to destination: URL) {`
	`28`	`+ init(from url: URL, to destination: URL, using authToken: String? = nil) {`
`29`	`29`	`self.destination = destination`
`30`	`30`	`super.init()`
`31`	`31`
`@@ -40,7 +40,13 @@ class Downloader: NSObject, ObservableObject {`
`40`	`40`	`return`
`41`	`41`	`}`
`42`	`42`	`print("Starting download of \(url)")`
`43`		`- self.urlSession?.downloadTask(with: url).resume()`
	`43`	`+`
	`44`	`+ var request = URLRequest(url: url)`
	`45`	`+ if let authToken = authToken {`
	`46`	`+ request.setValue("Bearer \(authToken)", forHTTPHeaderField: "Authorization")`
	`47`	`+ }`
	`48`	`+`
	`49`	`+ self.urlSession?.downloadTask(with: request).resume()`
`44`	`50`	`}`
`45`	`51`	`}`
`46`	`52`
`@@ -91,9 +97,13 @@ extension Downloader: URLSessionDelegate, URLSessionDownloadDelegate {`
`91`	`97`	`}`
`92`	`98`	`}`
`93`	`99`
`94`		`- func urlSession(_: URLSession, task: URLSessionTask, didCompleteWithError error: Error?) {`
	`100`	`+ func urlSession(_ session: URLSession, task: URLSessionTask, didCompleteWithError error: Error?) {`
`95`	`101`	`if let error = error {`
`96`	`102`	`downloadState.value = .failed(error)`
	`103`	`+ } else if let response = task.response as? HTTPURLResponse {`
	`104`	`+ print("HTTP response status code: \(response.statusCode)")`
	`105`	`+// let headers = response.allHeaderFields`
	`106`	`+// print("HTTP response headers: \(headers)")`
`97`	`107`	`}`
`98`	`108`	`}`
`99`	`109`	`}`