[Swift Heroes '24] Delightful on-device AI experiences

Currently, numerous APIs allow developers to run Stable Diffusion models on the server and integrate AI into their apps by making network requests.

While these APIs are great, they can become costly at scale and rule out offline-first applications. In this session, I discuss a feature I have been building for my app QReate that uses Stable Diffusion to generate art-like QR codes entirely on-device with CoreML.

Pol Piella Abadia

April 20, 2024

Transcript

  1. A neon drawing of an astronaut floating in space, digital art by Mór Than,
     unsplash contest winner, space art, sci-fi, retrowave, synthwave
  2. #2

  3. git clone https://github.com/apple/ml-stable-diffusion.git
     cd ml-stable-diffusion
     python3 -m venv venv
     source venv/bin/activate
     pip install -e .
     python -m python_coreml_stable_diffusion.torch2coreml \
       --bundle-resources-for-swift-cli \
       --attention-implementation SPLIT_EINSUM_V2 \
       --convert-unet \
       --convert-text-encoder \
       --convert-vae-decoder \
       --convert-vae-encoder \
       --model-version runwayml/stable-diffusion-v1-5 \
       --unet-support-controlnet \
       --convert-controlnet DionTimmer/controlnet_qrcode-control_v1p_sd15 \
       -o generated
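
The conversion step above writes the compiled CoreML models into the generated output folder. A minimal sketch of copying them into the Swift package created next; the exact source and destination paths are assumptions based on the -o generated flag and the .process("Resources") declaration later in the deck:

     cp -r generated/Resources \
       StableDiffusionControlNet/Sources/StableDiffusionControlNet/Resources
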
  4. // swift-tools-version: 5.9
     import PackageDescription

     let package = Package(
         name: "StableDiffusionControlNet",
         platforms: [.macOS(.v14)],
         dependencies: [],
         targets: []
     )

  5. // swift-tools-version: 5.9
     import PackageDescription

     let package = Package(
         name: "StableDiffusionControlNet",
         platforms: [.macOS(.v14)],
         dependencies: [
             .package(url: "https://github.com/apple/ml-stable-diffusion.git", exact: "1.1.0")
         ],
         targets: [
             .executableTarget(
                 name: "StableDiffusionControlNet",
                 dependencies: [.product(name: "StableDiffusion", package: "ml-stable-diffusion")],
                 resources: [.process("Resources")]
             )
         ]
     )
  6. import Foundation
     import AppKit // needed for NSImage; the slide omitted this import
     import StableDiffusion
     import CoreML

     func generate(prompt: String, startingImageURL: URL, numberOfImages: Int) async throws -> [CGImage] {
         // Locate the converted CoreML models bundled with the package.
         guard let resourcesPath = Bundle.module.url(forResource: "Resources", withExtension: nil)?.path() else {
             return []
         }
         let url = URL(fileURLWithPath: resourcesPath)

         // Use every available compute unit (CPU, GPU and Neural Engine).
         let configuration = MLModelConfiguration()
         configuration.computeUnits = .all

         let pipeline = try StableDiffusionPipeline(
             resourcesAt: url,
             controlNet: ["DiontimmerControlnetQrcodeControlV1PSd15"],
             configuration: configuration,
             disableSafety: false,
             reduceMemory: true
         )
         try pipeline.loadResources()

         // Resize the QR code to the 512x512 input the model expects.
         // resized(to:) is a custom NSImage helper not shown in the deck.
         let startingNSImage = NSImage(contentsOf: startingImageURL)?
             .resized(to: .init(width: 512, height: 512))
         guard let startingImage = startingNSImage?.cgImage(forProposedRect: nil, context: nil, hints: nil) else {
             return []
         }

         var pipelineConfig = StableDiffusionPipeline.Configuration(prompt: prompt)
         pipelineConfig.negativePrompt = "ugly, disfigured, low quality, blurry, nsfw"
         pipelineConfig.controlNetInputs = [startingImage]
         pipelineConfig.startingImage = startingImage
         pipelineConfig.useDenoisedIntermediates = true
         pipelineConfig.strength = 0.9
         pipelineConfig.seed = UInt32.random(in: 0..<UInt32.max)
         pipelineConfig.guidanceScale = 7.5
         pipelineConfig.stepCount = 50
         pipelineConfig.originalSize = 512
         pipelineConfig.targetSize = 512
         pipelineConfig.imageCount = numberOfImages

         return try pipeline.generateImages(configuration: pipelineConfig, progressHandler: { _ in true })
             .compactMap { $0 }
     }

  7. // Same pipeline as above, but with reduceMemory set to false: the models
     // stay loaded for the whole run, trading higher peak memory for speed.
     let pipeline = try StableDiffusionPipeline(
         resourcesAt: url,
         controlNet: ["DiontimmerControlnetQrcodeControlV1PSd15"],
         configuration: configuration,
         disableSafety: false,
         reduceMemory: false
     )
  8. let prompt = """
     Style-NebMagic, award winning photo, A Dark-Eyed Junco, sitting Great Basin
     National Park, intricate, nature background, wildlife photography, hyper
     realistic, Style-LostTemple, deep shadow, high contrast, dark, sunrise,
     morning, full moon
     """

     let url = URL(filePath: "/my-qr-code.png")

     let images = try await generate(
         prompt: prompt,
         startingImageURL: url,
         numberOfImages: 1
     )
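
The call returns the generated images as in-memory CGImage values; the deck does not show how they are persisted. A minimal sketch using ImageIO, where writePNG and the output path are hypothetical additions:

     import ImageIO
     import UniformTypeIdentifiers

     // Hypothetical helper: encode a CGImage to disk as a PNG.
     func writePNG(_ image: CGImage, to url: URL) throws {
         guard let destination = CGImageDestinationCreateWithURL(
             url as CFURL, UTType.png.identifier as CFString, 1, nil
         ) else { throw CocoaError(.fileWriteUnknown) }
         CGImageDestinationAddImage(destination, image, nil)
         guard CGImageDestinationFinalize(destination) else {
             throw CocoaError(.fileWriteUnknown)
         }
     }

     for (index, image) in images.enumerated() {
         try writePNG(image, to: URL(filePath: "/generated-qr-\(index).png"))
     }
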
  9. Model from HuggingFace

     let modelURL = URL(string: "https://huggingface.co/:user/:model/resolve/main/:file.zip?download=true")!
     let (location, downloadFileResponse) = try await URLSession.shared.download(from: modelURL)
     guard let httpResponse = downloadFileResponse as? HTTPURLResponse,
           httpResponse.statusCode == 200 else {
         exit(1)
     }
     try FileManager.default.moveItem(
         at: location,
         to: URL.desktopDirectory.appending(component: "model.zip")
     )
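
The archive downloaded above still needs to be unpacked before the pipeline can load the models inside it. A minimal sketch that shells out to the system unzip tool; the destination folder is an assumption:

     // Hypothetical unpacking step: extract model.zip on the Desktop.
     let zipURL = URL.desktopDirectory.appending(component: "model.zip")
     let unzip = Process()
     unzip.executableURL = URL(filePath: "/usr/bin/unzip")
     unzip.arguments = ["-o", zipURL.path, "-d", URL.desktopDirectory.appending(component: "model").path]
     try unzip.run()
     unzip.waitUntilExit()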