import Foundation
import UIKit
import whisper

enum WhisperError: Error {
    case couldNotInitializeContext
}

// Meet the Whisper C++ constraint: don't access a context from more than one thread at a time.
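/// Illustrative usage (a sketch; it assumes `modelPath` points at a valid ggml model
/// and `samples` holds 16 kHz mono PCM):
///
///     let whisperContext = try WhisperContext.createContext(path: modelPath)
///     await whisperContext.fullTranscribe(samples: samples)
///     let text = await whisperContext.getTranscription()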
actor WhisperContext {
    private var context: OpaquePointer

    init(context: OpaquePointer) {
        self.context = context
    }

    deinit {
        whisper_free(context)
    }
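
    /// Runs the full whisper pipeline (encode + decode) over `samples`, which whisper.cpp
    /// expects to be 16 kHz mono float PCM. Read the result with `getTranscription()`
    /// once this returns.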
    func fullTranscribe(samples: [Float]) {
        // Leave 2 processors free (i.e. the high-efficiency cores).
        let maxThreads = max(1, min(8, cpuCount() - 2))
        print("Selecting \(maxThreads) threads")
        var params = whisper_full_default_params(WHISPER_SAMPLING_GREEDY)
        "en".withCString { en in
            // Adapted from whisper.objc
            params.print_realtime   = true
            params.print_progress   = false
            params.print_timestamps = true
            params.print_special    = false
            params.translate        = false
            params.language         = en
            params.n_threads        = Int32(maxThreads)
            params.offset_ms        = 0
            params.no_context       = true
            params.single_segment   = false
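
            // Note (per the parameter comments in whisper.h): `no_context` keeps past
            // transcription out of the decoder prompt, and leaving `single_segment`
            // false lets longer audio be split into multiple segments.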
            whisper_reset_timings(context)
            print("About to run whisper_full")
            samples.withUnsafeBufferPointer { samples in
                if (whisper_full(context, params, samples.baseAddress, Int32(samples.count)) != 0) {
                    print("Failed to run the model")
                } else {
                    whisper_print_timings(context)
                }
            }
        }
    }
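
    /// Concatenates the text of all segments produced by the last `fullTranscribe` call.
    /// A possible extension (sketch): whisper.h also exposes per-segment timestamps, in
    /// units of 10 ms, via
    ///
    ///     let t0 = whisper_full_get_segment_t0(context, i)
    ///     let t1 = whisper_full_get_segment_t1(context, i)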
    func getTranscription() -> String {
        var transcription = ""
        for i in 0..<whisper_full_n_segments(context) {
            transcription += String.init(cString: whisper_full_get_segment_text(context, i))
        }
        return transcription
    }
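
    /// Wraps whisper.cpp's built-in memcpy benchmark and returns its report as a string.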
    static func benchMemcpy(nThreads: Int32) async -> String {
        return String.init(cString: whisper_bench_memcpy_str(nThreads))
    }
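
    /// Wraps whisper.cpp's built-in ggml matrix-multiplication benchmark.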
    static func benchGgmlMulMat(nThreads: Int32) async -> String {
        return String.init(cString: whisper_bench_ggml_mul_mat_str(nThreads))
    }
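
    /// Reports CPU features relevant to ggml (only NEON is probed here).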
    private func systemInfo() -> String {
        var info = ""
        if (ggml_cpu_has_neon() != 0) { info += "NEON " }
        return String(info.dropLast())
    }
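
    /// Benchmarks the loaded model: after warm-up passes it times one encoder run,
    /// 256 single-token decodes (text generation), 64 batched decodes of 5 tokens,
    /// and 16 decodes of a 256-token prompt, then returns a single markdown table row
    /// in the format used for whisper.cpp benchmark results.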
    func benchFull(modelName: String, nThreads: Int32) async -> String {
        let nMels = whisper_model_n_mels(context)
        if (whisper_set_mel(context, nil, 0, nMels) != 0) {
            return "error: failed to set mel"
        }

        // warm up the encoder
        if (whisper_encode(context, 0, nThreads) != 0) {
            return "error: failed to encode"
        }

        var tokens = [whisper_token](repeating: 0, count: 512)

        // warm up: prompt decoding
        if (whisper_decode(context, &tokens, 256, 0, nThreads) != 0) {
            return "error: failed to decode"
        }

        // warm up: text generation
        if (whisper_decode(context, &tokens, 1, 256, nThreads) != 0) {
            return "error: failed to decode"
        }

        whisper_reset_timings(context)

        // actual run
        if (whisper_encode(context, 0, nThreads) != 0) {
            return "error: failed to encode"
        }
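
        // whisper_decode(ctx, tokens, n_tokens, n_past, n_threads): the three loops below
        // exercise single-token decoding, batched decoding of 5 tokens, and 256-token
        // prompt processing, which feed the decode/batchd/prompt timings reported below.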
        // text-generation
        for i in 0..<256 {
            if (whisper_decode(context, &tokens, 1, Int32(i), nThreads) != 0) {
                return "error: failed to decode"
            }
        }

        // batched decoding
        for _ in 0..<64 {
            if (whisper_decode(context, &tokens, 5, 0, nThreads) != 0) {
                return "error: failed to decode"
            }
        }

        // prompt processing
        for _ in 0..<16 {
            if (whisper_decode(context, &tokens, 256, 0, nThreads) != 0) {
                return "error: failed to decode"
            }
        }

        whisper_print_timings(context)

        let deviceModel = await UIDevice.current.model
        let systemName = await UIDevice.current.systemName
        let systemInfo = self.systemInfo()
        let timings: whisper_timings = whisper_get_timings(context).pointee
        let encodeMs = String(format: "%.2f", timings.encode_ms)
        let decodeMs = String(format: "%.2f", timings.decode_ms)
        let batchdMs = String(format: "%.2f", timings.batchd_ms)
        let promptMs = String(format: "%.2f", timings.prompt_ms)
        return "| \(deviceModel) | \(systemName) | \(systemInfo) | \(modelName) | \(nThreads) | 1 | \(encodeMs) | \(decodeMs) | \(batchdMs) | \(promptMs) | <todo> |"
    }
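
    /// Loads a ggml model from `path` and wraps it in a `WhisperContext`, throwing
    /// `WhisperError.couldNotInitializeContext` if the model cannot be loaded.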
    static func createContext(path: String) throws -> WhisperContext {
        var params = whisper_context_default_params()
#if targetEnvironment(simulator)
        params.use_gpu = false
        print("Running on the simulator, using CPU")
#else
        params.flash_attn = true // Enabled by default for Metal
#endif
        let context = whisper_init_from_file_with_params(path, params)
        if let context {
            return WhisperContext(context: context)
        } else {
            print("Couldn't load model at \(path)")
            throw WhisperError.couldNotInitializeContext
        }
    }
}
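
/// Total logical core count, including the efficiency cores that `fullTranscribe`
/// deliberately leaves free.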
fileprivate func cpuCount() -> Int {
    ProcessInfo.processInfo.processorCount
}