Spaces:

natasa365
/

whisper.cpp

Sleeping

App Files Files Community

whisper.cpp / examples /whisper.swiftui /whisper.cpp.swift /LibWhisper.swift

ggerganov

ci : disable Obj-C build + fixes

3859606 about 1 year ago

raw

history blame

5.28 kB

	import Foundation
	import UIKit
	import whisper

	enum WhisperError: Error {
	case couldNotInitializeContext
	}

	// Meet Whisper C++ constraint: Don't access from more than one thread at a time.
	actor WhisperContext {
	private var context: OpaquePointer

	init(context: OpaquePointer) {
	self.context = context
	}

	deinit {
	whisper_free(context)
	}

	func fullTranscribe(samples: [Float]) {
	// Leave 2 processors free (i.e. the high-efficiency cores).
	let maxThreads = max(1, min(8, cpuCount() - 2))
	print("Selecting \(maxThreads) threads")
	var params = whisper_full_default_params(WHISPER_SAMPLING_GREEDY)
	"en".withCString { en in
	// Adapted from whisper.objc
	params.print_realtime = true
	params.print_progress = false
	params.print_timestamps = true
	params.print_special = false
	params.translate = false
	params.language = en
	params.n_threads = Int32(maxThreads)
	params.offset_ms = 0
	params.no_context = true
	params.single_segment = false

	whisper_reset_timings(context)
	print("About to run whisper_full")
	samples.withUnsafeBufferPointer { samples in
	if (whisper_full(context, params, samples.baseAddress, Int32(samples.count)) != 0) {
	print("Failed to run the model")
	} else {
	whisper_print_timings(context)
	}
	}
	}
	}

	func getTranscription() -> String {
	var transcription = ""
	for i in 0..<whisper_full_n_segments(context) {
	transcription += String.init(cString: whisper_full_get_segment_text(context, i))
	}
	return transcription
	}

	static func benchMemcpy(nThreads: Int32) async -> String {
	return String.init(cString: whisper_bench_memcpy_str(nThreads))
	}

	static func benchGgmlMulMat(nThreads: Int32) async -> String {
	return String.init(cString: whisper_bench_ggml_mul_mat_str(nThreads))
	}

	private func systemInfo() -> String {
	var info = ""
	//if (ggml_cpu_has_neon() != 0) { info += "NEON " }
	return String(info.dropLast())
	}

	func benchFull(modelName: String, nThreads: Int32) async -> String {
	let nMels = whisper_model_n_mels(context)
	if (whisper_set_mel(context, nil, 0, nMels) != 0) {
	return "error: failed to set mel"
	}

	// heat encoder
	if (whisper_encode(context, 0, nThreads) != 0) {
	return "error: failed to encode"
	}

	var tokens = [whisper_token](repeating: 0, count: 512)

	// prompt heat
	if (whisper_decode(context, &tokens, 256, 0, nThreads) != 0) {
	return "error: failed to decode"
	}

	// text-generation heat
	if (whisper_decode(context, &tokens, 1, 256, nThreads) != 0) {
	return "error: failed to decode"
	}

	whisper_reset_timings(context)

	// actual run
	if (whisper_encode(context, 0, nThreads) != 0) {
	return "error: failed to encode"
	}

	// text-generation
	for i in 0..<256 {
	if (whisper_decode(context, &tokens, 1, Int32(i), nThreads) != 0) {
	return "error: failed to decode"
	}
	}

	// batched decoding
	for _ in 0..<64 {
	if (whisper_decode(context, &tokens, 5, 0, nThreads) != 0) {
	return "error: failed to decode"
	}
	}

	// prompt processing
	for _ in 0..<16 {
	if (whisper_decode(context, &tokens, 256, 0, nThreads) != 0) {
	return "error: failed to decode"
	}
	}

	whisper_print_timings(context)

	let deviceModel = await UIDevice.current.model
	let systemName = await UIDevice.current.systemName
	let systemInfo = self.systemInfo()
	let timings: whisper_timings = whisper_get_timings(context).pointee
	let encodeMs = String(format: "%.2f", timings.encode_ms)
	let decodeMs = String(format: "%.2f", timings.decode_ms)
	let batchdMs = String(format: "%.2f", timings.batchd_ms)
	let promptMs = String(format: "%.2f", timings.prompt_ms)
	return "\| \(deviceModel) \| \(systemName) \| \(systemInfo) \| \(modelName) \| \(nThreads) \| 1 \| \(encodeMs) \| \(decodeMs) \| \(batchdMs) \| \(promptMs) \| <todo> \|"
	}

	static func createContext(path: String) throws -> WhisperContext {
	var params = whisper_context_default_params()
	#if targetEnvironment(simulator)
	params.use_gpu = false
	print("Running on the simulator, using CPU")
	#else
	params.flash_attn = true // Enabled by default for Metal
	#endif
	let context = whisper_init_from_file_with_params(path, params)
	if let context {
	return WhisperContext(context: context)
	} else {
	print("Couldn't load model at \(path)")
	throw WhisperError.couldNotInitializeContext
	}
	}
	}

	fileprivate func cpuCount() -> Int {
	ProcessInfo.processInfo.processorCount
	}