ListenerApp/ListenerGS/SpeechForwarder.swift

//
//  SpeechForwarder.swift
//  ListenerGS
//
//  Created by Jeremy Rand on 2021-10-18.
//

import Foundation
import os
import Speech

/// Captures microphone audio, feeds it to the Speech framework and forwards
/// the recognized text to a `GSConnection`.
///
/// Results and stop requests are delivered to the connection on the main
/// operation queue.
class SpeechForwarder : SpeechForwarderProtocol {
    
    /// Failures raised while setting up a recognition session.
    private enum SpeechForwarderError: Error {
        /// No speech recognizer could be created for the user's locale.
        case recognizerUnavailable
    }
    
    /// Recognizer for the user's first preferred language, or `nil` when the
    /// Speech framework cannot provide one (the initializers are failable).
    private let speechRecognizer: SFSpeechRecognizer? = {
        guard let language = Locale.preferredLanguages.first else {
            // No preferred language listed; fall back to the default recognizer.
            return SFSpeechRecognizer()
        }
        return SFSpeechRecognizer(locale: Locale(identifier: language))
    }()
    
    /// The request currently receiving audio buffers, if a session is active.
    private var recognitionRequest: SFSpeechAudioBufferRecognitionRequest?
    
    /// The running recognition task; kept so that it can be cancelled.
    private var recognitionTask: SFSpeechRecognitionTask?
    
    private let audioEngine = AVAudioEngine()
    
    private let logger = Logger()
    
    /// Requests speech recognition authorization and starts recording.
    ///
    /// Recording is started immediately, without waiting for the authorization
    /// callback. If authorization turns out not to be granted, the connection
    /// is asked to stop listening from the main queue.
    ///
    /// - Parameter connection: Receives recognized text and stop requests.
    /// - Returns: `true` if recording started, `false` if setup failed.
    func startListening(connection : GSConnection) -> Bool {
        SFSpeechRecognizer.requestAuthorization { authStatus in
            OperationQueue.main.addOperation {
                switch authStatus {
                case .authorized:
                    break
                    
                case .denied, .restricted, .notDetermined:
                    connection.stopListening()
                    
                @unknown default:
                    // Treat statuses added by future SDKs as "not authorized".
                    connection.stopListening()
                }
            }
        }
        
        do {
            try startRecording(connection: connection)
            logger.debug("Started listening")
        }
        catch {
            logger.error("Unable to start listening: \(String(describing: error))")
            return false
        }
        return true
    }
    
    /// Ends the current recognition session and releases its resources.
    func stopListening() {
        logger.debug("Stopped listening")
        recognitionRequest?.endAudio()
        audioEngine.stop()
        audioEngine.inputNode.removeTap(onBus: 0)
        recognitionTask?.cancel()

        recognitionRequest = nil
        recognitionTask = nil
    }
    
    /// Configures the audio session, installs the microphone tap, creates the
    /// recognition task and starts the audio engine.
    ///
    /// - Parameter connection: Receives recognized text and stop requests.
    /// - Throws: `SpeechForwarderError.recognizerUnavailable` when there is no
    ///   recognizer, or any error raised by the audio session or audio engine.
    ///   When the engine fails to start, the tap, task and request created
    ///   here are torn down again before the error is rethrown.
    private func startRecording(connection : GSConnection) throws {
        guard let speechRecognizer = speechRecognizer else {
            throw SpeechForwarderError.recognizerUnavailable
        }
        
        // Cancel the previous task if it's running.
        recognitionTask?.cancel()
        recognitionTask = nil
        
        // Configure the audio session for the app.
        let audioSession = AVAudioSession.sharedInstance()
        try audioSession.setCategory(.record, mode: .measurement, options: .duckOthers)
        try audioSession.setActive(true, options: .notifyOthersOnDeactivation)
        let inputNode = audioEngine.inputNode
        
        // Create and configure the speech recognition request.
        let request = SFSpeechAudioBufferRecognitionRequest()
        request.shouldReportPartialResults = true
        request.requiresOnDeviceRecognition = false
        recognitionRequest = request
        
        // Configure the microphone input. Only one tap may be installed on a
        // bus, so drop any tap left over from an earlier session first.
        inputNode.removeTap(onBus: 0)
        let recordingFormat = inputNode.outputFormat(forBus: 0)
        inputNode.installTap(onBus: 0, bufferSize: 1024, format: recordingFormat) { [weak self] (buffer: AVAudioPCMBuffer, when: AVAudioTime) in
            // Weak capture: self owns the engine, which holds this closure.
            self?.recognitionRequest?.append(buffer)
        }
        
        // Create a recognition task for the speech recognition session.
        // Keep a reference to the task so that it can be canceled.
        // The handler captures a copy of the logger rather than self, so the
        // task (owned by self) does not keep self alive.
        let logger = self.logger
        recognitionTask = speechRecognizer.recognitionTask(with: request) { result, error in
            var isFinal = false
            
            if let result = result {
                // Forward the latest transcription to the connection.
                let text = result.bestTranscription.formattedString
                OperationQueue.main.addOperation { connection.set(text: text) }
                isFinal = result.isFinal
            }
            
            if let error = error {
                logger.error("Error from recognizer: \(String(describing: error))")
            }
            
            if error != nil || isFinal {
                OperationQueue.main.addOperation {
                    connection.stopListening()
                }
            }
        }
        
        audioEngine.prepare()
        do {
            try audioEngine.start()
        }
        catch {
            // Undo the partial setup so that a later attempt starts clean.
            inputNode.removeTap(onBus: 0)
            recognitionTask?.cancel()
            recognitionTask = nil
            recognitionRequest = nil
            throw error
        }
    }
}
Move application logic out of view code. 2021-10-19 04:55:58 +00:00			`//`
			`// SpeechForwarder.swift`
			`// ListenerGS`
			`//`
			`// Created by Jeremy Rand on 2021-10-18.`
			`//`

			`import Foundation`
Connect up the speech forwarder to the new UI. 2022-01-12 04:30:41 +00:00			`import os`
Move application logic out of view code. 2021-10-19 04:55:58 +00:00			`import Speech`

A fairly big rework of the code to split the network handling code from the speech handling code. Also, introduce a thread for reading from the socket and a separate thread for writing to the socket. That way, disconnections made by the NDA are handled correctly. 2022-03-16 03:58:04 +00:00			`class SpeechForwarder : SpeechForwarderProtocol {`
Move application logic out of view code. 2021-10-19 04:55:58 +00:00
Fix button appearance in dark mode. Add the heard text the UI below the buttons. Convert to MacOS Roman character set so words like "resume" appear with the correct accents on the GS. 2022-01-19 03:51:28 +00:00			`private let speechRecognizer = SFSpeechRecognizer(locale: Locale(identifier: Locale.preferredLanguages[0]))!`
Move application logic out of view code. 2021-10-19 04:55:58 +00:00
			`private var recognitionRequest: SFSpeechAudioBufferRecognitionRequest?`

			`private var recognitionTask: SFSpeechRecognitionTask?`

			`private let audioEngine = AVAudioEngine()`

Connect up the speech forwarder to the new UI. 2022-01-12 04:30:41 +00:00			`private let logger = Logger()`
Move application logic out of view code. 2021-10-19 04:55:58 +00:00
Major rework of the network code, splitting out the speech recognition aspects and creating separate threads for read and write. This improves handling of network connection closure by the other end and other network connectivity errors. Add some unit tests for the connection code. 2022-03-16 22:13:56 +00:00			`func startListening(connection : GSConnection) -> Bool {`
A fairly big rework of the code to split the network handling code from the speech handling code. Also, introduce a thread for reading from the socket and a separate thread for writing to the socket. That way, disconnections made by the NDA are handled correctly. 2022-03-16 03:58:04 +00:00			`SFSpeechRecognizer.requestAuthorization { authStatus in`
			`OperationQueue.main.addOperation {`
			`switch authStatus {`
			`case .authorized:`
Move application logic out of view code. 2021-10-19 04:55:58 +00:00			`break`
A fairly big rework of the code to split the network handling code from the speech handling code. Also, introduce a thread for reading from the socket and a separate thread for writing to the socket. That way, disconnections made by the NDA are handled correctly. 2022-03-16 03:58:04 +00:00
			`case .denied, .restricted, .notDetermined:`
Major rework of the network code, splitting out the speech recognition aspects and creating separate threads for read and write. This improves handling of network connection closure by the other end and other network connectivity errors. Add some unit tests for the connection code. 2022-03-16 22:13:56 +00:00			`connection.stopListening()`
A fairly big rework of the code to split the network handling code from the speech handling code. Also, introduce a thread for reading from the socket and a separate thread for writing to the socket. That way, disconnections made by the NDA are handled correctly. 2022-03-16 03:58:04 +00:00
			`default:`
Major rework of the network code, splitting out the speech recognition aspects and creating separate threads for read and write. This improves handling of network connection closure by the other end and other network connectivity errors. Add some unit tests for the connection code. 2022-03-16 22:13:56 +00:00			`connection.stopListening()`
Add code to pace the text to the GS to reduce the amount of re-typing required. 2022-02-23 04:52:00 +00:00			`}`
Move application logic out of view code. 2021-10-19 04:55:58 +00:00			`}`
			`}`
A fairly big rework of the code to split the network handling code from the speech handling code. Also, introduce a thread for reading from the socket and a separate thread for writing to the socket. That way, disconnections made by the NDA are handled correctly. 2022-03-16 03:58:04 +00:00
			`do {`
Major rework of the network code, splitting out the speech recognition aspects and creating separate threads for read and write. This improves handling of network connection closure by the other end and other network connectivity errors. Add some unit tests for the connection code. 2022-03-16 22:13:56 +00:00			`try startRecording(connection: connection)`
A fairly big rework of the code to split the network handling code from the speech handling code. Also, introduce a thread for reading from the socket and a separate thread for writing to the socket. That way, disconnections made by the NDA are handled correctly. 2022-03-16 03:58:04 +00:00			`logger.debug("Started listening")`
Move application logic out of view code. 2021-10-19 04:55:58 +00:00			`}`
A fairly big rework of the code to split the network handling code from the speech handling code. Also, introduce a thread for reading from the socket and a separate thread for writing to the socket. That way, disconnections made by the NDA are handled correctly. 2022-03-16 03:58:04 +00:00			`catch {`
Add code to pace the text to the GS to reduce the amount of re-typing required. 2022-02-23 04:52:00 +00:00			`return false`
			`}`
			`return true`
Move application logic out of view code. 2021-10-19 04:55:58 +00:00			`}`

A fairly big rework of the code to split the network handling code from the speech handling code. Also, introduce a thread for reading from the socket and a separate thread for writing to the socket. That way, disconnections made by the NDA are handled correctly. 2022-03-16 03:58:04 +00:00			`func stopListening() {`
			`logger.debug("Stopped listening")`
			`recognitionRequest?.endAudio()`
			`audioEngine.stop()`
			`audioEngine.inputNode.removeTap(onBus: 0)`
			`recognitionTask?.cancel()`

			`recognitionRequest = nil`
			`recognitionTask = nil`
			`}`

Major rework of the network code, splitting out the speech recognition aspects and creating separate threads for read and write. This improves handling of network connection closure by the other end and other network connectivity errors. Add some unit tests for the connection code. 2022-03-16 22:13:56 +00:00			`private func startRecording(connection : GSConnection) throws {`
Move application logic out of view code. 2021-10-19 04:55:58 +00:00
			`// Cancel the previous task if it's running.`
			`recognitionTask?.cancel()`
			`self.recognitionTask = nil`

			`// Configure the audio session for the app.`
			`let audioSession = AVAudioSession.sharedInstance()`
			`try audioSession.setCategory(.record, mode: .measurement, options: .duckOthers)`
			`try audioSession.setActive(true, options: .notifyOthersOnDeactivation)`
			`let inputNode = audioEngine.inputNode`
Some minor tweaks to try to get speech recognition working from MacOS. It is still not working from my x86 iMac but I just tested this on our new M1 MacBook Air and it does work there. Not sure what the difference is and hope it is just a problem on my iMac. 2022-02-22 04:22:58 +00:00
			`// Configure the microphone input.`
			`let recordingFormat = inputNode.outputFormat(forBus: 0)`
			`inputNode.installTap(onBus: 0, bufferSize: 1024, format: recordingFormat) { (buffer: AVAudioPCMBuffer, when: AVAudioTime) in`
			`self.recognitionRequest?.append(buffer)`
			`}`
Move application logic out of view code. 2021-10-19 04:55:58 +00:00
			`// Create and configure the speech recognition request.`
			`recognitionRequest = SFSpeechAudioBufferRecognitionRequest()`
			`guard let recognitionRequest = recognitionRequest else { fatalError("Unable to create a SFSpeechAudioBufferRecognitionRequest object") }`
			`recognitionRequest.shouldReportPartialResults = true`
Final changes before starting beta testing. 2022-03-09 04:05:23 +00:00			`recognitionRequest.requiresOnDeviceRecognition = false`
Move application logic out of view code. 2021-10-19 04:55:58 +00:00
			`// Create a recognition task for the speech recognition session.`
			`// Keep a reference to the task so that it can be canceled.`
			`recognitionTask = speechRecognizer.recognitionTask(with: recognitionRequest) { result, error in`
			`var isFinal = false`

			`if let result = result {`
			`// Update the text view with the results.`
Major rework of the network code, splitting out the speech recognition aspects and creating separate threads for read and write. This improves handling of network connection closure by the other end and other network connectivity errors. Add some unit tests for the connection code. 2022-03-16 22:13:56 +00:00			`OperationQueue.main.addOperation { connection.set(text: result.bestTranscription.formattedString) }`
Move application logic out of view code. 2021-10-19 04:55:58 +00:00			`isFinal = result.isFinal`
			`}`

Some minor tweaks to try to get speech recognition working from MacOS. It is still not working from my x86 iMac but I just tested this on our new M1 MacBook Air and it does work there. Not sure what the difference is and hope it is just a problem on my iMac. 2022-02-22 04:22:58 +00:00			`if error != nil {`
			`self.logger.error("Error from recognizer: \(String(describing: error))")`
			`}`

Move application logic out of view code. 2021-10-19 04:55:58 +00:00			`if error != nil \|\| isFinal {`
Add code to pace the text to the GS to reduce the amount of re-typing required. 2022-02-23 04:52:00 +00:00			`OperationQueue.main.addOperation {`
Major rework of the network code, splitting out the speech recognition aspects and creating separate threads for read and write. This improves handling of network connection closure by the other end and other network connectivity errors. Add some unit tests for the connection code. 2022-03-16 22:13:56 +00:00			`connection.stopListening()`
Connect up the speech forwarder to the new UI. 2022-01-12 04:30:41 +00:00			`}`
Move application logic out of view code. 2021-10-19 04:55:58 +00:00			`}`
			`}`

			`audioEngine.prepare()`
			`try audioEngine.start()`
			`}`
			`}`