diff --git a/VoiceInk/Services/AudioFileTranscriptionManager.swift b/VoiceInk/Services/AudioFileTranscriptionManager.swift index 5b49ba5..c6d32c5 100644 --- a/VoiceInk/Services/AudioFileTranscriptionManager.swift +++ b/VoiceInk/Services/AudioFileTranscriptionManager.swift @@ -111,7 +111,7 @@ class AudioTranscriptionManager: ObservableObject { } let transcriptionDuration = Date().timeIntervalSince(transcriptionStart) - text = WhisperHallucinationFilter.filter(text) + text = TranscriptionOutputFilter.filter(text) text = text.trimmingCharacters(in: .whitespacesAndNewlines) let powerModeManager = PowerModeManager.shared diff --git a/VoiceInk/Services/AudioFileTranscriptionService.swift b/VoiceInk/Services/AudioFileTranscriptionService.swift index 6e6095c..cdc41ab 100644 --- a/VoiceInk/Services/AudioFileTranscriptionService.swift +++ b/VoiceInk/Services/AudioFileTranscriptionService.swift @@ -61,7 +61,7 @@ class AudioTranscriptionService: ObservableObject { } let transcriptionDuration = Date().timeIntervalSince(transcriptionStart) - text = WhisperHallucinationFilter.filter(text) + text = TranscriptionOutputFilter.filter(text) text = text.trimmingCharacters(in: .whitespacesAndNewlines) let powerModeManager = PowerModeManager.shared diff --git a/VoiceInk/Whisper/WhisperHallucinationFilter.swift b/VoiceInk/Services/TranscriptionOutputFilter.swift similarity index 93% rename from VoiceInk/Whisper/WhisperHallucinationFilter.swift rename to VoiceInk/Services/TranscriptionOutputFilter.swift index c9b4c54..71548e5 100644 --- a/VoiceInk/Whisper/WhisperHallucinationFilter.swift +++ b/VoiceInk/Services/TranscriptionOutputFilter.swift @@ -1,8 +1,8 @@ import Foundation import os -struct WhisperHallucinationFilter { - private static let logger = Logger(subsystem: "com.prakashjoshipax.voiceink", category: "WhisperHallucinationFilter") +struct TranscriptionOutputFilter { + private static let logger = Logger(subsystem: "com.prakashjoshipax.voiceink", category: "TranscriptionOutputFilter") private static let hallucinationPatterns = [ #"\[.*?\]"#, // [] @@ -11,7 +11,7 @@ struct WhisperHallucinationFilter { ] private static let fillerWords = [ - "uh", "um", "uhm", "umm", "uhh", "uhhh", "er", "ah", "eh", + "uh", "um", "uhm", "umm", "uhh", "uhhh", "ah", "eh", "hmm", "hm", "mmm", "mm", "mh", "ha", "ehh" ] static func filter(_ text: String) -> String { diff --git a/VoiceInk/Whisper/WhisperState.swift b/VoiceInk/Whisper/WhisperState.swift index 12b9a95..8671b74 100644 --- a/VoiceInk/Whisper/WhisperState.swift +++ b/VoiceInk/Whisper/WhisperState.swift @@ -268,7 +268,7 @@ class WhisperState: NSObject, ObservableObject { let transcriptionStart = Date() var text = try await transcriptionService.transcribe(audioURL: url, model: model) - text = WhisperHallucinationFilter.filter(text) + text = TranscriptionOutputFilter.filter(text) let transcriptionDuration = Date().timeIntervalSince(transcriptionStart) let powerModeManager = PowerModeManager.shared