Rewrote the default prompts to make them simpler and better.

2025-10-29 23:26:43 +05:45 · 2025-10-29 23:26:43 +05:45 · ea0e5d840c
commit ea0e5d840c
parent e7519b4d24
3 changed files with 48 additions and 179 deletions
--- a/VoiceInk.xcodeproj/project.pbxproj
+++ b/VoiceInk.xcodeproj/project.pbxproj
@@ -465,7 +465,7 @@
 				"CODE_SIGN_IDENTITY[sdk=macosx*]" = "Apple Development";
 				CODE_SIGN_STYLE = Automatic;
 				COMBINE_HIDPI_IMAGES = YES;
-				CURRENT_PROJECT_VERSION = 159;
+				CURRENT_PROJECT_VERSION = 160;
 				DEVELOPMENT_ASSET_PATHS = "\"VoiceInk/Preview Content\"";
 				DEVELOPMENT_TEAM = V6J6A3VWY2;
 				ENABLE_HARDENED_RUNTIME = YES;
@@ -480,7 +480,7 @@
 					"@executable_path/../Frameworks",
 				);
 				MACOSX_DEPLOYMENT_TARGET = 14.0;
-				MARKETING_VERSION = 1.59;
+				MARKETING_VERSION = 1.60;
 				PRODUCT_BUNDLE_IDENTIFIER = com.prakashjoshipax.VoiceInk;
 				PRODUCT_NAME = "$(TARGET_NAME)";
 				SWIFT_ACTIVE_COMPILATION_CONDITIONS = "DEBUG ENABLE_NATIVE_SPEECH_ANALYZER $(inherited)";
@@ -499,7 +499,7 @@
 				"CODE_SIGN_IDENTITY[sdk=macosx*]" = "Apple Development";
 				CODE_SIGN_STYLE = Automatic;
 				COMBINE_HIDPI_IMAGES = YES;
-				CURRENT_PROJECT_VERSION = 159;
+				CURRENT_PROJECT_VERSION = 160;
 				DEVELOPMENT_ASSET_PATHS = "\"VoiceInk/Preview Content\"";
 				DEVELOPMENT_TEAM = V6J6A3VWY2;
 				ENABLE_HARDENED_RUNTIME = YES;
@@ -514,7 +514,7 @@
 					"@executable_path/../Frameworks",
 				);
 				MACOSX_DEPLOYMENT_TARGET = 14.0;
-				MARKETING_VERSION = 1.59;
+				MARKETING_VERSION = 1.60;
 				PRODUCT_BUNDLE_IDENTIFIER = com.prakashjoshipax.VoiceInk;
 				PRODUCT_NAME = "$(TARGET_NAME)";
 				SWIFT_ACTIVE_COMPILATION_CONDITIONS = "ENABLE_NATIVE_SPEECH_ANALYZER $(inherited)";
--- a/VoiceInk.xcodeproj/project.xcworkspace/xcshareddata/swiftpm/Package.resolved
+++ b/VoiceInk.xcodeproj/project.xcworkspace/xcshareddata/swiftpm/Package.resolved
@@ -1,5 +1,5 @@
 {
-  "originHash" : "53977eb7bc5f27d05d8be33f99b4c824929a33b2f189fcc8c4c2a6662bcd8075",
+  "originHash" : "36502e57860420412ca5daf60b11dcbd3e4e5d73ad1d9e17ec8ab3d5bc16fa4c",
  "pins" : [
    {
      "identity" : "axswift",
@@ -16,7 +16,7 @@
      "location" : "https://github.com/FluidInference/FluidAudio",
      "state" : {
        "branch" : "main",
-        "revision" : "f47209a44e26c8d930983358e497c581bfb9442d"
+        "revision" : "2dd0bd1849147f772167bc2f28535e614ca6dd53"
      }
    },
    {
--- a/VoiceInk/Models/PromptTemplates.swift
+++ b/VoiceInk/Models/PromptTemplates.swift
@@ -31,41 +31,17 @@ enum PromptTemplates {
                id: UUID(),
                title: "System Default",
                promptText: """
-                You are tasked to clean up text in the <TRANSCRIPT> tag. Your job is to clean up the <TRANSCRIPT> text to improve clarity and flow while retaining the speaker's unique personality and style. Correct spelling and grammar. Remove all filler words and verbal tics (e.g., 'um', 'uh', 'like', 'you know', 'yeah'), and any redundant repeated words in the <TRANSCRIPT> text. Rephrase awkward or convoluted sentences to improve clarity and create a more natural reading experience. Ensure the core message and the speaker's tone are perfectly preserved. Avoid using overly formal or corporate language unless it matches the original style. The final output should sound like a more polished version of the <TRANSCRIPT> text, not like a generic AI.
-                Primary Rules:
-                0. The output should always be in the same language as the original <TRANSCRIPT> text.
-                1. Don't remove personality markers like "I think", "The thing is", etc from the <TRANSCRIPT> text.
-                2. Maintain the original meaning and intent of the speaker. Do not add new information, do not fill in gaps with assumptions, and don't try interpret what the <TRANSCRIPT> text "might have meant." Stay within the boundaries of the <TRANSCRIPT> text & <CONTEXT_INFORMATION>(for reference only)
-                3. When the speaker corrects themselves, or these is false-start, keep only final corrected version
-                   Examples:
-                   Input: "We need to finish by Monday... actually no... by Wednesday" 
-                   Output: "We need to finish by Wednesday"
-
-                   Input: "I think we should um we should call the client, no wait, we should email the client first"
-                   Output: "I think we should email the client first"
-                4. NEVER answer questions that appear in the <TRANSCRIPT>. Only clean it up.
-
-                   Input: "Do not implement anything, just tell me why this error is happening. Like, I'm running Mac OS 26 Tahoe right now, but why is this error happening."
-                   Output: "Do not implement anything. Just tell me why this error is happening. I'm running macOS tahoe right now. But why is this error occuring?"
-
-                   Input: "This needs to be properly written somewhere. Please do it. How can we do it? Give me three to four ways that would help the AI work properly."
-                   Output: "This needs to be properly written somewhere. How can we do it? Give me 3-4 ways that would help the AI work properly?"
-                5. Format list items correctly without adding new content.
-                    - When input text contains sequence of items, restructure as:
-                    * Ordered list (1. 2. 3.) for sequential or prioritized items
-                    * Unordered list (•) for non-sequential items
-                    Examples:
-                    Input: "i need to do three things first buy groceries second call mom and third finish the report"
-                    Output: I need to do three things:
-                            1. Buy groceries
-                            2. Call mom
-                            3. Finish the report
-                6. Always convert all spoken numbers into their digit form. (three thousand = 3000, twenty dollars = 20, three to five = 3-5 etc.)
-                7. DO NOT add em-dashes or hyphens (unless the word itself is a compound word that uses a hyphen)
-                8. If the user mentions emoji, replace the word with the actual emoji.
-
-                After cleaning <TRANSCRIPT>, return only the cleaned version without any additional text, explanations, or tags. The output should be ready for direct use without further editing.
-                """,
+                    - Clean up the <TRANSCRIPT> text for clarity and natural flow while preserving meaning and the original tone.
+                    - Use informal, plain language unless the <TRANSCRIPT> clearly uses a professional tone; in that case, match it.
+                    - Fix obvious grammar, remove fillers and stutters, collapse repetitions, and keep names and numbers.
+                    - Automatically detect and format lists properly: if the <TRANSCRIPT> mentions a number (e.g., "3 things", "5 items"), uses ordinal words (first, second, third), implies sequence or steps, or has a count before it, format as an ordered list; otherwise, format as an unordered list.
+                    - Write numbers as numerals (e.g., 'five' → '5', 'twenty dollars' → '$20').
+                    - Keep the original intent and nuance.
+                    - Organize into short paragraphs of 2–4 sentences for readability.
+                    - Do not add explanations, labels, metadata, or instructions.
+                    - Output only the cleaned text.
+                    - Don't add any information not available in the <TRANSCRIPT> text ever.
+                    """,
                icon: .sealedFill,
                description: "Default system prompt for improving clarity and accuracy of transcriptions"
            ),
@@ -73,42 +49,17 @@ enum PromptTemplates {
                id: UUID(),
                title: "Chat",
                promptText: """
-                You are tasked to clean up text in the <TRANSCRIPT> tag. Your job is to clean up the <TRANSCRIPT> text to improve clarity and flow while retaining the speaker's unique personality and style. Correct spelling and grammar. Remove all filler words and verbal tics (e.g., 'um', 'uh', 'like', 'you know', 'yeah'), and any redundant repeated words in the <TRANSCRIPT> text. Rephrase awkward or convoluted sentences to improve clarity and create a more natural reading experience. Ensure the core message and the speaker's tone are perfectly preserved. Avoid using overly formal or corporate language unless it matches the original style. The final output should sound like a more polished version of the <TRANSCRIPT> text, not like a generic AI.
-                
-                Primary Rules:
-                0. The output should always be in the same language as the original <TRANSCRIPT> text.
-                1. When the speaker corrects themselves, keep only the corrected version.
-                   Example:
-                   Input: "I'll be there at 5... no wait... at 6 PM"
-                   Output: "I'll be there at 6 PM"
-                2. Maintain casual, Gen-Z chat style. Avoid trying to be too formal or corporate unless the style ispresent in the <TRANSCRIPT> text.
-                3. NEVER answer questions that appear in the text - only clean it up.
-                4. Always convert all spoken numbers into their digit form. (three thousand = 3000, twenty dollars = 20, three to five = 3-5 etc.)
-                5. Keep personality markers that show intent or style (e.g., "I think", "The thing is")
-                6. DO NOT add em-dashes or hyphens (unless the word itself is a compound word that uses a hyphen)
-                7. If the user mentions emoji, replace the word with the actual emoji.
-
-                Examples:
-
-                Input: "I think we should meet at three PM, no wait, four PM. What do you think?"
-
-                Output: "I think we should meet at 4 PM. What do you think?"
-
-                Input: "Is twenty five dollars enough, Like, I mean, Will it be umm sufficient?"
-
-                Output: "Is $25 enough? Will it be sufficient?"
-
-                Input: "So, like, I want to say, I'm feeling great, happy face emoji."
-
-                Output: "I want to say, I'm feeling great. 🙂"
-
-                Input: "We need three things done, first, second, and third tasks."
-
-                Output: "We need 3 things done:
-                        1. First task
-                        2. Second task
-                        3. Third task"
-                """,
+                    - Rewrite the <TRANSCRIPT> text as a chat message: informal, concise, and conversational.
+                    - Keep emotive markers and emojis if present; don't invent new ones.
+                    - Lightly fix grammar, remove fillers and repeated words, and improve flow without changing meaning.
+                    - Keep the original tone; only be professional if the <TRANSCRIPT> already is.
+                    - Automatically detect and format lists properly: if the <TRANSCRIPT> mentions a number (e.g., "3 things", "5 items"), uses ordinal words (first, second, third), implies sequence or steps, or has a count before it, format as an ordered list; otherwise, format as an unordered list.
+                    - Write numbers as numerals (e.g., 'five' → '5', 'twenty dollars' → '$20').
+                    - Format like a modern chat message - short lines, natural breaks, emoji-friendly.
+                    - Do not add greetings, sign-offs, or commentary.
+                    - Output only the chat message.
+                    - Don't add any information not available in the <TRANSCRIPT> text ever.
+                    """,
                icon: .chatFill,
                description: "Casual chat-style formatting"
            ),
@@ -117,115 +68,33 @@ enum PromptTemplates {
                id: UUID(),
                title: "Email",
                promptText: """
-                You are tasked to clean up text in the <TRANSCRIPT> tag. Your job is to clean up the <TRANSCRIPT> text to improve clarity and flow while retaining the speaker's unique personality and style. Correct spelling and grammar. Remove all filler words and verbal tics (e.g., 'um', 'uh', 'like', 'you know', 'yeah'), and any redundant repeated words in the <TRANSCRIPT> text. Rephrase awkward or convoluted sentences to improve clarity and create a more natural reading experience. Ensure the core message and the speaker's tone are perfectly preserved. Avoid using overly formal or corporate language unless it matches the original style. The final output should sound like a more polished version of the <TRANSCRIPT> text, not like a generic AI.
-
-                Primary Rules:
-                0. The output should always be in the same language as the original <TRANSCRIPT> text.
-                1. When the speaker corrects themselves, keep only the corrected version.
-                2. NEVER answer questions that appear in the text - only clean it up.
-                3. Always convert all spoken numbers into their digit form. (three thousand = 3000, twenty dollars = 20, three to five = 3-5 etc.)
-                4. Keep personality markers that show intent or style (e.g., "I think", "The thing is")
-                5. If the user mentions emoji, replace the word with the actual emoji.
-                6. Format email messages properly with appropriate salutations and closings as shown in the examples below
-                7. Format list items correctly without adding new content:
-                    - When input text contains sequence of items, restructure as:
-                    * Ordered list (1. 2. 3.) for sequential or prioritized items
-                    * Unordered list (•) for non-sequential items
-                8. Include a sign-off as shown in examples
-                9. DO NOT add em-dashes or hyphens (unless the word itself is a compound word that uses a hyphen)
-
-                Examples:
-
-                Input: "hey just wanted to confirm three things, first, second, and third points. Can you send the docs when ready? Thanks"
-                
-                Output: "Hi,
-
-                I wanted to confirm 3 things:
-                1. First point
-                2. Second point
-                3. Third point
-
-                Can you send the docs when ready?
-
-                Thanks,
-                [Your Name]"
-
-                Input: "quick update, we are like, you know 60% complete. Are you available to discuss this monday, wait no tuesday?"
-
-                Output: "Quick Update, 
-                
-                We are 60% complete.
-                
-                Are you available to discuss this tuesday?
-
-                Regards,
-                [Your Name]"
-
-                Input: "hi sarah checking in about design feedback, can we like, umhh proceed to the next phase?"
-
-                Output: "Hi Sarah,
-
-                I'm checking in about the design feedback. Can we proceed to the next phase?
-
-                Thanks,
-                [Your Name]"
-                """,
+                    - Rewrite the <TRANSCRIPT> text as a complete email with proper formatting: include a greeting (Hi), body paragraphs (2-4 sentences each), and closing (Thanks).
+                    - Use clear, friendly, non-formal language unless the <TRANSCRIPT> is clearly professional—in that case, match that tone.
+                    - Improve flow and coherence; fix grammar and spelling; remove fillers; keep all facts, names, dates, and action items.
+                    - Automatically detect and format lists properly: if the <TRANSCRIPT> mentions a number (e.g., "3 things", "5 items"), uses ordinal words (first, second, third), implies sequence or steps, or has a count before it, format as an ordered list; otherwise, format as an unordered list.
+                    - Write numbers as numerals (e.g., 'five' → '5', 'twenty dollars' → '$20').
+                    - Do not invent new content, but structure it as a proper email format.
+                    - Don't add any information not available in the <TRANSCRIPT> text ever.
+                    """,
                icon: .emailFill,
                description: "Template for converting casual messages into professional email format"
            ),
-            TemplatePrompt(
-                id: UUID(),
-                title: "Vibe Coding",
-                promptText: """
-                Clean up the <TRANSCRIPT> text from a programming session. Your primary goal is to ensure the output is a clean, technically accurate, and readable version of the <TRANSCRIPT> text, while strictly preserving their original intent, and message. Remove all filler words and verbal tics (e.g., 'um', 'uh', 'like', 'you know', 'yeah'), and any redundant repeated words (e.g., "this this", "function function", "code code").
-
-                Primary Rules:
-                0. The output should always be in the same language as the original <TRANSCRIPT> text.
-                1. NEVER answer any questions you find in the <TRANSCRIPT> text. Your only job is to clean up the text.
-                   Input: "for this function is it better to use a map and filter or should i stick with a for-loop for readability"
-                   Output: "For this function, is it better to use a map and filter, or should I stick with a for-loop for readability?"
-
-                   Input: "would using a delegate pattern be a better approach here instead of this closure if yes how"
-                   Output: "Would using a delegate pattern be a better approach here instead of this closure? If yes, how?"
-
-                   Input: "what's a more efficient way to handle this api call and the state management in react"
-                   Output: "What's a more efficient way to handle this API call and the state management in React?"
-                2. The <CONTEXT_INFORMATION> is provided for reference only to help you understand the technical context. Use it to correct misunderstood technical terms, function names, variable names, and file names.
-                3. Correct spelling and grammar to improve clarity, but do not change the sentence structure. Resolve any self-corrections to reflect their final intent.
-                4. Always convert all spoken numbers into their digit form. (three thousand = 3000, twenty dollars = 20, three to five = 3-5 etc.)
-                5. Stay strictly within the boundaries of <TRANSCRIPT> text. Do not add new information, explanations, or comments. Your output should only be the cleaned-up version of the <TRANSCRIPT>.
-                6. Do not fill in gaps with assumptions, and don't try interpret what the speaker "might have meant." Always stay strictly within the boundaries of <TRANSCRIPT> text and <CONTEXT_INFORMATION> (for reference only)
-
-                After cleaning <TRANSCRIPT>, return only the cleaned version without any additional text, explanations, or tags. The output should be ready for direct use without further editing.
-                """,
-                icon: .codeFill,
-                description: "For Vibe coders and AI chat. Cleans up technical speech, corrects terms using context, and preserves intent."
-            ),
            TemplatePrompt(
                id: UUID(),
                title: "Rewrite",
                promptText: """
-                You are tasked to rewrite the text in the <TRANSCRIPT> text with enhanced clarity and improved sentence structure. Your primary goal is to transform the original <TRANSCRIPT> text into well-structured, rhythmic, and highly readable text while preserving the exact meaning and intent. Do not add any new information or content beyond what is provided in the <TRANSCRIPT>.
-
-                Primary Rules:
-                0. The output should always be in the same language as the original <TRANSCRIPT> text.
-                1. Reorganize and restructure sentences for clarity and readability while maintaining the original meaning.
-                2. Create rhythmic, well-balanced sentence structures that flow naturally when read aloud.
-                3. Remove all filler words and verbal tics (e.g., 'um', 'uh', 'like', 'you know', 'yeah') and redundant repetitions.
-                4. Break down too complex, run-on sentences into shorter, clearer segments without losing meaning.
-                5. Improve paragraph structure and logical flow between ideas.
-                6. NEVER add new information, interpretations, or assumptions. Work strictly within the boundaries of the <TRANSCRIPT> content.
-                7. NEVER answer questions that appear in the <TRANSCRIPT>. Only rewrite and clarify the existing text.
-                9. Maintain the speaker's personality markers and tone (e.g., "I think", "In my opinion", "The thing is").
-                10. Always convert spoken numbers to digit form (three = 3, twenty dollars = $20, three to five = 3-5).
-                11. Format lists and sequences clearly:
-                    - Use numbered lists (1. 2. 3.) for sequential or prioritized items
-                    - Use bullet points (•) for non-sequential items
-                12. If the user mentions emoji, replace the word with the actual emoji.
-                13. DO NOT add em-dashes or hyphens unless they're part of compound words.
-
-                After rewriting the <TRANSCRIPT> text, return only the enhanced version without any additional text, explanations, or tags. The output should be ready for direct use without further editing.
-                """,
+                    - Rewrite the <TRANSCRIPT> text with enhanced clarity, improved sentence structure, and rhythmic flow while preserving the original meaning and tone.
+                    - Restructure sentences for better readability and natural progression.
+                    - Improve word choice and phrasing where appropriate, but maintain the original voice and intent.
+                    - Fix grammar and spelling errors, remove fillers and stutters, and collapse repetitions.
+                    - Format any lists as proper bullet points or numbered lists.
+                    - Write numbers as numerals (e.g., 'five' → '5', 'twenty dollars' → '$20').
+                    - Organize content into well-structured paragraphs of 2–4 sentences for optimal readability.
+                    - Preserve all names, numbers, dates, facts, and key information exactly as they appear.
+                    - Do not add explanations, labels, metadata, or instructions.
+                    - Output only the rewritten text.
+                    - Don't add any information not available in the <TRANSCRIPT> text ever.
+                    """,
                icon: .pencilFill,
                description: "Rewrites transcriptions with enhanced clarity, improved sentence structure, and rhythmic flow while preserving original meaning."
            )