From f38904c7a17b1ff8932abcb542115ce2b4397267 Mon Sep 17 00:00:00 2001
From: Pratik Shankar Jadhav
 <44173994+pratikjadhav2726@users.noreply.github.com>
Date: Sun, 11 Jan 2026 02:44:54 -0800
Subject: [PATCH 01/13] feat: speech interview helper assistant

---
 electron/AnswerAssistant.ts                   | 175 ++++++++++
 electron/ConversationManager.ts               | 152 +++++++++
 electron/TranscriptionHelper.ts               | 131 ++++++++
 electron/ipcHandlers.ts                       | 141 ++++++++
 electron/main.ts                              |  25 +-
 electron/preload.ts                           |  56 +++-
 electron/shortcuts.ts                         |  33 ++
 package.json                                  |   4 +-
 src/_pages/Queue.tsx                          |  10 +-
 src/_pages/Solutions.tsx                      |   6 +
 .../Conversation/ConversationSection.tsx      | 309 ++++++++++++++++++
 src/types/electron.d.ts                       |  13 +
 src/utils/audioRecorder.ts                    |  99 ++++++
 stealth-run.sh                                |   0
 14 files changed, 1147 insertions(+), 7 deletions(-)
 create mode 100644 electron/AnswerAssistant.ts
 create mode 100644 electron/ConversationManager.ts
 create mode 100644 electron/TranscriptionHelper.ts
 create mode 100644 src/components/Conversation/ConversationSection.tsx
 create mode 100644 src/utils/audioRecorder.ts
 mode change 100644 => 100755 stealth-run.sh
diff --git a/electron/AnswerAssistant.ts b/electron/AnswerAssistant.ts
new file mode 100644
index 00000000..3664306a
--- /dev/null
+++ b/electron/AnswerAssistant.ts
@@ -0,0 +1,175 @@
+/**
+ * AnswerAssistant - Generates AI-powered answer suggestions based on conversation context
+ * Follows Single Responsibility Principle - only handles answer suggestion generation
+ * Uses Dependency Inversion Principle - depends on IConversationManager interface
+ */
+import OpenAI from 'openai';
+import { configHelper } from './ConfigHelper';
+import { IConversationManager } from './ConversationManager';
+
+export interface AnswerSuggestion {
+  suggestions: string[]; // suggestion texts parsed from the model reply, list markers removed
+  reasoning: string; // short note describing what the suggestions are based on
+}
+
+export interface IAnswerAssistant {
+  generateAnswerSuggestions(
+    currentQuestion: string, // the interviewer's latest question
+    conversationManager: IConversationManager, // supplies the history and prior interviewee answers
+    screenshotContext?: string // optional extra context appended to the prompt
+  ): Promise<AnswerSuggestion>;
+}
+
+export class AnswerAssistant implements IAnswerAssistant {
+  private openai: OpenAI | null = null;
+  private readonly defaultModel: string = 'gpt-4o-mini';
+
+  constructor() {
+    this.initializeOpenAI();
+  }
+
+  /**
+   * Creates the OpenAI client if the stored config holds a non-blank API key.
+   * Otherwise `this.openai` is left as it was, so the call can safely be retried.
+   */
+  private initializeOpenAI(): void {
+    const config = configHelper.loadConfig();
+    if (config.apiKey && config.apiKey.trim().length > 0) {
+      this.openai = new OpenAI({ apiKey: config.apiKey });
+    }
+  }
+
+  /**
+   * Generates answer suggestions based on conversation context.
+   * The client is also created lazily here, because the user may save an API key
+   * only after this assistant was constructed.
+   *
+   * @param currentQuestion - The current interviewer question
+   * @param conversationManager - Conversation manager instance (dependency injection)
+   * @param screenshotContext - Optional screenshot context for coding interviews
+   * @returns Suggestions parsed from the model reply, or a single generic fallback
+   * @throws Error if no API key is configured, the question is blank, or the request fails
+   */
+  public async generateAnswerSuggestions(
+    currentQuestion: string,
+    conversationManager: IConversationManager,
+    screenshotContext?: string
+  ): Promise<AnswerSuggestion> {
+    if (!this.openai) {
+      // Retry: the key may have been configured after construction.
+      this.initializeOpenAI();
+    }
+    if (!this.openai) {
+      throw new Error('OpenAI client not initialized. Please set API key.');
+    }
+
+    if (!currentQuestion || currentQuestion.trim().length === 0) {
+      throw new Error('Current question cannot be empty');
+    }
+
+    const contextPrompt = this.buildContextPrompt(
+      currentQuestion,
+      conversationManager.getConversationHistory(),
+      conversationManager.getIntervieweeAnswers(),
+      screenshotContext
+    );
+
+    try {
+      const response = await this.openai.chat.completions.create({
+        model: this.defaultModel,
+        messages: [
+          {
+            role: 'system',
+            content: 'You are a helpful interview assistant that provides contextual answer suggestions based on conversation history. Provide concise, actionable suggestions.'
+          },
+          { role: 'user', content: contextPrompt }
+        ],
+        temperature: 0.7,
+        max_tokens: 500,
+      });
+
+      const suggestions = this.parseSuggestions(response.choices[0]?.message?.content ?? '');
+
+      return {
+        suggestions: suggestions.length > 0
+          ? suggestions
+          : ['Consider answering based on your experience and background.'],
+        reasoning: 'Based on conversation history and previous answers',
+      };
+    } catch (error: unknown) {
+      console.error('Error generating suggestions:', error);
+
+      // Errors from failed API calls are expected to carry the HTTP status code.
+      const status = (error as { status?: number } | null)?.status;
+      if (status === 401) {
+        throw new Error('Invalid API key. Please check your OpenAI API key in settings.');
+      } else if (status === 429) {
+        throw new Error('Rate limit exceeded. Please try again in a moment.');
+      }
+
+      const detail = error instanceof Error && error.message ? error.message : 'Unknown error';
+      throw new Error(`Failed to generate suggestions: ${detail}`);
+    }
+  }
+
+  /**
+   * Builds the user prompt: question, history, prior answers and optional screenshot context
+   */
+  private buildContextPrompt(
+    currentQuestion: string,
+    conversationHistory: string,
+    previousAnswers: string[],
+    screenshotContext?: string
+  ): string {
+    let prompt = `You are an AI assistant helping someone during an interview. 
+The interviewer just asked: "${currentQuestion}"
+
+Previous conversation:
+${conversationHistory || 'No previous conversation yet.'}
+
+Previous answers the interviewee has given:
+${previousAnswers.length > 0 ? previousAnswers.join('\n\n') : 'No previous answers yet.'}
+
+Based on the current question and conversation history, provide 3-5 bullet point suggestions that:
+1. Directly answer the current question
+2. Reference and build upon previous answers for consistency
+3. Maintain a coherent narrative
+4. Are specific and actionable
+
+Format as simple bullet points, one per line starting with "-".`;
+
+    if (screenshotContext) {
+      prompt += `\n\nAdditional context from code screenshot: ${screenshotContext}`;
+    }
+
+    return prompt;
+  }
+
+  /**
+   * Parses the model reply into individual suggestions.
+   * When the reply contains list items, only those are kept, so that an intro or
+   * closing sentence is not presented as a suggestion; a reply without any list
+   * markers falls back to one suggestion per non-empty line.
+   * @returns Cleaned suggestion texts without bullet or number prefixes
+   */
+  private parseSuggestions(suggestionsText: string): string[] {
+    const lines = suggestionsText
+      .split('\n')
+      .map(line => line.trim())
+      .filter(line => line.length > 0);
+    const listItems = lines.filter(line => /^(?:[-•]|\d+\.)/.test(line));
+
+    return (listItems.length > 0 ? listItems : lines)
+      // Remove bullet/number prefixes
+      .map(line => line.replace(/^[-•]\s*/, '').replace(/^\d+\.\s*/, '').trim())
+      // Filter out empty or too long entries
+      .filter(line => line.length > 0 && line.length < 200);
+  }
+
+  /**
+   * Checks if OpenAI client is initialized
+   */
+  public isInitialized(): boolean {
+    return this.openai !== null;
+  }
+}
diff --git a/electron/ConversationManager.ts b/electron/ConversationManager.ts
new file mode 100644
index 00000000..4df0319c
--- /dev/null
+++ b/electron/ConversationManager.ts
@@ -0,0 +1,152 @@
+/**
+ * ConversationManager - Manages conversation state and messages
+ * Follows Single Responsibility Principle - only handles conversation state
+ * Uses EventEmitter for loose coupling (Observer pattern)
+ */
+import { EventEmitter } from 'events';
+
+export interface ConversationMessage {
+  id: string; // generated by ConversationManager as `msg-<Date.now()>-<random suffix>`
+  speaker: 'interviewer' | 'interviewee';
+  text: string; // stored trimmed
+  timestamp: number; // Date.now() at creation (milliseconds since the Unix epoch)
+  edited?: boolean; // set to true by updateMessage(); absent on messages that were never edited
+}
+
+export interface IConversationManager {
+  addMessage(text: string, speaker?: 'interviewer' | 'interviewee'): ConversationMessage; // speaker defaults to the current speaker
+  toggleSpeaker(): 'interviewer' | 'interviewee'; // returns the new speaker
+  getCurrentSpeaker(): 'interviewer' | 'interviewee';
+  getMessages(): ConversationMessage[]; // returns a copy of the message list
+  getConversationHistory(): string; // messages formatted as "[Interviewer] …" / "[You] …"
+  getIntervieweeAnswers(): string[]; // texts of the interviewee's messages only
+  updateMessage(messageId: string, newText: string): boolean; // false if newText is blank or the id is unknown
+  clearConversation(): void; // also resets the current speaker to 'interviewee'
+  setSpeaker(speaker: 'interviewer' | 'interviewee'): void;
+}
+
+export class ConversationManager extends EventEmitter implements IConversationManager {
+  private messages: ConversationMessage[] = [];
+  private currentSpeaker: 'interviewer' | 'interviewee' = 'interviewee';
+
+  /**
+   * Adds a new message to the conversation and emits `message-added`.
+   * @param text - Message text (stored trimmed)
+   * @param speaker - Optional speaker override, uses current speaker if not provided
+   * @returns The created message
+   * @throws Error if the text is blank or the speaker is not a known role
+   */
+  public addMessage(
+    text: string,
+    speaker?: 'interviewer' | 'interviewee'
+  ): ConversationMessage {
+    if (!text || text.trim().length === 0) {
+      throw new Error('Message text cannot be empty');
+    }
+
+    // Types are erased at runtime and the IPC layer forwards the renderer's raw
+    // string, so an unknown role has to be rejected here instead of being stored.
+    const resolvedSpeaker = speaker || this.currentSpeaker;
+    if (resolvedSpeaker !== 'interviewer' && resolvedSpeaker !== 'interviewee') {
+      throw new Error(`Invalid speaker: ${String(resolvedSpeaker)}`);
+    }
+
+    const message: ConversationMessage = {
+      id: this.generateMessageId(),
+      speaker: resolvedSpeaker,
+      text: text.trim(),
+      timestamp: Date.now(),
+    };
+    this.messages.push(message);
+    this.emit('message-added', message);
+    return message;
+  }
+
+  /**
+   * Toggles between interviewer and interviewee speaker modes and emits `speaker-changed`
+   * @returns The new speaker mode
+   */
+  public toggleSpeaker(): 'interviewer' | 'interviewee' {
+    this.currentSpeaker = this.currentSpeaker === 'interviewer' ? 'interviewee' : 'interviewer';
+    this.emit('speaker-changed', this.currentSpeaker);
+    return this.currentSpeaker;
+  }
+
+  /**
+   * Sets the current speaker mode; emits `speaker-changed` only when the mode actually changes
+   * @param speaker - Speaker mode to set
+   */
+  public setSpeaker(speaker: 'interviewer' | 'interviewee'): void {
+    if (this.currentSpeaker !== speaker) {
+      this.currentSpeaker = speaker;
+      this.emit('speaker-changed', this.currentSpeaker);
+    }
+  }
+
+  /** Gets the current speaker mode */
+  public getCurrentSpeaker(): 'interviewer' | 'interviewee' {
+    return this.currentSpeaker;
+  }
+
+  /**
+   * Gets all messages in the conversation
+   * @returns Copies of the stored messages, so callers cannot mutate internal state
+   */
+  public getMessages(): ConversationMessage[] {
+    return this.messages.map(message => ({ ...message }));
+  }
+
+  /**
+   * Gets conversation history as formatted string
+   * @returns One "[Interviewer] …" or "[You] …" entry per message, separated by blank lines
+   */
+  public getConversationHistory(): string {
+    return this.messages
+      .map(msg => `[${msg.speaker === 'interviewer' ? 'Interviewer' : 'You'}] ${msg.text}`)
+      .join('\n\n');
+  }
+
+  /**
+   * Gets all answers from the interviewee
+   * @returns Array of interviewee answer texts
+   */
+  public getIntervieweeAnswers(): string[] {
+    return this.messages.filter(msg => msg.speaker === 'interviewee').map(msg => msg.text);
+  }
+
+  /**
+   * Updates an existing message, marks it as edited and emits `message-updated`
+   * @param messageId - ID of message to update
+   * @param newText - New text for the message
+   * @returns True if message was found and updated, false otherwise
+   */
+  public updateMessage(messageId: string, newText: string): boolean {
+    if (!newText || newText.trim().length === 0) {
+      return false;
+    }
+
+    const message = this.messages.find(m => m.id === messageId);
+    if (!message) {
+      return false;
+    }
+    message.text = newText.trim();
+    message.edited = true;
+    this.emit('message-updated', message);
+    return true;
+  }
+
+  /**
+   * Clears all messages and resets to default speaker.
+   * Emits `speaker-changed` (only if the reset changed the speaker), then `conversation-cleared`.
+   */
+  public clearConversation(): void {
+    this.messages = [];
+    this.setSpeaker('interviewee');
+    this.emit('conversation-cleared');
+  }
+
+  /** Generates a message ID from the current time plus a random suffix */
+  private generateMessageId(): string {
+    return `msg-${Date.now()}-${Math.random().toString(36).substring(2, 9)}`;
+  }
+}
diff --git a/electron/TranscriptionHelper.ts b/electron/TranscriptionHelper.ts
new file mode 100644
index 00000000..bf8bf23e
--- /dev/null
+++ b/electron/TranscriptionHelper.ts
@@ -0,0 +1,131 @@
+/**
+ * TranscriptionHelper - Handles audio transcription using OpenAI Whisper API
+ * Follows Single Responsibility Principle - only handles transcription
+ */
+import OpenAI from 'openai';
+import fs from 'fs';
+import path from 'path';
+import { app } from 'electron';
+import { configHelper } from './ConfigHelper';
+
+export interface TranscriptionResult {
+  text: string; // transcribed text taken from the transcription API response
+  language?: string; // language field of the API response
+}
+
+export interface ITranscriptionHelper {
+  transcribeAudio(audioBuffer: Buffer, mimeType?: string): Promise<TranscriptionResult>; // TranscriptionHelper defaults mimeType to 'audio/webm'
+}
+
+export class TranscriptionHelper implements ITranscriptionHelper {
+  /** Temp-file extension per recognised MIME type; anything else is stored as `.webm`. */
+  private static readonly EXTENSIONS = new Map<string, string>([
+    ['audio/webm', 'webm'], ['audio/ogg', 'ogg'], ['audio/mp4', 'mp4'], ['audio/mpeg', 'mp3'],
+    ['audio/wav', 'wav'], ['audio/x-wav', 'wav'], ['audio/wave', 'wav'], ['audio/flac', 'flac'],
+  ]);
+  private openai: OpenAI | null = null;
+  private readonly tempDir: string;
+
+  constructor() {
+    this.tempDir = path.join(app.getPath('temp'), 'audio-transcriptions');
+    this.ensureTempDirectory();
+    this.initializeOpenAI();
+  }
+
+  /**
+   * Creates the OpenAI client if the stored config holds a non-blank API key.
+   * Otherwise `this.openai` is left as it was, so the call can safely be retried.
+   */
+  private initializeOpenAI(): void {
+    const config = configHelper.loadConfig();
+    if (config.apiKey && config.apiKey.trim().length > 0) {
+      this.openai = new OpenAI({ apiKey: config.apiKey });
+    }
+  }
+
+  /**
+   * Ensures temp directory exists for audio files.
+   * With `recursive: true`, mkdirSync does not fail when the directory already exists.
+   */
+  private ensureTempDirectory(): void {
+    fs.mkdirSync(this.tempDir, { recursive: true });
+  }
+
+  /**
+   * Transcribes audio buffer using OpenAI Whisper API.
+   * The client is also created lazily here, since the API key may be saved after construction.
+   * @param audioBuffer - Audio data as Buffer
+   * @param mimeType - MIME type of the audio (default: 'audio/webm'); selects the temp-file extension
+   * @returns Promise resolving to transcription result
+   * @throws Error if transcription fails or OpenAI client not initialized
+   */
+  public async transcribeAudio(audioBuffer: Buffer, mimeType: string = 'audio/webm'): Promise<TranscriptionResult> {
+    if (!this.openai) {
+      this.initializeOpenAI(); // retry: the key may have been configured after construction
+    }
+    if (!this.openai) {
+      throw new Error('OpenAI client not initialized. Please set API key.');
+    }
+    if (!audioBuffer || audioBuffer.length === 0) {
+      throw new Error('Audio buffer is empty');
+    }
+
+    // Give the temp file the extension of the real container; ";codecs=…" parameters are ignored.
+    const baseType = (mimeType || 'audio/webm').split(';')[0].trim().toLowerCase();
+    const extension = TranscriptionHelper.EXTENSIONS.get(baseType) ?? 'webm';
+    const fileName = `audio-${Date.now()}-${Math.random().toString(36).substring(7)}.${extension}`;
+    const tempPath = path.join(this.tempDir, fileName);
+    let file: ReturnType<typeof fs.createReadStream> | null = null;
+
+    try {
+      this.ensureTempDirectory(); // the directory may have been removed since construction
+      fs.writeFileSync(tempPath, audioBuffer);
+      file = fs.createReadStream(tempPath);
+
+      const transcription = await this.openai.audio.transcriptions.create({
+        file,
+        model: 'whisper-1',
+        language: 'en', // Optional: can be auto-detected
+        response_format: 'verbose_json',
+      });
+
+      return { text: transcription.text, language: transcription.language };
+    } catch (error: unknown) {
+      console.error('Transcription error:', error);
+      const status = (error as { status?: number } | null)?.status;
+      const message = error instanceof Error ? error.message : '';
+      if (status === 401) {
+        throw new Error('Invalid API key. Please check your OpenAI API key in settings.');
+      } else if (status === 429) {
+        throw new Error('Rate limit exceeded. Please try again in a moment.');
+      } else if (message.includes('file')) {
+        throw new Error('Invalid audio file format. Please try recording again.');
+      }
+
+      throw new Error(`Transcription failed: ${message || 'Unknown error'}`);
+    } finally {
+      // Runs on success and on failure: release the stream, then delete the temp file.
+      file?.destroy();
+      this.cleanupTempFile(tempPath);
+    }
+  }
+
+  /**
+   * Safely removes temporary file; errors are logged, not thrown,
+   * because cleanup problems shouldn't break the flow.
+   */
+  private cleanupTempFile(filePath: string): void {
+    try {
+      if (fs.existsSync(filePath)) {
+        fs.unlinkSync(filePath);
+      }
+    } catch (error) {
+      console.error('Error cleaning up temp file:', error);
+    }
+  }
+
+  /** Checks if OpenAI client is initialized */
+  public isInitialized(): boolean {
+    return this.openai !== null;
+  }
+}
diff --git a/electron/ipcHandlers.ts b/electron/ipcHandlers.ts
index f05a9aee..841b64b3 100644
--- a/electron/ipcHandlers.ts
+++ b/electron/ipcHandlers.ts
@@ -348,4 +348,145 @@ export function initializeIpcHandlers(deps: IIpcHandlerDeps): void {
       return { success: false, error: "Failed to delete last screenshot" }
     }
   })
+
+  // ============================================
+  // Conversation & Transcription Handlers
+  // ============================================
+
+  // Transcription handler - receives audio buffer from renderer
+  ipcMain.handle("transcribe-audio", async (_event, audioBuffer: ArrayBuffer, mimeType: string) => {
+    try {
+      if (!deps.transcriptionHelper) {
+        return { success: false, error: "Transcription helper not initialized" };
+      }
+
+      const buffer = Buffer.from(audioBuffer);
+      const result = await deps.transcriptionHelper.transcribeAudio(buffer, mimeType);
+      return { success: true, result };
+    } catch (error: any) {
+      console.error("Transcription error:", error);
+      return { success: false, error: error.message || "Transcription failed" };
+    }
+  })
+
+  // Conversation message handlers
+  ipcMain.handle("add-conversation-message", (_event, text: string, speaker?: string) => {
+    try {
+      if (!deps.conversationManager) {
+        return { success: false, error: "Conversation manager not initialized" };
+      }
+
+      const message = deps.conversationManager.addMessage(text, speaker as any);
+      return { success: true, message };
+    } catch (error: any) {
+      console.error("Error adding message:", error);
+      return { success: false, error: error.message || "Failed to add message" };
+    }
+  })
+
+  ipcMain.handle("toggle-speaker", () => {
+    try {
+      if (!deps.conversationManager) {
+        return { success: false, error: "Conversation manager not initialized" };
+      }
+
+      const speaker = deps.conversationManager.toggleSpeaker();
+      return { success: true, speaker };
+    } catch (error: any) {
+      console.error("Error toggling speaker:", error);
+      return { success: false, error: error.message || "Failed to toggle speaker" };
+    }
+  })
+
+  ipcMain.handle("get-conversation", () => {
+    try {
+      if (!deps.conversationManager) {
+        return { success: false, error: "Conversation manager not initialized", messages: [] };
+      }
+
+      const messages = deps.conversationManager.getMessages();
+      return { success: true, messages };
+    } catch (error: any) {
+      console.error("Error getting conversation:", error);
+      return { success: false, error: error.message || "Failed to get conversation", messages: [] };
+    }
+  })
+
+  ipcMain.handle("clear-conversation", () => {
+    try {
+      if (!deps.conversationManager) {
+        return { success: false, error: "Conversation manager not initialized" };
+      }
+
+      deps.conversationManager.clearConversation();
+      return { success: true };
+    } catch (error: any) {
+      console.error("Error clearing conversation:", error);
+      return { success: false, error: error.message || "Failed to clear conversation" };
+    }
+  })
+
+  ipcMain.handle("update-conversation-message", (_event, messageId: string, newText: string) => {
+    try {
+      if (!deps.conversationManager) {
+        return { success: false, error: "Conversation manager not initialized" };
+      }
+
+      const success = deps.conversationManager.updateMessage(messageId, newText);
+      return { success };
+    } catch (error: any) {
+      console.error("Error updating message:", error);
+      return { success: false, error: error.message || "Failed to update message" };
+    }
+  })
+
+  // AI suggestion handler
+  ipcMain.handle("get-answer-suggestions", async (_event, question: string, screenshotContext?: string) => {
+    try {
+      if (!deps.answerAssistant || !deps.conversationManager) {
+        return { success: false, error: "Answer assistant or conversation manager not initialized" };
+      }
+
+      const suggestions = await deps.answerAssistant.generateAnswerSuggestions(
+        question,
+        deps.conversationManager,
+        screenshotContext
+      );
+      return { success: true, suggestions };
+    } catch (error: any) {
+      console.error("Error generating suggestions:", error);
+      return { success: false, error: error.message || "Failed to generate suggestions" };
+    }
+  })
+
+  // Event listeners for conversation events
+  if (deps.conversationManager) {
+    deps.conversationManager.on('message-added', (message) => {
+      const mainWindow = deps.getMainWindow();
+      if (mainWindow && !mainWindow.isDestroyed()) {
+        mainWindow.webContents.send('conversation-message-added', message);
+      }
+    });
+
+    deps.conversationManager.on('speaker-changed', (speaker) => {
+      const mainWindow = deps.getMainWindow();
+      if (mainWindow && !mainWindow.isDestroyed()) {
+        mainWindow.webContents.send('speaker-changed', speaker);
+      }
+    });
+
+    deps.conversationManager.on('message-updated', (message) => {
+      const mainWindow = deps.getMainWindow();
+      if (mainWindow && !mainWindow.isDestroyed()) {
+        mainWindow.webContents.send('conversation-message-updated', message);
+      }
+    });
+
+    deps.conversationManager.on('conversation-cleared', () => {
+      const mainWindow = deps.getMainWindow();
+      if (mainWindow && !mainWindow.isDestroyed()) {
+        mainWindow.webContents.send('conversation-cleared');
+      }
+    });
+  }
 }
diff --git a/electron/main.ts b/electron/main.ts
index 0eae187a..752e5963 100644
--- a/electron/main.ts
+++ b/electron/main.ts
@@ -29,6 +29,9 @@ const state = {
   screenshotHelper: null as ScreenshotHelper | null,
   shortcutsHelper: null as ShortcutsHelper | null,
   processingHelper: null as ProcessingHelper | null,
+  transcriptionHelper: null as import('./TranscriptionHelper').TranscriptionHelper | null,
+  conversationManager: null as import('./ConversationManager').ConversationManager | null,
+  answerAssistant: null as import('./AnswerAssistant').AnswerAssistant | null,
 
   // View and state management
   view: "queue" as "queue" | "solutions" | "debug",
@@ -107,10 +110,13 @@ export interface IIpcHandlerDeps {
   moveWindowRight: () => void
   moveWindowUp: () => void
   moveWindowDown: () => void
+  transcriptionHelper?: import('./TranscriptionHelper').TranscriptionHelper
+  conversationManager?: import('./ConversationManager').ConversationManager
+  answerAssistant?: import('./AnswerAssistant').AnswerAssistant
 }
 
 // Initialize helpers
-function initializeHelpers() {
+async function initializeHelpers() {
   state.screenshotHelper = new ScreenshotHelper(state.view)
   state.processingHelper = new ProcessingHelper({
     getScreenshotHelper,
@@ -129,6 +135,16 @@ function initializeHelpers() {
     getHasDebugged,
     PROCESSING_EVENTS: state.PROCESSING_EVENTS
   } as IProcessingHelperDeps)
+  
+  // Initialize conversation and transcription helpers
+  const { TranscriptionHelper } = await import('./TranscriptionHelper')
+  const { ConversationManager } = await import('./ConversationManager')
+  const { AnswerAssistant } = await import('./AnswerAssistant')
+  
+  state.transcriptionHelper = new TranscriptionHelper()
+  state.conversationManager = new ConversationManager()
+  state.answerAssistant = new AnswerAssistant()
+  
   state.shortcutsHelper = new ShortcutsHelper({
     getMainWindow,
     takeScreenshot,
@@ -530,7 +546,7 @@ async function initializeApp() {
       console.log("No API key found in configuration. User will need to set up.")
     }
     
-    initializeHelpers()
+    await initializeHelpers()
     initializeIpcHandlers({
       getMainWindow,
       setWindowDimensions,
@@ -557,7 +573,10 @@ async function initializeApp() {
           )
         ),
       moveWindowUp: () => moveWindowVertical((y) => y - state.step),
-      moveWindowDown: () => moveWindowVertical((y) => y + state.step)
+      moveWindowDown: () => moveWindowVertical((y) => y + state.step),
+      transcriptionHelper: state.transcriptionHelper,
+      conversationManager: state.conversationManager,
+      answerAssistant: state.answerAssistant
     })
     await createWindow()
     state.shortcutsHelper?.registerGlobalShortcuts()
diff --git a/electron/preload.ts b/electron/preload.ts
index 85f32156..36b7ca93 100644
--- a/electron/preload.ts
+++ b/electron/preload.ts
@@ -236,7 +236,61 @@ const electronAPI = {
       ipcRenderer.removeListener("delete-last-screenshot", subscription)
     }
   },
-  deleteLastScreenshot: () => ipcRenderer.invoke("delete-last-screenshot")
+  deleteLastScreenshot: () => ipcRenderer.invoke("delete-last-screenshot"),
+  
+  // ============================================
+  // Conversation & Transcription Methods
+  // ============================================
+  
+  // Transcription
+  transcribeAudio: (audioBuffer: ArrayBuffer, mimeType: string) => 
+    ipcRenderer.invoke("transcribe-audio", audioBuffer, mimeType),
+  
+  // Conversation
+  addConversationMessage: (text: string, speaker?: string) => 
+    ipcRenderer.invoke("add-conversation-message", text, speaker),
+  toggleSpeaker: () => ipcRenderer.invoke("toggle-speaker"),
+  getConversation: () => ipcRenderer.invoke("get-conversation"),
+  clearConversation: () => ipcRenderer.invoke("clear-conversation"),
+  updateConversationMessage: (messageId: string, newText: string) =>
+    ipcRenderer.invoke("update-conversation-message", messageId, newText),
+  
+  // AI suggestions
+  getAnswerSuggestions: (question: string, screenshotContext?: string) =>
+    ipcRenderer.invoke("get-answer-suggestions", question, screenshotContext),
+  
+  // Event listeners
+  onConversationMessageAdded: (callback: (message: any) => void) => {
+    const subscription = (_: any, message: any) => callback(message)
+    ipcRenderer.on("conversation-message-added", subscription)
+    return () => {
+      ipcRenderer.removeListener("conversation-message-added", subscription)
+    }
+  },
+  
+  onSpeakerChanged: (callback: (speaker: string) => void) => {
+    const subscription = (_: any, speaker: string) => callback(speaker)
+    ipcRenderer.on("speaker-changed", subscription)
+    return () => {
+      ipcRenderer.removeListener("speaker-changed", subscription)
+    }
+  },
+  
+  onConversationMessageUpdated: (callback: (message: any) => void) => {
+    const subscription = (_: any, message: any) => callback(message)
+    ipcRenderer.on("conversation-message-updated", subscription)
+    return () => {
+      ipcRenderer.removeListener("conversation-message-updated", subscription)
+    }
+  },
+  
+  onConversationCleared: (callback: () => void) => {
+    const subscription = () => callback()
+    ipcRenderer.on("conversation-cleared", subscription)
+    return () => {
+      ipcRenderer.removeListener("conversation-cleared", subscription)
+    }
+  }
 }
 
 // Before exposing the API
diff --git a/electron/shortcuts.ts b/electron/shortcuts.ts
index a6fa5ebb..e53dc34a 100644
--- a/electron/shortcuts.ts
+++ b/electron/shortcuts.ts
@@ -106,6 +106,39 @@ export class ShortcutsHelper {
       this.deps.toggleMainWindow()
     })
 
+    // Recording toggle (Ctrl/Cmd+M)
+    globalShortcut.register("CommandOrControl+M", async () => {
+      const mainWindow = this.deps.getMainWindow();
+      if (mainWindow && !mainWindow.isDestroyed()) {
+        console.log("Command/Ctrl + M pressed. Toggling recording.");
+        try {
+          await mainWindow.webContents.executeJavaScript(`
+            (async () => {
+              const event = new CustomEvent('toggle-recording');
+              window.dispatchEvent(event);
+            })();
+          `);
+        } catch (error) {
+          console.error("Error toggling recording:", error);
+        }
+      }
+    });
+
+    // Speaker toggle (Ctrl/Cmd+Shift+M)
+    globalShortcut.register("CommandOrControl+Shift+M", async () => {
+      const mainWindow = this.deps.getMainWindow();
+      if (mainWindow && !mainWindow.isDestroyed()) {
+        console.log("Command/Ctrl + Shift + M pressed. Toggling speaker.");
+        try {
+          await mainWindow.webContents.executeJavaScript(`
+            window.electronAPI.toggleSpeaker();
+          `);
+        } catch (error) {
+          console.error("Error toggling speaker:", error);
+        }
+      }
+    });
+
     globalShortcut.register("CommandOrControl+Q", () => {
       console.log("Command/Ctrl + Q pressed. Quitting application.")
       app.quit()
diff --git a/package.json b/package.json
index 1fffcfb5..fee68383 100644
--- a/package.json
+++ b/package.json
@@ -144,7 +144,6 @@
     "lucide-react": "^0.460.0",
     "openai": "^4.28.4",
     "react": "^18.2.0",
-    "react-code-blocks": "^0.1.6",
     "react-dom": "^18.2.0",
     "react-router-dom": "^6.28.1",
     "react-syntax-highlighter": "^15.6.1",
@@ -202,5 +201,8 @@
       "last 1 firefox version",
       "last 1 safari version"
     ]
+  },
+  "overrides": {
+    "prismjs": ">=1.30.0"
   }
 }
diff --git a/src/_pages/Queue.tsx b/src/_pages/Queue.tsx
index c9194d5e..9b40be6e 100644
--- a/src/_pages/Queue.tsx
+++ b/src/_pages/Queue.tsx
@@ -2,6 +2,7 @@ import React, { useState, useEffect, useRef } from "react"
 import { useQuery } from "@tanstack/react-query"
 import ScreenshotQueue from "../components/Queue/ScreenshotQueue"
 import QueueCommands from "../components/Queue/QueueCommands"
+import { ConversationSection } from "../components/Conversation/ConversationSection"
 
 import { useToast } from "../contexts/toast"
 import { Screenshot } from "../types/screenshots"
@@ -137,9 +138,14 @@ const Queue: React.FC<QueueProps> = ({
   };
   
   return (
-    <div ref={contentRef} className={`bg-transparent w-1/2`}>
+    <div ref={contentRef} className={`bg-transparent w-full`}>
       <div className="px-4 py-3">
-        <div className="space-y-3 w-fit">
+        <div className="space-y-3 w-full">
+          {/* Conversation Section - Works independently of screenshots */}
+          <div className="bg-black/60 rounded-md p-4">
+            <ConversationSection />
+          </div>
+
           <ScreenshotQueue
             isLoading={false}
             screenshots={screenshots}
diff --git a/src/_pages/Solutions.tsx b/src/_pages/Solutions.tsx
index e1939451..0bdcf7d5 100644
--- a/src/_pages/Solutions.tsx
+++ b/src/_pages/Solutions.tsx
@@ -11,6 +11,7 @@ import SolutionCommands from "../components/Solutions/SolutionCommands"
 import Debug from "./Debug"
 import { useToast } from "../contexts/toast"
 import { COMMAND_KEY } from "../utils/platform"
+import { ConversationSection } from "../components/Conversation/ConversationSection"
 
 export const ContentSection = ({
   title,
@@ -500,6 +501,11 @@ const Solutions: React.FC<SolutionsProps> = ({
             setLanguage={setLanguage}
           />
 
+          {/* Conversation Section */}
+          <div className="bg-black/60 rounded-md p-4">
+            <ConversationSection />
+          </div>
+
           {/* Main Content - Modified width constraints */}
           <div className="w-full text-sm text-black bg-black/60 rounded-md">
             <div className="rounded-lg overflow-hidden">
diff --git a/src/components/Conversation/ConversationSection.tsx b/src/components/Conversation/ConversationSection.tsx
new file mode 100644
index 00000000..b3e0a2d0
--- /dev/null
+++ b/src/components/Conversation/ConversationSection.tsx
@@ -0,0 +1,309 @@
+/**
+ * ConversationSection - UI component for conversation recording and AI suggestions
+ * Follows Single Responsibility Principle - only handles conversation UI
+ * Uses existing ContentSection pattern for consistency
+ */
+import React, { useState, useEffect, useRef } from 'react';
+import { AudioRecorder } from '../../utils/audioRecorder';
+
+interface ConversationMessage {
+  id: string;
+  speaker: 'interviewer' | 'interviewee';
+  text: string;
+  timestamp: number;
+  edited?: boolean;
+}
+
+interface AISuggestion {
+  suggestions: string[];
+  reasoning: string;
+}
+
+// Reuse the same ContentSection style from Solutions.tsx for consistency
+const ContentSection = ({
+  title,
+  content,
+  isLoading
+}: {
+  title: string;
+  content: React.ReactNode;
+  isLoading: boolean;
+}) => (
+  <div className="space-y-2">
+    <h2 className="text-[13px] font-medium text-white tracking-wide">
+      {title}
+    </h2>
+    {isLoading ? (
+      <div className="mt-4 flex">
+        <p className="text-xs bg-gradient-to-r from-gray-300 via-gray-100 to-gray-300 bg-clip-text text-transparent animate-pulse">
+          Processing...
+        </p>
+      </div>
+    ) : (
+      <div className="text-[13px] leading-[1.4] text-gray-100 max-w-[600px]">
+        {content}
+      </div>
+    )}
+  </div>
+);
+
+export const ConversationSection: React.FC = () => {
+  const [messages, setMessages] = useState<ConversationMessage[]>([]);
+  const [isRecording, setIsRecording] = useState(false);
+  const [currentSpeaker, setCurrentSpeaker] = useState<'interviewer' | 'interviewee'>('interviewee');
+  const [aiSuggestions, setAiSuggestions] = useState<AISuggestion | null>(null);
+  const [isProcessing, setIsProcessing] = useState(false);
+  const [recordingDuration, setRecordingDuration] = useState(0);
+  const messagesEndRef = useRef<HTMLDivElement>(null);
+  const audioRecorderRef = useRef<AudioRecorder | null>(null);
+  const durationIntervalRef = useRef<NodeJS.Timeout | null>(null);
+
+  useEffect(() => {
+    loadConversation();
+    
+    const unsubscribeMessageAdded = window.electronAPI.onConversationMessageAdded((message: ConversationMessage) => {
+      setMessages(prev => [...prev, message]);
+      scrollToBottom();
+    });
+    
+    const unsubscribeSpeakerChanged = window.electronAPI.onSpeakerChanged((speaker: string) => {
+      setCurrentSpeaker(speaker as 'interviewer' | 'interviewee');
+    });
+
+    const unsubscribeMessageUpdated = window.electronAPI.onConversationMessageUpdated((message: ConversationMessage) => {
+      setMessages(prev => prev.map(msg => msg.id === message.id ? message : msg));
+    });
+
+    const unsubscribeCleared = window.electronAPI.onConversationCleared(() => {
+      setMessages([]);
+      setAiSuggestions(null);
+    });
+
+    // Toggle recording on the window 'toggle-recording' event. NOTE(review): this effect has [] deps, so the handlers called below are first-render closures; handleStopRecording reads the initial isRecording/currentSpeaker state and returns early - confirm and fix (e.g. keep them in refs).
+    const handleToggleRecording = async () => {
+      const currentIsRecording = audioRecorderRef.current?.getIsRecording() || false;
+      if (currentIsRecording) {
+        await handleStopRecording();
+      } else {
+        await handleStartRecording();
+      }
+    };
+
+    window.addEventListener('toggle-recording', handleToggleRecording);
+
+    return () => {
+      unsubscribeMessageAdded();
+      unsubscribeSpeakerChanged();
+      unsubscribeMessageUpdated();
+      unsubscribeCleared();
+      window.removeEventListener('toggle-recording', handleToggleRecording);
+      if (durationIntervalRef.current) {
+        clearInterval(durationIntervalRef.current);
+      }
+    };
+  }, []);
+
+  const scrollToBottom = () => {
+    messagesEndRef.current?.scrollIntoView({ behavior: 'smooth' });
+  };
+
+  const loadConversation = async () => {
+    try {
+      const result = await window.electronAPI.getConversation();
+      if (result.success) {
+        setMessages(result.messages);
+        scrollToBottom();
+      }
+    } catch (error) {
+      console.error('Failed to load conversation:', error);
+    }
+  };
+
+  const handleStartRecording = async () => {
+    try {
+      if (!audioRecorderRef.current) {
+        audioRecorderRef.current = new AudioRecorder();
+      }
+      
+      await audioRecorderRef.current.startRecording();
+      setIsRecording(true);
+      setRecordingDuration(0);
+      
+      // Start duration counter
+      durationIntervalRef.current = setInterval(() => {
+        setRecordingDuration(prev => prev + 1);
+      }, 1000);
+    } catch (error: any) {
+      console.error('Failed to start recording:', error);
+      alert(error.message || 'Failed to start recording. Please check microphone permissions.');
+    }
+  };
+
+  const handleStopRecording = async () => {
+    if (!audioRecorderRef.current || !isRecording) return;
+    
+    setIsRecording(false);
+    if (durationIntervalRef.current) {
+      clearInterval(durationIntervalRef.current);
+      durationIntervalRef.current = null;
+    }
+    
+    setIsProcessing(true);
+    try {
+      const audioBlob = await audioRecorderRef.current.stopRecording();
+      
+      // Convert blob to ArrayBuffer
+      const arrayBuffer = await audioBlob.arrayBuffer();
+      
+      // Transcribe
+      const transcribeResult = await window.electronAPI.transcribeAudio(arrayBuffer, audioBlob.type);
+      
+      if (transcribeResult.success && transcribeResult.result) {
+        const text = transcribeResult.result.text;
+        
+        // Add message
+        await window.electronAPI.addConversationMessage(text, currentSpeaker);
+        
+        // If interviewer question, get AI suggestions
+        if (currentSpeaker === 'interviewer') {
+          await fetchAISuggestions(text);
+        } else {
+          // Clear suggestions when interviewee responds
+          setAiSuggestions(null);
+        }
+      }
+    } catch (error: any) {
+      console.error('Failed to process recording:', error);
+      alert(error.message || 'Failed to process recording');
+    } finally {
+      setIsProcessing(false);
+      setRecordingDuration(0);
+    }
+  };
+
+  const fetchAISuggestions = async (question: string) => {
+    try {
+      const result = await window.electronAPI.getAnswerSuggestions(question);
+      if (result.success && result.suggestions) {
+        setAiSuggestions(result.suggestions);
+      }
+    } catch (error: any) {
+      console.error('Failed to get AI suggestions:', error);
+      // Don't show alert for suggestion errors - it's not critical
+    }
+  };
+
+  const handleToggleSpeaker = async () => {
+    try {
+      const result = await window.electronAPI.toggleSpeaker();
+      if (result.success) {
+        setCurrentSpeaker(result.speaker);
+        setAiSuggestions(null); // Clear suggestions when switching speaker
+      }
+    } catch (error) {
+      console.error('Failed to toggle speaker:', error);
+    }
+  };
+
+  const formatTime = (timestamp: number) => {
+    return new Date(timestamp).toLocaleTimeString([], { 
+      hour: '2-digit', 
+      minute: '2-digit' 
+    });
+  };
+
+  const formatDuration = (seconds: number) => {
+    const mins = Math.floor(seconds / 60);
+    const secs = seconds % 60;
+    return `${mins}:${secs.toString().padStart(2, '0')}`;
+  };
+
+  return (
+    <div className="space-y-3">
+      {/* Recording Controls */}
+      <div className="flex items-center gap-3 flex-wrap">
+        <button
+          onClick={isRecording ? handleStopRecording : handleStartRecording}
+          disabled={isProcessing}
+          className={`px-3 py-1.5 rounded text-xs font-medium transition disabled:opacity-50 disabled:cursor-not-allowed ${
+            isRecording
+              ? 'bg-red-600 hover:bg-red-700 text-white'
+              : 'bg-green-600 hover:bg-green-700 text-white'
+          }`}
+        >
+          {isRecording ? `⏹ Stop (${formatDuration(recordingDuration)})` : '⏺ Start Recording'}
+        </button>
+        
+        <button
+          onClick={handleToggleSpeaker}
+          disabled={isRecording || isProcessing}
+          className="px-3 py-1.5 rounded text-xs font-medium bg-blue-600 hover:bg-blue-700 text-white disabled:opacity-50 disabled:cursor-not-allowed"
+        >
+          {currentSpeaker === 'interviewer' ? '👤 Interviewer' : '🎤 You'}
+        </button>
+        
+        {isProcessing && (
+          <span className="text-xs text-white/70">Processing...</span>
+        )}
+      </div>
+
+      {/* Messages */}
+      {messages.length > 0 && (
+        <ContentSection
+          title="Conversation"
+          content={
+            <div className="space-y-3">
+              {messages.map((message) => (
+                <div
+                  key={message.id}
+                  className={`flex flex-col ${
+                    message.speaker === 'interviewer' ? 'items-start' : 'items-end'
+                  }`}
+                >
+                  <div
+                    className={`max-w-[80%] rounded-lg p-2.5 ${
+                      message.speaker === 'interviewer'
+                        ? 'bg-blue-600/20 border border-blue-500/30'
+                        : 'bg-green-600/20 border border-green-500/30'
+                    }`}
+                  >
+                    <div className="text-xs text-white/60 mb-1">
+                      {message.speaker === 'interviewer' ? '👤 Interviewer' : '🎤 You'}
+                    </div>
+                    <div className="text-white text-[13px]">{message.text}</div>
+                    <div className="text-xs text-white/40 mt-1">
+                      {formatTime(message.timestamp)}
+                    </div>
+                  </div>
+                </div>
+              ))}
+            </div>
+          }
+          isLoading={false}
+        />
+      )}
+
+      {/* AI Suggestions - styled like "My Thoughts" from Solutions */}
+      {aiSuggestions && (
+        <ContentSection
+          title="🤖 AI Answer Suggestions"
+          content={
+            <div className="space-y-3">
+              <div className="space-y-1">
+                {aiSuggestions.suggestions.map((suggestion, index) => (
+                  <div key={index} className="flex items-start gap-2">
+                    <div className="w-1 h-1 rounded-full bg-purple-400/80 mt-2 shrink-0" />
+                    <div className="text-[13px]">{suggestion}</div>
+                  </div>
+                ))}
+              </div>
+            </div>
+          }
+          isLoading={false}
+        />
+      )}
+      
+      <div ref={messagesEndRef} />
+    </div>
+  );
+};
diff --git a/src/types/electron.d.ts b/src/types/electron.d.ts
index a467cae3..59b067b9 100644
--- a/src/types/electron.d.ts
+++ b/src/types/electron.d.ts
@@ -61,6 +61,19 @@ export interface ElectronAPI {
   openLink: (url: string) => void
   onApiKeyInvalid: (callback: () => void) => () => void
   removeListener: (eventName: string, callback: (...args: any[]) => void) => void
+  
+  // Conversation & Transcription methods
+  transcribeAudio: (audioBuffer: ArrayBuffer, mimeType: string) => Promise<{ success: boolean; result?: { text: string; language?: string }; error?: string }>
+  addConversationMessage: (text: string, speaker?: string) => Promise<{ success: boolean; message?: any; error?: string }>
+  toggleSpeaker: () => Promise<{ success: boolean; speaker?: string; error?: string }>
+  getConversation: () => Promise<{ success: boolean; messages?: any[]; error?: string }>
+  clearConversation: () => Promise<{ success: boolean; error?: string }>
+  updateConversationMessage: (messageId: string, newText: string) => Promise<{ success: boolean; error?: string }>
+  getAnswerSuggestions: (question: string, screenshotContext?: string) => Promise<{ success: boolean; suggestions?: { suggestions: string[]; reasoning: string }; error?: string }>
+  onConversationMessageAdded: (callback: (message: any) => void) => () => void
+  onSpeakerChanged: (callback: (speaker: string) => void) => () => void
+  onConversationMessageUpdated: (callback: (message: any) => void) => () => void
+  onConversationCleared: (callback: () => void) => () => void
 }
 
 declare global {
diff --git a/src/utils/audioRecorder.ts b/src/utils/audioRecorder.ts
new file mode 100644
index 00000000..060bffe9
--- /dev/null
+++ b/src/utils/audioRecorder.ts
@@ -0,0 +1,133 @@
+/**
+ * AudioRecorder - Handles microphone recording using the MediaStream Recording API (MediaRecorder)
+ * Follows Single Responsibility Principle - only handles audio recording
+ */
+export interface IAudioRecorder {
+  startRecording(): Promise<void>;
+  stopRecording(): Promise<Blob>;
+  getIsRecording(): boolean;
+}
+
+export class AudioRecorder implements IAudioRecorder {
+  private mediaRecorder: MediaRecorder | null = null;
+  private audioChunks: Blob[] = [];
+  private stream: MediaStream | null = null;
+  private isRecording: boolean = false;
+
+  /**
+   * Starts audio recording from the user's microphone.
+   * Does nothing if a recording is already in progress, so the active stream
+   * and recorder are never overwritten while still running.
+   * @throws Error if the microphone cannot be accessed or the recorder cannot be started
+   */
+  async startRecording(): Promise<void> {
+    if (this.isRecording) {
+      return;
+    }
+
+    let streamAcquired = false;
+    try {
+      const stream = await navigator.mediaDevices.getUserMedia({
+        audio: {
+          sampleRate: 16000, // Whisper prefers 16kHz
+          channelCount: 1,   // Mono
+          echoCancellation: true,
+          noiseSuppression: true,
+        }
+      });
+
+      this.stream = stream;
+      streamAcquired = true;
+      this.audioChunks = [];
+
+      // Record as WebM with the Opus codec
+      const options = { mimeType: 'audio/webm;codecs=opus' };
+      this.mediaRecorder = new MediaRecorder(stream, options);
+
+      this.mediaRecorder.ondataavailable = (event) => {
+        if (event.data.size > 0) {
+          this.audioChunks.push(event.data);
+        }
+      };
+
+      this.mediaRecorder.start(1000); // Collect data every second
+      this.isRecording = true;
+    } catch (error) {
+      console.error('Error starting recording:', error);
+      // If the failure happened after the microphone was opened (while creating
+      // or starting the recorder), release it so the device is not left held open.
+      if (streamAcquired) {
+        this.cleanup();
+      }
+      throw new Error('Failed to access microphone. Please check permissions.');
+    }
+  }
+
+  /**
+   * Stops recording and returns the audio blob
+   * @returns Promise resolving to the recorded audio blob (type 'audio/webm')
+   * @throws Error if not currently recording, or if the recorder fails while stopping
+   */
+  async stopRecording(): Promise<Blob> {
+    return new Promise((resolve, reject) => {
+      const recorder = this.mediaRecorder;
+      if (!recorder || !this.isRecording) {
+        reject(new Error('Not currently recording'));
+        return;
+      }
+
+      const finish = () => {
+        const audioBlob = new Blob(this.audioChunks, { type: 'audio/webm' });
+        this.cleanup();
+        resolve(audioBlob);
+      };
+
+      // The recorder may already have stopped on its own (e.g. its tracks ended);
+      // no further 'stop' event would fire, so return what was captured right away.
+      if (recorder.state === 'inactive') {
+        finish();
+        return;
+      }
+
+      recorder.onstop = finish;
+
+      recorder.onerror = (event) => {
+        // Interpolating the event object itself only yields "[object Event]";
+        // report the underlying error message when the event carries one.
+        const cause: unknown = event.error;
+        const detail = cause instanceof Error ? cause.message : event.type;
+        this.cleanup();
+        reject(new Error(`Recording error: ${detail}`));
+      };
+
+      try {
+        recorder.stop();
+        this.isRecording = false;
+      } catch (error) {
+        // Do not stay marked as recording (or keep the microphone open) if stop() throws.
+        this.cleanup();
+        reject(error);
+      }
+    });
+  }
+
+  /**
+   * Gets the current recording state
+   */
+  getIsRecording(): boolean {
+    return this.isRecording;
+  }
+
+  /**
+   * Cleans up resources (stops tracks, clears state, resets the recording flag)
+   */
+  private cleanup(): void {
+    if (this.stream) {
+      this.stream.getTracks().forEach(track => track.stop());
+      this.stream = null;
+    }
+    this.mediaRecorder = null;
+    this.audioChunks = [];
+    this.isRecording = false;
+  }
+}
diff --git a/stealth-run.sh b/stealth-run.sh
old mode 100644
new mode 100755

From ee3592753c7ba970d651581e864dc8a3b6e2aa0e Mon Sep 17 00:00:00 2001
From: Pratik Shankar Jadhav
 <44173994+pratikjadhav2726@users.noreply.github.com>
Date: Sun, 11 Jan 2026 03:23:55 -0800
Subject: [PATCH 02/13] feat: added conversations view with screenshot support
 for coding and normal interview as well

---
 electron/ProcessingHelper.ts                  |  49 ++++++-
 electron/main.ts                              |   4 +-
 src/_pages/Queue.tsx                          |   2 +-
 src/_pages/Solutions.tsx                      |   2 +-
 .../Conversation/ConversationSection.tsx      | 130 ++++++++++--------
 src/components/Queue/QueueCommands.tsx        |  68 +++++++++
 src/components/Settings/SettingsDialog.tsx    |   6 +
 src/components/Solutions/SolutionCommands.tsx |  68 +++++++++
 8 files changed, 266 insertions(+), 63 deletions(-)

diff --git a/electron/ProcessingHelper.ts b/electron/ProcessingHelper.ts
index 0dcd26f0..9f40916b 100644
--- a/electron/ProcessingHelper.ts
+++ b/electron/ProcessingHelper.ts
@@ -66,6 +66,22 @@ export class ProcessingHelper {
       this.initializeAIClient();
     });
   }
+
+  /**
+   * Get conversation context for integration with screenshot processing
+   */
+  private getConversationContext(): string | null {
+    try {
+      const conversationManager = this.deps.getConversationManager?.();
+      if (conversationManager) {
+        const history = conversationManager.getConversationHistory();
+        return history && history.trim().length > 0 ? history : null;
+      }
+    } catch (error) {
+      console.error('Error getting conversation context:', error);
+    }
+    return null;
+  }
   
   /**
    * Initialize or reinitialize the AI client with current config
@@ -473,18 +489,29 @@ export class ProcessingHelper {
           }
         }
 
+        // Get conversation context if available
+        const conversationContext = this.getConversationContext();
+        
         // Use OpenAI for processing
+        const systemPrompt = conversationContext
+          ? `You are a coding challenge interpreter. Analyze the screenshot of the coding problem and extract all relevant information. Consider the conversation context provided. Return the information in JSON format with these fields: problem_statement, constraints, example_input, example_output. Just return the structured JSON without any other text.`
+          : "You are a coding challenge interpreter. Analyze the screenshot of the coding problem and extract all relevant information. Return the information in JSON format with these fields: problem_statement, constraints, example_input, example_output. Just return the structured JSON without any other text.";
+        
+        const userPrompt = conversationContext
+          ? `Extract the coding problem details from these screenshots. Consider the following conversation context:\n\n${conversationContext}\n\nReturn in JSON format. Preferred coding language we gonna use for this problem is ${language}.`
+          : `Extract the coding problem details from these screenshots. Return in JSON format. Preferred coding language we gonna use for this problem is ${language}.`;
+        
         const messages = [
           {
             role: "system" as const, 
-            content: "You are a coding challenge interpreter. Analyze the screenshot of the coding problem and extract all relevant information. Return the information in JSON format with these fields: problem_statement, constraints, example_input, example_output. Just return the structured JSON without any other text."
+            content: systemPrompt
           },
           {
             role: "user" as const,
             content: [
               {
                 type: "text" as const, 
-                text: `Extract the coding problem details from these screenshots. Return in JSON format. Preferred coding language we gonna use for this problem is ${language}.`
+                text: userPrompt
               },
               ...imageDataList.map(data => ({
                 type: "image_url" as const,
@@ -525,13 +552,20 @@ export class ProcessingHelper {
         }
 
         try {
+          // Get conversation context if available
+          const conversationContext = this.getConversationContext();
+          
+          const geminiPrompt = conversationContext
+            ? `You are a coding challenge interpreter. Analyze the screenshots of the coding problem and extract all relevant information. Consider the following conversation context:\n\n${conversationContext}\n\nReturn the information in JSON format with these fields: problem_statement, constraints, example_input, example_output. Just return the structured JSON without any other text. Preferred coding language we gonna use for this problem is ${language}.`
+            : `You are a coding challenge interpreter. Analyze the screenshots of the coding problem and extract all relevant information. Return the information in JSON format with these fields: problem_statement, constraints, example_input, example_output. Just return the structured JSON without any other text. Preferred coding language we gonna use for this problem is ${language}.`;
+          
           // Create Gemini message structure
           const geminiMessages: GeminiMessage[] = [
             {
               role: "user",
               parts: [
                 {
-                  text: `You are a coding challenge interpreter. Analyze the screenshots of the coding problem and extract all relevant information. Return the information in JSON format with these fields: problem_statement, constraints, example_input, example_output. Just return the structured JSON without any other text. Preferred coding language we gonna use for this problem is ${language}.`
+                  text: geminiPrompt
                 },
                 ...imageDataList.map(data => ({
                   inlineData: {
@@ -583,13 +617,20 @@ export class ProcessingHelper {
         }
 
         try {
+          // Get conversation context if available
+          const conversationContext = this.getConversationContext();
+          
+          const anthropicPrompt = conversationContext
+            ? `Extract the coding problem details from these screenshots. Consider the following conversation context:\n\n${conversationContext}\n\nReturn in JSON format with these fields: problem_statement, constraints, example_input, example_output. Preferred coding language is ${language}.`
+            : `Extract the coding problem details from these screenshots. Return in JSON format with these fields: problem_statement, constraints, example_input, example_output. Preferred coding language is ${language}.`;
+          
           const messages = [
             {
               role: "user" as const,
               content: [
                 {
                   type: "text" as const,
-                  text: `Extract the coding problem details from these screenshots. Return in JSON format with these fields: problem_statement, constraints, example_input, example_output. Preferred coding language is ${language}.`
+                  text: anthropicPrompt
                 },
                 ...imageDataList.map(data => ({
                   type: "image" as const,
diff --git a/electron/main.ts b/electron/main.ts
index 752e5963..ea751ec1 100644
--- a/electron/main.ts
+++ b/electron/main.ts
@@ -73,6 +73,7 @@ export interface IProcessingHelperDeps {
   setHasDebugged: (value: boolean) => void
   getHasDebugged: () => boolean
   PROCESSING_EVENTS: typeof state.PROCESSING_EVENTS
+  getConversationManager?: () => import('./ConversationManager').ConversationManager | null
 }
 
 export interface IShortcutsHelperDeps {
@@ -133,7 +134,8 @@ async function initializeHelpers() {
     deleteScreenshot,
     setHasDebugged,
     getHasDebugged,
-    PROCESSING_EVENTS: state.PROCESSING_EVENTS
+    PROCESSING_EVENTS: state.PROCESSING_EVENTS,
+    getConversationManager: () => state.conversationManager
   } as IProcessingHelperDeps)
   
   // Initialize conversation and transcription helpers
diff --git a/src/_pages/Queue.tsx b/src/_pages/Queue.tsx
index 9b40be6e..a384bb32 100644
--- a/src/_pages/Queue.tsx
+++ b/src/_pages/Queue.tsx
@@ -142,7 +142,7 @@ const Queue: React.FC<QueueProps> = ({
       <div className="px-4 py-3">
         <div className="space-y-3 w-full">
           {/* Conversation Section - Works independently of screenshots */}
-          <div className="bg-black/60 rounded-md p-4">
+          <div className="bg-black/60 rounded-md p-4" style={{ height: '500px', display: 'flex', flexDirection: 'column' }}>
             <ConversationSection />
           </div>
 
diff --git a/src/_pages/Solutions.tsx b/src/_pages/Solutions.tsx
index 0bdcf7d5..79cacb2c 100644
--- a/src/_pages/Solutions.tsx
+++ b/src/_pages/Solutions.tsx
@@ -502,7 +502,7 @@ const Solutions: React.FC<SolutionsProps> = ({
           />
 
           {/* Conversation Section */}
-          <div className="bg-black/60 rounded-md p-4">
+          <div className="bg-black/60 rounded-md p-4" style={{ height: '500px', display: 'flex', flexDirection: 'column' }}>
             <ConversationSection />
           </div>
 
diff --git a/src/components/Conversation/ConversationSection.tsx b/src/components/Conversation/ConversationSection.tsx
index b3e0a2d0..40e71342 100644
--- a/src/components/Conversation/ConversationSection.tsx
+++ b/src/components/Conversation/ConversationSection.tsx
@@ -2,8 +2,10 @@
  * ConversationSection - UI component for conversation recording and AI suggestions
  * Follows Single Responsibility Principle - only handles conversation UI
  * Uses existing ContentSection pattern for consistency
+ * Integrates with screenshot system for cohesive experience
  */
 import React, { useState, useEffect, useRef } from 'react';
+import { useQueryClient } from '@tanstack/react-query';
 import { AudioRecorder } from '../../utils/audioRecorder';
 
 interface ConversationMessage {
@@ -48,6 +50,7 @@ const ContentSection = ({
 );
 
 export const ConversationSection: React.FC = () => {
+  const queryClient = useQueryClient();
   const [messages, setMessages] = useState<ConversationMessage[]>([]);
   const [isRecording, setIsRecording] = useState(false);
   const [currentSpeaker, setCurrentSpeaker] = useState<'interviewer' | 'interviewee'>('interviewee');
@@ -167,10 +170,8 @@ export const ConversationSection: React.FC = () => {
         // If interviewer question, get AI suggestions
         if (currentSpeaker === 'interviewer') {
           await fetchAISuggestions(text);
-        } else {
-          // Clear suggestions when interviewee responds
-          setAiSuggestions(null);
         }
+        // Don't clear suggestions when interviewee responds - user needs to see them!
       }
     } catch (error: any) {
       console.error('Failed to process recording:', error);
@@ -183,7 +184,15 @@ export const ConversationSection: React.FC = () => {
 
   const fetchAISuggestions = async (question: string) => {
     try {
-      const result = await window.electronAPI.getAnswerSuggestions(question);
+      // Get problem statement from query cache if available (from screenshots)
+      const problemStatement = queryClient.getQueryData(['problem_statement']) as any;
+      let screenshotContext: string | undefined;
+      
+      if (problemStatement?.problem_statement) {
+        screenshotContext = `Problem Statement: ${problemStatement.problem_statement}\nConstraints: ${problemStatement.constraints || 'N/A'}\nExample Input: ${problemStatement.example_input || 'N/A'}\nExample Output: ${problemStatement.example_output || 'N/A'}`;
+      }
+      
+      const result = await window.electronAPI.getAnswerSuggestions(question, screenshotContext);
       if (result.success && result.suggestions) {
         setAiSuggestions(result.suggestions);
       }
@@ -198,7 +207,7 @@ export const ConversationSection: React.FC = () => {
       const result = await window.electronAPI.toggleSpeaker();
       if (result.success) {
         setCurrentSpeaker(result.speaker);
-        setAiSuggestions(null); // Clear suggestions when switching speaker
+        // Don't clear suggestions - user needs to see them when preparing their answer!
       }
     } catch (error) {
       console.error('Failed to toggle speaker:', error);
@@ -219,9 +228,9 @@ export const ConversationSection: React.FC = () => {
   };
 
   return (
-    <div className="space-y-3">
-      {/* Recording Controls */}
-      <div className="flex items-center gap-3 flex-wrap">
+    <div className="flex flex-col h-full">
+      {/* Recording Controls - Always visible at top */}
+      <div className="flex items-center gap-3 flex-wrap flex-shrink-0 mb-3">
         <button
           onClick={isRecording ? handleStopRecording : handleStartRecording}
           disabled={isProcessing}
@@ -247,63 +256,72 @@ export const ConversationSection: React.FC = () => {
         )}
       </div>
 
-      {/* Messages */}
-      {messages.length > 0 && (
-        <ContentSection
-          title="Conversation"
-          content={
-            <div className="space-y-3">
-              {messages.map((message) => (
-                <div
-                  key={message.id}
-                  className={`flex flex-col ${
-                    message.speaker === 'interviewer' ? 'items-start' : 'items-end'
-                  }`}
-                >
+      {/* Scrollable Conversation Area - Takes remaining space above AI suggestions */}
+      <div 
+        className="overflow-y-auto flex-1 min-h-0 mb-3 pr-2"
+        style={{ 
+          maxHeight: aiSuggestions ? 'calc(100% - 180px)' : '100%',
+          scrollBehavior: 'smooth'
+        }}
+      >
+        {messages.length > 0 && (
+          <ContentSection
+            title="Conversation"
+            content={
+              <div className="space-y-3">
+                {messages.map((message) => (
                   <div
-                    className={`max-w-[80%] rounded-lg p-2.5 ${
-                      message.speaker === 'interviewer'
-                        ? 'bg-blue-600/20 border border-blue-500/30'
-                        : 'bg-green-600/20 border border-green-500/30'
+                    key={message.id}
+                    className={`flex flex-col ${
+                      message.speaker === 'interviewer' ? 'items-start' : 'items-end'
                     }`}
                   >
-                    <div className="text-xs text-white/60 mb-1">
-                      {message.speaker === 'interviewer' ? '👤 Interviewer' : '🎤 You'}
-                    </div>
-                    <div className="text-white text-[13px]">{message.text}</div>
-                    <div className="text-xs text-white/40 mt-1">
-                      {formatTime(message.timestamp)}
+                    <div
+                      className={`max-w-[80%] rounded-lg p-2.5 ${
+                        message.speaker === 'interviewer'
+                          ? 'bg-blue-600/20 border border-blue-500/30'
+                          : 'bg-green-600/20 border border-green-500/30'
+                      }`}
+                    >
+                      <div className="text-xs text-white/60 mb-1">
+                        {message.speaker === 'interviewer' ? '👤 Interviewer' : '🎤 You'}
+                      </div>
+                      <div className="text-white text-[13px]">{message.text}</div>
+                      <div className="text-xs text-white/40 mt-1">
+                        {formatTime(message.timestamp)}
+                      </div>
                     </div>
                   </div>
-                </div>
-              ))}
-            </div>
-          }
-          isLoading={false}
-        />
-      )}
+                ))}
+              </div>
+            }
+            isLoading={false}
+          />
+        )}
+        <div ref={messagesEndRef} />
+      </div>
 
-      {/* AI Suggestions - styled like "My Thoughts" from Solutions */}
+      {/* AI Suggestions - Fixed at bottom, always visible, never scrolls */}
       {aiSuggestions && (
-        <ContentSection
-          title="🤖 AI Answer Suggestions"
-          content={
-            <div className="space-y-3">
-              <div className="space-y-1">
-                {aiSuggestions.suggestions.map((suggestion, index) => (
-                  <div key={index} className="flex items-start gap-2">
-                    <div className="w-1 h-1 rounded-full bg-purple-400/80 mt-2 shrink-0" />
-                    <div className="text-[13px]">{suggestion}</div>
-                  </div>
-                ))}
+        <div className="flex-shrink-0 border-t border-white/10 pt-3 bg-black/60 -mx-4 -mb-4 px-4 pb-4">
+          <ContentSection
+            title="🤖 AI Answer Suggestions"
+            content={
+              <div className="space-y-3">
+                <div className="space-y-1">
+                  {aiSuggestions.suggestions.map((suggestion, index) => (
+                    <div key={index} className="flex items-start gap-2">
+                      <div className="w-1 h-1 rounded-full bg-purple-400/80 mt-2 shrink-0" />
+                      <div className="text-[13px]">{suggestion}</div>
+                    </div>
+                  ))}
+                </div>
               </div>
-            </div>
-          }
-          isLoading={false}
-        />
+            }
+            isLoading={false}
+          />
+        </div>
       )}
-      
-      <div ref={messagesEndRef} />
     </div>
   );
 };
diff --git a/src/components/Queue/QueueCommands.tsx b/src/components/Queue/QueueCommands.tsx
index 88d6c283..f33fe518 100644
--- a/src/components/Queue/QueueCommands.tsx
+++ b/src/components/Queue/QueueCommands.tsx
@@ -321,6 +321,74 @@ const QueueCommands: React.FC<QueueCommandsProps> = ({
                         </p>
                       </div>
 
+                      {/* Start/Stop Recording Command */}
+                      <div
+                        className="cursor-pointer rounded px-2 py-1.5 hover:bg-white/10 transition-colors"
+                        onClick={async () => {
+                          try {
+                            const event = new CustomEvent('toggle-recording');
+                            window.dispatchEvent(event);
+                          } catch (error) {
+                            console.error("Error toggling recording:", error)
+                            showToast(
+                              "Error",
+                              "Failed to toggle recording",
+                              "error"
+                            )
+                          }
+                        }}
+                      >
+                        <div className="flex items-center justify-between">
+                          <span className="truncate">Start/Stop Recording</span>
+                          <div className="flex gap-1 flex-shrink-0">
+                            <span className="bg-white/20 px-1.5 py-0.5 rounded text-[10px] leading-none">
+                              {COMMAND_KEY}
+                            </span>
+                            <span className="bg-white/20 px-1.5 py-0.5 rounded text-[10px] leading-none">
+                              M
+                            </span>
+                          </div>
+                        </div>
+                        <p className="text-[10px] leading-relaxed text-white/70 truncate mt-1">
+                          Record interview conversation for transcription.
+                        </p>
+                      </div>
+
+                      {/* Toggle Speaker Mode Command */}
+                      <div
+                        className="cursor-pointer rounded px-2 py-1.5 hover:bg-white/10 transition-colors"
+                        onClick={async () => {
+                          try {
+                            await window.electronAPI.toggleSpeaker();
+                          } catch (error) {
+                            console.error("Error toggling speaker:", error)
+                            showToast(
+                              "Error",
+                              "Failed to toggle speaker mode",
+                              "error"
+                            )
+                          }
+                        }}
+                      >
+                        <div className="flex items-center justify-between">
+                          <span className="truncate">Toggle Speaker Mode</span>
+                          <div className="flex gap-1 flex-shrink-0">
+                            <span className="bg-white/20 px-1.5 py-0.5 rounded text-[10px] leading-none">
+                              {COMMAND_KEY}
+                            </span>
+                            <span className="bg-white/20 px-1.5 py-0.5 rounded text-[10px] leading-none">
+                              Shift
+                            </span>
+                            <span className="bg-white/20 px-1.5 py-0.5 rounded text-[10px] leading-none">
+                              M
+                            </span>
+                          </div>
+                        </div>
+                        <p className="text-[10px] leading-relaxed text-white/70 truncate mt-1">
+                          Switch between Interviewer and You mode.
+                        </p>
+                      </div>
+
                       {/* Solve Command */}
                       <div
                         className={`cursor-pointer rounded px-2 py-1.5 hover:bg-white/10 transition-colors ${
diff --git a/src/components/Settings/SettingsDialog.tsx b/src/components/Settings/SettingsDialog.tsx
index 463ea120..3460ca8b 100644
--- a/src/components/Settings/SettingsDialog.tsx
+++ b/src/components/Settings/SettingsDialog.tsx
@@ -467,6 +467,12 @@ export function SettingsDialog({ open: externalOpen, onOpenChange }: SettingsDia
                 <div className="text-white/70">Take Screenshot</div>
                 <div className="text-white/90 font-mono">Ctrl+H / Cmd+H</div>
                 
+                <div className="text-white/70">Start/Stop Recording</div>
+                <div className="text-white/90 font-mono">Ctrl+M / Cmd+M</div>
+                
+                <div className="text-white/70">Toggle Speaker Mode</div>
+                <div className="text-white/90 font-mono">Ctrl+Shift+M / Cmd+Shift+M</div>
+                
                 <div className="text-white/70">Process Screenshots</div>
                 <div className="text-white/90 font-mono">Ctrl+Enter / Cmd+Enter</div>
                 
diff --git a/src/components/Solutions/SolutionCommands.tsx b/src/components/Solutions/SolutionCommands.tsx
index 49497299..4701c854 100644
--- a/src/components/Solutions/SolutionCommands.tsx
+++ b/src/components/Solutions/SolutionCommands.tsx
@@ -324,6 +324,74 @@ const SolutionCommands: React.FC<SolutionCommandsProps> = ({
                             </p>
                           </div>
 
+                          {/* Start/Stop Recording Command */}
+                          <div
+                            className="cursor-pointer rounded px-2 py-1.5 hover:bg-white/10 transition-colors"
+                            onClick={async () => {
+                              try {
+                                const event = new CustomEvent('toggle-recording');
+                                window.dispatchEvent(event);
+                              } catch (error) {
+                                console.error("Error toggling recording:", error)
+                                showToast(
+                                  "Error",
+                                  "Failed to toggle recording",
+                                  "error"
+                                )
+                              }
+                            }}
+                          >
+                            <div className="flex items-center justify-between">
+                              <span className="truncate">Start/Stop Recording</span>
+                              <div className="flex gap-1 flex-shrink-0">
+                                <span className="bg-white/20 px-1.5 py-0.5 rounded text-[10px] leading-none">
+                                  {COMMAND_KEY}
+                                </span>
+                                <span className="bg-white/20 px-1.5 py-0.5 rounded text-[10px] leading-none">
+                                  M
+                                </span>
+                              </div>
+                            </div>
+                            <p className="text-[10px] leading-relaxed text-white/70 truncate mt-1">
+                              Record interview conversation for transcription.
+                            </p>
+                          </div>
+
+                          {/* Toggle Speaker Mode Command */}
+                          <div
+                            className="cursor-pointer rounded px-2 py-1.5 hover:bg-white/10 transition-colors"
+                            onClick={async () => {
+                              try {
+                                await window.electronAPI.toggleSpeaker();
+                              } catch (error) {
+                                console.error("Error toggling speaker:", error)
+                                showToast(
+                                  "Error",
+                                  "Failed to toggle speaker mode",
+                                  "error"
+                                )
+                              }
+                            }}
+                          >
+                            <div className="flex items-center justify-between">
+                              <span className="truncate">Toggle Speaker Mode</span>
+                              <div className="flex gap-1 flex-shrink-0">
+                                <span className="bg-white/20 px-1.5 py-0.5 rounded text-[10px] leading-none">
+                                  {COMMAND_KEY}
+                                </span>
+                                <span className="bg-white/20 px-1.5 py-0.5 rounded text-[10px] leading-none">
+                                  Shift
+                                </span>
+                                <span className="bg-white/20 px-1.5 py-0.5 rounded text-[10px] leading-none">
+                                  M
+                                </span>
+                              </div>
+                            </div>
+                            <p className="text-[10px] leading-relaxed text-white/70 truncate mt-1">
+                              Switch between Interviewer and You mode.
+                            </p>
+                          </div>
+
                           {extraScreenshots.length > 0 && (
                             <div
                               className="cursor-pointer rounded px-2 py-1.5 hover:bg-white/10 transition-colors"

From 7a508110c4324b188d8542df7d2da90959ea52c0 Mon Sep 17 00:00:00 2001
From: Pratik Shankar Jadhav
 <44173994+pratikjadhav2726@users.noreply.github.com>
Date: Sun, 11 Jan 2026 03:27:27 -0800
Subject: [PATCH 03/13] fix: cmd +m for toggle recording for ease

---
 .../Conversation/ConversationSection.tsx      | 25 +++++++++++++++++--
 1 file changed, 23 insertions(+), 2 deletions(-)

diff --git a/src/components/Conversation/ConversationSection.tsx b/src/components/Conversation/ConversationSection.tsx
index 40e71342..351ae463 100644
--- a/src/components/Conversation/ConversationSection.tsx
+++ b/src/components/Conversation/ConversationSection.tsx
@@ -61,6 +61,13 @@ export const ConversationSection: React.FC = () => {
   const audioRecorderRef = useRef<AudioRecorder | null>(null);
   const durationIntervalRef = useRef<NodeJS.Timeout | null>(null);
 
+  // Use ref to track recording state for event listener
+  const isRecordingRef = useRef(false);
+  
+  useEffect(() => {
+    isRecordingRef.current = isRecording;
+  }, [isRecording]);
+
   useEffect(() => {
     loadConversation();
     
@@ -84,7 +91,8 @@ export const ConversationSection: React.FC = () => {
 
     // Listen for keyboard shortcut to toggle recording
     const handleToggleRecording = async () => {
-      const currentIsRecording = audioRecorderRef.current?.getIsRecording() || false;
+      // Check actual recording state using ref to get latest value
+      const currentIsRecording = isRecordingRef.current || (audioRecorderRef.current?.getIsRecording() || false);
       if (currentIsRecording) {
         await handleStopRecording();
       } else {
@@ -124,12 +132,19 @@ export const ConversationSection: React.FC = () => {
 
   const handleStartRecording = async () => {
     try {
+      // Check if already recording
+      if (audioRecorderRef.current?.getIsRecording()) {
+        console.log('Already recording');
+        return;
+      }
+      
       if (!audioRecorderRef.current) {
         audioRecorderRef.current = new AudioRecorder();
       }
       
       await audioRecorderRef.current.startRecording();
       setIsRecording(true);
+      isRecordingRef.current = true;
       setRecordingDuration(0);
       
       // Start duration counter
@@ -143,9 +158,15 @@ export const ConversationSection: React.FC = () => {
   };
 
   const handleStopRecording = async () => {
-    if (!audioRecorderRef.current || !isRecording) return;
+    // Check recorder state directly instead of React state to avoid stale closures
+    if (!audioRecorderRef.current || !audioRecorderRef.current.getIsRecording()) {
+      console.log('Not recording, cannot stop');
+      return;
+    }
     
     setIsRecording(false);
+    isRecordingRef.current = false;
+    
     if (durationIntervalRef.current) {
       clearInterval(durationIntervalRef.current);
       durationIntervalRef.current = null;

From b7beff3f73563228ff680552b0655477ed280e59 Mon Sep 17 00:00:00 2001
From: Pratik Shankar Jadhav
 <44173994+pratikjadhav2726@users.noreply.github.com>
Date: Sun, 11 Jan 2026 03:48:38 -0800
Subject: [PATCH 04/13] feat: add speech recognition model configuration and
 validation for OpenAI integration+ Reduced the conversation section height
 from 500px to 350px in both the Queue and Solutions views.

---
 electron/ConfigHelper.ts                   | 25 ++++++++++-
 electron/TranscriptionHelper.ts            | 25 +++++++++--
 electron/preload.ts                        |  2 +-
 src/_pages/Queue.tsx                       |  2 +-
 src/_pages/Solutions.tsx                   |  2 +-
 src/components/Settings/SettingsDialog.tsx | 48 ++++++++++++++++++++++
 src/types/electron.d.ts                    |  4 +-
 7 files changed, 99 insertions(+), 9 deletions(-)

diff --git a/electron/ConfigHelper.ts b/electron/ConfigHelper.ts
index 6d1d2dba..afde8103 100644
--- a/electron/ConfigHelper.ts
+++ b/electron/ConfigHelper.ts
@@ -11,6 +11,7 @@ interface Config {
   extractionModel: string;
   solutionModel: string;
   debuggingModel: string;
+  speechRecognitionModel: string;  // Speech recognition model (Whisper for OpenAI)
   language: string;
   opacity: number;
 }
@@ -23,6 +24,7 @@ export class ConfigHelper extends EventEmitter {
     extractionModel: "gemini-2.0-flash", // Default to Flash for faster responses
     solutionModel: "gemini-2.0-flash",
     debuggingModel: "gemini-2.0-flash",
+    speechRecognitionModel: "whisper-1", // Default to Whisper for OpenAI
     language: "python",
     opacity: 1.0
   };
@@ -110,6 +112,15 @@ export class ConfigHelper extends EventEmitter {
           config.debuggingModel = this.sanitizeModelSelection(config.debuggingModel, config.apiProvider);
         }
         
+        // Ensure speechRecognitionModel is valid (only whisper-1 for OpenAI)
+        if (config.speechRecognitionModel && config.apiProvider === "openai") {
+          if (config.speechRecognitionModel !== "whisper-1") {
+            config.speechRecognitionModel = "whisper-1";
+          }
+        } else if (!config.speechRecognitionModel) {
+          config.speechRecognitionModel = this.defaultConfig.speechRecognitionModel;
+        }
+        
         return {
           ...this.defaultConfig,
           ...config
@@ -174,14 +185,25 @@ export class ConfigHelper extends EventEmitter {
           updates.extractionModel = "gpt-4o";
           updates.solutionModel = "gpt-4o";
           updates.debuggingModel = "gpt-4o";
+          updates.speechRecognitionModel = "whisper-1";
         } else if (updates.apiProvider === "anthropic") {
           updates.extractionModel = "claude-3-7-sonnet-20250219";
           updates.solutionModel = "claude-3-7-sonnet-20250219";
           updates.debuggingModel = "claude-3-7-sonnet-20250219";
+          // Speech recognition not supported for Anthropic
         } else {
           updates.extractionModel = "gemini-2.0-flash";
           updates.solutionModel = "gemini-2.0-flash";
           updates.debuggingModel = "gemini-2.0-flash";
+          // Speech recognition not supported for Gemini
+        }
+      }
+      
+      // Validate speech recognition model (only whisper-1 is supported, and only for OpenAI)
+      if (updates.speechRecognitionModel) {
+        if (provider === "openai" && updates.speechRecognitionModel !== "whisper-1") {
+          console.warn(`Invalid speech recognition model: ${updates.speechRecognitionModel}. Only whisper-1 is supported for OpenAI.`);
+          updates.speechRecognitionModel = "whisper-1";
         }
       }
       
@@ -203,7 +225,8 @@ export class ConfigHelper extends EventEmitter {
       // This prevents re-initializing the AI client when only opacity changes
       if (updates.apiKey !== undefined || updates.apiProvider !== undefined || 
           updates.extractionModel !== undefined || updates.solutionModel !== undefined || 
-          updates.debuggingModel !== undefined || updates.language !== undefined) {
+          updates.debuggingModel !== undefined || updates.speechRecognitionModel !== undefined || 
+          updates.language !== undefined) {
         this.emit('config-updated', newConfig);
       }
       
diff --git a/electron/TranscriptionHelper.ts b/electron/TranscriptionHelper.ts
index bf8bf23e..63836a79 100644
--- a/electron/TranscriptionHelper.ts
+++ b/electron/TranscriptionHelper.ts
@@ -25,15 +25,24 @@ export class TranscriptionHelper implements ITranscriptionHelper {
     this.tempDir = path.join(app.getPath('temp'), 'audio-transcriptions');
     this.ensureTempDirectory();
     this.initializeOpenAI();
+    
+    // Listen for config changes to re-initialize
+    configHelper.on('config-updated', () => {
+      this.initializeOpenAI();
+    });
   }
 
   /**
    * Initializes OpenAI client with API key from config
+   * Creates the client only when the provider is OpenAI and a non-empty API key is set (Whisper only works with OpenAI); otherwise clears any existing client
    */
   private initializeOpenAI(): void {
     const config = configHelper.loadConfig();
-    if (config.apiKey && config.apiKey.trim().length > 0) {
+    if (config.apiProvider === "openai" && config.apiKey && config.apiKey.trim().length > 0) {
       this.openai = new OpenAI({ apiKey: config.apiKey });
+    } else {
+      if (config.apiProvider !== "openai") console.log("Speech recognition is only supported with OpenAI provider");
+      this.openai = null; // also drops a stale client when the OpenAI key was cleared, so an old key is never reused
     }
   }
 
@@ -57,8 +66,14 @@ export class TranscriptionHelper implements ITranscriptionHelper {
     audioBuffer: Buffer, 
     mimeType: string = 'audio/webm'
   ): Promise<TranscriptionResult> {
+    const config = configHelper.loadConfig();
+    
+    if (config.apiProvider !== "openai") {
+      throw new Error('Speech recognition is only supported with OpenAI provider. Please switch to OpenAI in settings.');
+    }
+    
     if (!this.openai) {
-      throw new Error('OpenAI client not initialized. Please set API key.');
+      throw new Error('OpenAI client not initialized. Please set OpenAI API key in settings.');
     }
 
     if (!audioBuffer || audioBuffer.length === 0) {
@@ -74,10 +89,14 @@ export class TranscriptionHelper implements ITranscriptionHelper {
       // Create read stream for OpenAI API
       const file = fs.createReadStream(tempPath);
       
+      // Get speech recognition model from config
+      const config = configHelper.loadConfig();
+      const speechModel = config.speechRecognitionModel || 'whisper-1';
+      
       // Transcribe using Whisper API
       const transcription = await this.openai.audio.transcriptions.create({
         file: file,
-        model: 'whisper-1',
+        model: speechModel,
         language: 'en', // Optional: can be auto-detected
         response_format: 'verbose_json',
       });
diff --git a/electron/preload.ts b/electron/preload.ts
index 36b7ca93..aa8e92ae 100644
--- a/electron/preload.ts
+++ b/electron/preload.ts
@@ -205,7 +205,7 @@ const electronAPI = {
   
   // New methods for OpenAI API integration
   getConfig: () => ipcRenderer.invoke("get-config"),
-  updateConfig: (config: { apiKey?: string; model?: string; language?: string; opacity?: number }) => 
+  updateConfig: (config: { apiKey?: string; model?: string; language?: string; opacity?: number; apiProvider?: string; extractionModel?: string; solutionModel?: string; debuggingModel?: string; speechRecognitionModel?: string }) => 
     ipcRenderer.invoke("update-config", config),
   onShowSettings: (callback: () => void) => {
     const subscription = () => callback()
diff --git a/src/_pages/Queue.tsx b/src/_pages/Queue.tsx
index a384bb32..db9a3058 100644
--- a/src/_pages/Queue.tsx
+++ b/src/_pages/Queue.tsx
@@ -142,7 +142,7 @@ const Queue: React.FC<QueueProps> = ({
       <div className="px-4 py-3">
         <div className="space-y-3 w-full">
           {/* Conversation Section - Works independently of screenshots */}
-          <div className="bg-black/60 rounded-md p-4" style={{ height: '500px', display: 'flex', flexDirection: 'column' }}>
+          <div className="bg-black/60 rounded-md p-4" style={{ height: '350px', display: 'flex', flexDirection: 'column' }}>
             <ConversationSection />
           </div>
 
diff --git a/src/_pages/Solutions.tsx b/src/_pages/Solutions.tsx
index 79cacb2c..296c54dd 100644
--- a/src/_pages/Solutions.tsx
+++ b/src/_pages/Solutions.tsx
@@ -502,7 +502,7 @@ const Solutions: React.FC<SolutionsProps> = ({
           />
 
           {/* Conversation Section */}
-          <div className="bg-black/60 rounded-md p-4" style={{ height: '500px', display: 'flex', flexDirection: 'column' }}>
+          <div className="bg-black/60 rounded-md p-4" style={{ height: '350px', display: 'flex', flexDirection: 'column' }}>
             <ConversationSection />
           </div>
 
diff --git a/src/components/Settings/SettingsDialog.tsx b/src/components/Settings/SettingsDialog.tsx
index 3460ca8b..a9ecb34d 100644
--- a/src/components/Settings/SettingsDialog.tsx
+++ b/src/components/Settings/SettingsDialog.tsx
@@ -184,6 +184,7 @@ export function SettingsDialog({ open: externalOpen, onOpenChange }: SettingsDia
   const [extractionModel, setExtractionModel] = useState("gpt-4o");
   const [solutionModel, setSolutionModel] = useState("gpt-4o");
   const [debuggingModel, setDebuggingModel] = useState("gpt-4o");
+  const [speechRecognitionModel, setSpeechRecognitionModel] = useState("whisper-1");
   const [isLoading, setIsLoading] = useState(false);
   const { showToast } = useToast();
 
@@ -213,6 +214,7 @@ export function SettingsDialog({ open: externalOpen, onOpenChange }: SettingsDia
         extractionModel?: string;
         solutionModel?: string;
         debuggingModel?: string;
+        speechRecognitionModel?: string;
       }
 
       window.electronAPI
@@ -223,6 +225,7 @@ export function SettingsDialog({ open: externalOpen, onOpenChange }: SettingsDia
           setExtractionModel(config.extractionModel || "gpt-4o");
           setSolutionModel(config.solutionModel || "gpt-4o");
           setDebuggingModel(config.debuggingModel || "gpt-4o");
+          setSpeechRecognitionModel(config.speechRecognitionModel || "whisper-1");
         })
         .catch((error: unknown) => {
           console.error("Failed to load config:", error);
@@ -243,14 +246,17 @@ export function SettingsDialog({ open: externalOpen, onOpenChange }: SettingsDia
       setExtractionModel("gpt-4o");
       setSolutionModel("gpt-4o");
       setDebuggingModel("gpt-4o");
+      setSpeechRecognitionModel("whisper-1");
     } else if (provider === "gemini") {
       setExtractionModel("gemini-1.5-pro");
       setSolutionModel("gemini-1.5-pro");
       setDebuggingModel("gemini-1.5-pro");
+      setSpeechRecognitionModel("whisper-1"); // Keep whisper-1 but will show as not supported
     } else if (provider === "anthropic") {
       setExtractionModel("claude-3-7-sonnet-20250219");
       setSolutionModel("claude-3-7-sonnet-20250219");
       setDebuggingModel("claude-3-7-sonnet-20250219");
+      setSpeechRecognitionModel("whisper-1"); // Keep whisper-1 but will show as not supported
     }
   };
 
@@ -263,6 +269,7 @@ export function SettingsDialog({ open: externalOpen, onOpenChange }: SettingsDia
         extractionModel,
         solutionModel,
         debuggingModel,
+        speechRecognitionModel,
       });
       
       if (result) {
@@ -569,6 +576,47 @@ export function SettingsDialog({ open: externalOpen, onOpenChange }: SettingsDia
               );
             })}
           </div>
+          
+          {/* Speech Recognition Model Selection */}
+          <div className="space-y-2 mt-4">
+            <label className="text-sm font-medium text-white mb-1 block">
+              Speech Recognition Model
+            </label>
+            <p className="text-xs text-white/60 mb-2">
+              Model used for transcribing interview conversations
+            </p>
+            
+            {apiProvider === "openai" ? (
+              <div className="space-y-2">
+                <div
+                  className={`p-2 rounded-lg cursor-pointer transition-colors ${
+                    speechRecognitionModel === "whisper-1"
+                      ? "bg-white/10 border border-white/20"
+                      : "bg-black/30 border border-white/5 hover:bg-white/5"
+                  }`}
+                  onClick={() => setSpeechRecognitionModel("whisper-1")}
+                >
+                  <div className="flex items-center gap-2">
+                    <div
+                      className={`w-3 h-3 rounded-full ${
+                        speechRecognitionModel === "whisper-1" ? "bg-white" : "bg-white/20"
+                      }`}
+                    />
+                    <div>
+                      <p className="font-medium text-white text-xs">Whisper-1</p>
+                      <p className="text-xs text-white/60">OpenAI's speech-to-text model</p>
+                    </div>
+                  </div>
+                </div>
+              </div>
+            ) : (
+              <div className="p-3 rounded-lg bg-black/30 border border-white/10">
+                <p className="text-sm text-white/70">
+                  Speech recognition is only supported with OpenAI. Please switch to OpenAI provider to use this feature.
+                </p>
+              </div>
+            )}
+          </div>
         </div>
         <DialogFooter className="flex justify-between sm:justify-between">
           <Button
diff --git a/src/types/electron.d.ts b/src/types/electron.d.ts
index 59b067b9..2e1b7237 100644
--- a/src/types/electron.d.ts
+++ b/src/types/electron.d.ts
@@ -54,8 +54,8 @@ export interface ElectronAPI {
   getPlatform: () => string
   
   // New methods for OpenAI integration
-  getConfig: () => Promise<{ apiKey: string; model: string }>
-  updateConfig: (config: { apiKey?: string; model?: string }) => Promise<boolean>
+  getConfig: () => Promise<{ apiKey: string; model: string; apiProvider?: string; extractionModel?: string; solutionModel?: string; debuggingModel?: string; speechRecognitionModel?: string }>
+  updateConfig: (config: { apiKey?: string; model?: string; apiProvider?: string; extractionModel?: string; solutionModel?: string; debuggingModel?: string; speechRecognitionModel?: string }) => Promise<boolean>
   checkApiKey: () => Promise<boolean>
   validateApiKey: (apiKey: string) => Promise<{ valid: boolean; error?: string }>
   openLink: (url: string) => void

From 143915a4b33289fa8aad1233d735080e05400f42 Mon Sep 17 00:00:00 2001
From: Pratik Shankar Jadhav
 <44173994+pratikjadhav2726@users.noreply.github.com>
Date: Sun, 11 Jan 2026 03:55:14 -0800
Subject: [PATCH 05/13] feat: enhance README with Speech Recognition Helper
 details and usage instructions

---
 README.md | 54 +++++++++++++++++++++++++++++++++++++++++++++++++++---
 1 file changed, 51 insertions(+), 3 deletions(-)

diff --git a/README.md b/README.md
index 47aeaf6a..c14bea73 100644
--- a/README.md
+++ b/README.md
@@ -56,6 +56,7 @@ All it takes is modest JavaScript/TypeScript knowledge and understanding of the
 - 🤖 AI-Powered Analysis: Automatically extracts and analyzes coding problems using GPT-4o
 - 💡 Solution Generation: Get detailed explanations and solutions with time/space complexity analysis
 - 🔧 Real-time Debugging: Debug your code with AI assistance and structured feedback
+- 🎙️ Speech Recognition Helper: Record and transcribe interview conversations with AI-powered answer suggestions
 - 🎨 Advanced Window Management: Freely move, resize, change opacity, and zoom the window
 - 🔄 Model Selection: Choose between GPT-4o and GPT-4o-mini for different processing stages
 - 🔒 Privacy-Focused: Your API key and data never leave your computer except for OpenAI API calls
@@ -70,6 +71,7 @@ The application uses unidentifiable global keyboard shortcuts that won't be dete
 - Delete Last Screenshot: [Control or Cmd + L]
 - Process Screenshots: [Control or Cmd + Enter]
 - Start New Problem: [Control or Cmd + R]
+- Toggle Recording: [Control or Cmd + M] (Speech Recognition Helper)
 - Quit: [Control or Cmd + Q]
 - Decrease Opacity: [Control or Cmd + []
 - Increase Opacity: [Control or Cmd + ]]
@@ -96,7 +98,7 @@ Note: The application is **NOT** invisible to:
 
 - Node.js (v16 or higher)
 - npm or bun package manager
-- OpenAI API Key
+- OpenAI API Key (required for all AI features including speech recognition)
 - Screen Recording Permission for Terminal/IDE
   - On macOS:
     1. Go to System Preferences > Security & Privacy > Privacy > Screen Recording
@@ -106,6 +108,14 @@ Note: The application is **NOT** invisible to:
     - No additional permissions needed
   - On Linux:
     - May require `xhost` access depending on your distribution
+- Microphone Permission (required for Speech Recognition Helper)
+  - On macOS:
+    1. Go to System Preferences > Security & Privacy > Privacy > Microphone
+    2. Ensure that CodeInterviewAssist has microphone permission enabled
+  - On Windows:
+    - Windows will prompt for microphone access when first using the feature
+  - On Linux:
+    - May require PulseAudio or ALSA configuration depending on your distribution
 
 ## Running the Application
 
@@ -201,6 +211,9 @@ The packaged applications will be available in the `release` directory.
 | Multi-language Support | ✅ | ✅ |
 | Time/Space Complexity Analysis | ✅ | ✅ |
 | Window Management | ✅ | ✅ |
+| Speech Recognition | ✅ | ✅ (OpenAI Whisper) |
+| AI Answer Suggestions | ✅ | ✅ (Context-aware) |
+| Conversation History | ✅ | ✅ |
 | Auth System | Required | None (Simplified) |
 | Payment Processing | Required | None (Use your own API key) |
 | Privacy | Server-processed | 100% Local Processing |
@@ -215,7 +228,8 @@ The packaged applications will be available in the `release` directory.
 - Vite
 - Tailwind CSS
 - Radix UI Components
-- OpenAI API
+- OpenAI API (GPT-4o, GPT-4o-mini, Whisper)
+- Web Audio API (for speech recording)
 
 ## How It Works
 
@@ -248,13 +262,28 @@ The packaged applications will be available in the `release` directory.
    - Window remains invisible to specified screen sharing applications
    - Start a new problem using [Control or Cmd + R]
 
-6. **Language Selection
+6. **Language Selection**
 
    - Easily switch between programming languages with a single click
    - Use arrow keys for keyboard navigation through available languages
    - The system dynamically adapts to any languages added or removed from the codebase
    - Your language preference is saved between sessions
 
+7. **Speech Recognition Helper**
+
+   - Record interview conversations using your microphone with [Control or Cmd + M]
+   - Automatically transcribe audio to text using OpenAI's Whisper API
+   - Toggle between "Interviewer" and "You" (Interviewee) speaker modes with [Control or Cmd + Shift + M]
+   - Maintain conversation history with timestamps for both speakers
+   - Get AI-powered answer suggestions when the interviewer asks questions
+   - Suggestions are context-aware and consider:
+     - Previous conversation history
+     - Your previous answers for consistency
+     - Screenshot context (if coding problems are captured)
+   - View real-time transcription and suggestions in the Conversations view
+   - Audio is recorded locally; recordings are sent to OpenAI for transcription, and conversation context is sent to OpenAI to generate answer suggestions
+   - Supports both coding interviews (with screenshot context) and behavioral interviews
+
 ## Adding More AI Models
 
 This application is built with extensibility in mind. You can easily add support for additional LLMs alongside the existing OpenAI integration:
@@ -272,10 +301,29 @@ To add new models, simply extend the API integration in `electron/ProcessingHelp
   - Problem Extraction: Analyzes screenshots to understand the coding problem
   - Solution Generation: Creates optimized solutions with explanations
   - Debugging: Provides detailed analysis of errors and improvement suggestions
+- **Speech Recognition Model**: Configure the speech-to-text model for transcription:
+  - Currently supports OpenAI's Whisper-1 model
+  - Only available when using OpenAI as the API provider
+  - Configured in Settings > Speech Recognition Model
 - **Language**: Select your preferred programming language for solutions
 - **Window Controls**: Adjust opacity, position, and zoom level using keyboard shortcuts
 - **All settings are stored locally** in your user data directory and persist between sessions
 
+### Speech Recognition Helper Configuration
+
+The Speech Recognition Helper uses OpenAI's Whisper API for transcription. To use this feature:
+
+1. **API Provider**: Must be set to OpenAI (not Gemini or Anthropic)
+2. **Speech Recognition Model**: Select "whisper-1" in Settings
+3. **Microphone Access**: Grant microphone permissions when prompted
+4. **Usage**: 
+   - Press [Control or Cmd + M] to start/stop recording
+   - Toggle speaker mode between Interviewer and You (Interviewee)
+   - View transcribed conversation and AI suggestions in the Conversations view
+   - Suggestions automatically appear when interviewer questions are detected
+
+**Note**: Speech recognition requires an active OpenAI API key with sufficient credits. Audio is recorded locally and sent to OpenAI only for transcription. Conversation history is stored locally and is sent to OpenAI only as context when generating answer suggestions.
+
 ## License
 
 This project is licensed under the GNU Affero General Public License v3.0 (AGPL-3.0).

From b185a56b7b224587da3acebf1b8817914d09d70b Mon Sep 17 00:00:00 2001
From: Pratik Shankar Jadhav
 <44173994+pratikjadhav2726@users.noreply.github.com>
Date: Sun, 11 Jan 2026 04:01:53 -0800
Subject: [PATCH 06/13] feat: integrate ConversationCommands component for
 improved conversation controls and tooltip management

---
 .../Conversation/ConversationCommands.tsx     | 199 ++++++++++++++++++
 .../Conversation/ConversationSection.tsx      |  60 +++---
 2 files changed, 230 insertions(+), 29 deletions(-)
 create mode 100644 src/components/Conversation/ConversationCommands.tsx

diff --git a/src/components/Conversation/ConversationCommands.tsx b/src/components/Conversation/ConversationCommands.tsx
new file mode 100644
index 00000000..9046642d
--- /dev/null
+++ b/src/components/Conversation/ConversationCommands.tsx
@@ -0,0 +1,199 @@
+/**
+ * ConversationCommands - Command bar for conversation/recording features
+ * Follows the same design pattern as QueueCommands and SolutionCommands
+ */
+import React, { useState, useEffect, useRef } from "react";
+import { useToast } from "../../contexts/toast";
+import { COMMAND_KEY } from "../../utils/platform";
+
+interface ConversationCommandsProps {
+  onTooltipVisibilityChange: (visible: boolean, height: number) => void;
+  isRecording: boolean;
+  isProcessing: boolean;
+  recordingDuration: number;
+  currentSpeaker: 'interviewer' | 'interviewee';
+  onStartRecording: () => Promise<void>;
+  onStopRecording: () => Promise<void>;
+  onToggleSpeaker: () => Promise<void>;
+  onClearConversation: () => Promise<void>;
+}
+
+export const ConversationCommands: React.FC<ConversationCommandsProps> = ({
+  onTooltipVisibilityChange,
+  isRecording,
+  isProcessing,
+  recordingDuration,
+  currentSpeaker,
+  onStartRecording,
+  onStopRecording,
+  onToggleSpeaker,
+  onClearConversation,
+}) => {
+  const [isTooltipVisible, setIsTooltipVisible] = useState(false);
+  const tooltipRef = useRef<HTMLDivElement>(null);
+  const { showToast } = useToast();
+
+  useEffect(() => {
+    let tooltipHeight = 0;
+    if (tooltipRef.current && isTooltipVisible) {
+      tooltipHeight = tooltipRef.current.offsetHeight + 10;
+    }
+    onTooltipVisibilityChange(isTooltipVisible, tooltipHeight);
+  }, [isTooltipVisible, onTooltipVisibilityChange]);
+
+  const handleMouseEnter = () => {
+    setIsTooltipVisible(true);
+  };
+
+  const handleMouseLeave = () => {
+    setIsTooltipVisible(false);
+  };
+
+  const formatDuration = (seconds: number) => {
+    const mins = Math.floor(seconds / 60);
+    const secs = seconds % 60;
+    return `${mins}:${secs.toString().padStart(2, '0')}`;
+  };
+
+  const handleToggleRecording = async () => {
+    if (isRecording) {
+      await onStopRecording();
+    } else {
+      await onStartRecording();
+    }
+  };
+
+  return (
+    <div>
+      <div className="pt-2 w-fit">
+        <div className="text-xs text-white/90 backdrop-blur-md bg-black/60 rounded-lg py-2 px-4 flex items-center justify-center gap-4 flex-wrap">
+          {/* Start/Stop Recording */}
+          <div
+            className="flex items-center gap-2 cursor-pointer rounded px-2 py-1.5 hover:bg-white/10 transition-colors"
+            onClick={handleToggleRecording}
+          >
+            <span className="text-[11px] leading-none">
+              {isRecording ? `Stop (${formatDuration(recordingDuration)})` : 'Start Recording'}
+            </span>
+            <div className="flex gap-1">
+              <button className="bg-white/10 rounded-md px-1.5 py-1 text-[11px] leading-none text-white/70">
+                {COMMAND_KEY}
+              </button>
+              <button className="bg-white/10 rounded-md px-1.5 py-1 text-[11px] leading-none text-white/70">
+                M
+              </button>
+            </div>
+          </div>
+
+          {/* Toggle Speaker Mode */}
+          <div
+            className="flex items-center gap-2 cursor-pointer rounded px-2 py-1.5 hover:bg-white/10 transition-colors disabled:opacity-50 disabled:cursor-not-allowed"
+            onClick={onToggleSpeaker}
+            style={{ opacity: (isRecording || isProcessing) ? 0.5 : 1, pointerEvents: (isRecording || isProcessing) ? 'none' : 'auto' }}
+          >
+            <span className="text-[11px] leading-none">
+              {currentSpeaker === 'interviewer' ? 'Interviewer' : 'You'}
+            </span>
+            <div className="flex gap-1">
+              <button className="bg-white/10 rounded-md px-1.5 py-1 text-[11px] leading-none text-white/70">
+                {COMMAND_KEY}
+              </button>
+              <button className="bg-white/10 rounded-md px-1.5 py-1 text-[11px] leading-none text-white/70">
+                Shift
+              </button>
+              <button className="bg-white/10 rounded-md px-1.5 py-1 text-[11px] leading-none text-white/70">
+                M
+              </button>
+            </div>
+          </div>
+
+          {/* Clear Conversation */}
+          <div
+            className="flex items-center gap-2 cursor-pointer rounded px-2 py-1.5 hover:bg-white/10 transition-colors"
+            onClick={onClearConversation}
+          >
+            <span className="text-[11px] leading-none">Clear</span>
+          </div>
+
+          {/* Keyboard Shortcuts Tooltip Trigger */}
+          <div
+            className="relative flex items-center gap-2 cursor-pointer rounded px-2 py-1.5 hover:bg-white/10 transition-colors"
+            onMouseEnter={handleMouseEnter}
+            onMouseLeave={handleMouseLeave}
+          >
+            <span className="text-[11px] leading-none">Shortcuts</span>
+
+            {/* Tooltip Content */}
+            {isTooltipVisible && (
+              <div
+                ref={tooltipRef}
+                className="absolute top-full right-0 mt-2 w-80"
+                style={{ zIndex: 100 }}
+              >
+                {/* Add transparent bridge */}
+                <div className="absolute -top-2 right-0 w-full h-2" />
+                <div className="p-3 text-xs bg-black/80 backdrop-blur-md rounded-lg border border-white/10 text-white/90 shadow-lg">
+                  <div className="space-y-4">
+                    <h3 className="font-medium whitespace-nowrap">
+                      Keyboard Shortcuts
+                    </h3>
+                    <div className="space-y-3">
+                      {/* Start/Stop Recording */}
+                      <div
+                        className="cursor-pointer rounded px-2 py-1.5 hover:bg-white/10 transition-colors"
+                        onClick={handleToggleRecording}
+                      >
+                        <div className="flex items-center justify-between">
+                          <span className="truncate">Start/Stop Recording</span>
+                          <div className="flex gap-1 flex-shrink-0">
+                            <span className="bg-white/20 px-1.5 py-0.5 rounded text-[10px] leading-none">
+                              {COMMAND_KEY}
+                            </span>
+                            <span className="bg-white/20 px-1.5 py-0.5 rounded text-[10px] leading-none">
+                              M
+                            </span>
+                          </div>
+                        </div>
+                        <p className="text-[10px] leading-relaxed text-white/70 truncate mt-1">
+                          Record interview conversation for transcription.
+                        </p>
+                      </div>
+
+                      {/* Toggle Speaker Mode */}
+                      <div
+                        className="cursor-pointer rounded px-2 py-1.5 hover:bg-white/10 transition-colors"
+                        onClick={onToggleSpeaker}
+                      >
+                        <div className="flex items-center justify-between">
+                          <span className="truncate">Toggle Speaker Mode</span>
+                          <div className="flex gap-1 flex-shrink-0">
+                            <span className="bg-white/20 px-1.5 py-0.5 rounded text-[10px] leading-none">
+                              {COMMAND_KEY}
+                            </span>
+                            <span className="bg-white/20 px-1.5 py-0.5 rounded text-[10px] leading-none">
+                              Shift
+                            </span>
+                            <span className="bg-white/20 px-1.5 py-0.5 rounded text-[10px] leading-none">
+                              M
+                            </span>
+                          </div>
+                        </div>
+                        <p className="text-[10px] leading-relaxed text-white/70 truncate mt-1">
+                          Switch between Interviewer and You mode.
+                        </p>
+                      </div>
+                    </div>
+                  </div>
+                </div>
+              </div>
+            )}
+          </div>
+
+          {isProcessing && (
+            <span className="text-[11px] text-white/70">Processing...</span>
+          )}
+        </div>
+      </div>
+    </div>
+  );
+};
diff --git a/src/components/Conversation/ConversationSection.tsx b/src/components/Conversation/ConversationSection.tsx
index 351ae463..aa7ff0a8 100644
--- a/src/components/Conversation/ConversationSection.tsx
+++ b/src/components/Conversation/ConversationSection.tsx
@@ -7,6 +7,7 @@
 import React, { useState, useEffect, useRef } from 'react';
 import { useQueryClient } from '@tanstack/react-query';
 import { AudioRecorder } from '../../utils/audioRecorder';
+import { ConversationCommands } from './ConversationCommands';
 
 interface ConversationMessage {
   id: string;
@@ -57,13 +58,26 @@ export const ConversationSection: React.FC = () => {
   const [aiSuggestions, setAiSuggestions] = useState<AISuggestion | null>(null);
   const [isProcessing, setIsProcessing] = useState(false);
   const [recordingDuration, setRecordingDuration] = useState(0);
+  const [tooltipHeight, setTooltipHeight] = useState(0);
   const messagesEndRef = useRef<HTMLDivElement>(null);
   const audioRecorderRef = useRef<AudioRecorder | null>(null);
   const durationIntervalRef = useRef<NodeJS.Timeout | null>(null);
-
+  
   // Use ref to track recording state for event listener
   const isRecordingRef = useRef(false);
   
+  const handleTooltipVisibilityChange = (visible: boolean, height: number) => {
+    setTooltipHeight(height);
+  };
+  
+  const handleClearConversation = async () => {
+    try {
+      await window.electronAPI.clearConversation();
+    } catch (error) {
+      console.error('Failed to clear conversation:', error);
+    }
+  };
+  
   useEffect(() => {
     isRecordingRef.current = isRecording;
   }, [isRecording]);
@@ -250,38 +264,26 @@ export const ConversationSection: React.FC = () => {
 
   return (
     <div className="flex flex-col h-full">
-      {/* Recording Controls - Always visible at top */}
-      <div className="flex items-center gap-3 flex-wrap flex-shrink-0 mb-3">
-        <button
-          onClick={isRecording ? handleStopRecording : handleStartRecording}
-          disabled={isProcessing}
-          className={`px-3 py-1.5 rounded text-xs font-medium transition disabled:opacity-50 disabled:cursor-not-allowed ${
-            isRecording
-              ? 'bg-red-600 hover:bg-red-700 text-white'
-              : 'bg-green-600 hover:bg-green-700 text-white'
-          }`}
-        >
-          {isRecording ? `⏹ Stop (${formatDuration(recordingDuration)})` : '⏺ Start Recording'}
-        </button>
-        
-        <button
-          onClick={handleToggleSpeaker}
-          disabled={isRecording || isProcessing}
-          className="px-3 py-1.5 rounded text-xs font-medium bg-blue-600 hover:bg-blue-700 text-white disabled:opacity-50 disabled:cursor-not-allowed"
-        >
-          {currentSpeaker === 'interviewer' ? '👤 Interviewer' : '🎤 You'}
-        </button>
-        
-        {isProcessing && (
-          <span className="text-xs text-white/70">Processing...</span>
-        )}
-      </div>
+      {/* Conversation Commands Bar - Matches QueueCommands/SolutionCommands style */}
+      <ConversationCommands
+        onTooltipVisibilityChange={handleTooltipVisibilityChange}
+        isRecording={isRecording}
+        isProcessing={isProcessing}
+        recordingDuration={recordingDuration}
+        currentSpeaker={currentSpeaker}
+        onStartRecording={handleStartRecording}
+        onStopRecording={handleStopRecording}
+        onToggleSpeaker={handleToggleSpeaker}
+        onClearConversation={handleClearConversation}
+      />
 
       {/* Scrollable Conversation Area - Takes remaining space above AI suggestions */}
       <div 
-        className="overflow-y-auto flex-1 min-h-0 mb-3 pr-2"
+        className="overflow-y-auto flex-1 min-h-0 mb-3 pr-2 mt-2"
         style={{ 
-          maxHeight: aiSuggestions ? 'calc(100% - 180px)' : '100%',
+          maxHeight: aiSuggestions 
+            ? `calc(100% - ${180 + tooltipHeight}px)` 
+            : `calc(100% - ${60 + tooltipHeight}px)`,
           scrollBehavior: 'smooth'
         }}
       >

From 1c2961e1defdc60c1a32dfb980187e5794bedb0e Mon Sep 17 00:00:00 2001
From: Pratik Shankar Jadhav
 <44173994+pratikjadhav2726@users.noreply.github.com>
Date: Sun, 11 Jan 2026 04:10:57 -0800
Subject: [PATCH 07/13] refactor: optimize code splitting by lazy loading
 components and syntax highlighter, adjust build configurations for
 environment-specific settings

---
 package.json             |  2 --
 src/App.tsx              | 46 ++++++++++++++++++++++++++++------------
 src/_pages/Debug.tsx     | 31 ++++++++++++++++++++-------
 src/_pages/Solutions.tsx | 33 +++++++++++++++++++++-------
 vite.config.ts           | 20 +++++++++++++----
 5 files changed, 97 insertions(+), 35 deletions(-)

diff --git a/package.json b/package.json
index fee68383..b92bc9cf 100644
--- a/package.json
+++ b/package.json
@@ -124,8 +124,6 @@
   "dependencies": {
     "@anthropic-ai/sdk": "^0.39.0",
     "@electron/notarize": "^2.3.0",
-    "@emotion/react": "^11.11.0",
-    "@emotion/styled": "^11.11.0",
     "@radix-ui/react-dialog": "^1.1.2",
     "@radix-ui/react-label": "^2.1.0",
     "@radix-ui/react-slot": "^1.1.0",
diff --git a/src/App.tsx b/src/App.tsx
index f2dd348d..eab3d738 100644
--- a/src/App.tsx
+++ b/src/App.tsx
@@ -1,4 +1,4 @@
-import SubscribedApp from "./_pages/SubscribedApp"
+import { lazy, Suspense } from "react"
 import { UpdateNotification } from "./components/UpdateNotification"
 import {
   QueryClient,
@@ -14,14 +14,21 @@ import {
 } from "./components/ui/toast"
 import { ToastContext } from "./contexts/toast"
 import { WelcomeScreen } from "./components/WelcomeScreen"
-import { SettingsDialog } from "./components/Settings/SettingsDialog"
+
+// Lazy load heavy components for better code splitting
+const SubscribedApp = lazy(() => import("./_pages/SubscribedApp"))
+const SettingsDialog = lazy(() => 
+  import("./components/Settings/SettingsDialog").then(module => ({ 
+    default: module.SettingsDialog 
+  }))
+)
 
 // Create a React Query client
 const queryClient = new QueryClient({
   defaultOptions: {
     queries: {
       staleTime: 0,
-      gcTime: Infinity,
+      gcTime: 5 * 60 * 1000, // 5 minutes - prevents memory leaks
       retry: 1,
       refetchOnWindowFocus: false
     },
@@ -243,11 +250,20 @@ function App() {
           <div className="relative">
             {isInitialized ? (
               hasApiKey ? (
-                <SubscribedApp
-                  credits={credits}
-                  currentLanguage={currentLanguage}
-                  setLanguage={updateLanguage}
-                />
+                <Suspense fallback={
+                  <div className="min-h-screen bg-black flex items-center justify-center">
+                    <div className="flex flex-col items-center gap-3">
+                      <div className="w-6 h-6 border-2 border-white/20 border-t-white/80 rounded-full animate-spin"></div>
+                      <p className="text-white/60 text-sm">Loading...</p>
+                    </div>
+                  </div>
+                }>
+                  <SubscribedApp
+                    credits={credits}
+                    currentLanguage={currentLanguage}
+                    setLanguage={updateLanguage}
+                  />
+                </Suspense>
               ) : (
                 <WelcomeScreen onOpenSettings={handleOpenSettings} />
               )
@@ -264,11 +280,15 @@ function App() {
             <UpdateNotification />
           </div>
           
-          {/* Settings Dialog */}
-          <SettingsDialog 
-            open={isSettingsOpen} 
-            onOpenChange={handleCloseSettings} 
-          />
+          {/* Settings Dialog - Lazy loaded */}
+          {isSettingsOpen && (
+            <Suspense fallback={null}>
+              <SettingsDialog 
+                open={isSettingsOpen} 
+                onOpenChange={handleCloseSettings} 
+              />
+            </Suspense>
+          )}
           
           <Toast
             open={toastState.open}
diff --git a/src/_pages/Debug.tsx b/src/_pages/Debug.tsx
index 10608723..eab5411a 100644
--- a/src/_pages/Debug.tsx
+++ b/src/_pages/Debug.tsx
@@ -1,8 +1,12 @@
 // Debug.tsx
 import { useQuery, useQueryClient } from "@tanstack/react-query"
-import React, { useEffect, useRef, useState } from "react"
-import { Prism as SyntaxHighlighter } from "react-syntax-highlighter"
-import { dracula } from "react-syntax-highlighter/dist/esm/styles/prism"
+import React, { useEffect, useRef, useState, lazy, Suspense } from "react"
+// Lazy load syntax highlighter to reduce initial bundle size
+const SyntaxHighlighter = lazy(() => 
+  import("react-syntax-highlighter").then(module => ({ 
+    default: module.Prism 
+  }))
+)
 import ScreenshotQueue from "../components/Queue/ScreenshotQueue"
 import SolutionCommands from "../components/Solutions/SolutionCommands"
 import { Screenshot } from "../types/screenshots"
@@ -32,10 +36,20 @@ const CodeSection = ({
       </div>
     ) : (
       <div className="w-full">
-        <SyntaxHighlighter
-          showLineNumbers
-          language={currentLanguage == "golang" ? "go" : currentLanguage}
-          style={dracula}
+        <Suspense fallback={<div className="text-white/60 text-sm">Loading syntax highlighter...</div>}>
+          <SyntaxHighlighter
+            showLineNumbers
+            language={currentLanguage == "golang" ? "go" : currentLanguage}
+            style={(() => {
+              // Load the theme with a synchronous require(); this is not a dynamic import().
+              // NOTE(review): if require is unavailable here, the catch yields {} (no theme) — confirm
+              try {
+                const styleModule = require("react-syntax-highlighter/dist/esm/styles/prism")
+                return styleModule.dracula || {}
+              } catch {
+                return {}
+              }
+            })()}
           customStyle={{
             maxWidth: "100%",
             margin: 0,
@@ -47,7 +61,8 @@ const CodeSection = ({
           wrapLongLines={true}
         >
           {code as string}
-        </SyntaxHighlighter>
+          </SyntaxHighlighter>
+        </Suspense>
       </div>
     )}
   </div>
diff --git a/src/_pages/Solutions.tsx b/src/_pages/Solutions.tsx
index 296c54dd..29085136 100644
--- a/src/_pages/Solutions.tsx
+++ b/src/_pages/Solutions.tsx
@@ -1,8 +1,13 @@
 // Solutions.tsx
-import React, { useState, useEffect, useRef } from "react"
+import React, { useState, useEffect, useRef, lazy, Suspense } from "react"
 import { useQuery, useQueryClient } from "@tanstack/react-query"
-import { Prism as SyntaxHighlighter } from "react-syntax-highlighter"
-import { dracula } from "react-syntax-highlighter/dist/esm/styles/prism"
+// Dynamic import for syntax highlighter - loaded only when code is displayed
+// This reduces initial bundle size significantly
+const SyntaxHighlighter = lazy(() => 
+  import("react-syntax-highlighter").then(module => ({ 
+    default: module.Prism 
+  }))
+)
 
 import ScreenshotQueue from "../components/Queue/ScreenshotQueue"
 
@@ -82,10 +87,21 @@ const SolutionSection = ({
           >
             {copied ? "Copied!" : "Copy"}
           </button>
-          <SyntaxHighlighter
-            showLineNumbers
-            language={currentLanguage == "golang" ? "go" : currentLanguage}
-            style={dracula}
+          <Suspense fallback={<div className="text-white/60 text-sm">Loading syntax highlighter...</div>}>
+            <SyntaxHighlighter
+              showLineNumbers
+              language={currentLanguage == "golang" ? "go" : currentLanguage}
+              style={(() => {
+                // Load the theme with a synchronous require(); this is not a dynamic import().
+                // NOTE(review): if require is unavailable here, the catch yields {} (no theme) — confirm
+                try {
+                  // Synchronous require() of the Prism theme module (not a dynamic import)
+                  const styleModule = require("react-syntax-highlighter/dist/esm/styles/prism")
+                  return styleModule.dracula || {}
+                } catch {
+                  return {}
+                }
+              })()}
             customStyle={{
               maxWidth: "100%",
               margin: 0,
@@ -97,7 +113,8 @@ const SolutionSection = ({
             wrapLongLines={true}
           >
             {content as string}
-          </SyntaxHighlighter>
+            </SyntaxHighlighter>
+          </Suspense>
         </div>
       )}
     </div>
diff --git a/vite.config.ts b/vite.config.ts
index d7360772..e6ba2d1a 100644
--- a/vite.config.ts
+++ b/vite.config.ts
@@ -14,8 +14,8 @@ export default defineConfig({
         vite: {
           build: {
             outDir: "dist-electron",
-            sourcemap: true,
-            minify: false,
+            sourcemap: process.env.NODE_ENV === "development",
+            minify: process.env.NODE_ENV === "production" ? "esbuild" : false,
             rollupOptions: {
               external: ["electron"]
             }
@@ -28,7 +28,8 @@ export default defineConfig({
         vite: {
           build: {
             outDir: "dist-electron",
-            sourcemap: true,
+            sourcemap: process.env.NODE_ENV === "development",
+            minify: process.env.NODE_ENV === "production" ? "esbuild" : false,
             rollupOptions: {
               external: ["electron"]
             }
@@ -48,7 +49,18 @@ export default defineConfig({
   build: {
     outDir: "dist",
     emptyOutDir: true,
-    sourcemap: true
+    sourcemap: process.env.NODE_ENV === "development",
+    minify: process.env.NODE_ENV === "production" ? "esbuild" : false,
+    rollupOptions: {
+      output: {
+        manualChunks: {
+          'react-vendor': ['react', 'react-dom', 'react-router-dom'],
+          'query-vendor': ['@tanstack/react-query'],
+          'ui-vendor': ['@radix-ui/react-dialog', '@radix-ui/react-toast', '@radix-ui/react-label', '@radix-ui/react-slot'],
+          'icons': ['lucide-react']
+        }
+      }
+    }
   },
   resolve: {
     alias: {

From 63251578b95e889044ee352b6fa335f11d49ce50 Mon Sep 17 00:00:00 2001
From: Pratik Shankar Jadhav
 <44173994+pratikjadhav2726@users.noreply.github.com>
Date: Tue, 20 Jan 2026 00:32:10 -0800
Subject: [PATCH 08/13] feat: implement candidate profile feature for
 personalized AI suggestions in interview context

---
 electron/AnswerAssistant.ts                   | 35 +++++++++--
 electron/ConfigHelper.ts                      | 12 +++-
 electron/ipcHandlers.ts                       |  5 +-
 electron/preload.ts                           |  6 +-
 .../Conversation/ConversationSection.tsx      |  6 +-
 .../Settings/CandidateProfileSection.tsx      | 59 +++++++++++++++++++
 src/components/Settings/SettingsDialog.tsx    | 40 ++++++++++++-
 src/types/electron.d.ts                       |  6 +-
 8 files changed, 152 insertions(+), 17 deletions(-)
 create mode 100644 src/components/Settings/CandidateProfileSection.tsx

diff --git a/electron/AnswerAssistant.ts b/electron/AnswerAssistant.ts
index 3664306a..a9df0754 100644
--- a/electron/AnswerAssistant.ts
+++ b/electron/AnswerAssistant.ts
@@ -4,7 +4,7 @@
  * Uses Dependency Inversion Principle - depends on IConversationManager interface
  */
 import OpenAI from 'openai';
-import { configHelper } from './ConfigHelper';
+import { configHelper, CandidateProfile } from './ConfigHelper';
 import { IConversationManager } from './ConversationManager';
 
 export interface AnswerSuggestion {
@@ -49,7 +49,8 @@ export class AnswerAssistant implements IAnswerAssistant {
   public async generateAnswerSuggestions(
     currentQuestion: string,
     conversationManager: IConversationManager,
-    screenshotContext?: string
+    screenshotContext?: string,
+    candidateProfile?: CandidateProfile
   ): Promise<AnswerSuggestion> {
     if (!this.openai) {
       throw new Error('OpenAI client not initialized. Please set API key.');
@@ -62,11 +63,15 @@ export class AnswerAssistant implements IAnswerAssistant {
     const conversationHistory = conversationManager.getConversationHistory();
     const previousAnswers = conversationManager.getIntervieweeAnswers();
 
+    // Get candidate profile from config if not provided
+    const profile = candidateProfile || configHelper.loadConfig().candidateProfile;
+    
     const contextPrompt = this.buildContextPrompt(
       currentQuestion,
       conversationHistory,
       previousAnswers,
-      screenshotContext
+      screenshotContext,
+      profile
     );
 
     try {
@@ -116,7 +121,8 @@ export class AnswerAssistant implements IAnswerAssistant {
     currentQuestion: string,
     conversationHistory: string,
     previousAnswers: string[],
-    screenshotContext?: string
+    screenshotContext?: string,
+    candidateProfile?: CandidateProfile
   ): string {
     let prompt = `You are an AI assistant helping someone during an interview. 
 The interviewer just asked: "${currentQuestion}"
@@ -126,8 +132,27 @@ ${conversationHistory || 'No previous conversation yet.'}
 
 Previous answers the interviewee has given:
 ${previousAnswers.length > 0 ? previousAnswers.join('\n\n') : 'No previous answers yet.'}
+`;
+
+    // Add candidate profile context if available
+    if (candidateProfile) {
+      const profileSections: string[] = [];
+      
+      if (candidateProfile.name) {
+        profileSections.push(`Name: ${candidateProfile.name}`);
+      }
+      
+      if (candidateProfile.resume) {
+        profileSections.push(`Resume: ${candidateProfile.resume}`);
+      }
+      
+      if (profileSections.length > 0) {
+        prompt += `\n\nCandidate Profile (use this to personalize suggestions):
+${profileSections.join('\n')}`;
+      }
+    }
 
-Based on the current question and conversation history, provide 3-5 bullet point suggestions that:
+    prompt += `\n\nBased on the current question, conversation history${candidateProfile ? ', and candidate profile' : ''}, provide 3-5 bullet point suggestions that:
 1. Directly answer the current question
 2. Reference and build upon previous answers for consistency
 3. Maintain a coherent narrative
diff --git a/electron/ConfigHelper.ts b/electron/ConfigHelper.ts
index afde8103..a95c5f9d 100644
--- a/electron/ConfigHelper.ts
+++ b/electron/ConfigHelper.ts
@@ -5,6 +5,11 @@ import { app } from "electron"
 import { EventEmitter } from "events"
 import { OpenAI } from "openai"
 
+export interface CandidateProfile {
+  name?: string;
+  resume?: string;  // Full resume text
+}
+
 interface Config {
   apiKey: string;
   apiProvider: "openai" | "gemini" | "anthropic";  // Added provider selection
@@ -14,6 +19,7 @@ interface Config {
   speechRecognitionModel: string;  // Speech recognition model (Whisper for OpenAI)
   language: string;
   opacity: number;
+  candidateProfile?: CandidateProfile;  // Candidate profile for personalized AI suggestions
 }
 
 export class ConfigHelper extends EventEmitter {
@@ -26,7 +32,11 @@ export class ConfigHelper extends EventEmitter {
     debuggingModel: "gemini-2.0-flash",
     speechRecognitionModel: "whisper-1", // Default to Whisper for OpenAI
     language: "python",
-    opacity: 1.0
+    opacity: 1.0,
+    candidateProfile: {
+      name: "",
+      resume: ""
+    }
   };
 
   constructor() {
diff --git a/electron/ipcHandlers.ts b/electron/ipcHandlers.ts
index 841b64b3..b2ce8bd1 100644
--- a/electron/ipcHandlers.ts
+++ b/electron/ipcHandlers.ts
@@ -441,7 +441,7 @@ export function initializeIpcHandlers(deps: IIpcHandlerDeps): void {
   })
 
   // AI suggestion handler
-  ipcMain.handle("get-answer-suggestions", async (_event, question: string, screenshotContext?: string) => {
+  ipcMain.handle("get-answer-suggestions", async (_event, question: string, screenshotContext?: string, candidateProfile?: any) => {
     try {
       if (!deps.answerAssistant || !deps.conversationManager) {
         return { success: false, error: "Answer assistant or conversation manager not initialized" };
@@ -450,7 +450,8 @@ export function initializeIpcHandlers(deps: IIpcHandlerDeps): void {
       const suggestions = await deps.answerAssistant.generateAnswerSuggestions(
         question,
         deps.conversationManager,
-        screenshotContext
+        screenshotContext,
+        candidateProfile
       );
       return { success: true, suggestions };
     } catch (error: any) {
diff --git a/electron/preload.ts b/electron/preload.ts
index aa8e92ae..0b83247b 100644
--- a/electron/preload.ts
+++ b/electron/preload.ts
@@ -205,7 +205,7 @@ const electronAPI = {
   
   // New methods for OpenAI API integration
   getConfig: () => ipcRenderer.invoke("get-config"),
-  updateConfig: (config: { apiKey?: string; model?: string; language?: string; opacity?: number; apiProvider?: string; extractionModel?: string; solutionModel?: string; debuggingModel?: string; speechRecognitionModel?: string }) => 
+  updateConfig: (config: { apiKey?: string; model?: string; language?: string; opacity?: number; apiProvider?: string; extractionModel?: string; solutionModel?: string; debuggingModel?: string; speechRecognitionModel?: string; candidateProfile?: any }) => 
     ipcRenderer.invoke("update-config", config),
   onShowSettings: (callback: () => void) => {
     const subscription = () => callback()
@@ -256,8 +256,8 @@ const electronAPI = {
     ipcRenderer.invoke("update-conversation-message", messageId, newText),
   
   // AI suggestions
-  getAnswerSuggestions: (question: string, screenshotContext?: string) =>
-    ipcRenderer.invoke("get-answer-suggestions", question, screenshotContext),
+  getAnswerSuggestions: (question: string, screenshotContext?: string, candidateProfile?: any) =>
+    ipcRenderer.invoke("get-answer-suggestions", question, screenshotContext, candidateProfile),
   
   // Event listeners
   onConversationMessageAdded: (callback: (message: any) => void) => {
diff --git a/src/components/Conversation/ConversationSection.tsx b/src/components/Conversation/ConversationSection.tsx
index aa7ff0a8..9a167589 100644
--- a/src/components/Conversation/ConversationSection.tsx
+++ b/src/components/Conversation/ConversationSection.tsx
@@ -227,7 +227,11 @@ export const ConversationSection: React.FC = () => {
         screenshotContext = `Problem Statement: ${problemStatement.problem_statement}\nConstraints: ${problemStatement.constraints || 'N/A'}\nExample Input: ${problemStatement.example_input || 'N/A'}\nExample Output: ${problemStatement.example_output || 'N/A'}`;
       }
       
-      const result = await window.electronAPI.getAnswerSuggestions(question, screenshotContext);
+      // Get candidate profile from config
+      const config = await window.electronAPI.getConfig();
+      const candidateProfile = (config as any).candidateProfile;
+      
+      const result = await window.electronAPI.getAnswerSuggestions(question, screenshotContext, candidateProfile);
       if (result.success && result.suggestions) {
         setAiSuggestions(result.suggestions);
       }
diff --git a/src/components/Settings/CandidateProfileSection.tsx b/src/components/Settings/CandidateProfileSection.tsx
new file mode 100644
index 00000000..4c2ee372
--- /dev/null
+++ b/src/components/Settings/CandidateProfileSection.tsx
@@ -0,0 +1,59 @@
+/**
+ * CandidateProfileSection - Component for editing candidate profile
+ * Used in SettingsDialog to allow users to input their resume and details
+ */
+import React, { useState } from 'react';
+import { Input } from '../ui/input';
+import { Button } from '../ui/button';
+
+export interface CandidateProfile {
+  name?: string;
+  resume?: string;
+}
+
+interface CandidateProfileSectionProps {
+  profile: CandidateProfile;
+  onProfileChange: (profile: CandidateProfile) => void;
+}
+
+export const CandidateProfileSection: React.FC<CandidateProfileSectionProps> = ({
+  profile,
+  onProfileChange,
+}) => {
+  const [localProfile, setLocalProfile] = useState<CandidateProfile>(profile);
+
+  const handleFieldChange = (field: keyof CandidateProfile, value: string) => {
+    const updated = { ...localProfile, [field]: value };
+    setLocalProfile(updated);
+    onProfileChange(updated);
+  };
+
+  return (
+    <div className="space-y-4">
+      <div className="space-y-2">
+        <label className="text-sm font-medium text-white">Name (Optional)</label>
+        <Input
+          type="text"
+          value={localProfile.name || ''}
+          onChange={(e) => handleFieldChange('name', e.target.value)}
+          placeholder="Your name"
+          className="bg-black/30 border-white/10 text-white placeholder:text-white/40"
+        />
+      </div>
+
+      <div className="space-y-2">
+        <label className="text-sm font-medium text-white">Resume</label>
+        <textarea
+          value={localProfile.resume || ''}
+          onChange={(e) => handleFieldChange('resume', e.target.value)}
+          placeholder="Paste your full resume text here. This will help AI provide more personalized answer suggestions."
+          rows={6}
+          className="w-full px-3 py-2 bg-black/30 border border-white/10 rounded-md text-white text-sm placeholder:text-white/40 focus:outline-none focus:ring-2 focus:ring-white/20 resize-y"
+        />
+        <p className="text-xs text-white/60">
+          Include your work experience, education, skills, and achievements. The more detail, the better the AI suggestions.
+        </p>
+      </div>
+    </div>
+  );
+};
diff --git a/src/components/Settings/SettingsDialog.tsx b/src/components/Settings/SettingsDialog.tsx
index a9ecb34d..f6f468ab 100644
--- a/src/components/Settings/SettingsDialog.tsx
+++ b/src/components/Settings/SettingsDialog.tsx
@@ -12,6 +12,7 @@ import { Input } from "../ui/input";
 import { Button } from "../ui/button";
 import { Settings } from "lucide-react";
 import { useToast } from "../../contexts/toast";
+import { CandidateProfileSection, CandidateProfile } from "./CandidateProfileSection";
 
 type APIProvider = "openai" | "gemini" | "anthropic";
 
@@ -185,6 +186,10 @@ export function SettingsDialog({ open: externalOpen, onOpenChange }: SettingsDia
   const [solutionModel, setSolutionModel] = useState("gpt-4o");
   const [debuggingModel, setDebuggingModel] = useState("gpt-4o");
   const [speechRecognitionModel, setSpeechRecognitionModel] = useState("whisper-1");
+  const [candidateProfile, setCandidateProfile] = useState<CandidateProfile>({
+    name: "",
+    resume: ""
+  });
   const [isLoading, setIsLoading] = useState(false);
   const { showToast } = useToast();
 
@@ -215,6 +220,7 @@ export function SettingsDialog({ open: externalOpen, onOpenChange }: SettingsDia
         solutionModel?: string;
         debuggingModel?: string;
         speechRecognitionModel?: string;
+        candidateProfile?: CandidateProfile;
       }
 
       window.electronAPI
@@ -226,6 +232,10 @@ export function SettingsDialog({ open: externalOpen, onOpenChange }: SettingsDia
           setSolutionModel(config.solutionModel || "gpt-4o");
           setDebuggingModel(config.debuggingModel || "gpt-4o");
           setSpeechRecognitionModel(config.speechRecognitionModel || "whisper-1");
+          setCandidateProfile(config.candidateProfile || {
+            name: "",
+            resume: ""
+          });
         })
         .catch((error: unknown) => {
           console.error("Failed to load config:", error);
@@ -270,6 +280,7 @@ export function SettingsDialog({ open: externalOpen, onOpenChange }: SettingsDia
         solutionModel,
         debuggingModel,
         speechRecognitionModel,
+        candidateProfile,
       });
       
       if (result) {
@@ -323,12 +334,21 @@ export function SettingsDialog({ open: externalOpen, onOpenChange }: SettingsDia
         }}
       >        
         <DialogHeader>
-          <DialogTitle>API Settings</DialogTitle>
+          <DialogTitle>Settings</DialogTitle>
           <DialogDescription className="text-white/70">
-            Configure your API key and model preferences. You'll need your own API key to use this application.
+            Configure your API key, AI models, and optional candidate profile. You'll need your own API key to use this application.
           </DialogDescription>
         </DialogHeader>
         <div className="space-y-4 py-4">
+          {/* API Settings Section */}
+          <div className="space-y-1">
+            <h2 className="text-sm font-semibold text-white">API Settings</h2>
+            <p className="text-xs text-white/60">
+              Choose your provider and models. These control how screenshots and solutions are processed.
+            </p>
+          </div>
+          
+          {/* API Provider Selection */}
           {/* API Provider Selection */}
           <div className="space-y-2">
             <label className="text-sm font-medium text-white">API Provider</label>
@@ -617,6 +637,22 @@ export function SettingsDialog({ open: externalOpen, onOpenChange }: SettingsDia
               </div>
             )}
           </div>
+          
+          {/* Candidate Profile Section */}
+          <div className="space-y-4 mt-6 border-t border-white/10 pt-4">
+            <div>
+              <label className="text-sm font-medium text-white mb-1 block">
+                Candidate Profile
+              </label>
+              <p className="text-xs text-white/60 mb-3">
+                Add your resume and details to get more personalized AI answer suggestions during interviews.
+              </p>
+              <CandidateProfileSection
+                profile={candidateProfile}
+                onProfileChange={setCandidateProfile}
+              />
+            </div>
+          </div>
         </div>
         <DialogFooter className="flex justify-between sm:justify-between">
           <Button
diff --git a/src/types/electron.d.ts b/src/types/electron.d.ts
index 2e1b7237..4a5e5725 100644
--- a/src/types/electron.d.ts
+++ b/src/types/electron.d.ts
@@ -54,8 +54,8 @@ export interface ElectronAPI {
   getPlatform: () => string
   
   // New methods for OpenAI integration
-  getConfig: () => Promise<{ apiKey: string; model: string; apiProvider?: string; extractionModel?: string; solutionModel?: string; debuggingModel?: string; speechRecognitionModel?: string }>
-  updateConfig: (config: { apiKey?: string; model?: string; apiProvider?: string; extractionModel?: string; solutionModel?: string; debuggingModel?: string; speechRecognitionModel?: string }) => Promise<boolean>
+  getConfig: () => Promise<{ apiKey: string; model: string; apiProvider?: string; extractionModel?: string; solutionModel?: string; debuggingModel?: string; speechRecognitionModel?: string; candidateProfile?: any }>
+  updateConfig: (config: { apiKey?: string; model?: string; apiProvider?: string; extractionModel?: string; solutionModel?: string; debuggingModel?: string; speechRecognitionModel?: string; candidateProfile?: any }) => Promise<boolean>
   checkApiKey: () => Promise<boolean>
   validateApiKey: (apiKey: string) => Promise<{ valid: boolean; error?: string }>
   openLink: (url: string) => void
@@ -69,7 +69,7 @@ export interface ElectronAPI {
   getConversation: () => Promise<{ success: boolean; messages?: any[]; error?: string }>
   clearConversation: () => Promise<{ success: boolean; error?: string }>
   updateConversationMessage: (messageId: string, newText: string) => Promise<{ success: boolean; error?: string }>
-  getAnswerSuggestions: (question: string, screenshotContext?: string) => Promise<{ success: boolean; suggestions?: { suggestions: string[]; reasoning: string }; error?: string }>
+  getAnswerSuggestions: (question: string, screenshotContext?: string, candidateProfile?: any) => Promise<{ success: boolean; suggestions?: { suggestions: string[]; reasoning: string }; error?: string }>
   onConversationMessageAdded: (callback: (message: any) => void) => () => void
   onSpeakerChanged: (callback: (speaker: string) => void) => () => void
   onConversationMessageUpdated: (callback: (message: any) => void) => () => void

From becadf6688c7d1d5fe0ff50897067fb59cf95d27 Mon Sep 17 00:00:00 2001
From: Pratik Shankar Jadhav
 <44173994+pratikjadhav2726@users.noreply.github.com>
Date: Tue, 20 Jan 2026 00:55:34 -0800
Subject: [PATCH 09/13] feat: enhance AnswerAssistant to utilize job
 description for tailored suggestions and add resume relevance check

---
 electron/AnswerAssistant.ts                   | 36 ++++++++++++--
 electron/ConfigHelper.ts                      |  4 +-
 .../Conversation/ConversationCommands.tsx     |  2 +-
 .../Conversation/ConversationSection.tsx      | 48 ++++++++++++++-----
 .../Settings/CandidateProfileSection.tsx      | 15 ++++++
 src/components/Settings/SettingsDialog.tsx    |  6 ++-
 6 files changed, 93 insertions(+), 18 deletions(-)

diff --git a/electron/AnswerAssistant.ts b/electron/AnswerAssistant.ts
index a9df0754..eb77c199 100644
--- a/electron/AnswerAssistant.ts
+++ b/electron/AnswerAssistant.ts
@@ -80,7 +80,7 @@ export class AnswerAssistant implements IAnswerAssistant {
         messages: [
           {
             role: 'system',
-            content: 'You are a helpful interview assistant that provides contextual answer suggestions based on conversation history. Provide concise, actionable suggestions.'
+            content: 'You are a helpful interview assistant supporting the candidate for this interview. Tailor suggestions to the job description when provided, and only use resume details when the question is about the candidate’s background. Provide concise, actionable suggestions.'
           },
           {
             role: 'user',
@@ -124,6 +124,7 @@ export class AnswerAssistant implements IAnswerAssistant {
     screenshotContext?: string,
     candidateProfile?: CandidateProfile
   ): string {
+    const shouldUseResume = this.isResumeRelevant(currentQuestion);
     let prompt = `You are an AI assistant helping someone during an interview. 
 The interviewer just asked: "${currentQuestion}"
 
@@ -134,8 +135,13 @@ Previous answers the interviewee has given:
 ${previousAnswers.length > 0 ? previousAnswers.join('\n\n') : 'No previous answers yet.'}
 `;
 
+    if (candidateProfile?.jobDescription) {
+      prompt += `\n\nJob Description (use to tailor answers to this interview):
+${candidateProfile.jobDescription}`;
+    }
+
     // Add candidate profile context if available
-    if (candidateProfile) {
+    if (candidateProfile && shouldUseResume) {
       const profileSections: string[] = [];
       
       if (candidateProfile.name) {
@@ -152,7 +158,7 @@ ${profileSections.join('\n')}`;
       }
     }
 
-    prompt += `\n\nBased on the current question, conversation history${candidateProfile ? ', and candidate profile' : ''}, provide 3-5 bullet point suggestions that:
+    prompt += `\n\nBased on the current question and conversation history${shouldUseResume && candidateProfile ? ', and candidate profile (resume only when relevant)' : ''}, provide 3-5 bullet point suggestions that:
 1. Directly answer the current question
 2. Reference and build upon previous answers for consistency
 3. Maintain a coherent narrative
@@ -167,6 +173,30 @@ Format as simple bullet points, one per line starting with "-".`;
     return prompt;
   }
 
+  /**
+   * Only treat resume as relevant when the question is about the candidate's background
+   */
+  private isResumeRelevant(question: string): boolean {
+    if (!question) return false;
+    const q = question.toLowerCase();
+    const resumeKeywords = [
+      'resume',
+      'cv',
+      'experience',
+      'background',
+      'work history',
+      'employment',
+      'projects',
+      'portfolio',
+      'skills',
+      'education',
+      'certification',
+      'accomplishment',
+      'achievement'
+    ];
+    return resumeKeywords.some(keyword => q.includes(keyword));
+  }
+
   /**
    * Parses AI response into structured suggestions
    */
diff --git a/electron/ConfigHelper.ts b/electron/ConfigHelper.ts
index a95c5f9d..643fcfbf 100644
--- a/electron/ConfigHelper.ts
+++ b/electron/ConfigHelper.ts
@@ -8,6 +8,7 @@ import { OpenAI } from "openai"
 export interface CandidateProfile {
   name?: string;
   resume?: string;  // Full resume text
+  jobDescription?: string; // Target role/job description
 }
 
 interface Config {
@@ -35,7 +36,8 @@ export class ConfigHelper extends EventEmitter {
     opacity: 1.0,
     candidateProfile: {
       name: "",
-      resume: ""
+      resume: "",
+      jobDescription: ""
     }
   };
 
diff --git a/src/components/Conversation/ConversationCommands.tsx b/src/components/Conversation/ConversationCommands.tsx
index 9046642d..8b7f7923 100644
--- a/src/components/Conversation/ConversationCommands.tsx
+++ b/src/components/Conversation/ConversationCommands.tsx
@@ -89,7 +89,7 @@ export const ConversationCommands: React.FC<ConversationCommandsProps> = ({
           <div
             className="flex items-center gap-2 cursor-pointer rounded px-2 py-1.5 hover:bg-white/10 transition-colors disabled:opacity-50 disabled:cursor-not-allowed"
             onClick={onToggleSpeaker}
-            style={{ opacity: (isRecording || isProcessing) ? 0.5 : 1, pointerEvents: (isRecording || isProcessing) ? 'none' : 'auto' }}
+            style={{ opacity: isRecording ? 0.5 : 1, pointerEvents: isRecording ? 'none' : 'auto' }}
           >
             <span className="text-[11px] leading-none">
               {currentSpeaker === 'interviewer' ? 'Interviewer' : 'You'}
diff --git a/src/components/Conversation/ConversationSection.tsx b/src/components/Conversation/ConversationSection.tsx
index 9a167589..9aa33464 100644
--- a/src/components/Conversation/ConversationSection.tsx
+++ b/src/components/Conversation/ConversationSection.tsx
@@ -62,6 +62,7 @@ export const ConversationSection: React.FC = () => {
   const messagesEndRef = useRef<HTMLDivElement>(null);
   const audioRecorderRef = useRef<AudioRecorder | null>(null);
   const durationIntervalRef = useRef<NodeJS.Timeout | null>(null);
+  const processingCountRef = useRef(0);
   
   // Use ref to track recording state for event listener
   const isRecordingRef = useRef(false);
@@ -186,37 +187,51 @@ export const ConversationSection: React.FC = () => {
       durationIntervalRef.current = null;
     }
     
-    setIsProcessing(true);
     try {
       const audioBlob = await audioRecorderRef.current.stopRecording();
-      
-      // Convert blob to ArrayBuffer
+      const speakerAtStop = currentSpeaker;
+      setRecordingDuration(0);
+
+      // Kick off transcription/processing asynchronously so UI stays responsive
+      void processRecording(audioBlob, speakerAtStop);
+
+      // Auto-toggle speaker for the next recording cycle
+      void toggleSpeakerForNextTurn();
+    } catch (error: any) {
+      console.error('Failed to stop recording:', error);
+      alert(error.message || 'Failed to stop recording');
+    }
+  };
+
+  const processRecording = async (audioBlob: Blob, speaker: 'interviewer' | 'interviewee') => {
+    updateProcessingStatus(1);
+    try {
       const arrayBuffer = await audioBlob.arrayBuffer();
       
-      // Transcribe
       const transcribeResult = await window.electronAPI.transcribeAudio(arrayBuffer, audioBlob.type);
       
       if (transcribeResult.success && transcribeResult.result) {
         const text = transcribeResult.result.text;
         
-        // Add message
-        await window.electronAPI.addConversationMessage(text, currentSpeaker);
+        await window.electronAPI.addConversationMessage(text, speaker);
         
-        // If interviewer question, get AI suggestions
-        if (currentSpeaker === 'interviewer') {
+        if (speaker === 'interviewer') {
           await fetchAISuggestions(text);
         }
-        // Don't clear suggestions when interviewee responds - user needs to see them!
       }
     } catch (error: any) {
       console.error('Failed to process recording:', error);
       alert(error.message || 'Failed to process recording');
     } finally {
-      setIsProcessing(false);
-      setRecordingDuration(0);
+      updateProcessingStatus(-1);
     }
   };
 
+  const updateProcessingStatus = (delta: number) => {
+    processingCountRef.current = Math.max(0, processingCountRef.current + delta);
+    setIsProcessing(processingCountRef.current > 0);
+  };
+
   const fetchAISuggestions = async (question: string) => {
     try {
       // Get problem statement from query cache if available (from screenshots)
@@ -253,6 +268,17 @@ export const ConversationSection: React.FC = () => {
     }
   };
 
+  const toggleSpeakerForNextTurn = async () => {
+    try {
+      const result = await window.electronAPI.toggleSpeaker();
+      if (result.success) {
+        setCurrentSpeaker(result.speaker);
+      }
+    } catch (error) {
+      console.error('Failed to auto-toggle speaker:', error);
+    }
+  };
+
   const formatTime = (timestamp: number) => {
     return new Date(timestamp).toLocaleTimeString([], { 
       hour: '2-digit', 
diff --git a/src/components/Settings/CandidateProfileSection.tsx b/src/components/Settings/CandidateProfileSection.tsx
index 4c2ee372..1aedd7fc 100644
--- a/src/components/Settings/CandidateProfileSection.tsx
+++ b/src/components/Settings/CandidateProfileSection.tsx
@@ -9,6 +9,7 @@ import { Button } from '../ui/button';
 export interface CandidateProfile {
   name?: string;
   resume?: string;
+  jobDescription?: string;
 }
 
 interface CandidateProfileSectionProps {
@@ -54,6 +55,20 @@ export const CandidateProfileSection: React.FC<CandidateProfileSectionProps> = (
           Include your work experience, education, skills, and achievements. The more detail, the better the AI suggestions.
         </p>
       </div>
+
+      <div className="space-y-2">
+        <label className="text-sm font-medium text-white">Job Description</label>
+        <textarea
+          value={localProfile.jobDescription || ''}
+          onChange={(e) => handleFieldChange('jobDescription', e.target.value)}
+          placeholder="Paste the target job description or role requirements."
+          rows={4}
+          className="w-full px-3 py-2 bg-black/30 border border-white/10 rounded-md text-white text-sm placeholder:text-white/40 focus:outline-none focus:ring-2 focus:ring-white/20 resize-y"
+        />
+        <p className="text-xs text-white/60">
+          This is used to tailor suggestions to the target role.
+        </p>
+      </div>
     </div>
   );
 };
diff --git a/src/components/Settings/SettingsDialog.tsx b/src/components/Settings/SettingsDialog.tsx
index f6f468ab..b8f70b5c 100644
--- a/src/components/Settings/SettingsDialog.tsx
+++ b/src/components/Settings/SettingsDialog.tsx
@@ -188,7 +188,8 @@ export function SettingsDialog({ open: externalOpen, onOpenChange }: SettingsDia
   const [speechRecognitionModel, setSpeechRecognitionModel] = useState("whisper-1");
   const [candidateProfile, setCandidateProfile] = useState<CandidateProfile>({
     name: "",
-    resume: ""
+    resume: "",
+    jobDescription: ""
   });
   const [isLoading, setIsLoading] = useState(false);
   const { showToast } = useToast();
@@ -234,7 +235,8 @@ export function SettingsDialog({ open: externalOpen, onOpenChange }: SettingsDia
           setSpeechRecognitionModel(config.speechRecognitionModel || "whisper-1");
           setCandidateProfile(config.candidateProfile || {
             name: "",
-            resume: ""
+            resume: "",
+            jobDescription: ""
           });
         })
         .catch((error: unknown) => {

From 106d9a0c7a3f862435f554a599fb3a10259aa955 Mon Sep 17 00:00:00 2001
From: Pratik Shankar Jadhav
 <44173994+pratikjadhav2726@users.noreply.github.com>
Date: Thu, 22 Jan 2026 01:18:25 -0800
Subject: [PATCH 10/13] feat: extend AnswerAssistant to support multiple AI
 providers (OpenAI, Gemini, Anthropic) for enhanced answer suggestions

---
 electron/AnswerAssistant.ts | 147 ++++++++++++++++++++++++++++++------
 1 file changed, 122 insertions(+), 25 deletions(-)

diff --git a/electron/AnswerAssistant.ts b/electron/AnswerAssistant.ts
index eb77c199..18f02ef0 100644
--- a/electron/AnswerAssistant.ts
+++ b/electron/AnswerAssistant.ts
@@ -4,9 +4,30 @@
  * Uses Dependency Inversion Principle - depends on IConversationManager interface
  */
 import OpenAI from 'openai';
+import Anthropic from '@anthropic-ai/sdk';
+import * as axios from 'axios';
 import { configHelper, CandidateProfile } from './ConfigHelper';
 import { IConversationManager } from './ConversationManager';
 
+// Interface for Gemini API requests
+interface GeminiMessage {
+  role: string;
+  parts: Array<{
+    text?: string;
+  }>;
+}
+
+interface GeminiResponse {
+  candidates: Array<{
+    content: {
+      parts: Array<{
+        text: string;
+      }>;
+    };
+    finishReason: string;
+  }>;
+}
+
 export interface AnswerSuggestion {
   suggestions: string[];
   reasoning: string;
@@ -22,19 +43,42 @@ export interface IAnswerAssistant {
 
 export class AnswerAssistant implements IAnswerAssistant {
   private openai: OpenAI | null = null;
-  private readonly defaultModel: string = 'gpt-4o-mini';
+  private geminiApiKey: string | null = null;
+  private anthropic: Anthropic | null = null;
+  private readonly defaultOpenAIModel: string = 'gpt-4o-mini';
+  private readonly defaultGeminiModel: string = 'gemini-2.0-flash';
+  private readonly defaultAnthropicModel: string = 'claude-3-7-sonnet-20250219';
 
   constructor() {
-    this.initializeOpenAI();
+    this.initializeAIClients();
+    
+    // Listen for config changes to re-initialize the AI clients
+    configHelper.on('config-updated', () => {
+      this.initializeAIClients();
+    });
   }
 
   /**
-   * Initializes OpenAI client with API key from config
+   * Initializes AI clients based on API provider from config
    */
-  private initializeOpenAI(): void {
+  private initializeAIClients(): void {
     const config = configHelper.loadConfig();
-    if (config.apiKey && config.apiKey.trim().length > 0) {
+    
+    // Reset all clients
+    this.openai = null;
+    this.geminiApiKey = null;
+    this.anthropic = null;
+    
+    if (!config.apiKey || config.apiKey.trim().length === 0) {
+      return;
+    }
+    
+    if (config.apiProvider === "openai") {
       this.openai = new OpenAI({ apiKey: config.apiKey });
+    } else if (config.apiProvider === "gemini") {
+      this.geminiApiKey = config.apiKey;
+    } else if (config.apiProvider === "anthropic") {
+      this.anthropic = new Anthropic({ apiKey: config.apiKey });
     }
   }
 
@@ -44,7 +88,7 @@ export class AnswerAssistant implements IAnswerAssistant {
    * @param conversationManager - Conversation manager instance (dependency injection)
    * @param screenshotContext - Optional screenshot context for coding interviews
    * @returns Promise resolving to answer suggestions
-   * @throws Error if OpenAI client not initialized or request fails
+   * @throws Error if AI client not initialized or request fails
    */
   public async generateAnswerSuggestions(
     currentQuestion: string,
@@ -52,8 +96,11 @@ export class AnswerAssistant implements IAnswerAssistant {
     screenshotContext?: string,
     candidateProfile?: CandidateProfile
   ): Promise<AnswerSuggestion> {
-    if (!this.openai) {
-      throw new Error('OpenAI client not initialized. Please set API key.');
+    const config = configHelper.loadConfig();
+    
+    // Check if any AI client is initialized
+    if (!this.openai && !this.geminiApiKey && !this.anthropic) {
+      throw new Error('AI client not initialized. Please set API key in settings.');
     }
 
     if (!currentQuestion || currentQuestion.trim().length === 0) {
@@ -74,24 +121,74 @@ export class AnswerAssistant implements IAnswerAssistant {
       profile
     );
 
+    const systemMessage = 'You are a helpful interview assistant supporting the candidate for this interview. Tailor suggestions to the job description when provided, and only use resume details when the question is about the candidate\'s background. Provide concise, actionable suggestions.';
+
     try {
-      const response = await this.openai.chat.completions.create({
-        model: this.defaultModel,
-        messages: [
+      let suggestionsText = '';
+
+      if (config.apiProvider === "openai" && this.openai) {
+        const response = await this.openai.chat.completions.create({
+          model: this.defaultOpenAIModel,
+          messages: [
+            {
+              role: 'system',
+              content: systemMessage
+            },
+            {
+              role: 'user',
+              content: contextPrompt
+            }
+          ],
+          temperature: 0.7,
+          max_tokens: 500,
+        });
+
+        suggestionsText = response.choices[0]?.message?.content || '';
+      } else if (config.apiProvider === "gemini" && this.geminiApiKey) {
+        const geminiMessages: GeminiMessage[] = [
           {
-            role: 'system',
-            content: 'You are a helpful interview assistant supporting the candidate for this interview. Tailor suggestions to the job description when provided, and only use resume details when the question is about the candidate’s background. Provide concise, actionable suggestions.'
-          },
+            role: "user",
+            parts: [
+              {
+                text: `${systemMessage}\n\n${contextPrompt}`
+              }
+            ]
+          }
+        ];
+
+        const response = await axios.default.post(
+          `https://generativelanguage.googleapis.com/v1beta/models/${this.defaultGeminiModel}:generateContent?key=${this.geminiApiKey}`,
           {
-            role: 'user',
-            content: contextPrompt
+            contents: geminiMessages,
+            generationConfig: {
+              temperature: 0.7,
+              maxOutputTokens: 500
+            }
           }
-        ],
-        temperature: 0.7,
-        max_tokens: 500,
-      });
+        );
+
+        const responseData = response.data as GeminiResponse;
+        if (responseData.candidates && responseData.candidates.length > 0) {
+          suggestionsText = responseData.candidates[0].content.parts[0].text;
+        }
+      } else if (config.apiProvider === "anthropic" && this.anthropic) {
+        const response = await this.anthropic.messages.create({
+          model: this.defaultAnthropicModel,
+          max_tokens: 500,
+          messages: [
+            {
+              role: 'user',
+              content: `${systemMessage}\n\n${contextPrompt}`
+            }
+          ],
+          temperature: 0.7
+        });
+
+        suggestionsText = (response.content[0] as { type: 'text', text: string }).text;
+      } else {
+        throw new Error('No AI client available. Please configure your API key in settings.');
+      }
 
-      const suggestionsText = response.choices[0]?.message?.content || '';
       const suggestions = this.parseSuggestions(suggestionsText);
 
       return {
@@ -103,9 +200,9 @@ export class AnswerAssistant implements IAnswerAssistant {
     } catch (error: any) {
       console.error('Error generating suggestions:', error);
       
-      // Provide specific error messages
+      // Provide specific error messages based on provider
       if (error.status === 401) {
-        throw new Error('Invalid API key. Please check your OpenAI API key in settings.');
+        throw new Error(`Invalid API key. Please check your ${config.apiProvider} API key in settings.`);
       } else if (error.status === 429) {
         throw new Error('Rate limit exceeded. Please try again in a moment.');
       }
@@ -222,9 +319,9 @@ Format as simple bullet points, one per line starting with "-".`;
   }
 
   /**
-   * Checks if OpenAI client is initialized
+   * Checks if any AI client is initialized
    */
   public isInitialized(): boolean {
-    return this.openai !== null;
+    return this.openai !== null || this.geminiApiKey !== null || this.anthropic !== null;
   }
 }

From a9e2ac61e7258253a08514fe8d79c5603ea100e3 Mon Sep 17 00:00:00 2001
From: Pratik Shankar Jadhav
 <44173994+pratikjadhav2726@users.noreply.github.com>
Date: Thu, 22 Jan 2026 02:09:27 -0800
Subject: [PATCH 11/13] feat: enhance AI model management by centralizing
 configuration and validation for multiple providers, including OpenAI,
 Gemini, and Anthropic

---
 electron/AnswerAssistant.ts                |  39 ++-
 electron/ConfigHelper.ts                   | 114 ++++----
 electron/ProcessingHelper.ts               |  53 ++--
 electron/TranscriptionHelper.ts            | 166 +++++++++--
 shared/aiModels.ts                         | 325 +++++++++++++++++++++
 src/components/Settings/SettingsDialog.tsx | 231 +++------------
 tsconfig.electron.json                     |   2 +-
 tsconfig.json                              |   2 +-
 8 files changed, 623 insertions(+), 309 deletions(-)
 create mode 100644 shared/aiModels.ts

diff --git a/electron/AnswerAssistant.ts b/electron/AnswerAssistant.ts
index 18f02ef0..6a8c7f75 100644
--- a/electron/AnswerAssistant.ts
+++ b/electron/AnswerAssistant.ts
@@ -8,6 +8,10 @@ import Anthropic from '@anthropic-ai/sdk';
 import * as axios from 'axios';
 import { configHelper, CandidateProfile } from './ConfigHelper';
 import { IConversationManager } from './ConversationManager';
+import {
+  APIProvider,
+  DEFAULT_ANSWER_MODELS,
+} from "../shared/aiModels";
 
 // Interface for Gemini API requests
 interface GeminiMessage {
@@ -45,9 +49,19 @@ export class AnswerAssistant implements IAnswerAssistant {
   private openai: OpenAI | null = null;
   private geminiApiKey: string | null = null;
   private anthropic: Anthropic | null = null;
-  private readonly defaultOpenAIModel: string = 'gpt-4o-mini';
-  private readonly defaultGeminiModel: string = 'gemini-2.0-flash';
-  private readonly defaultAnthropicModel: string = 'claude-3-7-sonnet-20250219';
+  private readonly defaultModels: Record<APIProvider, string> = DEFAULT_ANSWER_MODELS;
+
+  /** Formats "[provider] <context> failed (status N): <message>" from SDK- or axios-shaped errors. */
+  private formatProviderError(provider: APIProvider, error: any, context: string): string {
+    const status =
+      typeof error?.status === "number" ? error.status
+      : typeof error?.response?.status === "number" ? error.response.status
+      : undefined;
+    // Prefer the provider's response-body message; axios' own message only repeats the status code.
+    const message = error?.response?.data?.error?.message || error?.message || "Unknown error";
+    const statusPart = status ? ` (status ${status})` : "";
+    return `[${provider}] ${context} failed${statusPart}: ${message}`;
+  }
 
   constructor() {
     this.initializeAIClients();
@@ -128,7 +142,7 @@ export class AnswerAssistant implements IAnswerAssistant {
 
       if (config.apiProvider === "openai" && this.openai) {
         const response = await this.openai.chat.completions.create({
-          model: this.defaultOpenAIModel,
+          model: this.defaultModels.openai,
           messages: [
             {
               role: 'system',
@@ -157,7 +171,7 @@ export class AnswerAssistant implements IAnswerAssistant {
         ];
 
         const response = await axios.default.post(
-          `https://generativelanguage.googleapis.com/v1beta/models/${this.defaultGeminiModel}:generateContent?key=${this.geminiApiKey}`,
+          `https://generativelanguage.googleapis.com/v1beta/models/${this.defaultModels.gemini}:generateContent?key=${this.geminiApiKey}`,
           {
             contents: geminiMessages,
             generationConfig: {
@@ -173,7 +187,7 @@ export class AnswerAssistant implements IAnswerAssistant {
         }
       } else if (config.apiProvider === "anthropic" && this.anthropic) {
         const response = await this.anthropic.messages.create({
-          model: this.defaultAnthropicModel,
+          model: this.defaultModels.anthropic,
           max_tokens: 500,
           messages: [
             {
@@ -201,13 +215,14 @@ export class AnswerAssistant implements IAnswerAssistant {
       console.error('Error generating suggestions:', error);
       
       // Provide specific error messages based on provider
-      if (error.status === 401) {
-        throw new Error(`Invalid API key. Please check your ${config.apiProvider} API key in settings.`);
-      } else if (error.status === 429) {
-        throw new Error('Rate limit exceeded. Please try again in a moment.');
+      const status = error?.status ?? error?.response?.status;
+      if (status === 401) {
+        throw new Error(this.formatProviderError(config.apiProvider, error, "Auth"));
+      } else if (status === 429) {
+        throw new Error(this.formatProviderError(config.apiProvider, error, "Rate limit"));
       }
-      
-      throw new Error(`Failed to generate suggestions: ${error.message || 'Unknown error'}`);
+
+      throw new Error(this.formatProviderError(config.apiProvider, error, "Answer suggestion generation"));
     }
   }
 
diff --git a/electron/ConfigHelper.ts b/electron/ConfigHelper.ts
index 643fcfbf..60989c2b 100644
--- a/electron/ConfigHelper.ts
+++ b/electron/ConfigHelper.ts
@@ -4,6 +4,12 @@ import path from "node:path"
 import { app } from "electron"
 import { EventEmitter } from "events"
 import { OpenAI } from "openai"
+import {
+  APIProvider,
+  DEFAULT_PROVIDER,
+  DEFAULT_MODELS,
+  sanitizeModelSelection,
+} from "../shared/aiModels";
 
 export interface CandidateProfile {
   name?: string;
@@ -13,7 +19,7 @@ export interface CandidateProfile {
 
 interface Config {
   apiKey: string;
-  apiProvider: "openai" | "gemini" | "anthropic";  // Added provider selection
+  apiProvider: APIProvider;  // Added provider selection
   extractionModel: string;
   solutionModel: string;
   debuggingModel: string;
@@ -27,11 +33,12 @@ export class ConfigHelper extends EventEmitter {
   private configPath: string;
   private defaultConfig: Config = {
     apiKey: "",
-    apiProvider: "gemini", // Default to Gemini
-    extractionModel: "gemini-2.0-flash", // Default to Flash for faster responses
-    solutionModel: "gemini-2.0-flash",
-    debuggingModel: "gemini-2.0-flash",
-    speechRecognitionModel: "whisper-1", // Default to Whisper for OpenAI
+    apiProvider: DEFAULT_PROVIDER,
+    extractionModel: DEFAULT_MODELS[DEFAULT_PROVIDER].extractionModel,
+    solutionModel: DEFAULT_MODELS[DEFAULT_PROVIDER].solutionModel,
+    debuggingModel: DEFAULT_MODELS[DEFAULT_PROVIDER].debuggingModel,
+    speechRecognitionModel:
+      DEFAULT_MODELS.openai.speechRecognitionModel || "whisper-1",
     language: "python",
     opacity: 1.0,
     candidateProfile: {
@@ -70,38 +77,9 @@ export class ConfigHelper extends EventEmitter {
   }
 
   /**
-   * Validate and sanitize model selection to ensure only allowed models are used
+   * Loads the saved configuration, normalising the provider and sanitizing model
+   * selections via the shared model configuration (single source of truth).
    */
-  private sanitizeModelSelection(model: string, provider: "openai" | "gemini" | "anthropic"): string {
-    if (provider === "openai") {
-      // Only allow gpt-4o and gpt-4o-mini for OpenAI
-      const allowedModels = ['gpt-4o', 'gpt-4o-mini'];
-      if (!allowedModels.includes(model)) {
-        console.warn(`Invalid OpenAI model specified: ${model}. Using default model: gpt-4o`);
-        return 'gpt-4o';
-      }
-      return model;
-    } else if (provider === "gemini")  {
-      // Only allow gemini-1.5-pro and gemini-2.0-flash for Gemini
-      const allowedModels = ['gemini-1.5-pro', 'gemini-2.0-flash'];
-      if (!allowedModels.includes(model)) {
-        console.warn(`Invalid Gemini model specified: ${model}. Using default model: gemini-2.0-flash`);
-        return 'gemini-2.0-flash'; // Changed default to flash
-      }
-      return model;
-    }  else if (provider === "anthropic") {
-      // Only allow Claude models
-      const allowedModels = ['claude-3-7-sonnet-20250219', 'claude-3-5-sonnet-20241022', 'claude-3-opus-20240229'];
-      if (!allowedModels.includes(model)) {
-        console.warn(`Invalid Anthropic model specified: ${model}. Using default model: claude-3-7-sonnet-20250219`);
-        return 'claude-3-7-sonnet-20250219';
-      }
-      return model;
-    }
-    // Default fallback
-    return model;
-  }
-
   public loadConfig(): Config {
     try {
       if (fs.existsSync(this.configPath)) {
@@ -110,18 +88,30 @@ export class ConfigHelper extends EventEmitter {
         
         // Ensure apiProvider is a valid value
         if (config.apiProvider !== "openai" && config.apiProvider !== "gemini"  && config.apiProvider !== "anthropic") {
-          config.apiProvider = "gemini"; // Default to Gemini if invalid
+          config.apiProvider = DEFAULT_PROVIDER; // Default to shared provider if invalid
         }
         
         // Sanitize model selections to ensure only allowed models are used
         if (config.extractionModel) {
-          config.extractionModel = this.sanitizeModelSelection(config.extractionModel, config.apiProvider);
+          config.extractionModel = sanitizeModelSelection(
+            config.extractionModel,
+            config.apiProvider,
+            "extractionModel"
+          );
         }
         if (config.solutionModel) {
-          config.solutionModel = this.sanitizeModelSelection(config.solutionModel, config.apiProvider);
+          config.solutionModel = sanitizeModelSelection(
+            config.solutionModel,
+            config.apiProvider,
+            "solutionModel"
+          );
         }
         if (config.debuggingModel) {
-          config.debuggingModel = this.sanitizeModelSelection(config.debuggingModel, config.apiProvider);
+          config.debuggingModel = sanitizeModelSelection(
+            config.debuggingModel,
+            config.apiProvider,
+            "debuggingModel"
+          );
         }
         
         // Ensure speechRecognitionModel is valid (only whisper-1 for OpenAI)
@@ -171,7 +161,7 @@ export class ConfigHelper extends EventEmitter {
   public updateConfig(updates: Partial<Config>): Config {
     try {
       const currentConfig = this.loadConfig();
-      let provider = updates.apiProvider || currentConfig.apiProvider;
+      let provider: APIProvider = updates.apiProvider || currentConfig.apiProvider;
       
       // Auto-detect provider based on API key format if a new key is provided
       if (updates.apiKey && !updates.apiProvider) {
@@ -193,21 +183,13 @@ export class ConfigHelper extends EventEmitter {
       
       // If provider is changing, reset models to the default for that provider
       if (updates.apiProvider && updates.apiProvider !== currentConfig.apiProvider) {
-        if (updates.apiProvider === "openai") {
-          updates.extractionModel = "gpt-4o";
-          updates.solutionModel = "gpt-4o";
-          updates.debuggingModel = "gpt-4o";
-          updates.speechRecognitionModel = "whisper-1";
-        } else if (updates.apiProvider === "anthropic") {
-          updates.extractionModel = "claude-3-7-sonnet-20250219";
-          updates.solutionModel = "claude-3-7-sonnet-20250219";
-          updates.debuggingModel = "claude-3-7-sonnet-20250219";
-          // Speech recognition not supported for Anthropic
-        } else {
-          updates.extractionModel = "gemini-2.0-flash";
-          updates.solutionModel = "gemini-2.0-flash";
-          updates.debuggingModel = "gemini-2.0-flash";
-          // Speech recognition not supported for Gemini
+        const defaults = DEFAULT_MODELS[updates.apiProvider];
+        updates.extractionModel = defaults.extractionModel;
+        updates.solutionModel = defaults.solutionModel;
+        updates.debuggingModel = defaults.debuggingModel;
+        // Speech recognition currently only supported for OpenAI
+        if (defaults.speechRecognitionModel) {
+          updates.speechRecognitionModel = defaults.speechRecognitionModel;
         }
       }
       
@@ -221,13 +203,25 @@ export class ConfigHelper extends EventEmitter {
       
       // Sanitize model selections in the updates
       if (updates.extractionModel) {
-        updates.extractionModel = this.sanitizeModelSelection(updates.extractionModel, provider);
+        updates.extractionModel = sanitizeModelSelection(
+          updates.extractionModel,
+          provider,
+          "extractionModel"
+        );
       }
       if (updates.solutionModel) {
-        updates.solutionModel = this.sanitizeModelSelection(updates.solutionModel, provider);
+        updates.solutionModel = sanitizeModelSelection(
+          updates.solutionModel,
+          provider,
+          "solutionModel"
+        );
       }
       if (updates.debuggingModel) {
-        updates.debuggingModel = this.sanitizeModelSelection(updates.debuggingModel, provider);
+        updates.debuggingModel = sanitizeModelSelection(
+          updates.debuggingModel,
+          provider,
+          "debuggingModel"
+        );
       }
       
       const newConfig = { ...currentConfig, ...updates };
diff --git a/electron/ProcessingHelper.ts b/electron/ProcessingHelper.ts
index 9f40916b..7d13bb88 100644
--- a/electron/ProcessingHelper.ts
+++ b/electron/ProcessingHelper.ts
@@ -8,6 +8,10 @@ import { app, BrowserWindow, dialog } from "electron"
 import { OpenAI } from "openai"
 import { configHelper } from "./ConfigHelper"
 import Anthropic from '@anthropic-ai/sdk';
+import {
+  APIProvider,
+  DEFAULT_MODELS,
+} from "../shared/aiModels";
 
 // Interface for Gemini API requests
 interface GeminiMessage {
@@ -53,6 +57,18 @@ export class ProcessingHelper {
   // AbortControllers for API requests
   private currentProcessingAbortController: AbortController | null = null
   private currentExtraProcessingAbortController: AbortController | null = null
+  
+  /** Formats "[provider] <context> failed (status N): <message>" from SDK- or axios-shaped errors. */
+  private formatProviderError(provider: APIProvider, error: any, context: string): string {
+    const status =
+      typeof error?.status === "number" ? error.status
+      : typeof error?.response?.status === "number" ? error.response.status
+      : undefined;
+    // Prefer the provider's response-body message; axios' own message only repeats the status code.
+    const message = error?.response?.data?.error?.message || error?.message || "Unknown error";
+    const statusPart = status ? ` (status ${status})` : "";
+    return `[${provider}] ${context} failed${statusPart}: ${message}`;
+  }
 
   constructor(deps: IProcessingHelperDeps) {
     this.deps = deps
@@ -579,7 +595,7 @@ export class ProcessingHelper {
 
           // Make API request to Gemini
           const response = await axios.default.post(
-            `https://generativelanguage.googleapis.com/v1beta/models/${config.extractionModel || "gemini-2.0-flash"}:generateContent?key=${this.geminiApiKey}`,
+            `https://generativelanguage.googleapis.com/v1beta/models/${config.extractionModel || DEFAULT_MODELS.gemini.extractionModel}:generateContent?key=${this.geminiApiKey}`,
             {
               contents: geminiMessages,
               generationConfig: {
@@ -605,7 +621,7 @@ export class ProcessingHelper {
           console.error("Error using Gemini API:", error);
           return {
             success: false,
-            error: "Failed to process with Gemini API. Please check your API key or try again later."
+            error: this.formatProviderError("gemini", error, "Problem extraction")
           };
         }
       } else if (config.apiProvider === "anthropic") {
@@ -672,7 +688,7 @@ export class ProcessingHelper {
 
           return {
             success: false,
-            error: "Failed to process with Anthropic API. Please check your API key or try again later."
+            error: this.formatProviderError("anthropic", error, "Problem extraction")
           };
         }
       }
@@ -729,28 +745,31 @@ export class ProcessingHelper {
         };
       }
       
+      const config = configHelper.loadConfig();
+      const provider: APIProvider = config.apiProvider;
+
       // Handle OpenAI API errors specifically
       if (error?.response?.status === 401) {
         return {
           success: false,
-          error: "Invalid OpenAI API key. Please check your settings."
+          error: this.formatProviderError(provider, error, "Auth")
         };
       } else if (error?.response?.status === 429) {
         return {
           success: false,
-          error: "OpenAI API rate limit exceeded or insufficient credits. Please try again later."
+          error: this.formatProviderError(provider, error, "Rate limit / quota")
         };
       } else if (error?.response?.status === 500) {
         return {
           success: false,
-          error: "OpenAI server error. Please try again later."
+          error: this.formatProviderError(provider, error, "Server error")
         };
       }
 
       console.error("API Error Details:", error);
       return { 
         success: false, 
-        error: error.message || "Failed to process screenshots. Please try again." 
+        error: this.formatProviderError(provider, error, "Processing screenshots")
       };
     }
   }
@@ -850,7 +869,7 @@ Your solution should be efficient, well-commented, and handle edge cases.
 
           // Make API request to Gemini
           const response = await axios.default.post(
-            `https://generativelanguage.googleapis.com/v1beta/models/${config.solutionModel || "gemini-2.0-flash"}:generateContent?key=${this.geminiApiKey}`,
+            `https://generativelanguage.googleapis.com/v1beta/models/${config.solutionModel || DEFAULT_MODELS.gemini.solutionModel}:generateContent?key=${this.geminiApiKey}`,
             {
               contents: geminiMessages,
               generationConfig: {
@@ -872,7 +891,7 @@ Your solution should be efficient, well-commented, and handle edge cases.
           console.error("Error using Gemini API for solution:", error);
           return {
             success: false,
-            error: "Failed to generate solution with Gemini API. Please check your API key or try again later."
+            error: this.formatProviderError("gemini", error, "Solution generation")
           };
         }
       } else if (config.apiProvider === "anthropic") {
@@ -924,7 +943,7 @@ Your solution should be efficient, well-commented, and handle edge cases.
 
           return {
             success: false,
-            error: "Failed to generate solution with Anthropic API. Please check your API key or try again later."
+            error: this.formatProviderError("anthropic", error, "Solution generation")
           };
         }
       }
@@ -1009,17 +1028,17 @@ Your solution should be efficient, well-commented, and handle edge cases.
       if (error?.response?.status === 401) {
         return {
           success: false,
-          error: "Invalid OpenAI API key. Please check your settings."
+          error: this.formatProviderError(configHelper.loadConfig().apiProvider, error, "Auth")
         };
       } else if (error?.response?.status === 429) {
         return {
           success: false,
-          error: "OpenAI API rate limit exceeded or insufficient credits. Please try again later."
+          error: this.formatProviderError(configHelper.loadConfig().apiProvider, error, "Rate limit / quota")
         };
       }
       
       console.error("Solution generation error:", error);
-      return { success: false, error: error.message || "Failed to generate solution" };
+      return { success: false, error: this.formatProviderError(configHelper.loadConfig().apiProvider, error, "Solution generation") };
     }
   }
 
@@ -1171,7 +1190,7 @@ If you include code examples, use proper markdown code blocks with language spec
           }
 
           const response = await axios.default.post(
-            `https://generativelanguage.googleapis.com/v1beta/models/${config.debuggingModel || "gemini-2.0-flash"}:generateContent?key=${this.geminiApiKey}`,
+            `https://generativelanguage.googleapis.com/v1beta/models/${config.debuggingModel || DEFAULT_MODELS.gemini.debuggingModel}:generateContent?key=${this.geminiApiKey}`,
             {
               contents: geminiMessages,
               generationConfig: {
@@ -1193,7 +1212,7 @@ If you include code examples, use proper markdown code blocks with language spec
           console.error("Error using Gemini API for debugging:", error);
           return {
             success: false,
-            error: "Failed to process debug request with Gemini API. Please check your API key or try again later."
+            error: this.formatProviderError("gemini", error, "Debugging")
           };
         }
       } else if (config.apiProvider === "anthropic") {
@@ -1282,7 +1301,7 @@ If you include code examples, use proper markdown code blocks with language spec
           
           return {
             success: false,
-            error: "Failed to process debug request with Anthropic API. Please check your API key or try again later."
+            error: this.formatProviderError("anthropic", error, "Debugging")
           };
         }
       }
@@ -1327,7 +1346,7 @@ If you include code examples, use proper markdown code blocks with language spec
       return { success: true, data: response };
     } catch (error: any) {
       console.error("Debug processing error:", error);
-      return { success: false, error: error.message || "Failed to process debug request" };
+      return { success: false, error: this.formatProviderError(configHelper.loadConfig().apiProvider, error, "Debug processing") };
     }
   }
 
diff --git a/electron/TranscriptionHelper.ts b/electron/TranscriptionHelper.ts
index 63836a79..f5ebd790 100644
--- a/electron/TranscriptionHelper.ts
+++ b/electron/TranscriptionHelper.ts
@@ -1,8 +1,11 @@
 /**
- * TranscriptionHelper - Handles audio transcription using OpenAI Whisper API
+ * TranscriptionHelper - Handles audio transcription using various AI providers
  * Follows Single Responsibility Principle - only handles transcription
+ * Supports multiple providers: OpenAI (Whisper), Gemini (future), Anthropic (future)
  */
 import OpenAI from 'openai';
+import Anthropic from '@anthropic-ai/sdk';
+// import * as axios from 'axios'; // Uncomment when implementing Gemini speech recognition
 import fs from 'fs';
 import path from 'path';
 import { app } from 'electron';
@@ -19,33 +22,77 @@ export interface ITranscriptionHelper {
 
 export class TranscriptionHelper implements ITranscriptionHelper {
   private openai: OpenAI | null = null;
+  private geminiApiKey: string | null = null;
+  private anthropic: Anthropic | null = null;
   private readonly tempDir: string;
+  
+  // Default models for each provider
+  private readonly defaultOpenAIModel: string = 'whisper-1';
+  private readonly defaultGeminiModel: string = ''; // To be set when Gemini speech recognition is available
+  private readonly defaultAnthropicModel: string = ''; // To be set when Anthropic speech recognition is available
 
   constructor() {
     this.tempDir = path.join(app.getPath('temp'), 'audio-transcriptions');
     this.ensureTempDirectory();
-    this.initializeOpenAI();
+    this.initializeAIClients();
     
     // Listen for config changes to re-initialize
     configHelper.on('config-updated', () => {
-      this.initializeOpenAI();
+      this.initializeAIClients();
     });
   }
 
   /**
-   * Initializes OpenAI client with API key from config
-   * Only initializes if provider is OpenAI (Whisper only works with OpenAI)
+   * Initializes AI clients based on API provider from config
+   * Currently supports OpenAI (Whisper), with structure ready for future providers
    */
-  private initializeOpenAI(): void {
+  private initializeAIClients(): void {
     const config = configHelper.loadConfig();
-    if (config.apiProvider === "openai" && config.apiKey && config.apiKey.trim().length > 0) {
+    
+    // Reset all clients
+    this.openai = null;
+    this.geminiApiKey = null;
+    this.anthropic = null;
+    
+    if (!config.apiKey || config.apiKey.trim().length === 0) {
+      return;
+    }
+    
+    if (config.apiProvider === "openai") {
       this.openai = new OpenAI({ apiKey: config.apiKey });
-    } else if (config.apiProvider !== "openai") {
-      console.log("Speech recognition is only supported with OpenAI provider");
-      this.openai = null;
+      console.log("OpenAI transcription client initialized");
+    } else if (config.apiProvider === "gemini") {
+      // Future: Initialize Gemini client when speech recognition is available
+      this.geminiApiKey = config.apiKey;
+      console.log("Gemini API key set (speech recognition not yet available)");
+    } else if (config.apiProvider === "anthropic") {
+      // Future: Initialize Anthropic client when speech recognition is available
+      this.anthropic = new Anthropic({ apiKey: config.apiKey });
+      console.log("Anthropic client initialized (speech recognition not yet available)");
     }
   }
 
+  /**
+   * Checks if the current provider supports speech recognition
+   */
+  private isSpeechRecognitionSupported(provider: "openai" | "gemini" | "anthropic"): boolean {
+    // Currently only OpenAI supports speech recognition
+    // Update this as other providers add support
+    return provider === "openai";
+  }
+
+  /** Formats "[provider] <context> failed (status N): <message>" from SDK- or axios-shaped errors. */
+  private formatProviderError(provider: "openai" | "gemini" | "anthropic", error: any, context: string): string {
+    const status =
+      typeof error?.status === "number" ? error.status
+      : typeof error?.response?.status === "number" ? error.response.status
+      : undefined;
+    // Prefer the provider's response-body message; axios' own message only repeats the status code.
+    const message = error?.response?.data?.error?.message || error?.message || "Unknown error";
+    const statusPart = status ? ` (status ${status})` : "";
+    return `[${provider}] ${context} failed${statusPart}: ${message}`;
+  }
+
   /**
    * Ensures temp directory exists for audio files
    */
@@ -56,11 +103,11 @@ export class TranscriptionHelper implements ITranscriptionHelper {
   }
 
   /**
-   * Transcribes audio buffer using OpenAI Whisper API
+   * Transcribes audio buffer using the configured AI provider
    * @param audioBuffer - Audio data as Buffer
    * @param mimeType - MIME type of the audio (default: 'audio/webm')
    * @returns Promise resolving to transcription result
-   * @throws Error if transcription fails or OpenAI client not initialized
+   * @throws Error if transcription fails or AI client not initialized
    */
   public async transcribeAudio(
     audioBuffer: Buffer, 
@@ -68,18 +115,38 @@ export class TranscriptionHelper implements ITranscriptionHelper {
   ): Promise<TranscriptionResult> {
     const config = configHelper.loadConfig();
     
-    if (config.apiProvider !== "openai") {
-      throw new Error('Speech recognition is only supported with OpenAI provider. Please switch to OpenAI in settings.');
-    }
-    
-    if (!this.openai) {
-      throw new Error('OpenAI client not initialized. Please set OpenAI API key in settings.');
+    // Check if speech recognition is supported for the current provider
+    if (!this.isSpeechRecognitionSupported(config.apiProvider)) {
+      throw new Error(`Speech recognition is currently only supported with OpenAI provider. Please switch to OpenAI in settings.`);
     }
 
     if (!audioBuffer || audioBuffer.length === 0) {
       throw new Error('Audio buffer is empty');
     }
 
+    // Route to the appropriate provider's transcription method
+    if (config.apiProvider === "openai") {
+      return this.transcribeWithOpenAI(audioBuffer, mimeType);
+    } else if (config.apiProvider === "gemini") {
+      return this.transcribeWithGemini(audioBuffer, mimeType);
+    } else if (config.apiProvider === "anthropic") {
+      return this.transcribeWithAnthropic(audioBuffer, mimeType);
+    } else {
+      throw new Error(`Unsupported API provider: ${config.apiProvider}`);
+    }
+  }
+
+  /**
+   * Transcribes audio using OpenAI Whisper API
+   */
+  private async transcribeWithOpenAI(
+    audioBuffer: Buffer,
+    mimeType: string
+  ): Promise<TranscriptionResult> {
+    if (!this.openai) {
+      throw new Error('OpenAI client not initialized. Please set OpenAI API key in settings.');
+    }
+
     const tempPath = path.join(this.tempDir, `audio-${Date.now()}-${Math.random().toString(36).substring(7)}.webm`);
     
     try {
@@ -91,7 +158,7 @@ export class TranscriptionHelper implements ITranscriptionHelper {
       
       // Get speech recognition model from config
       const config = configHelper.loadConfig();
-      const speechModel = config.speechRecognitionModel || 'whisper-1';
+      const speechModel = config.speechRecognitionModel || this.defaultOpenAIModel;
       
       // Transcribe using Whisper API
       const transcription = await this.openai.audio.transcriptions.create({
@@ -112,19 +179,52 @@ export class TranscriptionHelper implements ITranscriptionHelper {
       // Clean up on error
       this.cleanupTempFile(tempPath);
       
-      console.error('Transcription error:', error);
+      console.error('OpenAI transcription error:', error);
       
       // Provide more specific error messages
-      if (error.status === 401) {
-        throw new Error('Invalid API key. Please check your OpenAI API key in settings.');
-      } else if (error.status === 429) {
-        throw new Error('Rate limit exceeded. Please try again in a moment.');
+      const status = error?.status ?? error?.response?.status;
+      if (status === 401) {
+        throw new Error(this.formatProviderError("openai", error, "Auth"));
+      } else if (status === 429) {
+        throw new Error(this.formatProviderError("openai", error, "Rate limit"));
       } else if (error.message?.includes('file')) {
-        throw new Error('Invalid audio file format. Please try recording again.');
+        throw new Error(this.formatProviderError("openai", error, "Invalid audio file"));
       }
-      
-      throw new Error(`Transcription failed: ${error.message || 'Unknown error'}`);
+
+      throw new Error(this.formatProviderError("openai", error, "Transcription"));
+    }
+  }
+
+  /**
+   * Transcribes audio using Gemini API (Future implementation)
+   * TODO: Implement when Gemini speech recognition becomes available
+   */
+  private async transcribeWithGemini(
+    audioBuffer: Buffer,
+    mimeType: string
+  ): Promise<TranscriptionResult> {
+    if (!this.geminiApiKey) {
+      throw new Error('Gemini API key not initialized. Please set Gemini API key in settings.');
+    }
+
+    // TODO: Implement Gemini speech recognition when available
+    throw new Error('Gemini speech recognition is not yet available. Please use OpenAI provider for transcription.');
+  }
+
+  /**
+   * Transcribes audio using Anthropic API (Future implementation)
+   * TODO: Implement when Anthropic speech recognition becomes available
+   */
+  private async transcribeWithAnthropic(
+    audioBuffer: Buffer,
+    mimeType: string
+  ): Promise<TranscriptionResult> {
+    if (!this.anthropic) {
+      throw new Error('Anthropic client not initialized. Please set Anthropic API key in settings.');
     }
+
+    // TODO: Implement Anthropic speech recognition when available
+    throw new Error('Anthropic speech recognition is not yet available. Please use OpenAI provider for transcription.');
   }
 
   /**
@@ -142,9 +242,17 @@ export class TranscriptionHelper implements ITranscriptionHelper {
   }
 
   /**
-   * Checks if OpenAI client is initialized
+   * Checks if any AI client is initialized
    */
   public isInitialized(): boolean {
-    return this.openai !== null;
+    return this.openai !== null || this.geminiApiKey !== null || this.anthropic !== null;
+  }
+
+  /**
+   * Checks if speech recognition is available for the current provider
+   */
+  public isSpeechRecognitionAvailable(): boolean {
+    const config = configHelper.loadConfig();
+    return this.isSpeechRecognitionSupported(config.apiProvider) && this.isInitialized();
   }
 }
diff --git a/shared/aiModels.ts b/shared/aiModels.ts
new file mode 100644
index 00000000..45fdb6b7
--- /dev/null
+++ b/shared/aiModels.ts
@@ -0,0 +1,325 @@
+// shared/aiModels.ts
+// Central configuration for AI providers, models, and related helpers.
+// This module is the single source of truth for:
+// - Supported providers
+// - Available models per provider and category
+// - Default models per provider and category
+// - Model validation/sanitization
+//
+// Changing models or providers should only require edits in this file.
+
+export type APIProvider = "openai" | "gemini" | "anthropic";
+
+export type ModelCategoryKey =
+  | "extractionModel"
+  | "solutionModel"
+  | "debuggingModel";
+
+export interface AIModel {
+  id: string;
+  name: string;
+  description: string;
+}
+
+export interface ModelCategoryDefinition {
+  key: ModelCategoryKey;
+  title: string;
+  description: string;
+  modelsByProvider: Record<APIProvider, AIModel[]>;
+}
+
+/**
+ * Default provider used when no provider is configured or an invalid provider is found.
+ */
+export const DEFAULT_PROVIDER: APIProvider = "gemini";
+
+/**
+ * Default models per provider and category.
+ * These are used for:
+ * - Initial config defaults
+ * - Resetting models when provider changes
+ * - Fallbacks when a model is missing in config
+ */
+export const DEFAULT_MODELS: Record<
+  APIProvider,
+  {
+    extractionModel: string;
+    solutionModel: string;
+    debuggingModel: string;
+    // Speech recognition is only supported for OpenAI right now.
+    speechRecognitionModel?: string;
+  }
+> = {
+  openai: {
+    extractionModel: "gpt-4o",
+    solutionModel: "gpt-4o",
+    debuggingModel: "gpt-4o",
+    speechRecognitionModel: "whisper-1",
+  },
+  gemini: {
+    extractionModel: "gemini-3-flash-preview",
+    solutionModel: "gemini-3-flash-preview",
+    debuggingModel: "gemini-3-flash-preview",
+  },
+  anthropic: {
+    extractionModel: "claude-3-7-sonnet-20250219",
+    solutionModel: "claude-3-7-sonnet-20250219",
+    debuggingModel: "claude-3-7-sonnet-20250219",
+  },
+};
+
+/**
+ * Default models specifically for the answer suggestion assistant.
+ * This allows us to evolve those independently from the screenshot
+ * processing defaults if needed.
+ */
+export const DEFAULT_ANSWER_MODELS: Record<APIProvider, string> = {
+  openai: "gpt-4o-mini",
+  gemini: "gemini-3-flash-preview",
+  anthropic: "claude-3-7-sonnet-20250219",
+};
+
+/**
+ * Allowed model ids per provider.
+ * Used for validation/sanitization when reading or updating config.
+ */
+export const ALLOWED_MODELS: Record<APIProvider, string[]> = {
+  openai: [
+    "gpt-4o",
+    "gpt-4o-mini",
+  ],
+  gemini: [
+    // Current Gemini 3 models (preview)
+    "gemini-3-pro-preview",
+    "gemini-3-flash-preview",
+    "gemini-3-pro-image-preview",
+    // Legacy models kept for backwards compatibility
+    "gemini-1.5-pro",
+    "gemini-1.5-flash",
+    "gemini-2.0-flash-exp",
+  ],
+  anthropic: [
+    "claude-3-7-sonnet-20250219",
+    "claude-3-5-sonnet-20241022",
+    "claude-3-opus-20240229",
+  ],
+};
+
+/**
+ * Settings UI model catalogue, organized by functional category and provider.
+ *
+ * Each entry describes one configurable model slot (`key`) and, for every
+ * provider, the models offered for that slot.
+ *
+ * Every `id` listed here must also appear in `ALLOWED_MODELS` for the same
+ * provider. `sanitizeModelSelection` replaces any id missing from that
+ * allow-list with the provider default, so an unlisted id could never
+ * actually be used.
+ */
+export const MODEL_CATEGORIES: ModelCategoryDefinition[] = [
+  {
+    key: "extractionModel",
+    title: "Problem Extraction",
+    description:
+      "Model used to analyze screenshots and extract problem details",
+    modelsByProvider: {
+      openai: [
+        {
+          id: "gpt-4o",
+          name: "gpt-4o",
+          description: "Best overall performance for problem extraction",
+        },
+        {
+          id: "gpt-4o-mini",
+          name: "gpt-4o-mini",
+          description: "Faster, more cost-effective option",
+        },
+      ],
+      // Gemini ids must match ALLOWED_MODELS.gemini.
+      gemini: [
+        {
+          id: "gemini-3-pro-preview",
+          name: "Gemini 3 Pro (Preview)",
+          description: "Best overall performance for complex tasks requiring advanced reasoning",
+        },
+        {
+          id: "gemini-3-flash-preview",
+          name: "Gemini 3 Flash (Preview)",
+          description: "Pro-level intelligence at Flash speed and pricing",
+        },
+        {
+          id: "gemini-1.5-pro",
+          name: "Gemini 1.5 Pro",
+          description: "Legacy model - use Gemini 3 for best results",
+        },
+        {
+          id: "gemini-1.5-flash",
+          name: "Gemini 1.5 Flash",
+          description: "Legacy model - use Gemini 3 Flash for best results",
+        },
+      ],
+      anthropic: [
+        {
+          id: "claude-3-7-sonnet-20250219",
+          name: "Claude 3.7 Sonnet",
+          description: "Best overall performance for problem extraction",
+        },
+        {
+          id: "claude-3-5-sonnet-20241022",
+          name: "Claude 3.5 Sonnet",
+          description: "Balanced performance and speed",
+        },
+        {
+          id: "claude-3-opus-20240229",
+          name: "Claude 3 Opus",
+          description:
+            "Top-level intelligence, fluency, and understanding",
+        },
+      ],
+    },
+  },
+  {
+    key: "solutionModel",
+    title: "Solution Generation",
+    description: "Model used to generate coding solutions",
+    modelsByProvider: {
+      openai: [
+        {
+          id: "gpt-4o",
+          name: "gpt-4o",
+          description: "Strong overall performance for coding tasks",
+        },
+        {
+          id: "gpt-4o-mini",
+          name: "gpt-4o-mini",
+          description: "Faster, more cost-effective option",
+        },
+      ],
+      // Gemini ids must match ALLOWED_MODELS.gemini.
+      gemini: [
+        {
+          id: "gemini-3-pro-preview",
+          name: "Gemini 3 Pro (Preview)",
+          description: "Strong overall performance for coding tasks",
+        },
+        {
+          id: "gemini-3-flash-preview",
+          name: "Gemini 3 Flash (Preview)",
+          description: "Faster, more cost-effective option",
+        },
+        {
+          id: "gemini-1.5-pro",
+          name: "Gemini 1.5 Pro",
+          description: "Legacy model - use Gemini 3 for best results",
+        },
+        {
+          id: "gemini-1.5-flash",
+          name: "Gemini 1.5 Flash",
+          description: "Legacy model - use Gemini 3 Flash for best results",
+        },
+      ],
+      anthropic: [
+        {
+          id: "claude-3-7-sonnet-20250219",
+          name: "Claude 3.7 Sonnet",
+          description: "Strong overall performance for coding tasks",
+        },
+        {
+          id: "claude-3-5-sonnet-20241022",
+          name: "Claude 3.5 Sonnet",
+          description: "Balanced performance and speed",
+        },
+        {
+          id: "claude-3-opus-20240229",
+          name: "Claude 3 Opus",
+          description:
+            "Top-level intelligence, fluency, and understanding",
+        },
+      ],
+    },
+  },
+  {
+    key: "debuggingModel",
+    title: "Debugging",
+    description: "Model used to debug and improve solutions",
+    modelsByProvider: {
+      openai: [
+        {
+          id: "gpt-4o",
+          name: "gpt-4o",
+          description: "Best for analyzing code and error messages",
+        },
+        {
+          id: "gpt-4o-mini",
+          name: "gpt-4o-mini",
+          description: "Faster, more cost-effective option",
+        },
+      ],
+      // Gemini ids must match ALLOWED_MODELS.gemini.
+      gemini: [
+        {
+          id: "gemini-3-pro-preview",
+          name: "Gemini 3 Pro (Preview)",
+          description: "Best for analyzing code and error messages",
+        },
+        {
+          id: "gemini-3-flash-preview",
+          name: "Gemini 3 Flash (Preview)",
+          description: "Faster, more cost-effective option",
+        },
+        {
+          id: "gemini-1.5-pro",
+          name: "Gemini 1.5 Pro",
+          description: "Legacy model - use Gemini 3 for best results",
+        },
+        {
+          id: "gemini-1.5-flash",
+          name: "Gemini 1.5 Flash",
+          description: "Legacy model - use Gemini 3 Flash for best results",
+        },
+      ],
+      anthropic: [
+        {
+          id: "claude-3-7-sonnet-20250219",
+          name: "Claude 3.7 Sonnet",
+          description: "Best for analyzing code and error messages",
+        },
+        {
+          id: "claude-3-5-sonnet-20241022",
+          name: "Claude 3.5 Sonnet",
+          description: "Balanced performance and speed",
+        },
+        {
+          id: "claude-3-opus-20240229",
+          name: "Claude 3 Opus",
+          description:
+            "Top-level intelligence, fluency, and understanding",
+        },
+      ],
+    },
+  },
+];
+
+/**
+ * Returns `model` unchanged when it is on the provider's allow-list.
+ * Otherwise logs a warning and returns the provider's default model
+ * for the requested category instead.
+ */
+export function sanitizeModelSelection(
+  model: string,
+  provider: APIProvider,
+  category: ModelCategoryKey
+): string {
+  const isAllowed = ALLOWED_MODELS[provider].includes(model);
+  if (!isAllowed) {
+    const defaultModel = DEFAULT_MODELS[provider][category];
+    // eslint-disable-next-line no-console
+    console.warn(
+      `Invalid ${provider} model specified for ${category}: ${model}. Using default model: ${defaultModel}`
+    );
+    return defaultModel;
+  }
+
+  return model;
+}
+
diff --git a/src/components/Settings/SettingsDialog.tsx b/src/components/Settings/SettingsDialog.tsx
index b8f70b5c..7cfb52f6 100644
--- a/src/components/Settings/SettingsDialog.tsx
+++ b/src/components/Settings/SettingsDialog.tsx
@@ -13,165 +13,12 @@ import { Button } from "../ui/button";
 import { Settings } from "lucide-react";
 import { useToast } from "../../contexts/toast";
 import { CandidateProfileSection, CandidateProfile } from "./CandidateProfileSection";
-
-type APIProvider = "openai" | "gemini" | "anthropic";
-
-type AIModel = {
-  id: string;
-  name: string;
-  description: string;
-};
-
-type ModelCategory = {
-  key: 'extractionModel' | 'solutionModel' | 'debuggingModel';
-  title: string;
-  description: string;
-  openaiModels: AIModel[];
-  geminiModels: AIModel[];
-  anthropicModels: AIModel[];
-};
-
-// Define available models for each category
-const modelCategories: ModelCategory[] = [
-  {
-    key: 'extractionModel',
-    title: 'Problem Extraction',
-    description: 'Model used to analyze screenshots and extract problem details',
-    openaiModels: [
-      {
-        id: "gpt-4o",
-        name: "gpt-4o",
-        description: "Best overall performance for problem extraction"
-      },
-      {
-        id: "gpt-4o-mini",
-        name: "gpt-4o-mini",
-        description: "Faster, more cost-effective option"
-      }
-    ],
-    geminiModels: [
-      {
-        id: "gemini-1.5-pro",
-        name: "Gemini 1.5 Pro",
-        description: "Best overall performance for problem extraction"
-      },
-      {
-        id: "gemini-2.0-flash",
-        name: "Gemini 2.0 Flash",
-        description: "Faster, more cost-effective option"
-      }
-    ],
-    anthropicModels: [
-      {
-        id: "claude-3-7-sonnet-20250219",
-        name: "Claude 3.7 Sonnet",
-        description: "Best overall performance for problem extraction"
-      },
-      {
-        id: "claude-3-5-sonnet-20241022",
-        name: "Claude 3.5 Sonnet",
-        description: "Balanced performance and speed"
-      },
-      {
-        id: "claude-3-opus-20240229",
-        name: "Claude 3 Opus",
-        description: "Top-level intelligence, fluency, and understanding"
-      }
-    ]
-  },
-  {
-    key: 'solutionModel',
-    title: 'Solution Generation',
-    description: 'Model used to generate coding solutions',
-    openaiModels: [
-      {
-        id: "gpt-4o",
-        name: "gpt-4o",
-        description: "Strong overall performance for coding tasks"
-      },
-      {
-        id: "gpt-4o-mini",
-        name: "gpt-4o-mini",
-        description: "Faster, more cost-effective option"
-      }
-    ],
-    geminiModels: [
-      {
-        id: "gemini-1.5-pro",
-        name: "Gemini 1.5 Pro",
-        description: "Strong overall performance for coding tasks"
-      },
-      {
-        id: "gemini-2.0-flash",
-        name: "Gemini 2.0 Flash",
-        description: "Faster, more cost-effective option"
-      }
-    ],
-    anthropicModels: [
-      {
-        id: "claude-3-7-sonnet-20250219",
-        name: "Claude 3.7 Sonnet",
-        description: "Strong overall performance for coding tasks"
-      },
-      {
-        id: "claude-3-5-sonnet-20241022",
-        name: "Claude 3.5 Sonnet",
-        description: "Balanced performance and speed"
-      },
-      {
-        id: "claude-3-opus-20240229",
-        name: "Claude 3 Opus",
-        description: "Top-level intelligence, fluency, and understanding"
-      }
-    ]
-  },
-  {
-    key: 'debuggingModel',
-    title: 'Debugging',
-    description: 'Model used to debug and improve solutions',
-    openaiModels: [
-      {
-        id: "gpt-4o",
-        name: "gpt-4o",
-        description: "Best for analyzing code and error messages"
-      },
-      {
-        id: "gpt-4o-mini",
-        name: "gpt-4o-mini",
-        description: "Faster, more cost-effective option"
-      }
-    ],
-    geminiModels: [
-      {
-        id: "gemini-1.5-pro",
-        name: "Gemini 1.5 Pro",
-        description: "Best for analyzing code and error messages"
-      },
-      {
-        id: "gemini-2.0-flash",
-        name: "Gemini 2.0 Flash",
-        description: "Faster, more cost-effective option"
-      }
-    ],
-    anthropicModels: [
-      {
-        id: "claude-3-7-sonnet-20250219",
-        name: "Claude 3.7 Sonnet",
-        description: "Best for analyzing code and error messages"
-      },
-      {
-        id: "claude-3-5-sonnet-20241022",
-        name: "Claude 3.5 Sonnet",
-        description: "Balanced performance and speed"
-      },
-      {
-        id: "claude-3-opus-20240229",
-        name: "Claude 3 Opus",
-        description: "Top-level intelligence, fluency, and understanding"
-      }
-    ]
-  }
-];
+import {
+  APIProvider,
+  AIModel,
+  MODEL_CATEGORIES,
+  DEFAULT_MODELS,
+} from "../../../shared/aiModels";
 
 interface SettingsDialogProps {
   open?: boolean;
@@ -182,9 +29,15 @@ export function SettingsDialog({ open: externalOpen, onOpenChange }: SettingsDia
   const [open, setOpen] = useState(externalOpen || false);
   const [apiKey, setApiKey] = useState("");
   const [apiProvider, setApiProvider] = useState<APIProvider>("openai");
-  const [extractionModel, setExtractionModel] = useState("gpt-4o");
-  const [solutionModel, setSolutionModel] = useState("gpt-4o");
-  const [debuggingModel, setDebuggingModel] = useState("gpt-4o");
+  const [extractionModel, setExtractionModel] = useState(
+    DEFAULT_MODELS.openai.extractionModel
+  );
+  const [solutionModel, setSolutionModel] = useState(
+    DEFAULT_MODELS.openai.solutionModel
+  );
+  const [debuggingModel, setDebuggingModel] = useState(
+    DEFAULT_MODELS.openai.debuggingModel
+  );
   const [speechRecognitionModel, setSpeechRecognitionModel] = useState("whisper-1");
   const [candidateProfile, setCandidateProfile] = useState<CandidateProfile>({
     name: "",
@@ -228,11 +81,23 @@ export function SettingsDialog({ open: externalOpen, onOpenChange }: SettingsDia
         .getConfig()
         .then((config: Config) => {
           setApiKey(config.apiKey || "");
-          setApiProvider(config.apiProvider || "openai");
-          setExtractionModel(config.extractionModel || "gpt-4o");
-          setSolutionModel(config.solutionModel || "gpt-4o");
-          setDebuggingModel(config.debuggingModel || "gpt-4o");
-          setSpeechRecognitionModel(config.speechRecognitionModel || "whisper-1");
+          const provider: APIProvider = config.apiProvider || "openai";
+          setApiProvider(provider);
+          const providerDefaults = DEFAULT_MODELS[provider];
+          setExtractionModel(
+            config.extractionModel || providerDefaults.extractionModel
+          );
+          setSolutionModel(
+            config.solutionModel || providerDefaults.solutionModel
+          );
+          setDebuggingModel(
+            config.debuggingModel || providerDefaults.debuggingModel
+          );
+          setSpeechRecognitionModel(
+            config.speechRecognitionModel ||
+              providerDefaults.speechRecognitionModel ||
+              "whisper-1"
+          );
           setCandidateProfile(config.candidateProfile || {
             name: "",
             resume: "",
@@ -254,22 +119,13 @@ export function SettingsDialog({ open: externalOpen, onOpenChange }: SettingsDia
     setApiProvider(provider);
     
     // Reset models to defaults when changing provider
-    if (provider === "openai") {
-      setExtractionModel("gpt-4o");
-      setSolutionModel("gpt-4o");
-      setDebuggingModel("gpt-4o");
-      setSpeechRecognitionModel("whisper-1");
-    } else if (provider === "gemini") {
-      setExtractionModel("gemini-1.5-pro");
-      setSolutionModel("gemini-1.5-pro");
-      setDebuggingModel("gemini-1.5-pro");
-      setSpeechRecognitionModel("whisper-1"); // Keep whisper-1 but will show as not supported
-    } else if (provider === "anthropic") {
-      setExtractionModel("claude-3-7-sonnet-20250219");
-      setSolutionModel("claude-3-7-sonnet-20250219");
-      setDebuggingModel("claude-3-7-sonnet-20250219");
-      setSpeechRecognitionModel("whisper-1"); // Keep whisper-1 but will show as not supported
-    }
+    const defaults = DEFAULT_MODELS[provider];
+    setExtractionModel(defaults.extractionModel);
+    setSolutionModel(defaults.solutionModel);
+    setDebuggingModel(defaults.debuggingModel);
+    setSpeechRecognitionModel(
+      defaults.speechRecognitionModel || "whisper-1"
+    );
   };
 
   const handleSave = async () => {
@@ -391,7 +247,7 @@ export function SettingsDialog({ open: externalOpen, onOpenChange }: SettingsDia
                   />
                   <div className="flex flex-col">
                     <p className="font-medium text-white text-sm">Gemini</p>
-                    <p className="text-xs text-white/60">Gemini 1.5 models</p>
+                    <p className="text-xs text-white/60">Gemini 3 models</p>
                   </div>
                 </div>
               </div>
@@ -541,12 +397,9 @@ export function SettingsDialog({ open: externalOpen, onOpenChange }: SettingsDia
               Select which models to use for each stage of the process
             </p>
             
-            {modelCategories.map((category) => {
+            {MODEL_CATEGORIES.map((category) => {
               // Get the appropriate model list based on selected provider
-              const models = 
-                apiProvider === "openai" ? category.openaiModels : 
-                apiProvider === "gemini" ? category.geminiModels :
-                category.anthropicModels;
+              const models: AIModel[] = category.modelsByProvider[apiProvider];
               
               return (
                 <div key={category.key} className="mb-4">
diff --git a/tsconfig.electron.json b/tsconfig.electron.json
index daa45613..34497688 100644
--- a/tsconfig.electron.json
+++ b/tsconfig.electron.json
@@ -16,5 +16,5 @@
       "main": ["electron/main.ts"]
     }
   },
-  "include": ["electron/**/*"]
+  "include": ["electron/**/*", "shared/**/*"]
 }
diff --git a/tsconfig.json b/tsconfig.json
index a831c76b..39abecef 100644
--- a/tsconfig.json
+++ b/tsconfig.json
@@ -19,6 +19,6 @@
     "allowImportingTsExtensions": true,
     "types": ["vite/client"]
   },
-  "include": ["electron/**/*", "src/**/*"],
+  "include": ["electron/**/*", "src/**/*", "shared/**/*"],
   "references": [{ "path": "./tsconfig.node.json" }]
 }

From 96cc2142ed3732aa0fbf860f1f8b9a1fba1cf83a Mon Sep 17 00:00:00 2001
From: Pratik Shankar Jadhav
 <44173994+pratikjadhav2726@users.noreply.github.com>
Date: Thu, 22 Jan 2026 02:24:55 -0800
Subject: [PATCH 12/13] feat: enhance support for speech recognition by adding
 Gemini models and improving suggestion parsing for multi-line inputs

---
 electron/AnswerAssistant.ts                |  68 ++++++++++---
 electron/ConfigHelper.ts                   |  35 ++++++-
 electron/TranscriptionHelper.ts            | 111 ++++++++++++++++++---
 shared/aiModels.ts                         |   3 +-
 src/components/Settings/SettingsDialog.tsx |  90 ++++++++++++++++-
 5 files changed, 269 insertions(+), 38 deletions(-)

diff --git a/electron/AnswerAssistant.ts b/electron/AnswerAssistant.ts
index 6a8c7f75..f5455c06 100644
--- a/electron/AnswerAssistant.ts
+++ b/electron/AnswerAssistant.ts
@@ -311,26 +311,64 @@ Format as simple bullet points, one per line starting with "-".`;
 
   /**
    * Parses AI response into structured suggestions
+   * Handles multi-line suggestions and text after colons (e.g., "Explain that: ...")
    */
   private parseSuggestions(suggestionsText: string): string[] {
-    return suggestionsText
-      .split('\n')
-      .map(line => line.trim())
-      .filter(line => {
-        // Match bullet points, numbered lists, or lines starting with common prefixes
-        return line.startsWith('-') || 
-               line.startsWith('•') || 
-               line.match(/^\d+\./) ||
-               (line.length > 0 && line.length < 200); // Reasonable length
-      })
-      .map(line => {
-        // Remove bullet/number prefixes
-        return line
+    const lines = suggestionsText.split('\n').map(line => line.trim());
+    const suggestions: string[] = [];
+    let currentSuggestion = '';
+
+    for (let i = 0; i < lines.length; i++) {
+      const line = lines[i];
+      
+      // Empty line: flush the suggestion in progress (if any), then skip
+      if (!line) {
+        if (currentSuggestion) {
+          suggestions.push(currentSuggestion.trim());
+          currentSuggestion = '';
+        }
+        continue;
+      }
+
+      // Check if this line starts a new suggestion (bullet point, numbered item, or a short line directly after a blank line)
+      const isNewSuggestion = 
+        line.startsWith('-') || 
+        line.startsWith('•') || 
+        line.match(/^\d+\./) ||
+        (i > 0 && !lines[i - 1] && line.length > 0 && line.length < 200);
+
+      if (isNewSuggestion) {
+        // Save previous suggestion if exists
+        if (currentSuggestion) {
+          suggestions.push(currentSuggestion.trim());
+        }
+        // Start new suggestion, removing bullet/number prefix
+        currentSuggestion = line
           .replace(/^[-•]\s*/, '')
           .replace(/^\d+\.\s*/, '')
           .trim();
-      })
-      .filter(line => line.length > 0 && line.length < 200); // Filter out empty or too long
+      } else if (currentSuggestion) {
+        // Continue current suggestion (multi-line)
+        currentSuggestion += ' ' + line;
+      } else if (line.length > 0 && line.length < 200) {
+        // Standalone line that might be a suggestion
+        currentSuggestion = line;
+      }
+    }
+
+    // Don't forget the last suggestion
+    if (currentSuggestion) {
+      suggestions.push(currentSuggestion.trim());
+    }
+
+    // Filter out empty or too long suggestions, and clean up
+    return suggestions
+      .map(s => s.trim())
+      .filter(s => s.length > 0 && s.length < 500) // Increased limit for multi-line suggestions
+      .map(s => {
+        // Clean up any extra whitespace
+        return s.replace(/\s+/g, ' ').trim();
+      });
   }
 
   /**
diff --git a/electron/ConfigHelper.ts b/electron/ConfigHelper.ts
index 60989c2b..13945d15 100644
--- a/electron/ConfigHelper.ts
+++ b/electron/ConfigHelper.ts
@@ -114,10 +114,21 @@ export class ConfigHelper extends EventEmitter {
           );
         }
         
-        // Ensure speechRecognitionModel is valid (only whisper-1 for OpenAI)
-        if (config.speechRecognitionModel && config.apiProvider === "openai") {
-          if (config.speechRecognitionModel !== "whisper-1") {
+        // Ensure speechRecognitionModel is valid
+        if (config.speechRecognitionModel) {
+          if (config.apiProvider === "openai" && config.speechRecognitionModel !== "whisper-1") {
             config.speechRecognitionModel = "whisper-1";
+          } else if (config.apiProvider === "gemini") {
+            const allowedGeminiSpeechModels = [
+              "gemini-1.5-flash",
+              "gemini-1.5-pro",
+              "gemini-3-flash-preview",
+              "gemini-3-pro-preview",
+              "gemini-2.0-flash-exp"
+            ];
+            if (!allowedGeminiSpeechModels.includes(config.speechRecognitionModel)) {
+              config.speechRecognitionModel = DEFAULT_MODELS.gemini.speechRecognitionModel || "gemini-3-flash-preview";
+            }
           }
         } else if (!config.speechRecognitionModel) {
           config.speechRecognitionModel = this.defaultConfig.speechRecognitionModel;
@@ -187,17 +198,31 @@ export class ConfigHelper extends EventEmitter {
         updates.extractionModel = defaults.extractionModel;
         updates.solutionModel = defaults.solutionModel;
         updates.debuggingModel = defaults.debuggingModel;
-        // Speech recognition currently only supported for OpenAI
+        // Speech recognition supported for OpenAI and Gemini
         if (defaults.speechRecognitionModel) {
           updates.speechRecognitionModel = defaults.speechRecognitionModel;
         }
       }
       
-      // Validate speech recognition model (only whisper-1 is supported, and only for OpenAI)
+      // Validate speech recognition model
       if (updates.speechRecognitionModel) {
         if (provider === "openai" && updates.speechRecognitionModel !== "whisper-1") {
           console.warn(`Invalid speech recognition model: ${updates.speechRecognitionModel}. Only whisper-1 is supported for OpenAI.`);
           updates.speechRecognitionModel = "whisper-1";
+        } else if (provider === "gemini") {
+          // Validate Gemini models that support audio understanding
+          const allowedGeminiSpeechModels = [
+            "gemini-1.5-flash",
+            "gemini-1.5-pro",
+            "gemini-3-flash-preview",
+            "gemini-3-pro-preview",
+            "gemini-2.0-flash-exp"
+          ];
+          if (!allowedGeminiSpeechModels.includes(updates.speechRecognitionModel)) {
+            const defaultModel = DEFAULT_MODELS[provider].speechRecognitionModel || "gemini-3-flash-preview";
+            console.warn(`Invalid Gemini speech recognition model: ${updates.speechRecognitionModel}. Using default: ${defaultModel}`);
+            updates.speechRecognitionModel = defaultModel;
+          }
         }
       }
       
diff --git a/electron/TranscriptionHelper.ts b/electron/TranscriptionHelper.ts
index f5ebd790..a61d0aa7 100644
--- a/electron/TranscriptionHelper.ts
+++ b/electron/TranscriptionHelper.ts
@@ -1,11 +1,11 @@
 /**
  * TranscriptionHelper - Handles audio transcription using various AI providers
  * Follows Single Responsibility Principle - only handles transcription
- * Supports multiple providers: OpenAI (Whisper), Gemini (future), Anthropic (future)
+ * Supports multiple providers: OpenAI (Whisper), Gemini (Audio Understanding), Anthropic (future)
  */
 import OpenAI from 'openai';
 import Anthropic from '@anthropic-ai/sdk';
-// import * as axios from 'axios'; // Uncomment when implementing Gemini speech recognition
+import * as axios from 'axios';
 import fs from 'fs';
 import path from 'path';
 import { app } from 'electron';
@@ -28,7 +28,7 @@ export class TranscriptionHelper implements ITranscriptionHelper {
   
   // Default models for each provider
   private readonly defaultOpenAIModel: string = 'whisper-1';
-  private readonly defaultGeminiModel: string = ''; // To be set when Gemini speech recognition is available
+  private readonly defaultGeminiModel: string = 'gemini-3-flash-preview'; // Gemini model with audio understanding support
   private readonly defaultAnthropicModel: string = ''; // To be set when Anthropic speech recognition is available
 
   constructor() {
@@ -44,7 +44,7 @@ export class TranscriptionHelper implements ITranscriptionHelper {
 
   /**
    * Initializes AI clients based on API provider from config
-   * Currently supports OpenAI (Whisper), with structure ready for future providers
+   * Supports OpenAI (Whisper) and Gemini (Audio Understanding)
    */
   private initializeAIClients(): void {
     const config = configHelper.loadConfig();
@@ -62,9 +62,8 @@ export class TranscriptionHelper implements ITranscriptionHelper {
       this.openai = new OpenAI({ apiKey: config.apiKey });
       console.log("OpenAI transcription client initialized");
     } else if (config.apiProvider === "gemini") {
-      // Future: Initialize Gemini client when speech recognition is available
       this.geminiApiKey = config.apiKey;
-      console.log("Gemini API key set (speech recognition not yet available)");
+      console.log("Gemini API key set for audio understanding");
     } else if (config.apiProvider === "anthropic") {
       // Future: Initialize Anthropic client when speech recognition is available
       this.anthropic = new Anthropic({ apiKey: config.apiKey });
@@ -76,9 +75,8 @@ export class TranscriptionHelper implements ITranscriptionHelper {
    * Checks if the current provider supports speech recognition
    */
   private isSpeechRecognitionSupported(provider: "openai" | "gemini" | "anthropic"): boolean {
-    // Currently only OpenAI supports speech recognition
-    // Update this as other providers add support
-    return provider === "openai";
+    // OpenAI (Whisper) and Gemini (Audio Understanding) support speech recognition
+    return provider === "openai" || provider === "gemini";
   }
 
   private formatProviderError(provider: "openai" | "gemini" | "anthropic", error: any, context: string): string {
@@ -117,7 +115,7 @@ export class TranscriptionHelper implements ITranscriptionHelper {
     
     // Check if speech recognition is supported for the current provider
     if (!this.isSpeechRecognitionSupported(config.apiProvider)) {
-      throw new Error(`Speech recognition is currently only supported with OpenAI provider. Please switch to OpenAI in settings.`);
+      throw new Error(`Speech recognition is currently only supported with OpenAI or Gemini providers. Please switch to one of these providers in settings.`);
     }
 
     if (!audioBuffer || audioBuffer.length === 0) {
@@ -196,8 +194,8 @@ export class TranscriptionHelper implements ITranscriptionHelper {
   }
 
   /**
-   * Transcribes audio using Gemini API (Future implementation)
-   * TODO: Implement when Gemini speech recognition becomes available
+   * Transcribes audio using Gemini API Audio Understanding
+   * Uses Gemini's multimodal capabilities to transcribe audio to text
    */
   private async transcribeWithGemini(
     audioBuffer: Buffer,
@@ -207,8 +205,103 @@ export class TranscriptionHelper implements ITranscriptionHelper {
       throw new Error('Gemini API key not initialized. Please set Gemini API key in settings.');
     }
 
-    // TODO: Implement Gemini speech recognition when available
-    throw new Error('Gemini speech recognition is not yet available. Please use OpenAI provider for transcription.');
+    // Resolve the model: the configured speech recognition model, else the Gemini default
+    const config = configHelper.loadConfig();
+    const speechModel = config.speechRecognitionModel || this.defaultGeminiModel;
+
+    try {
+      // Inline audio is sent to Gemini as base64-encoded data
+      const audioBase64 = audioBuffer.toString('base64');
+
+      // Normalize MIME type for Gemini API.
+      // Callers may pass a parameterized type (e.g. "audio/webm;codecs=opus");
+      // drop the parameters and lowercase the media type before mapping it, so the
+      // request carries a bare type such as "audio/webm".
+      const baseMimeType = mimeType.split(';')[0].trim().toLowerCase();
+      let normalizedMimeType = baseMimeType;
+      if (baseMimeType.includes('webm')) {
+        normalizedMimeType = 'audio/webm';
+      } else if (baseMimeType.includes('mp3') || baseMimeType.includes('mpeg')) {
+        normalizedMimeType = 'audio/mpeg';
+      } else if (baseMimeType.includes('wav')) {
+        normalizedMimeType = 'audio/wav';
+      } else if (baseMimeType.includes('flac')) {
+        normalizedMimeType = 'audio/flac';
+      } else if (baseMimeType.includes('m4a')) {
+        normalizedMimeType = 'audio/m4a';
+      } else if (baseMimeType.includes('ogg')) {
+        normalizedMimeType = 'audio/ogg';
+      }
+
+      // Create Gemini message with the transcription prompt followed by the audio data
+      const geminiMessages = [
+        {
+          role: "user",
+          parts: [
+            {
+              text: "Please transcribe this audio to text. Return only the transcribed text without any additional commentary."
+            },
+            {
+              inlineData: {
+                mimeType: normalizedMimeType,
+                data: audioBase64
+              }
+            }
+          ]
+        }
+      ];
+
+      // Make API request to Gemini
+      const response = await axios.default.post(
+        `https://generativelanguage.googleapis.com/v1beta/models/${speechModel}:generateContent?key=${this.geminiApiKey}`,
+        {
+          contents: geminiMessages,
+          generationConfig: {
+            temperature: 0.1, // Low temperature for accurate transcription
+            maxOutputTokens: 4096
+          }
+        }
+      );
+
+      const responseData = response.data;
+
+      // A usable response needs at least one candidate carrying content parts.
+      // Guard every level so a candidate without content surfaces as a clear error
+      // instead of a TypeError from dereferencing parts[0].
+      const parts = responseData?.candidates?.[0]?.content?.parts;
+      if (!Array.isArray(parts) || parts.length === 0) {
+        throw new Error("Empty response from Gemini API");
+      }
+
+      // Join every text part; parts without a string `text` contribute nothing
+      const transcriptionText = parts
+        .map((part: { text?: unknown }) => (typeof part?.text === 'string' ? part.text : ''))
+        .join('')
+        .trim();
+
+      // Gemini doesn't provide language detection in the same way as Whisper.
+      // Pick up a "[Language: xx]" marker if the reply contains one, otherwise leave it undefined.
+      const language = transcriptionText.match(/\[Language: (\w+)\]/)?.[1];
+
+      return {
+        text: transcriptionText,
+        language: language || undefined,
+      };
+    } catch (error: any) {
+      console.error('Gemini transcription error:', error);
+
+      // Provide more specific error messages
+      const status = error?.status ?? error?.response?.status;
+      if (status === 401) {
+        throw new Error(this.formatProviderError("gemini", error, "Auth"));
+      } else if (status === 429) {
+        throw new Error(this.formatProviderError("gemini", error, "Rate limit"));
+      } else if (status === 400) {
+        throw new Error(this.formatProviderError("gemini", error, "Invalid audio file or request"));
+      }
+
+      throw new Error(this.formatProviderError("gemini", error, "Transcription"));
+    }
   }
 
   /**
diff --git a/shared/aiModels.ts b/shared/aiModels.ts
index 45fdb6b7..f95a8b2b 100644
--- a/shared/aiModels.ts
+++ b/shared/aiModels.ts
@@ -46,7 +46,7 @@ export const DEFAULT_MODELS: Record<
     extractionModel: string;
     solutionModel: string;
     debuggingModel: string;
-    // Speech recognition is only supported for OpenAI right now.
+    // Speech recognition is supported for OpenAI (Whisper) and Gemini (Audio Understanding)
     speechRecognitionModel?: string;
   }
 > = {
@@ -60,6 +60,7 @@ export const DEFAULT_MODELS: Record<
     extractionModel: "gemini-3-flash-preview",
     solutionModel: "gemini-3-flash-preview",
     debuggingModel: "gemini-3-flash-preview",
+    speechRecognitionModel: "gemini-3-flash-preview",
   },
   anthropic: {
     extractionModel: "claude-3-7-sonnet-20250219",
diff --git a/src/components/Settings/SettingsDialog.tsx b/src/components/Settings/SettingsDialog.tsx
index 7cfb52f6..89342ed9 100644
--- a/src/components/Settings/SettingsDialog.tsx
+++ b/src/components/Settings/SettingsDialog.tsx
@@ -96,7 +96,7 @@ export function SettingsDialog({ open: externalOpen, onOpenChange }: SettingsDia
           setSpeechRecognitionModel(
             config.speechRecognitionModel ||
               providerDefaults.speechRecognitionModel ||
-              "whisper-1"
+              (config.apiProvider === "gemini" ? "gemini-3-flash-preview" : "whisper-1")
           );
           setCandidateProfile(config.candidateProfile || {
             name: "",
@@ -124,7 +124,8 @@ export function SettingsDialog({ open: externalOpen, onOpenChange }: SettingsDia
     setSolutionModel(defaults.solutionModel);
     setDebuggingModel(defaults.debuggingModel);
     setSpeechRecognitionModel(
-      defaults.speechRecognitionModel || "whisper-1"
+      defaults.speechRecognitionModel || 
+      (provider === "gemini" ? "gemini-3-flash-preview" : "whisper-1")
     );
   };
 
@@ -484,10 +485,62 @@ export function SettingsDialog({ open: externalOpen, onOpenChange }: SettingsDia
                   </div>
                 </div>
               </div>
+            ) : apiProvider === "gemini" ? (
+              <div className="space-y-2">
+                {/* Gemini speech recognition choices, rendered as one selectable card each */}
+                {[
+                  {
+                    id: "gemini-1.5-flash",
+                    name: "Gemini 1.5 Flash",
+                    description: "Fast and efficient audio understanding",
+                  },
+                  {
+                    id: "gemini-1.5-pro",
+                    name: "Gemini 1.5 Pro",
+                    description: "Higher accuracy audio understanding",
+                  },
+                  {
+                    id: "gemini-3-flash-preview",
+                    name: "Gemini 3 Flash (Preview)",
+                    description: "Latest preview model with audio understanding",
+                  },
+                  {
+                    id: "gemini-3-pro-preview",
+                    name: "Gemini 3 Pro (Preview)",
+                    description: "Best accuracy with audio understanding",
+                  },
+                ].map((option) => {
+                  // Highlight the card whose id matches the currently selected speech model
+                  const isSelected = speechRecognitionModel === option.id;
+                  return (
+                    <div
+                      key={option.id}
+                      className={`p-2 rounded-lg cursor-pointer transition-colors ${
+                        isSelected
+                          ? "bg-white/10 border border-white/20"
+                          : "bg-black/30 border border-white/5 hover:bg-white/5"
+                      }`}
+                      onClick={() => setSpeechRecognitionModel(option.id)}
+                    >
+                      <div className="flex items-center gap-2">
+                        <div
+                          className={`w-3 h-3 rounded-full ${
+                            isSelected ? "bg-white" : "bg-white/20"
+                          }`}
+                        />
+                        <div>
+                          <p className="font-medium text-white text-xs">{option.name}</p>
+                          <p className="text-xs text-white/60">{option.description}</p>
+                        </div>
+                      </div>
+                    </div>
+                  );
+                })}
+              </div>
             ) : (
               <div className="p-3 rounded-lg bg-black/30 border border-white/10">
                 <p className="text-sm text-white/70">
-                  Speech recognition is only supported with OpenAI. Please switch to OpenAI provider to use this feature.
+                  Speech recognition is only supported with OpenAI or Gemini. Please switch to one of these providers to use this feature.
                 </p>
               </div>
             )}

From b0aa78337347af6c00a3d792e786602187ffc04a Mon Sep 17 00:00:00 2001
From: Pratik Shankar Jadhav
 <44173994+pratikjadhav2726@users.noreply.github.com>
Date: Thu, 22 Jan 2026 02:40:17 -0800
Subject: [PATCH 13/13] feat: add answer model configuration to support AI
 answer suggestions across multiple providers

---
 electron/AnswerAssistant.ts                | 10 ++--
 electron/ConfigHelper.ts                   | 20 ++++++-
 electron/preload.ts                        |  2 +-
 shared/aiModels.ts                         | 66 +++++++++++++++++++++-
 src/components/Settings/SettingsDialog.tsx | 15 ++++-
 src/types/electron.d.ts                    |  4 +-
 6 files changed, 106 insertions(+), 11 deletions(-)

diff --git a/electron/AnswerAssistant.ts b/electron/AnswerAssistant.ts
index f5455c06..95461415 100644
--- a/electron/AnswerAssistant.ts
+++ b/electron/AnswerAssistant.ts
@@ -49,7 +49,6 @@ export class AnswerAssistant implements IAnswerAssistant {
   private openai: OpenAI | null = null;
   private geminiApiKey: string | null = null;
   private anthropic: Anthropic | null = null;
-  private readonly defaultModels: Record<APIProvider, string> = DEFAULT_ANSWER_MODELS;
 
   private formatProviderError(provider: "openai" | "gemini" | "anthropic", error: any, context: string): string {
     const status =
@@ -139,10 +138,13 @@ export class AnswerAssistant implements IAnswerAssistant {
 
     try {
       let suggestionsText = '';
+      
+      // Get the configured answer model, fallback to default if not set
+      const answerModel = config.answerModel || DEFAULT_ANSWER_MODELS[config.apiProvider];
 
       if (config.apiProvider === "openai" && this.openai) {
         const response = await this.openai.chat.completions.create({
-          model: this.defaultModels.openai,
+          model: answerModel,
           messages: [
             {
               role: 'system',
@@ -171,7 +173,7 @@ export class AnswerAssistant implements IAnswerAssistant {
         ];
 
         const response = await axios.default.post(
-          `https://generativelanguage.googleapis.com/v1beta/models/${this.defaultModels.gemini}:generateContent?key=${this.geminiApiKey}`,
+          `https://generativelanguage.googleapis.com/v1beta/models/${answerModel}:generateContent?key=${this.geminiApiKey}`,
           {
             contents: geminiMessages,
             generationConfig: {
@@ -187,7 +189,7 @@ export class AnswerAssistant implements IAnswerAssistant {
         }
       } else if (config.apiProvider === "anthropic" && this.anthropic) {
         const response = await this.anthropic.messages.create({
-          model: this.defaultModels.anthropic,
+          model: answerModel,
           max_tokens: 500,
           messages: [
             {
diff --git a/electron/ConfigHelper.ts b/electron/ConfigHelper.ts
index 13945d15..06d77ac8 100644
--- a/electron/ConfigHelper.ts
+++ b/electron/ConfigHelper.ts
@@ -23,6 +23,7 @@ interface Config {
   extractionModel: string;
   solutionModel: string;
   debuggingModel: string;
+  answerModel: string;  // Model for AI answer suggestions in conversations
   speechRecognitionModel: string;  // Speech recognition model (Whisper for OpenAI)
   language: string;
   opacity: number;
@@ -37,6 +38,7 @@ export class ConfigHelper extends EventEmitter {
     extractionModel: DEFAULT_MODELS[DEFAULT_PROVIDER].extractionModel,
     solutionModel: DEFAULT_MODELS[DEFAULT_PROVIDER].solutionModel,
     debuggingModel: DEFAULT_MODELS[DEFAULT_PROVIDER].debuggingModel,
+    answerModel: DEFAULT_MODELS[DEFAULT_PROVIDER].answerModel,
     speechRecognitionModel:
       DEFAULT_MODELS.openai.speechRecognitionModel || "whisper-1",
     language: "python",
@@ -113,6 +115,13 @@ export class ConfigHelper extends EventEmitter {
             "debuggingModel"
           );
         }
+        if (config.answerModel) {
+          config.answerModel = sanitizeModelSelection(
+            config.answerModel,
+            config.apiProvider,
+            "answerModel"
+          );
+        }
         
         // Ensure speechRecognitionModel is valid
         if (config.speechRecognitionModel) {
@@ -198,6 +207,7 @@ export class ConfigHelper extends EventEmitter {
         updates.extractionModel = defaults.extractionModel;
         updates.solutionModel = defaults.solutionModel;
         updates.debuggingModel = defaults.debuggingModel;
+        updates.answerModel = defaults.answerModel;
         // Speech recognition supported for OpenAI and Gemini
         if (defaults.speechRecognitionModel) {
           updates.speechRecognitionModel = defaults.speechRecognitionModel;
@@ -248,6 +258,13 @@ export class ConfigHelper extends EventEmitter {
           "debuggingModel"
         );
       }
+      if (updates.answerModel) {
+        updates.answerModel = sanitizeModelSelection(
+          updates.answerModel,
+          provider,
+          "answerModel"
+        );
+      }
       
       const newConfig = { ...currentConfig, ...updates };
       this.saveConfig(newConfig);
@@ -256,7 +273,8 @@ export class ConfigHelper extends EventEmitter {
       // This prevents re-initializing the AI client when only opacity changes
       if (updates.apiKey !== undefined || updates.apiProvider !== undefined || 
           updates.extractionModel !== undefined || updates.solutionModel !== undefined || 
-          updates.debuggingModel !== undefined || updates.speechRecognitionModel !== undefined || 
+          updates.debuggingModel !== undefined || updates.answerModel !== undefined ||
+          updates.speechRecognitionModel !== undefined || 
           updates.language !== undefined) {
         this.emit('config-updated', newConfig);
       }
diff --git a/electron/preload.ts b/electron/preload.ts
index 0b83247b..7feecb48 100644
--- a/electron/preload.ts
+++ b/electron/preload.ts
@@ -205,7 +205,7 @@ const electronAPI = {
   
   // New methods for OpenAI API integration
   getConfig: () => ipcRenderer.invoke("get-config"),
-  updateConfig: (config: { apiKey?: string; model?: string; language?: string; opacity?: number; apiProvider?: string; extractionModel?: string; solutionModel?: string; debuggingModel?: string; speechRecognitionModel?: string; candidateProfile?: any }) => 
+  updateConfig: (config: { apiKey?: string; model?: string; language?: string; opacity?: number; apiProvider?: string; extractionModel?: string; solutionModel?: string; debuggingModel?: string; answerModel?: string; speechRecognitionModel?: string; candidateProfile?: any }) => 
     ipcRenderer.invoke("update-config", config),
   onShowSettings: (callback: () => void) => {
     const subscription = () => callback()
diff --git a/shared/aiModels.ts b/shared/aiModels.ts
index f95a8b2b..583203b3 100644
--- a/shared/aiModels.ts
+++ b/shared/aiModels.ts
@@ -13,7 +13,8 @@ export type APIProvider = "openai" | "gemini" | "anthropic";
 export type ModelCategoryKey =
   | "extractionModel"
   | "solutionModel"
-  | "debuggingModel";
+  | "debuggingModel"
+  | "answerModel";
 
 export interface AIModel {
   id: string;
@@ -46,6 +47,7 @@ export const DEFAULT_MODELS: Record<
     extractionModel: string;
     solutionModel: string;
     debuggingModel: string;
+    answerModel: string;
     // Speech recognition is supported for OpenAI (Whisper) and Gemini (Audio Understanding)
     speechRecognitionModel?: string;
   }
@@ -54,18 +56,21 @@ export const DEFAULT_MODELS: Record<
     extractionModel: "gpt-4o",
     solutionModel: "gpt-4o",
     debuggingModel: "gpt-4o",
+    answerModel: "gpt-4o-mini",
     speechRecognitionModel: "whisper-1",
   },
   gemini: {
     extractionModel: "gemini-3-flash-preview",
     solutionModel: "gemini-3-flash-preview",
     debuggingModel: "gemini-3-flash-preview",
+    answerModel: "gemini-3-flash-preview",
     speechRecognitionModel: "gemini-3-flash-preview",
   },
   anthropic: {
     extractionModel: "claude-3-7-sonnet-20250219",
     solutionModel: "claude-3-7-sonnet-20250219",
     debuggingModel: "claude-3-7-sonnet-20250219",
+    answerModel: "claude-3-7-sonnet-20250219",
   },
 };
 
@@ -299,6 +304,65 @@ export const MODEL_CATEGORIES: ModelCategoryDefinition[] = [
       ],
     },
   },
+  {
+    key: "answerModel",
+    title: "Answer Suggestions",
+    description: "Model used to generate AI answer suggestions for conversation questions",
+    modelsByProvider: {
+      openai: [
+        {
+          id: "gpt-4o-mini",
+          name: "gpt-4o-mini",
+          description: "Fast and cost-effective for conversation suggestions",
+        },
+        {
+          id: "gpt-4o",
+          name: "gpt-4o",
+          description: "Best overall performance for answer suggestions",
+        },
+      ],
+      gemini: [
+        {
+          id: "gemini-3-flash-preview",
+          name: "Gemini 3 Flash (Preview)",
+          description: "Fast and efficient for conversation suggestions",
+        },
+        {
+          id: "gemini-3-pro-preview",
+          name: "Gemini 3 Pro (Preview)",
+          description: "Best performance for complex conversation contexts",
+        },
+        {
+          id: "gemini-1.5-pro",
+          name: "Gemini 1.5 Pro",
+          description: "Legacy model - use Gemini 3 for best results",
+        },
+        {
+          id: "gemini-1.5-flash",
+          name: "Gemini 1.5 Flash",
+          description: "Legacy model - use Gemini 3 Flash for best results",
+        },
+      ],
+      anthropic: [
+        {
+          id: "claude-3-7-sonnet-20250219",
+          name: "Claude 3.7 Sonnet",
+          description: "Best overall performance for answer suggestions",
+        },
+        {
+          id: "claude-3-5-sonnet-20241022",
+          name: "Claude 3.5 Sonnet",
+          description: "Balanced performance and speed",
+        },
+        {
+          id: "claude-3-opus-20240229",
+          name: "Claude 3 Opus",
+          description:
+            "Top-level intelligence, fluency, and understanding",
+        },
+      ],
+    },
+  },
 ];
 
 /**
diff --git a/src/components/Settings/SettingsDialog.tsx b/src/components/Settings/SettingsDialog.tsx
index 89342ed9..ab83895d 100644
--- a/src/components/Settings/SettingsDialog.tsx
+++ b/src/components/Settings/SettingsDialog.tsx
@@ -38,6 +38,9 @@ export function SettingsDialog({ open: externalOpen, onOpenChange }: SettingsDia
   const [debuggingModel, setDebuggingModel] = useState(
     DEFAULT_MODELS.openai.debuggingModel
   );
+  const [answerModel, setAnswerModel] = useState(
+    DEFAULT_MODELS.openai.answerModel
+  );
   const [speechRecognitionModel, setSpeechRecognitionModel] = useState("whisper-1");
   const [candidateProfile, setCandidateProfile] = useState<CandidateProfile>({
     name: "",
@@ -73,6 +76,7 @@ export function SettingsDialog({ open: externalOpen, onOpenChange }: SettingsDia
         extractionModel?: string;
         solutionModel?: string;
         debuggingModel?: string;
+        answerModel?: string;
         speechRecognitionModel?: string;
         candidateProfile?: CandidateProfile;
       }
@@ -93,6 +97,9 @@ export function SettingsDialog({ open: externalOpen, onOpenChange }: SettingsDia
           setDebuggingModel(
             config.debuggingModel || providerDefaults.debuggingModel
           );
+          setAnswerModel(
+            config.answerModel || providerDefaults.answerModel
+          );
           setSpeechRecognitionModel(
             config.speechRecognitionModel ||
               providerDefaults.speechRecognitionModel ||
@@ -123,6 +130,7 @@ export function SettingsDialog({ open: externalOpen, onOpenChange }: SettingsDia
     setExtractionModel(defaults.extractionModel);
     setSolutionModel(defaults.solutionModel);
     setDebuggingModel(defaults.debuggingModel);
+    setAnswerModel(defaults.answerModel);
     setSpeechRecognitionModel(
       defaults.speechRecognitionModel || 
       (provider === "gemini" ? "gemini-3-flash-preview" : "whisper-1")
@@ -138,6 +146,7 @@ export function SettingsDialog({ open: externalOpen, onOpenChange }: SettingsDia
         extractionModel,
         solutionModel,
         debuggingModel,
+        answerModel,
         speechRecognitionModel,
         candidateProfile,
       });
@@ -415,13 +424,15 @@ export function SettingsDialog({ open: externalOpen, onOpenChange }: SettingsDia
                       const currentValue = 
                         category.key === 'extractionModel' ? extractionModel :
                         category.key === 'solutionModel' ? solutionModel :
-                        debuggingModel;
+                        category.key === 'debuggingModel' ? debuggingModel :
+                        answerModel;
                       
                       // Determine which setter function to use
                       const setValue = 
                         category.key === 'extractionModel' ? setExtractionModel :
                         category.key === 'solutionModel' ? setSolutionModel :
-                        setDebuggingModel;
+                        category.key === 'debuggingModel' ? setDebuggingModel :
+                        setAnswerModel;
                         
                       return (
                         <div
diff --git a/src/types/electron.d.ts b/src/types/electron.d.ts
index 4a5e5725..7ee7cf6c 100644
--- a/src/types/electron.d.ts
+++ b/src/types/electron.d.ts
@@ -54,8 +54,8 @@ export interface ElectronAPI {
   getPlatform: () => string
   
   // New methods for OpenAI integration
-  getConfig: () => Promise<{ apiKey: string; model: string; apiProvider?: string; extractionModel?: string; solutionModel?: string; debuggingModel?: string; speechRecognitionModel?: string; candidateProfile?: any }>
-  updateConfig: (config: { apiKey?: string; model?: string; apiProvider?: string; extractionModel?: string; solutionModel?: string; debuggingModel?: string; speechRecognitionModel?: string; candidateProfile?: any }) => Promise<boolean>
+  getConfig: () => Promise<{ apiKey: string; model: string; apiProvider?: string; extractionModel?: string; solutionModel?: string; debuggingModel?: string; answerModel?: string; speechRecognitionModel?: string; candidateProfile?: any }>
+  updateConfig: (config: { apiKey?: string; model?: string; apiProvider?: string; extractionModel?: string; solutionModel?: string; debuggingModel?: string; answerModel?: string; speechRecognitionModel?: string; candidateProfile?: any }) => Promise<boolean>
   checkApiKey: () => Promise<boolean>
   validateApiKey: (apiKey: string) => Promise<{ valid: boolean; error?: string }>
   openLink: (url: string) => void