feat(parsers): Enhance parsers to deal with some thinking models better.

2025-05-08 00:20:31 -06:00 · 2025-05-08 00:20:31 -06:00 · 3b547251c2
commit 3b547251c2
parent bdace57cfd
4 changed files with 32 additions and 0 deletions
--- a/src/lib/chains/suggestionGeneratorAgent.ts
+++ b/src/lib/chains/suggestionGeneratorAgent.ts
@ -10,6 +10,7 @@ const suggestionGeneratorPrompt = `
 You are an AI suggestion generator for an AI powered search engine. You will be given a conversation below. You need to generate 4-5 suggestions based on the conversation. The suggestion should be relevant to the conversation that can be used by the user to ask the chat model for more information.
 You need to make sure the suggestions are relevant to the conversation and are helpful to the user. Keep a note that the user might use these suggestions to ask a chat model for more information. 
 Make sure the suggestions are medium in length and are informative and relevant to the conversation.
+If you are a thinking or reasoning AI, you should avoid using \`<suggestions>\` and \`</suggestions>\` tags in your thinking. Those tags should only be used in the final output.

 Provide these suggestions separated by newlines between the XML tags <suggestions> and </suggestions>. For example:

--- a/src/lib/outputParsers/lineOutputParser.ts
+++ b/src/lib/outputParsers/lineOutputParser.ts
@ -21,6 +21,10 @@ class LineOutputParser extends BaseOutputParser<string> {
  async parse(text: string): Promise<string> {
    text = text.trim() || '';

+    // First, remove all <think>...</think> blocks to avoid parsing tags inside thinking content
+    // This might be a little aggressive. Prompt massaging might be all we need, but this is a guarantee and should rarely mess anything up.
+    text = this.removeThinkingBlocks(text);
+
    const regex = /^(\s*(-|\*|\d+\.\s|\d+\)\s|\u2022)\s*)+/;
    const startKeyIndex = text.indexOf(`<${this.key}>`);
    const endKeyIndex = text.indexOf(`</${this.key}>`);
@ -40,6 +44,17 @@ class LineOutputParser extends BaseOutputParser<string> {
    return line;
  }

+  /**
+   * Removes all content within <think>...</think> blocks
+   * @param text The input text containing thinking blocks
+   * @returns The text with all thinking blocks removed
+   */
+  private removeThinkingBlocks(text: string): string {
+    // Use regex to identify and remove all <think>...</think> blocks
+    // Using the 's' flag to make dot match newlines
+    return text.replace(/<think>[\s\S]*?<\/think>/g, '').trim();
+  }
+
  getFormatInstructions(): string {
    throw new Error('Not implemented.');
  }
--- a/src/lib/outputParsers/listLineOutputParser.ts
+++ b/src/lib/outputParsers/listLineOutputParser.ts
@ -21,6 +21,10 @@ class LineListOutputParser extends BaseOutputParser<string[]> {
  async parse(text: string): Promise<string[]> {
    text = text.trim() || '';

+    // First, remove all <think>...</think> blocks to avoid parsing tags inside thinking content
+    // This might be a little aggressive. Prompt massaging might be all we need, but this is a guarantee and should rarely mess anything up.
+    text = this.removeThinkingBlocks(text);
+
    const regex = /^(\s*(-|\*|\d+\.\s|\d+\)\s|\u2022)\s*)+/;
    const startKeyIndex = text.indexOf(`<${this.key}>`);
    const endKeyIndex = text.indexOf(`</${this.key}>`);
@ -42,6 +46,17 @@ class LineListOutputParser extends BaseOutputParser<string[]> {
    return lines;
  }

+  /**
+   * Removes all content within <think>...</think> blocks
+   * @param text The input text containing thinking blocks
+   * @returns The text with all thinking blocks removed
+   */
+  private removeThinkingBlocks(text: string): string {
+    // Use regex to identify and remove all <think>...</think> blocks
+    // Using [\s\S] pattern to match all characters including newlines
+    return text.replace(/<think>[\s\S]*?<\/think>/g, '').trim();
+  }
+
  getFormatInstructions(): string {
    throw new Error('Not implemented.');
  }
--- a/src/lib/prompts/webSearch.ts
+++ b/src/lib/prompts/webSearch.ts
@ -3,6 +3,7 @@ You are an AI question rephraser. You will be given a conversation and a follow-
 If it is a simple writing task or a greeting (unless the greeting contains a question after it) like Hi, Hello, How are you, etc. than a question then you need to return \`not_needed\` as the response (This is because the LLM won't need to search the web for finding information on this topic).
 If the user asks some question from some URL or wants you to summarize a PDF or a webpage (via URL) you need to return the links inside the \`links\` XML block and the question inside the \`question\` XML block. If the user wants to you to summarize the webpage or the PDF you need to return \`summarize\` inside the \`question\` XML block in place of a question and the link to summarize in the \`links\` XML block.
 You must always return the rephrased question inside the \`question\` XML block, if there are no links in the follow-up question then don't insert a \`links\` XML block in your response.
+If you are a thinking or reasoning AI, you should avoid using \`<question>\` and \`</question>\` tags in your thinking. Those tags should only be used in the final output. You should also avoid using \`<links>\` and \`</links>\` tags in your thinking. Those tags should only be used in the final output.

 There are several examples attached for your reference inside the below \`examples\` XML block