From 3cf27bb83828c4740df1391e70da9a74875e27e4 Mon Sep 17 00:00:00 2001 From: Elliot Kang <kkang2097@gmail.com> Date: Mon, 11 Sep 2023 14:55:50 -0700 Subject: [PATCH] Okay, should be final version. --- packages/core/src/OutputParser.ts | 52 ++++--------------------------- 1 file changed, 6 insertions(+), 46 deletions(-) diff --git a/packages/core/src/OutputParser.ts b/packages/core/src/OutputParser.ts index 11bd7f023..1498f3f00 100644 --- a/packages/core/src/OutputParser.ts +++ b/packages/core/src/OutputParser.ts @@ -56,54 +56,14 @@ class OutputParserError extends Error { function parseJsonMarkdown(text: string) { text = text.trim(); - const beginDelimiter = "```json"; - const endDelimiter = "```"; - - const beginIndex = text.indexOf(beginDelimiter); - const endIndex = text.indexOf( - endDelimiter, - beginIndex + beginDelimiter.length, - ); - //Scenario 1: LLM follows instruction format. However, it doesn't always do this. - if (!(beginIndex === -1 || endIndex === -1)) { - const jsonText = text.substring( - beginIndex + beginDelimiter.length, - endIndex, - ); - return JSON.parse(jsonText); - } - - //Scenario 2: LLM follows instruction format roughly, but doesn't do this exactly. - // For example: [```json] part was not returned, or there are irregular \n spaces. + //This code is more general than the previous version, and should be faster. + const beginIndex = text.indexOf("["); + const endIndex = text.lastIndexOf("]"); + const jsonText = text.substring(beginIndex, endIndex + 1); try { - //This isn't a JSON markdown, but we should try again with something else. - //Try to get data_str to be a list of JSON objects - const new_data_str: string[] = text - .replace("[", " ") - .replace("]", " ") - .replace("\n", " ") - .trim() - //Warning: This regex might be slow. - .split(/(?=},)/g); - const arr_length = new_data_str.length; - - //String formatting - //First to penultimate element - for (let i = 0; i < arr_length - 1; i++) { - new_data_str[i] += "}"; - } - //Second to final element - for (let i = 1; i < arr_length; i++) { - new_data_str[i] = new_data_str[i].replace("},", " "); - } - const output: object[] = new_data_str.map((item) => JSON.parse(item)); - return output; + return JSON.parse(jsonText); } catch (e) { - //In the worst case scenario and our options are exhausted, throw error. - throw new OutputParserError("Not a valid json", { - cause: e as Error, - output: text, - }); + throw new OutputParserError("Not a json markdown", { output: text }); } } -- GitLab