Skip to content
Snippets Groups Projects
Commit ff0e831d authored by Elliot Kang's avatar Elliot Kang
Browse files

Simplified OutputParser

parent b75e2d23
No related branches found
No related tags found
No related merge requests found
#!/usr/bin/env sh
. "$(dirname -- "$0")/_/husky.sh"
pnpm lint
#!/usr/bin/env sh
. "$(dirname -- "$0")/_/husky.sh"
pnpm test
......@@ -56,54 +56,14 @@ class OutputParserError extends Error {
function parseJsonMarkdown(text: string) {
text = text.trim();
const beginDelimiter = "```json";
const endDelimiter = "```";
const beginIndex = text.indexOf(beginDelimiter);
const endIndex = text.indexOf(
endDelimiter,
beginIndex + beginDelimiter.length,
);
//Scenario 1: LLM follows instruction format. However, it doesn't always do this.
if (!(beginIndex === -1 || endIndex === -1)) {
const jsonText = text.substring(
beginIndex + beginDelimiter.length,
endIndex,
);
return JSON.parse(jsonText);
}
//Scenario 2: LLM follows instruction format roughly, but doesn't do this exactly.
// For example: [```json] part was not returned, or there are irregular \n spaces.
//This code is more general than the previous version, and should be faster.
const beginIndex = text.indexOf("[");
const endIndex = text.lastIndexOf("]");
const jsonText = text.substring(beginIndex, endIndex + 1);
try {
//This isn't a JSON markdown, but we should try again with something else.
//Try to get data_str to be a list of JSON objects
const new_data_str: string[] = text
.replace("[", " ")
.replace("]", " ")
.replace("\n", " ")
.trim()
//Warning: This regex might be slow.
.split(/(?=},)/g);
const arr_length = new_data_str.length;
//String formatting
//First to penultimate element
for (let i = 0; i < arr_length - 1; i++) {
new_data_str[i] += "}";
}
//Second to final element
for (let i = 1; i < arr_length; i++) {
new_data_str[i] = new_data_str[i].replace("},", " ");
}
const output: object[] = new_data_str.map((item) => JSON.parse(item));
return output;
return JSON.parse(jsonText);
} catch (e) {
//In the worst case scenario and our options are exhausted, throw error.
throw new OutputParserError("Not a valid json", {
cause: e as Error,
output: text,
});
throw new OutputParserError("Not a json markdown", { output: text });
}
}
......
0% Loading or .
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or to comment