// The maximum timeout in seconds to wait for the parsing to finish.
maxTimeout=2000;
// The result type for the parser.
resultType:ResultType="text";
// The interval in seconds to check if the parsing is done.
checkInterval=1;
// The maximum timeout in seconds to wait for the parsing to finish.
maxTimeout=2000;
// Whether to print the progress of the parsing.
verbose=true;
// The result type for the parser.
resultType:ResultType="text";
// The language of the text to parse.
language:Language="en";
// The parsing instruction for the parser.
parsingInstruction:string="";
// If set to true, the parser will ignore diagonal text (when the text rotation in degrees modulo 90 is not 0).
skipDiagonalText:boolean=false;
// If set to true, the cache will be ignored and the document re-processes. All document are kept in cache for 48hours after the job was completed to avoid processing the same document twice.
invalidateCache:boolean=false;
// The parsing instruction for the parser. Backend default is an empty string.
parsingInstruction?:string;
// Wether to ignore diagonal text (when the text rotation in degrees is not 0, 90, 180 or 270, so not a horizontal or vertical text). Backend default is false.
skipDiagonalText?:boolean;
// Wheter to ignore the cache and re-process the document. All documents are kept in cache for 48hours after the job was completed to avoid processing the same document twice. Backend default is false.
invalidateCache?:boolean;
// Wether the document should not be cached in the first place. Backend default is false.
doNotCache?:boolean;
// Wether to use a faster mode to extract text from documents. This mode will skip OCR of images, and table/heading reconstruction. Note: Non-compatible with gpt4oMode. Backend default is false.
fastMode?:boolean;
// Wether to keep column in the text according to document layout. Reduce reconstruction accuracy, and LLM's/embedings performances in most cases.
doNotUnrollColumns?:boolean;
// The page separator to use to split the text. Default is None, which means the parser will use the default separator '\\n---\\n'.
pageSeperator?:string;
// Whether to use gpt-4o to extract text from documents.
gpt4oMode:boolean=false;
// The API key for the GPT-4o API. Optional, lowers the cost of parsing. Can be set as an env variable: LLAMA_CLOUD_GPT4O_API_KEY.
...
...
@@ -162,14 +170,26 @@ export class LlamaParseReader extends FileReader {