diff --git a/llama-index-integrations/readers/llama-index-readers-file/llama_index/readers/file/docs/base.py b/llama-index-integrations/readers/llama-index-readers-file/llama_index/readers/file/docs/base.py index a2db764561e60c45f2a1a04deccd796990c0ff4f..a3c168d61e2f56fab4b8e82621c8b2a1341b5ae7 100644 --- a/llama-index-integrations/readers/llama-index-readers-file/llama_index/readers/file/docs/base.py +++ b/llama-index-integrations/readers/llama-index-readers-file/llama_index/readers/file/docs/base.py @@ -53,7 +53,7 @@ class PDFReader(BaseReader): # This block returns a whole PDF as a single Document if self.return_full_document: text = "" - metadata = {"file_name": fp.name} + metadata = {"file_name": file.name} for page in range(num_pages): # Extract the text from the page @@ -71,7 +71,7 @@ class PDFReader(BaseReader): page_text = pdf.pages[page].extract_text() page_label = pdf.page_labels[page] - metadata = {"page_label": page_label, "file_name": fp.name} + metadata = {"page_label": page_label, "file_name": file.name} if extra_info is not None: metadata.update(extra_info) diff --git a/llama-index-integrations/readers/llama-index-readers-file/pyproject.toml b/llama-index-integrations/readers/llama-index-readers-file/pyproject.toml index 71561c017a295f1efe4d7123a115534a6c676db4..92528f5930d3545a520e5414f45b935e908d6380 100644 --- a/llama-index-integrations/readers/llama-index-readers-file/pyproject.toml +++ b/llama-index-integrations/readers/llama-index-readers-file/pyproject.toml @@ -50,7 +50,7 @@ license = "MIT" maintainers = ["FarisHijazi", "Haowjy", "ephe-meral", "hursh-desai", "iamarunbrahma", "jon-chuang", "mmaatouk", "ravi03071991", "sangwongenip", "thejessezhang"] name = "llama-index-readers-file" readme = "README.md" -version = "0.1.11" +version = "0.1.12" [tool.poetry.dependencies] python = ">=3.8.1,<4.0"