From 1843c6d806702dc12bd771ac1362b6c3c2931ca2 Mon Sep 17 00:00:00 2001
From: James Zhao <3120325+jzcruiser@users.noreply.github.com>
Date: Thu, 8 Feb 2024 00:50:51 +0800
Subject: [PATCH] Fix ImportError in MetadataExtractionSEC.ipynb (pypdf
 missing) (#10491)

Update MetadataExtractionSEC.ipynb

Fix "ImportError: pypdf is required to read PDF files" by adding a notebook cell that installs pypdf before the PDF is loaded.
---
 .../metadata_extraction/MetadataExtractionSEC.ipynb   | 11 +++++++++++
 1 file changed, 11 insertions(+)

diff --git a/docs/examples/metadata_extraction/MetadataExtractionSEC.ipynb b/docs/examples/metadata_extraction/MetadataExtractionSEC.ipynb
index 15ee39c1a..3c2040905 100644
--- a/docs/examples/metadata_extraction/MetadataExtractionSEC.ipynb
+++ b/docs/examples/metadata_extraction/MetadataExtractionSEC.ipynb
@@ -173,6 +173,17 @@
     "!wget -O \"data/10k-vFinal.pdf\" \"https://www.dropbox.com/scl/fi/qn7g3vrk5mqb18ko4e5in/lyft.pdf?rlkey=j6jxtjwo8zbstdo4wz3ns8zoj&dl=1\""
    ]
   },
+  {
+   "cell_type": "code",
+   "execution_count": null,
+   "id": "2da91ecc-afef-409a-b94a-13e80aab6c6a",
+   "metadata": {},
+   "outputs": [],
+   "source": [
+    "# pypdf is required to read PDF files\n",
+    "!pip install pypdf"
+   ]
+  },
   {
    "cell_type": "code",
    "execution_count": null,
-- 
GitLab