diff --git a/docs/examples/metadata_extraction/MetadataExtractionSEC.ipynb b/docs/examples/metadata_extraction/MetadataExtractionSEC.ipynb
index 15ee39c1a0dda240dcde18e1d1cac2ffef1f5252..3c20409051797efc688fff127270046120760f6b 100644
--- a/docs/examples/metadata_extraction/MetadataExtractionSEC.ipynb
+++ b/docs/examples/metadata_extraction/MetadataExtractionSEC.ipynb
@@ -173,6 +173,17 @@
     "!wget -O \"data/10k-vFinal.pdf\" \"https://www.dropbox.com/scl/fi/qn7g3vrk5mqb18ko4e5in/lyft.pdf?rlkey=j6jxtjwo8zbstdo4wz3ns8zoj&dl=1\""
    ]
   },
+  {
+   "cell_type": "code",
+   "execution_count": null,
+   "id": "2da91ecc-afef-409a-b94a-13e80aab6c6a",
+   "metadata": {},
+   "outputs": [],
+   "source": [
+    "# pypdf is required to read PDF files; %pip (rather than !pip) installs it into the running kernel's environment\n",
+    "%pip install pypdf"
+   ]
+  },
   {
    "cell_type": "code",
    "execution_count": null,