From 6b9a2feac54710ab59ac2069fa7adc7474aa751c Mon Sep 17 00:00:00 2001
From: Ian Sinnott <3154865+iansinnott@users.noreply.github.com>
Date: Tue, 6 Feb 2024 16:52:29 +0800
Subject: [PATCH] Consistent Document IDs in NotionReader.ts (#519)

---
 packages/core/src/readers/NotionReader.ts | 6 +++++-
 1 file changed, 5 insertions(+), 1 deletion(-)

diff --git a/packages/core/src/readers/NotionReader.ts b/packages/core/src/readers/NotionReader.ts
index b7512c8cb..0b4569d8f 100644
--- a/packages/core/src/readers/NotionReader.ts
+++ b/packages/core/src/readers/NotionReader.ts
@@ -42,7 +42,11 @@ export class NotionReader implements BaseReader {
   toDocuments(pages: Pages): Document[] {
     return Object.values(pages).map((page) => {
       const text = pageToString(page);
-      return new Document({ text, metadata: page.metadata });
+      return new Document({
+        id_: page.metadata.id, // Use the Notion-provided UUID for the document
+        text,
+        metadata: page.metadata,
+      });
     });
   }
 
-- 
GitLab