diff --git a/llama-index-core/llama_index/core/query_engine/multi_modal.py b/llama-index-core/llama_index/core/query_engine/multi_modal.py
index 8ae118dcefe0202245d0448bd4faf04343d61070..168fb142620d4677306476ccb3e624ad4d68ac70 100644
--- a/llama-index-core/llama_index/core/query_engine/multi_modal.py
+++ b/llama-index-core/llama_index/core/query_engine/multi_modal.py
@@ -157,7 +157,7 @@ class SimpleMultiModalQueryEngine(BaseQueryEngine):
         )
         llm_response = await self._multi_modal_llm.acomplete(
             prompt=fmt_prompt,
-            image_documents=image_nodes,
+            image_documents=[image_node.node for image_node in image_nodes],
         )
         return Response(
             response=str(llm_response),