diff --git a/llama-index-core/llama_index/core/query_engine/multi_modal.py b/llama-index-core/llama_index/core/query_engine/multi_modal.py index 8ae118dcefe0202245d0448bd4faf04343d61070..168fb142620d4677306476ccb3e624ad4d68ac70 100644 --- a/llama-index-core/llama_index/core/query_engine/multi_modal.py +++ b/llama-index-core/llama_index/core/query_engine/multi_modal.py @@ -157,7 +157,7 @@ class SimpleMultiModalQueryEngine(BaseQueryEngine): ) llm_response = await self._multi_modal_llm.acomplete( prompt=fmt_prompt, - image_documents=image_nodes, + image_documents=[image_node.node for image_node in image_nodes], ) return Response( response=str(llm_response),