From 8106cb5aa578c69bfb6cc788e3981063661b631d Mon Sep 17 00:00:00 2001
From: Baptiste Pasquier
Date: Thu, 2 May 2024 18:51:13 +0200
Subject: [PATCH] :bug: Fix handling of empty image list

---
 backend/rag_components/retriever.py    | 2 ++
 backend/rag_components/unstructured.py | 6 ++++++
 2 files changed, 8 insertions(+)

diff --git a/backend/rag_components/retriever.py b/backend/rag_components/retriever.py
index 9f0238c..d324249 100644
--- a/backend/rag_components/retriever.py
+++ b/backend/rag_components/retriever.py
@@ -72,6 +72,8 @@ def add_documents_multivector(
         raise ValueError(
             "The length of vectorstore_content and metadata_list must be the same"
         )
+    if len(vectorstore_content) == 0:
+        return
 
     if not isinstance(retriever, MultiVectorRetriever):
         raise ValueError("retriever must be a MultiVectorRetriever")
diff --git a/backend/rag_components/unstructured.py b/backend/rag_components/unstructured.py
index a54c5ed..62f0426 100644
--- a/backend/rag_components/unstructured.py
+++ b/backend/rag_components/unstructured.py
@@ -62,6 +62,12 @@ def select_images(
         if width < min_size[0] or height < min_size[1]:
             continue
 
+        if (
+            element.metadata.image_mime_type is None
+            or element.metadata.image_base64 is None
+        ):
+            continue
+
         image = Image(
             base64=element.metadata.image_base64,
             mime_type=element.metadata.image_mime_type,