From 323df2b50e05b71c095a54dbb098e0da643304aa Mon Sep 17 00:00:00 2001
From: George Burton
Date: Wed, 11 Sep 2024 16:09:32 +0100
Subject: [PATCH 1/2] added images to file types

---
 django_app/redbox_app/redbox_core/views/document_views.py | 3 +++
 1 file changed, 3 insertions(+)

diff --git a/django_app/redbox_app/redbox_core/views/document_views.py b/django_app/redbox_app/redbox_core/views/document_views.py
index 8390c5e59..3e3d1adf0 100644
--- a/django_app/redbox_app/redbox_core/views/document_views.py
+++ b/django_app/redbox_app/redbox_core/views/document_views.py
@@ -43,6 +43,9 @@
     ".tsv",
     ".xlsx",
     ".htm",
+    ".bmp",
+    ".jpeg",
+    ".png",
 ]
 
 MAX_FILE_SIZE = 209715200  # 200 MB or 200 * 1024 * 1024
From 2f20278ce52245da3c917b8623ec3ffa5c5e8729 Mon Sep 17 00:00:00 2001
From: George Burton
Date: Wed, 11 Sep 2024 16:40:47 +0100
Subject: [PATCH 2/2] removed fast strategy

---
NOTE(review): the first hunk below originally re-added ".jpeg", which is
already in the list (see the context lines of the same hunk), so it was a
no-op duplicate. It now adds ".jpg", assuming that was the intended
extension; please confirm. The post-image blob id on the index line was not
recomputed for this change.
NOTE(review): leading whitespace of the context lines in this series was
reconstructed from a whitespace-collapsed copy; confirm it against the
target files before applying (or apply with whitespace-insensitive matching).

 django_app/redbox_app/redbox_core/views/document_views.py | 1 +
 redbox-core/redbox/loader/loaders.py                      | 1 -
 2 files changed, 1 insertion(+), 1 deletion(-)

diff --git a/django_app/redbox_app/redbox_core/views/document_views.py b/django_app/redbox_app/redbox_core/views/document_views.py
index 3e3d1adf0..a1a81fed5 100644
--- a/django_app/redbox_app/redbox_core/views/document_views.py
+++ b/django_app/redbox_app/redbox_core/views/document_views.py
@@ -46,6 +46,7 @@
     ".bmp",
     ".jpeg",
     ".png",
+    ".jpg",
 ]
 
 MAX_FILE_SIZE = 209715200  # 200 MB or 200 * 1024 * 1024
diff --git a/redbox-core/redbox/loader/loaders.py b/redbox-core/redbox/loader/loaders.py
index 30407935d..829f5eb64 100644
--- a/redbox-core/redbox/loader/loaders.py
+++ b/redbox-core/redbox/loader/loaders.py
@@ -52,7 +52,6 @@ def lazy_load(self, file_name: str, file_bytes: BytesIO) -> Iterator[Document]:
             url,
             files=files,
             data={
-                "strategy": "fast",
                 "chunking_strategy": "by_title",
                 "max_characters": self._max_chunk_size,
                 "combine_under_n_chars": self._min_chunk_size,