From f14616f7886d4a8c098a8e4496df543bc16935d6 Mon Sep 17 00:00:00 2001
From: rchan
Date: Thu, 13 Jun 2024 12:16:25 +0100
Subject: [PATCH] reduce batch size of sentence-transformer

---
 reginald/models/llama_index/llama_utils.py | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/reginald/models/llama_index/llama_utils.py b/reginald/models/llama_index/llama_utils.py
index 65e5a59..75209a1 100644
--- a/reginald/models/llama_index/llama_utils.py
+++ b/reginald/models/llama_index/llama_utils.py
@@ -91,7 +91,7 @@ def setup_settings(
     # initialise embedding model to use to create the index vectors
     embed_model = HuggingFaceEmbedding(
         model_name="sentence-transformers/all-mpnet-base-v2",
-        embed_batch_size=128,
+        embed_batch_size=64,
     )
 
     # construct the prompt helper