enh: embedding_batch_size for local embedding engine

This commit is contained in:
Timothy Jaeryang Baek
2026-01-01 16:06:42 +04:00
parent d3ee3fd23e
commit e4a5b06ca6
2 changed files with 19 additions and 17 deletions

View File

@@ -795,7 +795,9 @@ def get_embedding_function(
return await asyncio.to_thread(
(
lambda query, prefix=None: embedding_function.encode(
- query, **({"prompt": prefix} if prefix else {})
+ query,
+ batch_size=int(embedding_batch_size),
+ **({"prompt": prefix} if prefix else {}),
).tolist()
),
query,

View File

@@ -950,24 +950,24 @@
</div>
</div>
- {#if RAG_EMBEDDING_ENGINE === 'ollama' || RAG_EMBEDDING_ENGINE === 'openai' || RAG_EMBEDDING_ENGINE === 'azure_openai'}
- <div class=" mb-2.5 flex w-full justify-between">
- <div class=" self-center text-xs font-medium">
- {$i18n.t('Embedding Batch Size')}
- </div>
- <div class="">
- <input
- bind:value={RAG_EMBEDDING_BATCH_SIZE}
- type="number"
- class=" bg-transparent text-center w-14 outline-none"
- min="-2"
- max="16000"
- step="1"
- />
- </div>
+ <div class=" mb-2.5 flex w-full justify-between">
+ <div class=" self-center text-xs font-medium">
+ {$i18n.t('Embedding Batch Size')}
+ </div>
+ <div class="">
+ <input
+ bind:value={RAG_EMBEDDING_BATCH_SIZE}
+ type="number"
+ class=" bg-transparent text-center w-14 outline-none"
+ min="-2"
+ max="16000"
+ step="1"
+ />
</div>
+ </div>
+ {#if RAG_EMBEDDING_ENGINE === 'ollama' || RAG_EMBEDDING_ENGINE === 'openai' || RAG_EMBEDDING_ENGINE === 'azure_openai'}
<div class=" mb-2.5 flex w-full justify-between">
<div class="self-center text-xs font-medium">
<Tooltip