From c7de7c9aac40ad56ed9493c803d33e6973b975be Mon Sep 17 00:00:00 2001
From: saksham-jain177 <177sakshamjain@gmail.com>
Date: Mon, 29 Dec 2025 21:17:06 +0530
Subject: [PATCH] Make embedding device configurable instead of forcing GPU

---
 utils.py | 10 ++++++++--
 1 file changed, 8 insertions(+), 2 deletions(-)

diff --git a/utils.py b/utils.py
index 408e33d..1f33322 100644
--- a/utils.py
+++ b/utils.py
@@ -11,6 +11,7 @@ from transformers import BitsAndBytesConfig
 import torch, dotenv, os, gc
 
 from huggingface_hub import login
+import os
 
 dotenv.load_dotenv()
 
@@ -20,8 +21,13 @@ def set_device(gpu: int = None) -> str:
 
 # Sets embedding model using a hugging face embedding model for local embeddings.
 def set_embedding_model():
-    embed_model = HuggingFaceEmbedding(model_name="/home/jake/Programming/Models/embedding/multilingual-e5-large-instruct",
-                                       device=set_device(0), trust_remote_code=True)
+    device = os.getenv("EMBEDDING_DEVICE", "cpu")
+
+    embed_model = HuggingFaceEmbedding(
+        model_name="intfloat/multilingual-e5-large-instruct",
+        device=device,
+        trust_remote_code=True
+    )
     return embed_model
 
 # Function that configures Ollama models and sets some of the initial parameters