diff --git a/rag/llm/embedding_model.py b/rag/llm/embedding_model.py index 17bb84ef5..dba11b7db 100644 --- a/rag/llm/embedding_model.py +++ b/rag/llm/embedding_model.py @@ -260,14 +260,16 @@ class OllamaEmbed(Base): tks_num = 0 for txt in texts: res = self.client.embeddings(prompt=txt, - model=self.model_name) + model=self.model_name, + options={"use_mmap": True}) arr.append(res["embedding"]) tks_num += 128 return np.array(arr), tks_num def encode_queries(self, text): res = self.client.embeddings(prompt=text, - model=self.model_name) + model=self.model_name, + options={"use_mmap": True}) return np.array(res["embedding"]), 128 @@ -834,4 +836,4 @@ class GPUStackEmbed(OpenAIEmbed): print(key,base_url) self.client = OpenAI(api_key=key, base_url=base_url) - self.model_name = model_name \ No newline at end of file + self.model_name = model_name