Fix: Reduce excessive IO operations by loading LLM factory configurations (#6047)

…ions ### What problem does this PR solve? This PR fixes an issue where the application was repeatedly reading the llm_factories.json file from disk in multiple places, which could lead to "Too many open files" errors under high load conditions. The fix centralizes the file reading operation in the settings.py module and stores the data in a global variable that can be accessed by other modules. ### Type of change - [x] Bug Fix (non-breaking change which fixes an issue) - [ ] New Feature (non-breaking change which adds functionality) - [ ] Documentation Update - [ ] Refactoring - [x] Performance Improvement - [ ] Other (please describe):
2026-01-30 15:16:45 +08:00 · 2025-03-14 09:54:38 +08:00
parent 47926f7d21
commit 2d4a60cae6
4 changed files with 18 additions and 17 deletions
--- a/api/settings.py
+++ b/api/settings.py
@ -16,6 +16,7 @@
 import os
 from datetime import date
 from enum import IntEnum, Enum
+import json
 import rag.utils.es_conn
 import rag.utils.infinity_conn

@ -24,6 +25,7 @@ from rag.nlp import search
 from graphrag import search as kg_search
 from api.utils import get_base_config, decrypt_database_config
 from api.constants import RAG_FLOW_SERVICE_NAME
+from api.utils.file_utils import get_project_base_directory

 LIGHTEN = int(os.environ.get('LIGHTEN', "0"))

@ -40,6 +42,7 @@ PARSERS = None
 HOST_IP = None
 HOST_PORT = None
 SECRET_KEY = None
+FACTORY_LLM_INFOS = None

 DATABASE_TYPE = os.getenv("DB_TYPE", 'mysql')
 DATABASE = decrypt_database_config(name=DATABASE_TYPE)
@ -61,7 +64,7 @@ kg_retrievaler = None


 def init_settings():
-    global LLM, LLM_FACTORY, LLM_BASE_URL, LIGHTEN, DATABASE_TYPE, DATABASE
+    global LLM, LLM_FACTORY, LLM_BASE_URL, LIGHTEN, DATABASE_TYPE, DATABASE, FACTORY_LLM_INFOS
    LIGHTEN = int(os.environ.get('LIGHTEN', "0"))
    DATABASE_TYPE = os.getenv("DB_TYPE", 'mysql')
    DATABASE = decrypt_database_config(name=DATABASE_TYPE)
@ -69,6 +72,12 @@ def init_settings():
    LLM_DEFAULT_MODELS = LLM.get("default_models", {})
    LLM_FACTORY = LLM.get("factory", "Tongyi-Qianwen")
    LLM_BASE_URL = LLM.get("base_url")
+    
+    try:
+        with open(os.path.join(get_project_base_directory(), "conf", "llm_factories.json"), "r") as f:
+            FACTORY_LLM_INFOS = json.load(f)["factory_llm_infos"]
+    except Exception:
+        FACTORY_LLM_INFOS = []

    global CHAT_MDL, EMBEDDING_MDL, RERANK_MDL, ASR_MDL, IMAGE2TEXT_MDL
    if not LIGHTEN: