Perf: test llm before RAPTOR. (#8897)

### What problem does this PR solve? ### Type of change - [x] Performance Improvement
2026-01-23 03:26:53 +08:00 · 2025-07-17 16:48:50 +08:00
parent 606bf20a3f
commit ecdb1701df
4 changed files with 22 additions and 12 deletions
--- a/graphrag/general/index.py
+++ b/graphrag/general/index.py
@ -20,7 +20,7 @@ import trio

 from api import settings
 from api.utils import get_uuid
-from api.utils.api_utils import timeout
+from api.utils.api_utils import timeout, is_strong_enough
 from graphrag.light.graph_extractor import GraphExtractor as LightKGExt
 from graphrag.general.graph_extractor import GraphExtractor as GeneralKGExt
 from graphrag.general.community_reports_extractor import CommunityReportsExtractor
@ -39,13 +39,6 @@ from rag.nlp import rag_tokenizer, search
 from rag.utils.redis_conn import RedisDistributedLock


-@timeout(30, 2)
-async def _is_strong_enough(chat_model, embedding_model):
-    _ = await trio.to_thread.run_sync(lambda: embedding_model.encode(["Are you strong enough!?"]))
-    res =  await trio.to_thread.run_sync(lambda: chat_model.chat("Nothing special.", [{"role":"user", "content": "Are you strong enough!?"}], {}))
-    if res.find("**ERROR**") >= 0:
-        raise Exception(res)
-

 async def run_graphrag(
    row: dict,
@ -57,9 +50,7 @@ async def run_graphrag(
    callback,
 ):
    # Pressure test for GraphRAG task
-    async with trio.open_nursery() as nursery:
-        for _ in range(12):
-            nursery.start_soon(_is_strong_enough, chat_model, embedding_model)
+    await is_strong_enough(chat_model, embedding_model)

    start = trio.current_time()
    tenant_id, kb_id, doc_id = row["tenant_id"], str(row["kb_id"]), row["doc_id"]