Cache the LLM results for graphrag and raptor (#4051)

### What problem does this PR solve?

#4045

### Type of change

- [x] New Feature (non-breaking change which adds functionality)
Author: Kevin Hu
Date: 2024-12-17 09:48:03 +08:00 (committed by GitHub)
Parent: 8ea631a2a0
Commit: cb6e9ce164
12 changed files with 161 additions and 38 deletions


```diff
@@ -16,6 +16,7 @@ from typing import Any
 import tiktoken
 
 from graphrag.claim_prompt import CLAIM_EXTRACTION_PROMPT, CONTINUE_PROMPT, LOOP_PROMPT
+from graphrag.extractor import Extractor
 from rag.llm.chat_model import Base as CompletionLLM
 from graphrag.utils import ErrorHandlerFn, perform_variable_replacements
@@ -33,10 +34,9 @@ class ClaimExtractorResult:
     source_docs: dict[str, Any]
 
 
-class ClaimExtractor:
+class ClaimExtractor(Extractor):
     """Claim extractor class definition."""
 
-    _llm: CompletionLLM
     _extraction_prompt: str
     _summary_prompt: str
     _output_formatter_prompt: str
@@ -169,7 +169,7 @@ class ClaimExtractor:
         }
         text = perform_variable_replacements(self._extraction_prompt, variables=variables)
         gen_conf = {"temperature": 0.5}
-        results = self._llm.chat(text, [{"role": "user", "content": "Output:"}], gen_conf)
+        results = self._chat(text, [{"role": "user", "content": "Output:"}], gen_conf)
         claims = results.strip().removesuffix(completion_delimiter)
         history = [{"role": "system", "content": text}, {"role": "assistant", "content": results}]
@@ -177,7 +177,7 @@
         for i in range(self._max_gleanings):
             text = perform_variable_replacements(CONTINUE_PROMPT, history=history, variables=variables)
             history.append({"role": "user", "content": text})
-            extension = self._llm.chat("", history, gen_conf)
+            extension = self._chat("", history, gen_conf)
             claims += record_delimiter + extension.strip().removesuffix(
                 completion_delimiter
             )
@@ -188,7 +188,7 @@
             history.append({"role": "assistant", "content": extension})
             history.append({"role": "user", "content": LOOP_PROMPT})
-            continuation = self._llm.chat("", history, self._loop_args)
+            continuation = self._chat("", history, self._loop_args)
             if continuation != "YES":
                 break
```
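
The hunks above only switch the call sites from `self._llm.chat(...)` to the inherited `self._chat(...)`; the caching itself lives in the new `graphrag.extractor.Extractor` base class, which this excerpt does not show. Below is a minimal sketch of what such a caching wrapper could look like, assuming a plain in-memory dict as the cache backend (the `_llm_cache` name and the hashing scheme are illustrative assumptions, not the PR's actual implementation):

```python
import hashlib
import json


class Extractor:
    """Illustrative sketch only; the real base class lives in
    graphrag/extractor.py, which is not part of this excerpt."""

    _llm = None            # chat model exposing .chat(system, history, gen_conf)
    _llm_cache: dict = {}  # assumed in-memory cache; the PR may use a shared store

    def _chat(self, system: str, history: list, gen_conf: dict) -> str:
        # Key the cache on everything that can change the completion:
        # system prompt, conversation history, and generation config.
        key = hashlib.md5(
            json.dumps([system, history, gen_conf], sort_keys=True).encode("utf-8")
        ).hexdigest()
        cached = self._llm_cache.get(key)
        if cached is not None:
            return cached  # cache hit: skip the LLM call entirely
        response = self._llm.chat(system, history, gen_conf)
        self._llm_cache[key] = response
        return response
```

Funneling every completion through one `_chat` choke point is what lets both the graphrag extractors and the raptor pipeline pick up caching without touching their prompt logic: re-running a failed or repeated extraction replays cached turns (including the per-gleaning continuation checks) instead of paying for the LLM calls again.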