Refactor function name (#11210)

### What problem does this PR solve?

As the title says.

### Type of change

- [x] Refactoring

---------

Signed-off-by: Jin Hai <haijin.chn@gmail.com>
2026-02-03 00:55:10 +08:00 · 2025-11-12 19:00:15 +08:00
parent a36a0fe71c
commit 296476ab89
20 changed files with 105 additions and 103 deletions
--- a/rag/nlp/term_weight.py
+++ b/rag/nlp/term_weight.py
@@ -113,20 +113,20 @@ class Dealer:
                res.append(tk)
        return res

-    def tokenMerge(self, tks):
-        def oneTerm(t): return len(t) == 1 or re.match(r"[0-9a-z]{1,2}$", t)
+    def token_merge(self, tks):
+        def one_term(t): return len(t) == 1 or re.match(r"[0-9a-z]{1,2}$", t)

        res, i = [], 0
        while i < len(tks):
            j = i
-            if i == 0 and oneTerm(tks[i]) and len(
+            if i == 0 and one_term(tks[i]) and len(
                    tks) > 1 and (len(tks[i + 1]) > 1 and not re.match(r"[0-9a-zA-Z]", tks[i + 1])):  # 多 工位
                res.append(" ".join(tks[0:2]))
                i = 2
                continue

            while j < len(
-                    tks) and tks[j] and tks[j] not in self.stop_words and oneTerm(tks[j]):
+                    tks) and tks[j] and tks[j] not in self.stop_words and one_term(tks[j]):
                j += 1
            if j - i > 1:
                if j - i < 5:
@@ -232,7 +232,7 @@ class Dealer:
            tw = list(zip(tks, wts))
        else:
            for tk in tks:
-                tt = self.tokenMerge(self.pretoken(tk, True))
+                tt = self.token_merge(self.pretoken(tk, True))
                idf1 = np.array([idf(freq(t), 10000000) for t in tt])
                idf2 = np.array([idf(df(t), 1000000000) for t in tt])
                wts = (0.3 * idf1 + 0.7 * idf2) * \