Add test for API (#3134)

### What problem does this PR solve?

Add test for API

### Type of change

- [x] New Feature (non-breaking change which adds functionality)

---------

Co-authored-by: liuhua <10215101452@stu.ecun.edu.cn>
Co-authored-by: Zhichang Yu <yuzhichang@gmail.com>
2026-01-30 23:26:36 +08:00 · 2024-11-01 22:59:17 +08:00
parent 7eafccf78a
commit 44ad9a6cd7
10 changed files with 292 additions and 355 deletions
--- a/api/db/services/document_service.py
+++ b/api/db/services/document_service.py
@@ -52,11 +52,15 @@ class DocumentService(CommonService):
    @classmethod
    @DB.connection_context()
    def get_list(cls, kb_id, page_number, items_per_page,
-                     orderby, desc, keywords, id):
-        docs =cls.model.select().where(cls.model.kb_id==kb_id)
+                 orderby, desc, keywords, id, name):
+        docs = cls.model.select().where(cls.model.kb_id == kb_id)
        if id:
            docs = docs.where(
-                cls.model.id== id )
+                cls.model.id == id)
+        if name:
+            docs = docs.where(
+                cls.model.name == name
+            )
        if keywords:
            docs = docs.where(
                fn.LOWER(cls.model.name).contains(keywords.lower())
@@ -70,7 +74,6 @@ class DocumentService(CommonService):
        count = docs.count()
        return list(docs.dicts()), count

-
    @classmethod
    @DB.connection_context()
    def get_by_kb_id(cls, kb_id, page_number, items_per_page,
@@ -162,26 +165,27 @@ class DocumentService(CommonService):
            cls.model.update_time]
        docs = cls.model.select(*fields) \
            .join(Knowledgebase, on=(cls.model.kb_id == Knowledgebase.id)) \
-            .join(Tenant, on=(Knowledgebase.tenant_id == Tenant.id))\
+            .join(Tenant, on=(Knowledgebase.tenant_id == Tenant.id)) \
            .where(
-                cls.model.status == StatusEnum.VALID.value,
-                ~(cls.model.type == FileType.VIRTUAL.value),
-                cls.model.progress == 0,
-                cls.model.update_time >= current_timestamp() - 1000 * 600,
-                cls.model.run == TaskStatus.RUNNING.value)\
+            cls.model.status == StatusEnum.VALID.value,
+            ~(cls.model.type == FileType.VIRTUAL.value),
+            cls.model.progress == 0,
+            cls.model.update_time >= current_timestamp() - 1000 * 600,
+            cls.model.run == TaskStatus.RUNNING.value) \
            .order_by(cls.model.update_time.asc())
        return list(docs.dicts())

    @classmethod
    @DB.connection_context()
    def get_unfinished_docs(cls):
-        fields = [cls.model.id, cls.model.process_begin_at, cls.model.parser_config, cls.model.progress_msg, cls.model.run]
+        fields = [cls.model.id, cls.model.process_begin_at, cls.model.parser_config, cls.model.progress_msg,
+                  cls.model.run]
        docs = cls.model.select(*fields) \
            .where(
-                cls.model.status == StatusEnum.VALID.value,
-                ~(cls.model.type == FileType.VIRTUAL.value),
-                cls.model.progress < 1,
-                cls.model.progress > 0)
+            cls.model.status == StatusEnum.VALID.value,
+            ~(cls.model.type == FileType.VIRTUAL.value),
+            cls.model.progress < 1,
+            cls.model.progress > 0)
        return list(docs.dicts())

    @classmethod
@@ -196,12 +200,12 @@ class DocumentService(CommonService):
                "Document not found which is supposed to be there")
        num = Knowledgebase.update(
            token_num=Knowledgebase.token_num +
-            token_num,
+                      token_num,
            chunk_num=Knowledgebase.chunk_num +
-            chunk_num).where(
+                      chunk_num).where(
            Knowledgebase.id == kb_id).execute()
        return num
-    
+
    @classmethod
    @DB.connection_context()
    def decrement_chunk_num(cls, doc_id, kb_id, token_num, chunk_num, duation):
@@ -214,13 +218,13 @@ class DocumentService(CommonService):
                "Document not found which is supposed to be there")
        num = Knowledgebase.update(
            token_num=Knowledgebase.token_num -
-            token_num,
+                      token_num,
            chunk_num=Knowledgebase.chunk_num -
-            chunk_num
+                      chunk_num
        ).where(
            Knowledgebase.id == kb_id).execute()
        return num
-    
+
    @classmethod
    @DB.connection_context()
    def clear_chunk_num(cls, doc_id):
@@ -229,10 +233,10 @@ class DocumentService(CommonService):

        num = Knowledgebase.update(
            token_num=Knowledgebase.token_num -
-            doc.token_num,
+                      doc.token_num,
            chunk_num=Knowledgebase.chunk_num -
-            doc.chunk_num,
-            doc_num=Knowledgebase.doc_num-1
+                      doc.chunk_num,
+            doc_num=Knowledgebase.doc_num - 1
        ).where(
            Knowledgebase.id == doc.kb_id).execute()
        return num
@@ -243,8 +247,8 @@ class DocumentService(CommonService):
        docs = cls.model.select(
            Knowledgebase.tenant_id).join(
            Knowledgebase, on=(
-                Knowledgebase.id == cls.model.kb_id)).where(
-                cls.model.id == doc_id, Knowledgebase.status == StatusEnum.VALID.value)
+                    Knowledgebase.id == cls.model.kb_id)).where(
+            cls.model.id == doc_id, Knowledgebase.status == StatusEnum.VALID.value)
        docs = docs.dicts()
        if not docs:
            return
@@ -270,8 +274,8 @@ class DocumentService(CommonService):
            cls.model.id).join(
            Knowledgebase, on=(
                    Knowledgebase.id == cls.model.kb_id)
-            ).join(UserTenant, on=(UserTenant.tenant_id == Knowledgebase.tenant_id)
-            ).where(cls.model.id == doc_id, UserTenant.user_id == user_id).paginate(0, 1)
+        ).join(UserTenant, on=(UserTenant.tenant_id == Knowledgebase.tenant_id)
+               ).where(cls.model.id == doc_id, UserTenant.user_id == user_id).paginate(0, 1)
        docs = docs.dicts()
        if not docs:
            return False
@@ -284,7 +288,7 @@ class DocumentService(CommonService):
            cls.model.id).join(
            Knowledgebase, on=(
                    Knowledgebase.id == cls.model.kb_id)
-            ).where(cls.model.id == doc_id, Knowledgebase.created_by == user_id).paginate(0, 1)
+        ).where(cls.model.id == doc_id, Knowledgebase.created_by == user_id).paginate(0, 1)
        docs = docs.dicts()
        if not docs:
            return False
@@ -296,13 +300,13 @@ class DocumentService(CommonService):
        docs = cls.model.select(
            Knowledgebase.embd_id).join(
            Knowledgebase, on=(
-                Knowledgebase.id == cls.model.kb_id)).where(
-                cls.model.id == doc_id, Knowledgebase.status == StatusEnum.VALID.value)
+                    Knowledgebase.id == cls.model.kb_id)).where(
+            cls.model.id == doc_id, Knowledgebase.status == StatusEnum.VALID.value)
        docs = docs.dicts()
        if not docs:
            return
        return docs[0]["embd_id"]
-    
+
    @classmethod
    @DB.connection_context()
    def get_doc_id_by_doc_name(cls, doc_name):
@@ -338,6 +342,7 @@ class DocumentService(CommonService):
                    dfs_update(old[k], v)
                else:
                    old[k] = v
+
        dfs_update(d.parser_config, config)
        cls.update_by_id(id, {"parser_config": d.parser_config})

@@ -372,7 +377,7 @@ class DocumentService(CommonService):
                finished = True
                bad = 0
                e, doc = DocumentService.get_by_id(d["id"])
-                status = doc.run#TaskStatus.RUNNING.value
+                status = doc.run  # TaskStatus.RUNNING.value
                for t in tsks:
                    if 0 <= t.progress < 1:
                        finished = False
@@ -386,9 +391,10 @@ class DocumentService(CommonService):
                    prg = -1
                    status = TaskStatus.FAIL.value
                elif finished:
-                    if d["parser_config"].get("raptor", {}).get("use_raptor") and d["progress_msg"].lower().find(" raptor")<0:
+                    if d["parser_config"].get("raptor", {}).get("use_raptor") and d["progress_msg"].lower().find(
+                            " raptor") < 0:
                        queue_raptor_tasks(d)
-                        prg = 0.98 * len(tsks)/(len(tsks)+1)
+                        prg = 0.98 * len(tsks) / (len(tsks) + 1)
                        msg.append("------ RAPTOR -------")
                    else:
                        status = TaskStatus.DONE.value
@@ -414,7 +420,6 @@ class DocumentService(CommonService):
        return len(cls.model.select(cls.model.id).where(
            cls.model.kb_id == kb_id).dicts())

-
    @classmethod
    @DB.connection_context()
    def do_cancel(cls, doc_id):
@@ -579,4 +584,4 @@ def doc_upload_and_parse(conversation_id, file_objs, user_id):
        DocumentService.increment_chunk_num(
            doc_id, kb.id, token_counts[doc_id], chunk_counts[doc_id], 0)

-    return [d["id"] for d,_ in files]
+    return [d["id"] for d, _ in files]