Refa: http API create dataset and test cases (#7393)

### What problem does this PR solve? This PR introduces Pydantic-based validation for the create dataset HTTP API, improving code clarity and robustness. Key changes include: 1. Pydantic Validation 2. Error Handling 3. Test Updates 4. Documentation ### Type of change - [x] Bug Fix (non-breaking change which fixes an issue) - [x] Documentation Update - [x] Refactoring
2026-01-23 11:36:38 +08:00 · 2025-04-29 16:53:57 +08:00
parent c88e4b3fc0
commit 78380fa181
11 changed files with 1239 additions and 812 deletions
--- a/api/utils/api_utils.py
+++ b/api/utils/api_utils.py
@ -322,6 +322,10 @@ def get_error_data_result(
    return jsonify(response)


+def get_error_argument_result(message="Invalid arguments"):
+    return get_result(code=settings.RetCode.ARGUMENT_ERROR, message=message)
+
+
 def generate_confirmation_token(tenant_id):
    serializer = URLSafeTimedSerializer(tenant_id)
    return "ragflow-" + serializer.dumps(get_uuid(), salt=tenant_id)[2:34]
@ -368,46 +372,34 @@ def get_parser_config(chunk_method, parser_config):
    return parser_config


-def get_data_openai(id=None, 
-                    created=None, 
-                    model=None, 
-                    prompt_tokens= 0, 
-                    completion_tokens=0, 
-                    content = None, 
-                    finish_reason= None,
-                    object="chat.completion",
-                    param=None,
+def get_data_openai(
+    id=None,
+    created=None,
+    model=None,
+    prompt_tokens=0,
+    completion_tokens=0,
+    content=None,
+    finish_reason=None,
+    object="chat.completion",
+    param=None,
 ):
-   
-    total_tokens= prompt_tokens + completion_tokens
+    total_tokens = prompt_tokens + completion_tokens
    return {
-        "id":f"{id}",
+        "id": f"{id}",
        "object": object,
        "created": int(time.time()) if created else None,
        "model": model,
-        "param":param,
+        "param": param,
        "usage": {
            "prompt_tokens": prompt_tokens,
            "completion_tokens": completion_tokens,
            "total_tokens": total_tokens,
-            "completion_tokens_details": {
-                "reasoning_tokens": 0,
-                "accepted_prediction_tokens": 0,
-                "rejected_prediction_tokens": 0
-            }
+            "completion_tokens_details": {"reasoning_tokens": 0, "accepted_prediction_tokens": 0, "rejected_prediction_tokens": 0},
        },
-        "choices": [
-            {
-                "message": {
-                    "role": "assistant",
-                    "content": content
-                },
-                "logprobs": None,
-                "finish_reason": finish_reason,
-                "index": 0
-            }
-        ]
-    } 
+        "choices": [{"message": {"role": "assistant", "content": content}, "logprobs": None, "finish_reason": finish_reason, "index": 0}],
+    }
+
+
 def valid_parser_config(parser_config):
    if not parser_config:
        return