Change knowledge base to dataset (#11976)

### What problem does this PR solve?

As title

### Type of change

- [x] Refactoring

---------

Signed-off-by: Jin Hai <haijin.chn@gmail.com>
2026-02-04 01:25:07 +08:00 · 2025-12-17 10:03:33 +08:00
parent 4d46726eb7
commit 30019dab9f
35 changed files with 92 additions and 92 deletions
--- a/rag/benchmark.py
+++ b/rag/benchmark.py
@@ -283,7 +283,7 @@ if __name__ == '__main__':
    print('*****************RAGFlow Benchmark*****************')
    parser = argparse.ArgumentParser(usage="benchmark.py <max_docs> <kb_id> <dataset> <dataset_path> [<miracl_corpus_path>])", description='RAGFlow Benchmark')
    parser.add_argument('max_docs', metavar='max_docs', type=int, help='max docs to evaluate')
-    parser.add_argument('kb_id', metavar='kb_id', help='knowledgebase id')
+    parser.add_argument('kb_id', metavar='kb_id', help='dataset id')
    parser.add_argument('dataset', metavar='dataset', help='dataset name, shall be one of ms_marco_v1.1(https://huggingface.co/datasets/microsoft/ms_marco), trivia_qa(https://huggingface.co/datasets/mandarjoshi/trivia_qa>), miracl(https://huggingface.co/datasets/miracl/miracl')
    parser.add_argument('dataset_path', metavar='dataset_path', help='dataset path')
    parser.add_argument('miracl_corpus_path', metavar='miracl_corpus_path', nargs='?', default="", help='miracl corpus path. Only needed when dataset is miracl')