Fix bug in fetching the knowledge graph (#3394)

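### What problem does this PR solve?

Fetching a document's knowledge graph failed. As shown in the diff below, `knowledge_graph()` no longer looks the document up via `DocumentService.get_by_id` (and no longer returns "Document not found!"), and it stops passing the extra `doc.kb_id` argument to `retrievaler.search`. In addition, `parse()` now tolerates a request without a JSON body when reading `url`, and it parses the fetched page source with `RAGFlowHtmlParser().parser_txt(...)` instead of calling the parser object with `binary=`.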

### Type of change

- [x] Bug Fix (non-breaking change which fixes an issue)
This commit is contained in:
Kevin Hu
2024-11-14 12:29:15 +08:00
committed by GitHub
parent 400fc3f5e9
commit 4caf932808
6 changed files with 120 additions and 62 deletions

View File

@ -301,16 +301,13 @@ def retrieval_test():
@login_required
def knowledge_graph():
doc_id = request.args["doc_id"]
e, doc = DocumentService.get_by_id(doc_id)
if not e:
return get_data_error_result(message="Document not found!")
tenant_id = DocumentService.get_tenant_id(doc_id)
kb_ids = KnowledgebaseService.get_kb_ids(tenant_id)
req = {
"doc_ids":[doc_id],
"knowledge_graph_kwd": ["graph", "mind_map"]
}
sres = retrievaler.search(req, search.index_name(tenant_id), kb_ids, doc.kb_id)
sres = retrievaler.search(req, search.index_name(tenant_id), kb_ids)
obj = {"graph": {}, "mind_map": {}}
for id in sres.ids[:2]:
ty = sres.field[id]["knowledge_graph_kwd"]

View File

@ -524,7 +524,7 @@ def upload_and_parse():
@manager.route('/parse', methods=['POST'])
@login_required
def parse():
url = request.json.get("url")
url = request.json.get("url") if request.json else ""
if url:
if not is_valid_url(url):
return get_json_result(
@ -537,7 +537,7 @@ def parse():
options.add_argument('--disable-dev-shm-usage')
driver = Chrome(options=options)
driver.get(url)
sections = RAGFlowHtmlParser()("", binary=driver.page_source)
sections = RAGFlowHtmlParser().parser_txt(driver.page_source)
return get_json_result(data="\n".join(sections))
if 'file' not in request.files: