diff --git a/deepdoc/parser/figure_parser.py b/deepdoc/parser/figure_parser.py index 3f6b40b4f..98c1d3349 100644 --- a/deepdoc/parser/figure_parser.py +++ b/deepdoc/parser/figure_parser.py @@ -41,13 +41,13 @@ def vision_figure_parser_docx_wrapper(sections,tbls,callback=None,**kwargs): except Exception: vision_model = None if vision_model: - figures_data = vision_figure_parser_figure_data_wrapper(sections) - try: - docx_vision_parser = VisionFigureParser(vision_model=vision_model, figures_data=figures_data, **kwargs) - boosted_figures = docx_vision_parser(callback=callback) - tbls.extend(boosted_figures) - except Exception as e: - callback(0.8, f"Visual model error: {e}. Skipping figure parsing enhancement.") + figures_data = vision_figure_parser_figure_data_wrapper(sections) + try: + docx_vision_parser = VisionFigureParser(vision_model=vision_model, figures_data=figures_data, **kwargs) + boosted_figures = docx_vision_parser(callback=callback) + tbls.extend(boosted_figures) + except Exception as e: + callback(0.8, f"Visual model error: {e}. Skipping figure parsing enhancement.") return tbls def vision_figure_parser_pdf_wrapper(tbls,callback=None,**kwargs): diff --git a/rag/app/manual.py b/rag/app/manual.py index a970cac06..32a38ed39 100644 --- a/rag/app/manual.py +++ b/rag/app/manual.py @@ -262,7 +262,7 @@ def chunk(filename, binary=None, from_page=0, to_page=100000, docx_parser = Docx() ti_list, tbls = docx_parser(filename, binary, from_page=0, to_page=10000, callback=callback) - tbls=vision_figure_parser_docx_wrapper(sections=sections,tbls=tbls,callback=callback,**kwargs) + tbls=vision_figure_parser_docx_wrapper(sections=ti_list,tbls=tbls,callback=callback,**kwargs) res = tokenize_table(tbls, doc, eng) for text, image in ti_list: d = copy.deepcopy(doc)