Move some constants to common (#11004)

### What problem does this PR solve?

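As the title says: shared constants (such as `LLMType` and `ParserType`) are moved out of `api.db` into `common.constants`, and the affected imports are updated accordingly.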

### Type of change

- [x] Refactoring

---------

Signed-off-by: Jin Hai <haijin.chn@gmail.com>
This commit is contained in:
Jin Hai
2025-11-05 08:01:39 +08:00
committed by GitHub
parent 4bbbf92331
commit bab3fce136
59 changed files with 83 additions and 173 deletions

View File

@@ -18,7 +18,7 @@ import os
 import re
 import tempfile
-from api.db import LLMType
+from common.constants import LLMType
 from api.db.services.llm_service import LLMBundle
 from rag.nlp import rag_tokenizer, tokenize

View File

@@ -20,7 +20,7 @@ import re
 from io import BytesIO
 from docx import Document
-from api.db import ParserType
+from common.constants import ParserType
 from deepdoc.parser.utils import get_text
 from rag.nlp import bullets_category, remove_contents_table, \
 make_colon_as_title, tokenize_chunks, docx_question_level, tree_merge

View File

@@ -18,7 +18,7 @@ import logging
 import copy
 import re
-from api.db import ParserType
+from common.constants import ParserType
 from io import BytesIO
 from rag.nlp import rag_tokenizer, tokenize, tokenize_table, bullets_category, title_frequency, tokenize_chunks, docx_question_level
 from common.token_utils import num_tokens_from_string

View File

@@ -28,7 +28,7 @@ from markdown import markdown
 from PIL import Image
 from tika import parser
-from api.db import LLMType
+from common.constants import LLMType
 from api.db.services.llm_service import LLMBundle
 from rag.utils.file_utils import extract_embed_file, extract_links_from_pdf, extract_links_from_docx, extract_html
 from deepdoc.parser import DocxParser, ExcelParser, HtmlParser, JsonParser, MarkdownElementExtractor, MarkdownParser, PdfParser, TxtParser

View File

@@ -19,7 +19,7 @@ import copy
 import re
 from deepdoc.parser.figure_parser import vision_figure_parser_pdf_wrapper
-from api.db import ParserType
+from common.constants import ParserType
 from rag.nlp import rag_tokenizer, tokenize, tokenize_table, add_positions, bullets_category, title_frequency, tokenize_chunks
 from deepdoc.parser import PdfParser, PlainParser
 import numpy as np

View File

@@ -20,7 +20,7 @@ import re
 import numpy as np
 from PIL import Image
-from api.db import LLMType
+from common.constants import LLMType
 from api.db.services.llm_service import LLMBundle
 from deepdoc.vision import OCR
 from rag.nlp import rag_tokenizer, tokenize

View File

@@ -20,7 +20,7 @@ from io import BytesIO
 from PIL import Image
-from api.db import LLMType
+from common.constants import LLMType
 from api.db.services.llm_service import LLMBundle
 from deepdoc.parser.pdf_parser import VisionParser
 from rag.nlp import tokenize, is_english