30 lines
610 B
Plaintext
30 lines
610 B
Plaintext
|
|
fastapi==0.104.1
|
|||
|
|
uvicorn==0.24.0
|
|||
|
|
python-multipart==0.0.6
|
|||
|
|
pydantic==2.5.0
|
|||
|
|
requests==2.31.0
|
|||
|
|
python-dotenv==1.0.0
|
|||
|
|
|
|||
|
|
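# OCR-related (optional: pip installs every uncommented line, so comment out the packages in this group that you do not need)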
|
|||
|
|
baidu-aip==4.16.13
|
|||
|
|
paddleocr==2.7.0
|
|||
|
|
paddlepaddle==2.5.2
|
|||
|
|
pdfplumber==0.10.3
|
|||
|
|
Pillow>=10.0.0
|
|||
|
|
|
|||
|
|
# MinerU核心依赖(高精度文档解析)
|
|||
|
|
loguru>=0.7.2
|
|||
|
|
numpy>=1.21.6
|
|||
|
|
tqdm>=4.67.1
|
|||
|
|
|
|||
|
|
# LLM-related (install as needed: comment out the SDKs in this group that you do not use)
|
|||
|
|
openai==1.3.0
|
|||
|
|
cozepy # Coze官方Python SDK
|
|||
|
|
|
|||
|
|
# Word和PDF处理
|
|||
|
|
PyMuPDF # PDF处理
|
|||
|
|
python-docx # Word文档处理
|
|||
|
|
weasyprint==60.1 # Recommended, better output quality (needs the Pango system library; on Windows install the GTK3 runtime)
|
|||
|
|
xhtml2pdf==0.2.13 # 备用方案,更简单(纯Python)
|
|||
|
|
jinja2==3.1.2
|