# 零差云控官网爬虫依赖
requests>=2.28.0
beautifulsoup4>=4.11.0
markdownify>=0.11.0
python-docx>=0.8.11
lxml>=4.9.0

# doc2md.py 依赖
Pillow>=9.0.0
matplotlib>=3.5.0 # 可选:用于渲染 LaTeX 公式
# wand>=0.6.0 # 可选:用于 WMF/EMF 转换(需要系统安装 ImageMagick)
# html2image>=2.0.0 # 可选:用于表格渲染为图片

# test_llm.py 依赖 - RAG 方案
openai>=1.0.0
langchain>=0.1.0
langchain-openai>=0.1.0
langchain-community>=0.0.20
faiss-cpu>=1.7.4
tiktoken>=0.5.0
sentence-transformers>=2.2.0
torch>=2.0.0