30 lines
427 B
Plaintext
30 lines
427 B
Plaintext
# OCR字幕提取工具依赖包
|
|
|
|
# 基础依赖
|
|
opencv-python>=4.8.0
|
|
numpy>=1.21.0
|
|
Pillow>=9.0.0
|
|
|
|
# OCR引擎
|
|
paddlepaddle>=2.5.0
|
|
paddleocr>=2.7.0
|
|
easyocr>=1.7.0
|
|
torch>=1.13.0
|
|
torchvision>=0.14.0
|
|
|
|
# 模型和图像处理
|
|
shapely>=1.8.0
|
|
scipy>=1.9.0
|
|
scikit-image>=0.19.0
|
|
|
|
# FunASR (用于SenseVoice)
|
|
funasr>=1.0.0
|
|
modelscope>=1.9.0
|
|
|
|
# 文本处理
|
|
regex>=2022.0.0
|
|
Levenshtein>=0.20.0
|
|
|
|
# 工具库
|
|
tqdm>=4.64.0
|
|
requests>=2.28.0