File size: 1,341 Bytes
11196b1
 
 
 
ecb9581
11196b1
 
5be262b
 
 
2aa5eb6
5be262b
 
 
 
 
 
317f8de
 
 
 
7814a5f
2aa5eb6
9bd939c
11196b1
5be262b
11196b1
5be262b
11196b1
 
5be262b
 
11196b1
5be262b
 
 
 
11196b1
 
5be262b
11196b1
 
5be262b
 
 
 
 
 
 
 
 
11196b1
 
9d9ab2d
11196b1
 
9d9ab2d
11196b1
 
9d9ab2d
11196b1
 
5be262b
11196b1
 
9d9ab2d
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
Flask==3.1.0
flask-cors==5.0.1
Werkzeug==3.1.3
python-dotenv==1.0.1


# Core ML/AI
torch==2.1.0
torchaudio==2.1.0
torchvision==0.16.0
transformers==4.36.2
sentence-transformers==2.2.2
scikit-learn==1.3.2
numpy==1.24.3
pandas==2.1.4
scipy==1.11.4
accelerate==0.25.0
bitsandbytes==0.41.1  # For 4-bit quantization
einops==0.7.0  # Required for some transformer models
tiktoken==0.5.2  # For tokenization
protobuf==4.25.1  # Required for some model loading



# NLP
spacy==3.7.2
en-core-web-sm @ https://github.com/explosion/spacy-models/releases/download/en_core_web_sm-3.7.1/en_core_web_sm-3.7.1-py3-none-any.whl
nltk==3.8.1

# OCR & PDF/Image
pytesseract==0.3.10
pdf2image==1.16.3
PyPDF2==3.0.1
pdfminer.six==20221105
pdfplumber==0.10.3
opencv-python==4.8.1.78
pillow==10.1.0

# Whisper (speech-to-text)
openai-whisper==20231117

# Utilities
requests==2.31.0
tqdm==4.66.1
python-docx==1.0.1
gunicorn==21.2.0

# Required for Hugging Face Spaces
gradio==4.13.0
huggingface-hub==0.20.3
sentencepiece==0.1.99

# Optional: If you use celery for background tasks
# celery==5.4.0

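# Optional: If you use Haystack for search
# NOTE(review): the PyPI project named `haystack` does not appear to be deepset's
# Haystack framework, which is published as `farm-haystack` (1.x) or `haystack-ai` (2.x).
# Confirm the intended package and version before enabling this line.
# haystack==0.42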

# Optional: If you use langchain for LLM orchestration
# langchain==0.3.20

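# Optional: newer sentencepiece release. sentencepiece==0.1.99 is already pinned
# above, so enable this line only as a replacement for that pin, never alongside it
# (pip rejects two conflicting pins for the same package).
# sentencepiece==0.2.0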

# Optional: If you use systemd
# systemd-python==234