damoojeje committed on
Commit
53c6d79
·
verified ·
1 Parent(s): 3fbb6a1

Update requirements.txt

Browse files
Files changed (1) hide show
  1. requirements.txt +20 -20
requirements.txt CHANGED
@@ -1,45 +1,45 @@
1
  # ===============================
2
  # 📦 Embedding + Vector Search
3
  # ===============================
4
- chromadb
5
- sentence-transformers # Compatible with huggingface-hub 0.30.1
6
- torch # Stable with sentence-transformers
7
 
8
  # ===============================
9
  # 🤖 LLM-Based QA
10
  # ===============================
11
- transformers # Works well with huggingface-hub 0.30.1
12
- accelerate
13
- huggingface-hub # Compatible with transformers 4.37.2
14
 
15
  # ===============================
16
  # 📄 PDF Parsing
17
  # ===============================
18
- pymupdf # PyMuPDF for full-page text extraction
19
- pdfminer.six # Optional: structured layout extraction
20
 
21
  # ===============================
22
  # 🖼️ OCR + Image Handling
23
  # ===============================
24
- pytesseract # Requires separate install of Tesseract binary
25
- Pillow
26
 
27
  # ===============================
28
  # 🌐 UI Interface
29
  # ===============================
30
- gradio # Gradio 4+ for modern UI
31
- requests
32
 
33
  # ===============================
34
  # 🛠 Utilities and Fixes
35
  # ===============================
36
- beautifulsoup4 # Parsing for HTML-in-PDFs (e.g., diagrams/tables)
37
- pydantic # Chromadb is not yet compatible with pydantic 2.x
38
- numpy # Ensures compatibility with chromadb and transformers
39
- tqdm # Progress bar (used in embedding scripts)
40
 
41
- # Natural Language Toolkit=========
42
- nltk
 
 
43
  docx2txt
44
- python-docx
45
- spacy
 
1
  # ===============================
2
  # 📦 Embedding + Vector Search
3
  # ===============================
4
+ chromadb==0.4.24
5
+ sentence-transformers==2.4.0
6
+ torch>=2.0.1
7
 
8
  # ===============================
9
  # 🤖 LLM-Based QA
10
  # ===============================
11
+ transformers==4.38.2
12
+ accelerate>=0.26.1
13
+ huggingface-hub==0.30.1
14
 
15
  # ===============================
16
  # 📄 PDF Parsing
17
  # ===============================
18
+ pymupdf>=1.23.0
19
+ pdfminer.six>=20221105
20
 
21
  # ===============================
22
  # 🖼️ OCR + Image Handling
23
  # ===============================
24
+ pytesseract>=0.3.10
25
+ Pillow>=9.4.0
26
 
27
  # ===============================
28
  # 🌐 UI Interface
29
  # ===============================
30
+ gradio>=4.29.0
31
+ requests>=2.31.0
32
 
33
  # ===============================
34
  # 🛠 Utilities and Fixes
35
  # ===============================
36
+ beautifulsoup4>=4.12.2
37
+ pydantic==1.10.13 # Important: lock to v1.x (chroma not yet compatible with pydantic 2)
38
+ numpy==1.26.4
39
+ tqdm
40
 
41
+ # 🔤 NLP & DOCX Parsing
42
+ nltk>=3.8.1
43
+ spacy>=3.7.2
44
+ python-docx>=1.1.0
45
  docx2txt