seanpedrickcase committed on
Commit
ef8c72e
·
1 Parent(s): 40bd54b

Apply a similar cleanup to requirements_lightweight.txt

Browse files
Files changed (1) hide show
  1. requirements_lightweight.txt +31 -23
requirements_lightweight.txt CHANGED
@@ -1,35 +1,43 @@
1
- pdfminer.six==20250506
2
- pdf2image==1.17.0
3
- pymupdf==1.26.4
4
- opencv-python==4.12.0.88
5
- presidio_analyzer==2.2.360
6
- presidio_anonymizer==2.2.360
7
- presidio-image-redactor==0.0.57
8
- pikepdf==9.11.0
9
  pandas==2.3.3
10
- scikit-learn==1.7.2
11
- spacy==3.8.7
12
- en_core_web_lg @ https://github.com/explosion/spacy-models/releases/download/en_core_web_lg-3.8.0/en_core_web_lg-3.8.0.tar.gz
13
- gradio==5.49.1
14
  polars==1.33.1
15
- boto3==1.40.57
16
  pyarrow==21.0.0
17
  openpyxl==3.1.5
 
 
 
18
  Faker==37.8.0
19
  python-levenshtein==0.27.1
20
- spaczz==0.6.1
21
- https://github.com/seanpedrick-case/gradio_image_annotator/releases/download/v0.3.3/gradio_image_annotation-0.3.3-py3-none-any.whl # This version includes rotation, image zoom, and default labels, as well as the option to include id for annotation boxes
22
  rapidfuzz==3.14.1
23
- python-dotenv==1.0.1
24
- awslambdaric==3.1.1
25
- python-docx==1.2.0
26
- defusedxml==0.7.1
27
- # Test dependencies
28
- pytest>=7.0.0
29
- pytest-cov>=4.0.0
30
- spaces==0.42.1
31
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
32
 
 
 
 
 
33
 
 
 
34
 
 
 
35
 
 
 
 
 
1
+ # --- Core and data packages ---
2
+ numpy==2.2.6
 
 
 
 
 
 
3
  pandas==2.3.3
 
 
 
 
4
  polars==1.33.1
 
5
  pyarrow==21.0.0
6
  openpyxl==3.1.5
7
+ boto3==1.40.57
8
+ python-dotenv==1.0.1
9
+ defusedxml==0.7.1
10
  Faker==37.8.0
11
  python-levenshtein==0.27.1
 
 
12
  rapidfuzz==3.14.1
 
 
 
 
 
 
 
 
13
 
14
+ # --- Machine learning / NLP ---
15
+ scikit-learn==1.7.2
16
+ spacy==3.8.7
17
+ spaczz==0.6.1
18
+ en_core_web_lg @ https://github.com/explosion/spacy-models/releases/download/en_core_web_lg-3.8.0/en_core_web_lg-3.8.0.tar.gz
19
+
20
+ # --- PDF / OCR / Redaction tools ---
21
+ pdfminer.six==20250506
22
+ pdf2image==1.17.0
23
+ pymupdf==1.26.4
24
+ pikepdf==9.11.0
25
+ opencv-python==4.12.0.88
26
+ presidio_analyzer==2.2.360
27
+ presidio_anonymizer==2.2.360
28
+ presidio-image-redactor==0.0.57
29
 
30
+ # --- Gradio and apps ---
31
+ gradio==5.49.1
32
+ https://github.com/seanpedrick-case/gradio_image_annotator/releases/download/v0.3.3/gradio_image_annotation-0.3.3-py3-none-any.whl # Custom annotator version with rotation, zoom, labels, and box IDs
33
+ spaces==0.42.1
34
 
35
+ # --- AWS Lambda runtime ---
36
+ awslambdaric==3.1.1
37
 
38
+ # --- Document generation ---
39
+ python-docx==1.2.0
40
 
41
+ # --- Testing ---
42
+ pytest>=7.0.0
43
+ pytest-cov>=4.0.0