Spaces:

seanpedrickcase
/

document_redaction

Running

document_redaction / requirements.txt

Updated review functions to update with manual reviews. Minor package update

80268bb 5 days ago

1.26 kB

	pdfminer.six==20250506
	pdf2image==1.17.0
	pymupdf==1.26.3
	opencv-python==4.12.0.88
	presidio_analyzer==2.2.359
	presidio_anonymizer==2.2.359
	presidio-image-redactor==0.0.57
	pikepdf==9.10.2
	pandas==2.3.1
	scikit-learn==1.7.1
	spacy==3.8.7
	en_core_web_lg @ https://github.com/explosion/spacy-models/releases/download/en_core_web_lg-3.8.0/en_core_web_lg-3.8.0.tar.gz
	gradio==5.44.0
	boto3==1.40.10
	pyarrow==21.0.0
	openpyxl==3.1.5
	Faker==37.5.3
	python-levenshtein==0.27.1
	spaczz==0.6.1
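	# The following line installs a custom build of gradio_image_annotation (v0.3.3) directly from its GitHub release wheel rather than from PyPI: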
	https://github.com/seanpedrick-case/gradio_image_annotator/releases/download/v0.3.3/gradio_image_annotation-0.3.3-py3-none-any.whl # This version includes rotation, image zoom, and default labels, as well as the option to include id for annotation boxes
	rapidfuzz==3.13.0
	python-dotenv==1.0.1
	awslambdaric==3.1.1
	python-docx==1.2.0
	paddlepaddle==3.1.0 # Consider installing the GPU version for faster local OCR inference with PaddleOCR: paddlepaddle-gpu==3.1.0 -i https://www.paddlepaddle.org.cn/packages/stable/cu126/ , compatible with CUDA 12.6. See this for more details: https://www.paddlepaddle.org.cn/documentation/docs/en/install/pip/linux-pip_en.html#span-id-gpu-gpu-version-of-paddlepaddle-span
	paddleocr==3.1.1