Spaces:

Dzunisani007
/

cv-analyser

Running

cv-analyser / Dockerfile.hf-ocr

Optimize Docker build process and dependencies

78bd45b 23 days ago

1.05 kB

	FROM python:3.11-slim

	# Install system-level dependencies for OCR and PDF processing
	RUN apt-get update && apt-get install -y \
	build-essential \
	curl \
	git \
	python3-dev \
	libmagic-dev \
	tesseract-ocr \
	tesseract-ocr-eng \
	libtesseract-dev \
	poppler-utils \
	libgl1-mesa-glx \
	libglib2.0-0 \
	&& apt-get install -y libmagic1 \
	&& rm -rf /var/lib/apt/lists/*

	WORKDIR /app

	# Upgrade pip
	RUN pip install --no-cache-dir --upgrade pip

	# Copy requirements and install Python dependencies
	COPY requirements.hf.txt requirements.txt

	# Pre-install heavy engines to avoid build conflicts
	RUN pip install --no-cache-dir torch==2.1.1 numpy==1.24.4
	RUN FORCE_CUDA=0 pip install --no-cache-dir -r requirements.txt

	# Re-add OCR dependencies to requirements
	RUN pip install --no-cache-dir pytesseract pdf2image pdfplumber

	# Copy application code
	COPY . .

	# Expose port for Hugging Face Spaces
	EXPOSE 7860

	# Command to run the application
	CMD ["uvicorn", "app.main:app", "--host", "0.0.0.0", "--port", "7860"]