Spaces:

satyaki-mitra
/

ContractIntel_AI

Sleeping

satyaki-mitra committed 5 days ago

Commit

31b2e82

1 Parent(s): 02d909f

README updated

Files changed (3) hide show

Dockerfile CHANGED Viewed

@@ -1,26 +1,17 @@
-FROM python:3.11-slim
 WORKDIR /app
-# Install system dependencies for llama-cpp-python and PDF processing
 RUN apt-get update && apt-get install -y \
     curl \
     wget \
     git \
-    build-essential \
-    cmake \
-    pkg-config \
-    libopenblas-dev \
-    liblapack-dev \
-    libxml2-dev \
-    libxslt1-dev \
-    zlib1g-dev \
-    libjpeg-dev \
-    libpng-dev \
-    libfreetype6-dev \
     && rm -rf /var/lib/apt/lists/*
-# Copy requirements and install with optimizations
 COPY requirements.txt .
 RUN pip install --no-cache-dir --upgrade pip && \
     pip install --no-cache-dir -r requirements.txt
@@ -28,24 +19,24 @@ RUN pip install --no-cache-dir --upgrade pip && \
 # Download spaCy model
 RUN python -m spacy download en_core_web_sm
-# Copy application
 COPY . .
-# Create directories (HF Spaces uses /data for persistent storage)
 RUN mkdir -p uploads cache logs /data/models
-# Expose port (HF Spaces uses 7860 by default)
-EXPOSE 7860
-# Environment variables for CPU-only operation
 ENV LLAMA_CPP_N_GPU_LAYERS=0
-ENV CUDA_VISIBLE_DEVICES=""
-ENV OMP_NUM_THREADS=4
-ENV NUMEXPR_MAX_THREADS=4
-# HEALTH CHECK for HF Spaces
 HEALTHCHECK --interval=30s --timeout=10s --start-period=5s --retries=3 \
     CMD curl -f http://localhost:7860/api/v1/health || exit 1
-# CMD for HuggingFace Spaces (NO Ollama!)
-CMD uvicorn app:app --host 0.0.0.0 --port 7860 --workers 1 --timeout-keep-alive 30

+FROM python:3.11-slim-bookworm
 WORKDIR /app
+# Install ONLY minimal runtime dependencies (no build tools!)
+# libgomp1 is needed by OpenMP in NumPy/SciPy; git/wget/curl for huggingface-hub
+# --no-install-recommends stops apt from pulling in optional extras, which is
+# what actually keeps this layer minimal.
+RUN apt-get update && apt-get install -y --no-install-recommends \
     curl \
     wget \
     git \
+    libgomp1 \
     && rm -rf /var/lib/apt/lists/*
+# Create the unprivileged runtime user. Hugging Face Docker Spaces run the
+# container as UID 1000, so the app's writable paths must belong to that UID.
+RUN useradd --create-home --uid 1000 appuser
+# Install Python dependencies (wheels only — no compilation!)
 COPY requirements.txt .
 RUN pip install --no-cache-dir --upgrade pip && \
     pip install --no-cache-dir -r requirements.txt
 # Download spaCy model
 RUN python -m spacy download en_core_web_sm
+# Copy app code, owned by the runtime user
+COPY --chown=appuser:appuser . .
+# Create the writable directories and hand them (and /app itself, so the app
+# can create new top-level paths) to the runtime user.
+RUN mkdir -p uploads cache logs /data/models && \
+    chown -R appuser:appuser uploads cache logs /data && \
+    chown appuser:appuser /app
+# Environment: enforce CPU mode
+ENV CUDA_VISIBLE_DEVICES=""
 ENV LLAMA_CPP_N_GPU_LAYERS=0
+ENV OMP_NUM_THREADS=2
+ENV NUMEXPR_MAX_THREADS=2
+# Point HOME at the runtime user's home so per-user caches land somewhere writable
+ENV HOME=/home/appuser
+# Expose port
+EXPOSE 7860
+# Health check
 HEALTHCHECK --interval=30s --timeout=10s --start-period=5s --retries=3 \
     CMD curl -f http://localhost:7860/api/v1/health || exit 1
+# Drop root before starting the server; every root-only step is above this line
+USER appuser
+# Run app
+CMD ["uvicorn", "app:app", "--host", "0.0.0.0", "--port", "7860", "--workers", "1", "--timeout-keep-alive", "30"]

README.md CHANGED Viewed

@@ -4,7 +4,6 @@ emoji: 📝
 colorFrom: blue
 colorTo: purple
 sdk: docker
-accelerator: gpu
 license: mit
 ---

 colorFrom: blue
 colorTo: purple
 sdk: docker
 license: mit
 ---

requirements.txt CHANGED Viewed

@@ -1,4 +1,4 @@
---extra-index-url https://pypi.org/simple/ https://huggingface.github.io/llama-cpp-python-wheels/
 # Core Dependencies
 fastapi>=0.104.1
@@ -7,8 +7,8 @@ pydantic>=2.5.0
 pydantic-settings>=2.1.0
 python-multipart>=0.0.6
-# AI & NLP Libraries
-torch>=2.1.0
 transformers>=4.35.0
 sentence-transformers>=2.2.2
 tokenizers>=0.14.0
@@ -40,7 +40,7 @@ openai>=1.0.0
 anthropic>=0.5.0
 # For Hugging Face Spaces
-llama-cpp-python==0.3.16        # pinned to version with pre-built wheel
 huggingface-hub>=0.19.0
 # Text Processing Utilities

+# One index per --extra-index-url line: the option takes a single URL, so
+# listing several on one line does not register the additional indexes.
+--extra-index-url https://pypi.org/simple/
+--extra-index-url https://huggingface.github.io/llama-cpp-python-wheels/
+--extra-index-url https://download.pytorch.org/whl/cpu
 # Core Dependencies
 fastapi>=0.104.1
 pydantic-settings>=2.1.0
 python-multipart>=0.0.6
+# AI & NLP Libraries (CPU-only PyTorch!)
+# No "+cpu" suffix here: PEP 440 forbids local version labels with ">=", and
+# current pip rejects such a specifier. The CPU build is expected to come from
+# the PyTorch CPU index above, since a "+cpu" local version sorts above the
+# same public version.
+torch>=2.1.0
 transformers>=4.35.0
 sentence-transformers>=2.2.2
 tokenizers>=0.14.0
 anthropic>=0.5.0
 # For Hugging Face Spaces
+llama-cpp-python==0.3.16  # Pinned to pre-built wheel
 huggingface-hub>=0.19.0
 # Text Processing Utilities