rabiyulfahim committed
Commit 247f998 (verified) · Parent(s): 484d307

Update Dockerfile

Files changed (1): Dockerfile (+8 -8)
Dockerfile CHANGED
@@ -4,7 +4,7 @@ FROM python:3.10-slim
 # Set working directory
 WORKDIR /app
 
-# Install system dependencies (for PyTorch and git)
+# Install system dependencies
 RUN apt-get update && apt-get install -y git && rm -rf /var/lib/apt/lists/*
 
 # Copy requirements and install
@@ -14,18 +14,18 @@ RUN pip install --no-cache-dir -r requirements.txt
 # Copy application code
 COPY . .
 
-# ✅ Hugging Face cache directory (use /tmp, writable in Spaces)
+# ✅ Hugging Face cache directory
 ENV HF_HOME=/tmp
+ENV TRANSFORMERS_CACHE=/tmp
 
-# Pre-download model into /tmp to avoid cold start
+# Pre-download K2-Think model to avoid cold start
 RUN python -c "from transformers import AutoTokenizer, AutoModelForCausalLM; \
-model_id='rabiyulfahim/qa_python_gpt2'; \
+model_id='LLM360/K2-Think'; \
 AutoTokenizer.from_pretrained(model_id, cache_dir='/tmp'); \
 AutoModelForCausalLM.from_pretrained(model_id, cache_dir='/tmp')"
 
-
-# Expose the correct port (Hugging Face default is 7860)
+# Expose port
 EXPOSE 7860
 
-# Command to run the app
-CMD ["uvicorn", "app:app", "--host", "0.0.0.0", "--port", "7860"]
+# Command to run the FastAPI app
+CMD ["uvicorn", "main:app", "--host", "0.0.0.0", "--port", "7860"]
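For reference, the pre-download RUN step in the new Dockerfile is equivalent to the following standalone script; this is a minimal sketch of the exact calls shown in the diff, and the file name predownload.py is hypothetical. Setting both HF_HOME and TRANSFORMERS_CACHE covers transformers releases that consult either variable (recent releases warn that TRANSFORMERS_CACHE is deprecated in favor of HF_HOME). Note that running this at build time bakes the weights into an image layer, so the image grows by the full size of the model weights in exchange for skipping the download at startup.

# predownload.py -- hypothetical standalone version of the RUN step above.
# Fetches the tokenizer and model weights into /tmp at image build time so
# the container does not download them on the first request (the cold start
# the diff's comment refers to).
from transformers import AutoTokenizer, AutoModelForCausalLM

model_id = "LLM360/K2-Think"
cache_dir = "/tmp"  # matches HF_HOME / TRANSFORMERS_CACHE in the Dockerfile

AutoTokenizer.from_pretrained(model_id, cache_dir=cache_dir)
AutoModelForCausalLM.from_pretrained(model_id, cache_dir=cache_dir)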
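The updated CMD points uvicorn at main:app, i.e. an ASGI application object named app in a module named main (the old CMD looked for app:app instead). Below is a minimal sketch of a main.py that would satisfy this command, assuming FastAPI as the framework the new "FastAPI app" comment implies; the /generate endpoint, its parameters, and the generation settings are illustrative assumptions, not part of this commit.

# main.py -- hypothetical app module matching the new CMD.
from fastapi import FastAPI
from transformers import AutoTokenizer, AutoModelForCausalLM

model_id = "LLM360/K2-Think"
# Load from the same /tmp cache the build-time pre-download populated.
tokenizer = AutoTokenizer.from_pretrained(model_id, cache_dir="/tmp")
model = AutoModelForCausalLM.from_pretrained(model_id, cache_dir="/tmp")

app = FastAPI()

@app.get("/generate")
def generate(prompt: str, max_new_tokens: int = 64):
    # Tokenize the prompt, generate a continuation, and return decoded text.
    inputs = tokenizer(prompt, return_tensors="pt")
    outputs = model.generate(**inputs, max_new_tokens=max_new_tokens)
    return {"text": tokenizer.decode(outputs[0], skip_special_tokens=True)}

With this layout, uvicorn main:app --host 0.0.0.0 --port 7860 serves the app on the port Spaces expects (7860), matching the EXPOSE line.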