Spaces:

CiegCieg
/

InstructJet-AI

Sleeping

App Files Files Community

InstructJet-AI / Dockerfile

Fatmagician

New updates faster

b7e622a about 1 month ago

raw

history blame contribute delete

2.07 kB

	# Read the doc: https://huggingface.co/docs/hub/spaces-sdks-docker
	# you will also find guides on how best to write your Dockerfile

	# FROM python:3.12.3

	# RUN useradd -m -u 1000 user
	# USER user
	# ENV PATH="/home/user/.local/bin:$PATH"

	# WORKDIR /app

	# COPY --chown=user ./requirements.txt requirements.txt
	# RUN pip install --no-cache-dir --upgrade -r requirements.txt
	# RUN mkdir -p /app/models && \
	# wget https://huggingface.co/TheBloke/Llama-2-7B-Chat-GGUF/resolve/main/llama-2-7b-chat.Q4_K_M.gguf \
	# -O /app/models/llama-2-7b-chat.Q4_K_M.gguf

	# COPY --chown=user . /app
	# CMD ["uvicorn", "app:app", "--host", "0.0.0.0", "--port", "7860"]

	# Official Python 3.12 image (Debian-based; apt-get is used below).
	FROM python:3.12

	# --- System dependencies ---
	# Everything is installed in ONE layer so that `apt-get update` can never be
	# cached apart from the `install` that relies on it, and the package index is
	# deleted in the same layer that downloaded it (a later `rm` would not shrink
	# the image).
	#   build-essential, cmake : compiler toolchain, presumably for Python
	#                            packages that build native code during pip install
	#   libgomp1               : GNU OpenMP runtime library
	#   wget                   : used by the model download step
	RUN apt-get update \
	 && apt-get install -y --no-install-recommends \
	        build-essential \
	        cmake \
	        libgomp1 \
	        wget \
	 && rm -rf /var/lib/apt/lists/*

	# --- Non-root user ---
	# Create the unprivileged account (UID 1000) and, while still root, create /app
	# and hand it to that account. Later build steps run as `user` and write below
	# /app (e.g. /app/models); doing the chown here means they do not depend on how
	# the builder assigns ownership to directories created implicitly by WORKDIR.
	RUN useradd -m -u 1000 user \
	 && mkdir -p /app \
	 && chown user /app
	USER user
	WORKDIR /app
	# Put the per-user script directory first on PATH so executables installed by
	# a non-root `pip install` are found.
	ENV PATH="/home/user/.local/bin:$PATH"

	# --- Copy wheel and requirements first ---
	# Only the dependency inputs are copied at this point, so the install layer
	# below is rebuilt only when one of these two files changes, not on every
	# source edit.
	COPY --chown=user \
	     requirements.txt \
	     llama_cpp_python-0.3.20-py3-none-linux_x86_64.whl \
	     ./

	# CMake options for anything compiled from source during the install step.
	# Declared as ARG instead of ENV: the value is still exported to the RUN
	# below, but it is not baked into the runtime environment of the image and can
	# be overridden with `--build-arg CMAKE_ARGS=...`.
	# NOTE(review): the llama_cpp_python wheel copied above looks prebuilt, so
	# these flags may have no effect on it - confirm whether anything in
	# requirements.txt is actually built with CMake.
	ARG CMAKE_ARGS="-DLLAMA_AVX2=on -DLLAMA_FMA=on -DLLAMA_OPENMP=on"

	# --- Install dependencies ---
	# Order matters: upgrade pip, install the pinned requirements, then install
	# the local wheel as a separate command so it is resolved on its own.
	# --no-cache-dir keeps pip's download cache out of the layer.
	RUN pip install --no-cache-dir --upgrade pip \
	 && pip install --no-cache-dir -r requirements.txt \
	 && pip install --no-cache-dir llama_cpp_python-0.3.20-py3-none-linux_x86_64.whl

	# --- Download model ---
	# Fetch the GGUF model file into /app/models at build time, retrying on
	# refused connections (up to 5 tries, 30 s timeout each).
	# The size listing runs in the same RUN as the download: it is one conceptual
	# step, it avoids an extra layer, and `du` exits non-zero if the file is
	# missing, which fails the build.
	# NOTE(review): the URL resolves against the `main` revision, so the bytes
	# fetched can change between builds - consider pinning a commit and verifying
	# a SHA-256 once the expected digest is known.
	RUN mkdir -p /app/models \
	 && wget --progress=bar:force \
	         --retry-connrefused \
	         --tries=5 \
	         --timeout=30 \
	         -O /app/models/Ministral-3-3B-Instruct-2512-Q4_K_M.gguf \
	         https://huggingface.co/mistralai/Ministral-3-3B-Instruct-2512-GGUF/resolve/main/Ministral-3-3B-Instruct-2512-Q4_K_M.gguf \
	 && ls -lh /app/models \
	 && du -h /app/models/Ministral-3-3B-Instruct-2512-Q4_K_M.gguf

	# --- Application source ---
	# Copied after the dependency and model steps so that editing application
	# code only invalidates this layer and the ones after it.
	COPY --chown=user . /app

	# --- Network & entrypoint ---
	# EXPOSE documents the port only; it does not publish it.
	EXPOSE 7860/tcp
	# Exec form: uvicorn is started directly, without a wrapping shell, and serves
	# the `app` object from module `app` on all interfaces at port 7860.
	CMD ["uvicorn", "app:app", "--host", "0.0.0.0", "--port", "7860"]