# Image that bakes the Llama-3.2-3B-Instruct IQ4_NL GGUF model into the
# llama.cpp "full" image and starts the llama.cpp server on port 7860.
FROM ghcr.io/ggml-org/llama.cpp:full

WORKDIR /app

# pip is needed only to install the Hugging Face client used for the model
# download below. `apt-get update` and `install` share one layer so a cached,
# stale package index is never reused, and the index is removed in the same
# layer so it does not end up in the image.
RUN apt-get update \
    && apt-get install -y --no-install-recommends python3-pip \
    && rm -rf /var/lib/apt/lists/*

# huggingface_hub >= 0.23 writes real files (not symlinks into the cache) when
# `local_dir` is given, which is what the download step relies on.
RUN pip install --no-cache-dir -U "huggingface_hub>=0.23"

# Download the model into the working directory (/app) at build time, then list
# it so the build fails in this layer if the file is not where CMD expects it.
# `local_dir_use_symlinks` is intentionally not passed: it is deprecated and
# ignored by huggingface_hub >= 0.23.
RUN python3 -c 'from huggingface_hub import hf_hub_download; \
    hf_hub_download(repo_id="unsloth/Llama-3.2-3B-Instruct-GGUF", \
        filename="Llama-3.2-3B-Instruct-IQ4_NL.gguf", \
        local_dir=".")' \
    && ls -lh /app/Llama-3.2-3B-Instruct-IQ4_NL.gguf

# Documentation only: the port the server is told to bind in CMD.
EXPOSE 7860

# No executable is named here, so these are arguments appended to the
# ENTRYPOINT inherited from the base image (presumably llama.cpp's tool
# dispatcher, for which `--server` selects the HTTP server - confirm against
# the base image). The server listens on all interfaces, port 7860.
CMD ["--server", "-m", "/app/Llama-3.2-3B-Instruct-IQ4_NL.gguf", "--port", "7860", "--host", "0.0.0.0", "-n", "4096", "--ctx-size", "32768"]