Spaces:
Running on Zero
Running on Zero
File size: 957 Bytes
# --- Preset selection (models.yaml is the source of truth) ---
ACTIVE_MODEL=minicpm5-1b
# Local dev: set to true to enable the model dropdown in Gradio.
# On a Space: leave false to pin a single model for visitors.
ALLOW_MODEL_SWITCH=false
# MODEL_PRESETS_PATH=./models.yaml
# --- Agent outputs ---
# AGENT_OUTPUTS_DIR=/tmp/agent_outputs
# AGENT_TRACES_DIR=outputs/traces
# SKILLS_DIR=./skills
# --- Legacy single-model overrides (optional; applied to ACTIVE_MODEL only) ---
# INFERENCE_BACKEND=transformers
# MODEL_ID=openbmb/MiniCPM5-1B
# TRUST_REMOTE_CODE=true
# --- llama.cpp presets (optional) ---
# ACTIVE_MODEL=qwen3b-gguf
# INFERENCE_BACKEND=llama_cpp
# MODEL_REPO=Qwen/Qwen2.5-3B-Instruct-GGUF
# MODEL_FILE=qwen2.5-3b-instruct-q4_k_m.gguf
# N_CTX=4096
# N_GPU_LAYERS=0
# Optional: path to a local GGUF file, used instead of downloading from the Hub
# MODEL_PATH=./models/qwen2.5-3b-instruct-q4_k_m.gguf
# Optional: local fine-tuned merged weights
# ACTIVE_MODEL=gemma-merged-local
# MODEL_ID=./gemma_merged_model
|