Deployment Bot committed on
Commit ·
eb576ef
1
Parent(s): 4ba6f31
Fix AI provider: Switch from Gemma 3 4b to Llama-3.1-8B-Instruct (chat-compatible)
Browse files
- backend/config.py +4 -3
backend/config.py
CHANGED
|
@@ -38,10 +38,11 @@ PROVIDER_REGISTRY = {
|
|
| 38 |
},
|
| 39 |
"huggingface": {
|
| 40 |
# HF Inference Providers router — OpenAI-compatible chat completions.
|
| 41 |
-
#
|
| 42 |
-
#
|
|
|
|
| 43 |
"base_url": "https://router.huggingface.co/v1",
|
| 44 |
-
"default_model": "
|
| 45 |
"tool_format": "openai",
|
| 46 |
"api_key_env": "HF_TOKEN",
|
| 47 |
},
|
|
|
|
| 38 |
},
|
| 39 |
"huggingface": {
|
| 40 |
# HF Inference Providers router — OpenAI-compatible chat completions.
|
| 41 |
+
# meta-llama/Llama-3.1-8B-Instruct is confirmed to work on the HF router
|
| 42 |
+
# with the free token (no monthly credit consumption).
|
| 43 |
+
# Gemma models are text-gen only — NOT chat-compatible on HF router.
|
| 44 |
"base_url": "https://router.huggingface.co/v1",
|
| 45 |
+
"default_model": "meta-llama/Llama-3.1-8B-Instruct",
|
| 46 |
"tool_format": "openai",
|
| 47 |
"api_key_env": "HF_TOKEN",
|
| 48 |
},
|