Deployment Bot committed on
Commit ·
4ba6f31
1
Parent(s): bf5c2da
Force HuggingFace provider with Gemma 3 4B for all AI operations
Browse files- backend/config.py +3 -6
backend/config.py
CHANGED
|
@@ -38,13 +38,10 @@ PROVIDER_REGISTRY = {
|
|
| 38 |
},
|
| 39 |
"huggingface": {
|
| 40 |
# HF Inference Providers router — OpenAI-compatible chat completions.
|
| 41 |
-
# google/gemma-3-
|
| 42 |
# monthly Inference-Provider credit allowance — works on the free token.
|
| 43 |
-
# Confirmed: HTTP 200 chat + native tool_calls support.
|
| 44 |
-
# If 27B is cold/unavailable, alternatives that also stay free:
|
| 45 |
-
# google/gemma-3-12b-it (smaller, faster cold-start)
|
| 46 |
"base_url": "https://router.huggingface.co/v1",
|
| 47 |
-
"default_model": "google/gemma-3-
|
| 48 |
"tool_format": "openai",
|
| 49 |
"api_key_env": "HF_TOKEN",
|
| 50 |
},
|
|
@@ -57,7 +54,7 @@ PROVIDER_REGISTRY = {
|
|
| 57 |
}
|
| 58 |
|
| 59 |
# ── Active Provider ───────────────────────────────────────────────────────────
|
| 60 |
-
ACTIVE_PROVIDER =
|
| 61 |
|
| 62 |
if ACTIVE_PROVIDER not in PROVIDER_REGISTRY:
|
| 63 |
raise ValueError(
|
|
|
|
| 38 |
},
|
| 39 |
"huggingface": {
|
| 40 |
# HF Inference Providers router — OpenAI-compatible chat completions.
|
| 41 |
+
# google/gemma-3-4b-it routes to a provider that does NOT consume the
|
| 42 |
# monthly Inference-Provider credit allowance — works on the free token.
|
|
|
|
|
|
|
|
|
|
| 43 |
"base_url": "https://router.huggingface.co/v1",
|
| 44 |
+
"default_model": "google/gemma-3-4b-it",
|
| 45 |
"tool_format": "openai",
|
| 46 |
"api_key_env": "HF_TOKEN",
|
| 47 |
},
|
|
|
|
| 54 |
}
|
| 55 |
|
| 56 |
# ── Active Provider ───────────────────────────────────────────────────────────
|
| 57 |
+
ACTIVE_PROVIDER = "huggingface" # Forced to HF per user request
|
| 58 |
|
| 59 |
if ACTIVE_PROVIDER not in PROVIDER_REGISTRY:
|
| 60 |
raise ValueError(
|