Deployment Bot committed on
Commit
eb576ef
·
1 Parent(s): 4ba6f31

Fix AI provider: Switch from Gemma 3 4b to Llama-3.1-8B-Instruct (chat-compatible)

Browse files
Files changed (1) hide show
  1. backend/config.py +4 -3
backend/config.py CHANGED
@@ -38,10 +38,11 @@ PROVIDER_REGISTRY = {
38
  },
39
  "huggingface": {
40
  # HF Inference Providers router — OpenAI-compatible chat completions.
41
- # google/gemma-3-4b-it routes to a provider that does NOT consume the
42
- # monthly Inference-Provider credit allowance, so it works on the free token.
 
43
  "base_url": "https://router.huggingface.co/v1",
44
- "default_model": "google/gemma-3-4b-it",
45
  "tool_format": "openai",
46
  "api_key_env": "HF_TOKEN",
47
  },
 
38
  },
39
  "huggingface": {
40
  # HF Inference Providers router — OpenAI-compatible chat completions.
41
+ # meta-llama/Llama-3.1-8B-Instruct is confirmed to work on the HF router
42
+ # with the free token (no monthly credit consumption).
43
+ # Gemma models are text-gen only — NOT chat-compatible on HF router.
44
  "base_url": "https://router.huggingface.co/v1",
45
+ "default_model": "meta-llama/Llama-3.1-8B-Instruct",
46
  "tool_format": "openai",
47
  "api_key_env": "HF_TOKEN",
48
  },