Deployment Bot committed on
Commit
4ba6f31
·
1 Parent(s): bf5c2da

Force HuggingFace provider with Gemma 3 4B for all AI operations

Browse files
Files changed (1) hide show
  1. backend/config.py +3 -6
backend/config.py CHANGED
@@ -38,13 +38,10 @@ PROVIDER_REGISTRY = {
38
  },
39
  "huggingface": {
40
  # HF Inference Providers router — OpenAI-compatible chat completions.
41
- # google/gemma-3-27b-it routes to a provider that does NOT consume the
42
  # monthly Inference-Provider credit allowance — works on the free token.
43
- # Confirmed: HTTP 200 chat + native tool_calls support.
44
- # If 27B is cold/unavailable, alternatives that also stay free:
45
- # google/gemma-3-12b-it (smaller, faster cold-start)
46
  "base_url": "https://router.huggingface.co/v1",
47
- "default_model": "google/gemma-3-27b-it",
48
  "tool_format": "openai",
49
  "api_key_env": "HF_TOKEN",
50
  },
@@ -57,7 +54,7 @@ PROVIDER_REGISTRY = {
57
  }
58
 
59
  # ── Active Provider ───────────────────────────────────────────────────────────
60
- ACTIVE_PROVIDER = os.getenv("PROVIDER", "anthropic").lower()
61
 
62
  if ACTIVE_PROVIDER not in PROVIDER_REGISTRY:
63
  raise ValueError(
 
38
  },
39
  "huggingface": {
40
  # HF Inference Providers router — OpenAI-compatible chat completions.
41
+ # google/gemma-3-4b-it routes to a provider that does NOT consume the
42
  # monthly Inference-Provider credit allowance — works on the free token.
 
 
 
43
  "base_url": "https://router.huggingface.co/v1",
44
+ "default_model": "google/gemma-3-4b-it",
45
  "tool_format": "openai",
46
  "api_key_env": "HF_TOKEN",
47
  },
 
54
  }
55
 
56
  # ── Active Provider ───────────────────────────────────────────────────────────
57
+ ACTIVE_PROVIDER = "huggingface" # Forced to HF per user request
58
 
59
  if ACTIVE_PROVIDER not in PROVIDER_REGISTRY:
60
  raise ValueError(