Spaces:

FoodDesert
/

Prompt_Squirrel_RAG

Running

Prompt_Squirrel_RAG / psq_rag / llm / openrouter_client.py

Food Desert

Add alias-based character tag filtering for Stage 3

c6be992 4 months ago

4.08 kB

	import os, json
	from typing import Any, Dict, List, Optional, Tuple
	import httpx


	# Credentials and model selection are read from the environment once, at import time.
	# An empty key is tolerated here; openrouter_chat() reports it as an error string instead.
	OPENROUTER_API_KEY = os.getenv("OPENROUTER_API_KEY", "")
	# Model id sent in the request payload; falls back to a small Llama instruct model.
	OPENROUTER_MODEL = os.getenv("OPENROUTER_MODEL", "meta-llama/llama-3.1-8b-instruct")

	def _extract_json_object(text: str) -> Optional[dict]:
	"""
	Best-effort: find the first top-level JSON object in a response.
	Works even if the model wraps JSON with prose or code fences.
	"""
	if not text:
	return None

	# Strip common fences
	t = text.strip()
	t = t.removeprefix("```json").removeprefix("```").removesuffix("```").strip()

	# Find first {...} span
	start = t.find("{")
	if start == -1:
	return None

	depth = 0
	for i in range(start, len(t)):
	if t[i] == "{":
	depth += 1
	elif t[i] == "}":
	depth -= 1
	if depth == 0:
	chunk = t[start:i+1]
	try:
	return json.loads(chunk)
	except Exception:
	return None
	return None



	def openrouter_chat(
	    messages: List[Dict[str, str]],
	    response_format: Optional[Dict[str, Any]] = None,
	    temperature: float = 0.2,
	    max_tokens: int = 512,
	    timeout_s: float = 30.0,
	) -> Tuple[Optional[str], Optional[dict], Optional[str]]:
	    """
	    Send one chat-completion request to OpenRouter using OPENROUTER_MODEL.

	    Returns (raw_text, parsed_json, error_str).
	    Never raises.

	    Args:
	        messages: chat messages, passed through as the "messages" field.
	        response_format: optional "response_format" field; omitted when None.
	        temperature: sampling temperature sent in the payload.
	        max_tokens: completion token limit sent in the payload.
	        timeout_s: timeout handed to the httpx client.

	    Result shapes:
	        - success: (content, parsed, None), where parsed is the JSON object
	          extracted from content, or None if there is none.
	        - flagged: (content, parsed, "Filtered (...)" or "Refusal-like (...)")
	          when finish_reason is "content_filter" or the content starts with a
	          refusal phrase. The parenthesised part lists the model, finish
	          reasons and token usage when the response provides them.
	        - failure: (None, None, error_str).

	    Instrumented to help diagnose moderation/routing variance; failure strings:
	    - include the HTTP status
	    - include the OpenRouter error message/code if provided
	    """
	    if not OPENROUTER_API_KEY:
	        return None, None, "OPENROUTER_API_KEY missing"

	    payload: Dict[str, Any] = {
	        "model": OPENROUTER_MODEL,
	        "messages": messages,
	        "temperature": temperature,
	        "max_tokens": max_tokens,
	    }
	    if response_format is not None:
	        payload["response_format"] = response_format

	    headers = {
	        "Authorization": f"Bearer {OPENROUTER_API_KEY}",
	        "Content-Type": "application/json",
	        "HTTP-Referer": "https://huggingface.co/spaces",
	        "X-Title": "Prompt_Squirrel_RAG",
	    }

	    try:
	        with httpx.Client(timeout=timeout_s) as client:
	            r = client.post(
	                "https://openrouter.ai/api/v1/chat/completions",
	                headers=headers,
	                json=payload,
	            )

	        status = r.status_code

	        # A non-JSON body would otherwise surface as a bare decode error
	        # with no hint of the HTTP status, so report both explicitly.
	        try:
	            data = r.json()
	        except ValueError:
	            body_preview = (r.text or "").strip()[:200]
	            return None, None, f"HTTP {status}: non-JSON response body: {body_preview!r}"

	        if not isinstance(data, dict):
	            return None, None, f"HTTP {status}: unexpected response type {type(data).__name__}"

	        # Surface API-level failures instead of failing later on a missing
	        # "choices" key. An "error" payload is reported regardless of status.
	        api_error = data.get("error")
	        if api_error or status >= 400:
	            details = [f"HTTP {status}"]
	            if isinstance(api_error, dict):
	                if api_error.get("code") is not None:
	                    details.append(f"code={api_error['code']}")
	                if api_error.get("message"):
	                    details.append(f"message={api_error['message']}")
	            elif api_error:
	                details.append(f"error={api_error}")
	            return None, None, f"OpenRouter error ({'; '.join(details)})"

	        choices = data.get("choices")
	        if not choices:
	            return None, None, f"HTTP {status}: response contained no choices"

	        choice0 = choices[0]
	        content = (choice0["message"].get("content", "") or "").strip()

	        finish_reason = choice0.get("finish_reason")
	        native_finish_reason = choice0.get("native_finish_reason")

	        # Diagnostic metadata, only attached to the error string when the
	        # response is flagged below.
	        meta = []
	        if data.get("model"):
	            meta.append(f"model={data['model']}")
	        if finish_reason:
	            meta.append(f"finish={finish_reason}")
	        if native_finish_reason:
	            meta.append(f"native_finish={native_finish_reason}")
	        usage = data.get("usage")
	        if isinstance(usage, dict) and "prompt_tokens" in usage and "completion_tokens" in usage:
	            meta.append(f"tokens={usage['prompt_tokens']}+{usage['completion_tokens']}")

	        parsed = _extract_json_object(content)

	        # If it looks filtered, flag it
	        if finish_reason == "content_filter":
	            return content, parsed, f"Filtered (content_filter; {'; '.join(meta)})"

	        # If it looks refusal-like but not content_filter, still flag it
	        if content.lower().startswith(("i can't", "i can’t", "i cannot", "can't", "cannot")):
	            return content, parsed, f"Refusal-like ({'; '.join(meta)})"

	        return content, parsed, None

	    except Exception as e:
	        # Boundary catch-all: this function's contract is to never raise
	        # (timeouts, connection errors, malformed response shapes, ...).
	        return None, None, f"{type(e).__name__}: {e}"


	if __name__ == "__main__":
	    # Import smoke test: running this file directly only confirms that the
	    # module (and its httpx dependency) imports cleanly; no request is sent.
	    print("openrouter_client.py imports ok")