MDIIII's picture
perf: raise rate limit to 200/min for paid-tier models
2f5bdbc
Raw
History Blame Contribute Delete
1.2 kB
import os
# OpenRouter connection settings.
# The API key comes from the OPENROUTER_API_KEY environment variable and
# falls back to an empty string when that variable is unset.
OPENROUTER_BASE_URL = "https://openrouter.ai/api/v1"
OPENROUTER_API_KEY = os.environ.get("OPENROUTER_API_KEY", "")
# Model identifiers offered on OpenRouter's free tier (verified working 2026-06).
FREE_MODELS = [
    "google/gemma-4-31b-it:free",
    "google/gemma-4-26b-a4b-it:free",
    "nvidia/nemotron-3-super-120b-a12b:free",
    "meta-llama/llama-3.3-70b-instruct:free",
]

# The first free model is the default.
DEFAULT_MODEL = FREE_MODELS[0]

# Paid (affordable) open-source models via OpenRouter.
PAID_MODELS = [
    "meta-llama/llama-3.1-8b-instruct",
    "google/gemma-4-26b-a4b-it",
    "qwen/qwen3.5-9b",
    "meta-llama/llama-3.3-70b-instruct",
]

# Every selectable model: a new list with the free entries first, then the
# paid ones, in their declared order.
AVAILABLE_MODELS = [*FREE_MODELS, *PAID_MODELS]
# Supported trading pairs.
ASSETS = [
    "BTC/USDT",
    "ETH/USDT",
]

# Per-asset lookup from the pair name to a second symbol; presumably the
# ticker used with yfinance, judging by the constant's name.
ASSET_YFINANCE_MAP = {
    "BTC/USDT": "BTC-USD",
    "ETH/USDT": "ETH-USD",
}
# Identifiers of the available benchmarks.
BENCHMARKS = [
    "A",
    "B",
    "C",
]
# Portfolio defaults.
INITIAL_CAPITAL: float = 10_000.0  # starting capital
TRADE_FEE: float = 0.001  # 0.1%, stored as a fraction
# Rate limiting — paid OpenRouter tier supports 200+ req/min
# 200/min shared across parallel runs → ~50/run when 4 run simultaneously
MAX_REQUESTS_PER_MINUTE: int = 200  # request ceiling per minute
LLM_TIMEOUT: int = 120  # presumably seconds; confirm against the client that reads it
LLM_MAX_RETRIES: int = 3  # retry budget for LLM calls
# Database file location: taken from the DB_PATH environment variable, with
# "/app/data/benchmark.db" used when that variable is unset.
DB_PATH = os.environ.get("DB_PATH", "/app/data/benchmark.db")