mekosotto committed on
Commit
c6ef481
·
1 Parent(s): e175fb0

feat(llm): refresh free-tier chain with verified-live OpenRouter IDs

Browse files
Files changed (1) hide show
  1. src/llm/explainer.py +11 -11
src/llm/explainer.py CHANGED
@@ -58,18 +58,18 @@ _LLM_TEMPERATURE = 0.3
58
  # 5xx (upstream), we advance to the next model. Network/timeout errors fall
59
  # straight to the deterministic template — switching models won't help.
60
  # Override at runtime via OPENROUTER_FREE_MODELS (comma-separated). Model
61
- # availability on OpenRouter churns; an ID that 404s is skipped silently.
62
  _DEFAULT_FREE_MODEL_CHAIN: tuple[str, ...] = (
63
- "inclusionai/ling-2.6-1t:free", # ~1T flagship
64
- "nvidia/nemotron-3-super-120b-a12b:free", # 120B reasoning MoE
65
- "minimax/minimax-m2.5:free",
66
- "tencent/hy3-preview:free", # MoE + reasoning
67
- "google/gemma-4-31b-it:free",
68
- "google/gemma-4-26b-a4b-it:free",
69
- "nvidia/nemotron-3-nano-omni-30b-a3b-reasoning:free",
70
- "poolside/laguna-m.1:free",
71
- "poolside/laguna-xs.2:free",
72
- "meta-llama/llama-3.2-3b-instruct:free", # 3B last-resort
73
  )
74
 
75
 
 
58
  # 5xx (upstream), we advance to the next model. Network/timeout errors fall
59
  # straight to the deterministic template — switching models won't help.
60
  # Override at runtime via OPENROUTER_FREE_MODELS (comma-separated). Model
61
+ # availability on OpenRouter churns; verify with scripts/diagnose_openrouter.py.
62
  _DEFAULT_FREE_MODEL_CHAIN: tuple[str, ...] = (
63
+ "inclusionai/ling-2.6-1t:free", # ~1T flagship — verified OK, returns content
64
+ "nvidia/nemotron-3-super-120b-a12b:free", # 120B verified OK, returns content
65
+ "minimax/minimax-m2.5:free", # MoE — verified OK, returns content
66
+ "google/gemma-4-31b-it:free", # 31B currently 429 but valid id
67
+ "google/gemma-4-26b-a4b-it:free", # 26B MoE — currently 429 but valid id
68
+ "qwen/qwen3-next-80b-a3b-instruct:free", # 80B — currently 429 but valid id
69
+ "tencent/hy3-preview:free", # MoE preview — verified OK
70
+ "nvidia/nemotron-3-nano-omni-30b-a3b-reasoning:free", # 30B reasoning — verified OK
71
+ "nvidia/nemotron-3-nano-30b-a3b:free", # 30B — verified OK
72
+ "poolside/laguna-xs.2:free", # smallest — verified OK
73
  )
74
 
75