docs(llm): add probe-date + 429-policy notes; fix chain capability order
Browse files
- src/llm/explainer.py +4 -1
src/llm/explainer.py
CHANGED
|
@@ -59,13 +59,16 @@ _LLM_TEMPERATURE = 0.3
|
|
| 59 |
# straight to the deterministic template — switching models won't help.
|
| 60 |
# Override at runtime via OPENROUTER_FREE_MODELS (comma-separated). Model
|
| 61 |
# availability on OpenRouter churns; verify with scripts/diagnose_openrouter.py.
|
|
|
|
|
|
|
|
|
|
| 62 |
_DEFAULT_FREE_MODEL_CHAIN: tuple[str, ...] = (
|
| 63 |
"inclusionai/ling-2.6-1t:free", # ~1T flagship — verified OK, returns content
|
| 64 |
"nvidia/nemotron-3-super-120b-a12b:free", # 120B — verified OK, returns content
|
| 65 |
"minimax/minimax-m2.5:free", # MoE — verified OK, returns content
|
|
|
|
| 66 |
"google/gemma-4-31b-it:free", # 31B — currently 429 but valid id
|
| 67 |
"google/gemma-4-26b-a4b-it:free", # 26B MoE — currently 429 but valid id
|
| 68 |
-
"qwen/qwen3-next-80b-a3b-instruct:free", # 80B — currently 429 but valid id
|
| 69 |
"tencent/hy3-preview:free", # MoE preview — verified OK
|
| 70 |
"nvidia/nemotron-3-nano-omni-30b-a3b-reasoning:free", # 30B reasoning — verified OK
|
| 71 |
"nvidia/nemotron-3-nano-30b-a3b:free", # 30B — verified OK
|
|
|
|
| 59 |
# straight to the deterministic template — switching models won't help.
|
| 60 |
# Override at runtime via OPENROUTER_FREE_MODELS (comma-separated). Model
|
| 61 |
# availability on OpenRouter churns; verify with scripts/diagnose_openrouter.py.
|
| 62 |
+
# Last verified: 2026-05-02 via scripts/diagnose_openrouter.py.
|
| 63 |
+
# Entries marked "currently 429" have valid IDs but were quota-exhausted at
|
| 64 |
+
# probe time; kept because OpenRouter rate limits are per-window, so quota recovers.
|
| 65 |
_DEFAULT_FREE_MODEL_CHAIN: tuple[str, ...] = (
|
| 66 |
"inclusionai/ling-2.6-1t:free", # ~1T flagship — verified OK, returns content
|
| 67 |
"nvidia/nemotron-3-super-120b-a12b:free", # 120B — verified OK, returns content
|
| 68 |
"minimax/minimax-m2.5:free", # MoE — verified OK, returns content
|
| 69 |
+
"qwen/qwen3-next-80b-a3b-instruct:free", # 80B — currently 429 but valid id
|
| 70 |
"google/gemma-4-31b-it:free", # 31B — currently 429 but valid id
|
| 71 |
"google/gemma-4-26b-a4b-it:free", # 26B MoE — currently 429 but valid id
|
|
|
|
| 72 |
"tencent/hy3-preview:free", # MoE preview — verified OK
|
| 73 |
"nvidia/nemotron-3-nano-omni-30b-a3b-reasoning:free", # 30B reasoning — verified OK
|
| 74 |
"nvidia/nemotron-3-nano-30b-a3b:free", # 30B — verified OK
|