chore(routing): flip LITELLM_BASE_URL default to https://llm-api.d-ma.be
Follow-up to infra#70. LiteLLM moved off piguard into k3s and the public llm-api.d-ma.be hostname now upstreams to koala:30401. The piguard:4000 default in the source bit-rots — works today because piguard:4000 is still alive during the 7-day soak, breaks the moment the compose comes down. Pointing the default at the public hostname survives the cutover without needing a follow-up. Production deploys via k3s already override via env (in-cluster Service DNS) so this only affects local dev shells without LITELLM_BASE_URL set. - internal/config/routing.go: comment + envOr fallback - internal/config/routing_test.go: expected value in defaults test - scripts/smoke-routing.sh: shell default task check: clean (tests + vet + govulncheck).
This commit is contained in:
@@ -11,7 +11,7 @@ import (
|
|||||||
type RoutingConfig struct {
|
type RoutingConfig struct {
|
||||||
Port string // ROUTING_PORT, default 3210
|
Port string // ROUTING_PORT, default 3210
|
||||||
MCPAuthToken string // ROUTING_MCP_TOKEN, optional bearer token
|
MCPAuthToken string // ROUTING_MCP_TOKEN, optional bearer token
|
||||||
LiteLLMBaseURL string // LITELLM_BASE_URL, default http://piguard:4000
|
LiteLLMBaseURL string // LITELLM_BASE_URL, default https://llm-api.d-ma.be
|
||||||
LiteLLMAPIKey string // LITELLM_API_KEY
|
LiteLLMAPIKey string // LITELLM_API_KEY
|
||||||
BrainURL string // BRAIN_URL, default http://ingestion.supervisor:3300
|
BrainURL string // BRAIN_URL, default http://ingestion.supervisor:3300
|
||||||
FastModel string // HYPERGUILD_FAST_MODEL, default koala/qwen35-9b-fast
|
FastModel string // HYPERGUILD_FAST_MODEL, default koala/qwen35-9b-fast
|
||||||
@@ -41,7 +41,7 @@ func LoadRouting() (RoutingConfig, error) {
|
|||||||
cfg := RoutingConfig{
|
cfg := RoutingConfig{
|
||||||
Port: envOr("ROUTING_PORT", "3210"),
|
Port: envOr("ROUTING_PORT", "3210"),
|
||||||
MCPAuthToken: os.Getenv("ROUTING_MCP_TOKEN"),
|
MCPAuthToken: os.Getenv("ROUTING_MCP_TOKEN"),
|
||||||
LiteLLMBaseURL: envOr("LITELLM_BASE_URL", "http://piguard:4000"),
|
LiteLLMBaseURL: envOr("LITELLM_BASE_URL", "https://llm-api.d-ma.be"),
|
||||||
LiteLLMAPIKey: os.Getenv("LITELLM_API_KEY"),
|
LiteLLMAPIKey: os.Getenv("LITELLM_API_KEY"),
|
||||||
BrainURL: envOr("BRAIN_URL", "http://ingestion.supervisor:3300"),
|
BrainURL: envOr("BRAIN_URL", "http://ingestion.supervisor:3300"),
|
||||||
FastModel: envOr("HYPERGUILD_FAST_MODEL", "koala/qwen35-9b-fast"),
|
FastModel: envOr("HYPERGUILD_FAST_MODEL", "koala/qwen35-9b-fast"),
|
||||||
|
|||||||
@@ -22,7 +22,7 @@ func TestLoadRoutingDefaults(t *testing.T) {
|
|||||||
require.NoError(t, err)
|
require.NoError(t, err)
|
||||||
assert.Equal(t, "3210", cfg.Port)
|
assert.Equal(t, "3210", cfg.Port)
|
||||||
assert.Equal(t, "", cfg.MCPAuthToken)
|
assert.Equal(t, "", cfg.MCPAuthToken)
|
||||||
assert.Equal(t, "http://piguard:4000", cfg.LiteLLMBaseURL)
|
assert.Equal(t, "https://llm-api.d-ma.be", cfg.LiteLLMBaseURL)
|
||||||
assert.Equal(t, "http://ingestion.supervisor:3300", cfg.BrainURL)
|
assert.Equal(t, "http://ingestion.supervisor:3300", cfg.BrainURL)
|
||||||
assert.Equal(t, "koala/qwen35-9b-fast", cfg.FastModel)
|
assert.Equal(t, "koala/qwen35-9b-fast", cfg.FastModel)
|
||||||
assert.Equal(t, "iguana/gemma4-26b", cfg.ThinkingModel)
|
assert.Equal(t, "iguana/gemma4-26b", cfg.ThinkingModel)
|
||||||
|
|||||||
@@ -4,7 +4,7 @@ set -euo pipefail
|
|||||||
# Boot the routing binary and exercise its four tools against live deps.
|
# Boot the routing binary and exercise its four tools against live deps.
|
||||||
# Skipped when LITELLM_BASE_URL or BRAIN_URL is unreachable.
|
# Skipped when LITELLM_BASE_URL or BRAIN_URL is unreachable.
|
||||||
|
|
||||||
LITELLM_BASE_URL="${LITELLM_BASE_URL:-http://piguard:4000}"
|
LITELLM_BASE_URL="${LITELLM_BASE_URL:-https://llm-api.d-ma.be}"
|
||||||
BRAIN_URL="${BRAIN_URL:-http://koala:30330}"
|
BRAIN_URL="${BRAIN_URL:-http://koala:30330}"
|
||||||
|
|
||||||
if ! curl -sS --max-time 2 "${LITELLM_BASE_URL}/v1/models" >/dev/null 2>&1; then
|
if ! curl -sS --max-time 2 "${LITELLM_BASE_URL}/v1/models" >/dev/null 2>&1; then
|
||||||
|
|||||||
Reference in New Issue
Block a user