generated from coulomb/repo-seed
Switch the custodian triage default from anthropic/claude-sonnet-4 to google/gemini-2.5-flash, which advertises structured-output support on OpenRouter. Tighten the OpenRouter adapter to send strict JSON schema requests and set provider.require_parameters=true so routing only hits providers that honor the requested response_format. Update Kubernetes deploy docs and config for the verified coulombcore handoff: Containerfile build path, image-pull-policy=Never for smoke pods, credential-routing notes, and live smoke evidence. Mark LLM-WP-0006 finished with closure notes from 2026-06-18.
22 lines
752 B
YAML
22 lines
752 B
YAML
# ConfigMap "llm-connect-config" in the activity-core namespace: non-secret
# LLM_CONNECT_* settings for llm-connect.
# Every value under `data` is a quoted string. ConfigMap data values must be
# strings, so number- and boolean-looking values stay quoted to keep YAML from
# retyping them.
apiVersion: v1
kind: ConfigMap
metadata:
  name: llm-connect-config
  namespace: activity-core
  labels:
    app.kubernetes.io/name: llm-connect
    app.kubernetes.io/part-of: activity-core
data:
  # NOTE(review): presumably the service bind address and port; confirm
  # against the Deployment/Service that consumes this ConfigMap.
  LLM_CONNECT_HOST: "0.0.0.0"
  LLM_CONNECT_PORT: "8080"
  # Top-level provider and model selection.
  LLM_CONNECT_PROVIDER: "openrouter"
  LLM_CONNECT_MODEL: "google/gemini-2.5-flash"
  # Custodian-triage settings. Provider and model currently match the
  # top-level pair above.
  LLM_CONNECT_CUSTODIAN_TRIAGE_PROVIDER: "openrouter"
  LLM_CONNECT_CUSTODIAN_TRIAGE_MODEL: "google/gemini-2.5-flash"
  LLM_CONNECT_CUSTODIAN_TRIAGE_TEMPERATURE: "0.2"
  LLM_CONNECT_CUSTODIAN_TRIAGE_MAX_TOKENS: "1800"
  LLM_CONNECT_CUSTODIAN_TRIAGE_MAX_DEPTH: "2"
  # Unit is seconds per the key name.
  LLM_CONNECT_CUSTODIAN_TRIAGE_TIMEOUT_SECONDS: "300"
  LLM_CONNECT_CUSTODIAN_TRIAGE_REASONING_EFFORT: "medium"
  # Kept as the string "false", not a YAML boolean.
  LLM_CONNECT_STRICT_PROFILES: "false"