Configure all agents for local inference via festinger

- All agents now use lm_studio provider → http://festinger:11434
- ctx_length set to 32768 for Omega13 (128GB RAM); reduce for smaller machines
- Model: qwen2.5-7b-instruct (update to a larger model on Omega13)
- Each agent has a unique A0_PERSISTENT_RUNTIME_ID for stable mcp_server_token
- agent_profile=agent0 and mcp_server_enabled=true set in all settings.json files
- agents/agent0/prompts/ placeholder created for pull-on-start persona override
- pull-agent-identity.py now writes to usr/agents/agent0/prompts/ (correct override path)
- festinger: agent_frameworks table auto-seeded on startup with all 5 agents
- festinger: num_ctx injection, agent_frameworks CRUD + admin UI, /chat endpoint
- festinger: removed debug system_prompt logging

Co-Authored-By: Claude Sonnet 4.6 <noreply@anthropic.com>
This commit is contained in:
2026-05-03 13:00:07 +02:00
parent 4a2b682f6d
commit 8e97cbc97a
24 changed files with 609 additions and 101 deletions
+16 -10
View File
@@ -1,27 +1,33 @@
{
"allow_chat_override": false,
"chat_model": {
"provider": "anthropic",
"name": "claude-opus-4-6",
"api_base": "http://festinger:11434/v1/messages",
"ctx_length": 100000,
"provider": "lm_studio",
"name": "qwen2.5-7b-instruct",
"api_base": "http://festinger:11434",
"ctx_length": 32768,
"ctx_history": 0.7,
"vision": true,
"rl_requests": 0,
"rl_input": 0,
"rl_output": 0,
"kwargs": {"max_tokens": 4096}
"kwargs": {
"max_tokens": 4096,
"agent_id": 5
},
"max_embeds": 10
},
"utility_model": {
"provider": "ollama",
"name": "deepseek-r1:8b",
"provider": "lm_studio",
"name": "qwen2.5-7b-instruct",
"api_base": "http://festinger:11434",
"ctx_length": 100000,
"ctx_length": 32768,
"ctx_input": 0.7,
"rl_requests": 0,
"rl_input": 0,
"rl_output": 0,
"kwargs": {}
"kwargs": {
"X-Agent-Id": 5
}
},
"embedding_model": {
"provider": "huggingface",
@@ -31,4 +37,4 @@
"rl_input": 0,
"kwargs": {}
}
}
}