# Includes updates across gateway, router, node-worker, memory-service,
# aurora-service, swapper, sofiia-console UI and node2 infrastructure:
#   - gateway-bot: Dockerfile, http_api.py, druid/aistalk prompts, doc_service
#   - services/router: main.py, router-config.yml, fabric_metrics,
#     memory_retrieval, offload_client, prompt_builder
#   - services/node-worker: worker.py, main.py, config.py, fabric_metrics
#   - services/memory-service: Dockerfile, database.py, main.py, requirements
#   - services/aurora-service: main.py (+399), kling.py, quality_report.py
#   - services/swapper-service: main.py, swapper_config_node2.yaml
#   - services/sofiia-console: static/index.html (console UI update)
#   - config: agent_registry, crewai_agents/teams, router_agents
#   - ops/fabric_preflight.sh: updated preflight checks
#   - router-config.yml, docker-compose.node2.yml: infra updates
#   - docs: NODA1-AGENT-ARCHITECTURE, fabric_contract updated
# Made-with: Cursor
#
# 50 lines, 1.0 KiB, YAML
# Swapper Configuration for Node #2 (Development Node)
# MacBook Pro M4 Max - Apple Silicon (40-core GPU, 64GB RAM)
#
# NOTE: Swapper is now a runtime gateway / executor only.
# Source of truth for models is NCS (Node Capabilities Service).
# No hardcoded model lists — Swapper queries NCS or Ollama /api/tags at startup.
# Identifier of the node this configuration applies to.
node_id: noda2
# Runtime backends available to Swapper on this node.
# Only `ollama` is active; `mlx` and `comfyui` are kept as commented-out stanzas.
runtimes:
  ollama:
    # `host.docker.internal` is the Docker Desktop name for the host machine,
    # i.e. Ollama is addressed on the host at port 11434.
    url: http://host.docker.internal:11434
    # Unit is not stated here (no `_ms` suffix, unlike the `timeouts` keys);
    # presumably seconds — TODO confirm against the consumer.
    timeout: 300
  # mlx:
  #   stt_model: whisper-large-v3-turbo
  #   tts_model: kokoro-82m
  # comfyui:
  #   url: http://127.0.0.1:8188
# Concurrency and model-residency limits; every limit is set to 1 except the
# swap timeout.
limits:
  llm_concurrency: 1
  vision_concurrency: 1
  max_concurrent_models: 1
  # Unit is not stated here; presumably seconds — TODO confirm.
  model_swap_timeout: 300
# Per-task-type timeouts. The `_ms` suffix indicates milliseconds
# (e.g. 120000 ms = 2 min, 300000 ms = 5 min).
timeouts:
  llm_ms: 120000
  vision_ms: 180000
  stt_ms: 60000
  tts_ms: 60000
  image_gen_ms: 300000
# GPU acceleration switches for this node.
gpu:
  enabled: true
  # NOTE(review): the Ollama URL uses `host.docker.internal`, which suggests
  # Swapper itself runs in a container; confirm what this flag actually
  # controls there, since Metal is normally a host-side facility.
  metal_acceleration: true
# Filesystem locations used for models, cache and swap data.
# All three live under /app — presumably paths inside the service container;
# verify against the volume mounts.
storage:
  models_dir: /app/models
  cache_dir: /app/cache
  swap_dir: /app/swap
# Statically declared models, keyed by model name.
# NOTE(review): the file header states there are no hardcoded model lists,
# yet this section pins one entry — confirm whether it is still consumed.
models:
  # NOTE(review): the entry name suggests a FLUX model, but `path` points at
  # `segmind/tiny-sd` with a 0.7 GB size — confirm which one is intended.
  flux-klein-4b:
    path: huggingface:segmind/tiny-sd
    type: image_generation
    size_gb: 0.7
    priority: medium
    capabilities:
      - image_generation