mirror of
https://github.com/ruvnet/RuVector.git
synced 2026-05-23 04:27:11 +00:00
SSE Proxy Decoupling (ADR-130):
- Fix ruvbrain-sse proxy: proper MCP handshake, session creation, drain polling
- Fix internal queue endpoints: session_create keeps receiver, drain returns buffered messages
- Add response_queues to AppState for SSE proxy communication
- Skip sparsifier for >5M edge graphs (was crashing on 16M edges)
- Add SSE_DISABLED/MAX_SSE env vars for configurable connection limits
- Route SSE to dedicated mcp.pi.ruv.io subdomain (Cloudflare CNAME)
- Serve SSE at root / path on proxy (no /sse needed)
- Update all references from pi.ruv.io/sse to mcp.pi.ruv.io
- Fix Dockerfile consciousness crate build (feature/version mismatches)

Claude Code CLI Source Research (ADR-133):
- 19 research documents analyzing Claude Code internals (3000+ lines)
- Decompiler script + RVF corpus builder for all major versions
- Binary RVF containers for v0.2, v1.0, v2.0, v2.1 (300-2068 vectors each)
- Call graphs, class hierarchies, state machines from minified source

Integration Strategy (ADR-134):
- 6-tier integration plan: WASM MCP, agents, hooks, cache, SDK, plugin
- Integration guide with architecture diagrams and performance targets

Co-Authored-By: claude-flow <ruv@ruv.net>
61 lines
1.8 KiB
YAML
61 lines
1.8 KiB
YAML
---
# Knative Service manifest for the "dragnes" service.
# The run.googleapis.com/* annotations indicate it targets Google Cloud Run.
apiVersion: serving.knative.dev/v1
kind: Service

metadata:
  name: dragnes
  labels:
    app: dragnes
    component: dermatology-intelligence
  annotations:
    run.googleapis.com/launch-stage: GA
    run.googleapis.com/ingress: all

spec:
  template:
    metadata:
      annotations:
        # Annotation values must be strings, hence the quoted numbers/booleans.
        autoscaling.knative.dev/minScale: "1"
        autoscaling.knative.dev/maxScale: "10"
        run.googleapis.com/cpu-throttling: "false"
        run.googleapis.com/startup-cpu-boost: "true"

    spec:
      containerConcurrency: 80
      timeoutSeconds: 300
      serviceAccountName: dragnes-sa@ruv-dev.iam.gserviceaccount.com

      containers:
        # NOTE(review): ":latest" is a mutable tag; consider pinning a digest
        # or version tag if reproducible deploys are required.
        - image: gcr.io/ruv-dev/dragnes:latest
          ports:
            - containerPort: 3000

          resources:
            limits:
              cpu: "2"
              memory: 2Gi

          env:
            - name: NODE_ENV
              value: production

            # The OpenAI-named variables point at OpenRouter's endpoint; the
            # key is read from a secret rather than stored in this file.
            - name: OPENAI_BASE_URL
              value: https://openrouter.ai/api/v1
            - name: OPENAI_API_KEY
              valueFrom:
                secretKeyRef:
                  name: OPENROUTER_API_KEY
                  # NOTE(review): presumably the secret version selector
                  # (Cloud Run convention) - confirm.
                  key: latest

            # JSON document passed as a single string; single quotes keep the
            # inner double quotes literal.
            - name: MCP_SERVERS
              value: '[{"name":"pi-brain","url":"https://mcp.pi.ruv.io"}]'

            - name: DRAGNES_ENABLED
              value: "true"
            - name: DRAGNES_BRAIN_URL
              value: https://pi.ruv.io
            # Quoted so the version can never be re-typed by a YAML loader.
            - name: DRAGNES_MODEL_VERSION
              value: "0.1.0"

          # Both probes hit the same health endpoint on the container port.
          startupProbe:
            httpGet:
              path: /api/health
              port: 3000
            initialDelaySeconds: 5
            periodSeconds: 5
            failureThreshold: 10

          livenessProbe:
            httpGet:
              path: /api/health
              port: 3000
            periodSeconds: 30
            failureThreshold: 3