Compare commits

..

1 Commits

Author SHA1 Message Date
Alexander Whitestone
c7dfb8a5e6 fix: [MONITORING] Integrate Kimi Heartbeat status into Nexus Watchdog (closes #800)
Some checks failed
CI / test (pull_request) Failing after 8s
CI / validate (pull_request) Failing after 12s
2026-04-10 20:16:43 -04:00
6 changed files with 117 additions and 482 deletions

14
app.js
View File

@@ -5,7 +5,6 @@ import { UnrealBloomPass } from 'three/addons/postprocessing/UnrealBloomPass.js'
import { SMAAPass } from 'three/addons/postprocessing/SMAAPass.js';
import { SpatialMemory } from './nexus/components/spatial-memory.js';
import { SessionRooms } from './nexus/components/session-rooms.js';
import { EvenniaRoomPanel } from './nexus/components/evennia-room-panel.js';
// ═══════════════════════════════════════════
// NEXUS v1.1 — Portal System Update
@@ -708,7 +707,6 @@ async function init() {
createAshStorm();
SpatialMemory.init(scene);
SessionRooms.init(scene, camera, null);
EvenniaRoomPanel.init();
updateLoad(90);
loadSession();
@@ -2076,7 +2074,6 @@ function connectHermes() {
addChatMessage('system', 'Hermes link established.');
updateWsHudStatus(true);
refreshWorkshopPanel();
EvenniaRoomPanel.setConnected(true);
};
// Initialize MemPalace
@@ -2105,7 +2102,6 @@ function connectHermes() {
hermesWs = null;
updateWsHudStatus(false);
refreshWorkshopPanel();
EvenniaRoomPanel.setConnected(false);
if (wsReconnectTimer) clearTimeout(wsReconnectTimer);
wsReconnectTimer = setTimeout(connectHermes, 5000);
};
@@ -2116,16 +2112,6 @@ function connectHermes() {
}
function handleHermesMessage(data) {
// ── Evennia room snapshot events (#728) ──
if (data.type === 'evennia.room_snapshot') {
EvenniaRoomPanel.onRoomSnapshot(data);
return;
}
if (data.type === 'evennia.actor_located') {
EvenniaRoomPanel.onActorLocated(data);
return;
}
if (data.type === 'chat') {
addChatMessage(data.agent || 'timmy', data.text);
} else if (data.type === 'tool_call') {

View File

@@ -60,6 +60,23 @@ If the heartbeat is older than --stale-threshold seconds, the
mind is considered dead even if the process is still running
(e.g., hung on a blocking call).
KIMI HEARTBEAT
==============
The Kimi triage pipeline writes a cron heartbeat file after each run:
/var/run/bezalel/heartbeats/kimi-heartbeat.last
(fallback: ~/.bezalel/heartbeats/kimi-heartbeat.last)
{
"job": "kimi-heartbeat",
"timestamp": 1711843200.0,
"interval_seconds": 900,
"pid": 12345,
"status": "ok"
}
If the heartbeat is stale (>2x declared interval), the watchdog reports
a Kimi Heartbeat failure alongside the other checks.
ZERO DEPENDENCIES
=================
Pure stdlib. No pip installs. Same machine as the nexus.
@@ -104,6 +121,10 @@ DEFAULT_HEARTBEAT_PATH = Path.home() / ".nexus" / "heartbeat.json"
DEFAULT_STALE_THRESHOLD = 300 # 5 minutes without a heartbeat = dead
DEFAULT_INTERVAL = 60 # seconds between checks in watch mode
# Kimi Heartbeat — cron job heartbeat file written by the triage pipeline
KIMI_HEARTBEAT_JOB = "kimi-heartbeat"
KIMI_HEARTBEAT_STALE_MULTIPLIER = 2.0 # stale at 2x declared interval
GITEA_URL = os.environ.get("GITEA_URL", "https://forge.alexanderwhitestone.com")
GITEA_TOKEN = os.environ.get("GITEA_TOKEN", "")
GITEA_REPO = os.environ.get("NEXUS_REPO", "Timmy_Foundation/the-nexus")
@@ -345,6 +366,93 @@ def check_syntax_health() -> CheckResult:
)
def _kimi_format_duration(seconds: float) -> str:
    """Render a duration as ``"<n>s"`` below one hour, else ``"<h>h <m>m"``."""
    if seconds < 3600:
        return f"{int(seconds)}s"
    return f"{int(seconds // 3600)}h {int((seconds % 3600) // 60)}m"


def check_kimi_heartbeat(
    job: str = KIMI_HEARTBEAT_JOB,
    stale_multiplier: float = KIMI_HEARTBEAT_STALE_MULTIPLIER,
) -> CheckResult:
    """Check if the Kimi Heartbeat cron job is alive.

    Reads the ``<job>.last`` file from the Bezalel heartbeat directory.
    The directory is resolved in this order:

    1. ``$BEZALEL_HEARTBEAT_DIR`` if set (used even if it does not exist),
    2. ``/var/run/bezalel/heartbeats`` if it exists,
    3. ``~/.bezalel/heartbeats`` if it exists.

    A job is stale when::

        time.time() - timestamp > stale_multiplier * interval_seconds

    When the file declares no positive ``interval_seconds``, a 30 minute
    interval is assumed.

    Args:
        job: Heartbeat job name; the file read is ``<job>.last``.
        stale_multiplier: How many declared intervals may elapse before the
            job is considered stale.

    Returns:
        A ``CheckResult`` named ``"Kimi Heartbeat"``. It is unhealthy when
        the directory or file is missing, when the file cannot be read or
        does not contain a JSON object with numeric ``timestamp`` /
        ``interval_seconds`` fields, or when the heartbeat is stale. This
        function reports such problems instead of raising, so one bad
        heartbeat file cannot take down the whole health report.
    """
    import math  # function-scope: only needed for the finite-timestamp guard

    check_name = "Kimi Heartbeat"

    # Resolve heartbeat directory — same logic as cron_heartbeat._resolve
    # (per the original author's note; that module is not visible here).
    primary = Path("/var/run/bezalel/heartbeats")
    fallback = Path.home() / ".bezalel" / "heartbeats"
    env_dir = os.environ.get("BEZALEL_HEARTBEAT_DIR")
    if env_dir:
        hb_dir = Path(env_dir)
    elif primary.exists():
        hb_dir = primary
    elif fallback.exists():
        hb_dir = fallback
    else:
        return CheckResult(
            name=check_name,
            healthy=False,
            message="Heartbeat directory not found — no triage pipeline deployed yet",
            details={"searched": [str(primary), str(fallback)]},
        )

    hb_file = hb_dir / f"{job}.last"
    if not hb_file.exists():
        return CheckResult(
            name=check_name,
            healthy=False,
            message=f"No heartbeat file at {hb_file} — Kimi triage pipeline has never reported",
            details={"path": str(hb_file)},
        )

    def corrupt(error: object) -> CheckResult:
        # Single shape for every "file is unusable" outcome.
        return CheckResult(
            name=check_name,
            healthy=False,
            message=f"Heartbeat file corrupt: {error}",
            details={"path": str(hb_file), "error": str(error)},
        )

    try:
        # ValueError covers both json.JSONDecodeError and UnicodeDecodeError.
        data = json.loads(hb_file.read_text(encoding="utf-8"))
    except (ValueError, OSError) as e:
        return corrupt(e)

    # Valid JSON is not necessarily an object; ``[]`` or ``"ok"`` would make
    # the ``.get`` calls below raise AttributeError.
    if not isinstance(data, dict):
        return corrupt(f"expected a JSON object, got {type(data).__name__}")

    try:
        timestamp = float(data.get("timestamp", 0))
        interval = int(data.get("interval_seconds", 0))
        # Python's json module accepts NaN/Infinity. A NaN timestamp makes
        # every comparison False, which would report a garbage file as alive.
        if not math.isfinite(timestamp):
            raise ValueError(f"non-finite timestamp {timestamp!r}")
    except (TypeError, ValueError, OverflowError) as e:
        return corrupt(e)

    raw_status = data.get("status", "unknown")
    age = time.time() - timestamp

    if interval <= 0:
        # No declared interval — use raw timestamp age (30 min default)
        interval = 1800

    threshold = stale_multiplier * interval
    age_str = _kimi_format_duration(age)
    interval_str = _kimi_format_duration(interval)

    if age > threshold:
        return CheckResult(
            name=check_name,
            healthy=False,
            message=(
                f"Silent for {age_str} "
                f"(threshold: {stale_multiplier}x {interval_str} = {int(threshold)}s). "
                f"Status: {raw_status}"
            ),
            details=data,
        )

    return CheckResult(
        name=check_name,
        healthy=True,
        message=f"Alive — last beat {age_str} ago (interval {interval_str}, status={raw_status})",
        details=data,
    )
# ── Gitea alerting ───────────────────────────────────────────────────
def _gitea_request(method: str, path: str, data: Optional[dict] = None) -> Any:
@@ -446,6 +554,7 @@ def run_health_checks(
check_mind_process(),
check_heartbeat(heartbeat_path, stale_threshold),
check_syntax_health(),
check_kimi_heartbeat(),
]
return HealthReport(timestamp=time.time(), checks=checks)
@@ -545,6 +654,14 @@ def main():
"--json", action="store_true", dest="output_json",
help="Output results as JSON (for integration with other tools)",
)
parser.add_argument(
"--kimi-job", default=KIMI_HEARTBEAT_JOB,
help=f"Kimi heartbeat job name (default: {KIMI_HEARTBEAT_JOB})",
)
parser.add_argument(
"--kimi-stale-multiplier", type=float, default=KIMI_HEARTBEAT_STALE_MULTIPLIER,
help=f"Kimi heartbeat staleness multiplier (default: {KIMI_HEARTBEAT_STALE_MULTIPLIER})",
)
args = parser.parse_args()

View File

@@ -125,19 +125,6 @@
<div class="agent-log-header">AGENT THOUGHT STREAM</div>
<div id="agent-log-content" class="agent-log-content"></div>
</div>
<!-- Evennia Room Snapshot Operator Panel (#728) -->
<div id="evennia-room-panel" class="evennia-room-panel" aria-live="polite">
<div class="erp-header">
<span class="erp-icon"></span>
<span class="erp-title">EVENNIA ROOM</span>
<span class="erp-status-dot erp-offline"></span>
</div>
<div class="erp-body erp-empty-state">
<div class="erp-empty-icon"></div>
<div class="erp-empty-label">DISCONNECTED</div>
<div class="erp-empty-hint">No link to Evennia world.</div>
</div>
</div>
</div>
<!-- Bottom: Chat Interface -->

View File

@@ -1,229 +0,0 @@
// ═══════════════════════════════════════════════════════
// EVENNIA ROOM SNAPSHOT OPERATOR PANEL (Issue #728)
// ═══════════════════════════════════════════════════════
//
// Renders the current Evennia room state in the Nexus HUD.
// Consumes evennia.room_snapshot and evennia.actor_located
// events from the Hermes WebSocket bridge.
//
// States:
// offline — no WS connection
// awaiting — connected but no room data yet
// in-room — room snapshot loaded, render full panel
//
// Usage from app.js:
// EvenniaRoomPanel.init();
// EvenniaRoomPanel.onRoomSnapshot(data);
// EvenniaRoomPanel.onActorLocated(data);
// EvenniaRoomPanel.setConnected(bool);
// ═══════════════════════════════════════════════════════
/**
 * Evennia room snapshot panel for the Nexus HUD.
 *
 * Renders into the element with id `evennia-room-panel` in one of three
 * states: offline (no connection), awaiting (connected, no snapshot yet),
 * or in-room (snapshot loaded). All payload text is HTML-escaped before it
 * is interpolated into markup.
 *
 * Public API: init(), onRoomSnapshot(data), onActorLocated(data),
 * setConnected(bool).
 */
export const EvenniaRoomPanel = (() => {
  // ─── STATE ────────────────────────────────────────────
  let _connected = false;
  let _roomData = null;     // latest evennia.room_snapshot payload
  let _actorRoomId = null;  // from evennia.actor_located
  let _lastUpdate = null;   // timestamp of last snapshot
  let _panelEl = null;      // DOM root

  // ─── DOM REFS ─────────────────────────────────────────
  function _el(id) { return document.getElementById(id); }

  // ─── INIT ─────────────────────────────────────────────
  /** Locate the panel root and paint the initial state; warns and does nothing if the element is absent. */
  function init() {
    _panelEl = _el('evennia-room-panel');
    if (!_panelEl) {
      console.warn('[EvenniaRoomPanel] Panel element not found in DOM.');
      return;
    }
    _render();
    console.log('[EvenniaRoomPanel] Initialized.');
  }

  // ─── EVENT HANDLERS ───────────────────────────────────
  /** Store a new room snapshot payload and re-render. */
  function onRoomSnapshot(data) {
    _roomData = data;
    _lastUpdate = data.timestamp || new Date().toISOString();
    _actorRoomId = data.room_id || data.room_key || null;
    _render();
  }

  /** Record the actor's reported room and re-render when it differs from the held snapshot. */
  function onActorLocated(data) {
    _actorRoomId = data.room_id || data.room_key || null;
    // If we get a location but no snapshot yet, show awaiting.
    // NOTE(review): when a snapshot for a *different* room is still held,
    // this re-renders that old snapshot rather than switching to the
    // awaiting state — confirm whether that is intended.
    if (!_roomData || (_roomData.room_id !== _actorRoomId && _roomData.room_key !== _actorRoomId)) {
      _render();
    }
  }

  /** Update the connection flag; on disconnect all room state is dropped. */
  function setConnected(connected) {
    _connected = connected;
    if (!connected) {
      // Clear room data on disconnect — stale data is lying
      _roomData = null;
      _actorRoomId = null;
      _lastUpdate = null;
    }
    _render();
  }

  // ─── RENDER ───────────────────────────────────────────
  /** Pick the renderer for the current state; no-op until init() found the panel. */
  function _render() {
    if (!_panelEl) return;
    if (!_connected) {
      _renderOffline();
    } else if (!_roomData) {
      _renderAwaiting();
    } else {
      _renderRoom();
    }
  }

  function _renderOffline() {
    _panelEl.innerHTML = `
      <div class="erp-header">
        <span class="erp-icon">◈</span>
        <span class="erp-title">EVENNIA ROOM</span>
        <span class="erp-status-dot erp-offline"></span>
      </div>
      <div class="erp-body erp-empty-state">
        <div class="erp-empty-icon">⊘</div>
        <div class="erp-empty-label">DISCONNECTED</div>
        <div class="erp-empty-hint">No link to Evennia world.</div>
      </div>
    `;
    _panelEl.classList.add('erp-state-offline');
    _panelEl.classList.remove('erp-state-awaiting', 'erp-state-inroom');
  }

  function _renderAwaiting() {
    _panelEl.innerHTML = `
      <div class="erp-header">
        <span class="erp-icon">◈</span>
        <span class="erp-title">EVENNIA ROOM</span>
        <span class="erp-status-dot erp-online"></span>
      </div>
      <div class="erp-body erp-empty-state">
        <div class="erp-empty-icon erp-pulse">◎</div>
        <div class="erp-empty-label">AWAITING SNAPSHOT</div>
        <div class="erp-empty-hint">Connected. Waiting for room data&hellip;</div>
      </div>
    `;
    _panelEl.classList.add('erp-state-awaiting');
    _panelEl.classList.remove('erp-state-offline', 'erp-state-inroom');
  }

  function _renderRoom() {
    const room = _roomData;
    const title = _esc(room.title || room.room_name || room.room_key || 'Unknown Room');
    const desc = _esc(room.desc || 'No description available.');
    const exits = Array.isArray(room.exits) ? room.exits : [];
    const objects = Array.isArray(room.objects) ? room.objects : [];
    const occupants = Array.isArray(room.occupants) ? room.occupants : [];
    const roomId = _esc(room.room_id || room.room_key || '—');
    const timeStr = _formatTime(_lastUpdate);

    // Build exits list
    let exitsHtml = '';
    if (exits.length > 0) {
      exitsHtml = exits.map(e => {
        const name = _esc(e.key || e.name || '?');
        const dest = _esc(e.destination_name || e.destination_id || e.destination_key || '');
        return `<div class="erp-exit-row">
          <span class="erp-exit-arrow">→</span>
          <span class="erp-exit-name">${name}</span>
          ${dest ? `<span class="erp-exit-dest">${dest}</span>` : ''}
        </div>`;
      }).join('');
    } else {
      exitsHtml = '<div class="erp-none">No visible exits.</div>';
    }

    // Build objects list
    let objectsHtml = '';
    if (objects.length > 0) {
      objectsHtml = objects.map(o => {
        const name = _esc(o.key || o.id || '?');
        // Named distinctly so it no longer shadows the room-level `desc`.
        const shortDesc = _esc(o.short_desc || '');
        return `<div class="erp-object-row">
          <span class="erp-object-icon">▪</span>
          <span class="erp-object-name">${name}</span>
          ${shortDesc ? `<span class="erp-object-desc">${shortDesc}</span>` : ''}
        </div>`;
      }).join('');
    } else {
      objectsHtml = '<div class="erp-none">No visible objects.</div>';
    }

    // Build occupants list (entries may be plain strings or objects)
    let occupantsHtml = '';
    if (occupants.length > 0) {
      occupantsHtml = occupants.map(o => {
        const name = _esc(typeof o === 'string' ? o : (o.name || o.key || '?'));
        return `<span class="erp-occupant">${name}</span>`;
      }).join('');
    }

    _panelEl.innerHTML = `
      <div class="erp-header">
        <span class="erp-icon">◈</span>
        <span class="erp-title">${title}</span>
        <span class="erp-status-dot erp-online"></span>
      </div>
      <div class="erp-body">
        <div class="erp-room-id">${roomId}</div>
        <div class="erp-desc">${desc}</div>
        <div class="erp-section">
          <div class="erp-section-label">EXITS</div>
          <div class="erp-exits">${exitsHtml}</div>
        </div>
        <div class="erp-section">
          <div class="erp-section-label">OBJECTS</div>
          <div class="erp-objects">${objectsHtml}</div>
        </div>
        ${occupantsHtml ? `
        <div class="erp-section">
          <div class="erp-section-label">OCCUPANTS</div>
          <div class="erp-occupants">${occupantsHtml}</div>
        </div>` : ''}
        <div class="erp-footer">
          <span class="erp-time">${timeStr}</span>
        </div>
      </div>
    `;
    _panelEl.classList.add('erp-state-inroom');
    _panelEl.classList.remove('erp-state-offline', 'erp-state-awaiting');
  }

  // ─── UTILS ────────────────────────────────────────────
  /** HTML-escape a value by round-tripping it through a detached element's text content. */
  function _esc(str) {
    const d = document.createElement('div');
    d.textContent = str;
    return d.innerHTML;
  }

  /** Format a timestamp as 24-hour HH:MM:SS (en-US); returns '—' for empty or unparseable input. */
  function _formatTime(isoStr) {
    if (!isoStr) return '—';
    try {
      const d = new Date(isoStr);
      // An unparseable input yields an Invalid Date, which does NOT throw in
      // toLocaleTimeString — it returns the literal "Invalid Date". Detect it
      // explicitly so the footer shows the placeholder instead.
      if (Number.isNaN(d.getTime())) return '—';
      return d.toLocaleTimeString('en-US', { hour: '2-digit', minute: '2-digit', second: '2-digit', hour12: false });
    } catch {
      return '—';
    }
  }

  // ─── PUBLIC API ───────────────────────────────────────
  return { init, onRoomSnapshot, onActorLocated, setConnected };
})();

226
style.css
View File

@@ -1580,229 +1580,3 @@ canvas#nexus-canvas {
text-transform: uppercase;
}
/* ═══════════════════════════════════════════════════════
EVENNIA ROOM SNAPSHOT OPERATOR PANEL (#728)
═══════════════════════════════════════════════════════ */
.evennia-room-panel {
width: 280px;
background: rgba(5, 5, 16, 0.85);
backdrop-filter: blur(12px);
border: 1px solid rgba(74, 240, 192, 0.18);
border-left: 3px solid var(--color-primary, #4af0c0);
border-radius: 6px;
font-family: var(--font-body, 'JetBrains Mono', monospace);
font-size: 11px;
color: var(--color-text, #e0f0ff);
pointer-events: auto;
overflow: hidden;
transition: border-color 0.3s ease;
}
.evennia-room-panel.erp-state-offline {
border-left-color: var(--color-danger, #ff4466);
}
.evennia-room-panel.erp-state-awaiting {
border-left-color: var(--color-warning, #ffaa22);
}
.evennia-room-panel.erp-state-inroom {
border-left-color: var(--color-primary, #4af0c0);
}
.erp-header {
display: flex;
align-items: center;
gap: 6px;
padding: 6px 10px;
border-bottom: 1px solid rgba(74, 240, 192, 0.1);
background: rgba(74, 240, 192, 0.04);
}
.erp-icon {
font-size: 12px;
color: var(--color-primary, #4af0c0);
}
.erp-title {
font-size: 10px;
font-weight: 700;
letter-spacing: 1.2px;
color: var(--color-primary, #4af0c0);
flex: 1;
}
.erp-status-dot {
width: 7px;
height: 7px;
border-radius: 50%;
flex-shrink: 0;
}
.erp-status-dot.erp-offline {
background: var(--color-danger, #ff4466);
box-shadow: 0 0 6px var(--color-danger, #ff4466);
}
.erp-status-dot.erp-online {
background: var(--color-primary, #4af0c0);
box-shadow: 0 0 6px var(--color-primary, #4af0c0);
}
.erp-body {
padding: 8px 10px;
max-height: 320px;
overflow-y: auto;
}
/* Empty / offline states */
.erp-empty-state {
text-align: center;
padding: 18px 10px;
}
.erp-empty-icon {
font-size: 22px;
color: rgba(74, 240, 192, 0.25);
margin-bottom: 6px;
}
.erp-empty-icon.erp-pulse {
animation: erpPulse 2s ease-in-out infinite;
}
@keyframes erpPulse {
0%, 100% { opacity: 0.35; }
50% { opacity: 0.9; }
}
.erp-empty-label {
font-size: 10px;
font-weight: 700;
letter-spacing: 1.5px;
color: var(--color-text-muted, #8a9ab8);
margin-bottom: 4px;
}
.erp-empty-hint {
font-size: 10px;
color: rgba(138, 154, 184, 0.55);
}
/* Room content */
.erp-room-id {
font-size: 9px;
color: rgba(138, 154, 184, 0.4);
letter-spacing: 0.8px;
text-transform: uppercase;
margin-bottom: 6px;
}
.erp-desc {
font-size: 11px;
color: rgba(224, 240, 255, 0.8);
line-height: 1.45;
margin-bottom: 10px;
border-left: 2px solid rgba(74, 240, 192, 0.15);
padding-left: 8px;
}
.erp-section {
margin-bottom: 8px;
}
.erp-section-label {
font-size: 9px;
font-weight: 700;
letter-spacing: 1.5px;
color: var(--color-primary, #4af0c0);
margin-bottom: 4px;
opacity: 0.7;
}
.erp-none {
font-size: 10px;
color: rgba(138, 154, 184, 0.35);
font-style: italic;
padding: 2px 0;
}
/* Exits */
.erp-exit-row {
display: flex;
align-items: center;
gap: 6px;
padding: 2px 0;
font-size: 11px;
}
.erp-exit-arrow {
color: var(--color-secondary, #7b5cff);
font-weight: 700;
}
.erp-exit-name {
color: var(--color-secondary, #7b5cff);
font-weight: 600;
}
.erp-exit-dest {
color: rgba(138, 154, 184, 0.45);
font-size: 10px;
}
/* Objects */
.erp-object-row {
display: flex;
align-items: baseline;
gap: 5px;
padding: 2px 0;
font-size: 11px;
}
.erp-object-icon {
color: var(--color-gold, #ffd700);
font-size: 8px;
}
.erp-object-name {
color: rgba(224, 240, 255, 0.75);
font-weight: 500;
}
.erp-object-desc {
color: rgba(138, 154, 184, 0.45);
font-size: 10px;
}
/* Occupants */
.erp-occupants {
display: flex;
flex-wrap: wrap;
gap: 4px;
}
.erp-occupant {
font-size: 10px;
padding: 2px 6px;
background: rgba(74, 240, 192, 0.08);
border: 1px solid rgba(74, 240, 192, 0.15);
border-radius: 3px;
color: var(--color-primary, #4af0c0);
}
/* Footer */
.erp-footer {
margin-top: 6px;
padding-top: 4px;
border-top: 1px solid rgba(74, 240, 192, 0.06);
text-align: right;
}
.erp-time {
font-size: 9px;
color: rgba(138, 154, 184, 0.3);
letter-spacing: 0.5px;
}