Update 2026-04-22 11:47:53

2026-04-22 11:47:54 +04:00 · 2026-04-22 11:47:54 +04:00 · 5b8e94f42e
commit 5b8e94f42e
parent 3122a52966
2 changed files with 91 additions and 25 deletions
--- a/Brain/marcus_brain.py
+++ b/Brain/marcus_brain.py
@ -146,7 +146,12 @@ def init_brain():
        print("  [Voice] disabled by config")
    _log("Brain initialized", "info", "brain")
-    _warmup_llava()
+
    # Warmup runs in a daemon thread so the dashboard + Command: prompt
    # appear immediately. The first real user command will either hit a
    # warm model (fast) or pay the cold-load itself (same as before).
    import threading as _t
    _t.Thread(target=_warmup_llava, daemon=True, name="llava-warmup").start()
 # Global voice references
@ -400,20 +405,51 @@ def _handle_llava(cmd):
 # HELPERS
 # ══════════════════════════════════════════════════════════════════════════════
 def _strip_ansi(s: str) -> str:
    """Strip ANSI colour escapes for correct visual width calculations."""
    import re as _re
    return _re.sub(r"\x1b\[[0-9;]*m", "", s)
 def _warmup_llava():
    """
    Runs in a daemon thread — primes the Ollama model into VRAM so the first
    user command doesn't pay the ~15-20 s cold-load. Tolerates client-timeout
    on the first attempt (common on the 16 GB Jetson when the compute graph
    needs a second pass to fit) by doing one silent retry.
    """
    import ollama
-    print("  Warming up LLaVA... (loading into GPU)")
+    # Quiet heartbeat in the terminal so the operator knows something is happening
-    try:
+    # without flooding stdout once the banner prints.
-        img = get_frame()
+    print("  [Warmup] Loading Qwen2.5-VL into GPU...")
-        ollama.chat(
+    base_options = {
-            model=OLLAMA_MODEL,
+        "temperature": 0.0,
-            messages=[{"role": "user", "content": "hi",
+        "num_predict": _cfg["warmup_num_predict"],
-                       "images": [img] if img else []}],
+        # Honor the same compute-graph caps everything else uses, otherwise
-            options={"temperature": 0.0, "num_predict": _cfg["warmup_num_predict"]}
+        # Ollama reverts to batch=512/ctx=4096 for this call and OOMs.
-        )
+        "num_batch":   _cfg.get("num_batch", 128),
-        print("  LLaVA warm - first command will be fast\n")
+        "num_ctx":     _cfg.get("num_ctx",   2048),
-    except Exception as e:
+    }
-        print(f"  Warmup failed ({e}) - first command may be slow\n")
+    for attempt in (1, 2):
        try:
            img = get_frame()
            ollama.chat(
                model=OLLAMA_MODEL,
                messages=[{"role": "user", "content": "hi",
                           "images": [img] if img else []}],
                options=base_options,
            )
            print("  [Warmup] Ready — first command will be fast")
            return
        except Exception as e:
            if attempt == 1:
                # Cold-load frequently times out on attempt #1 while Ollama
                # is still allocating the compute graph. The model stays
                # loaded though, so attempt #2 almost always succeeds.
                print(f"  [Warmup] first attempt timed out, retrying...")
                continue
            print(f"  [Warmup] failed after retry ({e}) — first real command "
                  f"will pay the cold-load (~15-20 s)")
 def get_brain_status() -> dict:
@ -480,18 +516,39 @@ def run_terminal():
    """Run brain with terminal input loop."""
    init_brain()
    # ─── DASHBOARD ───────────────────────────────────────────────────────
    # Separate the boot log from the interactive dashboard with a clear
    # visual break. Print at the end of init so it's always the last thing
    # on screen before the first `Command:` prompt — even if the operator
    # scrolled through a wall of subsystem init messages.
    status = get_brain_status()
-    print()
+
-    print("=" * 54)
+    def _fmt(v):
-    print("           SANAD AI BRAIN — READY")
+        if v is True:  return "\033[92mON \033[0m"    # green
-    print("=" * 54)
+        if v is False: return "\033[91mOFF\033[0m"    # red
-    for k, v in status.items():
+        return str(v)
-        print(f"  {k:<12}: {v}")
+
-    print("-" * 54)
+    W = 58
-    print("  Type a command, or say \"Sanad, <command>\".")
+    print("\n\n" + "╔" + "═" * (W-2) + "╗")
-    print("  Shortcuts: help | example | yolo | patrol | auto on/off | q")
+    print("║" + "   SANAD — AI BRAIN READY".ljust(W-2) + "║")
-    print("=" * 54)
+    print("╠" + "═" * (W-2) + "╣")
-    print()
+    left  = [("model",    status["model"]),
             ("voice",    _fmt(status["voice"])),
             ("camera",   status["camera"])]
    right = [("yolo",     _fmt(status["yolo"])),
             ("lidar",    _fmt(status["lidar"])),
             ("memory",   _fmt(status["memory"])),
             ("odometry", _fmt(status["odometry"]))]
    for i in range(max(len(left), len(right))):
        l = f"  {left[i][0]:<8}: {left[i][1]}"        if i < len(left)  else ""
        r = f"  {right[i][0]:<8}: {right[i][1]}"      if i < len(right) else ""
        # account for ANSI escapes when padding the left column
        pad = 28 + (len(l) - len(_strip_ansi(l)))
        print("║" + l.ljust(pad) + r.ljust(W - 2 - pad) + "║")
    print("╠" + "═" * (W-2) + "╣")
    print("║" + "  Type a command, or say \"Sanad, <command>\".".ljust(W-2) + "║")
    print("║" + "  help · example · yolo · patrol · auto on/off · q".ljust(W-2) + "║")
    print("╚" + "═" * (W-2) + "╝\n")
    try:
        while True:
--- a/Lidar/SLAM_worker.py
+++ b/Lidar/SLAM_worker.py
@ -595,7 +595,16 @@ def slam_worker(
    def init_slam_stack():
        nonlocal slam, filt, stable
-        cfg = load_config(config_file=None, max_range=float(eng_cfg.max_range))
+        # kiss_icp >= 1.2.x requires a `deskew` positional arg; pre-1.2 doesn't.
        # Try the new signature first, fall back to the old one.
        try:
            cfg = load_config(
                config_file=None,
                deskew=bool(getattr(eng_cfg, "deskew", True)),
                max_range=float(eng_cfg.max_range),
            )
        except TypeError:
            cfg = load_config(config_file=None, max_range=float(eng_cfg.max_range))
        cfg.mapping.voxel_size = float(eng_cfg.slam_voxel_size)
        slam = KissICP(cfg)