From f81e586500aa4e31d35513fae2e65fb4ce522d35 Mon Sep 17 00:00:00 2001 From: JR Morgan Date: Wed, 11 Mar 2026 15:03:18 -0700 Subject: [PATCH 01/25] Add rebrand for welcome UI, include launch.sh script --- brev/launch.sh | 51 ++++++++++++++++++++++++++- brev/welcome-ui/server.js | 73 ++++++++++++++++++++++++++++++++++----- 2 files changed, 115 insertions(+), 9 deletions(-) diff --git a/brev/launch.sh b/brev/launch.sh index dfee5f8..881a1af 100755 --- a/brev/launch.sh +++ b/brev/launch.sh @@ -32,6 +32,7 @@ CLI_RETRY_COUNT="${CLI_RETRY_COUNT:-5}" CLI_RETRY_DELAY_SECS="${CLI_RETRY_DELAY_SECS:-3}" GHCR_LOGIN="${GHCR_LOGIN:-auto}" GHCR_USER="${GHCR_USER:-}" +NEMOCLAW_IMAGE="${NEMOCLAW_IMAGE:-ghcr.io/nvidia/openshell-community/sandboxes/nemoclaw:latest}" mkdir -p "$(dirname "$LAUNCH_LOG")" touch "$LAUNCH_LOG" @@ -252,6 +253,47 @@ docker_login_ghcr_if_needed() { fi } +should_build_nemoclaw_image() { + [[ -n "$COMMUNITY_REF" && "$COMMUNITY_REF" != "main" ]] +} + +build_nemoclaw_image_if_needed() { + local docker_cmd=() + local image_context="$REPO_ROOT/sandboxes/nemoclaw" + local dockerfile_path="$image_context/Dockerfile" + + if ! should_build_nemoclaw_image; then + log "Skipping local NeMoClaw image build (COMMUNITY_REF=${COMMUNITY_REF:-})." + return + fi + + if [[ ! -f "$dockerfile_path" ]]; then + log "NeMoClaw Dockerfile not found: $dockerfile_path" + exit 1 + fi + + if command -v docker >/dev/null 2>&1; then + docker_cmd=(docker) + elif command -v sudo >/dev/null 2>&1; then + docker_cmd=(sudo docker) + else + log "Docker is required to build the NeMoClaw sandbox image." + exit 1 + fi + + log "Building local NeMoClaw image for non-main ref '$COMMUNITY_REF': $NEMOCLAW_IMAGE" + if ! "${docker_cmd[@]}" build \ + --pull \ + --tag "$NEMOCLAW_IMAGE" \ + --file "$dockerfile_path" \ + "$image_context"; then + log "Local NeMoClaw image build failed." 
+ exit 1 + fi + + log "Local NeMoClaw image ready: $NEMOCLAW_IMAGE" +} + checkout_repo_ref() { if [[ -z "$COMMUNITY_REF" ]]; then return @@ -518,7 +560,12 @@ start_welcome_ui() { log "Starting welcome UI in background..." log "Welcome UI log: $WELCOME_UI_LOG" - nohup env PORT="$PORT" REPO_ROOT="$REPO_ROOT" CLI_BIN="$CLI_BIN" node server.js >> "$WELCOME_UI_LOG" 2>&1 & + nohup env \ + PORT="$PORT" \ + REPO_ROOT="$REPO_ROOT" \ + CLI_BIN="$CLI_BIN" \ + NEMOCLAW_IMAGE="$NEMOCLAW_IMAGE" \ + node server.js >> "$WELCOME_UI_LOG" 2>&1 & WELCOME_UI_PID=$! export WELCOME_UI_PID log "Welcome UI PID: $WELCOME_UI_PID" @@ -544,6 +591,8 @@ main() { ensure_cli_compat_aliases step "Authenticating registries" docker_login_ghcr_if_needed + step "Preparing NeMoClaw image" + build_nemoclaw_image_if_needed step "Ensuring Node.js" ensure_node diff --git a/brev/welcome-ui/server.js b/brev/welcome-ui/server.js index abc63b8..240947b 100644 --- a/brev/welcome-ui/server.js +++ b/brev/welcome-ui/server.js @@ -38,6 +38,7 @@ const SANDBOX_START_CMD = process.env.SANDBOX_START_CMD || "nemoclaw-start"; const SANDBOX_BASE_IMAGE = process.env.SANDBOX_BASE_IMAGE || "ghcr.io/nvidia/openshell-community/sandboxes/openclaw:latest"; +const NEMOCLAW_IMAGE = (process.env.NEMOCLAW_IMAGE || "").trim(); const POLICY_FILE = path.join(SANDBOX_DIR, "policy.yaml"); const LOG_FILE = "/tmp/nemoclaw-sandbox-create.log"; @@ -264,6 +265,13 @@ const injectKeyState = { keyHash: null, }; +// Raw API key stored in memory so it can be passed to the sandbox at +// creation time and forwarded to LiteLLM for inference. Not persisted +// to disk. 
+let _nvidiaApiKey = process.env.NVIDIA_INFERENCE_API_KEY + || process.env.NVIDIA_INTEGRATE_API_KEY + || ""; + // ── Brev ID detection & URL building ─────────────────────────────────────── function extractBrevId(host) { @@ -286,7 +294,7 @@ function buildOpenclawUrl(token) { } else { url = `http://127.0.0.1:${PORT}/`; } - if (token) url += `?token=${token}`; + if (token) url += `#token=${token}`; return url; } @@ -627,18 +635,26 @@ function runSandboxCreate() { const cmd = [ CLI_BIN, "sandbox", "create", "--name", SANDBOX_NAME, - "--from", SANDBOX_DIR, + "--from", NEMOCLAW_IMAGE || SANDBOX_DIR, "--forward", "18789", ]; if (policyPath) cmd.push("--policy", policyPath); - cmd.push( - "--", - "env", - `CHAT_UI_URL=${chatUiUrl}`, - SANDBOX_START_CMD - ); + const envArgs = [`CHAT_UI_URL=${chatUiUrl}`]; + const nvapiKey = _nvidiaApiKey + || process.env.NVIDIA_INFERENCE_API_KEY + || process.env.NVIDIA_INTEGRATE_API_KEY + || ""; + if (nvapiKey) { + envArgs.push(`NVIDIA_INFERENCE_API_KEY=${nvapiKey}`); + envArgs.push(`NVIDIA_INTEGRATE_API_KEY=${nvapiKey}`); + } + + cmd.push("--", "env", ...envArgs, SANDBOX_START_CMD); const cmdDisplay = cmd.slice(0, 8).join(" ") + " -- ..."; + if (NEMOCLAW_IMAGE) { + logWelcome(`Using NeMoClaw image override: ${NEMOCLAW_IMAGE}`); + } logWelcome(`Running: ${cmdDisplay}`); const logFd = fs.openSync(LOG_FILE, "w"); @@ -788,6 +804,38 @@ function runInjectKey(key, keyHash) { }); } +/** + * Forward the API key to the sandbox's LiteLLM instance via the + * policy-proxy's /api/litellm-key endpoint. This triggers a config + * regeneration and LiteLLM restart with the new key. 
+ */ +function forwardKeyToSandbox(key) { + const body = JSON.stringify({ apiKey: key }); + const opts = { + hostname: "127.0.0.1", + port: SANDBOX_PORT, + path: "/api/litellm-key", + method: "POST", + headers: { + "Content-Type": "application/json", + "Content-Length": Buffer.byteLength(body), + }, + timeout: 10000, + }; + const req = http.request(opts, (res) => { + res.resume(); + if (res.statusCode === 200) { + log("inject-key", "Forwarded API key to sandbox LiteLLM"); + } else { + log("inject-key", `Sandbox LiteLLM key forward returned ${res.statusCode}`); + } + }); + req.on("error", (err) => { + log("inject-key", `Failed to forward key to sandbox: ${err.message}`); + }); + req.end(body); +} + // ── Provider CRUD ────────────────────────────────────────────────────────── function parseProviderDetail(stdout) { @@ -1271,8 +1319,16 @@ async function handleInjectKey(req, res) { injectKeyState.status = "injecting"; injectKeyState.error = null; injectKeyState.keyHash = keyH; + _nvidiaApiKey = key; runInjectKey(key, keyH); + + // If the sandbox is already running, forward the key to LiteLLM inside + // the sandbox so it can authenticate with upstream NVIDIA APIs. 
+ if (sandboxState.status === "running") { + forwardKeyToSandbox(key); + } + return jsonResponse(res, 202, { ok: true, started: true }); } @@ -1561,6 +1617,7 @@ function _resetForTesting() { detectedBrevId = ""; _brevEnvId = ""; renderedIndex = null; + _nvidiaApiKey = ""; } function _setMocksForTesting(mocks) { From 53258bc6076094830eed0099414297f53dc5ff64 Mon Sep 17 00:00:00 2001 From: JR Morgan Date: Wed, 11 Mar 2026 16:40:54 -0700 Subject: [PATCH 02/25] Remove BASH_SOURCE dependency --- brev/launch.sh | 4 ++++ 1 file changed, 4 insertions(+) diff --git a/brev/launch.sh b/brev/launch.sh index 881a1af..1fdd5d5 100755 --- a/brev/launch.sh +++ b/brev/launch.sh @@ -38,6 +38,10 @@ mkdir -p "$(dirname "$LAUNCH_LOG")" touch "$LAUNCH_LOG" exec > >(tee -a "$LAUNCH_LOG") 2>&1 +mkdir -p "$(dirname "$LAUNCH_LOG")" +touch "$LAUNCH_LOG" +exec > >(tee -a "$LAUNCH_LOG") 2>&1 + log() { printf '[launch.sh] %s\n' "$*" } From 9842d40d712120aa28ef290d65d48bb8ba30b0f3 Mon Sep 17 00:00:00 2001 From: JR Morgan Date: Wed, 11 Mar 2026 17:03:29 -0700 Subject: [PATCH 03/25] Address silent fail on launch.sh --- brev/launch.sh | 4 ---- 1 file changed, 4 deletions(-) diff --git a/brev/launch.sh b/brev/launch.sh index 1fdd5d5..881a1af 100755 --- a/brev/launch.sh +++ b/brev/launch.sh @@ -38,10 +38,6 @@ mkdir -p "$(dirname "$LAUNCH_LOG")" touch "$LAUNCH_LOG" exec > >(tee -a "$LAUNCH_LOG") 2>&1 -mkdir -p "$(dirname "$LAUNCH_LOG")" -touch "$LAUNCH_LOG" -exec > >(tee -a "$LAUNCH_LOG") 2>&1 - log() { printf '[launch.sh] %s\n' "$*" } From eb74ff4c9f5771f8835dce89ec4b4d2b6687df20 Mon Sep 17 00:00:00 2001 From: JR Morgan Date: Wed, 11 Mar 2026 17:22:00 -0700 Subject: [PATCH 04/25] Add favicon, handle ghcr.io login if params present, fix logo --- brev/welcome-ui/favicon.ico | Bin 32038 -> 32038 bytes brev/welcome-ui/index.html | 4 ++-- 2 files changed, 2 insertions(+), 2 deletions(-) diff --git a/brev/welcome-ui/favicon.ico b/brev/welcome-ui/favicon.ico index 
dce06225d9aa9a234d2faa96a7807ab14f790700..76d821c156c32261e5063776228679bc49c1915d 100644 GIT binary patch literal 32038 zcmdU&37A|(wSYSeWC%+-fC&&FlK??fWDyKJ5hj3&M%h6Y7Xm)^9U<&w@`40W2!fz2 z0)h_(1=$3HERzHbAc%q>vQCI7pu$8HMi|rY|NHcvdwZSk1jRQWKUKHtoKvT^Q`J2^ zom_56Zt2{J5joPaxr3L^iPF1P3- zx!n5bAc}=3C&^*9{?Du_xm?N^@&~|KFar*U@sP??TADRw2=(fH5l(1KEo!}HW z5Z((*m8pl_bt#_)ov<9(mbyp7mthKQ0aIZDq$WakPs%=CERW}*w>T>;?l(74x&EY(@I{Qhq7YqhP(#^M8>Z4;z7fJrUjqSsSBxc8-R@ zYM{)r&<5(R1N!Upmteo*b7H~yi#Fd+`Y~|MmAC)e8VSR}F}W6wg|u_L|9~>9gZkn+*bW?1?Vk%@1^bf7m^zOafpg(lY!7)@ z4NihRz`AWfZN%|hjb^_-> znfHQa+SImvv#msaU`Wc!W=&a%XV>1D@HKE8R)s3PzK&e3o0*vd53Q8Toh8TQa_5~y z{MaIwTMEXm8Ej0NBkpupPvx z#ce06SKg*$q}fgx*@C!r-E~J8yNEjZMrBkYswC!kAeM9_G!6p zw5^}lz>V+)aBuz`PJ_h1waDKB?zeIqwVoo@8QWY_VWUzm%7;>aKKvcdfl*+rz7?hx zRTBL;6XsB!uQXNlJZs7b#O01U^|-)D25N?Df=}zj{{Xz znUHn={0i2tQ$L)#888>R;m6?EK37WDBrR9Ny?Kn&K}$QK(Ri~w_lPs_Eoo= z>RD%ea1IR3)jy%XK}n|eUWs${K4f+Q?D^tuogpD(iy&BRxMc&;vB>_qKE<&& z=8uMQoyw=M@p0rHhBYdyDH{XM?LHo5DN_x*ms0NDUI~)9N>bO1WAS-tJP#2!9Ix}rWFzKXNZB{b%5@~x?W3d{ zL$sMVm^{y#awv8BP(7}RY}itNFEGAwqbdEwc{7hP*K|@EY20&NXUh##r0sg=-WNirEw$lR;FwkxSm{>lVSBL{mOzkqkn{~ zaV}|JJJ&$^ zJzbZfe==qIbPhO{KD!TU7^pBA`mQDQJ_Mdg=08v&8IN)IGH$-NSP(JZJJ?ZhIvCU3 z7uUnVHEmQD#_Pyg$R7`$q23QXyDKG~AMY5h&7F(&(f+mMkAyYgK{x{RV{)~D8YM9X ziSO!v1D1wlJ)}ypXD^`c@{Ek~t~uq6=a0j4uuG~~BbT)w>*_UhwDSmD3GRc4W971& zQvMk11h#3cnGLQTxfyzaS0xoc<#v`rW+U*v@DSVx_B&hV+Zr7o&&!C*G}SN zq;@|o)Bd*bUC>|S>jX&WIvK81NBuEyEZht3%`d?yu+F=N{_Eqei8}dgyN;b>=vX?= zXTyfzIHqy~%9%{IK3;Plh>m-G4jcueK|A?Un%ax8a?Bh%{d0{wrm0M(sfO9CPQ1rs z95lwb7f%7_JhAK8><^BWW9Ha7hDm+HrW#geZNysN5xYMG`*$XM8Qcqwkz=(QEP1+dgw) zPk!El7dq!H=qWOHZg=N`d0ia~=H>JAXLQV5ICD&X;mkGj3-hbx`#MGp(BCm6-`9Rt zzGq0+%&zWLN5RW5Z(Zaj!@&C#>+)`&gAMVkX*F>wXHIz@= zHwJ$Mynnt7e}}}+;pE%E`S?26uQ$Q@_yW8K{=NN3+Z#sP+rjtXHSnCf7Pg1wAoVNq zuB-K-3!a95fU)8bFm|T$4F_&9Dzmm@4I3kF0N2Eyz;k13C_m$~O_kdihwSn27`z3K z!f`Mb-r0Vn_Ey67XTjL!8gWfu03U|*+*CgMlj^5_rDewCL*YTNA5XzFaGsp6tfj@v z$9o5^RnJM+?(;AMJ_w$dsb7^Xq;+c}Hx-OYV!vm?B+$>1upi6@*VPN)eo?Q|YV*(0 
z{se5i3eSP(>v*W|bJlvut&4m&^g&OF1*Ct2KfuP2*z->19Nz)|1Y=p_*RI+2D)V92 zb?Myh4M{tdlGV>4I~twaVIdp=-W@t%9GnIHuzgWEYdg+*&);7{`Rn%Tmg<+pJ=FFc zH`}c*TUitL!v96505`*yklo)W@SOUe=%@W~eK|*4K~md%8g|}??n_`?tbPq!%UasL zarCdCkDg`5*dxI{>;k`mKf{Nr%!CbNoO|Iks1g~pAZ)m&-Ujb)gQ^r|Vm})H*MR>9 z@Z}Eb^3lW7|(~oieMj} z2G`S4(Ae*+H}QL9`+pszzmLtz)XK*iJ`WxD|3{&gRFs83dn4l>y#_p|lkxL>eG2Y^ z!NcyGqo`w*;LSI&xf55V~7K6xJ`zMFmsdf^;s{TvEg$D`{y z*c}?WQmhOeW3FTGnrPf^tdrZ2Gd>#Yj>_Qvcl{d225-AkB7E5#UE|fap!{K z^!h*HyL)mII0M|fSzI?;LmSk$)2Jr);#ugszqV^=C;ZtE8P7#yZ~ZejWS2+A_32&O z`SOmI#dZ5f@UE~7H1f1|U9|H_bhYc*Qd`c_kUg06ZP>T2Y{+@WehuCP=WB16RKXrR z-wod1c7|x9z6Z5y;`e#KMSnJ|P+O?zzhh*qeF?dmQLe57bt&v~7 z{=THXR(Va>_#C>f$HSq#-lvdpzLjxot7SsY{rXKXzJ98%T%sLzU29ju-(jDms--mE zn|7bw2-RnC%#ktHwd(lRHXnBbW7%Breo$M^((v8Xb?LY*f=lWvG^mMt_f6<8fOV=Q z@%r7p`y;3x|7gcJb1fL3jGykS{lWcyJB+P1+(b!yrfx3!Pe6L6$Cy~|{HEo# zOh&By9dfS4^7AcxUz>7$c7J<5><0GLu@U3Yq*|s2EerdOv*Yp!NcPxfkla^cmes}>qPqu-jz_D}hZ&b^4Q)OwKxeq%l!LndXT>yjsh9LTU zA+qkH4a?e$_x)a`{5)s}_w4Ji3ph>}fpf85nO-XoF%I9xhV5?!j+6J?8=(4JsI(n^ z9E_}SY#&G^;&YI$m-CC|@w(qRaJ`KNW0w6JmnyZGi}pW@4fm1j^Pp1xP}1g%#rd`n z`HLYN$Mn&=&Mhz$T%RX`eLV&41pCwYUf#%y@P8~eo`YY&ZSV%{3a(M-xse6ySAaXf zdGkC7`FQPc56@4)sA741j&~mU7eV=lq4oC!6Tc!|3mcxZ{{+{KYxECr0Zf3UA^MT{ zmhDm0?S_o~z8r>SIKPDJ*Zx^`7j1`|%q%0oH+}ANJRE<~l4ln#w4v z%pTy{bd9=JE`-e?bSw4Ct+n=4-nQ%I0JsnO;8{2WJ^=ck^d;KJKF8Xdj7&GE+XJpq z_o{0)bX)VTdFjM{q^r>0-f#!J0iI9i!KRSJ)9@$We?E-z2f?{}5?qt6&9u+Wd$MGb z<^5O@A9jQvgK_5-_zrl6>E9G^t?Bo#;aG4jCVg8nUzSum^}{n{JGcsrA+N#<@Fx5m z4usX=Kf~|Jey4s7#m9;8BQO>n45Q#3_q$N&<%3GOTzpu`v_yYfcc=N@JfCDD?e1JO z#57mv;(xh9dm%S@Drv`}+=--%I{H^ArMXi(dG72jrv05gL;88{@9b_{WIDAgzo>)1 zrJ6dlBhuj=h2nFrv%tF^eT7JSlXOw8qcAg9G~c&h zF>UJ~H@(oqMD?#Uy+G2vb#7iiH}2lNLql;}7enK?bTc%hJ)88mnfA3au%wHI#5fkZ zhQ!$V0WHe?kQS+La!!OU82Fr)1@FdBc74Se;9cZ<;QlGV6L2JqhIf1|z8hUGwwdiq z+z+>=f0u!0qW$)qdAXGLwbcD^1Z3|I@0$CI-Eeuom!m)1!}r0sX}_I!&oQBFd2uZ$$telfPeiR zWU(h4#k4Q0kpCPccNhEe8e9Xe1MjsVpR|`eM>>}JW8fk1uCKmlt@ob~!#jV6O#Emy 
zE%$pheDm%(7v2K>ehGZdWxQ*L@_tvgm()jUEc9M+FJ$c*Ka3-(J>~zMKjnUo!Iz`K z`C0_o`EqZk_tj>7EVut2Ygyg(1j#RIwfAu(|etEAR52rwOzdprtvR~7?_h5dd zcC-7aGH<-t4Q_$If#X~|o-{kot;)sk%Z)|$(b%L9@)(>9j!C)SgSC;$t9uZ*_bb_% zvLtS-KzjVQKQag7fMbIJ(ME;zN91*Yn2M@NuXTU7~`xlRk-E&*U#H zk^S&_O>Eo*&eQG}hby zDJ|Pg`|Z5Cr;S;z|E zx5Sobt@keT&1j}FVPhnEj@>M{3+{wF!1biB;~_Z*?6+(FMzFoOOQjZT=OS*NhrIgg z4y!HLLTUJZBDNe;U!Skkf_AcxS3~a_a2+Rovw!0A+u)t&d~p353w$471cZ%d8Vy(0sp> z_DtjbL;Y{<)GywnFy{=s0e2G#L9*t%z5TP-g!R zDXUARTFXVdjL}3^iJuS^O2VA z$KNn}A94L2+me2??>Zj|2famUoBw=!=$=;6y_>YT*HY03&v)+$$+=c< z-Dk_6Mt&l+Jk50#!WaGc2e`+Yf6W?qzHW4kAFkWF%?wneecuQ9!+I| z(*x?914ChnyIwR9G5o5M?Q2K}e_t^CJfx&!{2ToK6gul7o2+^F{1}M7*XvExd*?k2 zya#v>+7;?)v{oMWo%esj6HxtqVU-r+wfT+6Iv*Fq;CF|(*BWbFXOBbk@hp5Cj?VYN zHXTF9veL8GpTo9y!585zXnf9w{CMP^1@F(kmTcT^=-6M^y|Ko-cVnH(+OVOY&XHqq zDJ=);5G*o)g_&M6u&Y|!&^umW5 zD>YdgwvWS}{htT*KjR#)O)oFWUPoH{Z{V{{M~q2ye4R7+eo6Gxez&2wCEN`9`4ViD zh%HeXZFv7Pw!98oL2Z*Ucb-}9t6@Y8*Tgn4u`?V zKI=!Le7uh|w`Bh`(rW4O=M&Vu3Hq{0wNQCStzqa)hF_O-ZP&QF zHKgNHrMwsgai9BYshyvaR=?JYHqS1}cz!h(e`5Y`FX>&-(7Uu>Ya{QT@%6dm<~i%V z$+h5F=vm@AtskozHdIj=?M}j;@!7eJ^C>G9Yh*Tc`g00oYwPFZ>`UGwxv;KY+V@S7 zN!H?PUh;*UJ7D_5fqk)nL1p8>dX4fx*w8=Dc)28DqZ#+V-xI#+UGI3T2M{gHZpB zsBACQ)$X-W@9&dWpza1x&U4aOa}q27%U*?VLgL56|wDSHd_tFDQf6|r~ihc?!!BjecHuLocyu$?#Hudp*DG5-+q z${D9yd(Ww6!!2+y`LJW3tjh&WAid3=i%w8@)G8Bfcq@fh&_K7Wwv7*Q5U|g!gEq*y=&pHRCzIT zVLO>m+t>$Yf$QCN{tDi?kAa6E83*UUyVaz7+y1!2+Km_ zaftfuk$VZ8!|%Z;NZR-~dG9~o^)@S(Cmo4#-jA{?;CN{L?vu7-dmV5z`~s4B?ICZx zwe6T!+b`F1o$L+XKazFw8hPXKB=8=a>LmWBcHB2#0{iF~dX9|;bykK4L4Qt#R6Dg9 zer4-Ysp?#+m-w_EcD+M92DUFx!5PqaUzgkRezGIzzh|X(oV#0LcNhUlo2g$>W*-g$ z*N=J+gL^LzQ^B?2J}JK|*Rq#duFj?Mj`;^+1{lL^Q;hG%q;;X%*J_JVl9ly+fcUrB zt|I*tXtxjUhJ7KszO(vm)H#01Jb2f4O}X#X{|m%9SkI4o<*9#;voY!dFlOnS@%I5Z z0@i}&`(4>yRyXdfAHm*5@FLijcjkF;7_13tTWQ|)_;vU_sFUE_4E}z6)~D2_v1lR~ zn_dBJI;Qu){;(>fzGQ7IZa%fQG`2T^v*9_gZP&B+-xFXRNZXFQYeAhZxDRfJPr~5$ z+j3jRo=I>WBxi+t@+Yt-7+=!17q_pC^iuntXY0f1@B}3D`aAN|;r*aY>QChD!?1z! 
zdTo{K8Ef_cV~_o{E&KmN_zbKFX*>07zLVwI_Tu}skHv?F!L^`&^Wj|B6kIc@e@VWU zKS^DrBhlLz?uO({HU@ncwuN*Ym47#W%Kcp(pALk%;2p+s@GfvEYz6HQ<51~qQXc6V z$Q=sC7UP+Aj5)?0W6)4Y$FtJbyYZa$$8#;tJLCNup#QJJHQ>Hq9#a3){MwXHfkz-& zN6(S}8W=y)b@XoZv6(j0zSzIvuoGMl$sOW#@;Ae7;J!9S7%Qg1li*m%Z=nm`2TMVW zS2I5RC&(oJM!FpSe+;ey_pkl)yt)It4?GV^zn%NzU>u}tH+42?A>TW7 zIxdj%f4pk>z~FqgE~bZ()&hjjMb!i;Xx`O{13 z4APAm1=A6v?S&b0sOLKyrkB#WbFs_w>|#2El=ixFQ+sC5X6U**diR^n*fZ*5-$cEC zh|P9&6mqBXoeyNYJNOO=#<#bFI|iP358Y{5VE>}65o8`k6#qw Nk6#qwPhSWB`#j$;a+@= zt#*c1D5Z&570?kMAX*F&BM3e^(`lXIVSvF)J8j1&AhaORtp0y%optuP`|jsG=Ugs& z@60djJoaAe`@Z$~zV+BAK@bMDV9Jz0>73yFS`e%af?&=Z_x?-z{A>Db@#5zD`9W~< zUO~{`@7^ywHVAeu4}yidN0%xG_qmcl*{1((-53OpU6t-9`V!bvpH;;0eB6CCeSW;S zUF;D59^+}f|Gv0J>@R$Iq@ma#el3h;+Z87G&ZgnqtIyo`_b8n$d>-@knlepruekeC zQ~AWnrh3jXrh4`&Q{5oWTW!M6o}=$ud0g9e{~3DyJA41PFE`bT-e&4^_cZl6(<0{Y zWhx&z(FDllWOz{Nbb$=yj}CBNztsudtd7pU!|!j(5dQs{E|0hldXH{_bX0lN&&d19 z1G|6gvX<;t2g#34=oUyv*)jS4Z+*~IuK81Eb1!={tsl{62Mmi~8MVrp+c z*feHOjciXn95Bt)-nPh~TeA*-s(Was*#E8KS%F?A_}axLy!`?besMU#U6k9Zzgu_4(yu zAO>yhEHO`1M09Tlub!P01mCL$!C=@#c@1Wv>%J$3bdND^oSCER`vv2b{bS&n_$zJ! 
zSNBU)r`L-ik<@n5K4aYbq&QrtW=j5T-MCQqJt@-iFY`IF$Ric}+q$v8OXbF8?9Y_| zIlH5Cylnp-7o7a({GIbxy_11DO)HwOnqyJ^;VI=aU+PxOnWhImK0O|Gac|na-S|8|4t_1;UtcjU z4o;1SO12Z~G(GP1WyVt%4-=Czk0~n)eVP75n~vu^@qV0Gz%>7M2Ej3}20`CTK`{B* zAeb~11l4Xqe&kF3l;g`JrBN;xXNuN3#XP;4_cZ>p?wzhY`o+!S=i*h- ziM&Pb{U4R_Bf+{aZEKRij>XzjBtNp#ROUyJI~X=$&Rk{ zqm#rp1hN;gTQ9D8RAv9Ac$3I)OHO{;`%-bMC@vFwQHlEqY5NQQ^V~A12l{rjj~1_o zsLjyt`^0APAENj2=a)fSVw_tq+_*&A{uh1D*tpZW?`4P4&G;I~^#GHke-S7xdjxg7)1meN-n~ zH!jzApBBFm>3P|E%8snJy4}i8T37(RUAs7euoB$bOI8@2p;^z2AdpN{(GjW7nE#>{fzZs-`i0S5sd$ z*Hi|zF7Eq(TDh)2(l7f&n*0~*yZ;uih-CTMlfLT`Q~A`XZtv8$ll>-}`l5YI{g8c4 z{mrukX$A+)FtwHQOy#QMO?cb;lgk<|!^@IsyI?F$lmA2dF56Gtx5KQBSetvM@l_uDJRWX#8-G7hvsq=JrSn?6?rrAGVe#sWza*nAl=^Hk_ zR5$#Q3I6FacjlqAA1h>gbn9Gx*_ZZOJMjopKX7_WhuSGenef*0ZQr)%HcII*hVpaX zLT$FP={QqgexMucH5S$n-`}7E^-w*xc@CuAU&UW@)vU@$9pP2 zZ74ymBA+2UajbkEe#6Vp7(hR=F&*{OZTXRn^MZ^$AAa}nbBl2wmGvGUC%Yp%zR$*i z8iN_f7z=D%N1N=n{NDdwsqtpTJXbDbdHdKtn%DRO`9gdm{ojrW*s9y|6Mri1C3a{2 z(XrgJB@ka->x^+KhvBYUu5T88FQ_qc^LN) z^XdF=^^&zwn<4+?vNj2 zIc^lJYa*YQc4X?lujv}r5t+;Xmq=d=>b-u9<+O!W!tDX%%a4xeaHuHOmwTtj-I9Sl z6rN>qw$GBE8i}rB4}-oiAn+U5g1wPmw<*e?-ftK05z__h;v?Hj)+bI6>S2a>zxa-L zOpy08;w91P{vEbpY+=ufc0MH7le|S7Ep`*mrdhHkedq3DF9{u}ze5E6?J9AHcvSpW zbW$JmE##(tZxS2CO3^2F6_h_Z`P+4Jc~FOw#Uk-1;%sq+80>&+bnm6&G=bc+M1DVQ zmu=$pga!UUE#S@!@oW=+N{4hnsXfIm1A4}iv@c3^?noz(f*_viOp-DPg5Q_a>ZfPM z;(FTmZT67KteslvP}7dyt|=+!wED%MXr0sIgNeTh3rtv`GYj~*#hq7}q_}|CgZN;9 zI7}=P#0CJuE zk9^3Fapx&fR=%;m9vP9<+rX`Hc)g;LE%}wd&W$7VCE61Vxr&KZ)ju&)N(Z}TcF$77OtK&%wgM6rJ0uX8@` z!@BPwf!`^wKYJF)jO^&ZzB_vhqoLgf#bkL#GXF??RN$|(_4nVqls?lh@GE|-E3Q8} ze_OiqJ2U#7m+%Ycn{e~{OnAe36JCGX=(y=jyT2Fcw_WUcvV0q`2Kl_WTdWq@<3OZ; zL)Y#th%4|Z#r5V|Ti>c@&Yx%xo#$Drm%iOTTU~qWB2zzlu7h(mMbJ6W`mzH|?S#ed zOeK53*r0e{AVygy_7Uio+z$NbE}kc@B(@^HD6T&;>9>3AZ~f@}bLB%PnCh7;O>NCV zb}!SOL4Kpo7X#;vi@>$opXGOyYVSDIRJ6Zt&mj2mAYVRoxI!!u%vJLAXI?>UO?>$? 
zQB414y`y{OV<$PiSIu{4XC-@M=I-uXGJDG~xgh@fJ$05?=dx?Z9qP_y`|%)Oz9H$b zMbMsSi9G%1>l*Auj7^+bOn>@2ZC>?Go!5`lne%;hhR@fr*Q2Q3{yKl(==CQq-!85e z3q+p&%rA)_c8C{5zW$8!8tZI-SDUY?-mUJOLr4DIpu<*)^?Qx;cC4fBIXj0Q=&p8OUo^v>rQl3^p)s$0T?+kbESz0OR^$1%>^v5x+3>rv;9qz%V|C_t@7>(_U9Z2|Z{<_#oGgslo}zJZ>w5Ju+t&)VOW!`D^!2I#Fgtl0 zD2?+mXyIh&d>~SX=0w z{>acP|JR%^Fn8ehY49=lS^G>1XXEG}#ca?U{jq(o;~!!mp6SrpM*J)BC36d6P5VrN z<{SlV&^!IHL9gRqVo72t#TLX@#F*9&nrm1aTkyZjf35u|HS73K0emmf;k2@ zu+Q4k7pQ~uv7op5+kT*Npxg6buWu_=OigS-dyoxi2evQpj9T=&zDaiIz5d7}e_wXD)<6C8K0M#3XQJ&hrt}BefaV&^IqdThnuD}rBrijh zj=lbr&A4dCMy11ISz@^Y`1qex`7xJZ9^IN>^L&Wr9LznKgV;4@@{RQNuY0e5yuNL` zT0qAvJG`#+r;Y_Ok7kaWcF*gf{qu~s)}?s{CuFUn?D|I9_2Yf~^KBm8wKmW19R}{2s}IQO$o?(`9WpZ~c!o zV%CaTGiL2LTmP|W|MVlZDgOTo*3bDp02}k)RA~Oo8a`|Jtm(71pQk^21e*nW2J9W= z=--TSdNuy}^^arTWNOF1MZaO8|HI_3PARkgK|QjU!=4U%J9+xEM|8E=F4#ND*57~M zEC1*HqMi%2epUbfjQvfH;_F}R;jx#;o*sL9dHT=NHS85`5ksPw{#@td+-}D|HZD?3 z~tgaCV?fS>y3q&T!D4_ZCIYKhQonE3#T}c7!t|`F>#h*@o!X!&TMgZi!)sL=buLE&zUh|p#kxj$SP|*e)p(kzD67^ zri$co&+F||f1Nus$l1ZQ;x_TLcu|Z;UE5_sMr7s8<{H5n&ZzBsJ=4-ie?Jb)*8L|6 z;s;`)_Oiy~Yh*-LWJdPr3^ckG{fq3-e*PJoJ}&&(kezz{TH62_{8;ydUei{+?#N!O z-N)_X?;C#po%VFCz^7n?SHx?rKf3=`a3+6H&|j%{bdTyju3ypjksWHvkG{lsa-G1h zUq&iLb?Ee8Uw1u_+ diff --git a/brev/welcome-ui/index.html b/brev/welcome-ui/index.html index 19dcc37..4d95a34 100644 --- a/brev/welcome-ui/index.html +++ b/brev/welcome-ui/index.html @@ -4,7 +4,7 @@ OpenShell — Agent Sandbox - + @@ -16,7 +16,7 @@
- + OpenShell Sandbox From 485a94ea58c4b67dc53f31f9cb4c4b5e0a98fe2c Mon Sep 17 00:00:00 2001 From: nv-kasikritc Date: Thu, 12 Mar 2026 10:12:45 +0000 Subject: [PATCH 05/25] Init LiteLLM implementation --- sandboxes/nemoclaw/Dockerfile | 12 + sandboxes/nemoclaw/nemoclaw-start.sh | 70 +++++- .../nemoclaw-ui-extension/extension/index.ts | 43 +--- .../extension/model-registry.ts | 16 +- .../extension/model-selector.ts | 23 +- sandboxes/nemoclaw/policy-proxy.js | 226 +++++++++++++++++- 6 files changed, 323 insertions(+), 67 deletions(-) diff --git a/sandboxes/nemoclaw/Dockerfile b/sandboxes/nemoclaw/Dockerfile index bb10e19..9a5d96e 100644 --- a/sandboxes/nemoclaw/Dockerfile +++ b/sandboxes/nemoclaw/Dockerfile @@ -16,6 +16,13 @@ FROM ${BASE_IMAGE} USER root +ENV NO_PROXY=127.0.0.1,localhost,::1 +ENV no_proxy=127.0.0.1,localhost,::1 + +RUN apt-get update && \ + apt-get install -y --no-install-recommends jq && \ + rm -rf /var/lib/apt/lists/* + # Override the startup script with our version (adds runtime API key injection) COPY nemoclaw-start.sh /usr/local/bin/nemoclaw-start RUN chmod +x /usr/local/bin/nemoclaw-start @@ -27,6 +34,11 @@ COPY policy-proxy.js /usr/local/lib/policy-proxy.js COPY proto/ /usr/local/lib/nemoclaw-proto/ RUN npm install -g @grpc/grpc-js @grpc/proto-loader js-yaml +# Install LiteLLM proxy for streaming-capable local LLM inference routing. +# LiteLLM handles SSE streaming natively, bypassing the sandbox proxy's +# inference interception path which buffers responses and times out. 
+RUN python3 -m pip install --no-cache-dir --break-system-packages 'litellm[proxy]' + # Fix @hono/node-server authorization bypass (GHSA-wc8c-qw6v-h7f6) RUN npm install -g @hono/node-server@1.19.11 diff --git a/sandboxes/nemoclaw/nemoclaw-start.sh b/sandboxes/nemoclaw/nemoclaw-start.sh index e1756f9..ba22672 100644 --- a/sandboxes/nemoclaw/nemoclaw-start.sh +++ b/sandboxes/nemoclaw/nemoclaw-start.sh @@ -65,6 +65,70 @@ if [ -f "$BUNDLE" ]; then ) || echo "Note: API key injection into UI bundle skipped (read-only /usr). Keys can be set via the API Keys page." fi +# -------------------------------------------------------------------------- +# LiteLLM streaming inference proxy +# +# LiteLLM runs on localhost:4000 and provides streaming-capable inference +# routing. This bypasses the sandbox proxy's inference.local interception +# path which buffers entire responses and has a 60s hard timeout. +# -------------------------------------------------------------------------- +LITELLM_PORT=4000 +LITELLM_CONFIG="/tmp/litellm_config.yaml" +LITELLM_LOG="/tmp/litellm.log" + +export NVIDIA_NIM_API_KEY="${NVIDIA_INFERENCE_API_KEY:-${NVIDIA_INTEGRATE_API_KEY:-not-set}}" + +_DEFAULT_MODEL="moonshotai/kimi-k2.5" +_DEFAULT_PROVIDER="nvidia-endpoints" + +generate_litellm_config() { + local model_id="${1:-$_DEFAULT_MODEL}" + local provider="${2:-$_DEFAULT_PROVIDER}" + local api_base="" + local litellm_prefix="nvidia_nim" + + case "$provider" in + nvidia-endpoints) + api_base="https://integrate.api.nvidia.com/v1" ;; + nvidia-inference) + api_base="https://inference-api.nvidia.com/v1" ;; + *) + api_base="https://integrate.api.nvidia.com/v1" ;; + esac + + cat > "$LITELLM_CONFIG" <> "$LITELLM_LOG" 2>&1 & +echo "[litellm] Starting on 127.0.0.1:${LITELLM_PORT} (pid $!)" + +# Wait for LiteLLM to accept connections before proceeding. +_litellm_deadline=$(($(date +%s) + 30)) +while ! 
curl -sf "http://127.0.0.1:${LITELLM_PORT}/health" >/dev/null 2>&1; do + if [ "$(date +%s)" -ge "$_litellm_deadline" ]; then + echo "[litellm] WARNING: LiteLLM did not become ready within 30s. Continuing anyway." + break + fi + sleep 0.5 +done + # -------------------------------------------------------------------------- # Onboard and start the gateway # -------------------------------------------------------------------------- @@ -78,9 +142,9 @@ openclaw onboard \ --skip-skills \ --skip-health \ --auth-choice custom-api-key \ - --custom-base-url "https://inference.local/v1" \ - --custom-model-id "-" \ - --custom-api-key "$_ONBOARD_KEY" \ + --custom-base-url "http://127.0.0.1:${LITELLM_PORT}/v1" \ + --custom-model-id "$_DEFAULT_MODEL" \ + --custom-api-key "sk-nemoclaw-local" \ --secret-input-mode plaintext \ --custom-compatibility openai \ --gateway-port 18788 \ diff --git a/sandboxes/nemoclaw/nemoclaw-ui-extension/extension/index.ts b/sandboxes/nemoclaw/nemoclaw-ui-extension/extension/index.ts index 5ff25a2..2d4a239 100644 --- a/sandboxes/nemoclaw/nemoclaw-ui-extension/extension/index.ts +++ b/sandboxes/nemoclaw/nemoclaw-ui-extension/extension/index.ts @@ -15,7 +15,7 @@ import { injectButton } from "./deploy-modal.ts"; import { injectNavGroup, activateNemoPage, watchOpenClawNavClicks } from "./nav-group.ts"; import { injectModelSelector, watchChatCompose } from "./model-selector.ts"; import { ingestKeysFromUrl, DEFAULT_MODEL, resolveApiKey, isKeyConfigured } from "./model-registry.ts"; -import { waitForClient, waitForReconnect, patchConfig } from "./gateway-bridge.ts"; +import { waitForReconnect } from "./gateway-bridge.ts"; import { syncKeysToProviders } from "./api-keys-page.ts"; function inject(): boolean { @@ -65,50 +65,11 @@ function revealApp(): void { } } -/** - * Read the live OpenClaw config, find the active model.primary ref, and - * patch streaming: true for it. 
For proxy-managed models the model.primary - * never changes after onboard, so enabling it once covers every proxy model - * switch. - */ -async function enableStreamingForActiveModel(): Promise { - const client = await waitForClient(); - const snapshot = await client.request>("config.get", {}); - - const agents = snapshot?.agents as Record | undefined; - const defaults = agents?.defaults as Record | undefined; - const model = defaults?.model as Record | undefined; - const primary = model?.primary as string | undefined; - - if (!primary) { - console.warn("[NeMoClaw] Could not determine active model primary from config"); - return; - } - - const models = defaults?.models as Record> | undefined; - if (models?.[primary]?.streaming === true) return; - - await patchConfig({ - agents: { - defaults: { - models: { - [primary]: { streaming: true }, - }, - }, - }, - }); -} - function bootstrap() { showConnectOverlay(); waitForReconnect(30_000) - .then(() => { - revealApp(); - enableStreamingForActiveModel().catch((err) => - console.warn("[NeMoClaw] Failed to enable streaming:", err), - ); - }) + .then(revealApp) .catch(revealApp); const keysIngested = ingestKeysFromUrl(); diff --git a/sandboxes/nemoclaw/nemoclaw-ui-extension/extension/model-registry.ts b/sandboxes/nemoclaw/nemoclaw-ui-extension/extension/model-registry.ts index 9016971..da97edc 100644 --- a/sandboxes/nemoclaw/nemoclaw-ui-extension/extension/model-registry.ts +++ b/sandboxes/nemoclaw/nemoclaw-ui-extension/extension/model-registry.ts @@ -118,8 +118,8 @@ export interface ModelEntry { } // --------------------------------------------------------------------------- -// Curated models — hardcoded presets routed through inference.local. -// The NemoClaw proxy injects credentials based on the providerName. +// Curated models — hardcoded presets routed through the local LiteLLM proxy. +// LiteLLM handles upstream credential injection and SSE streaming natively. 
// --------------------------------------------------------------------------- export interface CuratedModel { @@ -179,7 +179,7 @@ export function curatedToModelEntry(c: CuratedModel): ModelEntry { keyType: "inference", isDynamic: true, providerConfig: { - baseUrl: "https://inference.local/v1", + baseUrl: "http://127.0.0.1:4000/v1", api: "openai-completions", models: [ { @@ -215,7 +215,7 @@ export const MODEL_REGISTRY: readonly ModelEntry[] = [ modelRef: `${DEFAULT_PROVIDER_KEY}/moonshotai/kimi-k2.5`, keyType: "inference", providerConfig: { - baseUrl: "https://inference.local/v1", + baseUrl: "http://127.0.0.1:4000/v1", api: "openai-completions", models: [ { @@ -267,8 +267,8 @@ export function getModelByCuratedModelId(modelId: string): ModelEntry | undefine /** * Build a ModelEntry for a provider managed through the inference tab. - * These route through inference.local where the proxy injects credentials, - * so no client-side API key is needed. + * These route through the local LiteLLM proxy which handles credentials + * and streaming, so no client-side API key is needed. 
*/ export function buildDynamicEntry( providerName: string, @@ -288,7 +288,7 @@ export function buildDynamicEntry( keyType: "inference", isDynamic: true, providerConfig: { - baseUrl: "https://inference.local/v1", + baseUrl: "http://127.0.0.1:4000/v1", api: "openai-completions", models: [ { @@ -328,7 +328,7 @@ export function buildQuickSelectEntry( keyType: "inference", isDynamic: true, providerConfig: { - baseUrl: "https://inference.local/v1", + baseUrl: "http://127.0.0.1:4000/v1", api: "openai-completions", models: [ { diff --git a/sandboxes/nemoclaw/nemoclaw-ui-extension/extension/model-selector.ts b/sandboxes/nemoclaw/nemoclaw-ui-extension/extension/model-selector.ts index 3c897ce..7b2fbe6 100644 --- a/sandboxes/nemoclaw/nemoclaw-ui-extension/extension/model-selector.ts +++ b/sandboxes/nemoclaw/nemoclaw-ui-extension/extension/model-selector.ts @@ -2,11 +2,11 @@ * NeMoClaw DevX — Model Selector * * Dropdown injected into the chat compose area that lets users pick a - * model. For models routed through inference.local (curated + dynamic), - * switching only updates the NemoClaw cluster-inference route — no - * OpenClaw config.patch is needed because the NemoClaw proxy rewrites - * the model field in every request body. This avoids the gateway - * disconnect that config.patch causes. + * model. For models routed through the local LiteLLM proxy (curated + + * dynamic), switching only updates the NemoClaw cluster-inference route + * — no OpenClaw config.patch is needed because the LiteLLM proxy + * handles model routing and streaming natively. This avoids the + * gateway disconnect that config.patch causes. * * Models are fetched dynamically from the NemoClaw runtime (providers * and active route configured in the Inference tab). 
@@ -264,14 +264,14 @@ function dismissTransitionBanner(): void { // --------------------------------------------------------------------------- /** - * Returns true if the model routes through inference.local, meaning the - * NemoClaw proxy manages credential injection and model rewriting. + * Returns true if the model routes through the local LiteLLM proxy, + * meaning credential injection and streaming are handled server-side. * For these models we only need to update the cluster-inference route — * no OpenClaw config.patch (and therefore no gateway disconnect). */ function isProxyManaged(entry: ModelEntry): boolean { return entry.isDynamic === true || - entry.providerConfig.baseUrl === "https://inference.local/v1"; + entry.providerConfig.baseUrl === "http://127.0.0.1:4000/v1"; } async function applyModelSelection( @@ -295,10 +295,9 @@ async function applyModelSelection( try { if (isProxyManaged(entry)) { - // Proxy-managed models route through inference.local. We update the - // NemoClaw cluster-inference route (no OpenClaw config.patch, no - // gateway disconnect). The sandbox polls every ~30s for route - // updates, so we show an honest propagation countdown. + // Proxy-managed models route through the local LiteLLM proxy. We + // update the cluster-inference route and LiteLLM is restarted with the + // new model config (no OpenClaw config.patch, no gateway disconnect). 
const curated = getCuratedByModelId(entry.providerConfig.models[0]?.id || ""); const provName = curated?.providerName || entry.providerKey.replace(/^dynamic-/, ""); const modelId = entry.providerConfig.models[0]?.id || ""; diff --git a/sandboxes/nemoclaw/policy-proxy.js b/sandboxes/nemoclaw/policy-proxy.js index ea479f6..8b92b14 100644 --- a/sandboxes/nemoclaw/policy-proxy.js +++ b/sandboxes/nemoclaw/policy-proxy.js @@ -418,15 +418,218 @@ function syncAndRespond(yamlBody, res, t0) { }); } +// --------------------------------------------------------------------------- +// LiteLLM config manager +// +// When the user switches models via the UI, the extension POSTs to +// /api/cluster-inference. After forwarding to the gateway we regenerate +// the LiteLLM config and restart the proxy so the new model takes effect. +// --------------------------------------------------------------------------- + +const { execFile } = require("child_process"); + +const LITELLM_PORT = 4000; +const LITELLM_CONFIG_PATH = "/tmp/litellm_config.yaml"; +const LITELLM_LOG_PATH = "/tmp/litellm.log"; + +const PROVIDER_MAP = { + "nvidia-endpoints": { + litellmPrefix: "nvidia_nim", + apiBase: "https://integrate.api.nvidia.com/v1", + apiKeyEnv: "NVIDIA_NIM_API_KEY", + }, + "nvidia-inference": { + litellmPrefix: "nvidia_nim", + apiBase: "https://inference-api.nvidia.com/v1", + apiKeyEnv: "NVIDIA_NIM_API_KEY", + }, +}; + +let litellmPid = null; + +function generateLitellmConfig(providerName, modelId) { + const provider = PROVIDER_MAP[providerName] || PROVIDER_MAP["nvidia-endpoints"]; + const fullModel = `${provider.litellmPrefix}/${modelId}`; + + const config = [ + "model_list:", + ' - model_name: "*"', + " litellm_params:", + ` model: "${fullModel}"`, + ` api_key: os.environ/${provider.apiKeyEnv}`, + ` api_base: "${provider.apiBase}"`, + "general_settings:", + " master_key: sk-nemoclaw-local", + "litellm_settings:", + " request_timeout: 600", + " drop_params: true", + " num_retries: 0", + "", + 
].join("\n"); + + fs.writeFileSync(LITELLM_CONFIG_PATH, config, "utf8"); + console.log(`[litellm-mgr] Config written: model=${fullModel} api_base=${provider.apiBase}`); +} + +function restartLitellm() { + return new Promise((resolve) => { + if (litellmPid) { + try { + process.kill(litellmPid, "SIGTERM"); + console.log(`[litellm-mgr] Sent SIGTERM to old LiteLLM (pid ${litellmPid})`); + } catch (e) { + // Process may have already exited. + } + litellmPid = null; + } + + // Brief grace period for the old process to release the port. + setTimeout(() => { + const logFd = fs.openSync(LITELLM_LOG_PATH, "a"); + const child = execFile( + "litellm", + ["--config", LITELLM_CONFIG_PATH, "--port", String(LITELLM_PORT), "--host", "127.0.0.1"], + { stdio: ["ignore", logFd, logFd], detached: true } + ); + child.unref(); + litellmPid = child.pid; + console.log(`[litellm-mgr] Started new LiteLLM (pid ${litellmPid})`); + fs.closeSync(logFd); + + // Wait for the health endpoint to become available. + let attempts = 0; + const maxAttempts = 20; + const poll = setInterval(() => { + attempts++; + const healthReq = http.get(`http://127.0.0.1:${LITELLM_PORT}/health`, (healthRes) => { + if (healthRes.statusCode === 200) { + clearInterval(poll); + console.log(`[litellm-mgr] LiteLLM ready after ${attempts * 500}ms`); + resolve(true); + } + healthRes.resume(); + }); + healthReq.on("error", () => {}); + healthReq.setTimeout(400, () => healthReq.destroy()); + if (attempts >= maxAttempts) { + clearInterval(poll); + console.warn("[litellm-mgr] LiteLLM did not become ready within 10s"); + resolve(false); + } + }, 500); + }, 500); + }); +} + +// Discover existing LiteLLM pid at startup so we can manage restarts. 
+try { + const { execSync } = require("child_process"); + const pidStr = execSync(`pgrep -f "litellm.*--port ${LITELLM_PORT}" 2>/dev/null || true`, { encoding: "utf8" }).trim(); + if (pidStr) { + litellmPid = parseInt(pidStr.split("\n")[0], 10); + console.log(`[litellm-mgr] Discovered existing LiteLLM pid: ${litellmPid}`); + } +} catch (e) {} + +// --------------------------------------------------------------------------- +// /api/cluster-inference intercept +// --------------------------------------------------------------------------- + +function handleClusterInferencePost(clientReq, clientRes) { + const chunks = []; + clientReq.on("data", (chunk) => chunks.push(chunk)); + clientReq.on("end", () => { + const rawBody = Buffer.concat(chunks); + let payload; + try { + payload = JSON.parse(rawBody.toString("utf8")); + } catch (e) { + clientRes.writeHead(400, { "Content-Type": "application/json" }); + clientRes.end(JSON.stringify({ error: "invalid JSON" })); + return; + } + + // Forward the original request to the upstream gateway first. + const opts = { + hostname: UPSTREAM_HOST, + port: UPSTREAM_PORT, + path: clientReq.url, + method: clientReq.method, + headers: { ...clientReq.headers, "content-length": rawBody.length }, + }; + + const upstream = http.request(opts, (upstreamRes) => { + const upChunks = []; + upstreamRes.on("data", (c) => upChunks.push(c)); + upstreamRes.on("end", () => { + const upBody = Buffer.concat(upChunks); + clientRes.writeHead(upstreamRes.statusCode, upstreamRes.headers); + clientRes.end(upBody); + + // On success, regenerate LiteLLM config and restart. 
+ if (upstreamRes.statusCode >= 200 && upstreamRes.statusCode < 300) { + const providerName = payload.providerName || "nvidia-endpoints"; + const modelId = payload.modelId || payload.model || ""; + if (modelId) { + console.log(`[litellm-mgr] Model switch detected: provider=${providerName} model=${modelId}`); + generateLitellmConfig(providerName, modelId); + restartLitellm().then((ready) => { + console.log(`[litellm-mgr] Restart complete, ready=${ready}`); + }); + } + } + }); + }); + + upstream.on("error", (err) => { + console.error("[litellm-mgr] upstream error on cluster-inference forward:", err.message); + if (!clientRes.headersSent) { + clientRes.writeHead(502, { "Content-Type": "application/json" }); + } + clientRes.end(JSON.stringify({ error: "upstream unavailable" })); + }); + + upstream.end(rawBody); + }); +} + +// --------------------------------------------------------------------------- +// /api/litellm-health handler +// --------------------------------------------------------------------------- + +function handleLitellmHealth(req, res) { + const healthReq = http.get(`http://127.0.0.1:${LITELLM_PORT}/health`, (healthRes) => { + const chunks = []; + healthRes.on("data", (c) => chunks.push(c)); + healthRes.on("end", () => { + res.writeHead(healthRes.statusCode, { "Content-Type": "application/json" }); + res.end(Buffer.concat(chunks)); + }); + }); + healthReq.on("error", (err) => { + res.writeHead(503, { "Content-Type": "application/json" }); + res.end(JSON.stringify({ error: "litellm unreachable", detail: err.message, pid: litellmPid })); + }); + healthReq.setTimeout(3000, () => { + healthReq.destroy(); + res.writeHead(504, { "Content-Type": "application/json" }); + res.end(JSON.stringify({ error: "litellm health check timed out", pid: litellmPid })); + }); +} + // --------------------------------------------------------------------------- // HTTP server // --------------------------------------------------------------------------- +function 
setCorsHeaders(res) { + res.setHeader("Access-Control-Allow-Origin", "*"); + res.setHeader("Access-Control-Allow-Methods", "GET, POST, OPTIONS"); + res.setHeader("Access-Control-Allow-Headers", "Content-Type, Authorization"); +} + const server = http.createServer((req, res) => { if (req.url === "/api/policy") { - res.setHeader("Access-Control-Allow-Origin", "*"); - res.setHeader("Access-Control-Allow-Methods", "GET, POST, OPTIONS"); - res.setHeader("Access-Control-Allow-Headers", "Content-Type"); + setCorsHeaders(res); if (req.method === "OPTIONS") { res.writeHead(204); @@ -442,6 +645,23 @@ const server = http.createServer((req, res) => { return; } + if (req.url === "/api/cluster-inference" && req.method === "POST") { + setCorsHeaders(res); + handleClusterInferencePost(req, res); + return; + } + + if (req.url === "/api/litellm-health") { + setCorsHeaders(res); + if (req.method === "OPTIONS") { + res.writeHead(204); + res.end(); + } else { + handleLitellmHealth(req, res); + } + return; + } + proxyRequest(req, res); }); From 754c756b33d8f062fad70acb7edcf1a4e23bcd5e Mon Sep 17 00:00:00 2001 From: nv-kasikritc Date: Thu, 12 Mar 2026 10:57:49 +0000 Subject: [PATCH 06/25] LiteLLM working --- sandboxes/nemoclaw/nemoclaw-start.sh | 51 +++++++++++--- sandboxes/nemoclaw/policy-proxy.js | 100 +++++++++++++++++++++++---- sandboxes/nemoclaw/policy.yaml | 3 + 3 files changed, 133 insertions(+), 21 deletions(-) diff --git a/sandboxes/nemoclaw/nemoclaw-start.sh b/sandboxes/nemoclaw/nemoclaw-start.sh index ba22672..e1c35ce 100644 --- a/sandboxes/nemoclaw/nemoclaw-start.sh +++ b/sandboxes/nemoclaw/nemoclaw-start.sh @@ -76,7 +76,22 @@ LITELLM_PORT=4000 LITELLM_CONFIG="/tmp/litellm_config.yaml" LITELLM_LOG="/tmp/litellm.log" -export NVIDIA_NIM_API_KEY="${NVIDIA_INFERENCE_API_KEY:-${NVIDIA_INTEGRATE_API_KEY:-not-set}}" +NVIDIA_NIM_API_KEY="${NVIDIA_INFERENCE_API_KEY:-${NVIDIA_INTEGRATE_API_KEY:-}}" +export NVIDIA_NIM_API_KEY + +# Persist the API key to a well-known file so the 
policy-proxy can read +# it later when regenerating the LiteLLM config (e.g. on model switch or +# late key injection from the welcome UI). +LITELLM_KEY_FILE="/tmp/litellm_api_key" +if [ -n "$NVIDIA_NIM_API_KEY" ]; then + echo -n "$NVIDIA_NIM_API_KEY" > "$LITELLM_KEY_FILE" + chmod 600 "$LITELLM_KEY_FILE" +fi + +# Use the local bundled cost map to avoid a blocked HTTPS fetch to GitHub +# at startup (the sandbox network policy doesn't allow Python to reach +# raw.githubusercontent.com, causing a ~5s timeout on every start). +export LITELLM_LOCAL_MODEL_COST_MAP="True" _DEFAULT_MODEL="moonshotai/kimi-k2.5" _DEFAULT_PROVIDER="nvidia-endpoints" @@ -86,6 +101,12 @@ generate_litellm_config() { local provider="${2:-$_DEFAULT_PROVIDER}" local api_base="" local litellm_prefix="nvidia_nim" + local api_key="${NVIDIA_NIM_API_KEY:-}" + + # Read from persisted key file if env var is empty. + if [ -z "$api_key" ] && [ -f "$LITELLM_KEY_FILE" ]; then + api_key="$(cat "$LITELLM_KEY_FILE")" + fi case "$provider" in nvidia-endpoints) @@ -96,12 +117,23 @@ generate_litellm_config() { api_base="https://integrate.api.nvidia.com/v1" ;; esac + # Write the actual key value into the config. Using os.environ/ references + # is fragile inside the sandbox where env vars may not be propagated to all + # child processes. If no key is available yet, use a placeholder — the + # policy-proxy will regenerate the config when the key arrives. + local key_yaml + if [ -n "$api_key" ]; then + key_yaml=" api_key: \"${api_key}\"" + else + key_yaml=" api_key: \"key-not-yet-configured\"" + fi + cat > "$LITELLM_CONFIG" <> "$LITELLM_LOG" 2>&1 & echo "[litellm] Starting on 127.0.0.1:${LITELLM_PORT} (pid $!)" # Wait for LiteLLM to accept connections before proceeding. -_litellm_deadline=$(($(date +%s) + 30)) -while ! 
curl -sf "http://127.0.0.1:${LITELLM_PORT}/health" >/dev/null 2>&1; do +# Use /health/liveliness (basic liveness, no model checks) and --noproxy +# to bypass the sandbox HTTP proxy for localhost connections. +_litellm_deadline=$(($(date +%s) + 60)) +while ! curl -sf --noproxy 127.0.0.1 "http://127.0.0.1:${LITELLM_PORT}/health/liveliness" >/dev/null 2>&1; do if [ "$(date +%s)" -ge "$_litellm_deadline" ]; then - echo "[litellm] WARNING: LiteLLM did not become ready within 30s. Continuing anyway." + echo "[litellm] WARNING: LiteLLM did not become ready within 60s. Continuing anyway." break fi - sleep 0.5 + sleep 1 done # -------------------------------------------------------------------------- diff --git a/sandboxes/nemoclaw/policy-proxy.js b/sandboxes/nemoclaw/policy-proxy.js index 8b92b14..308cc8b 100644 --- a/sandboxes/nemoclaw/policy-proxy.js +++ b/sandboxes/nemoclaw/policy-proxy.js @@ -431,32 +431,44 @@ const { execFile } = require("child_process"); const LITELLM_PORT = 4000; const LITELLM_CONFIG_PATH = "/tmp/litellm_config.yaml"; const LITELLM_LOG_PATH = "/tmp/litellm.log"; +const LITELLM_KEY_FILE = "/tmp/litellm_api_key"; const PROVIDER_MAP = { "nvidia-endpoints": { litellmPrefix: "nvidia_nim", apiBase: "https://integrate.api.nvidia.com/v1", - apiKeyEnv: "NVIDIA_NIM_API_KEY", }, "nvidia-inference": { litellmPrefix: "nvidia_nim", apiBase: "https://inference-api.nvidia.com/v1", - apiKeyEnv: "NVIDIA_NIM_API_KEY", }, }; let litellmPid = null; +function readApiKey() { + try { + const key = fs.readFileSync(LITELLM_KEY_FILE, "utf8").trim(); + if (key) return key; + } catch (e) {} + return process.env.NVIDIA_NIM_API_KEY || ""; +} + +function writeApiKey(key) { + fs.writeFileSync(LITELLM_KEY_FILE, key, { mode: 0o600 }); +} + function generateLitellmConfig(providerName, modelId) { const provider = PROVIDER_MAP[providerName] || PROVIDER_MAP["nvidia-endpoints"]; const fullModel = `${provider.litellmPrefix}/${modelId}`; + const apiKey = readApiKey() || 
"key-not-yet-configured"; const config = [ "model_list:", ' - model_name: "*"', " litellm_params:", ` model: "${fullModel}"`, - ` api_key: os.environ/${provider.apiKeyEnv}`, + ` api_key: "${apiKey}"`, ` api_base: "${provider.apiBase}"`, "general_settings:", " master_key: sk-nemoclaw-local", @@ -468,7 +480,8 @@ function generateLitellmConfig(providerName, modelId) { ].join("\n"); fs.writeFileSync(LITELLM_CONFIG_PATH, config, "utf8"); - console.log(`[litellm-mgr] Config written: model=${fullModel} api_base=${provider.apiBase}`); + const keyStatus = apiKey === "key-not-yet-configured" ? "missing" : "present"; + console.log(`[litellm-mgr] Config written: model=${fullModel} api_base=${provider.apiBase} key=${keyStatus}`); } function restartLitellm() { @@ -486,37 +499,38 @@ function restartLitellm() { // Brief grace period for the old process to release the port. setTimeout(() => { const logFd = fs.openSync(LITELLM_LOG_PATH, "a"); + const env = { ...process.env, LITELLM_LOCAL_MODEL_COST_MAP: "True" }; const child = execFile( "litellm", ["--config", LITELLM_CONFIG_PATH, "--port", String(LITELLM_PORT), "--host", "127.0.0.1"], - { stdio: ["ignore", logFd, logFd], detached: true } + { stdio: ["ignore", logFd, logFd], detached: true, env } ); child.unref(); litellmPid = child.pid; console.log(`[litellm-mgr] Started new LiteLLM (pid ${litellmPid})`); fs.closeSync(logFd); - // Wait for the health endpoint to become available. + // Wait for the liveness endpoint (no model connectivity checks). 
let attempts = 0; - const maxAttempts = 20; + const maxAttempts = 60; const poll = setInterval(() => { attempts++; - const healthReq = http.get(`http://127.0.0.1:${LITELLM_PORT}/health`, (healthRes) => { + const healthReq = http.get(`http://127.0.0.1:${LITELLM_PORT}/health/liveliness`, (healthRes) => { if (healthRes.statusCode === 200) { clearInterval(poll); - console.log(`[litellm-mgr] LiteLLM ready after ${attempts * 500}ms`); + console.log(`[litellm-mgr] LiteLLM ready after ${attempts}s`); resolve(true); } healthRes.resume(); }); healthReq.on("error", () => {}); - healthReq.setTimeout(400, () => healthReq.destroy()); + healthReq.setTimeout(800, () => healthReq.destroy()); if (attempts >= maxAttempts) { clearInterval(poll); - console.warn("[litellm-mgr] LiteLLM did not become ready within 10s"); + console.warn("[litellm-mgr] LiteLLM did not become ready within 60s"); resolve(false); } - }, 500); + }, 1000); }, 500); }); } @@ -593,12 +607,66 @@ function handleClusterInferencePost(clientReq, clientRes) { }); } +// --------------------------------------------------------------------------- +// /api/litellm-key handler — accepts an API key update from the welcome UI +// --------------------------------------------------------------------------- + +function handleLitellmKey(req, res) { + const chunks = []; + req.on("data", (c) => chunks.push(c)); + req.on("end", () => { + let body; + try { + body = JSON.parse(Buffer.concat(chunks).toString("utf8")); + } catch (e) { + res.writeHead(400, { "Content-Type": "application/json" }); + res.end(JSON.stringify({ error: "invalid JSON" })); + return; + } + + const apiKey = (body.apiKey || "").trim(); + if (!apiKey) { + res.writeHead(400, { "Content-Type": "application/json" }); + res.end(JSON.stringify({ error: "missing apiKey" })); + return; + } + + console.log(`[litellm-mgr] API key update received (${apiKey.length} chars)`); + writeApiKey(apiKey); + + // Read the current config to extract the model/provider, then regenerate + 
// with the new key. + let currentModel = "moonshotai/kimi-k2.5"; + let currentProvider = "nvidia-endpoints"; + try { + const cfg = fs.readFileSync(LITELLM_CONFIG_PATH, "utf8"); + const modelMatch = cfg.match(/model:\s*"[^/]+\/(.+?)"/); + if (modelMatch) currentModel = modelMatch[1]; + const baseMatch = cfg.match(/api_base:\s*"(.+?)"/); + if (baseMatch) { + const base = baseMatch[1]; + for (const [name, p] of Object.entries(PROVIDER_MAP)) { + if (p.apiBase === base) { currentProvider = name; break; } + } + } + } catch (e) {} + + generateLitellmConfig(currentProvider, currentModel); + restartLitellm().then((ready) => { + console.log(`[litellm-mgr] Restarted with new key, ready=${ready}`); + }); + + res.writeHead(200, { "Content-Type": "application/json" }); + res.end(JSON.stringify({ ok: true })); + }); +} + // --------------------------------------------------------------------------- // /api/litellm-health handler // --------------------------------------------------------------------------- function handleLitellmHealth(req, res) { - const healthReq = http.get(`http://127.0.0.1:${LITELLM_PORT}/health`, (healthRes) => { + const healthReq = http.get(`http://127.0.0.1:${LITELLM_PORT}/health/liveliness`, (healthRes) => { const chunks = []; healthRes.on("data", (c) => chunks.push(c)); healthRes.on("end", () => { @@ -651,6 +719,12 @@ const server = http.createServer((req, res) => { return; } + if (req.url === "/api/litellm-key" && req.method === "POST") { + setCorsHeaders(res); + handleLitellmKey(req, res); + return; + } + if (req.url === "/api/litellm-health") { setCorsHeaders(res); if (req.method === "OPTIONS") { diff --git a/sandboxes/nemoclaw/policy.yaml b/sandboxes/nemoclaw/policy.yaml index 3a1422e..749a058 100644 --- a/sandboxes/nemoclaw/policy.yaml +++ b/sandboxes/nemoclaw/policy.yaml @@ -82,10 +82,13 @@ network_policies: name: nvidia endpoints: - { host: integrate.api.nvidia.com, port: 443 } + - { host: inference-api.nvidia.com, port: 443 } binaries: - { path: 
/usr/bin/curl } - { path: /bin/bash } - { path: /usr/local/bin/opencode } + - { path: /usr/bin/python3 } + - { path: /usr/bin/python3.12 } nvidia_web: name: nvidia_web endpoints: From dc1d7acc61bc1daa308c43c618ffd8982afeb36b Mon Sep 17 00:00:00 2001 From: JR Morgan Date: Thu, 12 Mar 2026 11:37:11 -0700 Subject: [PATCH 07/25] Update welcome UI icon assets --- brev/welcome-ui/OpenShell-Icon.svg | 1 + brev/welcome-ui/openshell-mark.svg | 5 ----- 2 files changed, 1 insertion(+), 5 deletions(-) create mode 100644 brev/welcome-ui/OpenShell-Icon.svg delete mode 100644 brev/welcome-ui/openshell-mark.svg diff --git a/brev/welcome-ui/OpenShell-Icon.svg b/brev/welcome-ui/OpenShell-Icon.svg new file mode 100644 index 0000000..81bcd2c --- /dev/null +++ b/brev/welcome-ui/OpenShell-Icon.svg @@ -0,0 +1 @@ + \ No newline at end of file diff --git a/brev/welcome-ui/openshell-mark.svg b/brev/welcome-ui/openshell-mark.svg deleted file mode 100644 index 300ba64..0000000 --- a/brev/welcome-ui/openshell-mark.svg +++ /dev/null @@ -1,5 +0,0 @@ - - - - - From ce8197af187006d9aeba3d31722c9f9bba36eab5 Mon Sep 17 00:00:00 2001 From: JR Morgan Date: Thu, 12 Mar 2026 14:05:58 -0700 Subject: [PATCH 08/25] Add on-demand nemoclaw build; improve auto-pair --- sandboxes/nemoclaw/nemoclaw-start.sh | 30 ++++++++++++++++++++++++---- 1 file changed, 26 insertions(+), 4 deletions(-) diff --git a/sandboxes/nemoclaw/nemoclaw-start.sh b/sandboxes/nemoclaw/nemoclaw-start.sh index e1c35ce..541f2ed 100644 --- a/sandboxes/nemoclaw/nemoclaw-start.sh +++ b/sandboxes/nemoclaw/nemoclaw-start.sh @@ -210,6 +210,7 @@ json.dump(cfg, open(os.environ['HOME'] + '/.openclaw/openclaw.json', 'w'), inden " nohup openclaw gateway > /tmp/gateway.log 2>&1 & +echo "[gateway] openclaw gateway launched (pid $!)" # Copy the default policy to a writable location so that policy-proxy can # update it at runtime. 
/etc is read-only under Landlock, but /sandbox is @@ -228,17 +229,38 @@ _POLICY_PATH="${_POLICY_DST}" # /api/policy requests to read/write the sandbox policy file. NODE_PATH=$(npm root -g) POLICY_PATH=${_POLICY_PATH} UPSTREAM_PORT=${INTERNAL_GATEWAY_PORT} LISTEN_PORT=${PUBLIC_PORT} \ nohup node /usr/local/lib/policy-proxy.js >> /tmp/gateway.log 2>&1 & +echo "[gateway] policy-proxy launched (pid $!) upstream=${INTERNAL_GATEWAY_PORT} public=${PUBLIC_PORT}" # Auto-approve pending device pairing requests so the browser is paired # before the user notices the "pairing required" prompt in the Control UI. ( + echo "[auto-pair] watcher starting" _pair_deadline=$(($(date +%s) + 300)) + _pair_attempts=0 + _pair_approved=0 + _pair_errors=0 while [ "$(date +%s)" -lt "$_pair_deadline" ]; do sleep 0.5 - if openclaw devices approve --latest --json 2>/dev/null | grep -q '"ok"'; then - echo "[auto-pair] Approved pending device pairing request." + _pair_attempts=$((_pair_attempts + 1)) + _approve_output="$(openclaw devices approve --latest --json 2>&1 || true)" + + if printf '%s\n' "$_approve_output" | grep -q '"ok"[[:space:]]*:[[:space:]]*true'; then + _pair_approved=$((_pair_approved + 1)) + echo "[auto-pair] Approved pending device pairing request: ${_approve_output}" + continue + fi + + if [ -n "$_approve_output" ] && ! 
printf '%s\n' "$_approve_output" | grep -qiE 'no pending|no device|not paired|nothing to approve'; then + _pair_errors=$((_pair_errors + 1)) + echo "[auto-pair] approve --latest returned non-success output: ${_approve_output}" + fi + + if [ $((_pair_attempts % 20)) -eq 0 ]; then + _list_output="$(openclaw devices list --json 2>&1 || true)" + echo "[auto-pair] heartbeat attempts=${_pair_attempts} approved=${_pair_approved} errors=${_pair_errors} devices=${_list_output}" fi done + echo "[auto-pair] watcher exiting attempts=${_pair_attempts} approved=${_pair_approved} errors=${_pair_errors}" ) >> /tmp/gateway.log 2>&1 & CONFIG_FILE="${HOME}/.openclaw/openclaw.json" @@ -246,8 +268,8 @@ token=$(grep -o '"token"\s*:\s*"[^"]*"' "${CONFIG_FILE}" 2>/dev/null | head -1 | CHAT_UI_BASE="${CHAT_UI_URL%/}" if [ -n "${token}" ]; then - LOCAL_URL="http://127.0.0.1:18789/?token=${token}" - CHAT_URL="${CHAT_UI_BASE}/?token=${token}" + LOCAL_URL="http://127.0.0.1:18789/#token=${token}" + CHAT_URL="${CHAT_UI_BASE}/#token=${token}" else LOCAL_URL="http://127.0.0.1:18789/" CHAT_URL="${CHAT_UI_BASE}/" From 6c319fa6f30880def7290694d04eb29694778439 Mon Sep 17 00:00:00 2001 From: JR Morgan Date: Thu, 12 Mar 2026 15:38:44 -0700 Subject: [PATCH 09/25] Logo fixup, improve auto-approve cycle, NO_PROXY for localhost --- brev/welcome-ui/OpenShell-Icon-Logo.svg | 20 +++++++++++ sandboxes/nemoclaw/nemoclaw-start.sh | 36 ++++++++++++++++--- .../nemoclaw-ui-extension/extension/index.ts | 16 +++++++-- 3 files changed, 66 insertions(+), 6 deletions(-) create mode 100644 brev/welcome-ui/OpenShell-Icon-Logo.svg diff --git a/brev/welcome-ui/OpenShell-Icon-Logo.svg b/brev/welcome-ui/OpenShell-Icon-Logo.svg new file mode 100644 index 0000000..91e389d --- /dev/null +++ b/brev/welcome-ui/OpenShell-Icon-Logo.svg @@ -0,0 +1,20 @@ + + + + + + + + + + + diff --git a/sandboxes/nemoclaw/nemoclaw-start.sh b/sandboxes/nemoclaw/nemoclaw-start.sh index 541f2ed..06912a5 100644 --- a/sandboxes/nemoclaw/nemoclaw-start.sh 
+++ b/sandboxes/nemoclaw/nemoclaw-start.sh @@ -48,6 +48,12 @@ if [ -z "${CHAT_UI_URL:-}" ]; then exit 1 fi +# Keep local service-to-service traffic off the sandbox forward proxy. +# LiteLLM/OpenClaw must talk to 127.0.0.1 directly, while upstream NVIDIA +# requests should continue using the configured HTTP(S) proxy. +export NO_PROXY="${NO_PROXY:+${NO_PROXY},}127.0.0.1,localhost,::1" +export no_proxy="${no_proxy:+${no_proxy},}127.0.0.1,localhost,::1" + BUNDLE="$(npm root -g)/openclaw/dist/control-ui/assets/nemoclaw-devx.js" if [ -f "$BUNDLE" ]; then @@ -235,6 +241,26 @@ echo "[gateway] policy-proxy launched (pid $!) upstream=${INTERNAL_GATEWAY_PORT} # before the user notices the "pairing required" prompt in the Control UI. ( echo "[auto-pair] watcher starting" + _json_has_approval() { + jq -e ' + .device + | objects + | (.approvedAtMs? // empty) or ((.tokens? // []) | length > 0) + ' >/dev/null 2>&1 + } + + _summarize_device_list() { + jq -r ' + def labels($entries): + ($entries // []) + | map(select(type == "object" and (.deviceId? // "") != "") + | "\((.clientId // "unknown")):\((.deviceId // "")[0:12])"); + (labels(.pending)) as $pending + | (labels(.paired)) as $paired + | "pending=\($pending | length) [\(($pending | if length > 0 then join(", ") else "-" end))] paired=\($paired | length) [\(($paired | if length > 0 then join(", ") else "-" end))]" + ' 2>/dev/null || echo "unparseable" + } + _pair_deadline=$(($(date +%s) + 300)) _pair_attempts=0 _pair_approved=0 @@ -244,20 +270,22 @@ echo "[gateway] policy-proxy launched (pid $!) 
upstream=${INTERNAL_GATEWAY_PORT} _pair_attempts=$((_pair_attempts + 1)) _approve_output="$(openclaw devices approve --latest --json 2>&1 || true)" - if printf '%s\n' "$_approve_output" | grep -q '"ok"[[:space:]]*:[[:space:]]*true'; then + if printf '%s\n' "$_approve_output" | _json_has_approval; then _pair_approved=$((_pair_approved + 1)) - echo "[auto-pair] Approved pending device pairing request: ${_approve_output}" + _approved_device_id="$(printf '%s\n' "$_approve_output" | jq -r '.device.deviceId // ""' 2>/dev/null | cut -c1-12)" + echo "[auto-pair] approved request attempts=${_pair_attempts} count=${_pair_approved} device=${_approved_device_id:-unknown}" continue fi if [ -n "$_approve_output" ] && ! printf '%s\n' "$_approve_output" | grep -qiE 'no pending|no device|not paired|nothing to approve'; then _pair_errors=$((_pair_errors + 1)) - echo "[auto-pair] approve --latest returned non-success output: ${_approve_output}" + echo "[auto-pair] approve --latest unexpected output attempts=${_pair_attempts} errors=${_pair_errors}: ${_approve_output}" fi if [ $((_pair_attempts % 20)) -eq 0 ]; then _list_output="$(openclaw devices list --json 2>&1 || true)" - echo "[auto-pair] heartbeat attempts=${_pair_attempts} approved=${_pair_approved} errors=${_pair_errors} devices=${_list_output}" + _device_summary="$(printf '%s\n' "$_list_output" | _summarize_device_list)" + echo "[auto-pair] heartbeat attempts=${_pair_attempts} approved=${_pair_approved} errors=${_pair_errors} ${_device_summary}" fi done echo "[auto-pair] watcher exiting attempts=${_pair_attempts} approved=${_pair_approved} errors=${_pair_errors}" diff --git a/sandboxes/nemoclaw/nemoclaw-ui-extension/extension/index.ts b/sandboxes/nemoclaw/nemoclaw-ui-extension/extension/index.ts index 2d4a239..939ccdb 100644 --- a/sandboxes/nemoclaw/nemoclaw-ui-extension/extension/index.ts +++ b/sandboxes/nemoclaw/nemoclaw-ui-extension/extension/index.ts @@ -18,6 +18,9 @@ import { ingestKeysFromUrl, DEFAULT_MODEL, 
resolveApiKey, isKeyConfigured } from import { waitForReconnect } from "./gateway-bridge.ts"; import { syncKeysToProviders } from "./api-keys-page.ts"; +const INITIAL_CONNECT_TIMEOUT_MS = 30_000; +const POST_PAIRING_SETTLE_DELAY_MS = 15_000; + function inject(): boolean { const hasButton = injectButton(); const hasNav = injectNavGroup(); @@ -56,6 +59,11 @@ function showConnectOverlay(): void { document.body.prepend(overlay); } +function setConnectOverlayText(text: string): void { + const textNode = document.querySelector(".nemoclaw-connect-overlay__text"); + if (textNode) textNode.textContent = text; +} + function revealApp(): void { document.body.setAttribute("data-nemoclaw-ready", ""); const overlay = document.querySelector(".nemoclaw-connect-overlay"); @@ -68,8 +76,12 @@ function revealApp(): void { function bootstrap() { showConnectOverlay(); - waitForReconnect(30_000) - .then(revealApp) + waitForReconnect(INITIAL_CONNECT_TIMEOUT_MS) + .then(async () => { + setConnectOverlayText("Device pairing approved. 
Finalizing dashboard..."); + await new Promise((resolve) => setTimeout(resolve, POST_PAIRING_SETTLE_DELAY_MS)); + revealApp(); + }) .catch(revealApp); const keysIngested = ingestKeysFromUrl(); From 536e63c9efe34ae90ea1ede2fa9488e4d1e3ca6a Mon Sep 17 00:00:00 2001 From: JR Morgan Date: Thu, 12 Mar 2026 17:10:40 -0700 Subject: [PATCH 10/25] Bump defualt context window, set NO_PROXY widely --- sandboxes/nemoclaw/nemoclaw-start.sh | 8 ++++++++ sandboxes/openclaw/policy.yaml | 4 ++++ 2 files changed, 12 insertions(+) diff --git a/sandboxes/nemoclaw/nemoclaw-start.sh b/sandboxes/nemoclaw/nemoclaw-start.sh index 06912a5..a6b5518 100644 --- a/sandboxes/nemoclaw/nemoclaw-start.sh +++ b/sandboxes/nemoclaw/nemoclaw-start.sh @@ -101,6 +101,8 @@ export LITELLM_LOCAL_MODEL_COST_MAP="True" _DEFAULT_MODEL="moonshotai/kimi-k2.5" _DEFAULT_PROVIDER="nvidia-endpoints" +_DEFAULT_CONTEXT_WINDOW=200000 +_DEFAULT_MAX_TOKENS=8192 generate_litellm_config() { local model_id="${1:-$_DEFAULT_MODEL}" @@ -212,6 +214,12 @@ cfg['gateway']['controlUi'] = { 'allowInsecureAuth': True, 'allowedOrigins': origins, } +provider = cfg.get('models', {}).get('providers', {}).get('custom-127-0-0-1-4000') +if isinstance(provider, dict): + for model in provider.get('models', []): + if isinstance(model, dict) and model.get('id') == '${_DEFAULT_MODEL}': + model['contextWindow'] = ${_DEFAULT_CONTEXT_WINDOW} + model['maxTokens'] = ${_DEFAULT_MAX_TOKENS} json.dump(cfg, open(os.environ['HOME'] + '/.openclaw/openclaw.json', 'w'), indent=2) " diff --git a/sandboxes/openclaw/policy.yaml b/sandboxes/openclaw/policy.yaml index a91da84..a12c46b 100644 --- a/sandboxes/openclaw/policy.yaml +++ b/sandboxes/openclaw/policy.yaml @@ -125,3 +125,7 @@ network_policies: binaries: - { path: /usr/local/bin/claude } - { path: /usr/bin/gh } + +inference: + allowed_routes: + - local From ec4895452e19d9e0f3ae80d599e69262f6d1f9e3 Mon Sep 17 00:00:00 2001 From: JR Morgan Date: Fri, 13 Mar 2026 08:21:22 -0700 Subject: [PATCH 11/25] Extend 
timer for device auto approval, minimize wait --- sandboxes/nemoclaw/nemoclaw-start.sh | 21 ++++++++--- .../extension/gateway-bridge.ts | 36 +++++++++++++++++++ .../nemoclaw-ui-extension/extension/index.ts | 12 +++++-- 3 files changed, 63 insertions(+), 6 deletions(-) diff --git a/sandboxes/nemoclaw/nemoclaw-start.sh b/sandboxes/nemoclaw/nemoclaw-start.sh index a6b5518..522e648 100644 --- a/sandboxes/nemoclaw/nemoclaw-start.sh +++ b/sandboxes/nemoclaw/nemoclaw-start.sh @@ -249,6 +249,9 @@ echo "[gateway] policy-proxy launched (pid $!) upstream=${INTERNAL_GATEWAY_PORT} # before the user notices the "pairing required" prompt in the Control UI. ( echo "[auto-pair] watcher starting" + _pair_timeout_secs="${AUTO_PAIR_TIMEOUT_SECS:-1800}" + _pair_sleep_secs="0.5" + _pair_heartbeat_every=120 _json_has_approval() { jq -e ' .device @@ -269,12 +272,22 @@ echo "[gateway] policy-proxy launched (pid $!) upstream=${INTERNAL_GATEWAY_PORT} ' 2>/dev/null || echo "unparseable" } - _pair_deadline=$(($(date +%s) + 300)) + if [ "${_pair_timeout_secs}" -gt 0 ] 2>/dev/null; then + _pair_deadline=$(($(date +%s) + _pair_timeout_secs)) + echo "[auto-pair] watcher timeout=${_pair_timeout_secs}s" + else + _pair_deadline=0 + echo "[auto-pair] watcher timeout=disabled" + fi _pair_attempts=0 _pair_approved=0 _pair_errors=0 - while [ "$(date +%s)" -lt "$_pair_deadline" ]; do - sleep 0.5 + while true; do + if [ "${_pair_deadline}" -gt 0 ] && [ "$(date +%s)" -ge "${_pair_deadline}" ]; then + break + fi + + sleep "${_pair_sleep_secs}" _pair_attempts=$((_pair_attempts + 1)) _approve_output="$(openclaw devices approve --latest --json 2>&1 || true)" @@ -290,7 +303,7 @@ echo "[gateway] policy-proxy launched (pid $!) 
upstream=${INTERNAL_GATEWAY_PORT} echo "[auto-pair] approve --latest unexpected output attempts=${_pair_attempts} errors=${_pair_errors}: ${_approve_output}" fi - if [ $((_pair_attempts % 20)) -eq 0 ]; then + if [ $((_pair_attempts % _pair_heartbeat_every)) -eq 0 ]; then _list_output="$(openclaw devices list --json 2>&1 || true)" _device_summary="$(printf '%s\n' "$_list_output" | _summarize_device_list)" echo "[auto-pair] heartbeat attempts=${_pair_attempts} approved=${_pair_approved} errors=${_pair_errors} ${_device_summary}" diff --git a/sandboxes/nemoclaw/nemoclaw-ui-extension/extension/gateway-bridge.ts b/sandboxes/nemoclaw/nemoclaw-ui-extension/extension/gateway-bridge.ts index 8da56c0..dcdcce5 100644 --- a/sandboxes/nemoclaw/nemoclaw-ui-extension/extension/gateway-bridge.ts +++ b/sandboxes/nemoclaw/nemoclaw-ui-extension/extension/gateway-bridge.ts @@ -112,3 +112,39 @@ export function waitForReconnect(timeoutMs = 15_000): Promise { }, 500); }); } + +/** + * Wait until the app remains connected for a continuous stability window. + * + * This helps distinguish "socket connected for a moment" from "dashboard is + * actually ready to be revealed after pairing/bootstrap settles". + */ +export function waitForStableConnection( + stableForMs = 3_000, + timeoutMs = 15_000, +): Promise { + return new Promise((resolve, reject) => { + const start = Date.now(); + let connectedSince = isAppConnected() ? 
Date.now() : 0; + + const interval = setInterval(() => { + const now = Date.now(); + + if (isAppConnected()) { + if (!connectedSince) connectedSince = now; + if (now - connectedSince >= stableForMs) { + clearInterval(interval); + resolve(); + return; + } + } else { + connectedSince = 0; + } + + if (now - start > timeoutMs) { + clearInterval(interval); + reject(new Error("Timed out waiting for stable gateway connection")); + } + }, 500); + }); +} diff --git a/sandboxes/nemoclaw/nemoclaw-ui-extension/extension/index.ts b/sandboxes/nemoclaw/nemoclaw-ui-extension/extension/index.ts index 939ccdb..fc48f58 100644 --- a/sandboxes/nemoclaw/nemoclaw-ui-extension/extension/index.ts +++ b/sandboxes/nemoclaw/nemoclaw-ui-extension/extension/index.ts @@ -15,11 +15,12 @@ import { injectButton } from "./deploy-modal.ts"; import { injectNavGroup, activateNemoPage, watchOpenClawNavClicks } from "./nav-group.ts"; import { injectModelSelector, watchChatCompose } from "./model-selector.ts"; import { ingestKeysFromUrl, DEFAULT_MODEL, resolveApiKey, isKeyConfigured } from "./model-registry.ts"; -import { waitForReconnect } from "./gateway-bridge.ts"; +import { waitForReconnect, waitForStableConnection } from "./gateway-bridge.ts"; import { syncKeysToProviders } from "./api-keys-page.ts"; const INITIAL_CONNECT_TIMEOUT_MS = 30_000; const POST_PAIRING_SETTLE_DELAY_MS = 15_000; +const STABLE_CONNECTION_WINDOW_MS = 3_000; function inject(): boolean { const hasButton = injectButton(); @@ -79,7 +80,14 @@ function bootstrap() { waitForReconnect(INITIAL_CONNECT_TIMEOUT_MS) .then(async () => { setConnectOverlayText("Device pairing approved. 
Finalizing dashboard..."); - await new Promise((resolve) => setTimeout(resolve, POST_PAIRING_SETTLE_DELAY_MS)); + try { + await waitForStableConnection( + STABLE_CONNECTION_WINDOW_MS, + POST_PAIRING_SETTLE_DELAY_MS, + ); + } catch { + await new Promise((resolve) => setTimeout(resolve, POST_PAIRING_SETTLE_DELAY_MS)); + } revealApp(); }) .catch(revealApp); From 7d6355f8a46205ea0a4497562f04788f602f6d0a Mon Sep 17 00:00:00 2001 From: JR Morgan Date: Fri, 13 Mar 2026 08:55:32 -0700 Subject: [PATCH 12/25] Reload dashboard once after pairing approval --- .../nemoclaw-ui-extension/extension/index.ts | 37 ++++++++++++++++++- 1 file changed, 36 insertions(+), 1 deletion(-) diff --git a/sandboxes/nemoclaw/nemoclaw-ui-extension/extension/index.ts b/sandboxes/nemoclaw/nemoclaw-ui-extension/extension/index.ts index fc48f58..37f0e70 100644 --- a/sandboxes/nemoclaw/nemoclaw-ui-extension/extension/index.ts +++ b/sandboxes/nemoclaw/nemoclaw-ui-extension/extension/index.ts @@ -21,6 +21,7 @@ import { syncKeysToProviders } from "./api-keys-page.ts"; const INITIAL_CONNECT_TIMEOUT_MS = 30_000; const POST_PAIRING_SETTLE_DELAY_MS = 15_000; const STABLE_CONNECTION_WINDOW_MS = 3_000; +const PAIRING_RELOAD_FLAG = "nemoclaw:pairing-bootstrap-reloaded"; function inject(): boolean { const hasButton = injectButton(); @@ -74,6 +75,30 @@ function revealApp(): void { } } +function shouldForcePairingReload(): boolean { + try { + return sessionStorage.getItem(PAIRING_RELOAD_FLAG) !== "1"; + } catch { + return true; + } +} + +function markPairingReloadComplete(): void { + try { + sessionStorage.setItem(PAIRING_RELOAD_FLAG, "1"); + } catch { + // ignore storage failures + } +} + +function clearPairingReloadFlag(): void { + try { + sessionStorage.removeItem(PAIRING_RELOAD_FLAG); + } catch { + // ignore storage failures + } +} + function bootstrap() { showConnectOverlay(); @@ -88,9 +113,19 @@ function bootstrap() { } catch { await new Promise((resolve) => setTimeout(resolve, 
POST_PAIRING_SETTLE_DELAY_MS)); } + if (shouldForcePairingReload()) { + markPairingReloadComplete(); + setConnectOverlayText("Device pairing approved. Reloading dashboard..."); + window.location.reload(); + return; + } + clearPairingReloadFlag(); revealApp(); }) - .catch(revealApp); + .catch(() => { + clearPairingReloadFlag(); + revealApp(); + }); const keysIngested = ingestKeysFromUrl(); From e512644017b8f136478cf6c101e94123fdb40222 Mon Sep 17 00:00:00 2001 From: JR Morgan Date: Fri, 13 Mar 2026 10:24:29 -0700 Subject: [PATCH 13/25] Revert nemoclaw runtime back to inference.local --- brev/welcome-ui/server.js | 41 +-- sandboxes/nemoclaw/Dockerfile | 8 - sandboxes/nemoclaw/nemoclaw-start.sh | 117 +------ .../extension/model-registry.ts | 16 +- .../extension/model-selector.ts | 23 +- sandboxes/nemoclaw/policy-proxy.js | 300 +----------------- 6 files changed, 31 insertions(+), 474 deletions(-) diff --git a/brev/welcome-ui/server.js b/brev/welcome-ui/server.js index 240947b..0a12223 100644 --- a/brev/welcome-ui/server.js +++ b/brev/welcome-ui/server.js @@ -266,8 +266,7 @@ const injectKeyState = { }; // Raw API key stored in memory so it can be passed to the sandbox at -// creation time and forwarded to LiteLLM for inference. Not persisted -// to disk. +// creation time. Not persisted to disk. let _nvidiaApiKey = process.env.NVIDIA_INFERENCE_API_KEY || process.env.NVIDIA_INTEGRATE_API_KEY || ""; @@ -804,38 +803,6 @@ function runInjectKey(key, keyHash) { }); } -/** - * Forward the API key to the sandbox's LiteLLM instance via the - * policy-proxy's /api/litellm-key endpoint. This triggers a config - * regeneration and LiteLLM restart with the new key. 
- */ -function forwardKeyToSandbox(key) { - const body = JSON.stringify({ apiKey: key }); - const opts = { - hostname: "127.0.0.1", - port: SANDBOX_PORT, - path: "/api/litellm-key", - method: "POST", - headers: { - "Content-Type": "application/json", - "Content-Length": Buffer.byteLength(body), - }, - timeout: 10000, - }; - const req = http.request(opts, (res) => { - res.resume(); - if (res.statusCode === 200) { - log("inject-key", "Forwarded API key to sandbox LiteLLM"); - } else { - log("inject-key", `Sandbox LiteLLM key forward returned ${res.statusCode}`); - } - }); - req.on("error", (err) => { - log("inject-key", `Failed to forward key to sandbox: ${err.message}`); - }); - req.end(body); -} - // ── Provider CRUD ────────────────────────────────────────────────────────── function parseProviderDetail(stdout) { @@ -1323,12 +1290,6 @@ async function handleInjectKey(req, res) { runInjectKey(key, keyH); - // If the sandbox is already running, forward the key to LiteLLM inside - // the sandbox so it can authenticate with upstream NVIDIA APIs. - if (sandboxState.status === "running") { - forwardKeyToSandbox(key); - } - return jsonResponse(res, 202, { ok: true, started: true }); } diff --git a/sandboxes/nemoclaw/Dockerfile b/sandboxes/nemoclaw/Dockerfile index 9a5d96e..c07b6d6 100644 --- a/sandboxes/nemoclaw/Dockerfile +++ b/sandboxes/nemoclaw/Dockerfile @@ -16,9 +16,6 @@ FROM ${BASE_IMAGE} USER root -ENV NO_PROXY=127.0.0.1,localhost,::1 -ENV no_proxy=127.0.0.1,localhost,::1 - RUN apt-get update && \ apt-get install -y --no-install-recommends jq && \ rm -rf /var/lib/apt/lists/* @@ -34,11 +31,6 @@ COPY policy-proxy.js /usr/local/lib/policy-proxy.js COPY proto/ /usr/local/lib/nemoclaw-proto/ RUN npm install -g @grpc/grpc-js @grpc/proto-loader js-yaml -# Install LiteLLM proxy for streaming-capable local LLM inference routing. -# LiteLLM handles SSE streaming natively, bypassing the sandbox proxy's -# inference interception path which buffers responses and times out. 
-RUN python3 -m pip install --no-cache-dir --break-system-packages 'litellm[proxy]' - # Fix @hono/node-server authorization bypass (GHSA-wc8c-qw6v-h7f6) RUN npm install -g @hono/node-server@1.19.11 diff --git a/sandboxes/nemoclaw/nemoclaw-start.sh b/sandboxes/nemoclaw/nemoclaw-start.sh index 522e648..e1f1282 100644 --- a/sandboxes/nemoclaw/nemoclaw-start.sh +++ b/sandboxes/nemoclaw/nemoclaw-start.sh @@ -48,12 +48,6 @@ if [ -z "${CHAT_UI_URL:-}" ]; then exit 1 fi -# Keep local service-to-service traffic off the sandbox forward proxy. -# LiteLLM/OpenClaw must talk to 127.0.0.1 directly, while upstream NVIDIA -# requests should continue using the configured HTTP(S) proxy. -export NO_PROXY="${NO_PROXY:+${NO_PROXY},}127.0.0.1,localhost,::1" -export no_proxy="${no_proxy:+${no_proxy},}127.0.0.1,localhost,::1" - BUNDLE="$(npm root -g)/openclaw/dist/control-ui/assets/nemoclaw-devx.js" if [ -f "$BUNDLE" ]; then @@ -72,109 +66,11 @@ if [ -f "$BUNDLE" ]; then fi # -------------------------------------------------------------------------- -# LiteLLM streaming inference proxy -# -# LiteLLM runs on localhost:4000 and provides streaming-capable inference -# routing. This bypasses the sandbox proxy's inference.local interception -# path which buffers entire responses and has a 60s hard timeout. +# Onboard and start the gateway # -------------------------------------------------------------------------- -LITELLM_PORT=4000 -LITELLM_CONFIG="/tmp/litellm_config.yaml" -LITELLM_LOG="/tmp/litellm.log" - -NVIDIA_NIM_API_KEY="${NVIDIA_INFERENCE_API_KEY:-${NVIDIA_INTEGRATE_API_KEY:-}}" -export NVIDIA_NIM_API_KEY - -# Persist the API key to a well-known file so the policy-proxy can read -# it later when regenerating the LiteLLM config (e.g. on model switch or -# late key injection from the welcome UI). 
-LITELLM_KEY_FILE="/tmp/litellm_api_key" -if [ -n "$NVIDIA_NIM_API_KEY" ]; then - echo -n "$NVIDIA_NIM_API_KEY" > "$LITELLM_KEY_FILE" - chmod 600 "$LITELLM_KEY_FILE" -fi - -# Use the local bundled cost map to avoid a blocked HTTPS fetch to GitHub -# at startup (the sandbox network policy doesn't allow Python to reach -# raw.githubusercontent.com, causing a ~5s timeout on every start). -export LITELLM_LOCAL_MODEL_COST_MAP="True" - _DEFAULT_MODEL="moonshotai/kimi-k2.5" -_DEFAULT_PROVIDER="nvidia-endpoints" _DEFAULT_CONTEXT_WINDOW=200000 _DEFAULT_MAX_TOKENS=8192 - -generate_litellm_config() { - local model_id="${1:-$_DEFAULT_MODEL}" - local provider="${2:-$_DEFAULT_PROVIDER}" - local api_base="" - local litellm_prefix="nvidia_nim" - local api_key="${NVIDIA_NIM_API_KEY:-}" - - # Read from persisted key file if env var is empty. - if [ -z "$api_key" ] && [ -f "$LITELLM_KEY_FILE" ]; then - api_key="$(cat "$LITELLM_KEY_FILE")" - fi - - case "$provider" in - nvidia-endpoints) - api_base="https://integrate.api.nvidia.com/v1" ;; - nvidia-inference) - api_base="https://inference-api.nvidia.com/v1" ;; - *) - api_base="https://integrate.api.nvidia.com/v1" ;; - esac - - # Write the actual key value into the config. Using os.environ/ references - # is fragile inside the sandbox where env vars may not be propagated to all - # child processes. If no key is available yet, use a placeholder — the - # policy-proxy will regenerate the config when the key arrives. - local key_yaml - if [ -n "$api_key" ]; then - key_yaml=" api_key: \"${api_key}\"" - else - key_yaml=" api_key: \"key-not-yet-configured\"" - fi - - cat > "$LITELLM_CONFIG" <> "$LITELLM_LOG" 2>&1 & -echo "[litellm] Starting on 127.0.0.1:${LITELLM_PORT} (pid $!)" - -# Wait for LiteLLM to accept connections before proceeding. -# Use /health/liveliness (basic liveness, no model checks) and --noproxy -# to bypass the sandbox HTTP proxy for localhost connections. -_litellm_deadline=$(($(date +%s) + 60)) -while ! 
curl -sf --noproxy 127.0.0.1 "http://127.0.0.1:${LITELLM_PORT}/health/liveliness" >/dev/null 2>&1; do - if [ "$(date +%s)" -ge "$_litellm_deadline" ]; then - echo "[litellm] WARNING: LiteLLM did not become ready within 60s. Continuing anyway." - break - fi - sleep 1 -done - -# -------------------------------------------------------------------------- -# Onboard and start the gateway -# -------------------------------------------------------------------------- export NVIDIA_API_KEY="${NVIDIA_INFERENCE_API_KEY:- }" _ONBOARD_KEY="${NVIDIA_INFERENCE_API_KEY:-not-used}" openclaw onboard \ @@ -185,9 +81,9 @@ openclaw onboard \ --skip-skills \ --skip-health \ --auth-choice custom-api-key \ - --custom-base-url "http://127.0.0.1:${LITELLM_PORT}/v1" \ - --custom-model-id "$_DEFAULT_MODEL" \ - --custom-api-key "sk-nemoclaw-local" \ + --custom-base-url "https://inference.local/v1" \ + --custom-model-id "-" \ + --custom-api-key "$_ONBOARD_KEY" \ --secret-input-mode plaintext \ --custom-compatibility openai \ --gateway-port 18788 \ @@ -214,8 +110,9 @@ cfg['gateway']['controlUi'] = { 'allowInsecureAuth': True, 'allowedOrigins': origins, } -provider = cfg.get('models', {}).get('providers', {}).get('custom-127-0-0-1-4000') -if isinstance(provider, dict): +for provider in cfg.get('models', {}).get('providers', {}).values(): + if not isinstance(provider, dict): + continue for model in provider.get('models', []): if isinstance(model, dict) and model.get('id') == '${_DEFAULT_MODEL}': model['contextWindow'] = ${_DEFAULT_CONTEXT_WINDOW} diff --git a/sandboxes/nemoclaw/nemoclaw-ui-extension/extension/model-registry.ts b/sandboxes/nemoclaw/nemoclaw-ui-extension/extension/model-registry.ts index da97edc..9016971 100644 --- a/sandboxes/nemoclaw/nemoclaw-ui-extension/extension/model-registry.ts +++ b/sandboxes/nemoclaw/nemoclaw-ui-extension/extension/model-registry.ts @@ -118,8 +118,8 @@ export interface ModelEntry { } // 
--------------------------------------------------------------------------- -// Curated models — hardcoded presets routed through the local LiteLLM proxy. -// LiteLLM handles upstream credential injection and SSE streaming natively. +// Curated models — hardcoded presets routed through inference.local. +// The NemoClaw proxy injects credentials based on the providerName. // --------------------------------------------------------------------------- export interface CuratedModel { @@ -179,7 +179,7 @@ export function curatedToModelEntry(c: CuratedModel): ModelEntry { keyType: "inference", isDynamic: true, providerConfig: { - baseUrl: "http://127.0.0.1:4000/v1", + baseUrl: "https://inference.local/v1", api: "openai-completions", models: [ { @@ -215,7 +215,7 @@ export const MODEL_REGISTRY: readonly ModelEntry[] = [ modelRef: `${DEFAULT_PROVIDER_KEY}/moonshotai/kimi-k2.5`, keyType: "inference", providerConfig: { - baseUrl: "http://127.0.0.1:4000/v1", + baseUrl: "https://inference.local/v1", api: "openai-completions", models: [ { @@ -267,8 +267,8 @@ export function getModelByCuratedModelId(modelId: string): ModelEntry | undefine /** * Build a ModelEntry for a provider managed through the inference tab. - * These route through the local LiteLLM proxy which handles credentials - * and streaming, so no client-side API key is needed. + * These route through inference.local where the proxy injects credentials, + * so no client-side API key is needed. 
*/ export function buildDynamicEntry( providerName: string, @@ -288,7 +288,7 @@ export function buildDynamicEntry( keyType: "inference", isDynamic: true, providerConfig: { - baseUrl: "http://127.0.0.1:4000/v1", + baseUrl: "https://inference.local/v1", api: "openai-completions", models: [ { @@ -328,7 +328,7 @@ export function buildQuickSelectEntry( keyType: "inference", isDynamic: true, providerConfig: { - baseUrl: "http://127.0.0.1:4000/v1", + baseUrl: "https://inference.local/v1", api: "openai-completions", models: [ { diff --git a/sandboxes/nemoclaw/nemoclaw-ui-extension/extension/model-selector.ts b/sandboxes/nemoclaw/nemoclaw-ui-extension/extension/model-selector.ts index 7b2fbe6..3c897ce 100644 --- a/sandboxes/nemoclaw/nemoclaw-ui-extension/extension/model-selector.ts +++ b/sandboxes/nemoclaw/nemoclaw-ui-extension/extension/model-selector.ts @@ -2,11 +2,11 @@ * NeMoClaw DevX — Model Selector * * Dropdown injected into the chat compose area that lets users pick a - * model. For models routed through the local LiteLLM proxy (curated + - * dynamic), switching only updates the NemoClaw cluster-inference route - * — no OpenClaw config.patch is needed because the LiteLLM proxy - * handles model routing and streaming natively. This avoids the - * gateway disconnect that config.patch causes. + * model. For models routed through inference.local (curated + dynamic), + * switching only updates the NemoClaw cluster-inference route — no + * OpenClaw config.patch is needed because the NemoClaw proxy rewrites + * the model field in every request body. This avoids the gateway + * disconnect that config.patch causes. * * Models are fetched dynamically from the NemoClaw runtime (providers * and active route configured in the Inference tab). 
@@ -264,14 +264,14 @@ function dismissTransitionBanner(): void { // --------------------------------------------------------------------------- /** - * Returns true if the model routes through the local LiteLLM proxy, - * meaning credential injection and streaming are handled server-side. + * Returns true if the model routes through inference.local, meaning the + * NemoClaw proxy manages credential injection and model rewriting. * For these models we only need to update the cluster-inference route — * no OpenClaw config.patch (and therefore no gateway disconnect). */ function isProxyManaged(entry: ModelEntry): boolean { return entry.isDynamic === true || - entry.providerConfig.baseUrl === "http://127.0.0.1:4000/v1"; + entry.providerConfig.baseUrl === "https://inference.local/v1"; } async function applyModelSelection( @@ -295,9 +295,10 @@ async function applyModelSelection( try { if (isProxyManaged(entry)) { - // Proxy-managed models route through the local LiteLLM proxy. We - // update the cluster-inference route and LiteLLM is restarted with the - // new model config (no OpenClaw config.patch, no gateway disconnect). + // Proxy-managed models route through inference.local. We update the + // NemoClaw cluster-inference route (no OpenClaw config.patch, no + // gateway disconnect). The sandbox polls every ~30s for route + // updates, so we show an honest propagation countdown. 
const curated = getCuratedByModelId(entry.providerConfig.models[0]?.id || ""); const provName = curated?.providerName || entry.providerKey.replace(/^dynamic-/, ""); const modelId = entry.providerConfig.models[0]?.id || ""; diff --git a/sandboxes/nemoclaw/policy-proxy.js b/sandboxes/nemoclaw/policy-proxy.js index 308cc8b..ea479f6 100644 --- a/sandboxes/nemoclaw/policy-proxy.js +++ b/sandboxes/nemoclaw/policy-proxy.js @@ -418,286 +418,15 @@ function syncAndRespond(yamlBody, res, t0) { }); } -// --------------------------------------------------------------------------- -// LiteLLM config manager -// -// When the user switches models via the UI, the extension POSTs to -// /api/cluster-inference. After forwarding to the gateway we regenerate -// the LiteLLM config and restart the proxy so the new model takes effect. -// --------------------------------------------------------------------------- - -const { execFile } = require("child_process"); - -const LITELLM_PORT = 4000; -const LITELLM_CONFIG_PATH = "/tmp/litellm_config.yaml"; -const LITELLM_LOG_PATH = "/tmp/litellm.log"; -const LITELLM_KEY_FILE = "/tmp/litellm_api_key"; - -const PROVIDER_MAP = { - "nvidia-endpoints": { - litellmPrefix: "nvidia_nim", - apiBase: "https://integrate.api.nvidia.com/v1", - }, - "nvidia-inference": { - litellmPrefix: "nvidia_nim", - apiBase: "https://inference-api.nvidia.com/v1", - }, -}; - -let litellmPid = null; - -function readApiKey() { - try { - const key = fs.readFileSync(LITELLM_KEY_FILE, "utf8").trim(); - if (key) return key; - } catch (e) {} - return process.env.NVIDIA_NIM_API_KEY || ""; -} - -function writeApiKey(key) { - fs.writeFileSync(LITELLM_KEY_FILE, key, { mode: 0o600 }); -} - -function generateLitellmConfig(providerName, modelId) { - const provider = PROVIDER_MAP[providerName] || PROVIDER_MAP["nvidia-endpoints"]; - const fullModel = `${provider.litellmPrefix}/${modelId}`; - const apiKey = readApiKey() || "key-not-yet-configured"; - - const config = [ - "model_list:", - ' 
- model_name: "*"', - " litellm_params:", - ` model: "${fullModel}"`, - ` api_key: "${apiKey}"`, - ` api_base: "${provider.apiBase}"`, - "general_settings:", - " master_key: sk-nemoclaw-local", - "litellm_settings:", - " request_timeout: 600", - " drop_params: true", - " num_retries: 0", - "", - ].join("\n"); - - fs.writeFileSync(LITELLM_CONFIG_PATH, config, "utf8"); - const keyStatus = apiKey === "key-not-yet-configured" ? "missing" : "present"; - console.log(`[litellm-mgr] Config written: model=${fullModel} api_base=${provider.apiBase} key=${keyStatus}`); -} - -function restartLitellm() { - return new Promise((resolve) => { - if (litellmPid) { - try { - process.kill(litellmPid, "SIGTERM"); - console.log(`[litellm-mgr] Sent SIGTERM to old LiteLLM (pid ${litellmPid})`); - } catch (e) { - // Process may have already exited. - } - litellmPid = null; - } - - // Brief grace period for the old process to release the port. - setTimeout(() => { - const logFd = fs.openSync(LITELLM_LOG_PATH, "a"); - const env = { ...process.env, LITELLM_LOCAL_MODEL_COST_MAP: "True" }; - const child = execFile( - "litellm", - ["--config", LITELLM_CONFIG_PATH, "--port", String(LITELLM_PORT), "--host", "127.0.0.1"], - { stdio: ["ignore", logFd, logFd], detached: true, env } - ); - child.unref(); - litellmPid = child.pid; - console.log(`[litellm-mgr] Started new LiteLLM (pid ${litellmPid})`); - fs.closeSync(logFd); - - // Wait for the liveness endpoint (no model connectivity checks). 
- let attempts = 0; - const maxAttempts = 60; - const poll = setInterval(() => { - attempts++; - const healthReq = http.get(`http://127.0.0.1:${LITELLM_PORT}/health/liveliness`, (healthRes) => { - if (healthRes.statusCode === 200) { - clearInterval(poll); - console.log(`[litellm-mgr] LiteLLM ready after ${attempts}s`); - resolve(true); - } - healthRes.resume(); - }); - healthReq.on("error", () => {}); - healthReq.setTimeout(800, () => healthReq.destroy()); - if (attempts >= maxAttempts) { - clearInterval(poll); - console.warn("[litellm-mgr] LiteLLM did not become ready within 60s"); - resolve(false); - } - }, 1000); - }, 500); - }); -} - -// Discover existing LiteLLM pid at startup so we can manage restarts. -try { - const { execSync } = require("child_process"); - const pidStr = execSync(`pgrep -f "litellm.*--port ${LITELLM_PORT}" 2>/dev/null || true`, { encoding: "utf8" }).trim(); - if (pidStr) { - litellmPid = parseInt(pidStr.split("\n")[0], 10); - console.log(`[litellm-mgr] Discovered existing LiteLLM pid: ${litellmPid}`); - } -} catch (e) {} - -// --------------------------------------------------------------------------- -// /api/cluster-inference intercept -// --------------------------------------------------------------------------- - -function handleClusterInferencePost(clientReq, clientRes) { - const chunks = []; - clientReq.on("data", (chunk) => chunks.push(chunk)); - clientReq.on("end", () => { - const rawBody = Buffer.concat(chunks); - let payload; - try { - payload = JSON.parse(rawBody.toString("utf8")); - } catch (e) { - clientRes.writeHead(400, { "Content-Type": "application/json" }); - clientRes.end(JSON.stringify({ error: "invalid JSON" })); - return; - } - - // Forward the original request to the upstream gateway first. 
- const opts = { - hostname: UPSTREAM_HOST, - port: UPSTREAM_PORT, - path: clientReq.url, - method: clientReq.method, - headers: { ...clientReq.headers, "content-length": rawBody.length }, - }; - - const upstream = http.request(opts, (upstreamRes) => { - const upChunks = []; - upstreamRes.on("data", (c) => upChunks.push(c)); - upstreamRes.on("end", () => { - const upBody = Buffer.concat(upChunks); - clientRes.writeHead(upstreamRes.statusCode, upstreamRes.headers); - clientRes.end(upBody); - - // On success, regenerate LiteLLM config and restart. - if (upstreamRes.statusCode >= 200 && upstreamRes.statusCode < 300) { - const providerName = payload.providerName || "nvidia-endpoints"; - const modelId = payload.modelId || payload.model || ""; - if (modelId) { - console.log(`[litellm-mgr] Model switch detected: provider=${providerName} model=${modelId}`); - generateLitellmConfig(providerName, modelId); - restartLitellm().then((ready) => { - console.log(`[litellm-mgr] Restart complete, ready=${ready}`); - }); - } - } - }); - }); - - upstream.on("error", (err) => { - console.error("[litellm-mgr] upstream error on cluster-inference forward:", err.message); - if (!clientRes.headersSent) { - clientRes.writeHead(502, { "Content-Type": "application/json" }); - } - clientRes.end(JSON.stringify({ error: "upstream unavailable" })); - }); - - upstream.end(rawBody); - }); -} - -// --------------------------------------------------------------------------- -// /api/litellm-key handler — accepts an API key update from the welcome UI -// --------------------------------------------------------------------------- - -function handleLitellmKey(req, res) { - const chunks = []; - req.on("data", (c) => chunks.push(c)); - req.on("end", () => { - let body; - try { - body = JSON.parse(Buffer.concat(chunks).toString("utf8")); - } catch (e) { - res.writeHead(400, { "Content-Type": "application/json" }); - res.end(JSON.stringify({ error: "invalid JSON" })); - return; - } - - const apiKey = 
(body.apiKey || "").trim(); - if (!apiKey) { - res.writeHead(400, { "Content-Type": "application/json" }); - res.end(JSON.stringify({ error: "missing apiKey" })); - return; - } - - console.log(`[litellm-mgr] API key update received (${apiKey.length} chars)`); - writeApiKey(apiKey); - - // Read the current config to extract the model/provider, then regenerate - // with the new key. - let currentModel = "moonshotai/kimi-k2.5"; - let currentProvider = "nvidia-endpoints"; - try { - const cfg = fs.readFileSync(LITELLM_CONFIG_PATH, "utf8"); - const modelMatch = cfg.match(/model:\s*"[^/]+\/(.+?)"/); - if (modelMatch) currentModel = modelMatch[1]; - const baseMatch = cfg.match(/api_base:\s*"(.+?)"/); - if (baseMatch) { - const base = baseMatch[1]; - for (const [name, p] of Object.entries(PROVIDER_MAP)) { - if (p.apiBase === base) { currentProvider = name; break; } - } - } - } catch (e) {} - - generateLitellmConfig(currentProvider, currentModel); - restartLitellm().then((ready) => { - console.log(`[litellm-mgr] Restarted with new key, ready=${ready}`); - }); - - res.writeHead(200, { "Content-Type": "application/json" }); - res.end(JSON.stringify({ ok: true })); - }); -} - -// --------------------------------------------------------------------------- -// /api/litellm-health handler -// --------------------------------------------------------------------------- - -function handleLitellmHealth(req, res) { - const healthReq = http.get(`http://127.0.0.1:${LITELLM_PORT}/health/liveliness`, (healthRes) => { - const chunks = []; - healthRes.on("data", (c) => chunks.push(c)); - healthRes.on("end", () => { - res.writeHead(healthRes.statusCode, { "Content-Type": "application/json" }); - res.end(Buffer.concat(chunks)); - }); - }); - healthReq.on("error", (err) => { - res.writeHead(503, { "Content-Type": "application/json" }); - res.end(JSON.stringify({ error: "litellm unreachable", detail: err.message, pid: litellmPid })); - }); - healthReq.setTimeout(3000, () => { - 
healthReq.destroy(); - res.writeHead(504, { "Content-Type": "application/json" }); - res.end(JSON.stringify({ error: "litellm health check timed out", pid: litellmPid })); - }); -} - // --------------------------------------------------------------------------- // HTTP server // --------------------------------------------------------------------------- -function setCorsHeaders(res) { - res.setHeader("Access-Control-Allow-Origin", "*"); - res.setHeader("Access-Control-Allow-Methods", "GET, POST, OPTIONS"); - res.setHeader("Access-Control-Allow-Headers", "Content-Type, Authorization"); -} - const server = http.createServer((req, res) => { if (req.url === "/api/policy") { - setCorsHeaders(res); + res.setHeader("Access-Control-Allow-Origin", "*"); + res.setHeader("Access-Control-Allow-Methods", "GET, POST, OPTIONS"); + res.setHeader("Access-Control-Allow-Headers", "Content-Type"); if (req.method === "OPTIONS") { res.writeHead(204); @@ -713,29 +442,6 @@ const server = http.createServer((req, res) => { return; } - if (req.url === "/api/cluster-inference" && req.method === "POST") { - setCorsHeaders(res); - handleClusterInferencePost(req, res); - return; - } - - if (req.url === "/api/litellm-key" && req.method === "POST") { - setCorsHeaders(res); - handleLitellmKey(req, res); - return; - } - - if (req.url === "/api/litellm-health") { - setCorsHeaders(res); - if (req.method === "OPTIONS") { - res.writeHead(204); - res.end(); - } else { - handleLitellmHealth(req, res); - } - return; - } - proxyRequest(req, res); }); From 10d871a91035d858afeecd5e69961a28e96d40a8 Mon Sep 17 00:00:00 2001 From: JR Morgan Date: Fri, 13 Mar 2026 10:26:25 -0700 Subject: [PATCH 14/25] Keep pairing watcher alive until approval --- sandboxes/nemoclaw/nemoclaw-start.sh | 2 +- .../nemoclaw-ui-extension/extension/index.ts | 47 +++++++++++-------- 2 files changed, 29 insertions(+), 20 deletions(-) diff --git a/sandboxes/nemoclaw/nemoclaw-start.sh b/sandboxes/nemoclaw/nemoclaw-start.sh index 
e1f1282..bc82fa9 100644 --- a/sandboxes/nemoclaw/nemoclaw-start.sh +++ b/sandboxes/nemoclaw/nemoclaw-start.sh @@ -146,7 +146,7 @@ echo "[gateway] policy-proxy launched (pid $!) upstream=${INTERNAL_GATEWAY_PORT} # before the user notices the "pairing required" prompt in the Control UI. ( echo "[auto-pair] watcher starting" - _pair_timeout_secs="${AUTO_PAIR_TIMEOUT_SECS:-1800}" + _pair_timeout_secs="${AUTO_PAIR_TIMEOUT_SECS:-0}" _pair_sleep_secs="0.5" _pair_heartbeat_every=120 _json_has_approval() { diff --git a/sandboxes/nemoclaw/nemoclaw-ui-extension/extension/index.ts b/sandboxes/nemoclaw/nemoclaw-ui-extension/extension/index.ts index 37f0e70..249538b 100644 --- a/sandboxes/nemoclaw/nemoclaw-ui-extension/extension/index.ts +++ b/sandboxes/nemoclaw/nemoclaw-ui-extension/extension/index.ts @@ -19,6 +19,7 @@ import { waitForReconnect, waitForStableConnection } from "./gateway-bridge.ts"; import { syncKeysToProviders } from "./api-keys-page.ts"; const INITIAL_CONNECT_TIMEOUT_MS = 30_000; +const EXTENDED_CONNECT_TIMEOUT_MS = 300_000; const POST_PAIRING_SETTLE_DELAY_MS = 15_000; const STABLE_CONNECTION_WINDOW_MS = 3_000; const PAIRING_RELOAD_FLAG = "nemoclaw:pairing-bootstrap-reloaded"; @@ -102,29 +103,37 @@ function clearPairingReloadFlag(): void { function bootstrap() { showConnectOverlay(); + const finalizeConnectedState = async () => { + setConnectOverlayText("Device pairing approved. Finalizing dashboard..."); + try { + await waitForStableConnection( + STABLE_CONNECTION_WINDOW_MS, + POST_PAIRING_SETTLE_DELAY_MS, + ); + } catch { + await new Promise((resolve) => setTimeout(resolve, POST_PAIRING_SETTLE_DELAY_MS)); + } + if (shouldForcePairingReload()) { + markPairingReloadComplete(); + setConnectOverlayText("Device pairing approved. Reloading dashboard..."); + window.location.reload(); + return; + } + clearPairingReloadFlag(); + revealApp(); + }; + waitForReconnect(INITIAL_CONNECT_TIMEOUT_MS) - .then(async () => { - setConnectOverlayText("Device pairing approved. 
Finalizing dashboard..."); + .then(finalizeConnectedState) + .catch(async () => { + setConnectOverlayText("Still waiting for device pairing approval..."); try { - await waitForStableConnection( - STABLE_CONNECTION_WINDOW_MS, - POST_PAIRING_SETTLE_DELAY_MS, - ); + await waitForReconnect(EXTENDED_CONNECT_TIMEOUT_MS); + await finalizeConnectedState(); } catch { - await new Promise((resolve) => setTimeout(resolve, POST_PAIRING_SETTLE_DELAY_MS)); - } - if (shouldForcePairingReload()) { - markPairingReloadComplete(); - setConnectOverlayText("Device pairing approved. Reloading dashboard..."); - window.location.reload(); - return; + clearPairingReloadFlag(); + revealApp(); } - clearPairingReloadFlag(); - revealApp(); - }) - .catch(() => { - clearPairingReloadFlag(); - revealApp(); }); const keysIngested = ingestKeysFromUrl(); From 9483694f53f259e1fa49f3a6b81a0b8e0e0d406e Mon Sep 17 00:00:00 2001 From: JR Morgan Date: Fri, 13 Mar 2026 12:21:59 -0700 Subject: [PATCH 15/25] Add proxy request tracing for sandbox launch --- brev/welcome-ui/server.js | 7 +++++++ sandboxes/nemoclaw/policy-proxy.js | 14 +++++++++++++- 2 files changed, 20 insertions(+), 1 deletion(-) diff --git a/brev/welcome-ui/server.js b/brev/welcome-ui/server.js index 0a12223..b0d58f9 100644 --- a/brev/welcome-ui/server.js +++ b/brev/welcome-ui/server.js @@ -1092,6 +1092,9 @@ async function handleClusterInferenceSet(req, res) { // ── Reverse proxy (HTTP) ─────────────────────────────────────────────────── function proxyToSandbox(clientReq, clientRes) { + logWelcome( + `proxy http in ${clientReq.method || "GET"} ${clientReq.url || "/"} -> 127.0.0.1:${SANDBOX_PORT}` + ); const headers = {}; for (const [key, val] of Object.entries(clientReq.headers)) { if (key.toLowerCase() === "host") continue; @@ -1109,6 +1112,9 @@ function proxyToSandbox(clientReq, clientRes) { }; const upstream = http.request(opts, (upstreamRes) => { + logWelcome( + `proxy http out ${clientReq.method || "GET"} ${clientReq.url || "/"} 
status=${upstreamRes.statusCode || 0}` + ); // Filter hop-by-hop + content-length (we'll set our own) const outHeaders = {}; for (const [key, val] of Object.entries(upstreamRes.headers)) { @@ -1147,6 +1153,7 @@ function proxyToSandbox(clientReq, clientRes) { // ── Reverse proxy (WebSocket) ────────────────────────────────────────────── function proxyWebSocket(req, clientSocket, head) { + logWelcome(`proxy ws in ${req.method || "GET"} ${req.url || "/"} -> 127.0.0.1:${SANDBOX_PORT}`); const upstream = net.createConnection( { host: "127.0.0.1", port: SANDBOX_PORT }, () => { diff --git a/sandboxes/nemoclaw/policy-proxy.js b/sandboxes/nemoclaw/policy-proxy.js index ea479f6..9030097 100644 --- a/sandboxes/nemoclaw/policy-proxy.js +++ b/sandboxes/nemoclaw/policy-proxy.js @@ -37,6 +37,11 @@ const WELL_KNOWN_ENDPOINT = "https://navigator.navigator.svc.cluster.local:8080" let gatewayEndpoint = ""; let sandboxName = ""; +function formatRequestLine(req) { + const host = req.headers.host || "unknown-host"; + return `${req.method || "GET"} ${req.url || "/"} host=${host}`; +} + // --------------------------------------------------------------------------- // Discovery helpers // --------------------------------------------------------------------------- @@ -312,6 +317,7 @@ function pushPolicyToGateway(yamlBody) { // --------------------------------------------------------------------------- function proxyRequest(clientReq, clientRes) { + console.log(`[policy-proxy] http in ${formatRequestLine(clientReq)} -> ${UPSTREAM_HOST}:${UPSTREAM_PORT}`); const opts = { hostname: UPSTREAM_HOST, port: UPSTREAM_PORT, @@ -321,6 +327,10 @@ function proxyRequest(clientReq, clientRes) { }; const upstream = http.request(opts, (upstreamRes) => { + console.log( + `[policy-proxy] http out ${clientReq.method || "GET"} ${clientReq.url || "/"} ` + + `status=${upstreamRes.statusCode || 0}` + ); clientRes.writeHead(upstreamRes.statusCode, upstreamRes.headers); upstreamRes.pipe(clientRes, { end: true }); 
}); @@ -341,6 +351,7 @@ function proxyRequest(clientReq, clientRes) { // --------------------------------------------------------------------------- function handlePolicyGet(req, res) { + console.log(`[policy-proxy] policy get ${formatRequestLine(req)}`); fs.readFile(POLICY_PATH, "utf8", (err, data) => { if (err) { res.writeHead(err.code === "ENOENT" ? 404 : 500, { @@ -356,7 +367,7 @@ function handlePolicyGet(req, res) { function handlePolicyPost(req, res) { const t0 = Date.now(); - console.log(`[policy-proxy] ── POST /api/policy received`); + console.log(`[policy-proxy] policy post ${formatRequestLine(req)}`); const chunks = []; req.on("data", (chunk) => chunks.push(chunk)); req.on("end", () => { @@ -447,6 +458,7 @@ const server = http.createServer((req, res) => { // WebSocket upgrade — pipe raw TCP to upstream server.on("upgrade", (req, socket, head) => { + console.log(`[policy-proxy] ws in ${formatRequestLine(req)} -> ${UPSTREAM_HOST}:${UPSTREAM_PORT}`); const upstream = net.createConnection({ host: UPSTREAM_HOST, port: UPSTREAM_PORT }, () => { const reqLine = `${req.method} ${req.url} HTTP/${req.httpVersion}\r\n`; let headers = ""; From b2f361c8bf2a7ad0092c239958ccdc0ee535af87 Mon Sep 17 00:00:00 2001 From: JR Morgan Date: Fri, 13 Mar 2026 12:24:46 -0700 Subject: [PATCH 16/25] Add override to skip nemoclaw image build --- brev/launch.sh | 10 +++++++++- 1 file changed, 9 insertions(+), 1 deletion(-) diff --git a/brev/launch.sh b/brev/launch.sh index 881a1af..b429498 100755 --- a/brev/launch.sh +++ b/brev/launch.sh @@ -33,6 +33,7 @@ CLI_RETRY_DELAY_SECS="${CLI_RETRY_DELAY_SECS:-3}" GHCR_LOGIN="${GHCR_LOGIN:-auto}" GHCR_USER="${GHCR_USER:-}" NEMOCLAW_IMAGE="${NEMOCLAW_IMAGE:-ghcr.io/nvidia/openshell-community/sandboxes/nemoclaw:latest}" +SKIP_NEMOCLAW_IMAGE_BUILD="${SKIP_NEMOCLAW_IMAGE_BUILD:-}" mkdir -p "$(dirname "$LAUNCH_LOG")" touch "$LAUNCH_LOG" @@ -254,6 +255,9 @@ docker_login_ghcr_if_needed() { } should_build_nemoclaw_image() { + if [[ 
"$SKIP_NEMOCLAW_IMAGE_BUILD" == "1" || "$SKIP_NEMOCLAW_IMAGE_BUILD" == "true" || "$SKIP_NEMOCLAW_IMAGE_BUILD" == "yes" ]]; then + return 1 + fi [[ -n "$COMMUNITY_REF" && "$COMMUNITY_REF" != "main" ]] } @@ -263,7 +267,11 @@ build_nemoclaw_image_if_needed() { local dockerfile_path="$image_context/Dockerfile" if ! should_build_nemoclaw_image; then - log "Skipping local NeMoClaw image build (COMMUNITY_REF=${COMMUNITY_REF:-})." + if [[ "$SKIP_NEMOCLAW_IMAGE_BUILD" == "1" || "$SKIP_NEMOCLAW_IMAGE_BUILD" == "true" || "$SKIP_NEMOCLAW_IMAGE_BUILD" == "yes" ]]; then + log "Skipping local NeMoClaw image build by override (SKIP_NEMOCLAW_IMAGE_BUILD=${SKIP_NEMOCLAW_IMAGE_BUILD})." + else + log "Skipping local NeMoClaw image build (COMMUNITY_REF=${COMMUNITY_REF:-})." + fi return fi From 6784eae86beba7da30a3b7eb3710ebcc8b0f8a2c Mon Sep 17 00:00:00 2001 From: JR Morgan Date: Fri, 13 Mar 2026 14:16:59 -0700 Subject: [PATCH 17/25] Add revised policy and NO_PROXY --- brev/welcome-ui/server.js | 9 +++++++++ sandboxes/nemoclaw/policy.yaml | 14 ++++++++++++++ 2 files changed, 23 insertions(+) diff --git a/brev/welcome-ui/server.js b/brev/welcome-ui/server.js index b0d58f9..4631874 100644 --- a/brev/welcome-ui/server.js +++ b/brev/welcome-ui/server.js @@ -639,6 +639,15 @@ function runSandboxCreate() { ]; if (policyPath) cmd.push("--policy", policyPath); const envArgs = [`CHAT_UI_URL=${chatUiUrl}`]; + const loopbackNoProxy = "127.0.0.1,localhost,::1"; + const mergedNoProxy = [ + process.env.NO_PROXY || process.env.no_proxy || "", + loopbackNoProxy, + ] + .filter(Boolean) + .join(","); + envArgs.push(`NO_PROXY=${mergedNoProxy}`); + envArgs.push(`no_proxy=${mergedNoProxy}`); const nvapiKey = _nvidiaApiKey || process.env.NVIDIA_INFERENCE_API_KEY || process.env.NVIDIA_INTEGRATE_API_KEY diff --git a/sandboxes/nemoclaw/policy.yaml b/sandboxes/nemoclaw/policy.yaml index 749a058..ae34f93 100644 --- a/sandboxes/nemoclaw/policy.yaml +++ b/sandboxes/nemoclaw/policy.yaml @@ -36,6 +36,20 @@ process: # 
SHA256 integrity is enforced in Rust via trust-on-first-use, not here. network_policies: + allow_navigator_navigator_svc_cluster_local_8080: + name: allow_navigator_navigator_svc_cluster_local_8080 + endpoints: + - host: navigator.navigator.svc.cluster.local + port: 8080 + binaries: + - path: /usr/bin/node + allow_registry_npmjs_org_443: + name: allow_registry_npmjs_org_443 + endpoints: + - host: registry.npmjs.org + port: 443 + binaries: + - path: /usr/bin/node claude_code: name: claude_code endpoints: From 29720c9fb4a007329a71920d074dea634314c27e Mon Sep 17 00:00:00 2001 From: JR Morgan Date: Fri, 13 Mar 2026 18:38:48 -0700 Subject: [PATCH 18/25] Fix unconditional chown --- sandboxes/nemoclaw/Dockerfile | 8 ++++++++ 1 file changed, 8 insertions(+) diff --git a/sandboxes/nemoclaw/Dockerfile b/sandboxes/nemoclaw/Dockerfile index c07b6d6..d04d19a 100644 --- a/sandboxes/nemoclaw/Dockerfile +++ b/sandboxes/nemoclaw/Dockerfile @@ -16,6 +16,10 @@ FROM ${BASE_IMAGE} USER root +RUN apt-get update && \ + apt-get install -y --no-install-recommends jq && \ + rm -rf /var/lib/apt/lists/* + RUN apt-get update && \ apt-get install -y --no-install-recommends jq && \ rm -rf /var/lib/apt/lists/* @@ -34,6 +38,10 @@ RUN npm install -g @grpc/grpc-js @grpc/proto-loader js-yaml # Fix @hono/node-server authorization bypass (GHSA-wc8c-qw6v-h7f6) RUN npm install -g @hono/node-server@1.19.11 +# Allow the sandbox user to read the default policy (the startup script +# copies it to a writable location; this chown covers non-Landlock envs). +# Some base image variants do not pre-create /etc/navigator. 
+RUN mkdir -p /etc/navigator && chown -R sandbox:sandbox /etc/navigator # Stage the NeMoClaw DevX extension source COPY nemoclaw-ui-extension/extension/ /opt/nemoclaw-devx/ From 61e84fa3a0ebf4adfbfab7e112165fcecb919751 Mon Sep 17 00:00:00 2001 From: JR Morgan Date: Fri, 13 Mar 2026 19:16:16 -0700 Subject: [PATCH 19/25] Added guarded reload for pairing; ensure custom policy.yaml bake-in --- README.md | 19 ++- sandboxes/nemoclaw/Dockerfile | 8 +- sandboxes/nemoclaw/nemoclaw-start.sh | 1 + .../nemoclaw-ui-extension/extension/index.ts | 14 +- sandboxes/nemoclaw/policy-proxy.js | 142 ++++++++++++++++++ 5 files changed, 178 insertions(+), 6 deletions(-) diff --git a/README.md b/README.md index 53762ab..489021e 100644 --- a/README.md +++ b/README.md @@ -30,7 +30,24 @@ This repo is the community ecosystem around OpenShell -- a hub for contributed s ### Quick Start with Brev -TODO: Add Brev instructions +#### Deploy Instantly with NVIDIA Brev + +Skip the setup and launch OpenShell Community on a fully configured Brev instance. + +| Instance | Best For | Deploy | +| -------- | -------- | ------ | +| CPU-only | External inference endpoints, remote APIs, lighter-weight sandbox workflows | Deploy on Brev | +| NVIDIA H100 | Locally hosted LLM endpoints, GPU-heavy sandboxes, higher-throughput agent workloads | Deploy on Brev | + +After the Brev instance is ready, bootstrap the Welcome UI: + +```bash +git clone https://github.com/NVIDIA/OpenShell-Community.git +cd OpenShell-Community +bash brev/launch.sh +``` + +The launcher brings up the Welcome UI on `http://localhost:8081`, where you can inject provider keys and create the NeMoClaw sandbox flow. 
### Using Sandboxes diff --git a/sandboxes/nemoclaw/Dockerfile b/sandboxes/nemoclaw/Dockerfile index d04d19a..686c3c3 100644 --- a/sandboxes/nemoclaw/Dockerfile +++ b/sandboxes/nemoclaw/Dockerfile @@ -20,9 +20,11 @@ RUN apt-get update && \ apt-get install -y --no-install-recommends jq && \ rm -rf /var/lib/apt/lists/* -RUN apt-get update && \ - apt-get install -y --no-install-recommends jq && \ - rm -rf /var/lib/apt/lists/* +# Bake the NeMoClaw default policy into the same location used by the +# OpenClaw base image so direct image launches and create-time --policy +# launches start from the same policy. +RUN mkdir -p /etc/navigator +COPY policy.yaml /etc/navigator/policy.yaml # Override the startup script with our version (adds runtime API key injection) COPY nemoclaw-start.sh /usr/local/bin/nemoclaw-start diff --git a/sandboxes/nemoclaw/nemoclaw-start.sh b/sandboxes/nemoclaw/nemoclaw-start.sh index bc82fa9..6e65f66 100644 --- a/sandboxes/nemoclaw/nemoclaw-start.sh +++ b/sandboxes/nemoclaw/nemoclaw-start.sh @@ -134,6 +134,7 @@ if [ ! -f "$_POLICY_DST" ] && [ -f "$_POLICY_SRC" ]; then fi _POLICY_PATH="${_POLICY_DST}" [ -f "$_POLICY_PATH" ] || _POLICY_PATH="$_POLICY_SRC" +echo "[gateway] policy path selected: ${_POLICY_PATH} (src=${_POLICY_SRC} dst=${_POLICY_DST})" # Start the policy reverse proxy on the public-facing port. 
It forwards all # traffic to the OpenClaw gateway on the internal port and intercepts diff --git a/sandboxes/nemoclaw/nemoclaw-ui-extension/extension/index.ts b/sandboxes/nemoclaw/nemoclaw-ui-extension/extension/index.ts index 249538b..89b1d96 100644 --- a/sandboxes/nemoclaw/nemoclaw-ui-extension/extension/index.ts +++ b/sandboxes/nemoclaw/nemoclaw-ui-extension/extension/index.ts @@ -21,7 +21,8 @@ import { syncKeysToProviders } from "./api-keys-page.ts"; const INITIAL_CONNECT_TIMEOUT_MS = 30_000; const EXTENDED_CONNECT_TIMEOUT_MS = 300_000; const POST_PAIRING_SETTLE_DELAY_MS = 15_000; -const STABLE_CONNECTION_WINDOW_MS = 3_000; +const STABLE_CONNECTION_WINDOW_MS = 10_000; +const STABLE_CONNECTION_TIMEOUT_MS = 45_000; const PAIRING_RELOAD_FLAG = "nemoclaw:pairing-bootstrap-reloaded"; function inject(): boolean { @@ -108,7 +109,7 @@ function bootstrap() { try { await waitForStableConnection( STABLE_CONNECTION_WINDOW_MS, - POST_PAIRING_SETTLE_DELAY_MS, + STABLE_CONNECTION_TIMEOUT_MS, ); } catch { await new Promise((resolve) => setTimeout(resolve, POST_PAIRING_SETTLE_DELAY_MS)); @@ -119,6 +120,15 @@ function bootstrap() { window.location.reload(); return; } + setConnectOverlayText("Device pairing approved. 
Verifying dashboard health..."); + try { + await waitForStableConnection( + STABLE_CONNECTION_WINDOW_MS, + STABLE_CONNECTION_TIMEOUT_MS, + ); + } catch { + await new Promise((resolve) => setTimeout(resolve, POST_PAIRING_SETTLE_DELAY_MS)); + } clearPairingReloadFlag(); revealApp(); }; diff --git a/sandboxes/nemoclaw/policy-proxy.js b/sandboxes/nemoclaw/policy-proxy.js index 9030097..e699e53 100644 --- a/sandboxes/nemoclaw/policy-proxy.js +++ b/sandboxes/nemoclaw/policy-proxy.js @@ -14,6 +14,7 @@ const http = require("http"); const fs = require("fs"); const os = require("os"); const net = require("net"); +const crypto = require("crypto"); const POLICY_PATH = process.env.POLICY_PATH || "/etc/openshell/policy.yaml"; const UPSTREAM_PORT = parseInt(process.env.UPSTREAM_PORT || "18788", 10); @@ -312,6 +313,145 @@ function pushPolicyToGateway(yamlBody) { }); } +function sha256Hex(text) { + return crypto.createHash("sha256").update(text, "utf8").digest("hex"); +} + +function hasCriticalNavigatorRule(parsed) { + const rule = parsed + && parsed.network_policies + && parsed.network_policies.allow_navigator_navigator_svc_cluster_local_8080; + if (!rule || !Array.isArray(rule.endpoints) || !Array.isArray(rule.binaries)) { + return false; + } + const hasEndpoint = rule.endpoints.some( + (ep) => ep && ep.host === "navigator.navigator.svc.cluster.local" && Number(ep.port) === 8080 + ); + const hasBinary = rule.binaries.some((bin) => bin && bin.path === "/usr/bin/node"); + return hasEndpoint && hasBinary; +} + +function policyStatusName(status) { + switch (status) { + case 1: return "PENDING"; + case 2: return "LOADED"; + case 3: return "FAILED"; + case 4: return "SUPERSEDED"; + default: return "UNSPECIFIED"; + } +} + +function auditStartupPolicyFile() { + let yaml; + try { + yaml = require("js-yaml"); + } catch (e) { + console.warn(`[policy-proxy] startup audit skipped: js-yaml unavailable (${e.message})`); + return; + } + + let raw; + try { + raw = fs.readFileSync(POLICY_PATH, 
"utf8"); + } catch (e) { + console.error(`[policy-proxy] startup audit failed: could not read ${POLICY_PATH}: ${e.message}`); + return; + } + + let parsed; + try { + parsed = yaml.load(raw); + } catch (e) { + console.error(`[policy-proxy] startup audit failed: YAML parse error in ${POLICY_PATH}: ${e.message}`); + return; + } + + const criticalRulePresent = hasCriticalNavigatorRule(parsed); + console.log( + `[policy-proxy] startup policy audit path=${POLICY_PATH} ` + + `sha256=${sha256Hex(raw)} version=${parsed && parsed.version ? parsed.version : 0} ` + + `critical_rule.allow_navigator_navigator_svc_cluster_local_8080=${criticalRulePresent}` + ); +} + +function listSandboxPolicies(request) { + return new Promise((resolve, reject) => { + grpcClient.ListSandboxPolicies(request, (err, response) => { + if (err) { + reject(err); + return; + } + resolve(response); + }); + }); +} + +function getSandboxPolicyStatus(request) { + return new Promise((resolve, reject) => { + grpcClient.GetSandboxPolicyStatus(request, (err, response) => { + if (err) { + reject(err); + return; + } + resolve(response); + }); + }); +} + +async function auditNavigatorPolicyState() { + if (!grpcEnabled || !grpcClient || grpcPermanentlyDisabled) { + console.log( + `[policy-proxy] startup navigator audit skipped: ` + + `grpcEnabled=${grpcEnabled} grpcClient=${!!grpcClient} disabled=${grpcPermanentlyDisabled}` + ); + return; + } + + try { + const listed = await listSandboxPolicies({ name: sandboxName, limit: 1, offset: 0 }); + const revision = listed && Array.isArray(listed.revisions) ? 
listed.revisions[0] : null; + if (!revision) { + console.log(`[policy-proxy] startup navigator audit: no policy revisions found for sandbox=${sandboxName}`); + return; + } + + const statusResp = await getSandboxPolicyStatus({ name: sandboxName, version: revision.version || 0 }); + console.log( + `[policy-proxy] startup navigator audit sandbox=${sandboxName} ` + + `latest_version=${revision.version || 0} latest_hash=${revision.policy_hash || ""} ` + + `latest_status=${policyStatusName(revision.status)} active_version=${statusResp.active_version || 0}` + ); + } catch (e) { + console.warn(`[policy-proxy] startup navigator audit failed: ${e.message}`); + } +} + +function scheduleStartupAudit(attempt = 1) { + const maxAttempts = 5; + const delayMs = 1500; + + setTimeout(async () => { + if (grpcEnabled && grpcClient && !grpcPermanentlyDisabled) { + await auditNavigatorPolicyState(); + return; + } + + if (attempt >= maxAttempts) { + console.log( + `[policy-proxy] startup navigator audit gave up after ${attempt} attempts ` + + `(grpcEnabled=${grpcEnabled} grpcClient=${!!grpcClient} disabled=${grpcPermanentlyDisabled})` + ); + return; + } + + console.log( + `[policy-proxy] startup navigator audit retry ${attempt}/${maxAttempts} ` + + `(grpcEnabled=${grpcEnabled} grpcClient=${!!grpcClient} disabled=${grpcPermanentlyDisabled})` + ); + scheduleStartupAudit(attempt + 1); + }, delayMs); +} + // --------------------------------------------------------------------------- // HTTP proxy helpers // --------------------------------------------------------------------------- @@ -484,7 +624,9 @@ server.on("upgrade", (req, socket, head) => { // Initialize gRPC client before starting the HTTP server. 
initGrpcClient(); +auditStartupPolicyFile(); server.listen(LISTEN_PORT, "127.0.0.1", () => { console.log(`[policy-proxy] Listening on 127.0.0.1:${LISTEN_PORT}, upstream 127.0.0.1:${UPSTREAM_PORT}`); + scheduleStartupAudit(); }); From 93436b09962b8148337756c3c1e26441aead1c38 Mon Sep 17 00:00:00 2001 From: JR Morgan Date: Fri, 13 Mar 2026 19:51:15 -0700 Subject: [PATCH 20/25] Add console logging for device pairing; extend NO_PROXY --- brev/.gitignore | 3 +- brev/reset.sh.log | 81 +++++++++++++++++++ brev/welcome-ui/server.js | 11 ++- .../nemoclaw-ui-extension/extension/index.ts | 16 ++-- 4 files changed, 101 insertions(+), 10 deletions(-) create mode 100644 brev/reset.sh.log diff --git a/brev/.gitignore b/brev/.gitignore index c26c3f6..54affb1 100644 --- a/brev/.gitignore +++ b/brev/.gitignore @@ -1 +1,2 @@ -brev-start-vm.sh \ No newline at end of file +brev-start-vm.sh +reset.sh \ No newline at end of file diff --git a/brev/reset.sh.log b/brev/reset.sh.log new file mode 100644 index 0000000..d2acd08 --- /dev/null +++ b/brev/reset.sh.log @@ -0,0 +1,81 @@ +#!/usr/bin/env bash + +set -euo pipefail + +SCRIPT_DIR="$(cd -- "$(dirname -- "${BASH_SOURCE[0]}")" && pwd)" +REPO_ROOT="$(cd -- "$SCRIPT_DIR/.." && pwd)" + +CLI_BIN="${CLI_BIN:-openshell}" +SANDBOX_NAME="${SANDBOX_NAME:-nemoclaw}" +WELCOME_UI_PATTERN="${WELCOME_UI_PATTERN:-node server.js}" +NEMOCLAW_IMAGE="${NEMOCLAW_IMAGE:-ghcr.io/nvidia/openshell-community/sandboxes/nemoclaw:latest}" +REMOVE_IMAGE="${REMOVE_IMAGE:-0}" + +log() { + printf '[reset] %s\n' "$*" +} + +try_run() { + if "$@"; then + return 0 + fi + return 1 +} + +stop_welcome_ui() { + if pgrep -f "$WELCOME_UI_PATTERN" >/dev/null 2>&1; then + log "Stopping Welcome UI processes matching: $WELCOME_UI_PATTERN" + pkill -f "$WELCOME_UI_PATTERN" || true + else + log "No Welcome UI process found" + fi +} + +delete_sandbox() { + log "Deleting sandbox: $SANDBOX_NAME" + if ! 
try_run "$CLI_BIN" sandbox delete "$SANDBOX_NAME"; then + log "Sandbox delete returned non-zero; continuing" + fi +} + +stop_forward() { + if "$CLI_BIN" forward --help >/dev/null 2>&1; then + log "Stopping forwarded port 18789 for $SANDBOX_NAME" + if ! try_run "$CLI_BIN" forward stop 18789 "$SANDBOX_NAME"; then + log "Forward stop returned non-zero; continuing" + fi + else + log "openshell forward subcommand unavailable; skipping forward stop" + fi +} + +cleanup_logs() { + log "Removing temporary logs and generated policy files" + rm -f \ + /tmp/welcome-ui.log \ + /tmp/nemoclaw-sandbox-create.log \ + /tmp/sandbox-policy-*.yaml +} + +remove_image() { + if [[ "$REMOVE_IMAGE" == "1" || "$REMOVE_IMAGE" == "true" || "$REMOVE_IMAGE" == "yes" ]]; then + log "Removing local image: $NEMOCLAW_IMAGE" + if ! try_run docker rmi "$NEMOCLAW_IMAGE"; then + log "Image removal returned non-zero; continuing" + fi + else + log "Leaving local image in place (set REMOVE_IMAGE=1 to remove it)" + fi +} + +main() { + log "Repo root: $REPO_ROOT" + stop_welcome_ui + delete_sandbox + stop_forward + cleanup_logs + remove_image + log "Reset complete" +} + +main "$@" diff --git a/brev/welcome-ui/server.js b/brev/welcome-ui/server.js index 4631874..a6f9036 100644 --- a/brev/welcome-ui/server.js +++ b/brev/welcome-ui/server.js @@ -639,7 +639,16 @@ function runSandboxCreate() { ]; if (policyPath) cmd.push("--policy", policyPath); const envArgs = [`CHAT_UI_URL=${chatUiUrl}`]; - const loopbackNoProxy = "127.0.0.1,localhost,::1"; + const loopbackNoProxy = [ + "127.0.0.1", + "localhost", + "::1", + "navigator.navigator.svc.cluster.local", + ".svc", + ".svc.cluster.local", + "10.42.0.0/16", + "10.43.0.0/16", + ].join(","); const mergedNoProxy = [ process.env.NO_PROXY || process.env.no_proxy || "", loopbackNoProxy, diff --git a/sandboxes/nemoclaw/nemoclaw-ui-extension/extension/index.ts b/sandboxes/nemoclaw/nemoclaw-ui-extension/extension/index.ts index 89b1d96..2127453 100644 --- 
a/sandboxes/nemoclaw/nemoclaw-ui-extension/extension/index.ts +++ b/sandboxes/nemoclaw/nemoclaw-ui-extension/extension/index.ts @@ -102,19 +102,14 @@ function clearPairingReloadFlag(): void { } function bootstrap() { + console.info("[NeMoClaw] pairing bootstrap: start"); showConnectOverlay(); const finalizeConnectedState = async () => { setConnectOverlayText("Device pairing approved. Finalizing dashboard..."); - try { - await waitForStableConnection( - STABLE_CONNECTION_WINDOW_MS, - STABLE_CONNECTION_TIMEOUT_MS, - ); - } catch { - await new Promise((resolve) => setTimeout(resolve, POST_PAIRING_SETTLE_DELAY_MS)); - } + console.info("[NeMoClaw] pairing bootstrap: reconnect detected"); if (shouldForcePairingReload()) { + console.info("[NeMoClaw] pairing bootstrap: forcing one-time reload"); markPairingReloadComplete(); setConnectOverlayText("Device pairing approved. Reloading dashboard..."); window.location.reload(); @@ -122,13 +117,16 @@ function bootstrap() { } setConnectOverlayText("Device pairing approved. 
Verifying dashboard health..."); try { + console.info("[NeMoClaw] pairing bootstrap: waiting for stable post-reload connection"); await waitForStableConnection( STABLE_CONNECTION_WINDOW_MS, STABLE_CONNECTION_TIMEOUT_MS, ); } catch { + console.warn("[NeMoClaw] pairing bootstrap: stable post-reload connection check timed out; delaying reveal"); await new Promise((resolve) => setTimeout(resolve, POST_PAIRING_SETTLE_DELAY_MS)); } + console.info("[NeMoClaw] pairing bootstrap: reveal app"); clearPairingReloadFlag(); revealApp(); }; @@ -136,11 +134,13 @@ function bootstrap() { waitForReconnect(INITIAL_CONNECT_TIMEOUT_MS) .then(finalizeConnectedState) .catch(async () => { + console.warn("[NeMoClaw] pairing bootstrap: initial reconnect timed out; extending wait"); setConnectOverlayText("Still waiting for device pairing approval..."); try { await waitForReconnect(EXTENDED_CONNECT_TIMEOUT_MS); await finalizeConnectedState(); } catch { + console.warn("[NeMoClaw] pairing bootstrap: extended reconnect timed out; revealing app anyway"); clearPairingReloadFlag(); revealApp(); } From 59b4389649bf7d37a3c7f6f09a72bccfdc892a4b Mon Sep 17 00:00:00 2001 From: JR Morgan Date: Fri, 13 Mar 2026 20:22:47 -0700 Subject: [PATCH 21/25] Handle context mod for inference.local --- .gitignore | 1 + sandboxes/nemoclaw/nemoclaw-start.sh | 2 +- 2 files changed, 2 insertions(+), 1 deletion(-) create mode 100644 .gitignore diff --git a/.gitignore b/.gitignore new file mode 100644 index 0000000..3412b31 --- /dev/null +++ b/.gitignore @@ -0,0 +1 @@ +/AGENTS.md diff --git a/sandboxes/nemoclaw/nemoclaw-start.sh b/sandboxes/nemoclaw/nemoclaw-start.sh index 6e65f66..5d70d53 100644 --- a/sandboxes/nemoclaw/nemoclaw-start.sh +++ b/sandboxes/nemoclaw/nemoclaw-start.sh @@ -114,7 +114,7 @@ for provider in cfg.get('models', {}).get('providers', {}).values(): if not isinstance(provider, dict): continue for model in provider.get('models', []): - if isinstance(model, dict) and model.get('id') == '${_DEFAULT_MODEL}': 
+ if isinstance(model, dict) and model.get('id') in ('${_DEFAULT_MODEL}', '-'): model['contextWindow'] = ${_DEFAULT_CONTEXT_WINDOW} model['maxTokens'] = ${_DEFAULT_MAX_TOKENS} json.dump(cfg, open(os.environ['HOME'] + '/.openclaw/openclaw.json', 'w'), indent=2) From c35e759dbce5a53b6c8431167fe17a3a49f35e20 Mon Sep 17 00:00:00 2001 From: JR Morgan Date: Fri, 13 Mar 2026 21:04:54 -0700 Subject: [PATCH 22/25] Fix k3s image import on build; force reload on first pass timeout --- brev/launch.sh | 94 ++++++++++++++++++- brev/reset.sh.log | 81 ---------------- .../nemoclaw-ui-extension/extension/index.ts | 17 +++- 3 files changed, 106 insertions(+), 86 deletions(-) delete mode 100644 brev/reset.sh.log diff --git a/brev/launch.sh b/brev/launch.sh index b429498..782be4e 100755 --- a/brev/launch.sh +++ b/brev/launch.sh @@ -32,8 +32,15 @@ CLI_RETRY_COUNT="${CLI_RETRY_COUNT:-5}" CLI_RETRY_DELAY_SECS="${CLI_RETRY_DELAY_SECS:-3}" GHCR_LOGIN="${GHCR_LOGIN:-auto}" GHCR_USER="${GHCR_USER:-}" -NEMOCLAW_IMAGE="${NEMOCLAW_IMAGE:-ghcr.io/nvidia/openshell-community/sandboxes/nemoclaw:latest}" +DEFAULT_NEMOCLAW_IMAGE="ghcr.io/nvidia/openshell-community/sandboxes/nemoclaw:latest" +if [[ -n "${NEMOCLAW_IMAGE+x}" ]]; then + NEMOCLAW_IMAGE_EXPLICIT=1 +else + NEMOCLAW_IMAGE_EXPLICIT=0 +fi +NEMOCLAW_IMAGE="${NEMOCLAW_IMAGE:-$DEFAULT_NEMOCLAW_IMAGE}" SKIP_NEMOCLAW_IMAGE_BUILD="${SKIP_NEMOCLAW_IMAGE_BUILD:-}" +CLUSTER_CONTAINER_NAME="${CLUSTER_CONTAINER_NAME:-openshell-cluster-openshell}" mkdir -p "$(dirname "$LAUNCH_LOG")" touch "$LAUNCH_LOG" @@ -261,6 +268,19 @@ should_build_nemoclaw_image() { [[ -n "$COMMUNITY_REF" && "$COMMUNITY_REF" != "main" ]] } +maybe_use_branch_local_nemoclaw_tag() { + if ! 
should_build_nemoclaw_image; then + return + fi + + if [[ "$NEMOCLAW_IMAGE_EXPLICIT" == "1" || "$NEMOCLAW_IMAGE" != "$DEFAULT_NEMOCLAW_IMAGE" ]]; then + return + fi + + NEMOCLAW_IMAGE="ghcr.io/nvidia/openshell-community/sandboxes/nemoclaw:local-dev" + log "Using non-main branch NeMoClaw image tag: $NEMOCLAW_IMAGE" +} + build_nemoclaw_image_if_needed() { local docker_cmd=() local image_context="$REPO_ROOT/sandboxes/nemoclaw" @@ -302,6 +322,75 @@ build_nemoclaw_image_if_needed() { log "Local NeMoClaw image ready: $NEMOCLAW_IMAGE" } +resolve_docker_cmd() { + if command -v docker >/dev/null 2>&1; then + printf 'docker' + return 0 + fi + if command -v sudo >/dev/null 2>&1; then + printf 'sudo docker' + return 0 + fi + return 1 +} + +resolve_cluster_container_name() { + local docker_bin + + if [[ -n "$CLUSTER_CONTAINER_NAME" ]]; then + printf '%s' "$CLUSTER_CONTAINER_NAME" + return 0 + fi + + docker_bin="$(resolve_docker_cmd)" || return 1 + + CLUSTER_CONTAINER_NAME="$($docker_bin ps --format '{{.Names}}\t{{.Image}}' | awk '$1 ~ /^openshell-cluster-/ { print $1; exit }')" + if [[ -z "$CLUSTER_CONTAINER_NAME" ]]; then + CLUSTER_CONTAINER_NAME="$($docker_bin ps --format '{{.Names}}\t{{.Image}}' | awk '$2 ~ /ghcr.io\\/nvidia\\/openshell\\/cluster/ { print $1; exit }')" + fi + + [[ -n "$CLUSTER_CONTAINER_NAME" ]] +} + +import_nemoclaw_image_into_cluster_if_needed() { + local docker_bin cluster_name + + if ! should_build_nemoclaw_image && [[ "$NEMOCLAW_IMAGE_EXPLICIT" != "1" ]]; then + log "Skipping cluster image import; using registry-backed image: $NEMOCLAW_IMAGE" + return + fi + + docker_bin="$(resolve_docker_cmd)" || { + log "Docker not available; skipping cluster image import." + return + } + + if ! $docker_bin image inspect "$NEMOCLAW_IMAGE" >/dev/null 2>&1; then + log "Local NeMoClaw image not present on host; skipping cluster image import: $NEMOCLAW_IMAGE" + return + fi + + if ! 
cluster_name="$(resolve_cluster_container_name)"; then + log "OpenShell cluster container not found; skipping cluster image import." + return + fi + + log "Importing NeMoClaw image into cluster containerd: $NEMOCLAW_IMAGE -> $cluster_name" + if ! $docker_bin save "$NEMOCLAW_IMAGE" | $docker_bin exec -i "$cluster_name" sh -lc 'ctr -n k8s.io images import -'; then + log "Failed to import NeMoClaw image into cluster containerd." + exit 1 + fi + + if ! $docker_bin exec -i "$cluster_name" sh -lc "ctr -n k8s.io images ls | awk '{print \$1}' | grep -Fx '$NEMOCLAW_IMAGE' >/dev/null"; then + log "Imported image tag not found in cluster containerd: $NEMOCLAW_IMAGE" + log "Cluster image list:" + $docker_bin exec -i "$cluster_name" sh -lc "ctr -n k8s.io images ls | grep 'sandboxes/nemoclaw' || true" + exit 1 + fi + + log "Cluster image import complete: $NEMOCLAW_IMAGE" +} + checkout_repo_ref() { if [[ -z "$COMMUNITY_REF" ]]; then return @@ -597,6 +686,7 @@ main() { step "Resolving CLI" resolve_cli ensure_cli_compat_aliases + maybe_use_branch_local_nemoclaw_tag step "Authenticating registries" docker_login_ghcr_if_needed step "Preparing NeMoClaw image" @@ -612,6 +702,8 @@ main() { step "Starting gateway" start_gateway + step "Importing NeMoClaw image into cluster" + import_nemoclaw_image_into_cluster_if_needed step "Configuring providers" run_provider_create_or_replace \ diff --git a/brev/reset.sh.log b/brev/reset.sh.log deleted file mode 100644 index d2acd08..0000000 --- a/brev/reset.sh.log +++ /dev/null @@ -1,81 +0,0 @@ -#!/usr/bin/env bash - -set -euo pipefail - -SCRIPT_DIR="$(cd -- "$(dirname -- "${BASH_SOURCE[0]}")" && pwd)" -REPO_ROOT="$(cd -- "$SCRIPT_DIR/.." 
&& pwd)" - -CLI_BIN="${CLI_BIN:-openshell}" -SANDBOX_NAME="${SANDBOX_NAME:-nemoclaw}" -WELCOME_UI_PATTERN="${WELCOME_UI_PATTERN:-node server.js}" -NEMOCLAW_IMAGE="${NEMOCLAW_IMAGE:-ghcr.io/nvidia/openshell-community/sandboxes/nemoclaw:latest}" -REMOVE_IMAGE="${REMOVE_IMAGE:-0}" - -log() { - printf '[reset] %s\n' "$*" -} - -try_run() { - if "$@"; then - return 0 - fi - return 1 -} - -stop_welcome_ui() { - if pgrep -f "$WELCOME_UI_PATTERN" >/dev/null 2>&1; then - log "Stopping Welcome UI processes matching: $WELCOME_UI_PATTERN" - pkill -f "$WELCOME_UI_PATTERN" || true - else - log "No Welcome UI process found" - fi -} - -delete_sandbox() { - log "Deleting sandbox: $SANDBOX_NAME" - if ! try_run "$CLI_BIN" sandbox delete "$SANDBOX_NAME"; then - log "Sandbox delete returned non-zero; continuing" - fi -} - -stop_forward() { - if "$CLI_BIN" forward --help >/dev/null 2>&1; then - log "Stopping forwarded port 18789 for $SANDBOX_NAME" - if ! try_run "$CLI_BIN" forward stop 18789 "$SANDBOX_NAME"; then - log "Forward stop returned non-zero; continuing" - fi - else - log "openshell forward subcommand unavailable; skipping forward stop" - fi -} - -cleanup_logs() { - log "Removing temporary logs and generated policy files" - rm -f \ - /tmp/welcome-ui.log \ - /tmp/nemoclaw-sandbox-create.log \ - /tmp/sandbox-policy-*.yaml -} - -remove_image() { - if [[ "$REMOVE_IMAGE" == "1" || "$REMOVE_IMAGE" == "true" || "$REMOVE_IMAGE" == "yes" ]]; then - log "Removing local image: $NEMOCLAW_IMAGE" - if ! 
try_run docker rmi "$NEMOCLAW_IMAGE"; then - log "Image removal returned non-zero; continuing" - fi - else - log "Leaving local image in place (set REMOVE_IMAGE=1 to remove it)" - fi -} - -main() { - log "Repo root: $REPO_ROOT" - stop_welcome_ui - delete_sandbox - stop_forward - cleanup_logs - remove_image - log "Reset complete" -} - -main "$@" diff --git a/sandboxes/nemoclaw/nemoclaw-ui-extension/extension/index.ts b/sandboxes/nemoclaw/nemoclaw-ui-extension/extension/index.ts index 2127453..b167a0a 100644 --- a/sandboxes/nemoclaw/nemoclaw-ui-extension/extension/index.ts +++ b/sandboxes/nemoclaw/nemoclaw-ui-extension/extension/index.ts @@ -24,6 +24,7 @@ const POST_PAIRING_SETTLE_DELAY_MS = 15_000; const STABLE_CONNECTION_WINDOW_MS = 10_000; const STABLE_CONNECTION_TIMEOUT_MS = 45_000; const PAIRING_RELOAD_FLAG = "nemoclaw:pairing-bootstrap-reloaded"; +const FORCED_RELOAD_DELAY_MS = 1_000; function inject(): boolean { const hasButton = injectButton(); @@ -101,6 +102,13 @@ function clearPairingReloadFlag(): void { } } +function forcePairingReload(reason: string, overlayText: string): void { + console.info(`[NeMoClaw] pairing bootstrap: forcing one-time reload (${reason})`); + markPairingReloadComplete(); + setConnectOverlayText(overlayText); + window.setTimeout(() => window.location.reload(), FORCED_RELOAD_DELAY_MS); +} + function bootstrap() { console.info("[NeMoClaw] pairing bootstrap: start"); showConnectOverlay(); @@ -109,10 +117,7 @@ function bootstrap() { setConnectOverlayText("Device pairing approved. Finalizing dashboard..."); console.info("[NeMoClaw] pairing bootstrap: reconnect detected"); if (shouldForcePairingReload()) { - console.info("[NeMoClaw] pairing bootstrap: forcing one-time reload"); - markPairingReloadComplete(); - setConnectOverlayText("Device pairing approved. Reloading dashboard..."); - window.location.reload(); + forcePairingReload("post-reconnect", "Device pairing approved. 
Reloading dashboard..."); return; } setConnectOverlayText("Device pairing approved. Verifying dashboard health..."); @@ -135,6 +140,10 @@ function bootstrap() { .then(finalizeConnectedState) .catch(async () => { console.warn("[NeMoClaw] pairing bootstrap: initial reconnect timed out; extending wait"); + if (shouldForcePairingReload()) { + forcePairingReload("initial-timeout", "Pairing is still settling. Reloading dashboard..."); + return; + } setConnectOverlayText("Still waiting for device pairing approval..."); try { await waitForReconnect(EXTENDED_CONNECT_TIMEOUT_MS); From 9ef9e78719f4b3bd23d4dcbb250f79b858951ddd Mon Sep 17 00:00:00 2001 From: JR Morgan Date: Fri, 13 Mar 2026 21:16:00 -0700 Subject: [PATCH 23/25] Revise Brev README --- README.md | 16 ++++------------ 1 file changed, 4 insertions(+), 12 deletions(-) diff --git a/README.md b/README.md index 489021e..a9e2a18 100644 --- a/README.md +++ b/README.md @@ -32,22 +32,14 @@ This repo is the community ecosystem around OpenShell -- a hub for contributed s #### Deploy Instantly with NVIDIA Brev -Skip the setup and launch OpenShell Community on a fully configured Brev instance. +Skip the setup and launch OpenShell Community on a fully configured Brev instance, whether you want to use Brev as a remote OpenShell gateway with or without GPU accelerators, or as an all-in-one playground for sandboxes, inference, and UI workflows. 
| Instance | Best For | Deploy |
| -------- | -------- | ------ |
-| CPU-only | External inference endpoints, remote APIs, lighter-weight sandbox workflows | Deploy on Brev |
-| NVIDIA H100 | Locally hosted LLM endpoints, GPU-heavy sandboxes, higher-throughput agent workloads | Deploy on Brev |
+| CPU-only | Remote OpenShell gateway deployments, external inference endpoints, remote APIs, and lighter-weight sandbox workflows | Deploy on Brev |
+| NVIDIA H100 | All-in-one OpenShell playgrounds, locally hosted LLM endpoints, GPU-heavy sandboxes, and higher-throughput agent workloads | Deploy on Brev |
 
-After the Brev instance is ready, bootstrap the Welcome UI:
-
-```bash
-git clone https://github.com/NVIDIA/OpenShell-Community.git
-cd OpenShell-Community
-bash brev/launch.sh
-```
-
-The launcher brings up the Welcome UI on `http://localhost:8081`, where you can inject provider keys and create the NeMoClaw sandbox flow.
+After the Brev instance is ready, open the Welcome UI to inject provider keys and access your OpenClaw sandbox.
 
 ### Using Sandboxes
 

From efeb9aa8c27a2ba325407a5b08748f2e9881b1a1 Mon Sep 17 00:00:00 2001
From: JR Morgan
Date: Fri, 13 Mar 2026 21:29:09 -0700
Subject: [PATCH 24/25] Cleanup Brev section

---
 README.md | 2 --
 1 file changed, 2 deletions(-)

diff --git a/README.md b/README.md
index a9e2a18..fa3557e 100644
--- a/README.md
+++ b/README.md
@@ -30,8 +30,6 @@ This repo is the community ecosystem around OpenShell -- a hub for contributed s
 
 ### Quick Start with Brev
 
-#### Deploy Instantly with NVIDIA Brev
-
 Skip the setup and launch OpenShell Community on a fully configured Brev instance, whether you want to use Brev as a remote OpenShell gateway with or without GPU accelerators, or as an all-in-one playground for sandboxes, inference, and UI workflows.
| Instance | Best For | Deploy | From 7aa8d1811595f22c1799da3e9879438d93bbb10c Mon Sep 17 00:00:00 2001 From: JR Morgan Date: Fri, 13 Mar 2026 22:08:06 -0700 Subject: [PATCH 25/25] Revert policy.yaml to orig --- sandboxes/openclaw/policy.yaml | 4 ---- 1 file changed, 4 deletions(-) diff --git a/sandboxes/openclaw/policy.yaml b/sandboxes/openclaw/policy.yaml index a12c46b..a91da84 100644 --- a/sandboxes/openclaw/policy.yaml +++ b/sandboxes/openclaw/policy.yaml @@ -125,7 +125,3 @@ network_policies: binaries: - { path: /usr/local/bin/claude } - { path: /usr/bin/gh } - -inference: - allowed_routes: - - local