feat(setup): Claude-assisted error recovery with resume-at-step retry
When a setup step fails — whether hard via fail() or soft via the
"What's left" / "Skipping the first chat" notes — offer to ask Claude
to diagnose. On consent, spawn `claude -p --output-format stream-json`
with a scrolling 3-line action window ("Reading x", "Running y") so
the 1–4 minute investigations feel active rather than hung. No hard
timeout: debugging can take time, Ctrl-C is the escape hatch.
The prompt is minimal: one-paragraph framing, failed step name + msg +
hint, and a list of file references (not contents). Claude's Read/Grep
tools fetch what they need. A per-step map in claude-assist.ts gives
the most relevant files per step; the rest is README + auto.ts +
logs/setup.log + the per-step raw log.
Claude responds with REASON + COMMAND lines. We show the reason in a
clack note, prefill the command via setup/run-suggested.sh (bash 4+
readline, 3.x fallback to Enter-to-run), and eval on the user's
confirm.
When the user runs a fix, fail() now offers to retry the failing step
rather than aborting. setup/logs.ts tracks successfully-completed step
names in-memory; fail() threads those as NANOCLAW_SKIP on a spawnSync
retry, so the child picks up exactly where the parent left off — no
rebuilding containers or reinstalling OneCLI.
Other polish in this change:
- fitToWidth + dimWrap in lib/theme.ts to prevent long spinner labels
from soft-wrapping (each terminal row stacks a stale copy otherwise).
- Shorter container step label ("Preparing your assistant's sandbox…")
so it fits on narrow terminals.
- Wordmark anchored in the clack intro line on every run.
- All 25 existing fail() call sites updated to await fail(...) since
fail is now async.
Co-Authored-By: Claude Opus 4.7 (1M context) <noreply@anthropic.com>
This commit is contained in:
410
setup/lib/claude-assist.ts
Normal file
410
setup/lib/claude-assist.ts
Normal file
@@ -0,0 +1,410 @@
|
||||
/**
|
||||
* Offer Claude-assisted debugging when a setup step fails.
|
||||
*
|
||||
* Flow:
|
||||
* 1. Check `claude` is on PATH and has a working credential. If not,
|
||||
* silently skip — pre-auth failures can't use this path.
|
||||
* 2. Ask the user for consent ("Want me to ask Claude for a fix?").
|
||||
* 3. Build a minimal prompt: the one-paragraph situation, the failing
|
||||
* step's name/message/hint, and a short list of *file references*
|
||||
* (not contents) so Claude can Read what it needs on its own.
|
||||
* 4. Spawn `claude -p --output-format text` with a 2-minute timeout and
|
||||
* a spinner that shows elapsed time.
|
||||
* 5. Parse `REASON:` / `COMMAND:` out of the response. Show the reason
|
||||
* in a clack note, then hand off to `setup/run-suggested.sh` for
|
||||
* editable pre-fill + exec.
|
||||
*
|
||||
* Skippable with NANOCLAW_SKIP_CLAUDE_ASSIST=1 for CI/scripted runs.
|
||||
*/
|
||||
import { execSync, spawn } from 'child_process';
|
||||
import fs from 'fs';
|
||||
import path from 'path';
|
||||
|
||||
import * as p from '@clack/prompts';
|
||||
import k from 'kleur';
|
||||
|
||||
import { ensureAnswer } from './runner.js';
|
||||
import { fitToWidth } from './theme.js';
|
||||
|
||||
export interface AssistContext {
|
||||
stepName: string;
|
||||
msg: string;
|
||||
hint?: string;
|
||||
/** Absolute path to the per-step raw log, if the caller has one. */
|
||||
rawLogPath?: string;
|
||||
}
|
||||
|
||||
/**
|
||||
* File-path hints per step. Claude reads these on its own via its Read tool
|
||||
* rather than us stuffing contents into the prompt. Keys are step names as
|
||||
* they appear in fail() calls; values are repo-relative paths.
|
||||
*/
|
||||
const STEP_FILES: Record<string, string[]> = {
|
||||
bootstrap: ['setup.sh', 'setup/install-node.sh', 'nanoclaw.sh'],
|
||||
environment: ['setup/environment.ts'],
|
||||
container: [
|
||||
'setup/container.ts',
|
||||
'setup/install-docker.sh',
|
||||
'container/Dockerfile',
|
||||
],
|
||||
onecli: ['setup/onecli.ts'],
|
||||
auth: [
|
||||
'setup/auth.ts',
|
||||
'setup/register-claude-token.sh',
|
||||
'setup/install-claude.sh',
|
||||
],
|
||||
mounts: ['setup/mounts.ts'],
|
||||
service: ['setup/service.ts'],
|
||||
'cli-agent': ['setup/cli-agent.ts', 'scripts/init-cli-agent.ts'],
|
||||
channel: ['setup/auto.ts'],
|
||||
verify: ['setup/verify.ts'],
|
||||
// Channel-specific sub-steps:
|
||||
'telegram-install': ['setup/add-telegram.sh', 'setup/channels/telegram.ts'],
|
||||
'telegram-validate': ['setup/channels/telegram.ts'],
|
||||
'pair-telegram': ['setup/pair-telegram.ts', 'setup/channels/telegram.ts'],
|
||||
'discord-install': ['setup/add-discord.sh', 'setup/channels/discord.ts'],
|
||||
'init-first-agent': [
|
||||
'scripts/init-first-agent.ts',
|
||||
'setup/channels/telegram.ts',
|
||||
'setup/channels/discord.ts',
|
||||
],
|
||||
};
|
||||
|
||||
const BIG_PICTURE_FILES = ['README.md', 'setup/auto.ts'];
|
||||
|
||||
/**
|
||||
* Returns `true` if the user ran a Claude-suggested fix command; callers
|
||||
* can use that signal to offer a retry instead of aborting outright.
|
||||
* Returns `false` for every other outcome (skipped, declined, no command,
|
||||
* Claude unreachable, user chose not to run).
|
||||
*/
|
||||
export async function offerClaudeAssist(
|
||||
ctx: AssistContext,
|
||||
projectRoot: string = process.cwd(),
|
||||
): Promise<boolean> {
|
||||
if (process.env.NANOCLAW_SKIP_CLAUDE_ASSIST === '1') return false;
|
||||
if (!isClaudeUsable()) return false;
|
||||
|
||||
const want = ensureAnswer(
|
||||
await p.confirm({
|
||||
message: 'Want me to ask Claude to diagnose this?',
|
||||
initialValue: true,
|
||||
}),
|
||||
);
|
||||
if (!want) return false;
|
||||
|
||||
const prompt = buildPrompt(ctx, projectRoot);
|
||||
const response = await queryClaudeUnderSpinner(prompt, projectRoot);
|
||||
if (!response) return false;
|
||||
|
||||
const parsed = parseResponse(response);
|
||||
if (!parsed) {
|
||||
p.log.warn("Claude responded but I couldn't parse a command out of it.");
|
||||
p.log.message(k.dim(response.trim().slice(0, 500)));
|
||||
return false;
|
||||
}
|
||||
|
||||
p.note(
|
||||
`${parsed.reason}\n\n${k.cyan('$')} ${parsed.command}`,
|
||||
"Claude's suggestion",
|
||||
);
|
||||
|
||||
const run = ensureAnswer(
|
||||
await p.confirm({
|
||||
message: 'Run this command? (you can edit it before executing)',
|
||||
initialValue: false,
|
||||
}),
|
||||
);
|
||||
if (!run) return false;
|
||||
|
||||
await runSuggested(parsed.command, projectRoot);
|
||||
return true;
|
||||
}
|
||||
|
||||
function isClaudeUsable(): boolean {
|
||||
try {
|
||||
execSync('command -v claude', { stdio: 'ignore' });
|
||||
} catch {
|
||||
return false;
|
||||
}
|
||||
// Availability without auth is half the story; a real query will still
|
||||
// fail if the token isn't registered. We try first and surface the error
|
||||
// rather than pre-checking auth with a separate round trip.
|
||||
return true;
|
||||
}
|
||||
|
||||
function buildPrompt(ctx: AssistContext, projectRoot: string): string {
|
||||
const stepRefs = STEP_FILES[ctx.stepName] ?? [];
|
||||
const references = [
|
||||
...BIG_PICTURE_FILES,
|
||||
...stepRefs,
|
||||
'logs/setup.log',
|
||||
ctx.rawLogPath
|
||||
? path.relative(projectRoot, ctx.rawLogPath)
|
||||
: 'logs/setup-steps/',
|
||||
].filter((v, i, a) => a.indexOf(v) === i);
|
||||
|
||||
const hintLine = ctx.hint ? `Hint shown to the user: ${ctx.hint}\n` : '';
|
||||
|
||||
return [
|
||||
"I'm trying to set up NanoClaw on my machine and ran into an issue",
|
||||
'during the setup flow. Please read the referenced files to understand',
|
||||
'the flow and the step that failed, look at the logs to see what went',
|
||||
'wrong, then suggest a single bash command I can run to fix it.',
|
||||
'',
|
||||
`Failed step: ${ctx.stepName}`,
|
||||
`Error shown to the user: ${ctx.msg}`,
|
||||
hintLine,
|
||||
'References (read as needed with your Read tool):',
|
||||
...references.map((r) => ` - ${r}`),
|
||||
'',
|
||||
'Respond in EXACTLY this format, nothing before or after:',
|
||||
'',
|
||||
'REASON: <one short line describing the root cause>',
|
||||
'COMMAND: <single bash command, one line, no backticks>',
|
||||
'',
|
||||
'If no safe single command can fix it, respond with:',
|
||||
'REASON: <why>',
|
||||
'COMMAND: none',
|
||||
].join('\n');
|
||||
}
|
||||
|
||||
/**
|
||||
* Fixed-height scrolling window for Claude's progress.
|
||||
*
|
||||
* Clack's spinner only owns one line, so long tool-use breadcrumbs wrap
|
||||
* and blow out the gutter. Instead we manage a 4-line window ourselves:
|
||||
* a spinner header + 3 lines showing the most recent tool actions. On
|
||||
* each update we use raw ANSI (cursor up, clear line) to redraw in
|
||||
* place. When the query finishes we clear the whole block and emit a
|
||||
* single `p.log.success` / `p.log.error` so the flow continues in
|
||||
* standard clack style.
|
||||
*/
|
||||
const WINDOW_SIZE = 3;
|
||||
const SPINNER_FRAMES = ['◒', '◐', '◓', '◑'];
|
||||
const HIDE_CURSOR = '\x1b[?25l';
|
||||
const SHOW_CURSOR = '\x1b[?25h';
|
||||
|
||||
async function queryClaudeUnderSpinner(
|
||||
prompt: string,
|
||||
projectRoot: string,
|
||||
): Promise<string | null> {
|
||||
const out = process.stdout;
|
||||
const start = Date.now();
|
||||
const actions: string[] = [];
|
||||
let frameIdx = 0;
|
||||
|
||||
const redraw = (): void => {
|
||||
// Move cursor back to the start of the block (WINDOW_SIZE + 1 = header + window).
|
||||
out.write(`\x1b[${WINDOW_SIZE + 1}A`);
|
||||
|
||||
const elapsed = Math.round((Date.now() - start) / 1000);
|
||||
const icon = SPINNER_FRAMES[frameIdx % SPINNER_FRAMES.length];
|
||||
const suffix = ` (${elapsed}s)`;
|
||||
const header = fitToWidth('Asking Claude to diagnose…', suffix);
|
||||
out.write(`\x1b[2K${k.cyan(icon)} ${header}${k.dim(suffix)}\n`);
|
||||
|
||||
for (let i = 0; i < WINDOW_SIZE; i++) {
|
||||
const idx = actions.length - WINDOW_SIZE + i;
|
||||
const action = idx >= 0 ? actions[idx] : '';
|
||||
out.write('\x1b[2K');
|
||||
if (action) {
|
||||
out.write(`${k.gray('│')} ${k.dim(`▸ ${fitToWidth(action, '')}`)}`);
|
||||
} else {
|
||||
out.write(k.gray('│'));
|
||||
}
|
||||
out.write('\n');
|
||||
}
|
||||
};
|
||||
|
||||
const clearBlock = (): void => {
|
||||
out.write(`\x1b[${WINDOW_SIZE + 1}A`);
|
||||
for (let i = 0; i < WINDOW_SIZE + 1; i++) {
|
||||
out.write('\x1b[2K\n');
|
||||
}
|
||||
out.write(`\x1b[${WINDOW_SIZE + 1}A`);
|
||||
};
|
||||
|
||||
// Seed the block: move cursor to a fresh line, then write (header + window)
|
||||
// blank lines so `redraw()`'s cursor-up math lands correctly. Hide the
|
||||
// cursor for the duration so the redraw doesn't flicker.
|
||||
out.write(HIDE_CURSOR);
|
||||
for (let i = 0; i < WINDOW_SIZE + 1; i++) out.write('\n');
|
||||
redraw();
|
||||
|
||||
// If the user Ctrl-C's during the query, we never reach `finish()` —
|
||||
// add an exit hook so the cursor comes back regardless.
|
||||
const restoreCursorOnExit = (): void => {
|
||||
out.write(SHOW_CURSOR);
|
||||
};
|
||||
process.once('exit', restoreCursorOnExit);
|
||||
|
||||
const frameTick = setInterval(() => {
|
||||
frameIdx++;
|
||||
redraw();
|
||||
}, 250);
|
||||
|
||||
return new Promise((resolve) => {
|
||||
let lineBuf = '';
|
||||
let finalText = '';
|
||||
let stderr = '';
|
||||
let settled = false;
|
||||
|
||||
const finish = (
|
||||
kind: 'ok' | 'error',
|
||||
payload: string | null,
|
||||
): void => {
|
||||
clearInterval(frameTick);
|
||||
clearBlock();
|
||||
out.write(SHOW_CURSOR);
|
||||
process.off('exit', restoreCursorOnExit);
|
||||
const elapsed = Math.round((Date.now() - start) / 1000);
|
||||
const suffix = ` (${elapsed}s)`;
|
||||
if (kind === 'ok') {
|
||||
p.log.success(`${fitToWidth('Claude replied.', suffix)}${k.dim(suffix)}`);
|
||||
resolve(payload);
|
||||
} else {
|
||||
p.log.error(
|
||||
`${fitToWidth("Claude couldn't help here.", suffix)}${k.dim(suffix)}`,
|
||||
);
|
||||
const tail = stderr.trim().split('\n').slice(-3).join('\n');
|
||||
if (tail) p.log.message(k.dim(tail));
|
||||
resolve(null);
|
||||
}
|
||||
};
|
||||
|
||||
// No hard timeout — debugging can take a long time, and the cost of
|
||||
// cutting Claude off mid-investigation is worse than letting the
|
||||
// spinner run. The user can Ctrl-C if they want to abort.
|
||||
const child = spawn(
|
||||
'claude',
|
||||
[
|
||||
'-p',
|
||||
'--output-format',
|
||||
'stream-json',
|
||||
'--verbose',
|
||||
'--permission-mode',
|
||||
'bypassPermissions',
|
||||
],
|
||||
{ cwd: projectRoot, stdio: ['pipe', 'pipe', 'pipe'] },
|
||||
);
|
||||
|
||||
child.stdout.on('data', (c: Buffer) => {
|
||||
lineBuf += c.toString('utf-8');
|
||||
let idx: number;
|
||||
while ((idx = lineBuf.indexOf('\n')) !== -1) {
|
||||
const line = lineBuf.slice(0, idx);
|
||||
lineBuf = lineBuf.slice(idx + 1);
|
||||
if (!line.trim()) continue;
|
||||
try {
|
||||
const event = JSON.parse(line) as StreamEvent;
|
||||
handleStreamEvent(event, {
|
||||
setAction: (a) => {
|
||||
actions.push(a);
|
||||
redraw();
|
||||
},
|
||||
appendText: (t) => {
|
||||
finalText += t;
|
||||
},
|
||||
});
|
||||
} catch {
|
||||
// Malformed or non-JSON line — ignore.
|
||||
}
|
||||
}
|
||||
});
|
||||
child.stderr.on('data', (c: Buffer) => {
|
||||
stderr += c.toString('utf-8');
|
||||
});
|
||||
child.on('close', (code) => {
|
||||
if (settled) return;
|
||||
settled = true;
|
||||
if (code === 0 && finalText.trim()) finish('ok', finalText);
|
||||
else finish('error', null);
|
||||
});
|
||||
child.on('error', () => {
|
||||
if (settled) return;
|
||||
settled = true;
|
||||
finish('error', null);
|
||||
});
|
||||
|
||||
child.stdin.end(prompt);
|
||||
});
|
||||
}
|
||||
|
||||
// Minimal shape of the stream-json events we care about. Claude emits
|
||||
// many more, but we only read tool_use blocks (for breadcrumbs) and text
|
||||
// blocks (to reassemble the final REASON/COMMAND answer).
|
||||
interface StreamEvent {
|
||||
type: string;
|
||||
message?: {
|
||||
content?: Array<
|
||||
| { type: 'text'; text: string }
|
||||
| { type: 'tool_use'; name: string; input: Record<string, unknown> }
|
||||
>;
|
||||
};
|
||||
}
|
||||
|
||||
function handleStreamEvent(
|
||||
event: StreamEvent,
|
||||
cb: { setAction: (a: string) => void; appendText: (t: string) => void },
|
||||
): void {
|
||||
if (event.type !== 'assistant') return;
|
||||
const blocks = event.message?.content ?? [];
|
||||
for (const block of blocks) {
|
||||
if (block.type === 'text') {
|
||||
cb.appendText(block.text);
|
||||
} else if (block.type === 'tool_use') {
|
||||
cb.setAction(formatToolUse(block.name, block.input));
|
||||
}
|
||||
}
|
||||
}
|
||||
|
||||
function formatToolUse(name: string, input: Record<string, unknown>): string {
|
||||
const truncate = (v: string, n: number): string =>
|
||||
v.length > n ? v.slice(0, n) + '…' : v;
|
||||
if (name === 'Read') {
|
||||
const f = String(input.file_path ?? '');
|
||||
return `Reading ${shortenPath(f)}`;
|
||||
}
|
||||
if (name === 'Bash') {
|
||||
const cmd = String(input.command ?? '').replace(/\s+/g, ' ').trim();
|
||||
return `Running ${truncate(cmd, 60)}`;
|
||||
}
|
||||
if (name === 'Grep') return `Searching for "${truncate(String(input.pattern ?? ''), 40)}"`;
|
||||
if (name === 'Glob') return `Finding ${truncate(String(input.pattern ?? ''), 40)}`;
|
||||
return `Using ${name}`;
|
||||
}
|
||||
|
||||
function shortenPath(abs: string): string {
|
||||
const root = process.cwd();
|
||||
return abs.startsWith(`${root}/`) ? abs.slice(root.length + 1) : abs;
|
||||
}
|
||||
|
||||
function parseResponse(
|
||||
raw: string,
|
||||
): { reason: string; command: string } | null {
|
||||
// Accept the fields anywhere in the output — Claude sometimes wraps the
|
||||
// answer in a trailing explanation we can safely ignore.
|
||||
const reasonMatch = raw.match(/^\s*REASON:\s*(.+?)\s*$/m);
|
||||
const commandMatch = raw.match(/^\s*COMMAND:\s*(.+?)\s*$/m);
|
||||
if (!reasonMatch || !commandMatch) return null;
|
||||
const command = commandMatch[1].trim();
|
||||
if (!command || command.toLowerCase() === 'none') return null;
|
||||
return { reason: reasonMatch[1].trim(), command };
|
||||
}
|
||||
|
||||
function runSuggested(command: string, projectRoot: string): Promise<void> {
|
||||
const script = path.join(projectRoot, 'setup/run-suggested.sh');
|
||||
if (!fs.existsSync(script)) {
|
||||
p.log.error(`Missing helper: ${script}`);
|
||||
return Promise.resolve();
|
||||
}
|
||||
return new Promise((resolve) => {
|
||||
const child = spawn('bash', [script, command], {
|
||||
cwd: projectRoot,
|
||||
stdio: 'inherit',
|
||||
});
|
||||
child.on('close', () => resolve());
|
||||
child.on('error', () => resolve());
|
||||
});
|
||||
}
|
||||
Reference in New Issue
Block a user