Some checks are pending
CI / build-check-test (push) Waiting to run
- Merge 3 servers into single tool-server.mjs on port 7700 - HTTP API: POST /api/bash, /api/browser/* - WebSocket: /ws/terminal (xterm.js panel) - WebSocket: /ws/browser (live browser panel) - SHARED Playwright instance between LLM browser tool and user panel - When AI navigates a page, user sees it live in browser panel - When user clicks in panel, AI tools see the same page state - Remove standalone terminal-server.mjs (was :7701) - Remove standalone browser-server.mjs (was :7702) - Update browser-panel.ts: ws://localhost:7700/ws/browser - Update terminal-panel.ts: ws://localhost:7700/ws/terminal - Agent Zero-inspired system prompt with: - Structured problem-solving methodology (analyse/plan/execute/verify/report) - Clear tool usage rules (no tools for casual chat) - Detailed tool descriptions with usage guidance - Resourceful retry behaviour on failures - npm run dev starts both vite + unified server via concurrently
320 lines
11 KiB
JavaScript
320 lines
11 KiB
JavaScript
import http from 'http';
|
|
import { exec } from 'child_process';
|
|
import { chromium } from 'playwright';
|
|
import { WebSocketServer, WebSocket } from 'ws';
|
|
import { spawn } from 'child_process';
|
|
import url from 'url';
|
|
|
|
const PORT = parseInt(process.env.TOOL_SERVER_PORT || '7700');
|
|
|
|
// ── CORS ──────────────────────────────────────────────────────
|
|
const cors = {
|
|
'Access-Control-Allow-Origin': '*',
|
|
'Access-Control-Allow-Methods': 'POST, GET, OPTIONS',
|
|
'Access-Control-Allow-Headers': 'Content-Type',
|
|
'Content-Type': 'application/json',
|
|
};
|
|
|
|
function parseBody(req) {
|
|
return new Promise((resolve) => {
|
|
let body = '';
|
|
req.on('data', c => body += c);
|
|
req.on('end', () => {
|
|
try { resolve(JSON.parse(body || '{}')); } catch { resolve({}); }
|
|
});
|
|
});
|
|
}
|
|
|
|
// ── SHARED PLAYWRIGHT BROWSER ─────────────────────────────────
|
|
let browser = null;
|
|
let context = null;
|
|
let page = null;
|
|
const browserPanelClients = new Set(); // WS clients watching the browser
|
|
|
|
async function launchBrowser() {
|
|
if (!browser) {
|
|
browser = await chromium.launch({
|
|
headless: true,
|
|
args: ['--no-sandbox', '--disable-setuid-sandbox', '--disable-dev-shm-usage']
|
|
});
|
|
console.log('[tool-server] Playwright browser launched');
|
|
}
|
|
return browser;
|
|
}
|
|
|
|
async function getPage() {
|
|
if (!page || page.isClosed()) {
|
|
const b = await launchBrowser();
|
|
if (context) await context.close().catch(() => {});
|
|
context = await b.newContext({ viewport: { width: 1280, height: 800 } });
|
|
page = await context.newPage();
|
|
}
|
|
return page;
|
|
}
|
|
|
|
async function snap() {
|
|
const p = await getPage();
|
|
const buf = await p.screenshot({ type: 'jpeg', quality: 70, fullPage: false });
|
|
return { screenshot: buf.toString('base64'), url: p.url(), title: await p.title() };
|
|
}
|
|
|
|
// Broadcast screenshot to all connected browser panel WebSocket clients
|
|
async function broadcastScreenshot() {
|
|
if (browserPanelClients.size === 0) return;
|
|
try {
|
|
const s = await snap();
|
|
const msg = JSON.stringify({ type: 'screenshot', data: s.screenshot, url: s.url, title: s.title });
|
|
for (const ws of browserPanelClients) {
|
|
if (ws.readyState === WebSocket.OPEN) ws.send(msg);
|
|
}
|
|
} catch (e) {
|
|
const errMsg = JSON.stringify({ type: 'error', msg: String(e) });
|
|
for (const ws of browserPanelClients) {
|
|
if (ws.readyState === WebSocket.OPEN) ws.send(errMsg);
|
|
}
|
|
}
|
|
}
|
|
|
|
// ── BASH HANDLER ──────────────────────────────────────────────
|
|
async function handleBash(body) {
|
|
const { command, timeout = 30000 } = body;
|
|
if (!command) return { error: 'No command provided' };
|
|
return new Promise((resolve) => {
|
|
exec(command, {
|
|
timeout,
|
|
maxBuffer: 10 * 1024 * 1024,
|
|
cwd: process.env.WORKSPACE || process.env.HOME || '/root',
|
|
env: { ...process.env, TERM: 'dumb', COLUMNS: '200' },
|
|
}, (error, stdout, stderr) => {
|
|
resolve({
|
|
stdout: stdout || '',
|
|
stderr: stderr || '',
|
|
exitCode: error ? (error.code ?? 1) : 0,
|
|
output: (stdout || '') + (stderr ? '\nSTDERR: ' + stderr : ''),
|
|
});
|
|
});
|
|
});
|
|
}
|
|
|
|
// ── BROWSER HTTP HANDLERS (used by LLM tool) ─────────────────
|
|
async function handleNavigate(body) {
|
|
const { url: targetUrl } = body;
|
|
if (!targetUrl) return { error: 'No URL' };
|
|
const p = await getPage();
|
|
const target = targetUrl.startsWith('http') ? targetUrl : 'https://' + targetUrl;
|
|
await p.goto(target, { timeout: 30000, waitUntil: 'domcontentloaded' });
|
|
const result = await snap();
|
|
broadcastScreenshot(); // sync panel
|
|
return result;
|
|
}
|
|
|
|
async function handleClick(body) {
|
|
const p = await getPage();
|
|
await p.mouse.click(body.x || 0, body.y || 0);
|
|
await p.waitForTimeout(500);
|
|
const result = await snap();
|
|
broadcastScreenshot();
|
|
return result;
|
|
}
|
|
|
|
async function handleType(body) {
|
|
const p = await getPage();
|
|
if (body.selector) await p.fill(body.selector, body.text || '');
|
|
else await p.keyboard.type(body.text || '');
|
|
await p.waitForTimeout(300);
|
|
const result = await snap();
|
|
broadcastScreenshot();
|
|
return result;
|
|
}
|
|
|
|
async function handleScroll(body) {
|
|
const p = await getPage();
|
|
await p.mouse.wheel(0, body.dy || 300);
|
|
await p.waitForTimeout(300);
|
|
const result = await snap();
|
|
broadcastScreenshot();
|
|
return result;
|
|
}
|
|
|
|
async function handleBack() {
|
|
const p = await getPage();
|
|
await p.goBack({ timeout: 10000 }).catch(() => {});
|
|
const result = await snap();
|
|
broadcastScreenshot();
|
|
return result;
|
|
}
|
|
|
|
async function handleForward() {
|
|
const p = await getPage();
|
|
await p.goForward({ timeout: 10000 }).catch(() => {});
|
|
const result = await snap();
|
|
broadcastScreenshot();
|
|
return result;
|
|
}
|
|
|
|
async function handleReload() {
|
|
const p = await getPage();
|
|
await p.reload({ timeout: 15000 }).catch(() => {});
|
|
const result = await snap();
|
|
broadcastScreenshot();
|
|
return result;
|
|
}
|
|
|
|
async function handleText() {
|
|
const p = await getPage();
|
|
const text = await p.evaluate(() => document.body.innerText);
|
|
return { url: p.url(), title: await p.title(), text: text.slice(0, 8000) };
|
|
}
|
|
|
|
async function handleEval(body) {
|
|
const p = await getPage();
|
|
const result = await p.evaluate(body.script || 'null');
|
|
const ss = await snap();
|
|
broadcastScreenshot();
|
|
return { ...ss, evalResult: String(result) };
|
|
}
|
|
|
|
// ── HTTP ROUTES ───────────────────────────────────────────────
|
|
const routes = {
|
|
'/api/bash': handleBash,
|
|
'/api/browser/navigate': handleNavigate,
|
|
'/api/browser/click': handleClick,
|
|
'/api/browser/type': handleType,
|
|
'/api/browser/scroll': handleScroll,
|
|
'/api/browser/back': handleBack,
|
|
'/api/browser/forward': handleForward,
|
|
'/api/browser/reload': handleReload,
|
|
'/api/browser/screenshot': () => { const r = snap(); broadcastScreenshot(); return r; },
|
|
'/api/browser/text': handleText,
|
|
'/api/browser/eval': handleEval,
|
|
};
|
|
|
|
// ── HTTP SERVER ───────────────────────────────────────────────
|
|
const server = http.createServer(async (req, res) => {
|
|
if (req.method === 'OPTIONS') { res.writeHead(204, cors); res.end(); return; }
|
|
if (req.url === '/health') { res.writeHead(200, cors); res.end(JSON.stringify({ ok: true, browser: !!browser })); return; }
|
|
const handler = routes[req.url];
|
|
if (req.method === 'POST' && handler) {
|
|
try {
|
|
const body = await parseBody(req);
|
|
const result = await handler(body);
|
|
res.writeHead(200, cors);
|
|
res.end(JSON.stringify(result));
|
|
} catch (err) {
|
|
res.writeHead(500, cors);
|
|
res.end(JSON.stringify({ error: String(err) }));
|
|
}
|
|
return;
|
|
}
|
|
res.writeHead(404, cors);
|
|
res.end(JSON.stringify({ error: 'Not found' }));
|
|
});
|
|
|
|
// ── WEBSOCKET: TERMINAL (/ws/terminal) ────────────────────────
|
|
const terminalWss = new WebSocketServer({ noServer: true });
|
|
terminalWss.on('connection', (ws) => {
|
|
console.log('[tool-server] Terminal WS client connected');
|
|
const shell = spawn('/bin/bash', [], {
|
|
env: { ...process.env, TERM: 'xterm-256color', COLORTERM: 'truecolor' },
|
|
cwd: process.env.HOME || '/root',
|
|
});
|
|
shell.stdout.on('data', (d) => { try { ws.send(JSON.stringify({ type: 'data', data: d.toString('binary') })); } catch {} });
|
|
shell.stderr.on('data', (d) => { try { ws.send(JSON.stringify({ type: 'data', data: d.toString('binary') })); } catch {} });
|
|
shell.on('close', (code) => { try { ws.send(JSON.stringify({ type: 'exit', code })); ws.close(); } catch {} });
|
|
ws.on('message', (msg) => {
|
|
try {
|
|
const m = JSON.parse(msg.toString());
|
|
if (m.type === 'input') shell.stdin.write(m.data);
|
|
if (m.type === 'resize') { /* best effort without node-pty */ }
|
|
} catch {}
|
|
});
|
|
ws.on('close', () => { shell.kill(); });
|
|
});
|
|
|
|
// ── WEBSOCKET: BROWSER PANEL (/ws/browser) ────────────────────
|
|
const browserWss = new WebSocketServer({ noServer: true });
|
|
browserWss.on('connection', async (ws) => {
|
|
console.log('[tool-server] Browser panel WS client connected');
|
|
browserPanelClients.add(ws);
|
|
ws.on('close', () => browserPanelClients.delete(ws));
|
|
ws.on('error', () => browserPanelClients.delete(ws));
|
|
|
|
// Handle panel user interactions (navigate, click, scroll, etc.)
|
|
ws.on('message', async (msg) => {
|
|
try {
|
|
const m = JSON.parse(msg.toString());
|
|
if (m.type === 'navigate') {
|
|
const p = await getPage();
|
|
const target = m.url.startsWith('http') ? m.url : 'https://' + m.url;
|
|
ws.send(JSON.stringify({ type: 'loading' }));
|
|
await p.goto(target, { timeout: 30000, waitUntil: 'domcontentloaded' });
|
|
await broadcastScreenshot();
|
|
}
|
|
if (m.type === 'click') {
|
|
const p = await getPage();
|
|
await p.mouse.click(m.x || 0, m.y || 0);
|
|
await p.waitForTimeout(500);
|
|
await broadcastScreenshot();
|
|
}
|
|
if (m.type === 'scroll') {
|
|
const p = await getPage();
|
|
await p.mouse.wheel(0, m.dy || 300);
|
|
await p.waitForTimeout(300);
|
|
await broadcastScreenshot();
|
|
}
|
|
if (m.type === 'type') {
|
|
const p = await getPage();
|
|
await p.keyboard.type(m.text || '');
|
|
await p.waitForTimeout(300);
|
|
await broadcastScreenshot();
|
|
}
|
|
if (m.type === 'back') {
|
|
const p = await getPage();
|
|
await p.goBack({ timeout: 10000 }).catch(() => {});
|
|
await broadcastScreenshot();
|
|
}
|
|
if (m.type === 'fwd') {
|
|
const p = await getPage();
|
|
await p.goForward({ timeout: 10000 }).catch(() => {});
|
|
await broadcastScreenshot();
|
|
}
|
|
if (m.type === 'reload') {
|
|
const p = await getPage();
|
|
await p.reload({ timeout: 15000 }).catch(() => {});
|
|
await broadcastScreenshot();
|
|
}
|
|
if (m.type === 'screenshot') {
|
|
await broadcastScreenshot();
|
|
}
|
|
} catch (e) {
|
|
ws.send(JSON.stringify({ type: 'error', msg: String(e) }));
|
|
}
|
|
});
|
|
|
|
// Send initial ready + screenshot if browser exists
|
|
ws.send(JSON.stringify({ type: 'ready' }));
|
|
if (page && !page.isClosed()) {
|
|
try { await broadcastScreenshot(); } catch {}
|
|
}
|
|
});
|
|
|
|
// ── UPGRADE HANDLER (route WS by path) ────────────────────────
|
|
server.on('upgrade', (req, socket, head) => {
|
|
const pathname = url.parse(req.url).pathname;
|
|
if (pathname === '/ws/terminal') {
|
|
terminalWss.handleUpgrade(req, socket, head, (ws) => terminalWss.emit('connection', ws, req));
|
|
} else if (pathname === '/ws/browser') {
|
|
browserWss.handleUpgrade(req, socket, head, (ws) => browserWss.emit('connection', ws, req));
|
|
} else {
|
|
socket.destroy();
|
|
}
|
|
});
|
|
|
|
// ── START ─────────────────────────────────────────────────────
|
|
server.listen(PORT, () => {
|
|
console.log(`[tool-server] Unified server on http://localhost:${PORT}`);
|
|
console.log(`[tool-server] HTTP API: POST /api/bash, /api/browser/*`);
|
|
console.log(`[tool-server] Terminal WS: ws://localhost:${PORT}/ws/terminal`);
|
|
console.log(`[tool-server] Browser WS: ws://localhost:${PORT}/ws/browser`);
|
|
console.log(`[tool-server] Health: GET /health`);
|
|
});
|