- Added globalThis.__name polyfill in layout.tsx head using dangerouslySetInnerHTML - Fixed wrangler.jsonc to use inline DO (removed script_name reference) - Fixed patch-worker.js duplicate detection - Updated todos: WebSocket still needs debugging but core app is functional
483 lines
14 KiB
TypeScript
483 lines
14 KiB
TypeScript
/**
|
|
* LangGraph agent integrated with SSH proxy
|
|
* Runs in Node.js environment with full dependency support
|
|
* Based on context7 best practices for streaming and config passing
|
|
*/
|
|
|
|
import { StateGraph, END, START, Annotation } from "@langchain/langgraph"
|
|
import { HumanMessage, SystemMessage } from "@langchain/core/messages"
|
|
import { ChatOpenAI } from "@langchain/openai"
|
|
import type { RunnableConfig } from "@langchain/core/runnables"
|
|
import type { Client } from 'ssh2'
|
|
import type { Response } from 'express'
|
|
|
|
// Define state using Annotation for proper LangGraph typing
|
|
const BanditState = Annotation.Root({
|
|
runId: Annotation<string>,
|
|
currentLevel: Annotation<number>,
|
|
targetLevel: Annotation<number>,
|
|
currentPassword: Annotation<string>,
|
|
nextPassword: Annotation<string | null>,
|
|
levelGoal: Annotation<string>,
|
|
commandHistory: Annotation<Array<{
|
|
command: string
|
|
output: string
|
|
exitCode: number
|
|
timestamp: string
|
|
level: number
|
|
}>>({
|
|
reducer: (left, right) => left.concat(right),
|
|
default: () => [],
|
|
}),
|
|
thoughts: Annotation<Array<{
|
|
type: 'plan' | 'observation' | 'reasoning' | 'decision'
|
|
content: string
|
|
timestamp: string
|
|
level: number
|
|
}>>({
|
|
reducer: (left, right) => left.concat(right),
|
|
default: () => [],
|
|
}),
|
|
status: Annotation<'planning' | 'executing' | 'validating' | 'advancing' | 'paused' | 'complete' | 'failed'>,
|
|
retryCount: Annotation<number>,
|
|
maxRetries: Annotation<number>,
|
|
sshConnectionId: Annotation<string | null>,
|
|
error: Annotation<string | null>,
|
|
})
|
|
|
|
type BanditAgentState = typeof BanditState.State
|
|
|
|
const LEVEL_GOALS: Record<number, string> = {
|
|
0: "Read 'readme' file in home directory",
|
|
1: "Read '-' file (use 'cat ./-' or 'cat < -')",
|
|
2: "Find and read hidden file with spaces in name",
|
|
3: "Find file with specific permissions",
|
|
4: "Find file in inhere directory that is human-readable",
|
|
5: "Find file owned by bandit7, group bandit6, 33 bytes",
|
|
// Add more as needed
|
|
}
|
|
|
|
const SYSTEM_PROMPT = `You are BanditRunner, an autonomous operator solving the OverTheWire Bandit wargame.
|
|
|
|
RULES:
|
|
1. Only use safe commands: ls, cat, grep, find, base64, etc.
|
|
2. Think step-by-step
|
|
3. Extract passwords (32-char alphanumeric strings)
|
|
4. Validate before advancing
|
|
|
|
WORKFLOW:
|
|
1. Plan - analyze level goal
|
|
2. Execute - run command
|
|
3. Validate - check for password
|
|
4. Advance - move to next level`
|
|
|
|
/**
|
|
* Create planning node - LLM decides next command
|
|
* Following context7 pattern: pass RunnableConfig for proper streaming
|
|
*/
|
|
async function planLevel(
|
|
state: BanditAgentState,
|
|
config?: RunnableConfig
|
|
): Promise<Partial<BanditAgentState>> {
|
|
const { currentLevel, levelGoal, commandHistory, sshConnectionId, currentPassword } = state
|
|
|
|
// Establish SSH connection if needed
|
|
if (!sshConnectionId) {
|
|
const sshProxyUrl = process.env.SSH_PROXY_URL || 'http://localhost:3001'
|
|
const connectResponse = await fetch(`${sshProxyUrl}/ssh/connect`, {
|
|
method: 'POST',
|
|
headers: { 'Content-Type': 'application/json' },
|
|
body: JSON.stringify({
|
|
host: 'bandit.labs.overthewire.org',
|
|
port: 2220,
|
|
username: `bandit${currentLevel}`,
|
|
password: currentPassword,
|
|
testOnly: false,
|
|
}),
|
|
})
|
|
|
|
const connectData = await connectResponse.json() as { connectionId?: string; success?: boolean; message?: string }
|
|
|
|
if (!connectData.success || !connectData.connectionId) {
|
|
return {
|
|
status: 'failed',
|
|
error: `SSH connection failed: ${connectData.message || 'Unknown error'}`,
|
|
}
|
|
}
|
|
|
|
// Update state with connection ID
|
|
return {
|
|
sshConnectionId: connectData.connectionId,
|
|
status: 'planning',
|
|
}
|
|
}
|
|
|
|
// Get LLM from config (injected by agent)
|
|
const llm = (config?.configurable?.llm) as ChatOpenAI
|
|
|
|
// Build context from recent commands
|
|
const recentCommands = commandHistory.slice(-3).map(cmd =>
|
|
`Command: ${cmd.command}\nOutput: ${cmd.output.slice(0, 300)}\nExit: ${cmd.exitCode}`
|
|
).join('\n\n')
|
|
|
|
const messages = [
|
|
new SystemMessage(SYSTEM_PROMPT),
|
|
new HumanMessage(`Level ${currentLevel}: ${levelGoal}
|
|
|
|
Recent Commands:
|
|
${recentCommands || 'No commands yet'}
|
|
|
|
What command should I run next? Provide ONLY the exact command to execute.`),
|
|
]
|
|
|
|
const response = await llm.invoke(messages, config)
|
|
const thought = response.content as string
|
|
|
|
return {
|
|
thoughts: [{
|
|
type: 'plan',
|
|
content: thought,
|
|
timestamp: new Date().toISOString(),
|
|
level: currentLevel,
|
|
}],
|
|
status: 'executing',
|
|
}
|
|
}
|
|
|
|
/**
|
|
* Execute SSH command via proxy with PTY
|
|
*/
|
|
async function executeCommand(
|
|
state: BanditAgentState,
|
|
config?: RunnableConfig
|
|
): Promise<Partial<BanditAgentState>> {
|
|
const { thoughts, currentLevel, sshConnectionId } = state
|
|
|
|
// Extract command from latest thought
|
|
const latestThought = thoughts[thoughts.length - 1]
|
|
const commandMatch = latestThought.content.match(/```(?:bash|sh)?\s*\n?(.+?)\n?```/s) ||
|
|
latestThought.content.match(/^(.+)$/m)
|
|
|
|
if (!commandMatch) {
|
|
return {
|
|
status: 'failed',
|
|
error: 'Could not extract command from LLM response',
|
|
}
|
|
}
|
|
|
|
const command = commandMatch[1].trim()
|
|
|
|
// Execute via SSH with PTY enabled
|
|
try {
|
|
const sshProxyUrl = process.env.SSH_PROXY_URL || 'http://localhost:3001'
|
|
const response = await fetch(`${sshProxyUrl}/ssh/exec`, {
|
|
method: 'POST',
|
|
headers: { 'Content-Type': 'application/json' },
|
|
body: JSON.stringify({
|
|
connectionId: sshConnectionId,
|
|
command,
|
|
usePTY: true, // Enable PTY for full terminal capture
|
|
timeout: 30000,
|
|
}),
|
|
})
|
|
|
|
const data = await response.json() as { output?: string; exitCode?: number; success?: boolean }
|
|
|
|
const result = {
|
|
command,
|
|
output: data.output || '',
|
|
exitCode: data.exitCode || 1,
|
|
timestamp: new Date().toISOString(),
|
|
level: currentLevel,
|
|
}
|
|
|
|
return {
|
|
commandHistory: [result],
|
|
status: 'validating',
|
|
}
|
|
} catch (error) {
|
|
return {
|
|
status: 'failed',
|
|
error: `SSH execution failed: ${error instanceof Error ? error.message : String(error)}`,
|
|
}
|
|
}
|
|
}
|
|
|
|
/**
|
|
* Validate if password was found
|
|
*/
|
|
async function validateResult(
|
|
state: BanditAgentState,
|
|
config?: RunnableConfig
|
|
): Promise<Partial<BanditAgentState>> {
|
|
const { commandHistory } = state
|
|
const lastCommand = commandHistory[commandHistory.length - 1]
|
|
|
|
// Simple password extraction (32-char alphanumeric)
|
|
const passwordMatch = lastCommand.output.match(/([A-Za-z0-9]{32,})/)
|
|
|
|
if (passwordMatch) {
|
|
return {
|
|
nextPassword: passwordMatch[1],
|
|
status: 'advancing',
|
|
}
|
|
}
|
|
|
|
// Retry if under limit
|
|
if (state.retryCount < state.maxRetries) {
|
|
return {
|
|
retryCount: state.retryCount + 1,
|
|
status: 'planning',
|
|
}
|
|
}
|
|
|
|
return {
|
|
status: 'failed',
|
|
error: `Max retries reached for level ${state.currentLevel}`,
|
|
}
|
|
}
|
|
|
|
/**
|
|
* Advance to next level
|
|
*/
|
|
async function advanceLevel(
|
|
state: BanditAgentState,
|
|
config?: RunnableConfig
|
|
): Promise<Partial<BanditAgentState>> {
|
|
const nextLevel = state.currentLevel + 1
|
|
|
|
if (nextLevel > state.targetLevel) {
|
|
return {
|
|
status: 'complete',
|
|
currentLevel: nextLevel,
|
|
currentPassword: state.nextPassword || '',
|
|
}
|
|
}
|
|
|
|
return {
|
|
currentLevel: nextLevel,
|
|
currentPassword: state.nextPassword || '',
|
|
nextPassword: null,
|
|
levelGoal: LEVEL_GOALS[nextLevel] || 'Unknown',
|
|
retryCount: 0,
|
|
status: 'planning',
|
|
}
|
|
}
|
|
|
|
/**
|
|
* Conditional routing function
|
|
*/
|
|
function shouldContinue(state: BanditAgentState): string {
|
|
if (state.status === 'complete' || state.status === 'failed') return END
|
|
if (state.status === 'paused') return END
|
|
if (state.status === 'planning') return 'plan_level'
|
|
if (state.status === 'executing') return 'execute_command'
|
|
if (state.status === 'validating') return 'validate_result'
|
|
if (state.status === 'advancing') return 'advance_level'
|
|
return END
|
|
}
|
|
|
|
/**
|
|
* Agent executor that can run in SSH proxy
|
|
*/
|
|
export class BanditAgent {
|
|
private llm: ChatOpenAI
|
|
private graph: ReturnType<typeof StateGraph.prototype.compile>
|
|
private responseSender?: Response
|
|
|
|
constructor(config: {
|
|
runId: string
|
|
modelName: string
|
|
apiKey: string
|
|
startLevel: number
|
|
endLevel: number
|
|
responseSender?: Response
|
|
}) {
|
|
this.llm = new ChatOpenAI({
|
|
model: config.modelName,
|
|
apiKey: config.apiKey,
|
|
temperature: 0.7,
|
|
configuration: {
|
|
baseURL: 'https://openrouter.ai/api/v1',
|
|
},
|
|
})
|
|
|
|
this.responseSender = config.responseSender
|
|
this.graph = this.createGraph()
|
|
}
|
|
|
|
private createGraph() {
|
|
const workflow = new StateGraph(BanditState)
|
|
.addNode('plan_level', planLevel)
|
|
.addNode('execute_command', executeCommand)
|
|
.addNode('validate_result', validateResult)
|
|
.addNode('advance_level', advanceLevel)
|
|
.addEdge(START, 'plan_level')
|
|
.addConditionalEdges('plan_level', shouldContinue)
|
|
.addConditionalEdges('execute_command', shouldContinue)
|
|
.addConditionalEdges('validate_result', shouldContinue)
|
|
.addConditionalEdges('advance_level', shouldContinue)
|
|
|
|
return workflow.compile()
|
|
}
|
|
|
|
private emit(event: any) {
|
|
if (this.responseSender && !this.responseSender.writableEnded) {
|
|
// Send as JSONL (newline-delimited JSON)
|
|
this.responseSender.write(JSON.stringify(event) + '\n')
|
|
}
|
|
}
|
|
|
|
async run(initialState: Partial<BanditAgentState>): Promise<void> {
|
|
try {
|
|
// Stream updates using context7 recommended pattern
|
|
const stream = await this.graph.stream(
|
|
initialState,
|
|
{
|
|
streamMode: "updates", // Per context7: emit after each step
|
|
configurable: { llm: this.llm }, // Pass LLM through config
|
|
}
|
|
)
|
|
|
|
for await (const update of stream) {
|
|
// Emit each update as JSONL event
|
|
const [nodeName, nodeOutput] = Object.entries(update)[0]
|
|
|
|
this.emit({
|
|
type: 'node_update',
|
|
node: nodeName,
|
|
data: nodeOutput,
|
|
timestamp: new Date().toISOString(),
|
|
})
|
|
|
|
// Send specific event types based on node
|
|
if (nodeName === 'plan_level' && nodeOutput.thoughts) {
|
|
const thought = nodeOutput.thoughts[nodeOutput.thoughts.length - 1]
|
|
|
|
// Emit as 'thinking' event for UI
|
|
this.emit({
|
|
type: 'thinking',
|
|
data: {
|
|
content: thought.content,
|
|
level: thought.level,
|
|
},
|
|
timestamp: new Date().toISOString(),
|
|
})
|
|
|
|
// Also emit as 'agent_message' for chat panel
|
|
this.emit({
|
|
type: 'agent_message',
|
|
data: {
|
|
content: `Planning: ${thought.content}`,
|
|
level: thought.level,
|
|
metadata: {
|
|
thoughtType: thought.type,
|
|
},
|
|
},
|
|
timestamp: new Date().toISOString(),
|
|
})
|
|
}
|
|
|
|
if (nodeName === 'execute_command' && nodeOutput.commandHistory) {
|
|
const cmd = nodeOutput.commandHistory[nodeOutput.commandHistory.length - 1]
|
|
|
|
// Emit tool call event
|
|
this.emit({
|
|
type: 'tool_call',
|
|
data: {
|
|
content: `ssh_exec: ${cmd.command}`,
|
|
level: cmd.level,
|
|
metadata: {
|
|
tool: 'ssh_exec',
|
|
command: cmd.command,
|
|
},
|
|
},
|
|
timestamp: new Date().toISOString(),
|
|
})
|
|
|
|
// Emit terminal output with prompt
|
|
this.emit({
|
|
type: 'terminal_output',
|
|
data: {
|
|
content: `$ ${cmd.command}`,
|
|
command: cmd.command,
|
|
level: cmd.level,
|
|
},
|
|
timestamp: new Date().toISOString(),
|
|
})
|
|
|
|
// Emit command result (includes ANSI codes from PTY)
|
|
this.emit({
|
|
type: 'terminal_output',
|
|
data: {
|
|
content: cmd.output,
|
|
level: cmd.level,
|
|
},
|
|
timestamp: new Date().toISOString(),
|
|
})
|
|
}
|
|
|
|
if (nodeName === 'validate_result' && nodeOutput.nextPassword) {
|
|
this.emit({
|
|
type: 'agent_message',
|
|
data: {
|
|
content: `Password found: ${nodeOutput.nextPassword}`,
|
|
level: nodeOutput.currentLevel,
|
|
},
|
|
timestamp: new Date().toISOString(),
|
|
})
|
|
}
|
|
|
|
if (nodeName === 'advance_level' && nodeOutput.currentLevel !== undefined) {
|
|
this.emit({
|
|
type: 'level_complete',
|
|
data: {
|
|
content: `Level ${nodeOutput.currentLevel - 1} completed successfully`,
|
|
level: nodeOutput.currentLevel - 1,
|
|
},
|
|
timestamp: new Date().toISOString(),
|
|
})
|
|
|
|
this.emit({
|
|
type: 'agent_message',
|
|
data: {
|
|
content: `Advancing to Level ${nodeOutput.currentLevel}`,
|
|
level: nodeOutput.currentLevel,
|
|
},
|
|
timestamp: new Date().toISOString(),
|
|
})
|
|
}
|
|
|
|
if (nodeOutput.error) {
|
|
this.emit({
|
|
type: 'error',
|
|
data: {
|
|
content: nodeOutput.error,
|
|
level: nodeOutput.currentLevel,
|
|
},
|
|
timestamp: new Date().toISOString(),
|
|
})
|
|
}
|
|
}
|
|
|
|
// Final completion event
|
|
this.emit({
|
|
type: 'run_complete',
|
|
data: { content: 'Agent run completed successfully' },
|
|
timestamp: new Date().toISOString(),
|
|
})
|
|
} catch (error) {
|
|
this.emit({
|
|
type: 'error',
|
|
data: { content: error instanceof Error ? error.message : String(error) },
|
|
timestamp: new Date().toISOString(),
|
|
})
|
|
} finally {
|
|
if (this.responseSender && !this.responseSender.writableEnded) {
|
|
this.responseSender.end()
|
|
}
|
|
}
|
|
}
|
|
}
|
|
|