nicholai 4a517dfa97 Fix __name polyfill - app now loads without errors
- Added globalThis.__name polyfill in layout.tsx head using dangerouslySetInnerHTML
- Fixed wrangler.jsonc to use inline DO (removed script_name reference)
- Fixed patch-worker.js duplicate detection
- Updated todos: WebSocket still needs debugging but core app is functional
2025-10-09 14:27:03 -06:00

483 lines
14 KiB
TypeScript

/**
* LangGraph agent integrated with SSH proxy
* Runs in Node.js environment with full dependency support
* Based on context7 best practices for streaming and config passing
*/
import { StateGraph, END, START, Annotation } from "@langchain/langgraph"
import { HumanMessage, SystemMessage } from "@langchain/core/messages"
import { ChatOpenAI } from "@langchain/openai"
import type { RunnableConfig } from "@langchain/core/runnables"
import type { Client } from 'ssh2'
import type { Response } from 'express'
// Define state using Annotation for proper LangGraph typing
const BanditState = Annotation.Root({
runId: Annotation<string>,
currentLevel: Annotation<number>,
targetLevel: Annotation<number>,
currentPassword: Annotation<string>,
nextPassword: Annotation<string | null>,
levelGoal: Annotation<string>,
commandHistory: Annotation<Array<{
command: string
output: string
exitCode: number
timestamp: string
level: number
}>>({
reducer: (left, right) => left.concat(right),
default: () => [],
}),
thoughts: Annotation<Array<{
type: 'plan' | 'observation' | 'reasoning' | 'decision'
content: string
timestamp: string
level: number
}>>({
reducer: (left, right) => left.concat(right),
default: () => [],
}),
status: Annotation<'planning' | 'executing' | 'validating' | 'advancing' | 'paused' | 'complete' | 'failed'>,
retryCount: Annotation<number>,
maxRetries: Annotation<number>,
sshConnectionId: Annotation<string | null>,
error: Annotation<string | null>,
})
type BanditAgentState = typeof BanditState.State
const LEVEL_GOALS: Record<number, string> = {
0: "Read 'readme' file in home directory",
1: "Read '-' file (use 'cat ./-' or 'cat < -')",
2: "Find and read hidden file with spaces in name",
3: "Find file with specific permissions",
4: "Find file in inhere directory that is human-readable",
5: "Find file owned by bandit7, group bandit6, 33 bytes",
// Add more as needed
}
const SYSTEM_PROMPT = `You are BanditRunner, an autonomous operator solving the OverTheWire Bandit wargame.
RULES:
1. Only use safe commands: ls, cat, grep, find, base64, etc.
2. Think step-by-step
3. Extract passwords (32-char alphanumeric strings)
4. Validate before advancing
WORKFLOW:
1. Plan - analyze level goal
2. Execute - run command
3. Validate - check for password
4. Advance - move to next level`
/**
* Create planning node - LLM decides next command
* Following context7 pattern: pass RunnableConfig for proper streaming
*/
async function planLevel(
state: BanditAgentState,
config?: RunnableConfig
): Promise<Partial<BanditAgentState>> {
const { currentLevel, levelGoal, commandHistory, sshConnectionId, currentPassword } = state
// Establish SSH connection if needed
if (!sshConnectionId) {
const sshProxyUrl = process.env.SSH_PROXY_URL || 'http://localhost:3001'
const connectResponse = await fetch(`${sshProxyUrl}/ssh/connect`, {
method: 'POST',
headers: { 'Content-Type': 'application/json' },
body: JSON.stringify({
host: 'bandit.labs.overthewire.org',
port: 2220,
username: `bandit${currentLevel}`,
password: currentPassword,
testOnly: false,
}),
})
const connectData = await connectResponse.json() as { connectionId?: string; success?: boolean; message?: string }
if (!connectData.success || !connectData.connectionId) {
return {
status: 'failed',
error: `SSH connection failed: ${connectData.message || 'Unknown error'}`,
}
}
// Update state with connection ID
return {
sshConnectionId: connectData.connectionId,
status: 'planning',
}
}
// Get LLM from config (injected by agent)
const llm = (config?.configurable?.llm) as ChatOpenAI
// Build context from recent commands
const recentCommands = commandHistory.slice(-3).map(cmd =>
`Command: ${cmd.command}\nOutput: ${cmd.output.slice(0, 300)}\nExit: ${cmd.exitCode}`
).join('\n\n')
const messages = [
new SystemMessage(SYSTEM_PROMPT),
new HumanMessage(`Level ${currentLevel}: ${levelGoal}
Recent Commands:
${recentCommands || 'No commands yet'}
What command should I run next? Provide ONLY the exact command to execute.`),
]
const response = await llm.invoke(messages, config)
const thought = response.content as string
return {
thoughts: [{
type: 'plan',
content: thought,
timestamp: new Date().toISOString(),
level: currentLevel,
}],
status: 'executing',
}
}
/**
* Execute SSH command via proxy with PTY
*/
async function executeCommand(
state: BanditAgentState,
config?: RunnableConfig
): Promise<Partial<BanditAgentState>> {
const { thoughts, currentLevel, sshConnectionId } = state
// Extract command from latest thought
const latestThought = thoughts[thoughts.length - 1]
const commandMatch = latestThought.content.match(/```(?:bash|sh)?\s*\n?(.+?)\n?```/s) ||
latestThought.content.match(/^(.+)$/m)
if (!commandMatch) {
return {
status: 'failed',
error: 'Could not extract command from LLM response',
}
}
const command = commandMatch[1].trim()
// Execute via SSH with PTY enabled
try {
const sshProxyUrl = process.env.SSH_PROXY_URL || 'http://localhost:3001'
const response = await fetch(`${sshProxyUrl}/ssh/exec`, {
method: 'POST',
headers: { 'Content-Type': 'application/json' },
body: JSON.stringify({
connectionId: sshConnectionId,
command,
usePTY: true, // Enable PTY for full terminal capture
timeout: 30000,
}),
})
const data = await response.json() as { output?: string; exitCode?: number; success?: boolean }
const result = {
command,
output: data.output || '',
exitCode: data.exitCode || 1,
timestamp: new Date().toISOString(),
level: currentLevel,
}
return {
commandHistory: [result],
status: 'validating',
}
} catch (error) {
return {
status: 'failed',
error: `SSH execution failed: ${error instanceof Error ? error.message : String(error)}`,
}
}
}
/**
* Validate if password was found
*/
async function validateResult(
state: BanditAgentState,
config?: RunnableConfig
): Promise<Partial<BanditAgentState>> {
const { commandHistory } = state
const lastCommand = commandHistory[commandHistory.length - 1]
// Simple password extraction (32-char alphanumeric)
const passwordMatch = lastCommand.output.match(/([A-Za-z0-9]{32,})/)
if (passwordMatch) {
return {
nextPassword: passwordMatch[1],
status: 'advancing',
}
}
// Retry if under limit
if (state.retryCount < state.maxRetries) {
return {
retryCount: state.retryCount + 1,
status: 'planning',
}
}
return {
status: 'failed',
error: `Max retries reached for level ${state.currentLevel}`,
}
}
/**
* Advance to next level
*/
async function advanceLevel(
state: BanditAgentState,
config?: RunnableConfig
): Promise<Partial<BanditAgentState>> {
const nextLevel = state.currentLevel + 1
if (nextLevel > state.targetLevel) {
return {
status: 'complete',
currentLevel: nextLevel,
currentPassword: state.nextPassword || '',
}
}
return {
currentLevel: nextLevel,
currentPassword: state.nextPassword || '',
nextPassword: null,
levelGoal: LEVEL_GOALS[nextLevel] || 'Unknown',
retryCount: 0,
status: 'planning',
}
}
/**
* Conditional routing function
*/
function shouldContinue(state: BanditAgentState): string {
if (state.status === 'complete' || state.status === 'failed') return END
if (state.status === 'paused') return END
if (state.status === 'planning') return 'plan_level'
if (state.status === 'executing') return 'execute_command'
if (state.status === 'validating') return 'validate_result'
if (state.status === 'advancing') return 'advance_level'
return END
}
/**
* Agent executor that can run in SSH proxy
*/
export class BanditAgent {
private llm: ChatOpenAI
private graph: ReturnType<typeof StateGraph.prototype.compile>
private responseSender?: Response
constructor(config: {
runId: string
modelName: string
apiKey: string
startLevel: number
endLevel: number
responseSender?: Response
}) {
this.llm = new ChatOpenAI({
model: config.modelName,
apiKey: config.apiKey,
temperature: 0.7,
configuration: {
baseURL: 'https://openrouter.ai/api/v1',
},
})
this.responseSender = config.responseSender
this.graph = this.createGraph()
}
private createGraph() {
const workflow = new StateGraph(BanditState)
.addNode('plan_level', planLevel)
.addNode('execute_command', executeCommand)
.addNode('validate_result', validateResult)
.addNode('advance_level', advanceLevel)
.addEdge(START, 'plan_level')
.addConditionalEdges('plan_level', shouldContinue)
.addConditionalEdges('execute_command', shouldContinue)
.addConditionalEdges('validate_result', shouldContinue)
.addConditionalEdges('advance_level', shouldContinue)
return workflow.compile()
}
private emit(event: any) {
if (this.responseSender && !this.responseSender.writableEnded) {
// Send as JSONL (newline-delimited JSON)
this.responseSender.write(JSON.stringify(event) + '\n')
}
}
async run(initialState: Partial<BanditAgentState>): Promise<void> {
try {
// Stream updates using context7 recommended pattern
const stream = await this.graph.stream(
initialState,
{
streamMode: "updates", // Per context7: emit after each step
configurable: { llm: this.llm }, // Pass LLM through config
}
)
for await (const update of stream) {
// Emit each update as JSONL event
const [nodeName, nodeOutput] = Object.entries(update)[0]
this.emit({
type: 'node_update',
node: nodeName,
data: nodeOutput,
timestamp: new Date().toISOString(),
})
// Send specific event types based on node
if (nodeName === 'plan_level' && nodeOutput.thoughts) {
const thought = nodeOutput.thoughts[nodeOutput.thoughts.length - 1]
// Emit as 'thinking' event for UI
this.emit({
type: 'thinking',
data: {
content: thought.content,
level: thought.level,
},
timestamp: new Date().toISOString(),
})
// Also emit as 'agent_message' for chat panel
this.emit({
type: 'agent_message',
data: {
content: `Planning: ${thought.content}`,
level: thought.level,
metadata: {
thoughtType: thought.type,
},
},
timestamp: new Date().toISOString(),
})
}
if (nodeName === 'execute_command' && nodeOutput.commandHistory) {
const cmd = nodeOutput.commandHistory[nodeOutput.commandHistory.length - 1]
// Emit tool call event
this.emit({
type: 'tool_call',
data: {
content: `ssh_exec: ${cmd.command}`,
level: cmd.level,
metadata: {
tool: 'ssh_exec',
command: cmd.command,
},
},
timestamp: new Date().toISOString(),
})
// Emit terminal output with prompt
this.emit({
type: 'terminal_output',
data: {
content: `$ ${cmd.command}`,
command: cmd.command,
level: cmd.level,
},
timestamp: new Date().toISOString(),
})
// Emit command result (includes ANSI codes from PTY)
this.emit({
type: 'terminal_output',
data: {
content: cmd.output,
level: cmd.level,
},
timestamp: new Date().toISOString(),
})
}
if (nodeName === 'validate_result' && nodeOutput.nextPassword) {
this.emit({
type: 'agent_message',
data: {
content: `Password found: ${nodeOutput.nextPassword}`,
level: nodeOutput.currentLevel,
},
timestamp: new Date().toISOString(),
})
}
if (nodeName === 'advance_level' && nodeOutput.currentLevel !== undefined) {
this.emit({
type: 'level_complete',
data: {
content: `Level ${nodeOutput.currentLevel - 1} completed successfully`,
level: nodeOutput.currentLevel - 1,
},
timestamp: new Date().toISOString(),
})
this.emit({
type: 'agent_message',
data: {
content: `Advancing to Level ${nodeOutput.currentLevel}`,
level: nodeOutput.currentLevel,
},
timestamp: new Date().toISOString(),
})
}
if (nodeOutput.error) {
this.emit({
type: 'error',
data: {
content: nodeOutput.error,
level: nodeOutput.currentLevel,
},
timestamp: new Date().toISOString(),
})
}
}
// Final completion event
this.emit({
type: 'run_complete',
data: { content: 'Agent run completed successfully' },
timestamp: new Date().toISOString(),
})
} catch (error) {
this.emit({
type: 'error',
data: { content: error instanceof Error ? error.message : String(error) },
timestamp: new Date().toISOString(),
})
} finally {
if (this.responseSender && !this.responseSender.writableEnded) {
this.responseSender.end()
}
}
}
}