Use custom tool calling prompts to get streaming working

2026-03-28 20:19:28 -04:00 · 2024-09-27 15:56:36 -04:00
parent 3b7af5749d
commit b1dcff8f64
4 changed files with 737 additions and 250 deletions
--- a/src/api/providers/anthropic.ts
+++ b/src/api/providers/anthropic.ts
@@ -43,7 +43,7 @@ export class AnthropicHandler implements ApiHandler {
 					{
 						model: modelId,
 						max_tokens: this.getModel().info.maxTokens,
-						temperature: 0.2,
+						temperature: 0,
 						system: [{ text: systemPrompt, type: "text", cache_control: { type: "ephemeral" } }], // setting cache breakpoint for system prompt so new tasks can reuse it
 						messages: messages.map((message, index) => {
 							if (index === lastUserMsgIndex || index === secondLastMsgUserIndex) {
@@ -67,8 +67,8 @@ export class AnthropicHandler implements ApiHandler {
 							}
 							return message
 						}),
-						tools, // cache breakpoints go from tools > system > messages, and since tools dont change, we can just set the breakpoint at the end of system (this avoids having to set a breakpoint at the end of tools which by itself does not meet min requirements for haiku caching)
+						// tools, // cache breakpoints go from tools > system > messages, and since tools dont change, we can just set the breakpoint at the end of system (this avoids having to set a breakpoint at the end of tools which by itself does not meet min requirements for haiku caching)
-						tool_choice: { type: "auto" },
+						// tool_choice: { type: "auto" },
 						stream: true,
 					},
 					(() => {
@@ -101,11 +101,11 @@ export class AnthropicHandler implements ApiHandler {
 				const stream = await this.client.messages.create({
 					model: modelId,
 					max_tokens: this.getModel().info.maxTokens,
-					temperature: 0.2,
+					temperature: 0,
 					system: [{ text: systemPrompt, type: "text" }],
 					messages,
-					tools,
+					// tools,
-					tool_choice: { type: "auto" },
+					// tool_choice: { type: "auto" },
 					stream: true,
 				})
 				return stream as AnthropicStream
--- a/src/core/AssistantMessage.ts
+++ b/src/core/AssistantMessage.ts
@@ -0,0 +1,95 @@
 // export interface AssistantMessage {
 // 	textContent: TextContent
 // 	toolCalls: ToolCall[]
 // }
 export type AssistantMessageContent = TextContent | ToolCall
 export interface TextContent {
 	type: "text"
 	content: string
 	partial: boolean
 }
 export const toolCallNames = [
 	"execute_command",
 	"read_file",
 	"write_to_file",
 	"search_files",
 	"list_files",
 	"list_code_definition_names",
 	"inspect_site",
 	"ask_followup_question",
 	"attempt_completion",
 ] as const
 // Converts array of tool call names into a union type ("execute_command" | "read_file" | ...)
 export type ToolCallName = (typeof toolCallNames)[number]
 export const toolParamNames = [
 	"command",
 	"path",
 	"content",
 	"regex",
 	"file_pattern",
 	"recursive",
 	"url",
 	"question",
 	"result",
 ] as const
 export type ToolParamName = (typeof toolParamNames)[number]
 export interface ToolCall {
 	type: "tool_call"
 	name: ToolCallName
 	// params is a partial record, allowing only some or none of the possible parameters to be used
 	params: Partial<Record<ToolParamName, string>>
 	partial: boolean
 }
 interface ExecuteCommandToolCall extends ToolCall {
 	name: "execute_command"
 	// Pick<Record<ToolParamName, string>, "command"> makes "command" required, but Partial<> makes it optional
 	params: Partial<Pick<Record<ToolParamName, string>, "command">>
 }
 interface ReadFileToolCall extends ToolCall {
 	name: "read_file"
 	params: Partial<Pick<Record<ToolParamName, string>, "path">>
 }
 interface WriteToFileToolCall extends ToolCall {
 	name: "write_to_file"
 	params: Partial<Pick<Record<ToolParamName, string>, "path" | "content">>
 }
 interface SearchFilesToolCall extends ToolCall {
 	name: "search_files"
 	params: Partial<Pick<Record<ToolParamName, string>, "path" | "regex" | "file_pattern">>
 }
 interface ListFilesToolCall extends ToolCall {
 	name: "list_files"
 	params: Partial<Pick<Record<ToolParamName, string>, "path" | "recursive">>
 }
 interface ListCodeDefinitionNamesToolCall extends ToolCall {
 	name: "list_code_definition_names"
 	params: Partial<Pick<Record<ToolParamName, string>, "path">>
 }
 interface InspectSiteToolCall extends ToolCall {
 	name: "inspect_site"
 	params: Partial<Pick<Record<ToolParamName, string>, "url">>
 }
 interface AskFollowupQuestionToolCall extends ToolCall {
 	name: "ask_followup_question"
 	params: Partial<Pick<Record<ToolParamName, string>, "question">>
 }
 interface AttemptCompletionToolCall extends ToolCall {
 	name: "attempt_completion"
 	params: Partial<Pick<Record<ToolParamName, string>, "result" | "command">>
 }
--- a/src/core/ClaudeDev.ts
+++ b/src/core/ClaudeDev.ts
@@ -34,6 +34,15 @@ import { TOOLS } from "./prompts/tools"
 import { truncateHalfConversation } from "./sliding-window"
 import { ClaudeDevProvider } from "./webview/ClaudeDevProvider"
 import cloneDeep from "clone-deep"
 import {
 	AssistantMessageContent,
 	TextContent,
 	ToolCall,
 	ToolCallName,
 	toolCallNames,
 	ToolParamName,
 	toolParamNames,
 } from "./AssistantMessage"
 const cwd =
 	vscode.workspace.workspaceFolders?.map((folder) => folder.uri.fsPath).at(0) ?? path.join(os.homedir(), "Desktop") // may or may not exist but fs checking existence would immediately ask for permission which would be bad UX, need to come up with a better solution
@@ -43,9 +52,9 @@ type UserContent = Array<
 	Anthropic.TextBlockParam | Anthropic.ImageBlockParam | Anthropic.ToolUseBlockParam | Anthropic.ToolResultBlockParam
 >
-type AnthropicPartialContentBlock = Anthropic.Messages.ContentBlock & {
+// type AnthropicPartialContentBlock = Anthropic.Messages.ContentBlock & {
-	partial?: boolean
+// 	partial?: boolean
-}
+// }
 export class ClaudeDev {
 	readonly taskId: string
@@ -65,29 +74,6 @@ export class ClaudeDev {
 	private providerRef: WeakRef<ClaudeDevProvider>
 	private abort: boolean = false
 	// streaming
 	private currentStreamingContentBlockIndex = 0
 	private didCompleteReadingStream = false
 	private assistantContentBlocks: AnthropicPartialContentBlock[] = []
 	private toolResults: Anthropic.ToolResultBlockParam[] = []
 	private toolResultsReady = false
 	private didRejectTool = false
 	private presentAssistantContentLocked = false
 	private partialJsonParser: JSONParser | undefined
 	private partialJsonParserState: {
 		partialObject: Record<string, string>
 		currentKey: string
 		currentValue: string
 		parsingKey: boolean
 		parsingValue: boolean
 	} = {
 		partialObject: {},
 		currentKey: "",
 		currentValue: "",
 		parsingKey: false,
 		parsingValue: false,
 	}
 	constructor(
 		provider: ClaudeDevProvider,
 		apiConfiguration: ApiConfiguration,
@@ -1725,63 +1711,105 @@ ${this.customInstructions.trim()}
 		}
 	}
-	private presentAssistantContentHasPendingUpdates = false
+	async presentAssistantMessage() {
-	async presentAssistantContent() {
+		if (this.presentAssistantMessageLocked) {
-		if (this.presentAssistantContentLocked) {
+			this.presentAssistantMessageHasPendingUpdates = true
 			this.presentAssistantContentHasPendingUpdates = true
 			return
 		}
-		this.presentAssistantContentLocked = true
+		this.presentAssistantMessageLocked = true
-		this.presentAssistantContentHasPendingUpdates = false
+		this.presentAssistantMessageHasPendingUpdates = false
-		if (this.currentStreamingContentBlockIndex >= this.assistantContentBlocks.length) {
+		if (this.currentStreamingContentIndex >= this.assistantMessageContent.length) {
 			throw new Error("No more content blocks to stream! This shouldn't happen...") // remove and just return after testing
 		}
-		const block = cloneDeep(this.assistantContentBlocks[this.currentStreamingContentBlockIndex]) // need to create copy bc while stream is updating the array, it could be updating the reference block properties too
+		const block = cloneDeep(this.assistantMessageContent[this.currentStreamingContentIndex]) // need to create copy bc while stream is updating the array, it could be updating the reference block properties too
 		switch (block.type) {
 			case "text":
-				await this.say("text", block.text, undefined, block.partial)
+				await this.say("text", block.content, undefined, block.partial)
 				break
-			case "tool_use":
+			case "tool_call":
-				const toolName = block.name as ToolName
+				const toolDescription = () => {
-				const toolInput = block.input as any
+					switch (block.name) {
-				const toolUseId = block.id
+						case "execute_command":
 							return `[${block.name} for '${block.params.command}']`
 						case "read_file":
 							return `[${block.name} for '${block.params.path}']`
 						case "write_to_file":
 							return `[${block.name} for '${block.params.path}']`
 						case "search_files":
 							return `[${block.name} for '${block.params.regex}'${
 								block.params.file_pattern ? ` in '${block.params.file_pattern}'` : ""
 							}]`
 						case "list_files":
 							return `[${block.name} for '${block.params.path}']`
 						case "list_code_definition_names":
 							return `[${block.name} for '${block.params.path}']`
 						case "inspect_site":
 							return `[${block.name} for '${block.params.url}']`
 						case "ask_followup_question":
 							return `[${block.name} for '${block.params.question}']`
 						case "attempt_completion":
 							return `[${block.name}]`
 					}
 				}
 				if (this.didRejectTool) {
 					// ignore any tool content after user has rejected tool once
 					// we'll fill it in with a rejection message when the message is complete
 					if (!block.partial) {
-						this.toolResults.push({
+						this.userMessageContent.push({
-							type: "tool_result",
+							type: "text",
-							tool_use_id: toolUseId,
+							text: `Skipping tool ${toolDescription()} due to user rejecting a previous tool.`,
 							content: "Skipping tool execution due to previous tool user rejection.",
 						})
 					}
 					break
 				}
 				const pushToolResult = (content: ToolResponse) => {
 					this.userMessageContent.push({
 						type: "text",
 						text: `${toolDescription()} Result:`,
 					})
 					if (typeof content === "string") {
 						this.userMessageContent.push({
 							type: "text",
 							text: content,
 						})
 					} else {
 						this.userMessageContent.push(...content)
 					}
 				}
 				const askApproval = async (type: ClaudeAsk, partialMessage?: string) => {
 					const { response, text, images } = await this.ask(type, partialMessage, false)
 					if (response !== "yesButtonTapped") {
 						if (response === "messageResponse") {
 							await this.say("user_feedback", text, images)
-							this.toolResults.push({
+							pushToolResult(
-								type: "tool_result",
+								this.formatToolResponseWithImages(await this.formatToolDeniedFeedback(text), images)
-								tool_use_id: toolUseId,
+							)
-								content: this.formatToolResponseWithImages(
+							// this.userMessageContent.push({
-									await this.formatToolDeniedFeedback(text),
+							// 	type: "text",
-									images
+							// 	text: `${toolDescription()}`,
-								),
+							// })
-							})
+							// this.toolResults.push({
 							// 	type: "tool_result",
 							// 	tool_use_id: toolUseId,
 							// 	content: this.formatToolResponseWithImages(
 							// 		await this.formatToolDeniedFeedback(text),
 							// 		images
 							// 	),
 							// })
 							this.didRejectTool = true
 							return false
 						}
-						this.toolResults.push({
+						pushToolResult(await this.formatToolDenied())
-							type: "tool_result",
+						// this.toolResults.push({
-							tool_use_id: toolUseId,
+						// 	type: "tool_result",
-							content: await this.formatToolDenied(),
+						// 	tool_use_id: toolUseId,
-						})
+						// 	content: await this.formatToolDenied(),
 						// })
 						this.didRejectTool = true
 						return false
 					}
@@ -1794,24 +1822,17 @@ ${this.customInstructions.trim()}
 						"error",
 						`Error ${action}:\n${error.message ?? JSON.stringify(serializeError(error), null, 2)}`
 					)
-					this.toolResults.push({
+					// this.toolResults.push({
-						type: "tool_result",
+					// 	type: "tool_result",
-						tool_use_id: toolUseId,
+					// 	tool_use_id: toolUseId,
-						content: await this.formatToolError(errorString),
+					// 	content: await this.formatToolError(errorString),
-					})
+					// })
 					pushToolResult(await this.formatToolError(errorString))
 				}
-				const pushToolResult = (content: ToolResponse) => {
+				switch (block.name) {
 					this.toolResults.push({
 						type: "tool_result",
 						tool_use_id: toolUseId,
 						content,
 					})
 				}
 				switch (toolName) {
 					case "read_file": {
-						const relPath: string | undefined = toolInput.path
+						const relPath: string | undefined = block.params.path
 						const sharedMessageProps: ClaudeSayTool = {
 							tool: "readFile",
 							path: relPath || "", //this.getReadablePath(relPath || ""),
@@ -1859,8 +1880,8 @@ ${this.customInstructions.trim()}
 						}
 					}
 					case "list_files": {
-						const relDirPath: string | undefined = toolInput.path
+						const relDirPath: string | undefined = block.params.path
-						const recursiveRaw: string | undefined = toolInput.path
+						const recursiveRaw: string | undefined = block.params.path
 						const recursive = recursiveRaw?.toLowerCase() === "true"
 						const sharedMessageProps: ClaudeSayTool = {
 							tool: !recursive ? "listFilesTopLevel" : "listFilesRecursive",
@@ -1909,7 +1930,7 @@ ${this.customInstructions.trim()}
 						}
 					}
 					case "list_code_definition_names": {
-						const relDirPath: string | undefined = toolInput.path
+						const relDirPath: string | undefined = block.params.path
 						const sharedMessageProps: ClaudeSayTool = {
 							tool: "listCodeDefinitionNames",
 							path: relDirPath || "",
@@ -1958,9 +1979,9 @@ ${this.customInstructions.trim()}
 						}
 					}
 					case "search_files": {
-						const relDirPath: string | undefined = toolInput.path
+						const relDirPath: string | undefined = block.params.path
-						const regex: string | undefined = toolInput.regex
+						const regex: string | undefined = block.params.regex
-						const filePattern: string | undefined = toolInput.filePattern
+						const filePattern: string | undefined = block.params.file_pattern
 						const sharedMessageProps: ClaudeSayTool = {
 							tool: "searchFiles",
 							path: relDirPath || "",
@@ -2014,7 +2035,7 @@ ${this.customInstructions.trim()}
 						}
 					}
 					case "inspect_site": {
-						const url: string | undefined = toolInput.url
+						const url: string | undefined = block.params.url
 						const sharedMessageProps: ClaudeSayTool = {
 							tool: "inspectSite",
 							path: url || "",
@@ -2076,7 +2097,7 @@ ${this.customInstructions.trim()}
 						}
 					}
 					case "execute_command": {
-						const command: string | undefined = toolInput.command
+						const command: string | undefined = block.params.command
 						try {
 							if (block.partial) {
 								await this.ask("command", command || "", block.partial).catch(() => {})
@@ -2108,7 +2129,7 @@ ${this.customInstructions.trim()}
 					}
 					case "ask_followup_question": {
-						const question: string | undefined = toolInput.question
+						const question: string | undefined = block.params.question
 						try {
 							if (block.partial) {
 								await this.ask("followup", question || "", block.partial).catch(() => {})
@@ -2135,8 +2156,8 @@ ${this.customInstructions.trim()}
 						}
 					}
 					case "attempt_completion": {
-						const result: string | undefined = toolInput.result
+						const result: string | undefined = block.params.result
-						const command: string | undefined = toolInput.command
+						const command: string | undefined = block.params.command
 						try {
 							const lastMessage = this.claudeMessages.at(-1)
 							if (block.partial) {
@@ -2214,135 +2235,268 @@ ${this.customInstructions.trim()}
 				break
 		}
-		this.presentAssistantContentLocked = false
+		this.presentAssistantMessageLocked = false
 		if (!block.partial) {
 			// block is finished streaming and executing
 			if (
-				this.currentStreamingContentBlockIndex === this.assistantContentBlocks.length - 1 &&
+				this.currentStreamingContentIndex === this.assistantMessageContent.length - 1 &&
 				this.didCompleteReadingStream
 			) {
 				// last block is complete and it is finished executing
-				this.toolResultsReady = true // will allow pwaitfor to continue
+				this.userMessageContentReady = true // will allow pwaitfor to continue
 			} else {
 				// call next block if it exists (if not then read stream will call it when its ready)
-				this.currentStreamingContentBlockIndex++ // need to increment regardless, so when read stream calls this function again it will be streaming the next block
+				this.currentStreamingContentIndex++ // need to increment regardless, so when read stream calls this function again it will be streaming the next block
-				if (this.currentStreamingContentBlockIndex < this.assistantContentBlocks.length) {
+				if (this.currentStreamingContentIndex < this.assistantMessageContent.length) {
 					// there are already more content blocks to stream, so we'll call this function ourselves
 					// await this.presentAssistantContent()
-					this.presentAssistantContent()
+					this.presentAssistantMessage()
 					return
 				}
 			}
 		}
 		// block is partial, but the read stream may have finished
-		if (this.presentAssistantContentHasPendingUpdates) {
+		if (this.presentAssistantMessageHasPendingUpdates) {
-			this.presentAssistantContent()
+			this.presentAssistantMessage()
 		}
 	}
-	//
+	// //
 	// private partialJsonParser: JSONParser | undefined
 	// private partialJsonParserState: {
 	// 	partialObject: Record<string, string>
 	// 	currentKey: string
 	// 	currentValue: string
 	// 	parsingKey: boolean
 	// 	parsingValue: boolean
 	// } = {
 	// 	partialObject: {},
 	// 	currentKey: "",
 	// 	currentValue: "",
 	// 	parsingKey: false,
 	// 	parsingValue: false,
 	// }
 	// private chunkIndexToJsonParser = new Map<number, JSONParser>()
 	// getJsonParserForChunk(chunkIndex: number): JSONParser {
 	// 	if (!this.chunkIndexToJsonParser.has(chunkIndex)) {
 	// 		const parser = new JSONParser({ emitPartialTokens: true, emitPartialValues: true })
 	// 		// this package enforces setting up an onValue listener ("Can't emit data before the "onValue" callback has been set up."), even though we don't need it.
 	// 		parser.onValue = () => console.log(`onValue for chunk ${chunkIndex}`)
 	// 		// parser.onError = (error) => console.error(`Error parsing JSON for chunk ${chunkIndex}:`, error);
 	// 		// parser.onEnd = () => console.log(`JSON parsing ended for chunk ${chunkIndex}`);
-	private chunkIndexToJsonParser = new Map<number, JSONParser>()
+	// 		let partialObject: Record<string, string> = {}
-	getJsonParserForChunk(chunkIndex: number): JSONParser {
+	// 		let currentKey: string = ""
-		if (!this.chunkIndexToJsonParser.has(chunkIndex)) {
+	// 		let currentValue: string = ""
-			const parser = new JSONParser({ emitPartialTokens: true, emitPartialValues: true })
+	// 		let parsingKey: boolean = false
-			// this package enforces setting up an onValue listener ("Can't emit data before the "onValue" callback has been set up."), even though we don't need it.
+	// 		let parsingValue: boolean = false
 			parser.onValue = () => console.log(`onValue for chunk ${chunkIndex}`)
 			// parser.onError = (error) => console.error(`Error parsing JSON for chunk ${chunkIndex}:`, error);
 			// parser.onEnd = () => console.log(`JSON parsing ended for chunk ${chunkIndex}`);
-			let partialObject: Record<string, string> = {}
+	// 		// our json will only ever be string to string maps
-			let currentKey: string = ""
+	// 		// { "key": "value", "key2": "value2" }
-			let currentValue: string = ""
+	// 		// so left brace, string, colon, comma, right brace
-			let parsingKey: boolean = false
+	// 		// (need to recreate this listener each time to update the resolve ref)
-			let parsingValue: boolean = false
+	// 		parser.onToken = ({ token, value, offset, partial }) => {
 	// 			console.log("onToken")
-			// our json will only ever be string to string maps
+	// 			try {
-			// { "key": "value", "key2": "value2" }
+	// 				switch (token) {
-			// so left brace, string, colon, comma, right brace
+	// 					case TokenType.LEFT_BRACE:
-			// (need to recreate this listener each time to update the resolve ref)
+	// 						// Start of a new JSON object
-			parser.onToken = ({ token, value, offset, partial }) => {
+	// 						partialObject = {}
-				console.log("onToken")
+	// 						currentKey = ""
 	// 						parsingKey = false
 	// 						parsingValue = false
 	// 						break
 	// 					case TokenType.RIGHT_BRACE:
 	// 						// End of the current JSON object
 	// 						currentKey = ""
 	// 						currentValue = ""
 	// 						parsingKey = false
 	// 						parsingValue = false
-				try {
+	// 						// Finalize the object once parsing is complete
-					switch (token) {
+	// 						// ;(this.assistantContentBlocks[chunkIndex] as Anthropic.ToolUseBlock).input = this.partialObject
-						case TokenType.LEFT_BRACE:
+	// 						// this.assistantContentBlocks[chunkIndex]!.partial = false
-							// Start of a new JSON object
+	// 						// await this.presentAssistantContent() // NOTE: only set partial = false and call this once, since doing it several times will create duplicate messages.
-							partialObject = {}
+	// 						console.log("Final parsed object:", partialObject)
-							currentKey = ""
+	// 						break
-							parsingKey = false
+	// 					case TokenType.STRING:
-							parsingValue = false
+	// 						if (!parsingValue && !parsingKey) {
-							break
+	// 							// Starting to parse a key
-						case TokenType.RIGHT_BRACE:
+	// 							currentKey = value as string
-							// End of the current JSON object
+	// 							parsingKey = !!partial // if not partial, we are done parsing key
-							currentKey = ""
+	// 						} else if (parsingKey) {
-							currentValue = ""
+	// 							// Continuing to parse a key
-							parsingKey = false
+	// 							currentKey = value as string
-							parsingValue = false
+	// 							parsingKey = !!partial
 	// 						} else if (parsingValue) {
 	// 							// Parsing a value
 	// 							// Accumulate partial value and update the object
 	// 							currentValue = value as string
 	// 							if (currentKey) {
 	// 								partialObject[currentKey] = currentValue
 	// 							}
 	// 							parsingValue = !!partial // if not partial, complete value
 	// 						}
 	// 						break
 	// 					case TokenType.COLON:
 	// 						// After a key and colon, expect a value
 	// 						if (currentKey !== null) {
 	// 							parsingValue = true
 	// 						}
 	// 						break
 	// 					case TokenType.COMMA:
 	// 						// Reset for the next key-value pair
 	// 						currentKey = ""
 	// 						currentValue = ""
 	// 						parsingKey = false
 	// 						parsingValue = false
 	// 						break
 	// 					default:
 	// 						console.error("Unexpected token:", token)
 	// 				}
-							// Finalize the object once parsing is complete
+	// 				// Debugging logs to trace the parsing process
-							// ;(this.assistantContentBlocks[chunkIndex] as Anthropic.ToolUseBlock).input = this.partialObject
+	// 				console.log("Partial object:", partialObject)
-							// this.assistantContentBlocks[chunkIndex]!.partial = false
+	// 				console.log("Offset:", offset, "isPartialToken:", partial)
-							// await this.presentAssistantContent() // NOTE: only set partial = false and call this once, since doing it several times will create duplicate messages.
+
-							console.log("Final parsed object:", partialObject)
+	// 				// Update the contentBlock with the current state of the partial object
-							break
+	// 				// Use spread operator to ensure a new object reference
-						case TokenType.STRING:
+	// 				;(this.assistantContentBlocks[chunkIndex] as Anthropic.ToolUseBlock).input = {
-							if (!parsingValue && !parsingKey) {
+	// 					...partialObject,
-								// Starting to parse a key
+	// 				}
-								currentKey = value as string
+	// 				// right brace indicates the end of the json object
-								parsingKey = !!partial // if not partial, we are done parsing key
+	// 				this.assistantContentBlocks[chunkIndex]!.partial = token !== TokenType.RIGHT_BRACE
-							} else if (parsingKey) {
+
-								// Continuing to parse a key
+	// 				this.presentAssistantContent()
-								currentKey = value as string
+	// 			} catch (error) {
-								parsingKey = !!partial
+	// 				console.error("Error parsing input_json_delta", error)
-							} else if (parsingValue) {
+	// 			}
-								// Parsing a value
+	// 		}
-								// Accumulate partial value and update the object
+
-								currentValue = value as string
+	// 		this.chunkIndexToJsonParser.set(chunkIndex, parser)
-								if (currentKey) {
+	// 	}
-									partialObject[currentKey] = currentValue
+	// 	return this.chunkIndexToJsonParser.get(chunkIndex)!
-								}
+	// }
-								parsingValue = !!partial // if not partial, complete value
+
-							}
+	// streaming
-							break
+	private currentStreamingContentIndex = 0
-						case TokenType.COLON:
+	private assistantMessageContent: AssistantMessageContent[] = []
-							// After a key and colon, expect a value
+	private didCompleteReadingStream = false
-							if (currentKey !== null) {
+	// private assistantMessage?: AssistantMessage
-								parsingValue = true
+	private userMessageContent: (Anthropic.TextBlockParam | Anthropic.ImageBlockParam)[] = []
-							}
+	private userMessageContentReady = false
-							break
+	private didRejectTool = false
-						case TokenType.COMMA:
+	private presentAssistantMessageLocked = false
-							// Reset for the next key-value pair
+	private presentAssistantMessageHasPendingUpdates = false
-							currentKey = ""
+
-							currentValue = ""
+	private parseTextStreamAccumulator = ""
-							parsingKey = false
+
-							parsingValue = false
+	parseTextStream(chunk: string) {
-							break
+		this.parseTextStreamAccumulator += chunk
-						default:
+
-							console.error("Unexpected token:", token)
+		// let text = ""
 		let textContent: TextContent = {
 			type: "text",
 			content: "",
 			partial: true,
 		}
 		let toolCalls: ToolCall[] = []
-					// Debugging logs to trace the parsing process
+		let currentToolCall: ToolCall | undefined = undefined
-					console.log("Partial object:", partialObject)
+		let currentParamName: ToolParamName | undefined = undefined
-					console.log("Offset:", offset, "isPartialToken:", partial)
+		let currentParamValueLines: string[] = []
 		let textContentLines: string[] = []
-					// Update the contentBlock with the current state of the partial object
+		const rawLines = this.parseTextStreamAccumulator.split("\n")
 					// Use spread operator to ensure a new object reference
 					;(this.assistantContentBlocks[chunkIndex] as Anthropic.ToolUseBlock).input = {
 						...partialObject,
 					}
 					// right brace indicates the end of the json object
 					this.assistantContentBlocks[chunkIndex]!.partial = token !== TokenType.RIGHT_BRACE
-					this.presentAssistantContent()
+		if (rawLines.length === 1) {
-				} catch (error) {
+			const firstLine = rawLines[0].trim()
-					console.error("Error parsing input_json_delta", error)
+			if (!firstLine.startsWith("<t") && firstLine.startsWith("<")) {
 				// (we ignore tags that start with <t since it's most like a <thinking> tag (and none of our tags start with t)
 				// content is just starting, if it starts with < we can assume it's a tool call, so we'll wait for the next line
 				console.log("skipping reason 1")
 				return
 			}
 		}
-			this.chunkIndexToJsonParser.set(chunkIndex, parser)
+		if (
 			this.assistantMessageContent.length === 1 &&
 			this.assistantMessageContent[0].partial // first element is always TextContent
 		) {
 			// we're updating text content, so if we have a partial xml tag on the last line we can ignore it until we get the full line.
 			const lastLine = rawLines.at(-1)?.trim()
 			if (lastLine && !lastLine.startsWith("<t") && lastLine.startsWith("<") && !lastLine.endsWith(">")) {
 				console.log("skipping reason 2")
 				return
 			}
-		return this.chunkIndexToJsonParser.get(chunkIndex)!
+		}
 		for (const line of rawLines) {
 			const trimmed = line.trim()
 			// if currenttoolcall or currentparamname look for closing tag, more efficient and safe
 			if (currentToolCall && currentParamName && trimmed === `</${currentParamName}>`) {
 				// End of a tool parameter
 				currentToolCall.params[currentParamName] = currentParamValueLines.join("\n")
 				currentParamName = undefined
 				currentParamValueLines = []
 				// currentParamValue = undefined
 				continue
 			} else if (currentToolCall && !currentParamName && trimmed === `</${currentToolCall.name}>`) {
 				// End of a tool call
 				currentToolCall.partial = false
 				toolCalls.push(currentToolCall)
 				currentToolCall = undefined
 				continue
 			}
 			if (!currentParamName && trimmed.startsWith("<") && trimmed.endsWith(">")) {
 				const tag = trimmed.slice(1, -1)
 				if (toolCallNames.includes(tag as ToolCallName)) {
 					// Start of a new tool call
 					currentToolCall = { type: "tool_call", name: tag as ToolCallName, params: {}, partial: true }
 					// This also indicates the end of the text content
 					textContent.partial = false
 					continue
 				} else if (currentToolCall && toolParamNames.includes(tag as ToolParamName)) {
 					// Start of a parameter
 					currentParamName = tag as ToolParamName
 					// currentToolCall.params[currentParamName] = ""
 					continue
 				}
 			}
 			if (currentToolCall && !currentParamName) {
 				// current tool doesn't have a param match yet, it's likely partial so ignore
 				continue
 			}
 			if (currentToolCall && currentParamName) {
 				// add line to current param value
 				currentParamValueLines.push(line)
 				continue
 			}
 			// only add text content if we haven't started a tool yet
 			if (textContent.partial) {
 				textContentLines.push(line)
 			}
 		}
 		if (currentToolCall) {
 			// stream did not complete tool call, add it as partial
 			if (currentParamName) {
 				// tool call has a parameter that was not completed
 				currentToolCall.params[currentParamName] = currentParamValueLines.join("\n")
 			}
 			toolCalls.push(currentToolCall)
 		}
 		textContent.content = textContentLines.join("\n")
 		this.assistantMessageContent = [textContent, ...toolCalls]
 		// Present the updated content
 		this.presentAssistantMessage()
 	}
 	async recursivelyMakeClaudeRequests(
@@ -2412,11 +2566,18 @@ ${this.customInstructions.trim()}
 			// todo add error listeners so we can return api error? or wil lfor await handle that below?
-			// let contentBlocks: AnthropicPartialContentBlock[] = []
+			let apiContentBlocks: Anthropic.ContentBlock[] = []
-			this.assistantContentBlocks = []
+			this.currentStreamingContentIndex = 0
 			this.assistantMessageContent = []
 			this.didCompleteReadingStream = false
-			this.currentStreamingContentBlockIndex = 0
+			this.userMessageContent = []
-			this.chunkIndexToJsonParser.clear()
+			this.userMessageContentReady = false
 			this.didRejectTool = false
 			this.presentAssistantMessageLocked = false
 			this.presentAssistantMessageHasPendingUpdates = false
 			this.parseTextStreamAccumulator = ""
 			// this.chunkIndexToJsonParser.clear()
 			for await (const chunk of stream) {
 				switch (chunk.type) {
 					case "message_start":
@@ -2443,24 +2604,37 @@ ${this.customInstructions.trim()}
 						switch (chunk.content_block.type) {
 							case "text":
 								console.log("text", chunk.content_block.text)
-								this.assistantContentBlocks.push(chunk.content_block)
+								// this.assistantContentBlocks.push({
-								this.assistantContentBlocks.at(-1)!.partial = true
+								// 	text: chunk.content_block.text,
-								this.presentAssistantContent()
+								// 	toolCalls: [],
 								// 	partial: true,
 								// })
 								apiContentBlocks.push(chunk.content_block)
 								// we may receive multiple text blocks, in which case just insert a line break between them
 								if (chunk.index > 0) {
 									this.parseTextStream("\n")
 								}
 								this.parseTextStream(chunk.content_block.text)
 								// this.assistantContentBlocks.at(-1)!.partial = true
 								this.presentAssistantMessage()
 								break
-							case "tool_use":
+							// case "tool_use":
-								console.log(
+							// 	console.log(
-									"tool_use",
+							// 		"tool_use",
-									chunk.index,
+							// 		chunk.index,
-									chunk.content_block.id,
+							// 		chunk.content_block.id,
-									chunk.content_block.name,
+							// 		chunk.content_block.name,
-									chunk.content_block.input // input is always object, which will be streamed as partial json in content_block_delta. (this initial 'input' will always be an empty object)
+							// 		chunk.content_block.input // input is always object, which will be streamed as partial json in content_block_delta. (this initial 'input' will always be an empty object)
-								)
+							// 	)
-								this.assistantContentBlocks.push(chunk.content_block)
+							// 	apiContentBlocks.push(chunk.content_block)
-								this.assistantContentBlocks.at(-1)!.partial = true
+							// 	this.assistantContentBlocks.push(chunk.content_block)
-								this.presentAssistantContent()
+							// 	this.assistantContentBlocks.at(-1)!.partial = true
-								// Initialize the JSON parser with partial tokens enabled
+							// 	this.presentAssistantContent()
-								// partialJsonParser =
+							// // Initialize the JSON parser with partial tokens enabled
-								this.getJsonParserForChunk(chunk.index)
+							// // partialJsonParser =
 							// this.getJsonParserForChunk(chunk.index)
 						}
 						break
 					case "content_block_delta":
@@ -2468,42 +2642,42 @@ ${this.customInstructions.trim()}
 						switch (chunk.delta.type) {
 							case "text_delta":
 								console.log("text_delta", chunk.delta.text)
-								;(this.assistantContentBlocks[chunk.index] as Anthropic.TextBlock).text +=
+								;(apiContentBlocks[chunk.index] as Anthropic.TextBlock).text += chunk.delta.text
-									chunk.delta.text
+								this.parseTextStream(chunk.delta.text)
-								this.presentAssistantContent()
+								this.presentAssistantMessage()
 								break
-							case "input_json_delta":
+							// case "input_json_delta":
-								console.log("input_json_delta", chunk.delta.partial_json)
+							// 	console.log("input_json_delta", chunk.delta.partial_json)
 								try {
 									this.getJsonParserForChunk(chunk.index).write(chunk.delta.partial_json)
 								} catch (error) {
 									console.error("Error parsing input_json_delta", error)
 								}
 							// 	try {
-								// 	// JSONParser will always give us a token unless we pass in an empty/undefined value (in which case the promise would never resolve)
+							// 		// this.getJsonParserForChunk(chunk.index).write(chunk.delta.partial_json)
 								// 	if (chunk.delta.partial_json) {
 								// 		// need to await this since we dont want to create multiple jsonparsers in case the read stream comes in faster than the jsonparser can parse
 								// 		await this.updateAssistantContentWithPartialJson(
 								// 			chunk.index,
 								// 			chunk.delta.partial_json
 								// 		)
 								// 	}
 							// 	} catch (error) {
 								// 	// may be due to timeout, in which case we can safely ignore
 							// 		console.error("Error parsing input_json_delta", error)
 							// 	}
-								// this.presentAssistantContent()
+
-								break
+							// 	// try {
 							// 	// 	// JSONParser will always give us a token unless we pass in an empty/undefined value (in which case the promise would never resolve)
 							// 	// 	if (chunk.delta.partial_json) {
 							// 	// 		// need to await this since we dont want to create multiple jsonparsers in case the read stream comes in faster than the jsonparser can parse
 							// 	// 		await this.updateAssistantContentWithPartialJson(
 							// 	// 			chunk.index,
 							// 	// 			chunk.delta.partial_json
 							// 	// 		)
 							// 	// 	}
 							// 	// } catch (error) {
 							// 	// 	// may be due to timeout, in which case we can safely ignore
 							// 	// 	console.error("Error parsing input_json_delta", error)
 							// 	// }
 							// 	// this.presentAssistantContent()
 							// 	break
 						}
 						break
 					case "content_block_stop":
-						if (this.assistantContentBlocks[chunk.index]!.type === "text") {
+						// if (apiContentBlocks[chunk.index]!.type === "text") {
-							// we only call this for text block since partialJsonParser handles calling this for tool_use blocks (we only eve want to set partial to false and presentAssistantContent once for each block)
+						// 	// we only call this for text block since partialJsonParser handles calling this for tool_use blocks (we only eve want to set partial to false and presentAssistantContent once for each block)
-							console.log(11)
+						// 	console.log(11)
-							this.assistantContentBlocks[chunk.index]!.partial = false
+						// 	this.assistantContentBlocks[chunk.index]!.partial = false
-							this.presentAssistantContent()
+						// 	this.presentAssistantContent()
-						}
+						// }
 						console.log("content_block_stop", chunk.index)
@@ -2514,7 +2688,7 @@ ${this.customInstructions.trim()}
 			}
 			this.didCompleteReadingStream = true
-			console.log("contentBlocks", this.assistantContentBlocks)
+			console.log("contentBlocks", apiContentBlocks)
 			let totalCost: string | undefined
@@ -2539,19 +2713,19 @@ ${this.customInstructions.trim()}
 			// now add to apiconversationhistory
 			// need to save assistant responses to file before proceeding to tool use since user can exit at any moment and we wouldn't be able to save the assistant's response
 			let didEndLoop = false
-			if (this.assistantContentBlocks.length > 0) {
+			if (apiContentBlocks.length > 0) {
 				// Remove 'partial' prop from assistantContentBlocks
-				const blocksWithoutPartial: Anthropic.Messages.ContentBlock[] = this.assistantContentBlocks.map(
+				// const blocksWithoutPartial: Anthropic.Messages.ContentBlock[] = this.assistantContentBlocks.map(
-					(block) => {
+				// 	(block) => {
-						const { partial, ...rest } = block
+				// 		const { partial, ...rest } = block
-						return rest
+				// 		return rest
-					}
+				// 	}
-				)
+				// )
-				await this.addToApiConversationHistory({ role: "assistant", content: blocksWithoutPartial })
+				await this.addToApiConversationHistory({ role: "assistant", content: apiContentBlocks })
-				await pWaitFor(() => this.toolResultsReady)
+				await pWaitFor(() => this.userMessageContentReady)
-				const recDidEndLoop = await this.recursivelyMakeClaudeRequests(this.toolResults)
+				const recDidEndLoop = await this.recursivelyMakeClaudeRequests(this.userMessageContent)
 				didEndLoop = recDidEndLoop
 			} else {
 				// this should never happen! it there's no assistant_responses, that means we got no text or tool_use content blocks from API which we should assume is an error
--- a/src/core/prompts/system.ts
+++ b/src/core/prompts/system.ts
@@ -70,4 +70,222 @@ Operating System: ${osName()}
 Default Shell: ${defaultShell}
 Home Directory: ${os.homedir().toPosix()}
 Current Working Directory: ${cwd.toPosix()}
 ====
 INSTRUCTIONS FOR FORMULATING YOUR RESPONSE
 You must respond to the user's request by using at least one tool call. When formulating your response, follow these guidelines:
 1. Begin your response with normal text, explaining your thoughts, analysis, or plan of action.
 2. If you need to use any tools, place ALL tool calls at the END of your message, after your normal text explanation.
 3. You can use multiple tool calls if needed, but they should all be grouped together at the end of your message.
 4. After placing the tool calls, do not add any additional normal text. The tool calls should be the final content in your message.
 Here's the general structure your responses should follow:
 \`\`\`
 [Your normal text response explaining your thoughts and actions]
 [Tool Call 1]
 [Tool Call 2 if needed]
 [Tool Call 3 if needed]
 ...
 \`\`\`
 Remember:
 - Choose the most appropriate tool(s) based on the task and the tool descriptions provided.
 - Formulate your tool calls using the XML format specified for each tool.
 - Provide clear explanations in your normal text about what actions you're taking and why you're using particular tools.
 - Act as if the tool calls will be executed immediately after your message, and your next response will have access to their results.
 # Tool Descriptions and XML Formats
 ## execute_command
 <execute_command>
 <command>
 Your command here
 </command>
 </execute_command>
 Description: Execute a CLI command on the system. Use this when you need to perform system operations or run specific commands to accomplish any step in the user's task. You must tailor your command to the user's system and provide a clear explanation of what the command does. Prefer to execute complex CLI commands over creating executable scripts, as they are more flexible and easier to run. Commands will be executed in the current working directory: ${cwd.toPosix()}
 Parameters:
 - command: (required) The CLI command to execute. This should be valid for the current operating system. Ensure the command is properly formatted and does not contain any harmful instructions.
 ## read_file
 <read_file>
 <path>
 File path here
 </path>
 </read_file>
 Description: Read the contents of a file at the specified path. Use this when you need to examine the contents of an existing file, for example to analyze code, review text files, or extract information from configuration files. Automatically extracts raw text from PDF and DOCX files. May not be suitable for other types of binary files, as it returns the raw content as a string.
 Parameters:
 - path: (required) The path of the file to read (relative to the current working directory ${cwd.toPosix()})
 ## write_to_file
 <write_to_file>
 <path>
 File path here
 </path>
 <content>
 Your file content here
 </content>
 </write_to_file>
 Description: Write content to a file at the specified path. If the file exists, it will be overwritten with the provided content. If the file doesn't exist, it will be created. Always provide the full intended content of the file, without any truncation. This tool will automatically create any directories needed to write the file.
 Parameters:
 - path: (required) The path of the file to write to (relative to the current working directory ${cwd.toPosix()})
 - content: (required) The full content to write to the file.
 ## search_files
 <search_files>
 <path>
 Directory path here
 </path>
 <regex>
 Your regex pattern here
 </regex>
 <file_pattern>
 Optional file pattern here
 </file_pattern>
 </search_files>
 Description: Perform a regex search across files in a specified directory, providing context-rich results. This tool searches for patterns or specific content across multiple files, displaying each match with encapsulating context.
 Parameters:
 - path: (required) The path of the directory to search in (relative to the current working directory ${cwd.toPosix()}). This directory will be recursively searched.
 - regex: (required) The regular expression pattern to search for. Uses Rust regex syntax.
 - file_pattern: (optional) Glob pattern to filter files (e.g., '*.ts' for TypeScript files). If not provided, it will search all files (*).
 ## list_files
 <list_files>
 <path>
 Directory path here
 </path>
 <recursive>
 true or false (optional)
 </recursive>
 </list_files>
 Description: List files and directories within the specified directory. If recursive is true, it will list all files and directories recursively. If recursive is false or not provided, it will only list the top-level contents.
 Parameters:
 - path: (required) The path of the directory to list contents for (relative to the current working directory ${cwd.toPosix()})
 - recursive: (optional) Whether to list files recursively. Use true for recursive listing, false or omit for top-level only.
 ## list_code_definition_names
 <list_code_definition_names>
 <path>
 Directory path here
 </path>
 </list_code_definition_names>
 Description: Lists definition names (classes, functions, methods, etc.) used in source code files at the top level of the specified directory. This tool provides insights into the codebase structure and important constructs, encapsulating high-level concepts and relationships that are crucial for understanding the overall architecture.
 Parameters:
 - path: (required) The path of the directory (relative to the current working directory ${cwd.toPosix()}) to list top level source code definitions for.${
 	supportsImages
 		? `
 ## inspect_site
 <inspect_site>
 <url>
 URL of the site to inspect
 </url>
 </inspect_site>
 Description: Captures a screenshot and console logs of the initial state of a website. This tool navigates to the specified URL, takes a screenshot of the entire page as it appears immediately after loading, and collects any console logs or errors that occur during page load. It does not interact with the page or capture any state changes after the initial load.
 Parameters:
 - url: (required) The URL of the site to inspect. This should be a valid URL including the protocol (e.g. http://localhost:3000/page, file:///path/to/file.html, etc.)`
 		: ""
 }
 ## ask_followup_question
 <ask_followup_question>
 <question>
 Your question here
 </question>
 </ask_followup_question>
 Description: Ask the user a question to gather additional information needed to complete the task. This tool should be used when you encounter ambiguities, need clarification, or require more details to proceed effectively. It allows for interactive problem-solving by enabling direct communication with the user. Use this tool judiciously to maintain a balance between gathering necessary information and avoiding excessive back-and-forth.
 Parameters:
 - question: (required) The question to ask the user. This should be a clear, specific question that addresses the information you need.
 ## attempt_completion
 <attempt_completion>
 <result>
 Your final result description here
 </result>
 <command>
 Optional command to demonstrate result
 </command>
 </attempt_completion>
 Description: Once you've completed the task, use this tool to present the result to the user. Optionally you may provide a CLI command to showcase the result of your work, but avoid using commands like 'echo' or 'cat' that merely print text. They may respond with feedback if they are not satisfied with the result, which you can use to make improvements and try again.
 Parameters:
 - result: (required) The result of the task. Formulate this result in a way that is final and does not require further input from the user. Don't end your result with questions or offers for further assistance.
 - command: (optional) A CLI command to execute to show a live demo of the result to the user. For example, use 'open index.html' to display a created website. This command should be valid for the current operating system. Ensure the command is properly formatted and does not contain any harmful instructions.
 # Examples
 Here are some examples of how to structure your responses with tool calls:
 ## Example 1: Using a single tool
 Let's run the test suite for our project. This will help us ensure that all our components are functioning correctly.
 <execute_command>
 <command>
 npm test
 </command>
 </execute_command>
 ## Example 2: Using multiple tools
 Let's create two new configuration files for the web application, one for the frontend and one for the backend.
 <write_to_file>
 <path>
 ./frontend-config.json
 </path>
 <content>
 {
  "apiEndpoint": "https://api.example.com",
  "theme": {
    "primaryColor": "#007bff",
    "secondaryColor": "#6c757d",
    "fontFamily": "Arial, sans-serif"
  },
  "features": {
    "darkMode": true,
    "notifications": true,
    "analytics": false
  },
  "version": "1.0.0"
 }
 </content>
 </write_to_file>
 <write_to_file>
 <path>
 ./backend-config.yaml
 </path>
 <content>
 database:
  host: localhost
  port: 5432
  name: myapp_db
  user: admin
 server:
  port: 3000
  environment: development
  logLevel: debug
 externalServices:
  emailProvider: sendgrid
  storageProvider: aws-s3
 </content>
 </write_to_file>
 ## Example 3: Asking a follow-up question
 I've analyzed the project structure, but I need more information to proceed. Let me ask the user for clarification.
 <ask_followup_question>
 <question>
 Which specific feature would you like me to implement in the example.py file?
 </question>
 </ask_followup_question>
 `