mirror of
https://github.com/pacnpal/Roo-Code.git
synced 2025-12-19 20:01:08 -05:00
573 lines
17 KiB
TypeScript
573 lines
17 KiB
TypeScript
import deepEqual from "fast-deep-equal"
|
|
import React, { memo, useEffect, useMemo, useRef, useState } from "react"
|
|
import { useSize } from "react-use"
|
|
import { useExtensionState } from "../../context/ExtensionStateContext"
|
|
import {
|
|
BrowserAction,
|
|
BrowserActionResult,
|
|
ClineMessage,
|
|
ClineSayBrowserAction,
|
|
} from "../../../../src/shared/ExtensionMessage"
|
|
import { vscode } from "../../utils/vscode"
|
|
import CodeBlock, { CODE_BLOCK_BG_COLOR } from "../common/CodeBlock"
|
|
import { ChatRowContent, ProgressIndicator } from "./ChatRow"
|
|
import { VSCodeButton } from "@vscode/webview-ui-toolkit/react"
|
|
|
|
interface BrowserSessionRowProps {
|
|
messages: ClineMessage[]
|
|
isExpanded: (messageTs: number) => boolean
|
|
onToggleExpand: (messageTs: number) => void
|
|
lastModifiedMessage?: ClineMessage
|
|
isLast: boolean
|
|
onHeightChange: (isTaller: boolean) => void
|
|
isStreaming: boolean
|
|
}
|
|
|
|
const BrowserSessionRow = memo((props: BrowserSessionRowProps) => {
|
|
const { messages, isLast, onHeightChange, lastModifiedMessage } = props
|
|
const prevHeightRef = useRef(0)
|
|
const [maxActionHeight, setMaxActionHeight] = useState(0)
|
|
const [consoleLogsExpanded, setConsoleLogsExpanded] = useState(false)
|
|
|
|
const { browserViewportSize = "900x600" } = useExtensionState()
|
|
const [viewportWidth, viewportHeight] = browserViewportSize.split("x").map(Number)
|
|
const aspectRatio = ((viewportHeight / viewportWidth) * 100).toFixed(2)
|
|
const defaultMousePosition = `${Math.round(viewportWidth / 2)},${Math.round(viewportHeight / 2)}`
|
|
|
|
const isLastApiReqInterrupted = useMemo(() => {
|
|
// Check if last api_req_started is cancelled
|
|
const lastApiReqStarted = [...messages].reverse().find((m) => m.say === "api_req_started")
|
|
if (lastApiReqStarted?.text != null) {
|
|
const info = JSON.parse(lastApiReqStarted.text)
|
|
if (info.cancelReason != null) {
|
|
return true
|
|
}
|
|
}
|
|
const lastApiReqFailed = isLast && lastModifiedMessage?.ask === "api_req_failed"
|
|
if (lastApiReqFailed) {
|
|
return true
|
|
}
|
|
return false
|
|
}, [messages, lastModifiedMessage, isLast])
|
|
|
|
const isBrowsing = useMemo(() => {
|
|
return isLast && messages.some((m) => m.say === "browser_action_result") && !isLastApiReqInterrupted // after user approves, browser_action_result with "" is sent to indicate that the session has started
|
|
}, [isLast, messages, isLastApiReqInterrupted])
|
|
|
|
// Organize messages into pages with current state and next action
|
|
const pages = useMemo(() => {
|
|
const result: {
|
|
currentState: {
|
|
url?: string
|
|
screenshot?: string
|
|
mousePosition?: string
|
|
consoleLogs?: string
|
|
messages: ClineMessage[] // messages up to and including the result
|
|
}
|
|
nextAction?: {
|
|
messages: ClineMessage[] // messages leading to next result
|
|
}
|
|
}[] = []
|
|
|
|
let currentStateMessages: ClineMessage[] = []
|
|
let nextActionMessages: ClineMessage[] = []
|
|
|
|
messages.forEach((message) => {
|
|
if (message.ask === "browser_action_launch") {
|
|
// Start first page
|
|
currentStateMessages = [message]
|
|
} else if (message.say === "browser_action_result") {
|
|
if (message.text === "") {
|
|
// first browser_action_result is an empty string that signals that session has started
|
|
return
|
|
}
|
|
// Complete current state
|
|
currentStateMessages.push(message)
|
|
const resultData = JSON.parse(message.text || "{}") as BrowserActionResult
|
|
|
|
// Add page with current state and previous next actions
|
|
result.push({
|
|
currentState: {
|
|
url: resultData.currentUrl,
|
|
screenshot: resultData.screenshot,
|
|
mousePosition: resultData.currentMousePosition,
|
|
consoleLogs: resultData.logs,
|
|
messages: [...currentStateMessages],
|
|
},
|
|
nextAction:
|
|
nextActionMessages.length > 0
|
|
? {
|
|
messages: [...nextActionMessages],
|
|
}
|
|
: undefined,
|
|
})
|
|
|
|
// Reset for next page
|
|
currentStateMessages = []
|
|
nextActionMessages = []
|
|
} else if (
|
|
message.say === "api_req_started" ||
|
|
message.say === "text" ||
|
|
message.say === "browser_action"
|
|
) {
|
|
// These messages lead to the next result, so they should always go in nextActionMessages
|
|
nextActionMessages.push(message)
|
|
} else {
|
|
// Any other message types
|
|
currentStateMessages.push(message)
|
|
}
|
|
})
|
|
|
|
// Add incomplete page if exists
|
|
if (currentStateMessages.length > 0 || nextActionMessages.length > 0) {
|
|
result.push({
|
|
currentState: {
|
|
messages: [...currentStateMessages],
|
|
},
|
|
nextAction:
|
|
nextActionMessages.length > 0
|
|
? {
|
|
messages: [...nextActionMessages],
|
|
}
|
|
: undefined,
|
|
})
|
|
}
|
|
|
|
return result
|
|
}, [messages])
|
|
|
|
// Auto-advance to latest page
|
|
const [currentPageIndex, setCurrentPageIndex] = useState(0)
|
|
useEffect(() => {
|
|
setCurrentPageIndex(pages.length - 1)
|
|
}, [pages.length])
|
|
|
|
// Get initial URL from launch message
|
|
const initialUrl = useMemo(() => {
|
|
const launchMessage = messages.find((m) => m.ask === "browser_action_launch")
|
|
return launchMessage?.text || ""
|
|
}, [messages])
|
|
|
|
// Find the latest available URL and screenshot
|
|
const latestState = useMemo(() => {
|
|
for (let i = pages.length - 1; i >= 0; i--) {
|
|
const page = pages[i]
|
|
if (page.currentState.url || page.currentState.screenshot) {
|
|
return {
|
|
url: page.currentState.url,
|
|
mousePosition: page.currentState.mousePosition,
|
|
consoleLogs: page.currentState.consoleLogs,
|
|
screenshot: page.currentState.screenshot,
|
|
}
|
|
}
|
|
}
|
|
return { url: undefined, mousePosition: undefined, consoleLogs: undefined, screenshot: undefined }
|
|
}, [pages])
|
|
|
|
const currentPage = pages[currentPageIndex]
|
|
const isLastPage = currentPageIndex === pages.length - 1
|
|
|
|
// Use latest state if we're on the last page and don't have a state yet
|
|
const displayState = isLastPage
|
|
? {
|
|
url: currentPage?.currentState.url || latestState.url || initialUrl,
|
|
mousePosition:
|
|
currentPage?.currentState.mousePosition || latestState.mousePosition || defaultMousePosition,
|
|
consoleLogs: currentPage?.currentState.consoleLogs,
|
|
screenshot: currentPage?.currentState.screenshot || latestState.screenshot,
|
|
}
|
|
: {
|
|
url: currentPage?.currentState.url || initialUrl,
|
|
mousePosition: currentPage?.currentState.mousePosition || defaultMousePosition,
|
|
consoleLogs: currentPage?.currentState.consoleLogs,
|
|
screenshot: currentPage?.currentState.screenshot,
|
|
}
|
|
|
|
const [actionContent, { height: actionHeight }] = useSize(
|
|
<div>
|
|
{currentPage?.nextAction?.messages.map((message) => (
|
|
<BrowserSessionRowContent
|
|
key={message.ts}
|
|
{...props}
|
|
message={message}
|
|
setMaxActionHeight={setMaxActionHeight}
|
|
/>
|
|
))}
|
|
{!isBrowsing && messages.some((m) => m.say === "browser_action_result") && currentPageIndex === 0 && (
|
|
<BrowserActionBox action={"launch"} text={initialUrl} />
|
|
)}
|
|
</div>,
|
|
)
|
|
|
|
useEffect(() => {
|
|
if (actionHeight === 0 || actionHeight === Infinity) {
|
|
return
|
|
}
|
|
if (actionHeight > maxActionHeight) {
|
|
setMaxActionHeight(actionHeight)
|
|
}
|
|
}, [actionHeight, maxActionHeight])
|
|
|
|
// Track latest click coordinate
|
|
const latestClickPosition = useMemo(() => {
|
|
if (!isBrowsing) return undefined
|
|
|
|
// Look through current page's next actions for the latest browser_action
|
|
const actions = currentPage?.nextAction?.messages || []
|
|
for (let i = actions.length - 1; i >= 0; i--) {
|
|
const message = actions[i]
|
|
if (message.say === "browser_action") {
|
|
const browserAction = JSON.parse(message.text || "{}") as ClineSayBrowserAction
|
|
if (browserAction.action === "click" && browserAction.coordinate) {
|
|
return browserAction.coordinate
|
|
}
|
|
}
|
|
}
|
|
return undefined
|
|
}, [isBrowsing, currentPage?.nextAction?.messages])
|
|
|
|
// Use latest click position while browsing, otherwise use display state
|
|
const mousePosition = isBrowsing
|
|
? latestClickPosition || displayState.mousePosition
|
|
: displayState.mousePosition || defaultMousePosition
|
|
|
|
const [browserSessionRow, { height: rowHeight }] = useSize(
|
|
<div style={{ padding: "10px 6px 10px 15px", marginBottom: -10 }}>
|
|
<div style={{ display: "flex", alignItems: "center", gap: "10px", marginBottom: "10px" }}>
|
|
{isBrowsing ? (
|
|
<ProgressIndicator />
|
|
) : (
|
|
<span
|
|
className={`codicon codicon-inspect`}
|
|
style={{ color: "var(--vscode-foreground)", marginBottom: "-1.5px" }}></span>
|
|
)}
|
|
<span style={{ fontWeight: "bold" }}>
|
|
<>Roo wants to use the browser:</>
|
|
</span>
|
|
</div>
|
|
<div
|
|
style={{
|
|
borderRadius: 3,
|
|
border: "1px solid var(--vscode-editorGroup-border)",
|
|
overflow: "hidden",
|
|
backgroundColor: CODE_BLOCK_BG_COLOR,
|
|
marginBottom: 10,
|
|
}}>
|
|
{/* URL Bar */}
|
|
<div
|
|
style={{
|
|
margin: "5px auto",
|
|
width: "calc(100% - 10px)",
|
|
boxSizing: "border-box", // includes padding in width calculation
|
|
backgroundColor: "var(--vscode-input-background)",
|
|
border: "1px solid var(--vscode-input-border)",
|
|
borderRadius: "4px",
|
|
padding: "3px 5px",
|
|
display: "flex",
|
|
alignItems: "center",
|
|
justifyContent: "center",
|
|
color: displayState.url
|
|
? "var(--vscode-input-foreground)"
|
|
: "var(--vscode-descriptionForeground)",
|
|
fontSize: "12px",
|
|
}}>
|
|
<div
|
|
style={{
|
|
textOverflow: "ellipsis",
|
|
overflow: "hidden",
|
|
whiteSpace: "nowrap",
|
|
width: "100%",
|
|
textAlign: "center",
|
|
}}>
|
|
{displayState.url || "http"}
|
|
</div>
|
|
</div>
|
|
|
|
{/* Screenshot Area */}
|
|
<div
|
|
data-testid="screenshot-container"
|
|
style={{
|
|
width: "100%",
|
|
paddingBottom: `${aspectRatio}%`, // height/width ratio
|
|
position: "relative",
|
|
backgroundColor: "var(--vscode-input-background)",
|
|
}}>
|
|
{displayState.screenshot ? (
|
|
<img
|
|
src={displayState.screenshot}
|
|
alt="Browser screenshot"
|
|
style={{
|
|
position: "absolute",
|
|
top: 0,
|
|
left: 0,
|
|
width: "100%",
|
|
height: "100%",
|
|
objectFit: "contain",
|
|
cursor: "pointer",
|
|
}}
|
|
onClick={() =>
|
|
vscode.postMessage({
|
|
type: "openImage",
|
|
text: displayState.screenshot,
|
|
})
|
|
}
|
|
/>
|
|
) : (
|
|
<div
|
|
style={{
|
|
position: "absolute",
|
|
top: "50%",
|
|
left: "50%",
|
|
transform: "translate(-50%, -50%)",
|
|
}}>
|
|
<span
|
|
className="codicon codicon-globe"
|
|
style={{ fontSize: "80px", color: "var(--vscode-descriptionForeground)" }}
|
|
/>
|
|
</div>
|
|
)}
|
|
{displayState.mousePosition && (
|
|
<BrowserCursor
|
|
style={{
|
|
position: "absolute",
|
|
top: `${(parseInt(mousePosition.split(",")[1]) / viewportHeight) * 100}%`,
|
|
left: `${(parseInt(mousePosition.split(",")[0]) / viewportWidth) * 100}%`,
|
|
transition: "top 0.3s ease-out, left 0.3s ease-out",
|
|
}}
|
|
/>
|
|
)}
|
|
</div>
|
|
|
|
<div style={{ width: "100%" }}>
|
|
<div
|
|
onClick={() => {
|
|
setConsoleLogsExpanded(!consoleLogsExpanded)
|
|
}}
|
|
style={{
|
|
display: "flex",
|
|
alignItems: "center",
|
|
gap: "4px",
|
|
width: "100%",
|
|
justifyContent: "flex-start",
|
|
cursor: "pointer",
|
|
padding: `9px 8px ${consoleLogsExpanded ? 0 : 8}px 8px`,
|
|
}}>
|
|
<span className={`codicon codicon-chevron-${consoleLogsExpanded ? "down" : "right"}`}></span>
|
|
<span style={{ fontSize: "0.8em" }}>Console Logs</span>
|
|
</div>
|
|
{consoleLogsExpanded && (
|
|
<CodeBlock source={`${"```"}shell\n${displayState.consoleLogs || "(No new logs)"}\n${"```"}`} />
|
|
)}
|
|
</div>
|
|
</div>
|
|
|
|
{/* Action content with min height */}
|
|
<div style={{ minHeight: maxActionHeight }}>{actionContent}</div>
|
|
|
|
{/* Pagination moved to bottom */}
|
|
{pages.length > 1 && (
|
|
<div
|
|
style={{
|
|
display: "flex",
|
|
justifyContent: "space-between",
|
|
alignItems: "center",
|
|
padding: "8px 0px",
|
|
marginTop: "15px",
|
|
borderTop: "1px solid var(--vscode-editorGroup-border)",
|
|
}}>
|
|
<div>
|
|
Step {currentPageIndex + 1} of {pages.length}
|
|
</div>
|
|
<div style={{ display: "flex", gap: "4px" }}>
|
|
<VSCodeButton
|
|
disabled={currentPageIndex === 0 || isBrowsing}
|
|
onClick={() => setCurrentPageIndex((i) => i - 1)}>
|
|
Previous
|
|
</VSCodeButton>
|
|
<VSCodeButton
|
|
disabled={currentPageIndex === pages.length - 1 || isBrowsing}
|
|
onClick={() => setCurrentPageIndex((i) => i + 1)}>
|
|
Next
|
|
</VSCodeButton>
|
|
</div>
|
|
</div>
|
|
)}
|
|
</div>,
|
|
)
|
|
|
|
// Height change effect
|
|
useEffect(() => {
|
|
const isInitialRender = prevHeightRef.current === 0
|
|
if (isLast && rowHeight !== 0 && rowHeight !== Infinity && rowHeight !== prevHeightRef.current) {
|
|
if (!isInitialRender) {
|
|
onHeightChange(rowHeight > prevHeightRef.current)
|
|
}
|
|
prevHeightRef.current = rowHeight
|
|
}
|
|
}, [rowHeight, isLast, onHeightChange])
|
|
|
|
return browserSessionRow
|
|
}, deepEqual)
|
|
|
|
interface BrowserSessionRowContentProps extends Omit<BrowserSessionRowProps, "messages"> {
|
|
message: ClineMessage
|
|
setMaxActionHeight: (height: number) => void
|
|
isStreaming: boolean
|
|
}
|
|
|
|
const BrowserSessionRowContent = ({
|
|
message,
|
|
isExpanded,
|
|
onToggleExpand,
|
|
lastModifiedMessage,
|
|
isLast,
|
|
setMaxActionHeight,
|
|
isStreaming,
|
|
}: BrowserSessionRowContentProps) => {
|
|
const headerStyle: React.CSSProperties = {
|
|
display: "flex",
|
|
alignItems: "center",
|
|
gap: "10px",
|
|
marginBottom: "10px",
|
|
}
|
|
|
|
switch (message.type) {
|
|
case "say":
|
|
switch (message.say) {
|
|
case "api_req_started":
|
|
case "text":
|
|
return (
|
|
<div style={{ padding: "10px 0 10px 0" }}>
|
|
<ChatRowContent
|
|
message={message}
|
|
isExpanded={isExpanded(message.ts)}
|
|
onToggleExpand={() => {
|
|
if (message.say === "api_req_started") {
|
|
setMaxActionHeight(0)
|
|
}
|
|
onToggleExpand(message.ts)
|
|
}}
|
|
lastModifiedMessage={lastModifiedMessage}
|
|
isLast={isLast}
|
|
isStreaming={isStreaming}
|
|
/>
|
|
</div>
|
|
)
|
|
|
|
case "browser_action":
|
|
const browserAction = JSON.parse(message.text || "{}") as ClineSayBrowserAction
|
|
return (
|
|
<BrowserActionBox
|
|
action={browserAction.action}
|
|
coordinate={browserAction.coordinate}
|
|
text={browserAction.text}
|
|
/>
|
|
)
|
|
|
|
default:
|
|
return null
|
|
}
|
|
|
|
case "ask":
|
|
switch (message.ask) {
|
|
case "browser_action_launch":
|
|
return (
|
|
<>
|
|
<div style={headerStyle}>
|
|
<span style={{ fontWeight: "bold" }}>Browser Session Started</span>
|
|
</div>
|
|
<div
|
|
style={{
|
|
borderRadius: 3,
|
|
border: "1px solid var(--vscode-editorGroup-border)",
|
|
overflow: "hidden",
|
|
backgroundColor: CODE_BLOCK_BG_COLOR,
|
|
}}>
|
|
<CodeBlock source={`${"```"}shell\n${message.text}\n${"```"}`} forceWrap={true} />
|
|
</div>
|
|
</>
|
|
)
|
|
|
|
default:
|
|
return null
|
|
}
|
|
}
|
|
}
|
|
|
|
const BrowserActionBox = ({
|
|
action,
|
|
coordinate,
|
|
text,
|
|
}: {
|
|
action: BrowserAction
|
|
coordinate?: string
|
|
text?: string
|
|
}) => {
|
|
const getBrowserActionText = (action: BrowserAction, coordinate?: string, text?: string) => {
|
|
switch (action) {
|
|
case "launch":
|
|
return `Launch browser at ${text}`
|
|
case "click":
|
|
return `Click (${coordinate?.replace(",", ", ")})`
|
|
case "type":
|
|
return `Type "${text}"`
|
|
case "scroll_down":
|
|
return "Scroll down"
|
|
case "scroll_up":
|
|
return "Scroll up"
|
|
case "close":
|
|
return "Close browser"
|
|
default:
|
|
return action
|
|
}
|
|
}
|
|
return (
|
|
<div style={{ padding: "10px 0 0 0" }}>
|
|
<div
|
|
style={{
|
|
borderRadius: 3,
|
|
backgroundColor: CODE_BLOCK_BG_COLOR,
|
|
overflow: "hidden",
|
|
border: "1px solid var(--vscode-editorGroup-border)",
|
|
}}>
|
|
<div
|
|
style={{
|
|
display: "flex",
|
|
alignItems: "center",
|
|
padding: "9px 10px",
|
|
}}>
|
|
<span
|
|
style={{
|
|
whiteSpace: "normal",
|
|
wordBreak: "break-word",
|
|
}}>
|
|
<span style={{ fontWeight: 500 }}>Browse Action: </span>
|
|
{getBrowserActionText(action, coordinate, text)}
|
|
</span>
|
|
</div>
|
|
</div>
|
|
</div>
|
|
)
|
|
}
|
|
|
|
const BrowserCursor: React.FC<{ style?: React.CSSProperties }> = ({ style }) => {
|
|
// (can't use svgs in vsc extensions)
|
|
const cursorBase64 =
|
|
""
|
|
|
|
return (
|
|
<img
|
|
src={cursorBase64}
|
|
style={{
|
|
width: "17px",
|
|
height: "22px",
|
|
...style,
|
|
}}
|
|
alt="cursor"
|
|
aria-label="cursor"
|
|
/>
|
|
)
|
|
}
|
|
|
|
export default BrowserSessionRow
|