| 123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470471472473474475476477478479480481482483484485486487488489490491492493494495496497498499500501502503504505506507508509510511512513514515516517518519520521522523524525526527528529530531532533534535536537538539540541542543544545546547548549550551552553554555556557558559560561562563564565 |
- import deepEqual from "fast-deep-equal"
- import React, { memo, useEffect, useMemo, useRef, useState } from "react"
- import { useSize } from "react-use"
- import { useExtensionState } from "../../context/ExtensionStateContext"
- import {
- BrowserAction,
- BrowserActionResult,
- ClineMessage,
- ClineSayBrowserAction,
- } from "../../../../src/shared/ExtensionMessage"
- import { vscode } from "../../utils/vscode"
- import CodeBlock, { CODE_BLOCK_BG_COLOR } from "../common/CodeBlock"
- import { ChatRowContent, ProgressIndicator } from "./ChatRow"
- import { VSCodeButton } from "@vscode/webview-ui-toolkit/react"
- interface BrowserSessionRowProps {
- messages: ClineMessage[]
- isExpanded: (messageTs: number) => boolean
- onToggleExpand: (messageTs: number) => void
- lastModifiedMessage?: ClineMessage
- isLast: boolean
- onHeightChange: (isTaller: boolean) => void
- }
- const BrowserSessionRow = memo((props: BrowserSessionRowProps) => {
- const { messages, isLast, onHeightChange, lastModifiedMessage } = props
- const prevHeightRef = useRef(0)
- const [maxActionHeight, setMaxActionHeight] = useState(0)
- const [consoleLogsExpanded, setConsoleLogsExpanded] = useState(false)
- const { browserViewportSize = "900x600" } = useExtensionState()
- const [viewportWidth, viewportHeight] = browserViewportSize.split("x").map(Number)
- const aspectRatio = (viewportHeight / viewportWidth * 100).toFixed(2)
- const defaultMousePosition = `${Math.round(viewportWidth/2)},${Math.round(viewportHeight/2)}`
- const isLastApiReqInterrupted = useMemo(() => {
- // Check if last api_req_started is cancelled
- const lastApiReqStarted = [...messages].reverse().find((m) => m.say === "api_req_started")
- if (lastApiReqStarted?.text != null) {
- const info = JSON.parse(lastApiReqStarted.text)
- if (info.cancelReason != null) {
- return true
- }
- }
- const lastApiReqFailed = isLast && lastModifiedMessage?.ask === "api_req_failed"
- if (lastApiReqFailed) {
- return true
- }
- return false
- }, [messages, lastModifiedMessage, isLast])
- const isBrowsing = useMemo(() => {
- return isLast && messages.some((m) => m.say === "browser_action_result") && !isLastApiReqInterrupted // after user approves, browser_action_result with "" is sent to indicate that the session has started
- }, [isLast, messages, isLastApiReqInterrupted])
- // Organize messages into pages with current state and next action
- const pages = useMemo(() => {
- const result: {
- currentState: {
- url?: string
- screenshot?: string
- mousePosition?: string
- consoleLogs?: string
- messages: ClineMessage[] // messages up to and including the result
- }
- nextAction?: {
- messages: ClineMessage[] // messages leading to next result
- }
- }[] = []
- let currentStateMessages: ClineMessage[] = []
- let nextActionMessages: ClineMessage[] = []
- messages.forEach((message) => {
- if (message.ask === "browser_action_launch") {
- // Start first page
- currentStateMessages = [message]
- } else if (message.say === "browser_action_result") {
- if (message.text === "") {
- // first browser_action_result is an empty string that signals that session has started
- return
- }
- // Complete current state
- currentStateMessages.push(message)
- const resultData = JSON.parse(message.text || "{}") as BrowserActionResult
- // Add page with current state and previous next actions
- result.push({
- currentState: {
- url: resultData.currentUrl,
- screenshot: resultData.screenshot,
- mousePosition: resultData.currentMousePosition,
- consoleLogs: resultData.logs,
- messages: [...currentStateMessages],
- },
- nextAction:
- nextActionMessages.length > 0
- ? {
- messages: [...nextActionMessages],
- }
- : undefined,
- })
- // Reset for next page
- currentStateMessages = []
- nextActionMessages = []
- } else if (
- message.say === "api_req_started" ||
- message.say === "text" ||
- message.say === "browser_action"
- ) {
- // These messages lead to the next result, so they should always go in nextActionMessages
- nextActionMessages.push(message)
- } else {
- // Any other message types
- currentStateMessages.push(message)
- }
- })
- // Add incomplete page if exists
- if (currentStateMessages.length > 0 || nextActionMessages.length > 0) {
- result.push({
- currentState: {
- messages: [...currentStateMessages],
- },
- nextAction:
- nextActionMessages.length > 0
- ? {
- messages: [...nextActionMessages],
- }
- : undefined,
- })
- }
- return result
- }, [messages])
- // Auto-advance to latest page
- const [currentPageIndex, setCurrentPageIndex] = useState(0)
- useEffect(() => {
- setCurrentPageIndex(pages.length - 1)
- }, [pages.length])
- // Get initial URL from launch message
- const initialUrl = useMemo(() => {
- const launchMessage = messages.find((m) => m.ask === "browser_action_launch")
- return launchMessage?.text || ""
- }, [messages])
- // Find the latest available URL and screenshot
- const latestState = useMemo(() => {
- for (let i = pages.length - 1; i >= 0; i--) {
- const page = pages[i]
- if (page.currentState.url || page.currentState.screenshot) {
- return {
- url: page.currentState.url,
- mousePosition: page.currentState.mousePosition,
- consoleLogs: page.currentState.consoleLogs,
- screenshot: page.currentState.screenshot,
- }
- }
- }
- return { url: undefined, mousePosition: undefined, consoleLogs: undefined, screenshot: undefined }
- }, [pages])
- const currentPage = pages[currentPageIndex]
- const isLastPage = currentPageIndex === pages.length - 1
- // Use latest state if we're on the last page and don't have a state yet
- const displayState = isLastPage
- ? {
- url: currentPage?.currentState.url || latestState.url || initialUrl,
- mousePosition: currentPage?.currentState.mousePosition || latestState.mousePosition || defaultMousePosition,
- consoleLogs: currentPage?.currentState.consoleLogs,
- screenshot: currentPage?.currentState.screenshot || latestState.screenshot,
- }
- : {
- url: currentPage?.currentState.url || initialUrl,
- mousePosition: currentPage?.currentState.mousePosition || defaultMousePosition,
- consoleLogs: currentPage?.currentState.consoleLogs,
- screenshot: currentPage?.currentState.screenshot,
- }
- const [actionContent, { height: actionHeight }] = useSize(
- <div>
- {currentPage?.nextAction?.messages.map((message) => (
- <BrowserSessionRowContent
- key={message.ts}
- {...props}
- message={message}
- setMaxActionHeight={setMaxActionHeight}
- />
- ))}
- {!isBrowsing && messages.some((m) => m.say === "browser_action_result") && currentPageIndex === 0 && (
- <BrowserActionBox action={"launch"} text={initialUrl} />
- )}
- </div>,
- )
- useEffect(() => {
- if (actionHeight === 0 || actionHeight === Infinity) {
- return
- }
- if (actionHeight > maxActionHeight) {
- setMaxActionHeight(actionHeight)
- }
- }, [actionHeight, maxActionHeight])
- // Track latest click coordinate
- const latestClickPosition = useMemo(() => {
- if (!isBrowsing) return undefined
- // Look through current page's next actions for the latest browser_action
- const actions = currentPage?.nextAction?.messages || []
- for (let i = actions.length - 1; i >= 0; i--) {
- const message = actions[i]
- if (message.say === "browser_action") {
- const browserAction = JSON.parse(message.text || "{}") as ClineSayBrowserAction
- if (browserAction.action === "click" && browserAction.coordinate) {
- return browserAction.coordinate
- }
- }
- }
- return undefined
- }, [isBrowsing, currentPage?.nextAction?.messages])
- // Use latest click position while browsing, otherwise use display state
- const mousePosition = isBrowsing ? latestClickPosition || displayState.mousePosition : displayState.mousePosition || defaultMousePosition
- const [browserSessionRow, { height: rowHeight }] = useSize(
- <div style={{ padding: "10px 6px 10px 15px", marginBottom: -10 }}>
- <div style={{ display: "flex", alignItems: "center", gap: "10px", marginBottom: "10px" }}>
- {isBrowsing ? (
- <ProgressIndicator />
- ) : (
- <span
- className={`codicon codicon-inspect`}
- style={{ color: "var(--vscode-foreground)", marginBottom: "-1.5px" }}></span>
- )}
- <span style={{ fontWeight: "bold" }}>
- <>Cline wants to use the browser:</>
- </span>
- </div>
- <div
- style={{
- borderRadius: 3,
- border: "1px solid var(--vscode-editorGroup-border)",
- overflow: "hidden",
- backgroundColor: CODE_BLOCK_BG_COLOR,
- marginBottom: 10,
- }}>
- {/* URL Bar */}
- <div
- style={{
- margin: "5px auto",
- width: "calc(100% - 10px)",
- boxSizing: "border-box", // includes padding in width calculation
- backgroundColor: "var(--vscode-input-background)",
- border: "1px solid var(--vscode-input-border)",
- borderRadius: "4px",
- padding: "3px 5px",
- display: "flex",
- alignItems: "center",
- justifyContent: "center",
- color: displayState.url
- ? "var(--vscode-input-foreground)"
- : "var(--vscode-descriptionForeground)",
- fontSize: "12px",
- }}>
- <div
- style={{
- textOverflow: "ellipsis",
- overflow: "hidden",
- whiteSpace: "nowrap",
- width: "100%",
- textAlign: "center",
- }}>
- {displayState.url || "http"}
- </div>
- </div>
- {/* Screenshot Area */}
- <div
- data-testid="screenshot-container"
- style={{
- width: "100%",
- paddingBottom: `${aspectRatio}%`, // height/width ratio
- position: "relative",
- backgroundColor: "var(--vscode-input-background)",
- }}>
- {displayState.screenshot ? (
- <img
- src={displayState.screenshot}
- alt="Browser screenshot"
- style={{
- position: "absolute",
- top: 0,
- left: 0,
- width: "100%",
- height: "100%",
- objectFit: "contain",
- cursor: "pointer",
- }}
- onClick={() =>
- vscode.postMessage({
- type: "openImage",
- text: displayState.screenshot,
- })
- }
- />
- ) : (
- <div
- style={{
- position: "absolute",
- top: "50%",
- left: "50%",
- transform: "translate(-50%, -50%)",
- }}>
- <span
- className="codicon codicon-globe"
- style={{ fontSize: "80px", color: "var(--vscode-descriptionForeground)" }}
- />
- </div>
- )}
- {displayState.mousePosition && (
- <BrowserCursor
- style={{
- position: "absolute",
- top: `${(parseInt(mousePosition.split(",")[1]) / viewportHeight) * 100}%`,
- left: `${(parseInt(mousePosition.split(",")[0]) / viewportWidth) * 100}%`,
- transition: "top 0.3s ease-out, left 0.3s ease-out",
- }}
- />
- )}
- </div>
- <div style={{ width: "100%" }}>
- <div
- onClick={() => {
- setConsoleLogsExpanded(!consoleLogsExpanded)
- }}
- style={{
- display: "flex",
- alignItems: "center",
- gap: "4px",
- width: "100%",
- justifyContent: "flex-start",
- cursor: "pointer",
- padding: `9px 8px ${consoleLogsExpanded ? 0 : 8}px 8px`,
- }}>
- <span className={`codicon codicon-chevron-${consoleLogsExpanded ? "down" : "right"}`}></span>
- <span style={{ fontSize: "0.8em" }}>Console Logs</span>
- </div>
- {consoleLogsExpanded && (
- <CodeBlock source={`${"```"}shell\n${displayState.consoleLogs || "(No new logs)"}\n${"```"}`} />
- )}
- </div>
- </div>
- {/* Action content with min height */}
- <div style={{ minHeight: maxActionHeight }}>{actionContent}</div>
- {/* Pagination moved to bottom */}
- {pages.length > 1 && (
- <div
- style={{
- display: "flex",
- justifyContent: "space-between",
- alignItems: "center",
- padding: "8px 0px",
- marginTop: "15px",
- borderTop: "1px solid var(--vscode-editorGroup-border)",
- }}>
- <div>
- Step {currentPageIndex + 1} of {pages.length}
- </div>
- <div style={{ display: "flex", gap: "4px" }}>
- <VSCodeButton
- disabled={currentPageIndex === 0 || isBrowsing}
- onClick={() => setCurrentPageIndex((i) => i - 1)}>
- Previous
- </VSCodeButton>
- <VSCodeButton
- disabled={currentPageIndex === pages.length - 1 || isBrowsing}
- onClick={() => setCurrentPageIndex((i) => i + 1)}>
- Next
- </VSCodeButton>
- </div>
- </div>
- )}
- </div>,
- )
- // Height change effect
- useEffect(() => {
- const isInitialRender = prevHeightRef.current === 0
- if (isLast && rowHeight !== 0 && rowHeight !== Infinity && rowHeight !== prevHeightRef.current) {
- if (!isInitialRender) {
- onHeightChange(rowHeight > prevHeightRef.current)
- }
- prevHeightRef.current = rowHeight
- }
- }, [rowHeight, isLast, onHeightChange])
- return browserSessionRow
- }, deepEqual)
- interface BrowserSessionRowContentProps extends Omit<BrowserSessionRowProps, "messages"> {
- message: ClineMessage
- setMaxActionHeight: (height: number) => void
- }
- const BrowserSessionRowContent = ({
- message,
- isExpanded,
- onToggleExpand,
- lastModifiedMessage,
- isLast,
- setMaxActionHeight,
- }: BrowserSessionRowContentProps) => {
- const headerStyle: React.CSSProperties = {
- display: "flex",
- alignItems: "center",
- gap: "10px",
- marginBottom: "10px",
- }
- switch (message.type) {
- case "say":
- switch (message.say) {
- case "api_req_started":
- case "text":
- return (
- <div style={{ padding: "10px 0 10px 0" }}>
- <ChatRowContent
- message={message}
- isExpanded={isExpanded(message.ts)}
- onToggleExpand={() => {
- if (message.say === "api_req_started") {
- setMaxActionHeight(0)
- }
- onToggleExpand(message.ts)
- }}
- lastModifiedMessage={lastModifiedMessage}
- isLast={isLast}
- />
- </div>
- )
- case "browser_action":
- const browserAction = JSON.parse(message.text || "{}") as ClineSayBrowserAction
- return (
- <BrowserActionBox
- action={browserAction.action}
- coordinate={browserAction.coordinate}
- text={browserAction.text}
- />
- )
- default:
- return null
- }
- case "ask":
- switch (message.ask) {
- case "browser_action_launch":
- return (
- <>
- <div style={headerStyle}>
- <span style={{ fontWeight: "bold" }}>Browser Session Started</span>
- </div>
- <div
- style={{
- borderRadius: 3,
- border: "1px solid var(--vscode-editorGroup-border)",
- overflow: "hidden",
- backgroundColor: CODE_BLOCK_BG_COLOR,
- }}>
- <CodeBlock source={`${"```"}shell\n${message.text}\n${"```"}`} forceWrap={true} />
- </div>
- </>
- )
- default:
- return null
- }
- }
- }
- const BrowserActionBox = ({
- action,
- coordinate,
- text,
- }: {
- action: BrowserAction
- coordinate?: string
- text?: string
- }) => {
- const getBrowserActionText = (action: BrowserAction, coordinate?: string, text?: string) => {
- switch (action) {
- case "launch":
- return `Launch browser at ${text}`
- case "click":
- return `Click (${coordinate?.replace(",", ", ")})`
- case "type":
- return `Type "${text}"`
- case "scroll_down":
- return "Scroll down"
- case "scroll_up":
- return "Scroll up"
- case "close":
- return "Close browser"
- default:
- return action
- }
- }
- return (
- <div style={{ padding: "10px 0 0 0" }}>
- <div
- style={{
- borderRadius: 3,
- backgroundColor: CODE_BLOCK_BG_COLOR,
- overflow: "hidden",
- border: "1px solid var(--vscode-editorGroup-border)",
- }}>
- <div
- style={{
- display: "flex",
- alignItems: "center",
- padding: "9px 10px",
- }}>
- <span
- style={{
- whiteSpace: "normal",
- wordBreak: "break-word",
- }}>
- <span style={{ fontWeight: 500 }}>Browse Action: </span>
- {getBrowserActionText(action, coordinate, text)}
- </span>
- </div>
- </div>
- </div>
- )
- }
- const BrowserCursor: React.FC<{ style?: React.CSSProperties }> = ({ style }) => {
- // (can't use svgs in vsc extensions)
- const cursorBase64 =
- ""
- return (
- <img
- src={cursorBase64}
- style={{
- width: "17px",
- height: "22px",
- ...style,
- }}
- alt="cursor"
- aria-label="cursor"
- />
- )
- }
- export default BrowserSessionRow
|