Loading...
Loading...
Browser automation using the agent-browser CLI. Use when the user asks to browse websites, open webpages, interact with page elements, take screenshots, fill forms, click buttons, scrape content, or automate browser tasks.
npx skill4agent add linuxlewis/agent-skills agent-browser
agent-browser
npm install -g agent-browser
agent-browser install # Install browser binaries
# Navigate to a URL
agent-browser open https://example.com
# Get accessibility snapshot (shows refs like @e1, @e2)
agent-browser snapshot -i
# Click using ref from snapshot
agent-browser click @e2
# Type into an element
agent-browser fill @e3 "hello world"
# Take screenshot
agent-browser screenshot output.png
agent-browser open <url> # Navigate to URL
agent-browser back # Go back
agent-browser forward # Go forward
agent-browser reload # Reload page
agent-browser click <sel> # Click element (or @ref)
agent-browser fill <sel> <text> # Clear and fill
agent-browser press <key> # Press key (Enter, Tab, etc.)
agent-browser select <sel> <val> # Select dropdown option
agent-browser snapshot # Accessibility tree with refs
agent-browser snapshot -i # Interactive elements only
agent-browser get text <sel> # Get element text
agent-browser get url # Get current URL
agent-browser screenshot [path] # Take screenshot
agent-browser screenshot --full # Full page screenshot
agent-browser pdf <path> # Save as PDF
agent-browser --session myproject open https://example.com
agent-browser --session myproject snapshot
agent-browser --session myproject click @e1
@e1, @e2
#id, .class, div > span
text=Submit
role=button[name="Submit"]
@e1
wait