npx skills add https://github.com/shipshitdev/library --skill agent-browser
agent-browser open <url> # 导航到页面
agent-browser snapshot -i # 获取带有引用标识的交互元素
agent-browser click @e1 # 通过引用标识点击元素
agent-browser fill @e2 "text" # 通过引用标识填写输入框
agent-browser close # 关闭浏览器
agent-browser open <url>
agent-browser snapshot -i # 返回带有 @e1、@e2 等引用标识的元素
agent-browser open <url> # 导航到 URL
agent-browser back # 后退
agent-browser forward # 前进
agent-browser reload # 重新加载页面
agent-browser close # 关闭浏览器
广告位招租
在这里展示您的产品或服务
触达数万 AI 开发者,精准高效
agent-browser snapshot # 完整的无障碍功能树
agent-browser snapshot -i # 仅交互元素(推荐)
agent-browser snapshot -c # 紧凑输出
agent-browser snapshot -d 3 # 限制深度为 3
agent-browser snapshot -s "#main" # 限定到 CSS 选择器范围
agent-browser click @e1 # 点击
agent-browser dblclick @e1 # 双击
agent-browser focus @e1 # 聚焦元素
agent-browser fill @e2 "text" # 清空并输入
agent-browser type @e2 "text" # 输入(不清空)
agent-browser press Enter # 按键
agent-browser press Control+a # 组合键
agent-browser keydown Shift # 按下按键
agent-browser keyup Shift # 释放按键
agent-browser hover @e1 # 悬停
agent-browser check @e1 # 勾选复选框
agent-browser uncheck @e1 # 取消勾选复选框
agent-browser select @e1 "value" # 选择下拉框选项
agent-browser scroll down 500 # 滚动页面
agent-browser scrollintoview @e1 # 将元素滚动到视图中
agent-browser drag @e1 @e2 # 拖放
agent-browser upload @e1 file.pdf # 上传文件
agent-browser get text @e1 # 获取元素文本
agent-browser get html @e1 # 获取 innerHTML
agent-browser get value @e1 # 获取输入框值
agent-browser get attr @e1 href # 获取属性
agent-browser get title # 获取页面标题
agent-browser get url # 获取当前 URL
agent-browser get count ".item" # 统计匹配元素数量
agent-browser get box @e1 # 获取边界框
agent-browser is visible @e1 # 检查是否可见
agent-browser is enabled @e1 # 检查是否启用
agent-browser is checked @e1 # 检查是否已勾选
agent-browser screenshot # 截图到标准输出
agent-browser screenshot path.png # 保存到文件
agent-browser screenshot --full # 完整页面截图
agent-browser pdf output.pdf # 保存为 PDF
agent-browser record start ./demo.webm # 开始录制
agent-browser click @e1 # 执行操作
agent-browser record stop # 停止并保存视频
agent-browser record restart ./take2.webm # 停止当前录制并开始新的录制
agent-browser wait @e1 # 等待元素出现
agent-browser wait 2000 # 等待毫秒数
agent-browser wait --text "Success" # 等待文本出现
agent-browser wait --url "**/dashboard" # 等待 URL 模式匹配
agent-browser wait --load networkidle # 等待网络空闲
agent-browser wait --fn "window.ready" # 等待 JavaScript 条件满足
agent-browser mouse move 100 200 # 移动鼠标
agent-browser mouse down left # 按下鼠标按钮
agent-browser mouse up left # 释放鼠标按钮
agent-browser mouse wheel 100 # 滚动鼠标滚轮
agent-browser find role button click --name "Submit"
agent-browser find text "Sign In" click
agent-browser find label "Email" fill "user@test.com"
agent-browser find first ".item" click
agent-browser find nth 2 "a" text
agent-browser set viewport 1920 1080 # 设置视口大小
agent-browser set device "iPhone 14" # 模拟设备
agent-browser set geo 37.7749 -122.4194 # 设置地理位置
agent-browser set offline on # 切换离线模式
agent-browser set headers '{"X-Key":"v"}' # 额外的 HTTP 请求头
agent-browser set credentials user pass # HTTP 基本认证
agent-browser set media dark # 模拟配色方案
agent-browser cookies # 获取所有 Cookie
agent-browser cookies set name value # 设置 Cookie
agent-browser cookies clear # 清除 Cookie
agent-browser storage local # 获取所有 localStorage
agent-browser storage local key # 获取特定键值
agent-browser storage local set k v # 设置值
agent-browser storage local clear # 清除所有
agent-browser network route <url> # 拦截请求
agent-browser network route <url> --abort # 阻止请求
agent-browser network route <url> --body '{}' # 模拟响应
agent-browser network unroute [url] # 移除路由规则
agent-browser network requests # 查看已跟踪的请求
agent-browser network requests --filter api # 过滤请求
agent-browser tab # 列出标签页
agent-browser tab new [url] # 新建标签页
agent-browser tab 2 # 切换到标签页
agent-browser tab close # 关闭标签页
agent-browser window new # 新建窗口
agent-browser frame "#iframe" # 切换到 iframe
agent-browser frame main # 返回主框架
agent-browser dialog accept [text] # 接受对话框
agent-browser dialog dismiss # 关闭对话框
agent-browser eval "document.title" # 运行 JavaScript
agent-browser --session test1 open site-a.com
agent-browser --session test2 open site-b.com
agent-browser session list
添加 --json 参数以获取机器可读的输出:
agent-browser snapshot -i --json
agent-browser get text @e1 --json
agent-browser open example.com --headed # 显示浏览器窗口
agent-browser console # 查看控制台消息
agent-browser console --clear # 清除控制台
agent-browser errors # 查看页面错误
agent-browser errors --clear # 清除错误
agent-browser highlight @e1 # 高亮显示元素
agent-browser trace start # 开始录制跟踪信息
agent-browser trace stop trace.zip # 停止并保存跟踪信息
agent-browser --cdp 9222 snapshot # 通过 CDP 连接
agent-browser open https://app.example.com/signup
agent-browser snapshot -i
# 测试空提交
agent-browser click @e5 # 提交按钮
agent-browser snapshot -i # 检查错误信息
# 测试无效邮箱
agent-browser fill @e1 "invalid-email"
agent-browser click @e5
agent-browser get text @e1 # 检查错误
# 测试有效提交
agent-browser fill @e1 "valid@email.com"
agent-browser fill @e2 "ValidPass123!"
agent-browser click @e5
agent-browser wait --url "**/dashboard"
agent-browser open https://app.example.com
agent-browser set viewport 1920 1080
agent-browser screenshot desktop.png --full
agent-browser set device "iPhone 14"
agent-browser reload
agent-browser screenshot mobile.png --full
# 登录
agent-browser open https://app.example.com/login
agent-browser snapshot -i
agent-browser fill @e1 "testuser"
agent-browser fill @e2 "testpass"
agent-browser click @e3
agent-browser wait --url "**/dashboard"
# 保存认证状态以便复用
agent-browser state save auth.json
# 在新会话中加载状态
agent-browser state load auth.json
agent-browser open https://app.example.com/protected
agent-browser open https://shop.example.com/cart
agent-browser snapshot -i
# 步骤 1:购物车
agent-browser click @e3 # 进入结账流程
# 步骤 2:配送信息
agent-browser wait @e1
agent-browser snapshot -i
agent-browser fill @e1 "123 Test St"
agent-browser fill @e2 "Test City"
agent-browser select @e3 "CA"
agent-browser fill @e4 "90210"
agent-browser click @e5 # 继续
# 步骤 3:支付信息
agent-browser wait --text "Payment"
agent-browser snapshot -i
agent-browser fill @e1 "4111111111111111"
agent-browser fill @e2 "12/28"
agent-browser fill @e3 "123"
agent-browser click @e4 # 下订单
agent-browser wait --text "Order confirmed"
agent-browser screenshot order-confirmation.png
# 模拟返回空数据的 API 响应
agent-browser network route "**/api/data" --body '{"items":[]}'
agent-browser open https://app.example.com
agent-browser snapshot -i # 验证空状态 UI
# 阻止外部分析
agent-browser network route "**/analytics/**" --abort
完整命令文档请参阅 references/commands.md。
每周安装量
92
代码仓库
GitHub 星标数
16
首次出现
2026年1月20日
安全审计
已安装于
codex 74
opencode 71
gemini-cli 70
cursor 70
github-copilot 64
claude-code 56
agent-browser open <url> # Navigate to page
agent-browser snapshot -i # Get interactive elements with refs
agent-browser click @e1 # Click element by ref
agent-browser fill @e2 "text" # Fill input by ref
agent-browser close # Close browser
agent-browser open <url>
agent-browser snapshot -i # Returns elements with refs like @e1, @e2
agent-browser open <url> # Navigate to URL
agent-browser back # Go back
agent-browser forward # Go forward
agent-browser reload # Reload page
agent-browser close # Close browser
agent-browser snapshot # Full accessibility tree
agent-browser snapshot -i # Interactive elements only (recommended)
agent-browser snapshot -c # Compact output
agent-browser snapshot -d 3 # Limit depth to 3
agent-browser snapshot -s "#main" # Scope to CSS selector
agent-browser click @e1 # Click
agent-browser dblclick @e1 # Double-click
agent-browser focus @e1 # Focus element
agent-browser fill @e2 "text" # Clear and type
agent-browser type @e2 "text" # Type without clearing
agent-browser press Enter # Press key
agent-browser press Control+a # Key combination
agent-browser keydown Shift # Hold key down
agent-browser keyup Shift # Release key
agent-browser hover @e1 # Hover
agent-browser check @e1 # Check checkbox
agent-browser uncheck @e1 # Uncheck checkbox
agent-browser select @e1 "value" # Select dropdown
agent-browser scroll down 500 # Scroll page
agent-browser scrollintoview @e1 # Scroll element into view
agent-browser drag @e1 @e2 # Drag and drop
agent-browser upload @e1 file.pdf # Upload files
agent-browser get text @e1 # Get element text
agent-browser get html @e1 # Get innerHTML
agent-browser get value @e1 # Get input value
agent-browser get attr @e1 href # Get attribute
agent-browser get title # Get page title
agent-browser get url # Get current URL
agent-browser get count ".item" # Count matching elements
agent-browser get box @e1 # Get bounding box
agent-browser is visible @e1 # Check if visible
agent-browser is enabled @e1 # Check if enabled
agent-browser is checked @e1 # Check if checked
agent-browser screenshot # Screenshot to stdout
agent-browser screenshot path.png # Save to file
agent-browser screenshot --full # Full page
agent-browser pdf output.pdf # Save as PDF
agent-browser record start ./demo.webm # Start recording
agent-browser click @e1 # Perform actions
agent-browser record stop # Stop and save video
agent-browser record restart ./take2.webm # Stop current + start new
agent-browser wait @e1 # Wait for element
agent-browser wait 2000 # Wait milliseconds
agent-browser wait --text "Success" # Wait for text
agent-browser wait --url "**/dashboard" # Wait for URL pattern
agent-browser wait --load networkidle # Wait for network idle
agent-browser wait --fn "window.ready" # Wait for JS condition
agent-browser mouse move 100 200 # Move mouse
agent-browser mouse down left # Press button
agent-browser mouse up left # Release button
agent-browser mouse wheel 100 # Scroll wheel
agent-browser find role button click --name "Submit"
agent-browser find text "Sign In" click
agent-browser find label "Email" fill "user@test.com"
agent-browser find first ".item" click
agent-browser find nth 2 "a" text
agent-browser set viewport 1920 1080 # Set viewport size
agent-browser set device "iPhone 14" # Emulate device
agent-browser set geo 37.7749 -122.4194 # Set geolocation
agent-browser set offline on # Toggle offline mode
agent-browser set headers '{"X-Key":"v"}' # Extra HTTP headers
agent-browser set credentials user pass # HTTP basic auth
agent-browser set media dark # Emulate color scheme
agent-browser cookies # Get all cookies
agent-browser cookies set name value # Set cookie
agent-browser cookies clear # Clear cookies
agent-browser storage local # Get all localStorage
agent-browser storage local key # Get specific key
agent-browser storage local set k v # Set value
agent-browser storage local clear # Clear all
agent-browser network route <url> # Intercept requests
agent-browser network route <url> --abort # Block requests
agent-browser network route <url> --body '{}' # Mock response
agent-browser network unroute [url] # Remove routes
agent-browser network requests # View tracked requests
agent-browser network requests --filter api # Filter requests
agent-browser tab # List tabs
agent-browser tab new [url] # New tab
agent-browser tab 2 # Switch to tab
agent-browser tab close # Close tab
agent-browser window new # New window
agent-browser frame "#iframe" # Switch to iframe
agent-browser frame main # Back to main frame
agent-browser dialog accept [text] # Accept dialog
agent-browser dialog dismiss # Dismiss dialog
agent-browser eval "document.title" # Run JavaScript
agent-browser --session test1 open site-a.com
agent-browser --session test2 open site-b.com
agent-browser session list
Add --json for machine-readable output:
agent-browser snapshot -i --json
agent-browser get text @e1 --json
agent-browser open example.com --headed # Show browser window
agent-browser console # View console messages
agent-browser console --clear # Clear console
agent-browser errors # View page errors
agent-browser errors --clear # Clear errors
agent-browser highlight @e1 # Highlight element
agent-browser trace start # Start recording trace
agent-browser trace stop trace.zip # Stop and save trace
agent-browser --cdp 9222 snapshot # Connect via CDP
agent-browser open https://app.example.com/signup
agent-browser snapshot -i
# Test empty submission
agent-browser click @e5 # Submit button
agent-browser snapshot -i # Check for error messages
# Test invalid email
agent-browser fill @e1 "invalid-email"
agent-browser click @e5
agent-browser get text @e1 # Check error
# Test valid submission
agent-browser fill @e1 "valid@email.com"
agent-browser fill @e2 "ValidPass123!"
agent-browser click @e5
agent-browser wait --url "**/dashboard"
agent-browser open https://app.example.com
agent-browser set viewport 1920 1080
agent-browser screenshot desktop.png --full
agent-browser set device "iPhone 14"
agent-browser reload
agent-browser screenshot mobile.png --full
# Login
agent-browser open https://app.example.com/login
agent-browser snapshot -i
agent-browser fill @e1 "testuser"
agent-browser fill @e2 "testpass"
agent-browser click @e3
agent-browser wait --url "**/dashboard"
# Save auth state for reuse
agent-browser state save auth.json
# Load state in new session
agent-browser state load auth.json
agent-browser open https://app.example.com/protected
agent-browser open https://shop.example.com/cart
agent-browser snapshot -i
# Step 1: Cart
agent-browser click @e3 # Proceed to checkout
# Step 2: Shipping
agent-browser wait @e1
agent-browser snapshot -i
agent-browser fill @e1 "123 Test St"
agent-browser fill @e2 "Test City"
agent-browser select @e3 "CA"
agent-browser fill @e4 "90210"
agent-browser click @e5 # Continue
# Step 3: Payment
agent-browser wait --text "Payment"
agent-browser snapshot -i
agent-browser fill @e1 "4111111111111111"
agent-browser fill @e2 "12/28"
agent-browser fill @e3 "123"
agent-browser click @e4 # Place order
agent-browser wait --text "Order confirmed"
agent-browser screenshot order-confirmation.png
# Mock an empty API response
agent-browser network route "**/api/data" --body '{"items":[]}'
agent-browser open https://app.example.com
agent-browser snapshot -i # Verify empty state UI
# Block external analytics
agent-browser network route "**/analytics/**" --abort
See references/commands.md for full command documentation.
Weekly Installs
92
Repository
GitHub Stars
16
First Seen
Jan 20, 2026
Security Audits
Gen Agent Trust Hub: Warn · Socket: Pass · Snyk: Fail
Installed on
codex 74
opencode 71
gemini-cli 70
cursor 70
github-copilot 64
claude-code 56
Skills CLI 使用指南:AI Agent 技能包管理器安装与管理教程
43,100 周安装