mirror of
https://github.com/browser-use/browser-use
synced 2026-04-22 17:45:09 +02:00
252 lines
9.8 KiB
JSON
{
|
|
"$schema": "https://github.com/anthropics/dxt/blob/main/dist/dxt-manifest.schema.json",
|
|
"dxt_version": "0.1",
|
|
"name": "browser-use",
|
|
"display_name": "Browser-Use AI Browser Automation",
|
|
"version": "0.5.0",
|
|
"description": "AI-powered browser automation that lets Claude control web browsers to complete tasks autonomously",
|
|
"long_description": "Browser-Use is a powerful extension that enables Claude to control real web browsers through an AI agent. It can navigate websites, fill forms, extract data, and perform complex multi-step tasks autonomously. Perfect for web scraping, testing, research, and automation workflows.\n\n### Key Features:\n- **Autonomous AI Agent**: High-level task execution with minimal supervision\n- **Direct Browser Control**: Navigate, click, type, and interact with any website\n- **Content Extraction**: Smart extraction of structured data from web pages\n- **Tab Management**: Handle multiple tabs and complex workflows\n- **Vision Capabilities**: Use screenshots for visual understanding\n- **Security Features**: Domain restrictions and sandboxed execution\n\n### Use Cases:\n- Web scraping and data extraction\n- Automated testing and QA\n- Research and information gathering\n- Form filling and submissions\n- Multi-step workflow automation",
|
|
"icon": "icon.png",
|
|
"homepage": "https://browser-use.com",
|
|
"documentation": "https://docs.browser-use.com",
|
|
"repository": {
|
|
"type": "git",
|
|
"url": "https://github.com/browser-use/browser-use"
|
|
},
|
|
"support": "https://github.com/browser-use/browser-use/issues",
|
|
"author": {
|
|
"name": "Browser-Use Team",
|
|
"email": "support@browser-use.com",
|
|
"url": "https://browser-use.com"
|
|
},
|
|
"server": {
|
|
"type": "python",
|
|
"entry_point": "python",
|
|
"mcp_config": {
|
|
"command": "uvx",
|
|
"args": ["browser-use", "--mcp"],
|
|
"env": {
|
|
"OPENAI_API_KEY": "${user_config.openai_api_key}",
|
|
"ANTHROPIC_API_KEY": "${user_config.anthropic_api_key}",
|
|
"BROWSER_USE_HEADLESS": "${user_config.headless}",
|
|
"BROWSER_USE_ALLOWED_DOMAINS": "${user_config.allowed_domains}",
|
|
"BROWSER_USE_LLM_MODEL": "${user_config.llm_model}"
|
|
}
|
|
}
|
|
},
|
|
"tools": [
|
|
{
|
|
"name": "retry_with_browser_use_agent",
|
|
"description": "Execute a high-level task using the AI browser agent. Best for complex multi-step workflows"
|
|
},
|
|
{
|
|
"name": "browser_navigate",
|
|
"description": "Navigate to a URL in the current tab or open a new tab. Example: Navigate to https://example.com"
|
|
},
|
|
{
|
|
"name": "browser_click",
|
|
"description": "Click on an element by its index from browser_get_state. Supports opening links in new tabs"
|
|
},
|
|
{
|
|
"name": "browser_type",
|
|
"description": "Type text into an input field identified by its index. Use after browser_get_state to find inputs"
|
|
},
|
|
{
|
|
"name": "browser_get_state",
|
|
"description": "Get the current page state including all interactive elements with their indices. Essential for interaction"
|
|
},
|
|
{
|
|
"name": "browser_extract_content",
|
|
"description": "Extract structured content from the page using AI. Perfect for scraping specific information"
|
|
},
|
|
{
|
|
"name": "browser_scroll",
|
|
"description": "Scroll the page up or down by one viewport height"
|
|
},
|
|
{
|
|
"name": "browser_go_back",
|
|
"description": "Navigate back to the previous page in browser history"
|
|
},
|
|
{
|
|
"name": "browser_list_tabs",
|
|
"description": "List all open browser tabs with their URLs and titles"
|
|
},
|
|
{
|
|
"name": "browser_switch_tab",
|
|
"description": "Switch to a different tab by its index"
|
|
},
|
|
{
|
|
"name": "browser_close_tab",
|
|
"description": "Close a specific tab by its index"
|
|
}
|
|
],
|
|
"prompts": [
|
|
{
|
|
"name": "scrape_data",
|
|
"description": "Extract structured data from a website",
|
|
"text": "Use browser_navigate to go to {url}, then use browser_extract_content to extract {data_type}. If the page requires interaction, use browser_get_state to find elements and browser_click/browser_type as needed."
|
|
},
|
|
{
|
|
"name": "fill_form",
|
|
"description": "Fill out and submit a web form",
|
|
"text": "Navigate to {url}, use browser_get_state to identify form fields, then use browser_type to fill in: {field_data}. Finally, click the submit button."
|
|
},
|
|
{
|
|
"name": "multi_step_task",
|
|
"description": "Execute a complex multi-step task",
|
|
"text": "Use retry_with_browser_use_agent with task: '{task_description}'. Set max_steps based on complexity and use_vision=true for better understanding."
|
|
},
|
|
{
|
|
"name": "research_topic",
|
|
"description": "Research a topic across multiple websites",
|
|
"text": "Open multiple tabs using browser_navigate with new_tab=true for sites: {sites}. Use browser_extract_content on each to gather information about {topic}. Switch between tabs with browser_switch_tab."
|
|
}
|
|
],
|
|
"keywords": ["browser", "automation", "web-scraping", "testing", "ai-agent", "playwright", "selenium-alternative", "rpa", "web-automation", "mcp", "browser-use"],
|
|
"license": "MIT",
|
|
"user_config": {
|
|
"workspace_directory": {
|
|
"type": "directory",
|
|
"title": "Workspace Directory",
|
|
"description": "Directory to use as workspace for downloads and file operations",
|
|
"default": "${HOME}/.config/browseruse/workspace",
|
|
"required": false
|
|
},
|
|
"headless": {
|
|
"type": "boolean",
|
|
"title": "Headless Mode",
|
|
"description": "Run browser without GUI (faster but no visual feedback). Set to false to see the browser in action",
|
|
"default": false,
|
|
"required": false
|
|
},
|
|
"stealth": {
|
|
"type": "boolean",
|
|
"title": "Stealth Mode",
|
|
"description": "Use stealth mode to avoid detection by anti-bot systems",
|
|
"default": false,
|
|
"required": false
|
|
},
|
|
"user_data_dir": {
|
|
"type": "directory",
|
|
"title": "User Data Directory",
|
|
"description": "Chrome profile directory for persistent sessions (cookies, localStorage, etc.)",
|
|
"default": "${HOME}/.config/browseruse/profiles/default",
|
|
"required": false
|
|
},
|
|
"openai_api_key": {
|
|
"type": "string",
|
|
"title": "OpenAI API Key",
|
|
"description": "API key for OpenAI models (used by browser agent for content extraction). Get one at https://platform.openai.com",
|
|
"default": "",
|
|
"required": false,
|
|
"sensitive": true
|
|
},
|
|
"anthropic_api_key": {
|
|
"type": "string",
|
|
"title": "Anthropic API Key",
|
|
"description": "API key for Anthropic Claude models (alternative to OpenAI). Get one at https://console.anthropic.com",
|
|
"default": "",
|
|
"required": false,
|
|
"sensitive": true
|
|
},
|
|
"llm_model": {
|
|
"type": "string",
|
|
"title": "LLM Model",
|
|
"description": "Which AI model to use for browser agent tasks",
|
|
"enum": ["gpt-4o", "gpt-4o-mini", "claude-3-opus-20240229", "claude-3-sonnet-20240229"],
|
|
"default": "gpt-4o-mini",
|
|
"required": false
|
|
},
|
|
"llm_endpoint": {
|
|
"type": "string",
|
|
"title": "LLM API Endpoint",
|
|
"description": "Custom API endpoint for LLM (e.g., for Azure OpenAI or self-hosted models)",
|
|
"default": "",
|
|
"required": false
|
|
},
|
|
"use_vision": {
|
|
"type": "boolean",
|
|
"title": "Use Vision",
|
|
"description": "Enable vision capabilities for the agent to understand page content via screenshots",
|
|
"default": true,
|
|
"required": false
|
|
},
|
|
"disable_security": {
|
|
"type": "boolean",
|
|
"title": "Disable Security",
|
|
"description": "Disable browser security features (CORS, CSP, etc.). Use with caution",
|
|
"default": false,
|
|
"required": false
|
|
},
|
|
"deterministic_rendering": {
|
|
"type": "boolean",
|
|
"title": "Deterministic Rendering",
|
|
"description": "Force deterministic rendering for consistent screenshots. May break some sites",
|
|
"default": false,
|
|
"required": false
|
|
},
|
|
"viewport_expansion": {
|
|
"type": "number",
|
|
"title": "Viewport Expansion",
|
|
"description": "Extra pixels to expand viewport for better LLM context understanding",
|
|
"default": 500,
|
|
"minimum": 0,
|
|
"maximum": 2000,
|
|
"required": false
|
|
},
|
|
"allowed_domains": {
|
|
"type": "string",
|
|
"title": "Allowed Domains",
|
|
"description": "Comma-separated list of domains the browser can access (e.g., 'example.com,*.google.com'). Leave empty for no restrictions",
|
|
"default": "",
|
|
"required": false
|
|
},
|
|
"sensitive_data_masking": {
|
|
"type": "boolean",
|
|
"title": "Sensitive Data Masking",
|
|
"description": "Mask sensitive data (passwords, credit cards) in screenshots and logs",
|
|
"default": true,
|
|
"required": false
|
|
},
|
|
"browser_type": {
|
|
"type": "string",
|
|
"title": "Browser Type",
|
|
"description": "Which browser engine to use",
|
|
"enum": ["chromium", "firefox", "webkit"],
|
|
"default": "chromium",
|
|
"required": false
|
|
},
|
|
"default_timeout": {
|
|
"type": "number",
|
|
"title": "Default Timeout (ms)",
|
|
"description": "Default timeout for browser operations in milliseconds",
|
|
"default": 30000,
|
|
"minimum": 1000,
|
|
"maximum": 300000,
|
|
"required": false
|
|
},
|
|
"wait_between_actions": {
|
|
"type": "number",
|
|
"title": "Wait Between Actions (seconds)",
|
|
"description": "Time to wait between browser actions for stability",
|
|
"default": 0.5,
|
|
"minimum": 0,
|
|
"maximum": 10,
|
|
"required": false
|
|
},
|
|
"max_steps": {
|
|
"type": "number",
|
|
"title": "Max Agent Steps",
|
|
"description": "Maximum number of steps the agent can take in a single task",
|
|
"default": 100,
|
|
"minimum": 1,
|
|
"maximum": 1000,
|
|
"required": false
|
|
}
|
|
},
|
|
"compatibility": {
|
|
"claude_desktop": ">=0.10.0",
|
|
"platforms": ["darwin", "win32", "linux"]
|
|
}
|
|
}
|