browser-use
diff --git a/‎.gitignore‎
Lines changed: 9 additions & 0 deletions b/‎.gitignore‎
Lines changed: 9 additions & 0 deletions
diff --git a/‎.vscode/settings.json‎
Lines changed: 6 additions & 0 deletions b/‎.vscode/settings.json‎
Lines changed: 6 additions & 0 deletions
diff --git a/‎cli/__init__.py‎
Lines changed: 3 additions & 0 deletions b/‎cli/__init__.py‎
Lines changed: 3 additions & 0 deletions
diff --git a/‎cli/browser-tasks-example.ts‎
Lines changed: 181 additions & 0 deletions b/‎cli/browser-tasks-example.ts‎
Lines changed: 181 additions & 0 deletions
diff --git a/‎cli/browser-use‎
Lines changed: 20 additions & 0 deletions b/‎cli/browser-use‎
Lines changed: 20 additions & 0 deletions
diff --git a/‎cli/browser-use.toolchain.json‎
Lines changed: 50 additions & 0 deletions b/‎cli/browser-use.toolchain.json‎
Lines changed: 50 additions & 0 deletions
@@ -184,3 +184,12 @@ AgentHistoryList.json
 
 # For Docker
 data/
+
+# cursor
+.cursorrules
+.cursorignore
+.backup.env
+
+# Brain directory (ignoring the directory also covers everything inside it)
+.brain/
@@ -7,5 +7,11 @@
       "source.fixAll.ruff": "explicit",
       "source.organizeImports.ruff": "explicit"
     }
+  },
+  "dotenv.enableAutocloaking": false,
+  "workbench.colorCustomizations": {
+    "activityBar.background": "#452606",
+    "titleBar.activeBackground": "#603608",
+    "titleBar.activeForeground": "#FEFBF7"
   }
 }
@@ -0,0 +1,3 @@
+"""
+Command-line interface for browser-use.
+""" 
@@ -0,0 +1,181 @@
+/**
+ * Browser Automation Task Sequences
+ * 
+ * This file defines task sequences for browser automation using the browser-use command.
+ * Each sequence represents a series of browser interactions that can be executed in order.
+ */
+
+/**
+ * Options for a single `browser-use` invocation.
+ *
+ * `executeTask` in this file turns these fields into a command line.
+ */
+export interface BrowserCommand {
+    /** Natural-language instruction; emitted as the quoted first argument. */
+    prompt: string;
+    /** Model name; emitted as `--model <name>` when set. */
+    model?: 'deepseek-chat' | 'gemini' | 'gpt-4' | 'claude-3';
+    /** When true, `--headless` is added to the command line. */
+    headless?: boolean;
+    /** When true, `--vision` is added to the command line. */
+    vision?: boolean;
+    /** When true, `--keep-browser-open` is added to the command line. */
+    keepSessionAlive?: boolean;
+}
+
+/**
+ * One step of a sequence: a human-readable label plus the command to run.
+ */
+export interface BrowserTask {
+    /** Label for the step; the example at the bottom of this file prints it before the command. */
+    description: string;
+    /** The command options for this step. */
+    command: BrowserCommand;
+    /**
+     * Optional nested steps.
+     * NOTE(review): the example loop at the bottom of this file only walks
+     * top-level tasks and never visits subtasks — confirm how they are meant to run.
+     */
+    subtasks?: BrowserTask[];
+}
+
+/**
+ * A named, ordered list of tasks.
+ */
+export interface BrowserTaskSequence {
+    /** Sequence name; the example at the bottom of this file prints it as a heading. */
+    name: string;
+    /** Short summary of what the sequence is for. */
+    description: string;
+    /** The steps of the sequence, in array order. */
+    tasks: BrowserTask[];
+}
+
+/**
+ * Example task sequences.
+ *
+ * Each entry groups an ordered list of tasks; every task carries the
+ * `BrowserCommand` from which a `browser-use` command line can be built.
+ */
+export const browserTasks: BrowserTaskSequence[] = [
+    {
+        name: "Product Research",
+        description: "Compare product prices across multiple e-commerce sites",
+        tasks: [
+            {
+                description: "Search Amazon for wireless earbuds",
+                command: {
+                    prompt: "go to amazon.com and search for 'wireless earbuds' and tell me the price of the top 3 results",
+                    model: "gemini",
+                    vision: true,
+                    keepSessionAlive: true
+                }
+            },
+            {
+                description: "Search Best Buy for comparison",
+                command: {
+                    prompt: "go to bestbuy.com and search for 'wireless earbuds' and tell me the price of the top 3 results",
+                    model: "gemini",
+                    vision: true,
+                    keepSessionAlive: true
+                }
+            },
+            {
+                description: "Create price comparison",
+                command: {
+                    prompt: "create a comparison table of the prices from both sites",
+                    keepSessionAlive: false
+                }
+            }
+        ]
+    },
+    {
+        name: "Site Health Check",
+        description: "Monitor website availability and performance",
+        tasks: [
+            {
+                description: "Check main site",
+                command: {
+                    prompt: "go to example.com and check if it loads properly",
+                    headless: true
+                }
+            },
+            {
+                description: "Verify API health",
+                command: {
+                    prompt: "go to api.example.com/health and tell me the status",
+                    headless: true
+                }
+            },
+            {
+                description: "Test documentation site",
+                command: {
+                    prompt: "go to docs.example.com and verify all navigation links are working",
+                    headless: true
+                }
+            }
+        ]
+    },
+    {
+        name: "Content Analysis",
+        description: "Analyze blog content and engagement",
+        tasks: [
+            {
+                description: "List articles",
+                command: {
+                    prompt: "go to blog.example.com and list all article titles from the homepage",
+                    model: "gemini",
+                    vision: true
+                }
+            },
+            // NOTE(review): this prompt and its subtasks appear to continue from the
+            // page opened by the previous task, yet no command in this sequence sets
+            // keepSessionAlive (the "Advanced Content Analysis" sequence below does
+            // so for its chained steps) — confirm whether that is intended.
+            {
+                description: "Analyze first article",
+                command: {
+                    prompt: "click on the first article and summarize its main points"
+                },
+                subtasks: [
+                    {
+                        description: "Get metadata",
+                        command: {
+                            prompt: "tell me the author, publication date, and reading time"
+                        }
+                    },
+                    {
+                        description: "Analyze comments",
+                        command: {
+                            prompt: "scroll to the comments section and summarize the main discussion points",
+                            vision: true
+                        }
+                    }
+                ]
+            }
+        ]
+    },
+    {
+        name: "Advanced Content Analysis",
+        description: "Analyze website content using different models for different tasks",
+        tasks: [
+            {
+                description: "Initial navigation and basic text extraction",
+                command: {
+                    prompt: "go to docs.github.com and navigate to the Actions documentation",
+                    model: "deepseek-chat",  // Use DeepSeek for basic navigation
+                    keepSessionAlive: true
+                }
+            },
+            {
+                description: "Visual analysis of page structure",
+                command: {
+                    prompt: "analyze the layout of the page and tell me how the documentation is structured, including sidebars, navigation, and content areas",
+                    model: "gemini",  // Switch to Gemini for visual analysis
+                    vision: true,
+                    keepSessionAlive: true
+                }
+            },
+            {
+                description: "Complex content summarization",
+                command: {
+                    prompt: "summarize the key concepts of GitHub Actions based on the documentation",
+                    model: "claude-3",  // Switch to Claude for complex summarization
+                    keepSessionAlive: true
+                }
+            },
+            {
+                description: "Extract code examples",
+                command: {
+                    prompt: "find and list all YAML workflow examples on the page",
+                    model: "deepseek-chat",  // Back to DeepSeek for code extraction
+                    keepSessionAlive: false  // Close browser after final task
+                }
+            }
+        ]
+    }
+];
+
+/**
+ * Build the `browser-use` shell command line for a single command.
+ *
+ * Nothing is executed here; the function only renders a string. The prompt is
+ * emitted as one double-quoted argument, and the characters that remain
+ * special inside double quotes in a POSIX shell (`\`, `"`, `$` and the
+ * backtick) are backslash-escaped so a prompt cannot close the quotes or
+ * trigger expansion when the command is pasted into a shell.
+ *
+ * @param task - Command to render; only truthy options produce a flag.
+ * @returns The command line, with no trailing whitespace.
+ */
+const executeTask = (task: BrowserCommand): string => {
+    // '\\$1' is a literal backslash followed by the matched character.
+    const escapedPrompt = task.prompt.replace(/(["\\$`])/g, '\\$1');
+
+    const options: string[] = [];
+    if (task.model) options.push(`--model ${task.model}`);
+    if (task.headless) options.push('--headless');
+    if (task.vision) options.push('--vision');
+    if (task.keepSessionAlive) options.push('--keep-browser-open');
+
+    return ['browser-use', `"${escapedPrompt}"`, ...options].join(' ');
+};
+
+// Example usage: print the generated command for every top-level task of the
+// first sequence ("Product Research").
+const sequence = browserTasks[0];
+// Guard the indexed access so an empty list is skipped instead of throwing
+// (and so the code type-checks under `noUncheckedIndexedAccess`).
+if (sequence) {
+    console.log(`Executing sequence: ${sequence.name}`);
+    for (const task of sequence.tasks) {
+        console.log(`\n${task.description}:`);
+        console.log(executeTask(task.command));
+    }
+}
@@ -0,0 +1,20 @@
+#!/bin/bash
+
+# Get the absolute directory of this script
+SCRIPT_DIR="$( cd "$( dirname "${BASH_SOURCE[0]}" )" && pwd )"
+
+# Add the project directory to PYTHONPATH
+export PYTHONPATH="$SCRIPT_DIR:$PYTHONPATH"
+
+# Activate the virtual environment if it exists
+if [ -f "$SCRIPT_DIR/venv/bin/activate" ]; then
+    source "$SCRIPT_DIR/venv/bin/activate"
+fi
+
+# Run the Python script with all arguments passed through
+"$SCRIPT_DIR/venv/bin/python" "$SCRIPT_DIR/browser-use-cli.py" "$@"
+
+# Deactivate the virtual environment if it was activated
+if [ -n "$VIRTUAL_ENV" ]; then
+    deactivate
+fi 
@@ -0,0 +1,50 @@
+{
+    "name": "browser-use",
+    "description": "Execute natural language browser automation commands",
+    "type": "terminal_command",
+    "functions": [
+        {
+            "name": "browser_command",
+            "description": "Control a browser using natural language instructions",
+            "parameters": {
+                "properties": {
+                    "prompt": {
+                        "type": "string",
+                        "description": "The natural language instruction (e.g., 'go to google.com and search for OpenAI')"
+                    },
+                    "model": {
+                        "type": "string",
+                        "enum": ["deepseek-chat", "gemini", "gpt-4", "claude-3"],
+                        "default": "deepseek-chat",
+                        "description": "The LLM model to use (optional)"
+                    },
+                    "headless": {
+                        "type": "boolean",
+                        "default": false,
+                        "description": "Run browser in headless mode (optional)"
+                    },
+                    "vision": {
+                        "type": "boolean",
+                        "default": false,
+                        "description": "Enable vision capabilities for supported models (optional)"
+                    }
+                },
+                "required": ["prompt"]
+            }
+        }
+    ],
+    "examples": [
+        {
+            "description": "Basic usage",
+            "command": "browser-use \"go to google.com and search for OpenAI\""
+        },
+        {
+            "description": "Using vision to analyze a webpage",
+            "command": "browser-use \"go to openai.com and tell me what you see\" --model gemini --vision"
+        },
+        {
+            "description": "Running a check in headless mode",
+            "command": "browser-use \"check if github.com is up\" --headless"
+        }
+    ]
+}
Original file line number	Diff line number	Diff line change
`@@ -7,5 +7,11 @@`
`7`	`7`	`"source.fixAll.ruff": "explicit",`
`8`	`8`	`"source.organizeImports.ruff": "explicit"`
`9`	`9`	`}`
	`10`	`+ },`
	`11`	`+ "dotenv.enableAutocloaking": false,`
	`12`	`+ "workbench.colorCustomizations": {`
	`13`	`+ "activityBar.background": "#452606",`
	`14`	`+ "titleBar.activeBackground": "#603608",`
	`15`	`+ "titleBar.activeForeground": "#FEFBF7"`
`10`	`16`	`}`
`11`	`17`	`}`
Original file line number	Diff line number	Diff line change
`@@ -0,0 +1,3 @@`
	`1`	`+"""`
	`2`	`+Command-line interface for browser-use.`
	`3`	`+"""`