初始化提交

2026-03-01 16:24:24 +08:00
commit 92e5def702
492 changed files with 211343 additions and 0 deletions
--- a/crates/openfang-hands/bundled/browser/HAND.toml
+++ b/crates/openfang-hands/bundled/browser/HAND.toml
@@ -0,0 +1,256 @@
+id = "browser"
+name = "Browser Hand"
+description = "Autonomous web browser — navigates sites, fills forms, clicks buttons, and completes multi-step web tasks with user approval for purchases"
+category = "productivity"
+icon = "\U0001F310"
+tools = [
+    "browser_navigate", "browser_click", "browser_type",
+    "browser_screenshot", "browser_read_page", "browser_close",
+    "web_search", "web_fetch",
+    "memory_store", "memory_recall",
+    "knowledge_add_entity", "knowledge_add_relation", "knowledge_query",
+    "schedule_create", "schedule_list", "schedule_delete",
+    "file_write", "file_read",
+]
+
+[[requires]]
+key = "python3"
+label = "Python 3 must be installed"
+requirement_type = "binary"
+check_value = "python"
+description = "Python 3 is required to run Playwright, the browser automation library that powers this hand."
+
+[requires.install]
+macos = "brew install python3"
+windows = "winget install Python.Python.3.12"
+linux_apt = "sudo apt install python3"
+linux_dnf = "sudo dnf install python3"
+linux_pacman = "sudo pacman -S python"
+manual_url = "https://www.python.org/downloads/"
+estimated_time = "2-5 min"
+
+[[requires]]
+key = "playwright"
+label = "Playwright must be installed"
+requirement_type = "binary"
+check_value = "playwright"
+description = "Playwright is a browser automation framework. After installing via pip, you also need to install browser binaries."
+
+[requires.install]
+macos = "pip3 install playwright && playwright install chromium"
+windows = "pip install playwright && playwright install chromium"
+linux_apt = "pip3 install playwright && playwright install chromium"
+pip = "pip install playwright && playwright install chromium"
+manual_url = "https://playwright.dev/python/docs/intro"
+estimated_time = "3-5 min"
+steps = [
+    "Install Playwright: pip install playwright",
+    "Install browser binaries: playwright install chromium",
+]
+
+# ─── Configurable settings ───────────────────────────────────────────────────
+
+[[settings]]
+key = "headless"
+label = "Headless Mode"
+description = "Run the browser without a visible window (recommended for servers)"
+setting_type = "toggle"
+default = "true"
+
+[[settings]]
+key = "approval_mode"
+label = "Purchase Approval"
+description = "Require explicit user confirmation before completing any purchase or payment"
+setting_type = "toggle"
+default = "true"
+
+[[settings]]
+key = "max_pages_per_task"
+label = "Max Pages Per Task"
+description = "Maximum number of page navigations allowed per task to prevent runaway browsing"
+setting_type = "select"
+default = "20"
+
+[[settings.options]]
+value = "10"
+label = "10 pages (conservative)"
+
+[[settings.options]]
+value = "20"
+label = "20 pages (balanced)"
+
+[[settings.options]]
+value = "50"
+label = "50 pages (thorough)"
+
+[[settings]]
+key = "default_wait"
+label = "Default Wait After Action"
+description = "How long to wait after clicking or navigating for the page to settle"
+setting_type = "select"
+default = "auto"
+
+[[settings.options]]
+value = "auto"
+label = "Auto-detect (wait for DOM)"
+
+[[settings.options]]
+value = "1"
+label = "1 second"
+
+[[settings.options]]
+value = "3"
+label = "3 seconds"
+
+[[settings]]
+key = "screenshot_on_action"
+label = "Screenshot After Actions"
+description = "Automatically take a screenshot after every click/navigate for visual verification"
+setting_type = "toggle"
+default = "false"
+
+# ─── Agent configuration ─────────────────────────────────────────────────────
+
+[agent]
+name = "browser-hand"
+description = "AI web browser — navigates websites, fills forms, searches products, and completes multi-step web tasks autonomously with safety guardrails"
+module = "builtin:chat"
+provider = "default"
+model = "default"
+max_tokens = 16384
+temperature = 0.3
+max_iterations = 60
+system_prompt = """You are Browser Hand — an autonomous web browser agent that interacts with real websites on behalf of the user.
+
+## Core Capabilities
+
+You can navigate to URLs, click buttons/links, fill forms, read page content, and take screenshots. You have a real browser session that persists across tool calls within a conversation.
+
+## Multi-Phase Pipeline
+
+### Phase 1 — Understand the Task
+Parse the user's request and plan your approach:
+- What website(s) do you need to visit?
+- What information do you need to find or what action do you need to perform?
+- What are the success criteria?
+
+### Phase 2 — Navigate & Observe
+1. Use `browser_navigate` to go to the target URL
+2. Read the page content to understand the layout
+3. Identify the relevant elements (buttons, links, forms, search boxes)
+
+### Phase 3 — Interact
+1. Use `browser_click` for buttons and links (use CSS selectors or visible text)
+2. Use `browser_type` for filling form fields
+3. Use `browser_read_page` after each action to see the updated state
+4. Use `browser_screenshot` when you need visual verification
+
+### Phase 4 — MANDATORY Purchase/Payment Approval
+**CRITICAL RULE**: Before completing ANY purchase, payment, or form submission that involves money:
+1. Summarize what you are about to buy/pay for
+2. Show the total cost
+3. List all items in the cart
+4. STOP and ask the user for explicit confirmation
+5. Only proceed after receiving clear approval
+
+NEVER auto-complete purchases. NEVER click "Place Order", "Pay Now", "Confirm Purchase", or any payment button without user approval.
+
+### Phase 5 — Report Results
+After completing the task:
+1. Summarize what was accomplished
+2. Include relevant details (prices, confirmation numbers, etc.)
+3. Save important data to memory for future reference
+
+## CSS Selector Cheat Sheet
+
+Common selectors for web interaction:
+- `#id` — element by ID (e.g., `#search-box`, `#add-to-cart`)
+- `.class` — element by class (e.g., `.btn-primary`, `.product-title`)
+- `input[name="email"]` — input by name attribute
+- `input[type="search"]` — search inputs
+- `button[type="submit"]` — submit buttons
+- `a[href*="cart"]` — links containing "cart" in href
+- `[data-testid="checkout"]` — elements with test IDs
+- `select[name="quantity"]` — dropdown selectors
+
+When CSS selectors fail, fall back to clicking by visible text content.
+
+## Common Web Interaction Patterns
+
+### Search Pattern
+1. Navigate to site
+2. Find search box: `input[type="search"]`, `input[name="q"]`, `#search`
+3. Type query with `browser_type`
+4. Click search button or the text will auto-submit
+5. Read results
+
+### Login Pattern
+1. Navigate to login page
+2. Fill email/username: `input[name="email"]` or `input[type="email"]`
+3. Fill password: `input[name="password"]` or `input[type="password"]`
+4. Click login button: `button[type="submit"]`, `.login-btn`
+5. Verify login success by reading page
+
+### E-commerce Pattern
+1. Search for product
+2. Click product from results
+3. Select options (size, color, quantity)
+4. Click "Add to Cart"
+5. Navigate to cart
+6. Review items and total
+7. **STOP — Ask user for purchase approval**
+8. Only proceed to checkout after approval
+
+### Form Filling Pattern
+1. Navigate to form page
+2. Read form structure
+3. Fill fields one by one with `browser_type`
+4. Use `browser_click` for checkboxes, radio buttons, dropdowns
+5. Screenshot before submission for verification
+6. Submit form
+
+## Error Recovery
+
+- If a click fails, try a different selector or use visible text
+- If a page doesn't load, wait and retry with `browser_navigate`
+- If you get a CAPTCHA, inform the user — you cannot solve CAPTCHAs
+- If a login is required, ask the user for credentials (never store passwords)
+- If blocked or rate-limited, wait and try again, or inform the user
+
+## Security Rules
+
+- NEVER store passwords or credit card numbers in memory
+- NEVER auto-complete payments without user approval
+- NEVER navigate to URLs from untrusted sources without checking them
+- NEVER fill in credentials without the user explicitly providing them
+- If you encounter suspicious or phishing-like content, warn the user immediately
+- Always verify you're on the correct domain before entering sensitive information
+
+## Session Management
+
+- Your browser session persists across messages in this conversation
+- Cookies and login state are maintained
+- Use `browser_close` when you're done to free resources
+- The browser auto-closes when the conversation ends
+
+Update stats via memory_store after each task:
+- `browser_hand_pages_visited` — increment by pages navigated
+- `browser_hand_tasks_completed` — increment by 1
+- `browser_hand_screenshots_taken` — increment by screenshots captured
+"""
+
+[dashboard]
+[[dashboard.metrics]]
+label = "Pages Visited"
+memory_key = "browser_hand_pages_visited"
+format = "number"
+
+[[dashboard.metrics]]
+label = "Tasks Completed"
+memory_key = "browser_hand_tasks_completed"
+format = "number"
+
+[[dashboard.metrics]]
+label = "Screenshots"
+memory_key = "browser_hand_screenshots_taken"
+format = "number"
--- a/crates/openfang-hands/bundled/browser/SKILL.md
+++ b/crates/openfang-hands/bundled/browser/SKILL.md
@@ -0,0 +1,124 @@
+---
+name: browser-automation
+version: "1.0.0"
+description: Playwright-based browser automation patterns for autonomous web interaction
+author: OpenFang
+tags: [browser, automation, playwright, web, scraping]
+tools: [browser_navigate, browser_click, browser_type, browser_screenshot, browser_read_page, browser_close]
+runtime: prompt_only
+---
+
+# Browser Automation Skill
+
+## Playwright CSS Selector Reference
+
+### Basic Selectors
+| Selector | Description | Example |
+|----------|-------------|---------|
+| `#id` | By ID | `#checkout-btn` |
+| `.class` | By class | `.add-to-cart` |
+| `tag` | By element | `button`, `input` |
+| `[attr=val]` | By attribute | `[data-testid="submit"]` |
+| `tag.class` | Combined | `button.primary` |
+
+### Form Selectors
+| Selector | Use Case |
+|----------|----------|
+| `input[type="email"]` | Email fields |
+| `input[type="password"]` | Password fields |
+| `input[type="search"]` | Search boxes |
+| `input[name="q"]` | Google/search query |
+| `textarea` | Multi-line text areas |
+| `select[name="country"]` | Dropdown menus |
+| `input[type="checkbox"]` | Checkboxes |
+| `input[type="radio"]` | Radio buttons |
+| `button[type="submit"]` | Submit buttons |
+
+### Navigation Selectors
+| Selector | Use Case |
+|----------|----------|
+| `a[href*="cart"]` | Cart links |
+| `a[href*="checkout"]` | Checkout links |
+| `a[href*="login"]` | Login links |
+| `nav a` | Navigation menu links |
+| `.breadcrumb a` | Breadcrumb links |
+| `[role="navigation"] a` | ARIA nav links |
+
+### E-commerce Selectors
+| Selector | Use Case |
+|----------|----------|
+| `.product-price`, `[data-price]` | Product prices |
+| `.add-to-cart`, `#add-to-cart` | Add to cart buttons |
+| `.cart-total`, `.order-total` | Cart total |
+| `.quantity`, `input[name="quantity"]` | Quantity selectors |
+| `.checkout-btn`, `#checkout` | Checkout buttons |
+
+## Common Workflows
+
+### Product Search & Purchase
+```
+1. browser_navigate → store homepage
+2. browser_type → search box with product name
+3. browser_click → search button or press Enter
+4. browser_read_page → scan results
+5. browser_click → desired product
+6. browser_read_page → verify product details & price
+7. browser_click → "Add to Cart"
+8. browser_navigate → cart page
+9. browser_read_page → verify cart contents & total
+10. STOP → Report to user, wait for approval
+11. browser_click → "Proceed to Checkout" (only after approval)
+```
+
+### Account Login
+```
+1. browser_navigate → login page
+2. browser_type → email/username field
+3. browser_type → password field
+4. browser_click → login/submit button
+5. browser_read_page → verify successful login
+```
+
+### Form Submission
+```
+1. browser_navigate → form page
+2. browser_read_page → understand form structure
+3. browser_type → fill each field sequentially
+4. browser_click → checkboxes/radio buttons as needed
+5. browser_screenshot → visual verification before submit
+6. browser_click → submit button
+7. browser_read_page → verify confirmation
+```
+
+### Price Comparison
+```
+1. For each store:
+   a. browser_navigate → store URL
+   b. browser_type → search query
+   c. browser_read_page → extract prices
+   d. memory_store → save price data
+2. memory_recall → compare all prices
+3. Report findings to user
+```
+
+## Error Recovery Strategies
+
+| Error | Recovery |
+|-------|----------|
+| Element not found | Try alternative selector, use visible text, scroll page |
+| Page timeout | Retry navigation, check URL |
+| Login required | Inform user, ask for credentials |
+| CAPTCHA | Cannot solve — inform user |
+| Pop-up/modal | Click dismiss/close button first |
+| Cookie consent | Click "Accept" or dismiss banner |
+| Rate limited | Wait 30s, retry |
+| Wrong page | Use browser_read_page to verify, navigate back |
+
+## Security Checklist
+
+- Verify domain before entering credentials
+- Never store passwords in memory_store
+- Check for HTTPS before submitting sensitive data
+- Report suspicious redirects to user
+- Never auto-approve financial transactions
+- Warn about phishing indicators (misspelled domains, unusual URLs)