From 0eb73c778a49b35676c6a3a3a06d9af2f2064400 Mon Sep 17 00:00:00 2001
From: rcholic <ivytony@gmail.com>
Date: Thu, 25 Dec 2025 21:09:46 -0800
Subject: [PATCH] linting

---
 pyproject.toml                         |   2 +-
 sentience/__init__.py                  |   2 +-
 sentience/cli.py                       |   1 -
 sentience_python.egg-info/PKG-INFO     | 508 ++++++++++++++++++++++---
 sentience_python.egg-info/SOURCES.txt  |  18 +
 sentience_python.egg-info/requires.txt |   3 +
 6 files changed, 485 insertions(+), 49 deletions(-)

diff --git a/pyproject.toml b/pyproject.toml
index 43198f3..2ec681f 100644
--- a/pyproject.toml
+++ b/pyproject.toml
@@ -4,7 +4,7 @@ build-backend = "setuptools.build_meta"
 
 [project]
 name = "sentience-python"
-version = "0.10.8"
+version = "0.11.0"
 description = "Python SDK for Sentience AI Agent Browser Automation"
 readme = "README.md"
 requires-python = ">=3.11"
diff --git a/sentience/__init__.py b/sentience/__init__.py
index 7c1b07f..edec2ab 100644
--- a/sentience/__init__.py
+++ b/sentience/__init__.py
@@ -41,7 +41,7 @@
 from .snapshot import snapshot
 from .wait import wait_for
 
-__version__ = "0.10.8"
+__version__ = "0.11.0"
 
 __all__ = [
     # Core SDK
diff --git a/sentience/cli.py b/sentience/cli.py
index 088e819..a7f0ef4 100644
--- a/sentience/cli.py
+++ b/sentience/cli.py
@@ -4,7 +4,6 @@
 
 import argparse
 import sys
-from pathlib import Path
 
 from .browser import SentienceBrowser
 from .generator import ScriptGenerator
diff --git a/sentience_python.egg-info/PKG-INFO b/sentience_python.egg-info/PKG-INFO
index 9af70e0..fbff41c 100644
--- a/sentience_python.egg-info/PKG-INFO
+++ b/sentience_python.egg-info/PKG-INFO
@@ -1,97 +1,513 @@
 Metadata-Version: 2.4
 Name: sentience-python
-Version: 0.1.0
+Version: 0.10.8
 Summary: Python SDK for Sentience AI Agent Browser Automation
-Requires-Python: >=3.8
+Author: Sentience Team
+License: MIT
+Project-URL: Homepage, https://github.com/SentienceAPI/sentience-python
+Project-URL: Repository, https://github.com/SentienceAPI/sentience-python
+Project-URL: Issues, https://github.com/SentienceAPI/sentience-python/issues
+Keywords: browser-automation,playwright,ai-agent,web-automation,sentience
+Classifier: Development Status :: 4 - Beta
+Classifier: Intended Audience :: Developers
+Classifier: License :: OSI Approved :: MIT License
+Classifier: Programming Language :: Python :: 3
+Classifier: Programming Language :: Python :: 3.11
+Requires-Python: >=3.11
 Description-Content-Type: text/markdown
+License-File: LICENSE.md
 Requires-Dist: playwright>=1.40.0
 Requires-Dist: pydantic>=2.0.0
 Requires-Dist: jsonschema>=4.0.0
+Requires-Dist: requests>=2.31.0
+Requires-Dist: playwright-stealth>=1.0.6
+Requires-Dist: markdownify>=0.11.6
 Provides-Extra: dev
 Requires-Dist: pytest>=7.0.0; extra == "dev"
 Requires-Dist: pytest-asyncio>=0.21.0; extra == "dev"
+Dynamic: license-file
 
 # Sentience Python SDK
 
-**Status**: ✅ Week 1 Complete
-
-Python SDK for Sentience AI Agent Browser Automation.
+The SDK is open under ELv2; the core semantic geometry and reliability logic runs in Sentience-hosted services.
 
 ## Installation
 
 ```bash
-cd sdk-python
 pip install -e .
 
 # Install Playwright browsers (required)
 playwright install chromium
+
+# For LLM Agent features (optional)
+pip install openai  # For OpenAI models
+pip install anthropic  # For Claude models
+pip install transformers torch  # For local LLMs
 ```
 
-## Quick Start
+## Quick Start: Choose Your Abstraction Level
+
+Sentience SDK offers **three abstraction levels** - use what fits your needs:
+
+### 🎯 **Level 3: Natural Language (Easiest)** - For non-technical users
+
+```python
+from sentience import SentienceBrowser, ConversationalAgent
+from sentience.llm_provider import OpenAIProvider
+
+browser = SentienceBrowser()
+llm = OpenAIProvider(api_key="your-key", model="gpt-4o")
+agent = ConversationalAgent(browser, llm)
+
+with browser:
+    response = agent.execute("Search for magic mouse on google.com")
+    print(response)
+    # → "I searched for 'magic mouse' and found several results.
+    #    The top result is from amazon.com selling Magic Mouse 2 for $79."
+```
+
+- **Best for:** End users, chatbots, no-code platforms
+- **Code required:** 3-5 lines
+- **Technical knowledge:** None
+
+### ⚙️ **Level 2: Technical Commands (Recommended)** - For AI developers
+
+```python
+from sentience import SentienceBrowser, SentienceAgent
+from sentience.llm_provider import OpenAIProvider
+
+browser = SentienceBrowser()
+llm = OpenAIProvider(api_key="your-key", model="gpt-4o")
+agent = SentienceAgent(browser, llm)
+
+with browser:
+    browser.page.goto("https://google.com")
+    agent.act("Click the search box")
+    agent.act("Type 'magic mouse' into the search field")
+    agent.act("Press Enter key")
+```
+
+- **Best for:** Building AI agents, automation scripts
+- **Code required:** 10-15 lines
+- **Technical knowledge:** Medium (Python basics)
+
+### 🔧 **Level 1: Direct SDK (Most Control)** - For production automation
 
 ```python
 from sentience import SentienceBrowser, snapshot, find, click
 
-# Start browser with extension
 with SentienceBrowser(headless=False) as browser:
     browser.page.goto("https://example.com")
-    browser.page.wait_for_load_state("networkidle")
-    
-    # Take snapshot
+
+    # Take snapshot - captures all interactive elements
     snap = snapshot(browser)
     print(f"Found {len(snap.elements)} elements")
-    
-    # Find and click a link
-    link = find(snap, "role=link")
+
+    # Find and click a link using semantic selectors
+    link = find(snap, "role=link text~'More information'")
     if link:
         result = click(browser, link.id)
         print(f"Click success: {result.success}")
 ```
 
-## Features
+- **Best for:** Maximum control, performance-critical apps
+- **Code required:** 20-50 lines
+- **Technical knowledge:** High (SDK API, selectors)
+
+## Real-World Example: Amazon Shopping Bot
+
+This example demonstrates navigating Amazon, finding products, and adding items to cart:
+
+```python
+from sentience import SentienceBrowser, snapshot, find, click
+import time
+
+with SentienceBrowser(headless=False) as browser:
+    # Navigate to Amazon Best Sellers
+    browser.goto("https://www.amazon.com/gp/bestsellers/", wait_until="domcontentloaded")
+    time.sleep(2)  # Wait for dynamic content
+
+    # Take snapshot and find products
+    snap = snapshot(browser)
+    print(f"Found {len(snap.elements)} elements")
+
+    # Find first product in viewport using spatial filtering
+    products = [
+        el for el in snap.elements
+        if el.role == "link"
+        and el.visual_cues.is_clickable
+        and el.in_viewport
+        and not el.is_occluded
+        and el.bbox.y < 600  # First row
+    ]
+
+    if products:
+        # Sort by position (left to right, top to bottom)
+        products.sort(key=lambda e: (e.bbox.y, e.bbox.x))
+        first_product = products[0]
+
+        print(f"Clicking: {first_product.text}")
+        result = click(browser, first_product.id)
+
+        # Wait for product page
+        browser.page.wait_for_load_state("networkidle")
+        time.sleep(2)
+
+        # Find and click "Add to Cart" button
+        product_snap = snapshot(browser)
+        add_to_cart = find(product_snap, "role=button text~'add to cart'")
+
+        if add_to_cart:
+            cart_result = click(browser, add_to_cart.id)
+            print(f"Added to cart: {cart_result.success}")
+```
+
+**See the complete tutorial**: [Amazon Shopping Guide](../docs/AMAZON_SHOPPING_GUIDE.md)
+
+## Core Features
 
-### Day 2: Browser Harness
-- `SentienceBrowser` - Launch Playwright with extension loaded
-- Automatic extension loading and verification
+### Browser Control
+- **`SentienceBrowser`** - Playwright browser with Sentience extension pre-loaded
+- **`browser.goto(url)`** - Navigate with automatic extension readiness checks
+- Automatic bot evasion and stealth mode
+- Configurable headless/headed mode
 
-### Day 3: Snapshot
-- `snapshot(browser, options)` - Capture page state
+### Snapshot - Intelligent Page Analysis
+- **`snapshot(browser, screenshot=True)`** - Capture page state with AI-ranked elements
+- Returns semantic elements with roles, text, importance scores, and bounding boxes
+- Optional screenshot capture (PNG/JPEG)
 - Pydantic models for type safety
-- `snapshot.save(filepath)` - Save to JSON
-
-### Day 4: Query Engine
-- `query(snapshot, selector)` - Find elements matching selector
-- `find(snapshot, selector)` - Find single best match
-- String DSL: `"role=button text~'Sign in'"`
-
-### Day 5: Actions
-- `click(browser, element_id)` - Click element
-- `type_text(browser, element_id, text)` - Type into element
-- `press(browser, key)` - Press keyboard key
-
-### Day 6: Wait & Assert
-- `wait_for(browser, selector, timeout)` - Wait for element
-- `expect(browser, selector)` - Assertion helper
-  - `.to_exist()`
-  - `.to_be_visible()`
-  - `.to_have_text(text)`
-  - `.to_have_count(n)`
+- **`snapshot.save(filepath)`** - Export to JSON
+
+**Example:**
+```python
+snap = snapshot(browser, screenshot=True)
+
+# Access structured data
+print(f"URL: {snap.url}")
+print(f"Viewport: {snap.viewport.width}x{snap.viewport.height}")
+print(f"Elements: {len(snap.elements)}")
+
+# Iterate over elements
+for element in snap.elements:
+    print(f"{element.role}: {element.text} (importance: {element.importance})")
+```
+
+### Query Engine - Semantic Element Selection
+- **`query(snapshot, selector)`** - Find all matching elements
+- **`find(snapshot, selector)`** - Find single best match (by importance)
+- Powerful query DSL with multiple operators
+
+**Query Examples:**
+```python
+# Find by role and text
+button = find(snap, "role=button text='Sign in'")
+
+# Substring match (case-insensitive)
+link = find(snap, "role=link text~'more info'")
+
+# Spatial filtering
+top_left = find(snap, "bbox.x<=100 bbox.y<=200")
+
+# Multiple conditions (AND logic)
+primary_btn = find(snap, "role=button clickable=true visible=true importance>800")
+
+# Prefix/suffix matching
+starts_with = find(snap, "text^='Add'")
+ends_with = find(snap, "text$='Cart'")
+
+# Numeric comparisons
+important = query(snap, "importance>=700")
+first_row = query(snap, "bbox.y<600")
+```
+
+**📖 [Complete Query DSL Guide](docs/QUERY_DSL.md)** - All operators, fields, and advanced patterns
+
+### Actions - Interact with Elements
+- **`click(browser, element_id)`** - Click element by ID
+- **`click_rect(browser, rect)`** - Click at center of rectangle (coordinate-based)
+- **`type_text(browser, element_id, text)`** - Type into input fields
+- **`press(browser, key)`** - Press keyboard keys (Enter, Escape, Tab, etc.)
+
+All actions return `ActionResult` with success status, timing, and outcome:
+
+```python
+result = click(browser, element.id)
+
+print(f"Success: {result.success}")
+print(f"Outcome: {result.outcome}")  # "navigated", "dom_updated", "error"
+print(f"Duration: {result.duration_ms}ms")
+print(f"URL changed: {result.url_changed}")
+```
+
+**Coordinate-based clicking:**
+```python
+from sentience import click_rect
+
+# Click at center of rectangle (x, y, width, height)
+click_rect(browser, {"x": 100, "y": 200, "w": 50, "h": 30})
+
+# With visual highlight (default: red border for 2 seconds)
+click_rect(browser, {"x": 100, "y": 200, "w": 50, "h": 30}, highlight=True, highlight_duration=2.0)
+
+# Using element's bounding box
+snap = snapshot(browser)
+element = find(snap, "role=button")
+if element:
+    click_rect(browser, {
+        "x": element.bbox.x,
+        "y": element.bbox.y,
+        "w": element.bbox.width,
+        "h": element.bbox.height
+    })
+```
+
+### Wait & Assertions
+- **`wait_for(browser, selector, timeout=5.0, interval=None, use_api=None)`** - Wait for element to appear
+- **`expect(browser, selector)`** - Assertion helper with fluent API
+
+**Examples:**
+```python
+# Wait for element (auto-detects optimal interval based on API usage)
+result = wait_for(browser, "role=button text='Submit'", timeout=10.0)
+if result.found:
+    print(f"Found after {result.duration_ms}ms")
+
+# Use local extension with fast polling (0.25s interval)
+result = wait_for(browser, "role=button", timeout=5.0, use_api=False)
+
+# Use remote API with network-friendly polling (1.5s interval)
+result = wait_for(browser, "role=button", timeout=5.0, use_api=True)
+
+# Custom interval override
+result = wait_for(browser, "role=button", timeout=5.0, interval=0.5, use_api=False)
+
+# Semantic wait conditions
+wait_for(browser, "clickable=true", timeout=5.0)  # Wait for clickable element
+wait_for(browser, "importance>100", timeout=5.0)  # Wait for important element
+wait_for(browser, "role=link visible=true", timeout=5.0)  # Wait for visible link
+
+# Assertions
+expect(browser, "role=button text='Submit'").to_exist(timeout=5.0)
+expect(browser, "role=heading").to_be_visible()
+expect(browser, "role=button").to_have_text("Submit")
+expect(browser, "role=link").to_have_count(10)
+```
+
+### Content Reading
+- **`read(browser, format="text|markdown|raw")`** - Extract page content
+  - `format="text"` - Plain text extraction
+  - `format="markdown"` - High-quality markdown conversion (uses markdownify)
+  - `format="raw"` - Cleaned HTML (default)
+
+**Example:**
+```python
+from sentience import read
+
+# Get markdown content
+result = read(browser, format="markdown")
+print(result["content"])  # Markdown text
+
+# Get plain text
+result = read(browser, format="text")
+print(result["content"])  # Plain text
+```
+
+### Screenshots
+- **`screenshot(browser, format="png|jpeg", quality=80)`** - Standalone screenshot capture
+  - Returns base64-encoded data URL
+  - PNG or JPEG format
+  - Quality control for JPEG (1-100)
+
+**Example:**
+```python
+from sentience import screenshot
+import base64
+
+# Capture PNG screenshot
+data_url = screenshot(browser, format="png")
+
+# Save to file
+image_data = base64.b64decode(data_url.split(",")[1])
+with open("screenshot.png", "wb") as f:
+    f.write(image_data)
+
+# JPEG with quality control (smaller file size)
+data_url = screenshot(browser, format="jpeg", quality=85)
+```
+
+## Element Properties
+
+Elements returned by `snapshot()` have the following properties:
+
+```python
+element.id              # Unique identifier for interactions
+element.role            # ARIA role (button, link, textbox, heading, etc.)
+element.text            # Visible text content
+element.importance      # AI importance score (0-1000)
+element.bbox            # Bounding box (x, y, width, height)
+element.visual_cues     # Visual analysis (is_primary, is_clickable, background_color)
+element.in_viewport     # Is element visible in current viewport?
+element.is_occluded     # Is element covered by other elements?
+element.z_index         # CSS stacking order
+```
+
+## Query DSL Reference
+
+### Basic Operators
+
+| Operator | Description | Example |
+|----------|-------------|---------|
+| `=` | Exact match | `role=button` |
+| `!=` | Exclusion | `role!=link` |
+| `~` | Substring (case-insensitive) | `text~'sign in'` |
+| `^=` | Prefix match | `text^='Add'` |
+| `$=` | Suffix match | `text$='Cart'` |
+| `>`, `>=` | Greater than / greater than or equal | `importance>500` |
+| `<`, `<=` | Less than / less than or equal | `bbox.y<600` |
+
+### Supported Fields
+
+- **Role**: `role=button|link|textbox|heading|...`
+- **Text**: `text`, `text~`, `text^=`, `text$=`
+- **Visibility**: `clickable=true|false`, `visible=true|false`
+- **Importance**: `importance`, `importance>=N`, `importance<N`
+- **Position**: `bbox.x`, `bbox.y`, `bbox.width`, `bbox.height`
+- **Layering**: `z_index`
 
 ## Examples
 
-See `examples/` directory:
-- `hello.py` - Extension bridge verification
-- `basic_agent.py` - Basic snapshot
-- `query_demo.py` - Query engine
-- `wait_and_click.py` - Wait and actions
+See the `examples/` directory for complete working examples:
+
+- **`hello.py`** - Extension bridge verification
+- **`basic_agent.py`** - Basic snapshot and element inspection
+- **`query_demo.py`** - Query engine demonstrations
+- **`wait_and_click.py`** - Waiting for elements and performing actions
+- **`read_markdown.py`** - Content extraction and markdown conversion
 
 ## Testing
 
 ```bash
+# Run all tests
 pytest tests/
+
+# Run specific test file
+pytest tests/test_snapshot.py
+
+# Run with verbose output
+pytest -v tests/
 ```
 
+## Configuration
+
+### Viewport Size
+
+Default viewport is **1280x800** pixels. You can customize it using Playwright's API:
+
+```python
+with SentienceBrowser(headless=False) as browser:
+    # Set custom viewport before navigating
+    browser.page.set_viewport_size({"width": 1920, "height": 1080})
+
+    browser.goto("https://example.com")
+```
+
+### Headless Mode
+
+```python
+# Headed mode (default in dev, shows browser window)
+browser = SentienceBrowser(headless=False)
+
+# Headless mode (default in CI environments)
+browser = SentienceBrowser(headless=True)
+
+# Auto-detect based on environment
+browser = SentienceBrowser()  # headless=True if CI=true, else False
+```
+
+## Best Practices
+
+### 1. Wait for Dynamic Content
+```python
+browser.goto("https://example.com", wait_until="domcontentloaded")
+time.sleep(1)  # Extra buffer for AJAX/animations
+```
+
+### 2. Use Multiple Strategies for Finding Elements
+```python
+# Try exact match first
+btn = find(snap, "role=button text='Add to Cart'")
+
+# Fallback to fuzzy match
+if not btn:
+    btn = find(snap, "role=button text~'cart'")
+```
+
+### 3. Check Element Visibility Before Clicking
+```python
+if element.in_viewport and not element.is_occluded:
+    click(browser, element.id)
+```
+
+### 4. Handle Navigation
+```python
+result = click(browser, link_id)
+if result.url_changed:
+    browser.page.wait_for_load_state("networkidle")
+```
+
+### 5. Use Screenshots Sparingly
+```python
+# Fast - no screenshot (only element data)
+snap = snapshot(browser)
+
+# Slower - with screenshot (for debugging/verification)
+snap = snapshot(browser, screenshot=True)
+```
+
+## Troubleshooting
+
+### "Extension failed to load"
+**Solution:** Build the extension first:
+```bash
+cd sentience-chrome
+./build.sh
+```
+
+### "Element not found"
+**Solutions:**
+- Ensure page is loaded: `browser.page.wait_for_load_state("networkidle")`
+- Use `wait_for()`: `wait_for(browser, "role=button", timeout=10)`
+- Debug elements: `print([el.text for el in snap.elements])`
+
+### Button not clickable
+**Solutions:**
+- Check visibility: `element.in_viewport and not element.is_occluded`
+- Scroll to element: `browser.page.evaluate(f"window.sentience_registry[{element.id}].scrollIntoView()")`
+
 ## Documentation
 
-- API Contract: `../spec/SNAPSHOT_V1.md`
-- Type Definitions: `../spec/sdk-types.md`
+- **📖 [Amazon Shopping Guide](../docs/AMAZON_SHOPPING_GUIDE.md)** - Complete tutorial with real-world example
+- **📖 [Query DSL Guide](docs/QUERY_DSL.md)** - Advanced query patterns and operators
+- **📄 [API Contract](../spec/SNAPSHOT_V1.md)** - Snapshot API specification
+- **📄 [Type Definitions](../spec/sdk-types.md)** - TypeScript/Python type definitions
+
+## License
+
+📜 **License**
+
+This SDK is licensed under the **Elastic License 2.0 (ELv2)**.
+
+The Elastic License 2.0 allows you to use, modify, and distribute this SDK for internal, research, and non-competitive purposes. It **does not permit offering this SDK or a derivative as a hosted or managed service**, nor using it to build a competing product or service.
+
+### Important Notes
+
+- This SDK is a **client-side library** that communicates with proprietary Sentience services and browser components.
+
+- The Sentience backend services (including semantic geometry grounding, ranking, visual cues, and trace processing) are **not open source** and are governed by Sentience’s Terms of Service.
+
+- Use of this SDK does **not** grant rights to operate, replicate, or reimplement Sentience’s hosted services.
+
+For commercial usage, hosted offerings, or enterprise deployments, please contact Sentience to obtain a commercial license.
+
+See the full license text in [`LICENSE.md`](./LICENSE.md).
diff --git a/sentience_python.egg-info/SOURCES.txt b/sentience_python.egg-info/SOURCES.txt
index 53f0ea9..8600025 100644
--- a/sentience_python.egg-info/SOURCES.txt
+++ b/sentience_python.egg-info/SOURCES.txt
@@ -1,15 +1,23 @@
+LICENSE.md
+MANIFEST.in
 README.md
 pyproject.toml
 sentience/__init__.py
 sentience/actions.py
+sentience/agent.py
+sentience/base_agent.py
 sentience/browser.py
 sentience/cli.py
+sentience/conversational_agent.py
 sentience/expect.py
 sentience/generator.py
 sentience/inspector.py
+sentience/llm_provider.py
 sentience/models.py
 sentience/query.py
+sentience/read.py
 sentience/recorder.py
+sentience/screenshot.py
 sentience/snapshot.py
 sentience/wait.py
 sentience_python.egg-info/PKG-INFO
@@ -18,12 +26,22 @@ sentience_python.egg-info/dependency_links.txt
 sentience_python.egg-info/entry_points.txt
 sentience_python.egg-info/requires.txt
 sentience_python.egg-info/top_level.txt
+spec/README.md
+spec/SNAPSHOT_V1.md
+spec/sdk-types.md
+spec/snapshot.schema.json
 tests/test_actions.py
+tests/test_agent.py
+tests/test_bot.py
+tests/test_conversational_agent.py
 tests/test_generator.py
 tests/test_inspector.py
 tests/test_query.py
+tests/test_read.py
 tests/test_recorder.py
+tests/test_screenshot.py
 tests/test_smart_selector.py
 tests/test_snapshot.py
 tests/test_spec_validation.py
+tests/test_stealth.py
 tests/test_wait.py
\ No newline at end of file
diff --git a/sentience_python.egg-info/requires.txt b/sentience_python.egg-info/requires.txt
index 180ad52..9052060 100644
--- a/sentience_python.egg-info/requires.txt
+++ b/sentience_python.egg-info/requires.txt
@@ -1,6 +1,9 @@
 playwright>=1.40.0
 pydantic>=2.0.0
 jsonschema>=4.0.0
+requests>=2.31.0
+playwright-stealth>=1.0.6
+markdownify>=0.11.6
 
 [dev]
 pytest>=7.0.0