Explain Current Chrome Tab

POST
/tools-api/chrome/current-tab/explain

Provides detailed information about the content of the current Chrome tab, including the most relevant HTML elements that a user or agent might interact with. Contains reliable CSS selectors for use with other Chrome tools.

This endpoint is particularly useful for AI agents that need to understand the structure and content of a web page in order to interact with it effectively. The information returned includes a list of the most relevant HTML elements on the page, along with their CSS selectors, XPaths, and other attributes.

Token Usage: Each invocation of this endpoint consumes 25 Smooth Operator API tokens.

Best Practice: Always call this endpoint before performing other Chrome actions to identify the most appropriate elements to interact with. The CSS selectors provided are highly reliable for use with other Chrome endpoints like chrome_click_element and chrome_simulate_input.

Request Format

This endpoint requires no parameters. Simply send an empty JSON object.

{}

Response Format

The response includes detailed information about the current Chrome tab and its content.

Response Object Structure

Field Type Description
chromeInstances Array List of Chrome instances currently running
currentChromeTabMostRelevantElements Array List of the most relevant HTML elements on the current page that a user might interact with
currentTabTitle String Title of the current tab
currentTabIndex Integer Index of the current tab
note String Additional information or notes about the current tab state

Element Object Structure

Each element in the currentChromeTabMostRelevantElements array contains:

Field Type Description
elementType String The HTML element type (e.g., "input", "button", "a")
innerText String The text content of the element
cssSelector String A reliable CSS selector that can be used to uniquely identify this element
xpath String XPath expression to identify the element
attributes Object Dictionary of element attributes like id, class, href, etc.

Example Response

{
  "chromeInstances": [
    {
      "id": "chrome-1",
      "title": "Google Chrome",
      "tabs": [
        {
          "id": "tab-1",
          "title": "Google - Google Chrome",
          "url": "https://www.google.com/"
        }
      ]
    }
  ],
  "currentChromeTabMostRelevantElements": [
    {
      "elementType": "input",
      "innerText": "",
      "cssSelector": "input[name='q']",
      "xpath": "//input[@name='q']",
      "attributes": {
        "name": "q",
        "type": "text",
        "maxlength": "2048",
        "class": "gLFyf"
      }
    },
    {
      "elementType": "button",
      "innerText": "Google Search",
      "cssSelector": "input[name='btnK']",
      "xpath": "//input[@name='btnK']",
      "attributes": {
        "name": "btnK",
        "type": "submit",
        "value": "Google Search"
      }
    }
  ],
  "currentTabTitle": "Google",
  "currentTabIndex": 0,
  "note": "Google search page with search input and buttons"
}
Note: All JSON keys in the response are in camelCase format (e.g., "currentChromeTabMostRelevantElements", "elementType", "cssSelector").

Use Cases

This endpoint is particularly useful for:

Code Examples

import requests
import json

def explain_current_chrome_tab(api_key):
    """
    Get detailed information about the current Chrome tab including relevant HTML elements
    
    Args:
        api_key (str): Your API key for authentication
    
    Returns:
        dict: Detailed information about the current Chrome tab
    """
    endpoint = "http://localhost:54321/tools-api/chrome/current-tab/explain"
    
    headers = {
        "Content-Type": "application/json",
        "Authorization": f"Bearer {api_key}"
    }
    
    response = requests.post(endpoint, headers=headers, data=json.dumps({}))
    return response.json()

# Example usage
api_key = "your_api_key_here"

# First open Chrome
# ... (code to open Chrome)

# Then get tab details
tab_details = explain_current_chrome_tab(api_key)

# Use the information to interact with elements
if tab_details and "currentChromeTabMostRelevantElements" in tab_details:
    elements = tab_details["currentChromeTabMostRelevantElements"]
    
    # Find a search input if it exists
    search_input = next((e for e in elements if e["elementType"] == "input" and 
                         ("search" in e.get("attributes", {}).get("name", "").lower() or 
                          "q" == e.get("attributes", {}).get("name", ""))), None)
    
    if search_input:
        print(f"Found search input with selector: {search_input['cssSelector']}")
        # Now you can use this selector with chrome_simulate_input
    else:
        print("No search input found on page")
using System;
using System.Net.Http;
using System.Net.Http.Headers;
using System.Text;
using System.Text.Json;
using System.Threading.Tasks;

public class ChromeTabDetails
{
    public ChromeOverview[] chromeInstances { get; set; }
    public ChromeElementInfo[] currentChromeTabMostRelevantElements { get; set; }
    public string currentTabTitle { get; set; }
    public int currentTabIndex { get; set; }
    public string note { get; set; }
}

public class ChromeOverview
{
    public string id { get; set; }
    public string title { get; set; }
    public ChromeTab[] tabs { get; set; }
}

public class ChromeTab
{
    public string id { get; set; }
    public string title { get; set; }
    public string url { get; set; }
}

public class ChromeElementInfo
{
    public string elementType { get; set; }
    public string innerText { get; set; }
    public string cssSelector { get; set; }
    public string xpath { get; set; }
    public Dictionary attributes { get; set; }
}

public class ToolsServerClient
{
    private readonly HttpClient _httpClient;
    
    public ToolsServerClient(string apiKey)
    {
        _httpClient = new HttpClient();
        _httpClient.BaseAddress = new Uri("http://localhost:54321/");
        _httpClient.DefaultRequestHeaders.Accept.Clear();
        _httpClient.DefaultRequestHeaders.Accept.Add(new MediaTypeWithQualityHeaderValue("application/json"));
        _httpClient.DefaultRequestHeaders.Authorization = new AuthenticationHeaderValue("Bearer", apiKey);
    }
    
    public async Task ExplainCurrentChromeTabAsync()
    {
        var content = new StringContent("{}", Encoding.UTF8, "application/json");
        
        var response = await _httpClient.PostAsync("tools-api/chrome/current-tab/explain", content);
        response.EnsureSuccessStatusCode();
        
        var responseString = await response.Content.ReadAsStringAsync();
        return JsonSerializer.Deserialize(responseString);
    }
}

// Example usage
class Program
{
    static async Task Main()
    {
        var client = new ToolsServerClient("your_api_key_here");
        
        // First open Chrome
        // ... (code to open Chrome)
        
        // Then get tab details
        var tabDetails = await client.ExplainCurrentChromeTabAsync();
        
        // Use the information to interact with elements
        if (tabDetails?.currentChromeTabMostRelevantElements != null)
        {
            var searchInput = tabDetails.currentChromeTabMostRelevantElements
                .FirstOrDefault(e => e.elementType == "input" && 
                    (e.attributes?.ContainsKey("name") == true && 
                     (e.attributes["name"].ToLower().Contains("search") || e.attributes["name"] == "q")));
            
            if (searchInput != null)
            {
                Console.WriteLine($"Found search input with selector: {searchInput.cssSelector}");
                // Now you can use this selector with chrome_simulate_input
            }
            else
            {
                Console.WriteLine("No search input found on page");
            }
        }
    }
}
interface ChromeTab {
  id: string;
  title: string;
  url: string;
}

interface ChromeOverview {
  id: string;
  title: string;
  tabs: ChromeTab[];
}

interface ChromeElementInfo {
  elementType: string;
  innerText: string;
  cssSelector: string;
  xpath: string;
  attributes: Record;
}

interface ChromeTabDetails {
  chromeInstances: ChromeOverview[];
  currentChromeTabMostRelevantElements: ChromeElementInfo[];
  currentTabTitle: string;
  currentTabIndex: number;
  note: string;
}

/**
 * Gets detailed information about the current Chrome tab
 * @param apiKey Your API key for authentication
 * @returns Promise with the Chrome tab details
 */
async function explainCurrentChromeTab(apiKey: string): Promise {
  const endpoint = "http://localhost:54321/tools-api/chrome/current-tab/explain";
  
  const response = await fetch(endpoint, {
    method: "POST",
    headers: {
      "Content-Type": "application/json",
      "Authorization": `Bearer ${apiKey}`
    },
    body: JSON.stringify({})
  });
  
  if (!response.ok) {
    throw new Error(`HTTP error! Status: ${response.status}`);
  }
  
  return await response.json() as ChromeTabDetails;
}

// Example usage
const apiKey = "your_api_key_here";

// First open Chrome
// ... (code to open Chrome)

// Then get tab details
explainCurrentChromeTab(apiKey)
  .then(tabDetails => {
    // Use the information to interact with elements
    const elements = tabDetails.currentChromeTabMostRelevantElements;
    
    // Find a search input if it exists
    const searchInput = elements.find(e => 
      e.elementType === "input" && 
      (e.attributes?.name?.toLowerCase().includes("search") || e.attributes?.name === "q")
    );
    
    if (searchInput) {
      console.log(`Found search input with selector: ${searchInput.cssSelector}`);
      // Now you can use this selector with chrome_simulate_input
    } else {
      console.log("No search input found on page");
    }
  })
  .catch(error => console.error("Error:", error));

Related Endpoints