Provides detailed information about the content of the current Chrome tab, including the most relevant HTML elements that a user or agent might interact with. Contains reliable CSS selectors for use with other Chrome tools.
This endpoint is particularly useful for AI agents that need to understand the structure and content of a web page in order to interact with it effectively. The information returned includes a list of the most relevant HTML elements on the page, along with their CSS selectors, XPaths, and other attributes.
Token Usage: Each invocation of this endpoint consumes 25 Smooth Operator API tokens.
chrome_click_element
and chrome_simulate_input
.
This endpoint requires no parameters. Simply send an empty JSON object.
{}
The response includes detailed information about the current Chrome tab and its content.
Field | Type | Description |
---|---|---|
chromeInstances | Array | List of Chrome instances currently running |
currentChromeTabMostRelevantElements | Array | List of the most relevant HTML elements on the current page that a user might interact with |
currentTabTitle | String | Title of the current tab |
currentTabIndex | Integer | Index of the current tab |
note | String | Additional information or notes about the current tab state |
Each element in the currentChromeTabMostRelevantElements
array contains:
Field | Type | Description |
---|---|---|
elementType | String | The HTML element type (e.g., "input", "button", "a") |
innerText | String | The text content of the element |
cssSelector | String | A reliable CSS selector that can be used to uniquely identify this element |
xpath | String | XPath expression to identify the element |
attributes | Object | Dictionary of element attributes like id, class, href, etc. |
{
"chromeInstances": [
{
"id": "chrome-1",
"title": "Google Chrome",
"tabs": [
{
"id": "tab-1",
"title": "Google - Google Chrome",
"url": "https://www.google.com/"
}
]
}
],
"currentChromeTabMostRelevantElements": [
{
"elementType": "input",
"innerText": "",
"cssSelector": "input[name='q']",
"xpath": "//input[@name='q']",
"attributes": {
"name": "q",
"type": "text",
"maxlength": "2048",
"class": "gLFyf"
}
},
{
"elementType": "button",
"innerText": "Google Search",
"cssSelector": "input[name='btnK']",
"xpath": "//input[@name='btnK']",
"attributes": {
"name": "btnK",
"type": "submit",
"value": "Google Search"
}
}
],
"currentTabTitle": "Google",
"currentTabIndex": 0,
"note": "Google search page with search input and buttons"
}
This endpoint is particularly useful for:
import requests
import json
def explain_current_chrome_tab(api_key):
"""
Get detailed information about the current Chrome tab including relevant HTML elements
Args:
api_key (str): Your API key for authentication
Returns:
dict: Detailed information about the current Chrome tab
"""
endpoint = "http://localhost:54321/tools-api/chrome/current-tab/explain"
headers = {
"Content-Type": "application/json",
"Authorization": f"Bearer {api_key}"
}
response = requests.post(endpoint, headers=headers, data=json.dumps({}))
return response.json()
# Example usage
api_key = "your_api_key_here"
# First open Chrome
# ... (code to open Chrome)
# Then get tab details
tab_details = explain_current_chrome_tab(api_key)
# Use the information to interact with elements
if tab_details and "currentChromeTabMostRelevantElements" in tab_details:
elements = tab_details["currentChromeTabMostRelevantElements"]
# Find a search input if it exists
search_input = next((e for e in elements if e["elementType"] == "input" and
("search" in e.get("attributes", {}).get("name", "").lower() or
"q" == e.get("attributes", {}).get("name", ""))), None)
if search_input:
print(f"Found search input with selector: {search_input['cssSelector']}")
# Now you can use this selector with chrome_simulate_input
else:
print("No search input found on page")
using System;
using System.Net.Http;
using System.Net.Http.Headers;
using System.Text;
using System.Text.Json;
using System.Threading.Tasks;
public class ChromeTabDetails
{
public ChromeOverview[] chromeInstances { get; set; }
public ChromeElementInfo[] currentChromeTabMostRelevantElements { get; set; }
public string currentTabTitle { get; set; }
public int currentTabIndex { get; set; }
public string note { get; set; }
}
public class ChromeOverview
{
public string id { get; set; }
public string title { get; set; }
public ChromeTab[] tabs { get; set; }
}
public class ChromeTab
{
public string id { get; set; }
public string title { get; set; }
public string url { get; set; }
}
public class ChromeElementInfo
{
public string elementType { get; set; }
public string innerText { get; set; }
public string cssSelector { get; set; }
public string xpath { get; set; }
public Dictionary attributes { get; set; }
}
public class ToolsServerClient
{
private readonly HttpClient _httpClient;
public ToolsServerClient(string apiKey)
{
_httpClient = new HttpClient();
_httpClient.BaseAddress = new Uri("http://localhost:54321/");
_httpClient.DefaultRequestHeaders.Accept.Clear();
_httpClient.DefaultRequestHeaders.Accept.Add(new MediaTypeWithQualityHeaderValue("application/json"));
_httpClient.DefaultRequestHeaders.Authorization = new AuthenticationHeaderValue("Bearer", apiKey);
}
public async Task ExplainCurrentChromeTabAsync()
{
var content = new StringContent("{}", Encoding.UTF8, "application/json");
var response = await _httpClient.PostAsync("tools-api/chrome/current-tab/explain", content);
response.EnsureSuccessStatusCode();
var responseString = await response.Content.ReadAsStringAsync();
return JsonSerializer.Deserialize(responseString);
}
}
// Example usage
class Program
{
static async Task Main()
{
var client = new ToolsServerClient("your_api_key_here");
// First open Chrome
// ... (code to open Chrome)
// Then get tab details
var tabDetails = await client.ExplainCurrentChromeTabAsync();
// Use the information to interact with elements
if (tabDetails?.currentChromeTabMostRelevantElements != null)
{
var searchInput = tabDetails.currentChromeTabMostRelevantElements
.FirstOrDefault(e => e.elementType == "input" &&
(e.attributes?.ContainsKey("name") == true &&
(e.attributes["name"].ToLower().Contains("search") || e.attributes["name"] == "q")));
if (searchInput != null)
{
Console.WriteLine($"Found search input with selector: {searchInput.cssSelector}");
// Now you can use this selector with chrome_simulate_input
}
else
{
Console.WriteLine("No search input found on page");
}
}
}
}
interface ChromeTab {
id: string;
title: string;
url: string;
}
interface ChromeOverview {
id: string;
title: string;
tabs: ChromeTab[];
}
interface ChromeElementInfo {
elementType: string;
innerText: string;
cssSelector: string;
xpath: string;
attributes: Record;
}
interface ChromeTabDetails {
chromeInstances: ChromeOverview[];
currentChromeTabMostRelevantElements: ChromeElementInfo[];
currentTabTitle: string;
currentTabIndex: number;
note: string;
}
/**
* Gets detailed information about the current Chrome tab
* @param apiKey Your API key for authentication
* @returns Promise with the Chrome tab details
*/
async function explainCurrentChromeTab(apiKey: string): Promise {
const endpoint = "http://localhost:54321/tools-api/chrome/current-tab/explain";
const response = await fetch(endpoint, {
method: "POST",
headers: {
"Content-Type": "application/json",
"Authorization": `Bearer ${apiKey}`
},
body: JSON.stringify({})
});
if (!response.ok) {
throw new Error(`HTTP error! Status: ${response.status}`);
}
return await response.json() as ChromeTabDetails;
}
// Example usage
const apiKey = "your_api_key_here";
// First open Chrome
// ... (code to open Chrome)
// Then get tab details
explainCurrentChromeTab(apiKey)
.then(tabDetails => {
// Use the information to interact with elements
const elements = tabDetails.currentChromeTabMostRelevantElements;
// Find a search input if it exists
const searchInput = elements.find(e =>
e.elementType === "input" &&
(e.attributes?.name?.toLowerCase().includes("search") || e.attributes?.name === "q")
);
if (searchInput) {
console.log(`Found search input with selector: ${searchInput.cssSelector}`);
// Now you can use this selector with chrome_simulate_input
} else {
console.log("No search input found on page");
}
})
.catch(error => console.error("Error:", error));