WebActive
Webpage Reader
Fetch and extract clean, readable text from any URL. Full JavaScript rendering via Playwright — works on SPAs and dynamic sites. Returns the final url, title, text (cleaned content, truncated to max_chars; default 8000), word_count, and fetched_at, plus an optional description, http_status, and — when include_links is true — a links array. Ideal for web research, content summarization, or feeding page content to an LLM.
Input Schema
{
"type": "object",
"required": [
"url"
],
"properties": {
"url": {
"type": "string",
"format": "uri",
"description": "The URL to read and extract content from"
},
"include_links": {
"type": "boolean",
"default": false,
"description": "If true, include up to 50 links found on the page"
},
"max_chars": {
"type": "integer",
"default": 8000,
"description": "Maximum number of characters of text to return; longer text is truncated and marked with an ellipsis (…)"
}
}
}
Output Schema
{
"type": "object",
"required": [
"url",
"title",
"text",
"word_count",
"fetched_at"
],
"properties": {
"url": {
"type": "string",
"description": "Final URL after any redirects"
},
"title": {
"type": "string",
"description": "Page title (from the <title> tag)"
},
"description": {
"type": "string",
"description": "Meta description or Open Graph description"
},
"text": {
"type": "string",
"description": "Clean readable text extracted from the page body (scripts, styles, nav, footer removed)"
},
"word_count": {
"type": "integer",
"description": "Approximate number of words in the extracted text"
},
"links": {
"type": "array",
"description": "Links found on the page (only when include_links=true)",
"items": {
"type": "object",
"properties": {
"href": {
"type": "string",
"description": "Absolute URL of the link"
},
"text": {
"type": "string",
"description": "Visible link text"
}
}
}
},
"fetched_at": {
"type": "string",
"format": "date-time",
"description": "ISO 8601 timestamp of when the page was fetched"
},
"http_status": {
"type": "integer",
"description": "HTTP status code of the page response"
}
},
"example": {
"url": "https://example.com",
"title": "Example Domain",
"description": "This domain is for use in illustrative examples in documents.",
"text": "Example Domain\n\nThis domain is for use in illustrative examples in documents. You may use this domain in literature without prior coordination or asking for permission.\n\nMore information...",
"word_count": 34,
"fetched_at": "2026-04-07T12:00:00.000Z",
"http_status": 200
}
}