jigsawstack/ai-scrape 📝🔢 → 📝

▶️ 23 runs 📅 Jun 2025 ⚙️ Cog 0.15.8
data-extraction document-to-json web-scraping

About

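Scrape a web page with AI: provide a URL (or raw HTML) and describe the elements you want in plain language (e.g. 'Plan price, Plan title'), and get back the matching content, the CSS selectors that locate it, and the page's links as JSON.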

Example Output

Output

{
"page_position": 1,
"page_position_length": 21,
"context": {
"Title": [
"vOCR",
"API Documentation",
"Core AI",
"Translate",
"Data",
"Web Scrape",
"Web Search",
"Prompt Engine",
"Vision",
"Speech to Text",
"Text to Speech",
"Validate",
"File Store"
]
},
"selectors": {
"Title": [
"#page-title",
"h1#page-title",
"header#header h1",
".sidebar-group-header h5",
"h5#sidebar-title"
]
},
"link": [
{
"href": "https://jigsawstack.com/",
"text": "JigsawStack home page",
"type": "a"
},
{
"href": "https://jigsawstack.com/docs/introduction",
"text": "Documentation",
"type": "a"
},
{
"href": "https://jigsawstack.com/docs/api-reference/authentication",
"text": "API Reference",
"type": "a"
},
{
"href": "https://jigsawstack.com/docs/api-reference/authentication",
"text": "Authentication",
"type": "a"
},
{
"href": "https://jigsawstack.com/docs/api-reference/error",
"text": "Errors",
"type": "a"
},
{
"href": "https://jigsawstack.com/docs/api-reference/ai/sentiment",
"text": "POSTSentiment",
"type": "a"
},
{
"href": "https://jigsawstack.com/docs/api-reference/ai/summary",
"text": "POSTSummary",
"type": "a"
},
{
"href": "https://jigsawstack.com/docs/api-reference/ai/image-generation",
"text": "POSTImage Generation",
"type": "a"
},
{
"href": "https://jigsawstack.com/docs/api-reference/ai/translate/translate",
"text": "POSTText Translate",
"type": "a"
},
{
"href": "https://jigsawstack.com/docs/api-reference/ai/translate/image-translate",
"text": "POSTImage Translate",
"type": "a"
},
{
"href": "https://jigsawstack.com/docs/api-reference/ai/embedding",
"text": "POSTEmbedding",
"type": "a"
},
{
"href": "https://jigsawstack.com/docs/api-reference/ai/prediction",
"text": "POSTPrediction",
"type": "a"
},
{
"href": "https://jigsawstack.com/docs/api-reference/ai/text-to-sql",
"text": "POSTText to SQL",
"type": "a"
},
{
"href": "https://jigsawstack.com/docs/api-reference/ai/scrape",
"text": "POSTAI Scraper",
"type": "a"
},
{
"href": "https://jigsawstack.com/docs/api-reference/web/html-to-any",
"text": "POSTHTML To Any",
"type": "a"
},
{
"href": "https://jigsawstack.com/docs/api-reference/web/ai-search",
"text": "POSTAI Search",
"type": "a"
},
{
"href": "https://jigsawstack.com/docs/api-reference/web/search-suggestion",
"text": "GETSearch Suggestion",
"type": "a"
},
{
"href": "https://jigsawstack.com/docs/api-reference/prompt-engine/create",
"text": "POSTCreate Prompt",
"type": "a"
},
{
"href": "https://jigsawstack.com/docs/api-reference/prompt-engine/run",
"text": "POSTRun Prompt",
"type": "a"
},
{
"href": "https://jigsawstack.com/docs/api-reference/prompt-engine/retrieve",
"text": "GETGet Prompt",
"type": "a"
},
{
"href": "https://jigsawstack.com/docs/api-reference/prompt-engine/list",
"text": "GETList Prompts",
"type": "a"
},
{
"href": "https://jigsawstack.com/docs/api-reference/prompt-engine/delete",
"text": "DELDelete a Prompt",
"type": "a"
},
{
"href": "https://jigsawstack.com/docs/api-reference/prompt-engine/run-direct",
"text": "POSTRun Prompt Direct",
"type": "a"
},
{
"href": "https://jigsawstack.com/docs/api-reference/ai/vocr",
"text": "POSTvOCR",
"type": "a"
},
{
"href": "https://jigsawstack.com/docs/api-reference/ai/object-detection",
"text": "POSTObject Detection",
"type": "a"
},
{
"href": "https://jigsawstack.com/docs/api-reference/ai/speech-to-text",
"text": "POSTSpeech to Text",
"type": "a"
},
{
"href": "https://jigsawstack.com/docs/api-reference/audio/tts/text-to-speech",
"text": "POSTText to Speech",
"type": "a"
},
{
"href": "https://jigsawstack.com/docs/api-reference/audio/tts/create-clone",
"text": "POSTCreate Voice Clone",
"type": "a"
},
{
"href": "https://jigsawstack.com/docs/api-reference/audio/tts/list-clones",
"text": "GETList Voice Clones",
"type": "a"
},
{
"href": "https://jigsawstack.com/docs/api-reference/audio/tts/delete-clone",
"text": "DELDelete Voice Clone",
"type": "a"
},
{
"href": "https://jigsawstack.com/docs/api-reference/validate/nsfw",
"text": "POSTNSFW",
"type": "a"
},
{
"href": "https://jigsawstack.com/docs/api-reference/validate/profanity",
"text": "POSTProfanity",
"type": "a"
},
{
"href": "https://jigsawstack.com/docs/api-reference/validate/spellcheck",
"text": "POSTSpell Check",
"type": "a"
},
{
"href": "https://jigsawstack.com/docs/api-reference/ai/spam-check",
"text": "POSTSpam Check",
"type": "a"
},
{
"href": "https://jigsawstack.com/docs/api-reference/store/file/add",
"text": "POSTUpload",
"type": "a"
},
{
"href": "https://jigsawstack.com/docs/api-reference/store/file/get",
"text": "GETRetrieve",
"type": "a"
},
{
"href": "https://jigsawstack.com/docs/api-reference/store/file/delete",
"text": "DELDelete",
"type": "a"
},
{
"href": "https://jigsawstack.com/help",
"text": "Support",
"type": "a"
},
{
"href": "https://jigsawstack.com/dashboard",
"text": "Dashboard",
"type": "a"
},
{
"href": "https://jigsawstack.com/",
"text": "JigsawStack home page",
"type": "a"
},
{
"href": "https://jigsawstack.com/help",
"text": "Support",
"type": "a"
},
{
"href": "https://jigsawstack.com/dashboard",
"text": "Dashboard",
"type": "a"
},
{
"href": "https://jigsawstack.com/dashboard",
"text": "Dashboard",
"type": "a"
},
{
"href": "https://jigsawstack.com/#body",
"text": "\u200b",
"type": "a"
},
{
"href": "https://jigsawstack.com/#param-prompt",
"text": "\u200b",
"type": "a"
},
{
"href": "https://jigsawstack.com/#param-url",
"text": "\u200b",
"type": "a"
},
{
"href": "https://jigsawstack.com/#param-file-store-key",
"text": "\u200b",
"type": "a"
},
{
"href": "https://jigsawstack.com/docs/api-reference/store/file/add",
"text": "Storage",
"type": "a"
},
{
"href": "https://jigsawstack.com/#param-page-range",
"text": "\u200b",
"type": "a"
},
{
"href": "https://jigsawstack.com/#prompt-example",
"text": "\u200b",
"type": "a"
},
{
"href": "https://jigsawstack.com/#header",
"text": "\u200b",
"type": "a"
},
{
"href": "https://jigsawstack.com/#param-x-api-key",
"text": "\u200b",
"type": "a"
},
{
"href": "https://jigsawstack.com/#response",
"text": "\u200b",
"type": "a"
},
{
"href": "https://jigsawstack.com/#param-success",
"text": "\u200b",
"type": "a"
},
{
"href": "https://github.com/jigsawstack/docs/edit/main/docs/api-reference/ai/vocr.mdx",
"text": "Suggest edits",
"type": "a"
},
{
"href": "https://github.com/jigsawstack/docs/issues/new?title=Issue on docs&body=Path: /docs/api-reference/ai/vocr",
"text": "Raise issue",
"type": "a"
},
{
"href": "https://jigsawstack.com/docs/api-reference/prompt-engine/run-direct",
"text": "Previous",
"type": "a"
},
{
"href": "https://jigsawstack.com/docs/api-reference/ai/object-detection",
"text": "Object DetectionRecognise objects within an image with great accuracy.Next",
"type": "a"
},
{
"href": "https://twitter.com/jigsawstack",
"text": "twitter",
"type": "a"
},
{
"href": "https://github.com/jigsawstack",
"text": "github",
"type": "a"
},
{
"href": "https://www.linkedin.com/company/jigsawstack",
"text": "linkedin",
"type": "a"
},
{
"href": "https://jigsawstack.com/discord",
"text": "discord",
"type": "a"
},
{
"href": "https://mintlify.com/preview-request?utm_campaign=poweredBy&utm_medium=referral&utm_source=jigsaw-13",
"text": "Powered by Mintlify",
"type": "a"
},
{
"href": "https://mintlify.s3.us-west-1.amazonaws.com/jigsaw-13/logo/logo.svg",
"text": "light logo",
"type": "img"
},
{
"href": "https://mintlify.s3.us-west-1.amazonaws.com/jigsaw-13/logo/logo.svg",
"text": "dark logo",
"type": "img"
},
{
"href": "https://mintlify.s3.us-west-1.amazonaws.com/jigsaw-13/logo/logo.svg",
"text": "light logo",
"type": "img"
},
{
"href": "https://mintlify.s3.us-west-1.amazonaws.com/jigsaw-13/logo/logo.svg",
"text": "dark logo",
"type": "img"
}
],
"data": [
{
"selector": "#page-title",
"results": [
{
"html": "vOCR",
"text": "vOCR",
"attributes": [
{
"name": "id",
"value": "page-title"
},
{
"name": "class",
"value": "inline-block text-2xl sm:text-3xl text-gray-900 tracking-tight dark:text-gray-200 font-semibold"
}
]
}
],
"key": "Title"
},
{
"selector": "h1#page-title",
"results": [
{
"html": "vOCR",
"text": "vOCR",
"attributes": [
{
"name": "id",
"value": "page-title"
},
{
"name": "class",
"value": "inline-block text-2xl sm:text-3xl text-gray-900 tracking-tight dark:text-gray-200 font-semibold"
}
]
}
],
"key": "Title"
},
{
"selector": "header#header h1",
"results": [
{
"html": "vOCR",
"text": "vOCR",
"attributes": [
{
"name": "id",
"value": "page-title"
},
{
"name": "class",
"value": "inline-block text-2xl sm:text-3xl text-gray-900 tracking-tight dark:text-gray-200 font-semibold"
}
]
}
],
"key": "Title"
},
{
"selector": ".sidebar-group-header h5",
"results": [
{
"html": "API Documentation",
"text": "API Documentation",
"attributes": [
{
"name": "id",
"value": "sidebar-title"
}
]
},
{
"html": "Core AI",
"text": "Core AI",
"attributes": [
{
"name": "id",
"value": "sidebar-title"
}
]
},
{
"html": "Translate",
"text": "Translate",
"attributes": [
{
"name": "id",
"value": "sidebar-title"
}
]
},
{
"html": "Data",
"text": "Data",
"attributes": [
{
"name": "id",
"value": "sidebar-title"
}
]
},
{
"html": "Web Scrape",
"text": "Web Scrape",
"attributes": [
{
"name": "id",
"value": "sidebar-title"
}
]
},
{
"html": "Web Search",
"text": "Web Search",
"attributes": [
{
"name": "id",
"value": "sidebar-title"
}
]
},
{
"html": "Prompt Engine",
"text": "Prompt Engine",
"attributes": [
{
"name": "id",
"value": "sidebar-title"
}
]
},
{
"html": "Vision",
"text": "Vision",
"attributes": [
{
"name": "id",
"value": "sidebar-title"
}
]
},
{
"html": "Speech to Text",
"text": "Speech to Text",
"attributes": [
{
"name": "id",
"value": "sidebar-title"
}
]
},
{
"html": "Text to Speech",
"text": "Text to Speech",
"attributes": [
{
"name": "id",
"value": "sidebar-title"
}
]
},
{
"html": "Validate",
"text": "Validate",
"attributes": [
{
"name": "id",
"value": "sidebar-title"
}
]
},
{
"html": "File Store",
"text": "File Store",
"attributes": [
{
"name": "id",
"value": "sidebar-title"
}
]
}
],
"key": "Title"
},
{
"selector": "h5#sidebar-title",
"results": [
{
"html": "API Documentation",
"text": "API Documentation",
"attributes": [
{
"name": "id",
"value": "sidebar-title"
}
]
},
{
"html": "Core AI",
"text": "Core AI",
"attributes": [
{
"name": "id",
"value": "sidebar-title"
}
]
},
{
"html": "Translate",
"text": "Translate",
"attributes": [
{
"name": "id",
"value": "sidebar-title"
}
]
},
{
"html": "Data",
"text": "Data",
"attributes": [
{
"name": "id",
"value": "sidebar-title"
}
]
},
{
"html": "Web Scrape",
"text": "Web Scrape",
"attributes": [
{
"name": "id",
"value": "sidebar-title"
}
]
},
{
"html": "Web Search",
"text": "Web Search",
"attributes": [
{
"name": "id",
"value": "sidebar-title"
}
]
},
{
"html": "Prompt Engine",
"text": "Prompt Engine",
"attributes": [
{
"name": "id",
"value": "sidebar-title"
}
]
},
{
"html": "Vision",
"text": "Vision",
"attributes": [
{
"name": "id",
"value": "sidebar-title"
}
]
},
{
"html": "Speech to Text",
"text": "Speech to Text",
"attributes": [
{
"name": "id",
"value": "sidebar-title"
}
]
},
{
"html": "Text to Speech",
"text": "Text to Speech",
"attributes": [
{
"name": "id",
"value": "sidebar-title"
}
]
},
{
"html": "Validate",
"text": "Validate",
"attributes": [
{
"name": "id",
"value": "sidebar-title"
}
]
},
{
"html": "File Store",
"text": "File Store",
"attributes": [
{
"name": "id",
"value": "sidebar-title"
}
]
}
],
"key": "Title"
}
],
"success": true,
"advance_config": {
"console": [],
"network": [],
"cookies": []
},
"_usage": {
"input_tokens": 49,
"output_tokens": 2566,
"inference_time_tokens": 108214,
"total_tokens": 110829
}
}

Performance Metrics

108.34s Prediction Time
108.35s Total Time
All Input Parameters
{
  "url": "https://jigsawstack.com/docs/api-reference/ai/vocr?slug=docs&slug=api-reference&slug=ai&slug=vocr",
  "html": "",
  "api_key": "<YOUR_JIGSAWSTACK_API_KEY>",
  "page_position": 1,
  "element_prompts": "Title",
  "root_element_selector": "main"
}
Input Parameters
url Type: string, Default: (empty string)
URL of the page to scrape
html Type: string, Default: (empty string)
HTML content to scrape (alternative to URL)
api_key Type: string
🔐 Your JigsawStack API Key (required)
page_position Type: integer, Default: 1
Page number for pagination (minimum: 1)
element_prompts Type: string, Default: (empty string)
Comma-separated list of elements to scrape (max 5). E.g. 'Plan price, Plan title'
root_element_selector Type: string, Default: main
CSS selector to limit scraping scope
Output Schema

Output

Type: string

Version Details
Version ID
1f2b4096ba192701c994075d4a7652c8071e86cc76bd9458d6bb3c8c22ff32c6
Version Created
June 24, 2025
Run on Replicate →