Commit 5b0086f

chore: Reshuffle tool setup (#40)

* chore: move targets around and make transformResponse required
* Remove 'parsed' from tool names + add reddit tool
* add tools
1 parent 010b303 · commit 5b0086f

111 files changed: 11,342 additions & 437 deletions


.agents/AGENTS.md

Lines changed: 33 additions & 1 deletion

@@ -1 +1,33 @@
-When adding a new tool, make sure that it has tests and that its usage is documented in the readme.
+When a new target is added to Decodo utils, transform that target into a tool usable within the MCP server.
+
+# Generation
+
+- Make sure you actually see the target configuration from which we'll build the tool. Do not guess the tool setup.
+- You can find the target configuration in smartproxy-dashboard/repos/utils/scraping.
+- Make a new folder in `src/tools`.
+- Name the tool the same as the target name.
+- Add the target to an existing toolset. If none of the existing toolsets fit the target, either raise an issue or add the tool to the `web` toolset.
+
+# Parameters
+
+- Only add the top 7 parameters for each target. These will likely be `url`, `query`, `geo`, `locale` and `jsRender`.
+- For `url` and `query`, make sure to add an example of a correct input inside the description.
+- Make sure to map `jsRender` to `headless: "html"`.
+- Only set `parse: true` if the target actually supports parsing.
+- Never add the `output` parameter.
+- If a target has a `markdown` parameter, always set it to `true`.
+- If both `parse` and `markdown` are available as parameters, prefer `markdown: true`.
+
+# Testing
+
+- Add tests that check successful and unsuccessful tool calls.
+- After generating the tool, call the tool to actually test it.
+- When testing by calling the tool, prefer not to set the `jsRender` parameter.
+
+# Documentation
+
+- Update the readme with new tool, toolset and parameter information.
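The parameter rules above can be sketched as a small mapping step. This is an illustrative sketch only, not the server's actual implementation: the helper name `buildTargetPayload` and the `TargetSupport` shape are assumptions, while the `jsRender` → `headless: "html"` and `markdown`-over-`parse` rules come straight from the AGENTS.md text above.

```typescript
type ToolParams = {
  url?: string;
  query?: string;
  geo?: string;
  locale?: string;
  jsRender?: boolean;
};

// Hypothetical capability flags describing what a target supports.
type TargetSupport = { markdown?: boolean; parse?: boolean };

function buildTargetPayload(
  target: string,
  params: ToolParams,
  supports: TargetSupport,
): Record<string, unknown> {
  const payload: Record<string, unknown> = { target, ...params };
  if (params.jsRender) {
    // Rule: map `jsRender` to `headless: "html"`.
    payload.headless = 'html';
  }
  delete payload.jsRender;
  if (supports.markdown) {
    // Rule: if a target has a `markdown` parameter, always set it to `true`,
    // and prefer it over `parse` when both are available.
    payload.markdown = true;
  } else if (supports.parse) {
    // Rule: only set `parse: true` if the target actually supports parsing.
    payload.parse = true;
  }
  return payload;
}

const payload = buildTargetPayload(
  'reddit_post',
  { url: 'https://www.reddit.com/r/horseracing/comments/1nsrn3/', jsRender: true },
  { markdown: true, parse: true },
);
console.log(payload);
```

Note that the `output` parameter never appears in `ToolParams` at all, matching the "never add the `output` parameter" rule.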

.gitignore

Lines changed: 2 additions & 1 deletion

@@ -1,4 +1,5 @@
 node_modules
 build

-.env
+.env
+.vscode

README.md

Lines changed: 53 additions & 28 deletions

@@ -4,7 +4,6 @@
 [![Install MCP Server](https://cursor.com/deeplink/mcp-install-dark.svg)](https://cursor.com/en-US/install-mcp?name=Decodo&config=eyJ1cmwiOiJodHRwczovL21jcC5kZWNvZG8uY29tL21jcCIsImhlYWRlcnMiOnsiQXV0aG9yaXphdGlvbiI6IkJhc2ljIDx3ZWJfYWR2YW5jZWRfdG9rZW4%2BIn19)
 [![smithery badge](https://smithery.ai/badge/@Decodo/decodo-mcp-server)](https://smithery.ai/server/@Decodo/decodo-mcp-server)

-
 <p align="center">
 <a href="https://dashboard.decodo.com/integrations?utm_source=github&utm_medium=social&utm_campaign=mcp_server"> <img src="https://github.com/user-attachments/assets/a1e52a9e-3da1-4081-b3c6-053aafb8f196"/></a>
@@ -23,9 +22,11 @@ services, streamlining access to our tools and capabilities.

 ## Connecting to [Decodo's MCP server](https://mcp.decodo.com/mcp)

-1. Go to [decodo.com](https://decodo.com/scraping/web) and start a Web Scraping API plan (free trials available).
+1. Go to [decodo.com](https://decodo.com/scraping/web) and start a Web Scraping API plan (free
+   trials available).

-2. Once your plan has started, obtain a Web Scraping API basic authentication token from the [dashboard](https://dashboard.decodo.com/).
+2. Once your plan has started, obtain a Web Scraping API basic authentication token from the
+   [dashboard](https://dashboard.decodo.com/).

 3. Open your preferred MCP client and add the following configuration:
@@ -100,41 +101,65 @@ comma-separated list via the `toolsets` query parameter:

 When no toolsets are specified, all tools are registered.

-| Toolset        | Tools                              |
-| -------------- | ---------------------------------- |
-| `web`          | `scrape_as_markdown`, `screenshot` |
-| `search`       | `google_search_parsed`             |
-| `ecommerce`    | `amazon_search_parsed`             |
-| `social_media` | `reddit_post`, `reddit_subreddit`  |
-| `ai`           | `chatgpt`, `perplexity`            |
+| Toolset        | Tools |
+| -------------- | ----- |
+| `web`          | `scrape_as_markdown`, `screenshot` |
+| `search`       | `google_search`, `google_ads`, `google_lens`, `google_travel_hotels`, `bing_search` |
+| `ecommerce`    | `amazon_search`, `amazon_product`, `amazon_pricing`, `amazon_sellers`, `amazon_bestsellers`, `walmart_search`, `walmart_product`, `target_search`, `target_product`, `tiktok_shop_search`, `tiktok_shop_product`, `tiktok_shop_url` |
+| `social_media` | `reddit_post`, `reddit_subreddit`, `reddit_user`, `tiktok_post`, `youtube_video`, `youtube_metadata`, `youtube_channel`, `youtube_subtitles`, `youtube_search` |
+| `ai`           | `chatgpt`, `perplexity`, `google_ai_mode` |

 ## Tools

 The server exposes the following tools:

-| Tool | Description | Example prompt |
-| ---- | ----------- | -------------- |
-| `scrape_as_markdown` | Scrapes any target URL, expects a URL to be given via prompt. Returns results in Markdown. | Scrape peacock.com from a US IP address and tell me the pricing. |
-| `screenshot` | Captures a screenshot of any webpage and returns it as a PNG image. | Take a screenshot of github.com from a US IP address. |
-| `google_search_parsed` | Scrapes Google Search for a given query, and returns parsed results. | Scrape Google Search for shoes and tell me the top position. |
-| `amazon_search_parsed` | Scrapes Amazon Search for a given query, and returns parsed results. | Scrape Amazon Search for toothbrushes. |
-| `reddit_post` | Scrapes a specific Reddit post for a given query, and returns parsed results. | Scrape the following Reddit post: https://www.reddit.com/r/horseracing/comments/1nsrn3/ |
-| `reddit_subreddit` | Scrapes a specific Reddit subreddit for a given query, and returns parsed results. | Scrape the top 5 posts on r/Python this week. |
-| `chatgpt` | Search and interact with ChatGPT for AI-powered responses and conversations. | Ask ChatGPT to explain quantum computing in simple terms. |
-| `perplexity` | Search and interact with Perplexity for AI-powered responses and conversations. | Ask Perplexity what the latest trends in web development are. |
+| Tool | Description | Example prompt |
+| ---- | ----------- | -------------- |
+| `scrape_as_markdown` | Scrapes any target URL, expects a URL to be given via prompt. Returns results in Markdown. | Scrape peacock.com from a US IP address and tell me the pricing. |
+| `screenshot` | Captures a screenshot of any webpage and returns it as a PNG image. | Take a screenshot of github.com from a US IP address. |
+| `google_search` | Scrapes Google Search for a given query, and returns parsed results. | Scrape Google Search for shoes and tell me the top position. |
+| `google_ads` | Scrapes Google Ads search results with automatic parsing. | Scrape Google Ads for laptop and show me the top ads. |
+| `google_lens` | Scrapes Google Lens image search results with automatic parsing. | Search Google Lens for this image: https://example.com/image.jpg |
+| `google_ai_mode` | Scrapes Google AI Mode (Search with AI) results with automatic parsing. | Ask Google AI Mode: What are the top three dog breeds? |
+| `google_travel_hotels` | Scrapes Google Travel Hotels search results. | Search Google Travel Hotels for hotels in Paris. |
+| `amazon_search` | Scrapes Amazon Search for a given query, and returns parsed results. | Scrape Amazon Search for wireless keyboard. |
+| `amazon_product` | Scrapes Amazon Product page with automatic parsing. | Scrape Amazon product B09H74FXNW and show me the details. |
+| `amazon_pricing` | Scrapes Amazon Product pricing information with automatic parsing. | Get pricing for Amazon product B09H74FXNW. |
+| `amazon_sellers` | Scrapes Amazon Seller information with automatic parsing. | Get information about Amazon seller A1R0Z7FJGTKESH. |
+| `amazon_bestsellers` | Scrapes Amazon Bestsellers list with automatic parsing. | Show me Amazon bestsellers in electronics. |
+| `walmart_search` | Scrapes Walmart Search for a given query, and returns parsed results. | Scrape Walmart Search for camping tent. |
+| `walmart_product` | Scrapes Walmart Product page with automatic parsing. | Scrape Walmart product 15296401808. |
+| `target_search` | Scrapes Target Search for a given query, and returns parsed results. | Scrape Target Search for kitchen appliances. |
+| `target_product` | Scrapes Target Product page with automatic parsing. | Scrape Target product 92186007. |
+| `tiktok_post` | Scrapes a TikTok post URL for structured data (e.g. engagement, caption, hashtags). | Scrape this TikTok post: https://www.tiktok.com/@nba/video/7393013274725403950 |
+| `tiktok_shop_search` | Scrapes TikTok Shop Search for a given query, and returns parsed results. | Scrape TikTok Shop Search for phone cases. |
+| `tiktok_shop_product` | Scrapes TikTok Shop Product page. | Scrape TikTok Shop product 1731541214379741272. |
+| `tiktok_shop_url` | Scrapes TikTok Shop page by URL. | Scrape this TikTok Shop URL: https://www.tiktok.com/shop/s?q=HEADPHONES |
+| `youtube_video` | Scrapes YouTube video information. | Scrape YouTube video 6Ejga4kJUts. |
+| `youtube_metadata` | Scrapes YouTube video metadata. | Get metadata for YouTube video dFu9aKJoqGg. |
+| `youtube_channel` | Scrapes YouTube channel videos with automatic parsing. | Scrape YouTube channel @decodo_official. |
+| `youtube_subtitles` | Scrapes YouTube video subtitles. | Get subtitles for YouTube video L8zSWbQN-v8. |
+| `youtube_search` | Search YouTube videos. | Search YouTube for "How to care for chinchillas". |
+| `reddit_post` | Scrapes a specific Reddit post for a given query, and returns parsed results. | Scrape the following Reddit post: https://www.reddit.com/r/horseracing/comments/1nsrn3/ |
+| `reddit_subreddit` | Scrapes a specific Reddit subreddit for a given query, and returns parsed results. | Scrape the top 5 posts on r/Python this week. |
+| `reddit_user` | Scrapes a Reddit user profile and their posts or comments. | Scrape Reddit user u/spez's profile. |
+| `bing_search` | Scrapes Bing Search results with automatic parsing. | Search Bing for laptop reviews. |
+| `chatgpt` | Search and interact with ChatGPT for AI-powered responses and conversations. | Ask ChatGPT to explain quantum computing in simple terms. |
+| `perplexity` | Search and interact with Perplexity for AI-powered responses and conversations. | Ask Perplexity what the latest trends in web development are. |

 ## Parameters

 The following parameters are inferred from user prompts:

-| Parameter | Description |
-| --------- | ----------- |
-| `jsRender` | Renders target URL in a headless browser. |
-| `geo` | Sets the country from which the request will originate. |
-| `locale` | Sets the locale of the request. |
-| `tokenLimit` | Truncates the response content up to this limit. Useful if the context window is small. |
-| `prompt` | Prompt to send to AI tools (`chatgpt`, `perplexity`). |
-| `search` | Activates ChatGPT's web search functionality (`chatgpt` only). |
+| Parameter | Description |
+| --------- | ----------- |
+| `jsRender` | Renders target URL in a headless browser. |
+| `geo` | Sets the country from which the request will originate. |
+| `locale` | Sets the locale of the request. |
+| `tokenLimit` | Truncates the response content up to this limit. Useful if the context window is small. |
+| `prompt` | Prompt to send to AI tools (`chatgpt`, `perplexity`). |
+| `search` | Activates ChatGPT's web search functionality (`chatgpt` only). |
+| `xhr` | When true, includes XHR or fetch responses in the scrape result where supported (e.g. `tiktok_post`). |

 ## Examples
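The README's toolset selection (a comma-separated list via the `toolsets` query parameter) amounts to appending a simple query string to the MCP endpoint. A minimal sketch; restricting to `web` and `search` is just an example choice:

```typescript
// Selecting a subset of toolsets via the `toolsets` query parameter.
// When the parameter is omitted entirely, all tools are registered.
const toolsets = ['web', 'search'];
const endpoint = `https://mcp.decodo.com/mcp?toolsets=${toolsets.join(',')}`;
console.log(endpoint);
```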
eslint.config.mjs

Lines changed: 1 addition & 0 deletions

@@ -8,6 +8,7 @@ export default tseslint.config(
     files: ['src/**/*.ts'],
     rules: {
       'curly': ['error', 'all'],
+      'lines-between-class-members': ['error', 'always', { exceptAfterSingleLine: false }],
       'prefer-arrow-callback': 'error',
       'no-restricted-syntax': [
         'error',

jest.config.js

Lines changed: 6 additions & 0 deletions

@@ -8,4 +8,10 @@ module.exports = {
   transform: {
     ...tsJestTransformCfg,
   },
+  moduleNameMapper: {
+    "^types$": "<rootDir>/src/types",
+    "^utils$": "<rootDir>/src/utils",
+    "^server/(.*)$": "<rootDir>/src/server/$1",
+    "^clients/(.*)$": "<rootDir>/src/clients/$1",
+  },
 };
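Each `moduleNameMapper` key is a regex tried against the import specifier, and `$1` in the value substitutes the first capture group. The sketch below re-implements that lookup purely for illustration; Jest's real resolver does considerably more:

```typescript
// Illustrative re-implementation of Jest's moduleNameMapper matching.
const moduleNameMapper: Record<string, string> = {
  '^types$': '<rootDir>/src/types',
  '^utils$': '<rootDir>/src/utils',
  '^server/(.*)$': '<rootDir>/src/server/$1',
  '^clients/(.*)$': '<rootDir>/src/clients/$1',
};

function mapModule(specifier: string): string {
  for (const [pattern, target] of Object.entries(moduleNameMapper)) {
    const re = new RegExp(pattern);
    if (re.test(specifier)) {
      // `replace` substitutes $1 with the captured path segment.
      return specifier.replace(re, target);
    }
  }
  // Specifiers that match no pattern resolve normally.
  return specifier;
}

console.log(mapModule('clients/scraper-api-client'));
console.log(mapModule('axios'));
```

This is what lets the renamed test below import from `'../scraper-api-client'` while other files keep using bare `clients/...` specifiers.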

src/__tests__/scraper-api-client.test.ts renamed to src/clients/__tests__/scraper-api-client.test.ts

Lines changed: 1 addition & 1 deletion

@@ -1,5 +1,5 @@
 import axios, { AxiosError, AxiosHeaders } from 'axios';
-import { ScraperApiClient } from '../clients/scraper-api-client';
+import { ScraperApiClient } from '../scraper-api-client';

 const { AxiosError: RealAxiosError } = jest.requireActual<typeof import('axios')>('axios');
src/constants.ts

Lines changed: 29 additions & 0 deletions

@@ -9,10 +9,39 @@ export enum TOOLSET {
 // todo: utils
 export enum SCRAPER_API_TARGETS {
   GOOGLE_SEARCH = 'google_search',
+  GOOGLE_TRAVEL_HOTELS = 'google_travel_hotels',
+  GOOGLE_ADS = 'google_ads',
+  GOOGLE_LENS = 'google_lens',
+  GOOGLE_AI_MODE = 'google_ai_mode',
+
   AMAZON_SEARCH = 'amazon_search',
+  AMAZON_PRODUCT = 'amazon_product',
+  AMAZON_PRICING = 'amazon_pricing',
+  AMAZON_SELLERS = 'amazon_sellers',
+  AMAZON_BESTSELLERS = 'amazon_bestsellers',
+
+  WALMART_SEARCH = 'walmart_search',
+  WALMART_PRODUCT = 'walmart_product',
+
+  TARGET_SEARCH = 'target_search',
+  TARGET_PRODUCT = 'target_product',
+
+  TIKTOK_POST = 'tiktok_post',
+  TIKTOK_SHOP_SEARCH = 'tiktok_shop_search',
+  TIKTOK_SHOP_PRODUCT = 'tiktok_shop_product',
+  TIKTOK_SHOP_URL = 'tiktok',
+
+  YOUTUBE_VIDEO = 'youtube_video',
+  YOUTUBE_METADATA = 'youtube_metadata',
+  YOUTUBE_CHANNEL = 'youtube_channel',
+  YOUTUBE_SUBTITLES = 'youtube_subtitles',
+  YOUTUBE_SEARCH = 'youtube_search',

   REDDIT_POST = 'reddit_post',
   REDDIT_SUBREDDIT = 'reddit_subreddit',
+  REDDIT_USER = 'reddit_user',
+
+  BING_SEARCH = 'bing_search',

   CHATGPT = 'chatgpt',
   PERPLEXITY = 'perplexity',
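The enum values above double as the registered tool names, matching the AGENTS.md rule "name the tool the same as the target name". A small illustrative sketch with an enum subset copied from the diff; the `TOOLSET_MEMBERS` grouping map is hypothetical, mirroring the README's toolset table rather than any code in this commit:

```typescript
enum SCRAPER_API_TARGETS {
  REDDIT_POST = 'reddit_post',
  REDDIT_SUBREDDIT = 'reddit_subreddit',
  REDDIT_USER = 'reddit_user',
  BING_SEARCH = 'bing_search',
}

// Hypothetical grouping, following the README's toolset table.
const TOOLSET_MEMBERS: Record<string, SCRAPER_API_TARGETS[]> = {
  social_media: [
    SCRAPER_API_TARGETS.REDDIT_POST,
    SCRAPER_API_TARGETS.REDDIT_SUBREDDIT,
    SCRAPER_API_TARGETS.REDDIT_USER,
  ],
  search: [SCRAPER_API_TARGETS.BING_SEARCH],
};

// The registered tool name is simply the target value.
const toolNames = TOOLSET_MEMBERS.social_media.map((target) => String(target));
console.log(toolNames);
```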

src/index.ts

Lines changed: 3 additions & 2 deletions

@@ -38,11 +38,12 @@ const main = async () => {
   // if there are no envs, some MCP clients will fail silently
   const { sapiUsername, sapiPassword } = parseEnvsOrExit();

+  const auth = Buffer.from(`${sapiUsername}:${sapiPassword}`).toString('base64');
+
   const toolsets = resolveToolsets(process.env.TOOLSETS);

   const sapiMcpServer = new ScraperAPIStdioServer({
-    sapiUsername,
-    sapiPassword,
+    auth,
     toolsets,
   });
   await sapiMcpServer.connect(transport);
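The `auth` value constructed above is a standard HTTP Basic credential: the base64 encoding of `username:password`. A quick round-trip check, using placeholder credentials rather than real ones:

```typescript
// Placeholder credentials for illustration only.
const sapiUsername = 'user';
const sapiPassword = 'pass';

// Same construction as in src/index.ts above.
const auth = Buffer.from(`${sapiUsername}:${sapiPassword}`).toString('base64');
const header = `Basic ${auth}`;

// Decoding recovers the original "username:password" pair.
const decoded = Buffer.from(auth, 'base64').toString('utf8');
console.log(header, decoded);
```

Passing the single pre-encoded `auth` string to the server (instead of the raw username and password) matches the HTTP server path, which receives an already-encoded token from the `Authorization` header.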

src/server.ts

Lines changed: 1 addition & 3 deletions

@@ -39,7 +39,7 @@ app.post('/mcp', async (req, res) => {

   const toolsets = resolveToolsets(req.query.toolsets as string);

-  const server = new ScraperAPIHttpServer({ toolsets });
+  const server = new ScraperAPIHttpServer({ toolsets, auth: token });

   const transport = new StreamableHTTPServerTransport({
     sessionIdGenerator: undefined,
@@ -50,8 +50,6 @@
     transport.close();
   });

-  server.setAuthToken(token);
-
   await server.connect(transport);

   await transport.handleRequest(req, res, req.body);
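`resolveToolsets` itself is not shown in this diff. A hypothetical sketch of what it might do with the `toolsets` query parameter, based on the README's behavior (comma-separated names, all toolsets when none are given); the function body and `ALL_TOOLSETS` constant are assumptions, not the repository's actual code:

```typescript
// Toolset names from the README table.
const ALL_TOOLSETS = ['web', 'search', 'ecommerce', 'social_media', 'ai'];

function resolveToolsets(raw?: string): string[] {
  if (!raw) {
    // README: when no toolsets are specified, all tools are registered.
    return ALL_TOOLSETS;
  }
  return raw
    .split(',')
    .map((name) => name.trim())
    .filter((name) => ALL_TOOLSETS.includes(name));
}

console.log(resolveToolsets('web, search'));
console.log(resolveToolsets(undefined));
```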
