Skip to content
Open
Show file tree
Hide file tree
Changes from all commits
Commits
File filter

Filter by extension

Filter by extension


Conversations
Failed to load comments.
Loading
Jump to
Jump to file
Failed to load files.
Loading
Diff view
Diff view
5 changes: 5 additions & 0 deletions lib/crewai-tools/pyproject.toml
Original file line number Diff line number Diff line change
Expand Up @@ -26,6 +26,11 @@ Documentation = "https://docs.crewai.com"


[project.optional-dependencies]
skim = [
"x402[evm]>=2.0.0",
"eth-account>=0.13.0",
"requests>=2.31.0",
]
scrapfly-sdk = [
"scrapfly-sdk>=0.8.19",
]
Expand Down
2 changes: 2 additions & 0 deletions lib/crewai-tools/src/crewai_tools/__init__.py
Original file line number Diff line number Diff line change
Expand Up @@ -188,6 +188,7 @@
from crewai_tools.tools.singlestore_search_tool.singlestore_search_tool import (
SingleStoreSearchTool,
)
from crewai_tools.tools.skim_reader_tool.skim_reader_tool import SkimReaderTool
from crewai_tools.tools.snowflake_search_tool.snowflake_search_tool import (
SnowflakeConfig,
SnowflakeSearchTool,
Expand Down Expand Up @@ -311,6 +312,7 @@
"SerplyWebSearchTool",
"SerplyWebpageToMarkdownTool",
"SingleStoreSearchTool",
"SkimReaderTool",
"SnowflakeConfig",
"SnowflakeSearchTool",
"SpiderTool",
Expand Down
2 changes: 2 additions & 0 deletions lib/crewai-tools/src/crewai_tools/tools/__init__.py
Original file line number Diff line number Diff line change
Expand Up @@ -174,6 +174,7 @@
SerplyWebpageToMarkdownTool,
)
from crewai_tools.tools.singlestore_search_tool import SingleStoreSearchTool
from crewai_tools.tools.skim_reader_tool.skim_reader_tool import SkimReaderTool
from crewai_tools.tools.snowflake_search_tool import (
SnowflakeConfig,
SnowflakeSearchTool,
Expand Down Expand Up @@ -293,6 +294,7 @@
"SerplyWebSearchTool",
"SerplyWebpageToMarkdownTool",
"SingleStoreSearchTool",
"SkimReaderTool",
"SnowflakeConfig",
"SnowflakeSearchTool",
"SnowflakeSearchToolInput",
Expand Down
67 changes: 67 additions & 0 deletions lib/crewai-tools/src/crewai_tools/tools/skim_reader_tool/README.md
Original file line number Diff line number Diff line change
@@ -0,0 +1,67 @@
# SkimReaderTool

## Description

[Skim](https://skim402.com) is the x402-native clean reader API for AI agents.
Give it any URL and it returns clean, agent-ready Markdown — nav, ads, and
boilerplate stripped — plus structured metadata (title, byline, published date,
language, excerpt).

`SkimReaderTool` is pay-per-call over the [x402](https://x402.org) protocol:
each read costs **$0.002 in USDC on Base**, paid automatically by a wallet you
control. There is no signup and there are no API keys — your wallet is your
identity. The private key never leaves your machine; it only signs an EIP-3009
USDC authorization locally.

## Installation

Install the x402 client (with EVM support) alongside `crewai[tools]`:

```
pip install "x402[evm]" 'crewai[tools]'
```
Comment on lines +20 to +22

Copy link
Copy Markdown

Choose a reason for hiding this comment

The reason will be displayed to describe this comment to others. Learn more.

⚠️ Potential issue | 🟡 Minor | ⚡ Quick win

Add explicit fence languages to satisfy Markdown linting

Line 20 and Line 27 use unlabeled fenced code blocks, which triggers MD040. Please label both as bash.

Suggested patch
-```
+```bash
 pip install "x402[evm]" 'crewai[tools]'

- +bash
export SKIM_WALLET_PRIVATE_KEY=0xYOUR_BASE_WALLET_PRIVATE_KEY

Also applies to: 27-29

🧰 Tools
🪛 markdownlint-cli2 (0.22.1)

[warning] 20-20: Fenced code blocks should have a language specified

(MD040, fenced-code-language)

🤖 Prompt for AI Agents
Verify each finding against current code. Fix only still-valid issues, skip the
rest with a brief reason, keep changes minimal, and validate.

In `@lib/crewai-tools/src/crewai_tools/tools/skim_reader_tool/README.md` around
lines 20 - 22, The fenced code blocks in the README.md file are missing explicit
language labels, which violates the MD040 markdown linting rule. Add the
language identifier `bash` to both unlabeled code blocks: change the opening
fence on line 20 (before the pip install command) from three backticks to three
backticks followed by `bash`, and similarly update the opening fence on line 27
(before the export SKIM_WALLET_PRIVATE_KEY command) to include the `bash`
language label.

Source: Linters/SAST tools


Fund a dedicated Base wallet with a small amount of USDC (about $1 covers ~500
reads) and expose its private key to the tool:

```
export SKIM_WALLET_PRIVATE_KEY=0xYOUR_BASE_WALLET_PRIVATE_KEY
```

Use a fresh wallet, never your personal one. Step-by-step wallet setup:
<https://skim402.com/wallet>.

## Example

```python
from crewai_tools import SkimReaderTool

tool = SkimReaderTool() # reads SKIM_WALLET_PRIVATE_KEY from the environment
tool.run(url="https://en.wikipedia.org/wiki/HTTP_402")
```

Drop it into any agent's tool list:

```python
from crewai import Agent
from crewai_tools import SkimReaderTool

researcher = Agent(
role="Research Analyst",
goal="Read and summarize web articles accurately",
backstory="You turn messy web pages into clean, citable notes.",
tools=[SkimReaderTool()],
)
```

## Arguments

- `private_key`: Optional. Hex private key (with or without `0x`) for the Base
wallet that pays for reads. Defaults to the `SKIM_WALLET_PRIVATE_KEY`
environment variable. Use a dedicated wallet, never your personal one.
- `base_url`: Optional. Skim API base URL. Defaults to `https://skim402.com`.
- `max_price_usd`: Optional. Hard per-call price cap in USD. The wallet refuses
to sign for anything above this. Defaults to `0.01` (Skim is `$0.002`/call).
- `include_metadata`: Optional. When `True` (default), prepend a YAML
frontmatter block of the page metadata to the returned Markdown.
- `timeout`: Optional. Per-request timeout in seconds. Defaults to `60`.
Empty file.
Original file line number Diff line number Diff line change
@@ -0,0 +1,210 @@
"""CrewAI tool for Skim — the x402-native clean reader API for AI agents.

Exposes :class:`SkimReaderTool`, a CrewAI ``BaseTool`` that fetches any URL and
returns clean, agent-ready Markdown plus structured metadata. Each call is paid
automatically over the x402 protocol ($0.002 in USDC on Base) using a wallet you
control. The private key never leaves your machine — it only signs an EIP-3009
USDC authorization locally.
"""

from __future__ import annotations

import os
from typing import Any, Optional

from crewai.tools import BaseTool, EnvVar
from pydantic import BaseModel, Field, PrivateAttr, SecretStr

DEFAULT_BASE_URL = "https://skim402.com"


def _yaml_scalar(value: Any) -> str:
"""Render a metadata value as a safe single-line YAML scalar.

Collapses internal whitespace/newlines and double-quotes the value when it
contains characters that could otherwise produce invalid or ambiguous YAML.
"""
text = " ".join(str(value).split())
needs_quoting = (
text == ""
or text[0] in "!&*?|>%@`\"'#,[]{}:-"
or ": " in text
or text.endswith(":")
or text[0] in " "
)
if needs_quoting:
escaped = text.replace("\\", "\\\\").replace('"', '\\"')
return f'"{escaped}"'
return text


_TOOL_DESCRIPTION = (
"Fetch any URL and return clean, agent-ready Markdown via Skim (skim402.com). "
"Strips nav, ads, and boilerplate; preserves the article body plus structured "
"metadata (title, byline, published date, language, excerpt). Pays $0.002 per "
"call in USDC on Base over the x402 protocol — no API keys, no signup. Use this "
"whenever you need to read web content: articles, docs, blog posts, GitHub "
"READMEs, research papers, and similar pages."
)


class SkimReaderToolSchema(BaseModel):
"""Input schema for :class:`SkimReaderTool`."""

url: str = Field(
description="The fully-qualified URL to fetch and clean (https://...).",
)


class SkimReaderTool(BaseTool):
"""Read any URL as clean Markdown via Skim, paying per call over x402.

The tool lazily builds a payment-aware HTTP session the first time it runs,
using your Base wallet's private key to sign USDC authorizations on demand.

Args:
private_key (str): Optional. Hex private key (with or without ``0x``) for
the Base wallet that pays for reads. Falls back to the
``SKIM_WALLET_PRIVATE_KEY`` environment variable. Use a dedicated
wallet, never your personal one.
base_url (str): Optional. Skim API base URL. Defaults to
``https://skim402.com``.
max_price_usd (float): Optional. Hard per-call price cap in USD. The
wallet refuses to sign for anything above this. Defaults to ``0.01``
(Skim is ``$0.002``).
include_metadata (bool): Optional. When ``True`` (default), prepend a YAML
frontmatter block of the page metadata to the returned Markdown.
timeout (float): Optional. Per-request timeout in seconds. Defaults to
``60``.

Example:
from crewai_tools import SkimReaderTool

tool = SkimReaderTool() # reads SKIM_WALLET_PRIVATE_KEY from the env
tool.run(url="https://en.wikipedia.org/wiki/HTTP_402")
"""

name: str = "Skim web reader"
description: str = _TOOL_DESCRIPTION
args_schema: type[BaseModel] = SkimReaderToolSchema

base_url: str = DEFAULT_BASE_URL
max_price_usd: float = 0.01
include_metadata: bool = True
timeout: float = 60.0
private_key: Optional[SecretStr] = Field(default=None, exclude=True, repr=False)

_session: Any = PrivateAttr(default=None)
package_dependencies: list[str] = Field(
default_factory=lambda: ["x402[evm]", "eth-account", "requests"]
)
env_vars: list[EnvVar] = Field(
default_factory=lambda: [
EnvVar(
name="SKIM_WALLET_PRIVATE_KEY",
description=(
"Hex private key for the Base wallet that pays for Skim reads "
"over x402. Needed unless private_key is passed to the "
"constructor. The key never leaves your machine."
),
required=False,
),
]
)

def _get_session(self) -> Any:
"""Build (and cache) a requests Session that auto-pays 402 responses."""
if self._session is not None:
return self._session

try:
import requests
from eth_account import Account
from x402 import x402ClientSync
from x402.client import max_amount
from x402.http.clients.requests import wrapRequestsWithPayment
from x402.mechanisms.evm.exact.register import register_exact_evm_client
from x402.mechanisms.evm.signers import EthAccountSigner
except ImportError as exc: # pragma: no cover - import-guard
raise ImportError(
"SkimReaderTool needs the x402 client with EVM support. Install it "
'with: pip install "x402[evm]" requests eth-account'
) from exc

key = (
self.private_key.get_secret_value()
if self.private_key is not None
else os.environ.get("SKIM_WALLET_PRIVATE_KEY")
)
if not key:
raise ValueError(
"Skim requires payment via x402. Provide a Base wallet funded with "
"USDC by setting the SKIM_WALLET_PRIVATE_KEY environment variable, or "
"by passing private_key=... to SkimReaderTool(). The key never leaves "
"your machine — it only signs payment authorizations locally."
)

normalized = key[2:] if key.startswith("0x") else key
if len(normalized) != 64 or any(
c not in "0123456789abcdefABCDEF" for c in normalized
):
raise ValueError(
"SKIM_WALLET_PRIVATE_KEY must be a 64-character hex string (with or "
"without a 0x prefix)."
)

account = Account.from_key("0x" + normalized)
cap_atomic = int(round(self.max_price_usd * 1_000_000)) # USDC has 6 decimals
client = x402ClientSync()
register_exact_evm_client(
client,
EthAccountSigner(account),
policies=[max_amount(cap_atomic)],
)
self._session = wrapRequestsWithPayment(requests.Session(), client)
return self._session

def _run(self, url: str) -> str:
session = self._get_session()
endpoint = self.base_url.rstrip("/") + "/api/v1/read"

try:
res = session.post(
endpoint,
json={"url": url, "mode": "basic"},
timeout=self.timeout,
)
except Exception as exc: # network / payment-signing failure
raise RuntimeError(
f"Skim request failed: {exc}. Common causes: the wallet has no USDC "
f"on Base, or the price exceeded max_price_usd (${self.max_price_usd})."
) from exc

if not getattr(res, "ok", res.status_code < 400):
body = (res.text or "").strip()
raise RuntimeError(
f"Skim returned {res.status_code} {getattr(res, 'reason', '')}: "
f"{body or '(no body)'}"
)

try:
data = res.json()
except ValueError as exc:
raise RuntimeError(
"Skim returned a non-JSON response. This usually means the request "
f"did not reach the Skim API. Underlying error: {exc}"
) from exc

markdown = data.get("markdown") or data.get("text") or ""

metadata = data.get("metadata")
if self.include_metadata and isinstance(metadata, dict):
meta_lines = [
f"{k}: {_yaml_scalar(v)}"
for k, v in metadata.items()
if v is not None and v != ""
]
if meta_lines:
markdown = "---\n" + "\n".join(meta_lines) + "\n---\n\n" + markdown

return markdown
Loading