Files
gpt4free/g4f/mcp/tools.py
T

823 lines
28 KiB
Python

"""MCP Tools for gpt4free
This module provides MCP tool implementations that wrap gpt4free capabilities:
- WebSearchTool: Web search using ddg search
- WebScrapeTool: Web page scraping and content extraction
- ImageGenerationTool: Image generation using various AI providers
- PythonExecuteTool: Safe Python code execution with whitelisted modules
- FileReadTool: Read files from the ~/.g4f/workspace directory
- FileWriteTool: Write files to the ~/.g4f/workspace directory
- FileListTool: List files in the ~/.g4f/workspace directory
- FileDeleteTool: Delete files from the ~/.g4f/workspace directory
"""
from __future__ import annotations
import os
from pathlib import Path
from typing import Any, Dict, List
from abc import ABC, abstractmethod
import urllib.parse
from aiohttp import ClientSession
class MCPTool(ABC):
"""Base class for MCP tools"""
def __init__(self, safe_mode: bool = False) -> None:
"""Initialize tool with optional safe mode.
Args:
safe_mode: When ``True`` the tool operates in a restricted mode
where callers cannot expand the module allowlist and certain
sensitive listing operations are blocked.
"""
self.safe_mode = safe_mode
@property
@abstractmethod
def description(self) -> str:
"""Tool description"""
pass
@property
@abstractmethod
def input_schema(self) -> Dict[str, Any]:
"""JSON schema for tool input parameters"""
pass
@abstractmethod
async def execute(self, arguments: Dict[str, Any]) -> Dict[str, Any]:
"""Execute the tool with given arguments
Args:
arguments: Tool input arguments matching the input_schema
Returns:
Dict containing either results or an error key with error message
"""
pass
class WebSearchTool(MCPTool):
"""Web search tool using gpt4free's search capabilities"""
@property
def description(self) -> str:
return "Search the web for information using DuckDuckGo. Returns search results with titles, URLs, and snippets."
@property
def input_schema(self) -> Dict[str, Any]:
return {
"type": "object",
"properties": {
"query": {
"type": "string",
"description": "The search query to execute"
},
"max_results": {
"type": "integer",
"description": "Maximum number of results to return (default: 5)",
"default": 5
},
"region": {
"type": "string",
"description": "Search region (default: en-us)"
}
},
"required": ["query"]
}
async def execute(self, arguments: Dict[str, Any]) -> Dict[str, Any]:
"""Execute web search
Returns:
Dict[str, Any]: Search results or error message
"""
from ..Provider.search.CachedSearch import CachedSearch
query = arguments.get("query", "")
max_results = arguments.get("max_results", 5)
region = arguments.get("region", "en-us")
if not query:
return {
"error": "Query parameter is required"
}
try:
# Perform search - query parameter is used for search execution
# and prompt parameter holds the content to be searched
search_results = await anext(CachedSearch.create_async_generator(
"",
[],
prompt=query,
max_results=max_results,
region=region
))
return {
"query": query,
**search_results.get_dict()
}
except Exception as e:
return {
"error": f"Search failed: {str(e)}"
}
class WebScrapeTool(MCPTool):
"""Web scraping tool using gpt4free's scraping capabilities"""
@property
def description(self) -> str:
return "Scrape and extract text content from a web page URL. Returns cleaned text content with optional word limit."
@property
def input_schema(self) -> Dict[str, Any]:
return {
"type": "object",
"properties": {
"url": {
"type": "string",
"description": "The URL of the web page to scrape"
},
"max_words": {
"type": "integer",
"description": "Maximum number of words to extract (default: 1000)",
"default": 1000
}
},
"required": ["url"]
}
async def execute(self, arguments: Dict[str, Any]) -> Dict[str, Any]:
"""Execute web scraping
Returns:
Dict[str, Any]: Scraped content or error message
"""
from ..tools.fetch_and_scrape import fetch_and_scrape
from aiohttp import ClientSession
url = arguments.get("url", "")
max_words = arguments.get("max_words", 1000)
if not url:
return {
"error": "URL parameter is required"
}
try:
# Scrape the URL
async with ClientSession() as session:
content = await fetch_and_scrape(
session=session,
url=url,
max_words=max_words,
add_metadata=True
)
if not content:
return {
"error": "Failed to scrape content from URL"
}
return {
"url": url,
"content": content,
"word_count": len(content.split())
}
except Exception as e:
return {
"error": f"Scraping failed: {str(e)}"
}
class ImageGenerationTool(MCPTool):
"""Image generation tool using gpt4free's image generation capabilities"""
@property
def description(self) -> str:
return "Generate images from text prompts using AI image generation providers. Returns a URL to the generated image."
@property
def input_schema(self) -> Dict[str, Any]:
return {
"type": "object",
"properties": {
"prompt": {
"type": "string",
"description": "The text prompt describing the image to generate"
},
"model": {
"type": "string",
"description": "The image generation model to use (default: flux)",
"default": "flux"
},
"width": {
"type": "integer",
"description": "Image width in pixels (default: 1024)",
"default": 1024
},
"height": {
"type": "integer",
"description": "Image height in pixels (default: 1024)",
"default": 1024
}
},
"required": ["prompt"]
}
async def execute(self, arguments: Dict[str, Any]) -> Dict[str, Any]:
"""Execute image generation
Returns:
Dict[str, Any]: Generated image data or error message
"""
from ..client import AsyncClient
prompt = arguments.get("prompt", "")
model = arguments.get("model", "flux")
width = arguments.get("width", 1024)
height = arguments.get("height", 1024)
if not prompt:
return {
"error": "Prompt parameter is required"
}
try:
# Generate image using gpt4free client
client = AsyncClient()
response = await client.images.generate(
model=model,
prompt=prompt,
width=width,
height=height
)
# Get the image data with proper validation
if not response:
return {
"error": "Image generation failed: No response from provider"
}
if not hasattr(response, 'data') or not response.data:
return {
"error": "Image generation failed: No image data in response"
}
if len(response.data) == 0:
return {
"error": "Image generation failed: Empty image data array"
}
image_data = response.data[0]
# Check if image_data has url attribute
if not hasattr(image_data, 'url'):
return {
"error": "Image generation failed: No URL in image data"
}
image_url = image_data.url
template = 'Display the image using this template: <a href="{image}" data-width="{width}" data-height="{height}"><img src="{image}" alt="{prompt}"></a>'
# Return result based on URL type
if image_url.startswith('data:'):
return {
"prompt": prompt,
"model": model,
"width": width,
"height": height,
"image": image_url,
"template": template
}
else:
if arguments.get("origin") and image_url.startswith("/media/"):
image_url = f"{arguments.get('origin')}{image_url}"
return {
"prompt": prompt,
"model": model,
"width": width,
"height": height,
"image_url": image_url,
"template": template
}
except Exception as e:
return {
"error": f"Image generation failed: {str(e)}"
}
class MarkItDownTool(MCPTool):
"""MarkItDown tool for converting URLs to markdown format"""
@property
def description(self) -> str:
return "Convert a URL to markdown format using MarkItDown. Supports HTTP/HTTPS URLs and returns formatted markdown content."
@property
def input_schema(self) -> Dict[str, Any]:
return {
"type": "object",
"properties": {
"url": {
"type": "string",
"description": "The URL to convert to markdown format (must be HTTP/HTTPS)"
},
"max_content_length": {
"type": "integer",
"description": "Maximum content length for processing (default: 10000)",
"default": 10000
}
},
"required": ["url"]
}
async def execute(self, arguments: Dict[str, Any]) -> Dict[str, Any]:
"""Execute MarkItDown conversion
Returns:
Dict[str, Any]: Markdown content or error message
"""
try:
from ..integration.markitdown import MarkItDown
except ImportError as e:
return {
"error": f"MarkItDown is not installed: {str(e)}"
}
url = arguments.get("url", "")
max_content_length = arguments.get("max_content_length", 10000)
if not url:
return {
"error": "URL parameter is required"
}
# Validate URL format
if not url.startswith(("http://", "https://")):
return {
"error": "URL must start with http:// or https://"
}
try:
# Initialize MarkItDown
md = MarkItDown()
# Convert URL to markdown
result = md.convert_url(url)
if not result:
return {
"error": "Failed to convert URL to markdown"
}
# Truncate if content exceeds max length
if len(result) > max_content_length:
result = result[:max_content_length] + "\n\n[Content truncated...]"
return {
"url": url,
"markdown_content": result,
"content_length": len(result),
"truncated": len(result) > max_content_length
}
except Exception as e:
return {
"error": f"MarkItDown conversion failed: {str(e)}"
}
class TextToAudioTool(MCPTool):
"""TextToAudio tool for generating audio from text prompts using Pollinations AI"""
@property
def description(self) -> str:
return "Generate an audio URL from a text prompt using Pollinations AI text-to-speech service. Returns a direct URL to the generated audio file."
@property
def input_schema(self) -> Dict[str, Any]:
return {
"type": "object",
"properties": {
"prompt": {
"type": "string",
"description": "The text prompt to the audio model (example: 'Read this: Hello, world!')"
},
"voice": {
"type": "string",
"description": "Voice option for text-to-speech (default: 'alloy')",
"default": "alloy"
},
"url_encode": {
"type": "boolean",
"description": "Whether to URL-encode the prompt text (default: True)",
"default": True
}
},
"required": ["prompt"]
}
async def execute(self, arguments: Dict[str, Any]) -> Dict[str, Any]:
"""Execute text-to-speech conversion
Returns:
Dict[str, Any]: Audio URL or error message
"""
prompt = arguments.get("prompt", "")
voice = arguments.get("voice", "alloy")
url_encode = arguments.get("url_encode", True)
if not prompt:
return {
"error": "Prompt parameter is required"
}
# Validate prompt length (reasonable limit for text-to-speech)
if len(prompt) > 10000:
return {
"error": "Prompt is too long (max 10000 characters)"
}
try:
# Prepare the prompt for URL
if url_encode:
encoded_prompt = urllib.parse.quote(prompt)
else:
encoded_prompt = prompt.replace(" ", "%20") # Basic space encoding
# Construct the Pollinations AI text-to-speech URL
audio_url = f"/backend-api/v2/synthesize/Gemini?text={encoded_prompt}"
if arguments.get("origin"):
audio_url = f"{arguments.get('origin')}{audio_url}"
async with ClientSession() as session:
async with session.get(audio_url, max_redirects=0) as resp:
audio_url = str(resp.url)
template = 'Play the audio using this template: <audio controls src="{audio_url}">'
return {
"prompt": prompt,
"voice": voice,
"audio_url": audio_url,
"template": template
}
except Exception as e:
return {
"error": f"Text-to-speech URL generation failed: {str(e)}"
}
class PythonExecuteTool(MCPTool):
"""Safe Python code execution tool with whitelisted module imports.
Executes the supplied code snippet inside a restricted sandbox where only
a curated list of modules may be imported and file-system access is limited
to the ``~/.g4f/workspace`` directory. The value assigned to the ``result``
variable (if any) is returned along with captured stdout/stderr.
"""
@property
def description(self) -> str:
return (
"Execute a Python code snippet safely. Only whitelisted modules may "
"be imported (math, json, re, datetime, asyncio, aiohttp, g4f, …). "
"File access is restricted to the ~/.g4f/workspace directory. "
"Assign the value you want back to a variable named 'result'. "
"Returns stdout, stderr, and the value of 'result'."
)
@property
def input_schema(self) -> Dict[str, Any]:
return {
"type": "object",
"properties": {
"code": {
"type": "string",
"description": "Python code to execute in the safe sandbox",
},
"allowed_extra_modules": {
"type": "array",
"items": {"type": "string"},
"description": (
"Optional list of additional module names to allow "
"beyond the default whitelist (ignored in safe mode)"
),
},
"timeout": {
"type": "number",
"description": (
"Wall-clock seconds to allow before aborting execution "
f"(max {30.0}s; ignored in safe mode)"
),
},
"max_depth": {
"type": "integer",
"description": (
"Maximum Python call-stack depth inside the sandbox "
f"(max {500}; ignored in safe mode)"
),
},
},
"required": ["code"],
}
async def execute(self, arguments: Dict[str, Any]) -> Dict[str, Any]:
from .pa_provider import execute_safe_code, SAFE_MODULES, MAX_EXEC_TIMEOUT, MAX_RECURSION_DEPTH
code = arguments.get("code", "")
if not code:
return {"error": "code parameter is required"}
if self.safe_mode:
# In safe mode the caller cannot override any security parameters
allowed = SAFE_MODULES
timeout = MAX_EXEC_TIMEOUT
max_depth = MAX_RECURSION_DEPTH
else:
extra_names = arguments.get("allowed_extra_modules") or []
allowed = SAFE_MODULES | frozenset(extra_names)
# Allow callers to reduce (but not exceed) the defaults
requested_timeout = arguments.get("timeout")
if requested_timeout is not None:
try:
timeout = min(float(requested_timeout), MAX_EXEC_TIMEOUT)
except (TypeError, ValueError):
return {"error": "timeout must be a number"}
else:
timeout = MAX_EXEC_TIMEOUT
requested_depth = arguments.get("max_depth")
if requested_depth is not None:
try:
max_depth = min(int(requested_depth), MAX_RECURSION_DEPTH)
except (TypeError, ValueError):
return {"error": "max_depth must be an integer"}
else:
max_depth = MAX_RECURSION_DEPTH
try:
exec_result = execute_safe_code(
code,
allowed_modules=allowed,
timeout=timeout,
max_depth=max_depth,
)
return exec_result.to_dict()
except Exception as exc:
return {"error": f"Execution error: {exc}"}
class FileReadTool(MCPTool):
"""Read a file from the ``~/.g4f/workspace`` directory."""
@property
def description(self) -> str:
return (
"Read the text content of a file inside the ~/.g4f/workspace directory. "
"Provide a relative path from the workspace root."
)
@property
def input_schema(self) -> Dict[str, Any]:
return {
"type": "object",
"properties": {
"path": {
"type": "string",
"description": "Relative path to the file inside the workspace",
}
},
"required": ["path"],
}
async def execute(self, arguments: Dict[str, Any]) -> Dict[str, Any]:
from .pa_provider import get_workspace_dir
rel_path = arguments.get("path", "")
if not rel_path:
return {"error": "path parameter is required"}
workspace = get_workspace_dir()
try:
target = (workspace / rel_path).resolve()
if not str(target).startswith(str(workspace.resolve())):
return {"error": "Access outside the workspace is not allowed"}
if not target.exists():
return {"error": f"File not found: {rel_path}"}
if not target.is_file():
return {"error": f"Path is not a file: {rel_path}"}
content = target.read_text(encoding="utf-8")
return {
"path": rel_path,
"content": content,
"size": len(content),
}
except Exception as exc:
return {"error": f"Read failed: {exc}"}
class FileWriteTool(MCPTool):
"""Write (or create) a file inside the ``~/.g4f/workspace`` directory."""
@property
def description(self) -> str:
return (
"Write text content to a file inside the ~/.g4f/workspace directory. "
"Creates parent directories as needed. "
"Provide a relative path from the workspace root and the content to write."
)
@property
def input_schema(self) -> Dict[str, Any]:
return {
"type": "object",
"properties": {
"path": {
"type": "string",
"description": "Relative path to the file inside the workspace",
},
"content": {
"type": "string",
"description": "Text content to write to the file",
},
"append": {
"type": "boolean",
"description": "If true, append to existing file instead of overwriting (default: false)",
"default": False,
},
},
"required": ["path", "content"],
}
async def execute(self, arguments: Dict[str, Any]) -> Dict[str, Any]:
from .pa_provider import get_workspace_dir
rel_path = arguments.get("path", "")
content = arguments.get("content")
append = bool(arguments.get("append", False))
if not rel_path:
return {"error": "path parameter is required"}
if content is None:
return {"error": "content parameter is required"}
workspace = get_workspace_dir()
try:
target = (workspace / rel_path).resolve()
if not str(target).startswith(str(workspace.resolve())):
return {"error": "Access outside the workspace is not allowed"}
target.parent.mkdir(parents=True, exist_ok=True)
if append:
with open(target, "a", encoding="utf-8") as f:
f.write(content)
else:
target.write_text(content, encoding="utf-8")
result: Dict[str, Any] = {
"path": rel_path,
"size": len(content),
"appended": append,
}
origin = arguments.get("origin")
if origin:
result["url"] = f"{origin}/pa/files/{rel_path}"
return result
except Exception as exc:
return {"error": f"Write failed: {exc}"}
class FileListTool(MCPTool):
"""List files and directories inside the ``~/.g4f/workspace`` directory."""
@property
def description(self) -> str:
return (
"List files and directories inside the ~/.g4f/workspace directory. "
"Optionally provide a subdirectory path relative to the workspace root. "
"Returns names, types, and sizes."
)
@property
def input_schema(self) -> Dict[str, Any]:
return {
"type": "object",
"properties": {
"path": {
"type": "string",
"description": (
"Relative path to a subdirectory inside the workspace "
"(default: workspace root)"
),
"default": "",
},
"recursive": {
"type": "boolean",
"description": "If true, list files recursively (default: false)",
"default": False,
},
},
"required": [],
}
async def execute(self, arguments: Dict[str, Any]) -> Dict[str, Any]:
from .pa_provider import get_workspace_dir
rel_path = arguments.get("path", "") or ""
recursive = bool(arguments.get("recursive", False))
workspace = get_workspace_dir()
try:
target = (workspace / rel_path).resolve() if rel_path else workspace.resolve()
if not str(target).startswith(str(workspace.resolve())):
return {"error": "Access outside the workspace is not allowed"}
if self.safe_mode and target == workspace.resolve():
return {"error": "Listing the workspace root directory is not allowed in safe mode"}
if not target.exists():
return {"error": f"Directory not found: {rel_path or '/'}"}
if not target.is_dir():
return {"error": f"Path is not a directory: {rel_path}"}
entries = []
skipped = 0
iterator = target.rglob("*") if recursive else target.iterdir()
for entry in sorted(iterator):
try:
rel = str(entry.relative_to(workspace))
info: Dict[str, Any] = {
"path": rel,
"type": "file" if entry.is_file() else "directory",
}
if entry.is_file():
info["size"] = entry.stat().st_size
entries.append(info)
except Exception:
skipped += 1
continue
result: Dict[str, Any] = {
"workspace": "" if self.safe_mode else str(workspace),
"path": rel_path or "/",
"entries": entries,
"count": len(entries),
}
if skipped:
result["skipped"] = skipped
return result
except Exception as exc:
return {"error": f"List failed: {exc}"}
class FileDeleteTool(MCPTool):
"""Delete a file from the ``~/.g4f/workspace`` directory."""
@property
def description(self) -> str:
return (
"Delete a file from the ~/.g4f/workspace directory. "
"Provide a relative path from the workspace root. "
"Only files can be deleted; directories are not removed."
)
@property
def input_schema(self) -> Dict[str, Any]:
return {
"type": "object",
"properties": {
"path": {
"type": "string",
"description": "Relative path to the file inside the workspace",
}
},
"required": ["path"],
}
async def execute(self, arguments: Dict[str, Any]) -> Dict[str, Any]:
from .pa_provider import get_workspace_dir
rel_path = arguments.get("path", "")
if not rel_path:
return {"error": "path parameter is required"}
workspace = get_workspace_dir()
try:
target = (workspace / rel_path).resolve()
if not str(target).startswith(str(workspace.resolve())):
return {"error": "Access outside the workspace is not allowed"}
if not target.exists():
return {"error": f"File not found: {rel_path}"}
if not target.is_file():
return {"error": f"Path is not a file (directories cannot be deleted): {rel_path}"}
target.unlink()
return {"path": rel_path, "deleted": True}
except Exception as exc:
return {"error": f"Delete failed: {exc}"}