Improve tool-use and computer-use agents. Built on the Model Context Protocol.
hud debug
hud analyze
uvx hud-python quickstart
claude mcp add docs-hud https://docs.hud.so/mcp
import asyncio
import os

import hud  # NOTE(review): not referenced below; kept from the original snippet -- confirm it is needed
from hud.agents import ClaudeAgent
from hud.datasets import Task


async def main() -> None:
    """Run a Claude agent on a 2048 task over a remote MCP server and print its score.

    The API key is read from the ``HUD_API_KEY`` environment variable and sent
    as a bearer token in the MCP request headers.

    Raises:
        RuntimeError: If ``HUD_API_KEY`` is unset or empty.
    """
    api_key = os.getenv("HUD_API_KEY")
    if not api_key:
        # Fail fast: interpolating a missing key would send the literal header
        # "Bearer None" instead of reporting the real problem.
        raise RuntimeError("HUD_API_KEY environment variable is not set")

    # Define evaluation task with remote MCP
    # NOTE(review): the prompt asks for the 128 tile while the evaluator
    # target below is 64 -- confirm the mismatch is intentional.
    task = Task(
        prompt="Win a game of 2048 by reaching the 128 tile",
        mcp_config={
            "hud": {
                "url": "https://mcp.hud.so/v3/mcp",
                "headers": {
                    "Authorization": f"Bearer {api_key}",
                    "Mcp-Image": "hudpython/hud-text-2048:v1.2",
                },
            },
        },
        setup_tool={
            "name": "setup",
            "arguments": {"name": "board", "arguments": {"board_size": 4}},
        },
        evaluate_tool={
            "name": "evaluate",
            "arguments": {"name": "max_number", "arguments": {"target": 64}},
        },
    )

    # Run agent (auto-creates MCP client)
    agent = ClaudeAgent()
    result = await agent.run(task)
    print(f"Score: {result.reward}")


if __name__ == "__main__":
    asyncio.run(main())
Was this page helpful?