{"id":"efd6f1d8-1bc5-481a-88c7-30634363e423","shortId":"Q9bbnn","kind":"skill","title":"Evaluate long-horizon agents against WildClawBench","tagline":"Use WildClawBench to benchmark agents on hard end-to-end OpenClaw tasks covering tool orchestration, multimodal work, coding, safety, and long-horizon planning.","description":"# Evaluate long-horizon agents against WildClawBench\n\nUse WildClawBench to benchmark agents on hard end-to-end OpenClaw tasks covering tool orchestration, multimodal work, coding, safety, and long-horizon planning.\n\n## Prerequisites\n\nWildClawBench assets; OpenClaw environment; target agent/model under test\n\n## Installation\n\nNo source-backed install or usage instructions could be extracted automatically. Review the upstream project before running this skill in a sensitive workflow.\n\n- Source: https://github.com/InternLM/WildClawBench\n\n## Documentation\n\n- https://internlm.github.io/WildClawBench/\n\n## Source\n\n- [Agent Skill Exchange](https://agentskillexchange.com/skills/evaluate-long-horizon-agents-against-wildclawbench/)","tags":["evaluate","long","horizon","agents","against","wildclawbench","skills","agentskillexchange","agent-skills","ai-agents","ai-tools","awesome-list"],"capabilities":["skill","source-agentskillexchange","skill-evaluate-long-horizon-agents-against-wildclawbench","topic-agent-skills","topic-ai-agents","topic-ai-tools","topic-awesome-list","topic-claude-code","topic-codex","topic-cursor","topic-llm","topic-mcp","topic-npx-skills","topic-openclaw","topic-skills-catalog"],"categories":["skills"],"synonyms":[],"warnings":[],"endpointUrl":"https://skills.sh/agentskillexchange/skills/evaluate-long-horizon-agents-against-wildclawbench","protocol":"skill","transport":"skills-sh","auth":{"type":"none","details":{"cli":"npx skills add agentskillexchange/skills","source_repo":"https://github.com/agentskillexchange/skills","install_from":"skills.sh"}},"qualityScore":"0.454","qualityRationale":"deterministic score 0.45 from registry signals: · indexed on github topic:agent-skills · 8 github stars · SKILL.md body (729 chars)","verified":false,"liveness":"unknown","lastLivenessCheck":null,"agentReviews":{"count":0,"score_avg":null,"cost_usd_avg":null,"success_rate":null,"latency_p50_ms":null,"narrative_summary":null,"summary_updated_at":null},"enrichmentModel":"deterministic:skill-github:v1","enrichmentVersion":1,"enrichedAt":"2026-05-18T19:10:22.922Z","embedding":null,"createdAt":"2026-05-18T13:16:26.426Z","updatedAt":"2026-05-18T19:10:22.922Z","lastSeenAt":"2026-05-18T19:10:22.922Z","tsv":"'/internlm/wildclawbench':102 '/skills/evaluate-long-horizon-agents-against-wildclawbench/)':113 '/wildclawbench/':106 'agent':5,12,37,44,108 'agent/model':71 'agentskillexchange.com':112 'agentskillexchange.com/skills/evaluate-long-horizon-agents-against-wildclawbench/)':111 'asset':67 'automat':86 'back':78 'benchmark':11,43 'code':26,58 'could':83 'cover':21,53 'document':103 'end':16,18,48,50 'end-to-end':15,47 'environ':69 'evalu':1,33 'exchang':110 'extract':85 'github.com':101 'github.com/internlm/wildclawbench':100 'hard':14,46 'horizon':4,31,36,63 'instal':74,79 'instruct':82 'internlm.github.io':105 'internlm.github.io/wildclawbench/':104 'long':3,30,35,62 'long-horizon':2,29,34,61 'multimod':24,56 'openclaw':19,51,68 'orchestr':23,55 'plan':32,64 'prerequisit':65 'project':90 'review':87 'run':92 'safeti':27,59 'sensit':97 'skill':94,109 'skill-evaluate-long-horizon-agents-against-wildclawbench' 'sourc':77,99,107 'source-agentskillexchange' 'source-back':76 'target':70 'task':20,52 'test':73 'tool':22,54 'topic-agent-skills' 'topic-ai-agents' 'topic-ai-tools' 'topic-awesome-list' 'topic-claude-code' 'topic-codex' 'topic-cursor' 'topic-llm' 'topic-mcp' 'topic-npx-skills' 'topic-openclaw' 'topic-skills-catalog' 'upstream':89 'usag':81 'use':8,40 'wildclawbench':7,9,39,41,66 'work':25,57 'workflow':98","prices":[{"id":"8b849869-9e91-4b8d-9f52-e4abca55e2c9","listingId":"efd6f1d8-1bc5-481a-88c7-30634363e423","amountUsd":"0","unit":"free","nativeCurrency":null,"nativeAmount":null,"chain":null,"payTo":null,"paymentMethod":"skill-free","isPrimary":true,"details":{"org":"agentskillexchange","category":"skills","install_from":"skills.sh"},"createdAt":"2026-05-18T13:16:26.426Z"}],"sources":[{"listingId":"efd6f1d8-1bc5-481a-88c7-30634363e423","source":"github","sourceId":"agentskillexchange/skills/evaluate-long-horizon-agents-against-wildclawbench","sourceUrl":"https://github.com/agentskillexchange/skills/tree/main/skills/evaluate-long-horizon-agents-against-wildclawbench","isPrimary":false,"firstSeenAt":"2026-05-18T13:16:26.426Z","lastSeenAt":"2026-05-18T19:10:22.922Z"}],"details":{"listingId":"efd6f1d8-1bc5-481a-88c7-30634363e423","quickStartSnippet":null,"exampleRequest":null,"exampleResponse":null,"schema":null,"openapiUrl":null,"agentsTxtUrl":null,"citations":[],"useCases":[],"bestFor":[],"notFor":[],"kindDetails":{"org":"agentskillexchange","slug":"evaluate-long-horizon-agents-against-wildclawbench","github":{"repo":"agentskillexchange/skills","stars":8,"topics":["agent-skills","ai-agents","ai-tools","awesome-list","claude-code","codex","cursor","llm","mcp","npx-skills","openclaw","skills-catalog"],"license":"mit","html_url":"https://github.com/agentskillexchange/skills","pushed_at":"2026-05-18T19:02:17Z","description":"The open catalog of AI agent skills — 2,000+ security-scanned skills for Claude Code, Cursor, Codex, and more.","skill_md_sha":"460ab872dc5e9825097d7712c2fec5b9e50f9bbe","skill_md_path":"skills/evaluate-long-horizon-agents-against-wildclawbench/SKILL.md","default_branch":"main","skill_tree_url":"https://github.com/agentskillexchange/skills/tree/main/skills/evaluate-long-horizon-agents-against-wildclawbench"},"layout":"multi","source":"github","category":"skills","frontmatter":{"name":"Evaluate long-horizon agents against WildClawBench","description":"Use WildClawBench to benchmark agents on hard end-to-end OpenClaw tasks covering tool orchestration, multimodal work, coding, safety, and long-horizon planning."},"skills_sh_url":"https://skills.sh/agentskillexchange/skills/evaluate-long-horizon-agents-against-wildclawbench"},"updatedAt":"2026-05-18T19:10:22.922Z"}}