{"slug":"livecodebench-livecodebench","name":"LiveCodeBench","description":"Official repository for the paper \"LiveCodeBench: Holistic and Contamination Free Evaluation of Large Language Models for Code\"","tagline":"Official repository for the paper \"LiveCodeBench: Holistic and Contamination Free Evaluation of Large Language Models for Code\"","category":"testing-qa","tags":["test-generation","qa","developer-tools","coding","code-execution","code-generation","code-llms","code-repair","gpt-4","python"],"author":{"name":"LiveCodeBench","verified":false,"url":"https://github.com/LiveCodeBench"},"attribution":{"status":"community_indexed","statusLabel":"Community indexed","shortLabel":"COMMUNITY INDEXED","sourceLabel":"GitHub star discovery","sourceDetail":"LiveCodeBench/LiveCodeBench","creatorName":"LiveCodeBench","creatorUrl":"https://github.com/LiveCodeBench","sourceUrl":"https://github.com/LiveCodeBench/LiveCodeBench","indexedBy":"OpenAgentSkill community index","claimUrl":"https://www.openagentskill.com/skills/livecodebench-livecodebench#claim-this-skill","claimCta":"Claim this skill","trustNote":"This listing was indexed from public sources and is not marked official until a maintainer claim is approved.","publicNote":"Attribution links to the public repository or creator profile. Creators can claim the listing to update ownership signals."},"stats":{"stars":885,"forks":191,"downloads":0,"rating":0,"review_count":0,"quality_score":43.33},"quality":{"score":69,"tier":"promising","label":"Promising","summary":"Useful candidate, but compare it with alternatives before adopting.","signals":[{"label":"GitHub stars","value":"885","tone":"positive"},{"label":"Freshness","value":"11mo ago","tone":"positive"},{"label":"Install ready","value":"Yes","tone":"positive"},{"label":"License","value":"MIT","tone":"neutral"}],"warnings":[]},"trust":{"score":82,"tier":"strong","label":"Strong shortlist","summary":"Good trust signals with a few areas worth checking before rollout.","recommendedAction":"Test in a sandbox workflow and compare its install path with close alternatives.","dimensions":[{"id":"github_adoption","label":"GitHub adoption","score":76,"weight":0.16,"status":"info","detail":"885 GitHub stars"},{"id":"maintenance","label":"Recent maintenance","score":62,"weight":0.18,"status":"info","detail":"11mo since push"},{"id":"license","label":"License clarity","score":86,"weight":0.1,"status":"pass","detail":"MIT"},{"id":"documentation","label":"README/SKILL.md completeness","score":90,"weight":0.16,"status":"pass","detail":"Metadata includes enough usage and workflow context"},{"id":"dependency_risk","label":"Dependency risk","score":90,"weight":0.14,"status":"pass","detail":"no major dependency risk hints in public metadata"},{"id":"installability","label":"Install availability","score":92,"weight":0.14,"status":"pass","detail":"npx skills add LiveCodeBench/LiveCodeBench"},{"id":"repository","label":"Repository evidence","score":86,"weight":0.06,"status":"pass","detail":"https://github.com/LiveCodeBench/LiveCodeBench"},{"id":"review_status","label":"Review status","score":88,"weight":0.06,"status":"pass","detail":"AI review data available"}],"checks":[{"status":"info","label":"GitHub adoption","detail":"885 GitHub stars"},{"status":"info","label":"Recent maintenance","detail":"11mo since push"},{"status":"pass","label":"License clarity","detail":"MIT"},{"status":"pass","label":"README/SKILL.md completeness","detail":"Metadata includes enough usage and workflow context"},{"status":"pass","label":"Dependency risk","detail":"no major dependency risk hints in public metadata"},{"status":"pass","label":"Install availability","detail":"npx skills add LiveCodeBench/LiveCodeBench"},{"status":"pass","label":"Repository evidence","detail":"https://github.com/LiveCodeBench/LiveCodeBench"},{"status":"pass","label":"Review status","detail":"AI review data available"},{"status":"warn","label":"Ownership","detail":"No approved owner claim yet"},{"status":"info","label":"OpenAgentSkill usage","detail":"No local usage activity yet"}],"strengths":["AI review approved","Install path is available","Repository evidence is available","Meaningful GitHub adoption signal"],"warnings":["Quality score needs review"]},"safety":{"score":64,"level":"review_before_install","label":"Review before install","safety_tier":{"tier":"reviewed","label":"Reviewed with permission notes","badge":"REVIEWED","summary":"Usable candidate, but the agent should surface permission and audit notes before installation.","recommended_action":"Require human approval before installing into a real workspace.","auto_install_policy":"review","reasons":["Quality score needs review","64/100 agent safety score"]},"auto_install_allowed":false,"human_review_required":true,"blocked":false,"audit_risk":"needs_review","permission_hints":[{"id":"network","label":"Network access","reason":"Skill likely fetches remote pages, APIs, repositories, or external services.","severity":"medium"},{"id":"filesystem","label":"Filesystem access","reason":"Skill may read or write project files, documents, generated artifacts, or local workspace state.","severity":"medium"}],"policy_warnings":["Quality score needs review"],"constraints_applied":{"max_risk":"medium","needs_install_command":true,"min_stars":0}},"safety_gate":{"tier":"reviewed","label":"Reviewed with permission notes","badge":"REVIEWED","auto_install_policy":"review","auto_install_allowed":false,"human_review_required":true,"blocked":false,"recommended_action":"Require human approval before installing into a real workspace.","reasons":["Quality score needs review","64/100 agent safety score"]},"supply_profile":{"track":{"slug":"coding","label":"Coding and developer agents","shortLabel":"Coding","description":"Code review, repo analysis, testing, CI, GitHub, DevOps, and developer workflow skills."},"scenario":{"label":"Coding agents","description":"I need a coding agent that can understand a repository, edit code, and review pull requests.","useCases":[{"slug":"coding-agents","title":"Coding agents"},{"slug":"github-automation","title":"GitHub automation"},{"slug":"testing-qa","title":"Testing and QA"}]},"applicableAgents":["Claude Code","OpenAI Agents","CLI","Codex","Cursor"],"install":{"ready":true,"command":"npx skills add LiveCodeBench/LiveCodeBench","primaryTarget":"CLI","targetCount":4},"githubQuality":{"stars":885,"starsLabel":"885","forks":191,"license":"MIT","qualityScore":69,"trustScore":82,"auditScore":80},"maintenance":{"status":"stable","label":"11mo since push","daysSincePush":335,"lastPushedAt":"2025-07-16T00:58:38+00:00"},"risk":{"level":"needs_review","label":"Needs review","requiresReview":true,"notes":["Quality score needs review","Needs review"]},"coverageTags":["Coding","Coding agents","testing-qa","test-generation","qa","developer-tools","code-execution","code-generation"]},"audit":{"audit_score":80,"risk_level":"needs_review","risk_label":"Needs review","warnings":["Quality score needs review"]},"decision":{"readiness_score":71,"readiness_label":"Prototype first","headline":"Fallback candidate for Coding agents","role":"Fallback candidate","primary_fit":"Coding agents","best_for":["Coding agents workflows","Claude Code teams","teams that value GitHub adoption signals"],"risks":["No OpenAgentSkill engagement data yet"],"next_steps":["Install it in a sandbox agent and run one Coding agents task end to end.","Compare output quality, latency, and failure behavior against at least one alternative.","Promote it into production only after reviewing repository permissions, license, and maintenance signals."]},"platforms":["Python","Testing","Claude Code","OpenAI Agents"],"use_cases":[{"slug":"coding-agents","title":"Coding agents","url":"https://www.openagentskill.com/use-cases/coding-agents"},{"slug":"github-automation","title":"GitHub automation","url":"https://www.openagentskill.com/use-cases/github-automation"},{"slug":"testing-qa","title":"Testing and QA","url":"https://www.openagentskill.com/use-cases/testing-qa"},{"slug":"rag-knowledge","title":"RAG and knowledge","url":"https://www.openagentskill.com/use-cases/rag-knowledge"}],"install":"npx skills add LiveCodeBench/LiveCodeBench","install_targets":[{"id":"openagentskill-cli","label":"CLI","title":"OpenAgentSkill CLI","kind":"command","value":"npx skills add LiveCodeBench/LiveCodeBench","description":"Use the registry command when your workflow supports the OpenAgentSkill installer.","copyLabel":"Copy command"},{"id":"codex","label":"Codex","title":"Codex install prompt","kind":"agent-prompt","value":"Install the \"LiveCodeBench\" agent skill from https://github.com/LiveCodeBench/LiveCodeBench. Read its SKILL.md or equivalent instructions first, install only the files needed for this workspace, and summarize any required setup before using it. Skill purpose: Official repository for the paper \"LiveCodeBench: Holistic and Contamination Free Evaluation of Large Language Models for Code\"","description":"Give Codex a repo-aware install prompt when the skill is not available through a local CLI.","copyLabel":"Copy prompt"},{"id":"claude-code","label":"Claude Code","title":"Claude Code skill prompt","kind":"agent-prompt","value":"Add \"LiveCodeBench\" as a Claude Code skill from https://github.com/LiveCodeBench/LiveCodeBench. Inspect the skill instructions, place the reusable skill files in the appropriate local skills location for this project, and report the activation steps. Skill purpose: Official repository for the paper \"LiveCodeBench: Holistic and Contamination Free Evaluation of Large Language Models for Code\"","description":"Use this prompt to ask Claude Code to add the skill and explain the local activation steps.","copyLabel":"Copy prompt"},{"id":"cursor","label":"Cursor","title":"Cursor rule prompt","kind":"agent-prompt","value":"Turn \"LiveCodeBench\" from https://github.com/LiveCodeBench/LiveCodeBench into a reusable Cursor project rule or agent instruction. Preserve the core workflow, adapt paths to this repo, and keep the rule scoped to tasks where it is relevant. Skill purpose: Official repository for the paper \"LiveCodeBench: Holistic and Contamination Free Evaluation of Large Language Models for Code\"","description":"Use this when installing as Cursor project rules or reusable agent instructions.","copyLabel":"Copy prompt"}],"repository":"https://github.com/LiveCodeBench/LiveCodeBench","github_repo":"LiveCodeBench/LiveCodeBench","version":"1.0.0","license":"MIT","updated_at":"2026-06-16T08:45:50.199197+00:00","canonical_key":"livecodebench/livecodebench","recommendation_reasons":["Useful GitHub adoption: 885 stars","Install handoff is available","Repository freshness signal is available"],"urls":{"web":"https://www.openagentskill.com/skills/livecodebench-livecodebench","api":"https://www.openagentskill.com/api/agent/skills/livecodebench-livecodebench","install_api":"https://www.openagentskill.com/api/skills/livecodebench-livecodebench/install","audit":"https://www.openagentskill.com/skills/livecodebench-livecodebench/audit","repository":"https://github.com/LiveCodeBench/LiveCodeBench"},"meta":{"endpoint":"/api/registry/manifest/{slug}","canonical_agent_endpoint":"/api/agent/skills/livecodebench-livecodebench","agent_friendly":true,"api_version":"1.0","generated_at":"2026-06-16T11:07:52.662Z"}}