{"eval":{"version":"openagentskill-skill-eval-v1","slug":"nkai-decision-team-llm-pysc2","name":"LLM PySC2","generated_at":"2026-07-03T22:22:31.351Z","task_input":"Evaluate LLM PySC2 before installing it in an AI agent workflow","status":"review","score":63,"risk_level":"medium","decision":{"recommendation":"manual_review","reason":"Test manually in an isolated workspace and compare against safer alternatives.","auto_install_allowed":false,"policy":"review","human_review_required":true},"task_fit":{"score":94,"suited_tasks":["Sports analytics workflows","Claude Code teams","builders willing to evaluate younger projects","Load football datasets","Compare teams and players","Explain match and tournament signals","Inspect repository metadata","Compare code changes"],"suited_agents":["Python","LLM","Codex","Claude Code","Cursor","OpenAgentSkill CLI","CLI"]},"install":{"command":"npx skills add NKAI-Decision-Team/LLM-PySC2","ready":true,"policy":"review","safety_label":"Avoid automatic install","targets":[{"id":"openagentskill-cli","label":"CLI","kind":"command","value":"npx skills add NKAI-Decision-Team/LLM-PySC2"},{"id":"codex","label":"Codex","kind":"agent-prompt","value":"Install the \"LLM PySC2\" agent skill from https://github.com/NKAI-Decision-Team/LLM-PySC2. Read its SKILL.md or equivalent instructions first, install only the files needed for this workspace, and summarize any required setup before using it. Skill purpose: LLM-PySC2 is NKAI Decision Team and NUDT Decision Team's Python component of the StarCraft II LLM Decision Environment. It exposes Deepmind's PySC2 Learning Environment API as a Python LLM Environment."},{"id":"claude-code","label":"Claude Code","kind":"agent-prompt","value":"Add \"LLM PySC2\" as a Claude Code skill from https://github.com/NKAI-Decision-Team/LLM-PySC2. Inspect the skill instructions, place the reusable skill files in the appropriate local skills location for this project, and report the activation steps. Skill purpose: LLM-PySC2 is NKAI Decision Team and NUDT Decision Team's Python component of the StarCraft II LLM Decision Environment. It exposes Deepmind's PySC2 Learning Environment API as a Python LLM Environment."},{"id":"cursor","label":"Cursor","kind":"agent-prompt","value":"Turn \"LLM PySC2\" from https://github.com/NKAI-Decision-Team/LLM-PySC2 into a reusable Cursor project rule or agent instruction. Preserve the core workflow, adapt paths to this repo, and keep the rule scoped to tasks where it is relevant. Skill purpose: LLM-PySC2 is NKAI Decision Team and NUDT Decision Team's Python component of the StarCraft II LLM Decision Environment. It exposes Deepmind's PySC2 Learning Environment API as a Python LLM Environment."}]},"trust":{"score":73,"label":"Strong shortlist","version":"trust-score-v4","evidence":{"stars":"156 GitHub stars","repoActivity":"156 stars, 16 forks","lastPushed":"1y since push","license":"Apache-2.0","repository":"https://github.com/NKAI-Decision-Team/LLM-PySC2","install":"npx skills add NKAI-Decision-Team/LLM-PySC2","installSafety":"standard package or runtime install path","permissionSurface":"filesystem or document access, network or browser access","documentation":"Strong README/SKILL.md context","agentOutcomes":"No agent outcome data yet"}},"audit":{"score":65,"risk_level":"needs_review","risk_label":"Needs review","warnings":["Repository appears stale","Repository looks stale","Quality score needs review","Stars/forks activity: 156 stars, 16 forks; issue activity unavailable in current metadata","Recent maintenance: 1y since push"]},"safety_gate":{"score":49,"tier":"experimental","label":"Experimental","auto_install_policy":"review","blocked":false,"permission_hints":[{"id":"network","label":"Network access","reason":"Skill likely fetches remote pages, APIs, repositories, or external services.","severity":"medium"},{"id":"filesystem","label":"Filesystem access","reason":"Skill may read or write project files, documents, generated artifacts, or local workspace state.","severity":"medium"}],"policy_warnings":["Repository appears stale"]},"checks":[{"id":"task_fit","label":"Task fit","status":"pass","score":94,"required_for_auto_install":true,"detail":"Task wording matches this skill metadata.","evidence":["Evaluate LLM PySC2 before installing it in an AI agent workflow","agent-frameworks","Sports analytics workflows; Claude Code teams; builders willing to evaluate younger projects"]},{"id":"install_path","label":"Install path","status":"pass","score":92,"required_for_auto_install":true,"detail":"Install handoff is available.","evidence":["npx skills add NKAI-Decision-Team/LLM-PySC2"]},{"id":"install_safety","label":"Install command safety","status":"pass","score":92,"required_for_auto_install":true,"detail":"standard package or runtime install path","evidence":["npx skills add NKAI-Decision-Team/LLM-PySC2"]},{"id":"trust_score","label":"Trust score","status":"warn","score":73,"required_for_auto_install":true,"detail":"Good trust signals with a few areas worth checking before rollout.","evidence":["Strong shortlist","156 GitHub stars","Apache-2.0"]},{"id":"audit_score","label":"Audit score","status":"warn","score":65,"required_for_auto_install":true,"detail":"Needs review","evidence":["Repository appears stale"]},{"id":"agent_safety_gate","label":"Agent safety gate","status":"warn","score":49,"required_for_auto_install":true,"detail":"Sparse or mixed signals. Useful for discovery, but not for autonomous installation.","evidence":["Test manually in an isolated workspace and compare against safer alternatives.","Repository appears stale"]},{"id":"readme_skillmd_completeness","label":"README/SKILL.md completeness","status":"pass","score":90,"required_for_auto_install":false,"detail":"Metadata includes enough usage and workflow context","evidence":["Strong README/SKILL.md context"]},{"id":"license_clarity","label":"License clarity","status":"pass","score":86,"required_for_auto_install":true,"detail":"Apache-2.0","evidence":["Apache-2.0"]},{"id":"recent_maintenance","label":"Recent maintenance","status":"fail","score":38,"required_for_auto_install":false,"detail":"1y since push","evidence":["1y since push"]},{"id":"permission_surface","label":"Permission surface","status":"warn","score":72,"required_for_auto_install":true,"detail":"filesystem or document access, network or browser access","evidence":["Network access: medium","Filesystem access: medium"]},{"id":"alternatives","label":"Alternatives available","status":"pass","score":82,"required_for_auto_install":false,"detail":"Alternative skills are available for comparison.","evidence":["significant-gravitas-autogpt","langchain-ai-langchain","nousresearch-hermes-agent","firecrawl-firecrawl"]}],"blockers":[],"warnings":["Trust score: Good trust signals with a few areas worth checking before rollout.","Audit score: Needs review","Agent safety gate: Sparse or mixed signals. Useful for discovery, but not for autonomous installation.","Permission surface: filesystem or document access, network or browser access","Repository appears stale","Repository looks stale","Quality score needs review","Stars/forks activity: 156 stars, 16 forks; issue activity unavailable in current metadata","Recent maintenance: 1y since push"],"validation_plan":["Inspect repository, README/SKILL.md, license, and recent commits before production use.","Install in an isolated workspace or sandbox with no production secrets available.","Run the smallest representative task and record files touched, commands run, network access, and outputs.","Compare the selected skill against at least one alternative when the eval status is review or failed.","Promote only after the agent reports a successful verification result and unresolved warnings are accepted."],"do_not_use_when":["teams that require actively maintained dependencies","production agents without a repository review","Repository looks stale","No OpenAgentSkill engagement data yet","Repository appears stale","Quality score needs review","Stars/forks activity: 156 stars, 16 forks; issue activity unavailable in current metadata","Recent maintenance: 1y since push"],"alternatives":[{"slug":"significant-gravitas-autogpt","name":"AutoGPT","url":"https://www.openagentskill.com/skills/significant-gravitas-autogpt","stars":185244,"install_command":"npx skills add Significant-Gravitas/AutoGPT","trust_score":86,"audit_score":92},{"slug":"langchain-ai-langchain","name":"Langchain","url":"https://www.openagentskill.com/skills/langchain-ai-langchain","stars":140782,"install_command":"npx skills add langchain-ai/langchain","trust_score":92,"audit_score":95},{"slug":"nousresearch-hermes-agent","name":"Hermes Agent","url":"https://www.openagentskill.com/skills/nousresearch-hermes-agent","stars":205451,"install_command":"npx skills add NousResearch/hermes-agent","trust_score":92,"audit_score":95},{"slug":"firecrawl-firecrawl","name":"Firecrawl","url":"https://www.openagentskill.com/skills/firecrawl-firecrawl","stars":139273,"install_command":"npx skills add firecrawl/firecrawl","trust_score":91,"audit_score":94}],"machine_metadata":{"version":"openagentskill-agent-metadata-v2","skill":{"slug":"nkai-decision-team-llm-pysc2","name":"LLM PySC2","description":"LLM-PySC2 is NKAI Decision Team and NUDT Decision Team's Python component of the StarCraft II LLM Decision Environment. It exposes Deepmind's PySC2 Learning Environment API as a Python LLM Environment.","category":"agent-frameworks","url":"https://www.openagentskill.com/skills/nkai-decision-team-llm-pysc2","repository":"https://github.com/NKAI-Decision-Team/LLM-PySC2","github_repo":"NKAI-Decision-Team/LLM-PySC2"},"suited_tasks":["Sports analytics workflows","Claude Code teams","builders willing to evaluate younger projects","Load football datasets","Compare teams and players","Explain match and tournament signals","Inspect repository metadata","Compare code changes"],"suited_agents":["Python","LLM","Codex","Claude Code","Cursor","OpenAgentSkill CLI","CLI"],"install":{"command":"npx skills add NKAI-Decision-Team/LLM-PySC2","ready":true,"targets":[{"id":"openagentskill-cli","label":"CLI","kind":"command","value":"npx skills add NKAI-Decision-Team/LLM-PySC2"},{"id":"codex","label":"Codex","kind":"agent-prompt","value":"Install the \"LLM PySC2\" agent skill from https://github.com/NKAI-Decision-Team/LLM-PySC2. Read its SKILL.md or equivalent instructions first, install only the files needed for this workspace, and summarize any required setup before using it. Skill purpose: LLM-PySC2 is NKAI Decision Team and NUDT Decision Team's Python component of the StarCraft II LLM Decision Environment. It exposes Deepmind's PySC2 Learning Environment API as a Python LLM Environment."},{"id":"claude-code","label":"Claude Code","kind":"agent-prompt","value":"Add \"LLM PySC2\" as a Claude Code skill from https://github.com/NKAI-Decision-Team/LLM-PySC2. Inspect the skill instructions, place the reusable skill files in the appropriate local skills location for this project, and report the activation steps. Skill purpose: LLM-PySC2 is NKAI Decision Team and NUDT Decision Team's Python component of the StarCraft II LLM Decision Environment. It exposes Deepmind's PySC2 Learning Environment API as a Python LLM Environment."},{"id":"cursor","label":"Cursor","kind":"agent-prompt","value":"Turn \"LLM PySC2\" from https://github.com/NKAI-Decision-Team/LLM-PySC2 into a reusable Cursor project rule or agent instruction. Preserve the core workflow, adapt paths to this repo, and keep the rule scoped to tasks where it is relevant. Skill purpose: LLM-PySC2 is NKAI Decision Team and NUDT Decision Team's Python component of the StarCraft II LLM Decision Environment. It exposes Deepmind's PySC2 Learning Environment API as a Python LLM Environment."}],"handoff_url":"https://www.openagentskill.com/api/skills/nkai-decision-team-llm-pysc2/install","manifest_url":"https://www.openagentskill.com/api/registry/manifest/nkai-decision-team-llm-pysc2"},"trust":{"score":73,"label":"Strong shortlist","version":"trust-score-v4","install_policy":"human_review_before_install","evidence":{"stars":"156 GitHub stars","repoActivity":"156 stars, 16 forks","lastPushed":"1y since push","license":"Apache-2.0","repository":"https://github.com/NKAI-Decision-Team/LLM-PySC2","install":"npx skills add NKAI-Decision-Team/LLM-PySC2","installSafety":"standard package or runtime install path","permissionSurface":"filesystem or document access, network or browser access","documentation":"Strong README/SKILL.md context","agentOutcomes":"No agent outcome data yet"},"outcome_evidence":{"total":0,"successes":0,"failures":0,"not_relevant":0,"success_rate":null,"recent_success_rate":null,"recent_failure_rate":null,"install_attempts":0,"install_success_rate":null,"risk_blocked":0,"setup_required":0,"avg_output_quality":null,"production_outcomes":0,"last_outcome_at":null,"label":"No agent outcome data yet"},"auto_install":{"allowed":false,"sandbox_required":true,"reason":"Human review or sandbox validation is required before automatic installation."},"best_for":["agent-frameworks","llm-agent","agents","environment","llm","llm-pysc2"],"known_risks":["Repository looks stale","Quality score needs review","Stars/forks activity: 156 stars, 16 forks; issue activity unavailable in current metadata","Recent maintenance: 1y since push"]},"agent_proven":{"version":"agent-proven-v1","score":0,"tier":"unproven","label":"Needs first agent run","summary":"No agent outcome reports yet. Use Resolve, run one narrow sandbox task, then report the result.","metrics":{"totalOutcomes":0,"successfulOutcomes":0,"failedOutcomes":0,"installAttempts":0,"installSuccessRate":null,"successRate":null,"recentSuccessRate":null,"recentFailureRate":null,"riskBlocked":0,"setupRequired":0,"notRelevant":0,"avgOutputQuality":null,"avgTimeToUsefulMs":null,"productionOutcomes":0,"humanReviewRequired":0,"uniqueAgents":0,"lastOutcomeAt":null},"signals":[],"penalties":["No real agent outcome evidence yet"]},"audit":{"score":65,"risk_level":"needs_review","risk_label":"Needs review","warnings":["Repository appears stale","Repository looks stale","Quality score needs review","Stars/forks activity: 156 stars, 16 forks; issue activity unavailable in current metadata","Recent maintenance: 1y since push"]},"safety_gate":{"tier":"experimental","label":"Experimental","auto_install_policy":"review","auto_install_allowed":false,"human_review_required":true,"blocked":false,"recommended_action":"Test manually in an isolated workspace and compare against safer alternatives."},"quality":{"score":48,"label":"Needs review"},"supply":{"track":"Coding and developer agents","scenario":"GitHub automation","maintenance":"1y since push","risk":"Needs review"},"alternative_skills":[{"slug":"significant-gravitas-autogpt","name":"AutoGPT","url":"https://www.openagentskill.com/skills/significant-gravitas-autogpt","stars":185244,"install_command":"npx skills add Significant-Gravitas/AutoGPT","trust_score":86,"audit_score":92},{"slug":"langchain-ai-langchain","name":"Langchain","url":"https://www.openagentskill.com/skills/langchain-ai-langchain","stars":140782,"install_command":"npx skills add langchain-ai/langchain","trust_score":92,"audit_score":95},{"slug":"nousresearch-hermes-agent","name":"Hermes Agent","url":"https://www.openagentskill.com/skills/nousresearch-hermes-agent","stars":205451,"install_command":"npx skills add NousResearch/hermes-agent","trust_score":92,"audit_score":95},{"slug":"firecrawl-firecrawl","name":"Firecrawl","url":"https://www.openagentskill.com/skills/firecrawl-firecrawl","stars":139273,"install_command":"npx skills add firecrawl/firecrawl","trust_score":91,"audit_score":94}],"do_not_use_when":["teams that require actively maintained dependencies","production agents without a repository review","Repository looks stale","No OpenAgentSkill engagement data yet","Repository appears stale","Quality score needs review","Stars/forks activity: 156 stars, 16 forks; issue activity unavailable in current metadata","Recent maintenance: 1y since push"],"agent_contract":{"task_input":"Evaluate LLM PySC2 before installing it in an AI agent workflow","recommended_action":"Test manually in an isolated workspace and compare against safer alternatives.","install_policy":"review","minimum_review_before_use":["Trust: 73/100 Strong shortlist","Audit: 65/100 Needs review","Safety: 49/100 Avoid automatic install","Review repository, license, install command, and permission surface before production use."],"expected_agent_output":{"selected_skill":"nkai-decision-team-llm-pysc2 (LLM PySC2)","install_command":"npx skills add NKAI-Decision-Team/LLM-PySC2","risk_summary":"Needs review; Experimental; Review before production","verification_result":"Report the smallest successful task, files touched, warnings, and any missing setup."}},"outcome_feedback":{"endpoint":"https://www.openagentskill.com/api/agent/outcome","method":"POST","requires_resolve_event_id":true,"event_id_source":"Use install_receipt.outcome_feedback.event_id or feedback.event_id returned by /api/agent/resolve for the current task.","expected_outcomes":["success","failed","not_relevant","blocked_by_risk","setup_required"],"payload_template":{"event_id":"<install_receipt.outcome_feedback.event_id or feedback.event_id from /api/agent/resolve>","skill_slug":"nkai-decision-team-llm-pysc2","task":"Evaluate LLM PySC2 before installing it in an AI agent workflow","agent":"codex","outcome":"success","install_used":true,"risk_blocked":false,"setup_required":false,"task_success":true,"output_quality":4,"error_type":null,"human_review_required":false,"workspace":"sandbox","time_to_useful_ms":120000,"notes":"Report the smallest successful task, setup friction, files touched, and risk notes."}},"endpoints":{"web":"https://www.openagentskill.com/skills/nkai-decision-team-llm-pysc2","api":"https://www.openagentskill.com/api/agent/skills/nkai-decision-team-llm-pysc2","audit":"https://www.openagentskill.com/skills/nkai-decision-team-llm-pysc2/audit","eval":"https://www.openagentskill.com/api/agent/evals?slug=nkai-decision-team-llm-pysc2&task=Evaluate%20LLM%20PySC2%20before%20installing%20it%20in%20an%20AI%20agent%20workflow&max_risk=medium","resolve":"https://www.openagentskill.com/api/agent/resolve?task=Evaluate%20LLM%20PySC2%20before%20installing%20it%20in%20an%20AI%20agent%20workflow&agent=codex&max_risk=medium","receipt":"https://www.openagentskill.com/api/agent/receipt?task=Evaluate%20LLM%20PySC2%20before%20installing%20it%20in%20an%20AI%20agent%20workflow&agent=codex&max_risk=medium&format=text","install":"https://www.openagentskill.com/api/skills/nkai-decision-team-llm-pysc2/install","manifest":"https://www.openagentskill.com/api/registry/manifest/nkai-decision-team-llm-pysc2"}},"endpoints":{"web":"https://www.openagentskill.com/skills/nkai-decision-team-llm-pysc2","api":"https://www.openagentskill.com/api/agent/skills/nkai-decision-team-llm-pysc2","eval":"https://www.openagentskill.com/api/agent/evals?slug=nkai-decision-team-llm-pysc2","audit":"https://www.openagentskill.com/skills/nkai-decision-team-llm-pysc2/audit","resolve":"https://www.openagentskill.com/api/agent/resolve?task=Evaluate%20LLM%20PySC2%20before%20installing%20it%20in%20an%20AI%20agent%20workflow&agent=codex&max_risk=medium"}},"meta":{"endpoint":"/api/agent/evals","mode":"skill_eval","purpose":"Pre-install eval contract for a single skill. Agents should read this before installing a reusable skill.","generated_at":"2026-07-03T22:22:31.351Z"}}