{"eval":{"version":"openagentskill-skill-eval-v1","slug":"hume-vla-hume","name":"Hume","generated_at":"2026-07-03T22:22:13.413Z","task_input":"Evaluate Hume before installing it in an AI agent workflow","status":"review","score":66,"risk_level":"medium","decision":{"recommendation":"manual_review","reason":"Test manually in an isolated workspace and compare against safer alternatives.","auto_install_allowed":false,"policy":"review","human_review_required":true},"task_fit":{"score":94,"suited_tasks":["Coding agents workflows","Claude Code teams","builders willing to evaluate younger projects","Inspect source files","Explain architecture","Patch bugs and verify changes","Chunk documents","Create embeddings"],"suited_agents":["Python","Robotics","Codex","Claude Code","Cursor","OpenAgentSkill CLI","CLI"]},"install":{"command":"npx skills add hume-vla/hume","ready":true,"policy":"review","safety_label":"Avoid automatic install","targets":[{"id":"openagentskill-cli","label":"CLI","kind":"command","value":"npx skills add hume-vla/hume"},{"id":"codex","label":"Codex","kind":"agent-prompt","value":"Install the \"Hume\" agent skill from https://github.com/hume-vla/hume. Read its SKILL.md or equivalent instructions first, install only the files needed for this workspace, and summarize any required setup before using it. Skill purpose: 🦾 A Dual-System VLA with System2 Thinking"},{"id":"claude-code","label":"Claude Code","kind":"agent-prompt","value":"Add \"Hume\" as a Claude Code skill from https://github.com/hume-vla/hume. Inspect the skill instructions, place the reusable skill files in the appropriate local skills location for this project, and report the activation steps. Skill purpose: 🦾 A Dual-System VLA with System2 Thinking"},{"id":"cursor","label":"Cursor","kind":"agent-prompt","value":"Turn \"Hume\" from https://github.com/hume-vla/hume into a reusable Cursor project rule or agent instruction. Preserve the core workflow, adapt paths to this repo, and keep the rule scoped to tasks where it is relevant. Skill purpose: 🦾 A Dual-System VLA with System2 Thinking"}]},"trust":{"score":71,"label":"Manual review","version":"trust-score-v4","evidence":{"stars":"145 GitHub stars","repoActivity":"145 stars, 3 forks","lastPushed":"11mo since push","license":"Unknown","repository":"https://github.com/hume-vla/hume","install":"npx skills add hume-vla/hume","installSafety":"standard package or runtime install path","permissionSurface":"filesystem or document access","documentation":"Usable metadata, review docs","agentOutcomes":"No agent outcome data yet"}},"audit":{"score":69,"risk_level":"needs_review","risk_label":"Needs review","warnings":["License is unclear","Quality score needs review","Stars/forks activity: 145 stars, 3 forks; issue activity unavailable in current metadata","License clarity: Unknown"]},"safety_gate":{"score":53,"tier":"experimental","label":"Experimental","auto_install_policy":"review","blocked":false,"permission_hints":[{"id":"network","label":"Network access","reason":"Skill likely fetches remote pages, APIs, repositories, or external services.","severity":"medium"},{"id":"filesystem","label":"Filesystem access","reason":"Skill may read or write project files, documents, generated artifacts, or local workspace state.","severity":"medium"}],"policy_warnings":["License is unclear"]},"checks":[{"id":"task_fit","label":"Task fit","status":"pass","score":94,"required_for_auto_install":true,"detail":"Task wording matches this skill metadata.","evidence":["Evaluate Hume before installing it in an AI agent workflow","robotics-iot","Coding agents workflows; Claude Code teams; builders willing to evaluate younger projects"]},{"id":"install_path","label":"Install path","status":"pass","score":92,"required_for_auto_install":true,"detail":"Install handoff is available.","evidence":["npx skills add hume-vla/hume"]},{"id":"install_safety","label":"Install command safety","status":"pass","score":92,"required_for_auto_install":true,"detail":"standard package or runtime install path","evidence":["npx skills add hume-vla/hume"]},{"id":"trust_score","label":"Trust score","status":"warn","score":71,"required_for_auto_install":true,"detail":"Potentially useful, but at least one trust signal needs human inspection.","evidence":["Manual review","145 GitHub stars","Unknown"]},{"id":"audit_score","label":"Audit score","status":"warn","score":69,"required_for_auto_install":true,"detail":"Needs review","evidence":["License is unclear"]},{"id":"agent_safety_gate","label":"Agent safety gate","status":"warn","score":53,"required_for_auto_install":true,"detail":"Sparse or mixed signals. Useful for discovery, but not for autonomous installation.","evidence":["Test manually in an isolated workspace and compare against safer alternatives.","License is unclear"]},{"id":"readme_skillmd_completeness","label":"README/SKILL.md completeness","status":"warn","score":74,"required_for_auto_install":false,"detail":"Public metadata needs stronger README/SKILL.md context","evidence":["Usable metadata, review docs"]},{"id":"license_clarity","label":"License clarity","status":"warn","score":42,"required_for_auto_install":true,"detail":"Unknown","evidence":["Unknown"]},{"id":"recent_maintenance","label":"Recent maintenance","status":"warn","score":62,"required_for_auto_install":false,"detail":"11mo since push","evidence":["11mo since push"]},{"id":"permission_surface","label":"Permission surface","status":"pass","score":86,"required_for_auto_install":true,"detail":"filesystem or document access","evidence":["Network access: medium","Filesystem access: medium"]},{"id":"alternatives","label":"Alternatives available","status":"pass","score":82,"required_for_auto_install":false,"detail":"Alternative skills are available for comparison.","evidence":["mayocream-koharu","henryndubuaku-maths-cs-ai-compendium","ceres-solver-ceres-solver","pinto0309-pinto-model-zoo"]}],"blockers":[],"warnings":["Trust score: Potentially useful, but at least one trust signal needs human inspection.","Audit score: Needs review","Agent safety gate: Sparse or mixed signals. Useful for discovery, but not for autonomous installation.","README/SKILL.md completeness: Public metadata needs stronger README/SKILL.md context","License clarity: Unknown","Recent maintenance: 11mo since push","License is unclear","Quality score needs review","Stars/forks activity: 145 stars, 3 forks; issue activity unavailable in current metadata"],"validation_plan":["Inspect repository, README/SKILL.md, license, and recent commits before production use.","Install in an isolated workspace or sandbox with no production secrets available.","Run the smallest representative task and record files touched, commands run, network access, and outputs.","Compare the selected skill against at least one alternative when the eval status is review or failed.","Promote only after the agent reports a successful verification result and unresolved warnings are accepted."],"do_not_use_when":["teams that need a vendor-supported SLA","high-compliance environments without internal security review","No major risk signals from current metadata","License is unclear","Quality score needs review","Stars/forks activity: 145 stars, 3 forks; issue activity unavailable in current metadata","License clarity: Unknown","Production credentials, payments, or irreversible account changes without explicit human review"],"alternatives":[{"slug":"mayocream-koharu","name":"Koharu","url":"https://www.openagentskill.com/skills/mayocream-koharu","stars":4669,"install_command":"npx skills add mayocream/koharu","trust_score":89,"audit_score":94},{"slug":"henryndubuaku-maths-cs-ai-compendium","name":"Maths Cs AI Compendium","url":"https://www.openagentskill.com/skills/henryndubuaku-maths-cs-ai-compendium","stars":4528,"install_command":"npx skills add HenryNdubuaku/maths-cs-ai-compendium","trust_score":89,"audit_score":94},{"slug":"ceres-solver-ceres-solver","name":"Ceres Solver","url":"https://www.openagentskill.com/skills/ceres-solver-ceres-solver","stars":4503,"install_command":"npx skills add ceres-solver/ceres-solver","trust_score":86,"audit_score":91},{"slug":"pinto0309-pinto-model-zoo","name":"PINTO Model Zoo","url":"https://www.openagentskill.com/skills/pinto0309-pinto-model-zoo","stars":4445,"install_command":"npx skills add PINTO0309/PINTO_model_zoo","trust_score":91,"audit_score":94}],"machine_metadata":{"version":"openagentskill-agent-metadata-v2","skill":{"slug":"hume-vla-hume","name":"Hume","description":"🦾  A Dual-System VLA with System2 Thinking","category":"robotics-iot","url":"https://www.openagentskill.com/skills/hume-vla-hume","repository":"https://github.com/hume-vla/hume","github_repo":"hume-vla/hume"},"suited_tasks":["Coding agents workflows","Claude Code teams","builders willing to evaluate younger projects","Inspect source files","Explain architecture","Patch bugs and verify changes","Chunk documents","Create embeddings"],"suited_agents":["Python","Robotics","Codex","Claude Code","Cursor","OpenAgentSkill CLI","CLI"],"install":{"command":"npx skills add hume-vla/hume","ready":true,"targets":[{"id":"openagentskill-cli","label":"CLI","kind":"command","value":"npx skills add hume-vla/hume"},{"id":"codex","label":"Codex","kind":"agent-prompt","value":"Install the \"Hume\" agent skill from https://github.com/hume-vla/hume. Read its SKILL.md or equivalent instructions first, install only the files needed for this workspace, and summarize any required setup before using it. Skill purpose: 🦾 A Dual-System VLA with System2 Thinking"},{"id":"claude-code","label":"Claude Code","kind":"agent-prompt","value":"Add \"Hume\" as a Claude Code skill from https://github.com/hume-vla/hume. Inspect the skill instructions, place the reusable skill files in the appropriate local skills location for this project, and report the activation steps. Skill purpose: 🦾 A Dual-System VLA with System2 Thinking"},{"id":"cursor","label":"Cursor","kind":"agent-prompt","value":"Turn \"Hume\" from https://github.com/hume-vla/hume into a reusable Cursor project rule or agent instruction. Preserve the core workflow, adapt paths to this repo, and keep the rule scoped to tasks where it is relevant. Skill purpose: 🦾 A Dual-System VLA with System2 Thinking"}],"handoff_url":"https://www.openagentskill.com/api/skills/hume-vla-hume/install","manifest_url":"https://www.openagentskill.com/api/registry/manifest/hume-vla-hume"},"trust":{"score":71,"label":"Manual review","version":"trust-score-v4","install_policy":"human_review_before_install","evidence":{"stars":"145 GitHub stars","repoActivity":"145 stars, 3 forks","lastPushed":"11mo since push","license":"Unknown","repository":"https://github.com/hume-vla/hume","install":"npx skills add hume-vla/hume","installSafety":"standard package or runtime install path","permissionSurface":"filesystem or document access","documentation":"Usable metadata, review docs","agentOutcomes":"No agent outcome data yet"},"outcome_evidence":{"total":0,"successes":0,"failures":0,"not_relevant":0,"success_rate":null,"recent_success_rate":null,"recent_failure_rate":null,"install_attempts":0,"install_success_rate":null,"risk_blocked":0,"setup_required":0,"avg_output_quality":null,"production_outcomes":0,"last_outcome_at":null,"label":"No agent outcome data yet"},"auto_install":{"allowed":false,"sandbox_required":true,"reason":"Human review or sandbox validation is required before automatic installation."},"best_for":["robotics-iot","robotics","automation","system2-thinking","test-time-computation","vla"],"known_risks":["License is unclear","Quality score needs review","Stars/forks activity: 145 stars, 3 forks; issue activity unavailable in current metadata","License clarity: Unknown"]},"agent_proven":{"version":"agent-proven-v1","score":0,"tier":"unproven","label":"Needs first agent run","summary":"No agent outcome reports yet. Use Resolve, run one narrow sandbox task, then report the result.","metrics":{"totalOutcomes":0,"successfulOutcomes":0,"failedOutcomes":0,"installAttempts":0,"installSuccessRate":null,"successRate":null,"recentSuccessRate":null,"recentFailureRate":null,"riskBlocked":0,"setupRequired":0,"notRelevant":0,"avgOutputQuality":null,"avgTimeToUsefulMs":null,"productionOutcomes":0,"humanReviewRequired":0,"uniqueAgents":0,"lastOutcomeAt":null},"signals":[],"penalties":["No real agent outcome evidence yet"]},"audit":{"score":69,"risk_level":"needs_review","risk_label":"Needs review","warnings":["License is unclear","Quality score needs review","Stars/forks activity: 145 stars, 3 forks; issue activity unavailable in current metadata","License clarity: Unknown"]},"safety_gate":{"tier":"experimental","label":"Experimental","auto_install_policy":"review","auto_install_allowed":false,"human_review_required":true,"blocked":false,"recommended_action":"Test manually in an isolated workspace and compare against safer alternatives."},"quality":{"score":56,"label":"Promising"},"supply":{"track":"Coding and developer agents","scenario":"Coding agents","maintenance":"11mo since push","risk":"Needs review"},"alternative_skills":[{"slug":"mayocream-koharu","name":"Koharu","url":"https://www.openagentskill.com/skills/mayocream-koharu","stars":4669,"install_command":"npx skills add mayocream/koharu","trust_score":89,"audit_score":94},{"slug":"henryndubuaku-maths-cs-ai-compendium","name":"Maths Cs AI Compendium","url":"https://www.openagentskill.com/skills/henryndubuaku-maths-cs-ai-compendium","stars":4528,"install_command":"npx skills add HenryNdubuaku/maths-cs-ai-compendium","trust_score":89,"audit_score":94},{"slug":"ceres-solver-ceres-solver","name":"Ceres Solver","url":"https://www.openagentskill.com/skills/ceres-solver-ceres-solver","stars":4503,"install_command":"npx skills add ceres-solver/ceres-solver","trust_score":86,"audit_score":91},{"slug":"pinto0309-pinto-model-zoo","name":"PINTO Model Zoo","url":"https://www.openagentskill.com/skills/pinto0309-pinto-model-zoo","stars":4445,"install_command":"npx skills add PINTO0309/PINTO_model_zoo","trust_score":91,"audit_score":94}],"do_not_use_when":["teams that need a vendor-supported SLA","high-compliance environments without internal security review","No major risk signals from current metadata","License is unclear","Quality score needs review","Stars/forks activity: 145 stars, 3 forks; issue activity unavailable in current metadata","License clarity: Unknown","Production credentials, payments, or irreversible account changes without explicit human review"],"agent_contract":{"task_input":"Evaluate Hume before installing it in an AI agent workflow","recommended_action":"Test manually in an isolated workspace and compare against safer alternatives.","install_policy":"review","minimum_review_before_use":["Trust: 71/100 Manual review","Audit: 69/100 Needs review","Safety: 53/100 Avoid automatic install","Review repository, license, install command, and permission surface before production use."],"expected_agent_output":{"selected_skill":"hume-vla-hume (Hume)","install_command":"npx skills add hume-vla/hume","risk_summary":"Needs review; Experimental; Review before production","verification_result":"Report the smallest successful task, files touched, warnings, and any missing setup."}},"outcome_feedback":{"endpoint":"https://www.openagentskill.com/api/agent/outcome","method":"POST","requires_resolve_event_id":true,"event_id_source":"Use install_receipt.outcome_feedback.event_id or feedback.event_id returned by /api/agent/resolve for the current task.","expected_outcomes":["success","failed","not_relevant","blocked_by_risk","setup_required"],"payload_template":{"event_id":"<install_receipt.outcome_feedback.event_id or feedback.event_id from /api/agent/resolve>","skill_slug":"hume-vla-hume","task":"Evaluate Hume before installing it in an AI agent workflow","agent":"codex","outcome":"success","install_used":true,"risk_blocked":false,"setup_required":false,"task_success":true,"output_quality":4,"error_type":null,"human_review_required":false,"workspace":"sandbox","time_to_useful_ms":120000,"notes":"Report the smallest successful task, setup friction, files touched, and risk notes."}},"endpoints":{"web":"https://www.openagentskill.com/skills/hume-vla-hume","api":"https://www.openagentskill.com/api/agent/skills/hume-vla-hume","audit":"https://www.openagentskill.com/skills/hume-vla-hume/audit","eval":"https://www.openagentskill.com/api/agent/evals?slug=hume-vla-hume&task=Evaluate%20Hume%20before%20installing%20it%20in%20an%20AI%20agent%20workflow&max_risk=medium","resolve":"https://www.openagentskill.com/api/agent/resolve?task=Evaluate%20Hume%20before%20installing%20it%20in%20an%20AI%20agent%20workflow&agent=codex&max_risk=medium","receipt":"https://www.openagentskill.com/api/agent/receipt?task=Evaluate%20Hume%20before%20installing%20it%20in%20an%20AI%20agent%20workflow&agent=codex&max_risk=medium&format=text","install":"https://www.openagentskill.com/api/skills/hume-vla-hume/install","manifest":"https://www.openagentskill.com/api/registry/manifest/hume-vla-hume"}},"endpoints":{"web":"https://www.openagentskill.com/skills/hume-vla-hume","api":"https://www.openagentskill.com/api/agent/skills/hume-vla-hume","eval":"https://www.openagentskill.com/api/agent/evals?slug=hume-vla-hume","audit":"https://www.openagentskill.com/skills/hume-vla-hume/audit","resolve":"https://www.openagentskill.com/api/agent/resolve?task=Evaluate%20Hume%20before%20installing%20it%20in%20an%20AI%20agent%20workflow&agent=codex&max_risk=medium"}},"meta":{"endpoint":"/api/agent/evals","mode":"skill_eval","purpose":"Pre-install eval contract for a single skill. Agents should read this before installing a reusable skill.","generated_at":"2026-07-03T22:22:13.413Z"}}