{"eval":{"version":"openagentskill-skill-eval-v1","slug":"mabel-dev-opteryx","name":"Opteryx","generated_at":"2026-07-04T00:14:35.066Z","task_input":"Evaluate Opteryx before installing it in an AI agent workflow","status":"failed","score":73,"risk_level":"high","decision":{"recommendation":"do_not_auto_install","reason":"Permission surface: shell or command execution, filesystem or document access","auto_install_allowed":false,"policy":"block","human_review_required":true},"task_fit":{"score":94,"suited_tasks":["Database and SQL workflows","Claude Code teams","builders willing to evaluate younger projects","Understand table relationships","Write safer queries","Explain database changes","Move data between tools","Transform files"],"suited_agents":["Python","SQL","Codex","Claude Code","Cursor","OpenAgentSkill CLI","CLI"]},"install":{"command":"npx skills add mabel-dev/opteryx","ready":true,"policy":"review","safety_label":"Avoid automatic install","targets":[{"id":"openagentskill-cli","label":"CLI","kind":"command","value":"npx skills add mabel-dev/opteryx"},{"id":"codex","label":"Codex","kind":"agent-prompt","value":"Install the \"Opteryx\" agent skill from https://github.com/mabel-dev/opteryx. Read its SKILL.md or equivalent instructions first, install only the files needed for this workspace, and summarize any required setup before using it. Skill purpose: 🦖 A SQL-on-everything Query Engine you can execute over multiple databases and file formats. Query your data, where it lives."},{"id":"claude-code","label":"Claude Code","kind":"agent-prompt","value":"Add \"Opteryx\" as a Claude Code skill from https://github.com/mabel-dev/opteryx. Inspect the skill instructions, place the reusable skill files in the appropriate local skills location for this project, and report the activation steps. Skill purpose: 🦖 A SQL-on-everything Query Engine you can execute over multiple databases and file formats. Query your data, where it lives."},{"id":"cursor","label":"Cursor","kind":"agent-prompt","value":"Turn \"Opteryx\" from https://github.com/mabel-dev/opteryx into a reusable Cursor project rule or agent instruction. Preserve the core workflow, adapt paths to this repo, and keep the rule scoped to tasks where it is relevant. Skill purpose: 🦖 A SQL-on-everything Query Engine you can execute over multiple databases and file formats. Query your data, where it lives."}]},"trust":{"score":77,"label":"Strong shortlist","version":"trust-score-v4","evidence":{"stars":"113 GitHub stars","repoActivity":"113 stars, 14 forks","lastPushed":"1mo since push","license":"Apache-2.0","repository":"https://github.com/mabel-dev/opteryx","install":"npx skills add mabel-dev/opteryx","installSafety":"standard package or runtime install path","permissionSurface":"shell or command execution, filesystem or document access","documentation":"Strong README/SKILL.md context","agentOutcomes":"No agent outcome data yet"}},"audit":{"score":81,"risk_level":"needs_review","risk_label":"Needs review","warnings":["Permission surface may require sandboxing","Quality score needs review","Permission surface needs review: shell or command execution, filesystem or document access","Stars/forks activity: 113 stars, 14 forks; issue activity unavailable in current metadata","Permission surface: shell or command execution, filesystem or document access"]},"safety_gate":{"score":49,"tier":"experimental","label":"Experimental","auto_install_policy":"review","blocked":false,"permission_hints":[{"id":"shell","label":"Shell or command execution","reason":"Skill metadata references terminal, CLI, shell, subprocess, or command execution workflows.","severity":"high"},{"id":"network","label":"Network access","reason":"Skill likely fetches remote pages, APIs, repositories, or external services.","severity":"medium"},{"id":"filesystem","label":"Filesystem access","reason":"Skill may read or write project files, documents, generated artifacts, or local workspace state.","severity":"medium"},{"id":"database","label":"Database access","reason":"Skill may inspect schemas, query databases, or work with persistent stores.","severity":"medium"}],"policy_warnings":["High-risk permission hints: Shell or command execution","Permission surface may require sandboxing"]},"checks":[{"id":"task_fit","label":"Task fit","status":"pass","score":94,"required_for_auto_install":true,"detail":"Task wording matches this skill metadata.","evidence":["Evaluate Opteryx before installing it in an AI agent workflow","data-analysis","Database and SQL workflows; Claude Code teams; builders willing to evaluate younger projects"]},{"id":"install_path","label":"Install path","status":"pass","score":92,"required_for_auto_install":true,"detail":"Install handoff is available.","evidence":["npx skills add mabel-dev/opteryx"]},{"id":"install_safety","label":"Install command safety","status":"pass","score":92,"required_for_auto_install":true,"detail":"standard package or runtime install path","evidence":["npx skills add mabel-dev/opteryx"]},{"id":"trust_score","label":"Trust score","status":"warn","score":77,"required_for_auto_install":true,"detail":"Good trust signals with a few areas worth checking before rollout.","evidence":["Strong shortlist","113 GitHub stars","Apache-2.0"]},{"id":"audit_score","label":"Audit score","status":"warn","score":81,"required_for_auto_install":true,"detail":"Needs review","evidence":["Permission surface may require sandboxing"]},{"id":"agent_safety_gate","label":"Agent safety gate","status":"warn","score":49,"required_for_auto_install":true,"detail":"Sparse or mixed signals. Useful for discovery, but not for autonomous installation.","evidence":["Test manually in an isolated workspace and compare against safer alternatives.","High-risk permission hints: Shell or command execution"]},{"id":"readme_skillmd_completeness","label":"README/SKILL.md completeness","status":"pass","score":90,"required_for_auto_install":false,"detail":"Metadata includes enough usage and workflow context","evidence":["Strong README/SKILL.md context"]},{"id":"license_clarity","label":"License clarity","status":"pass","score":86,"required_for_auto_install":true,"detail":"Apache-2.0","evidence":["Apache-2.0"]},{"id":"recent_maintenance","label":"Recent maintenance","status":"pass","score":88,"required_for_auto_install":false,"detail":"1mo since push","evidence":["1mo since push"]},{"id":"permission_surface","label":"Permission surface","status":"fail","score":50,"required_for_auto_install":true,"detail":"shell or command execution, filesystem or document access","evidence":["Shell or command execution: high","Network access: medium","Filesystem access: medium"]},{"id":"alternatives","label":"Alternatives available","status":"pass","score":82,"required_for_auto_install":false,"detail":"Alternative skills are available for comparison.","evidence":["d3-d3","grafana-grafana","apache-superset","apache-echarts"]}],"blockers":["Permission surface: shell or command execution, filesystem or document access"],"warnings":["Trust score: Good trust signals with a few areas worth checking before rollout.","Audit score: Needs review","Agent safety gate: Sparse or mixed signals. Useful for discovery, but not for autonomous installation.","High-risk permission hints: Shell or command execution","Permission surface may require sandboxing","Quality score needs review","Permission surface needs review: shell or command execution, filesystem or document access","Stars/forks activity: 113 stars, 14 forks; issue activity unavailable in current metadata","Permission surface: shell or command execution, filesystem or document access"],"validation_plan":["Inspect repository, README/SKILL.md, license, and recent commits before production use.","Install in an isolated workspace or sandbox with no production secrets available.","Run the smallest representative task and record files touched, commands run, network access, and outputs.","Compare the selected skill against at least one alternative when the eval status is review or failed.","Promote only after the agent reports a successful verification result and unresolved warnings are accepted."],"do_not_use_when":["teams that need a vendor-supported SLA","high-compliance environments without internal security review","No OpenAgentSkill engagement data yet","High-risk permission hints: Shell or command execution","Permission surface may require sandboxing","Quality score needs review","Permission surface needs review: shell or command execution, filesystem or document access","Stars/forks activity: 113 stars, 14 forks; issue activity unavailable in current metadata"],"alternatives":[{"slug":"d3-d3","name":"D3","url":"https://www.openagentskill.com/skills/d3-d3","stars":113096,"install_command":"npx skills add d3/d3","trust_score":89,"audit_score":91},{"slug":"grafana-grafana","name":"Grafana","url":"https://www.openagentskill.com/skills/grafana-grafana","stars":74422,"install_command":"npx skills add grafana/grafana","trust_score":92,"audit_score":94},{"slug":"apache-superset","name":"Superset","url":"https://www.openagentskill.com/skills/apache-superset","stars":73285,"install_command":"npx skills add apache/superset","trust_score":92,"audit_score":95},{"slug":"apache-echarts","name":"Echarts","url":"https://www.openagentskill.com/skills/apache-echarts","stars":66600,"install_command":"npx skills add apache/echarts","trust_score":91,"audit_score":92}],"machine_metadata":{"version":"openagentskill-agent-metadata-v2","skill":{"slug":"mabel-dev-opteryx","name":"Opteryx","description":"🦖 A SQL-on-everything Query Engine you can execute over multiple databases and file formats. Query your data, where it lives.","category":"data-analysis","url":"https://www.openagentskill.com/skills/mabel-dev-opteryx","repository":"https://github.com/mabel-dev/opteryx","github_repo":"mabel-dev/opteryx"},"suited_tasks":["Database and SQL workflows","Claude Code teams","builders willing to evaluate younger projects","Understand table relationships","Write safer queries","Explain database changes","Move data between tools","Transform files"],"suited_agents":["Python","SQL","Codex","Claude Code","Cursor","OpenAgentSkill CLI","CLI"],"install":{"command":"npx skills add mabel-dev/opteryx","ready":true,"targets":[{"id":"openagentskill-cli","label":"CLI","kind":"command","value":"npx skills add mabel-dev/opteryx"},{"id":"codex","label":"Codex","kind":"agent-prompt","value":"Install the \"Opteryx\" agent skill from https://github.com/mabel-dev/opteryx. Read its SKILL.md or equivalent instructions first, install only the files needed for this workspace, and summarize any required setup before using it. Skill purpose: 🦖 A SQL-on-everything Query Engine you can execute over multiple databases and file formats. Query your data, where it lives."},{"id":"claude-code","label":"Claude Code","kind":"agent-prompt","value":"Add \"Opteryx\" as a Claude Code skill from https://github.com/mabel-dev/opteryx. Inspect the skill instructions, place the reusable skill files in the appropriate local skills location for this project, and report the activation steps. Skill purpose: 🦖 A SQL-on-everything Query Engine you can execute over multiple databases and file formats. Query your data, where it lives."},{"id":"cursor","label":"Cursor","kind":"agent-prompt","value":"Turn \"Opteryx\" from https://github.com/mabel-dev/opteryx into a reusable Cursor project rule or agent instruction. Preserve the core workflow, adapt paths to this repo, and keep the rule scoped to tasks where it is relevant. Skill purpose: 🦖 A SQL-on-everything Query Engine you can execute over multiple databases and file formats. Query your data, where it lives."}],"handoff_url":"https://www.openagentskill.com/api/skills/mabel-dev-opteryx/install","manifest_url":"https://www.openagentskill.com/api/registry/manifest/mabel-dev-opteryx"},"trust":{"score":77,"label":"Strong shortlist","version":"trust-score-v4","install_policy":"human_review_before_install","evidence":{"stars":"113 GitHub stars","repoActivity":"113 stars, 14 forks","lastPushed":"1mo since push","license":"Apache-2.0","repository":"https://github.com/mabel-dev/opteryx","install":"npx skills add mabel-dev/opteryx","installSafety":"standard package or runtime install path","permissionSurface":"shell or command execution, filesystem or document access","documentation":"Strong README/SKILL.md context","agentOutcomes":"No agent outcome data yet"},"outcome_evidence":{"total":0,"successes":0,"failures":0,"not_relevant":0,"success_rate":null,"recent_success_rate":null,"recent_failure_rate":null,"install_attempts":0,"install_success_rate":null,"risk_blocked":0,"setup_required":0,"avg_output_quality":null,"production_outcomes":0,"last_outcome_at":null,"label":"No agent outcome data yet"},"auto_install":{"allowed":false,"sandbox_required":true,"reason":"Human review or sandbox validation is required before automatic installation."},"best_for":["data-analysis","sql","data","analytics","arrow","aws"],"known_risks":["Quality score needs review","Permission surface needs review: shell or command execution, filesystem or document access","Stars/forks activity: 113 stars, 14 forks; issue activity unavailable in current metadata","Permission surface: shell or command execution, filesystem or document access"]},"agent_proven":{"version":"agent-proven-v1","score":0,"tier":"unproven","label":"Needs first agent run","summary":"No agent outcome reports yet. Use Resolve, run one narrow sandbox task, then report the result.","metrics":{"totalOutcomes":0,"successfulOutcomes":0,"failedOutcomes":0,"installAttempts":0,"installSuccessRate":null,"successRate":null,"recentSuccessRate":null,"recentFailureRate":null,"riskBlocked":0,"setupRequired":0,"notRelevant":0,"avgOutputQuality":null,"avgTimeToUsefulMs":null,"productionOutcomes":0,"humanReviewRequired":0,"uniqueAgents":0,"lastOutcomeAt":null},"signals":[],"penalties":["No real agent outcome evidence yet"]},"audit":{"score":81,"risk_level":"needs_review","risk_label":"Needs review","warnings":["Permission surface may require sandboxing","Quality score needs review","Permission surface needs review: shell or command execution, filesystem or document access","Stars/forks activity: 113 stars, 14 forks; issue activity unavailable in current metadata","Permission surface: shell or command execution, filesystem or document access"]},"safety_gate":{"tier":"experimental","label":"Experimental","auto_install_policy":"review","auto_install_allowed":false,"human_review_required":true,"blocked":false,"recommended_action":"Test manually in an isolated workspace and compare against safer alternatives."},"quality":{"score":75,"label":"Strong"},"supply":{"track":"Data, BI, and analytics","scenario":"Database and SQL","maintenance":"1mo since push","risk":"Needs review"},"alternative_skills":[{"slug":"d3-d3","name":"D3","url":"https://www.openagentskill.com/skills/d3-d3","stars":113096,"install_command":"npx skills add d3/d3","trust_score":89,"audit_score":91},{"slug":"grafana-grafana","name":"Grafana","url":"https://www.openagentskill.com/skills/grafana-grafana","stars":74422,"install_command":"npx skills add grafana/grafana","trust_score":92,"audit_score":94},{"slug":"apache-superset","name":"Superset","url":"https://www.openagentskill.com/skills/apache-superset","stars":73285,"install_command":"npx skills add apache/superset","trust_score":92,"audit_score":95},{"slug":"apache-echarts","name":"Echarts","url":"https://www.openagentskill.com/skills/apache-echarts","stars":66600,"install_command":"npx skills add apache/echarts","trust_score":91,"audit_score":92}],"do_not_use_when":["teams that need a vendor-supported SLA","high-compliance environments without internal security review","No OpenAgentSkill engagement data yet","High-risk permission hints: Shell or command execution","Permission surface may require sandboxing","Quality score needs review","Permission surface needs review: shell or command execution, filesystem or document access","Stars/forks activity: 113 stars, 14 forks; issue activity unavailable in current metadata"],"agent_contract":{"task_input":"Evaluate Opteryx before installing it in an AI agent workflow","recommended_action":"Test manually in an isolated workspace and compare against safer alternatives.","install_policy":"review","minimum_review_before_use":["Trust: 77/100 Strong shortlist","Audit: 81/100 Needs review","Safety: 49/100 Avoid automatic install","Review repository, license, install command, and permission surface before production use."],"expected_agent_output":{"selected_skill":"mabel-dev-opteryx (Opteryx)","install_command":"npx skills add mabel-dev/opteryx","risk_summary":"Needs review; Experimental; Review before production","verification_result":"Report the smallest successful task, files touched, warnings, and any missing setup."}},"outcome_feedback":{"endpoint":"https://www.openagentskill.com/api/agent/outcome","method":"POST","requires_resolve_event_id":true,"event_id_source":"Use install_receipt.outcome_feedback.event_id or feedback.event_id returned by /api/agent/resolve for the current task.","expected_outcomes":["success","failed","not_relevant","blocked_by_risk","setup_required"],"payload_template":{"event_id":"<install_receipt.outcome_feedback.event_id or feedback.event_id from /api/agent/resolve>","skill_slug":"mabel-dev-opteryx","task":"Evaluate Opteryx before installing it in an AI agent workflow","agent":"codex","outcome":"success","install_used":true,"risk_blocked":false,"setup_required":false,"task_success":true,"output_quality":4,"error_type":null,"human_review_required":false,"workspace":"sandbox","time_to_useful_ms":120000,"notes":"Report the smallest successful task, setup friction, files touched, and risk notes."}},"endpoints":{"web":"https://www.openagentskill.com/skills/mabel-dev-opteryx","api":"https://www.openagentskill.com/api/agent/skills/mabel-dev-opteryx","audit":"https://www.openagentskill.com/skills/mabel-dev-opteryx/audit","eval":"https://www.openagentskill.com/api/agent/evals?slug=mabel-dev-opteryx&task=Evaluate%20Opteryx%20before%20installing%20it%20in%20an%20AI%20agent%20workflow&max_risk=medium","resolve":"https://www.openagentskill.com/api/agent/resolve?task=Evaluate%20Opteryx%20before%20installing%20it%20in%20an%20AI%20agent%20workflow&agent=codex&max_risk=medium","receipt":"https://www.openagentskill.com/api/agent/receipt?task=Evaluate%20Opteryx%20before%20installing%20it%20in%20an%20AI%20agent%20workflow&agent=codex&max_risk=medium&format=text","install":"https://www.openagentskill.com/api/skills/mabel-dev-opteryx/install","manifest":"https://www.openagentskill.com/api/registry/manifest/mabel-dev-opteryx"}},"endpoints":{"web":"https://www.openagentskill.com/skills/mabel-dev-opteryx","api":"https://www.openagentskill.com/api/agent/skills/mabel-dev-opteryx","eval":"https://www.openagentskill.com/api/agent/evals?slug=mabel-dev-opteryx","audit":"https://www.openagentskill.com/skills/mabel-dev-opteryx/audit","resolve":"https://www.openagentskill.com/api/agent/resolve?task=Evaluate%20Opteryx%20before%20installing%20it%20in%20an%20AI%20agent%20workflow&agent=codex&max_risk=medium"}},"meta":{"endpoint":"/api/agent/evals","mode":"skill_eval","purpose":"Pre-install eval contract for a single skill. Agents should read this before installing a reusable skill.","generated_at":"2026-07-04T00:14:35.066Z"}}