{"eval":{"version":"openagentskill-skill-eval-v1","slug":"umaar-learn-browser-testing","name":"Learn Browser Testing","generated_at":"2026-07-03T22:43:42.675Z","task_input":"Evaluate Learn Browser Testing before installing it in an AI agent workflow","status":"failed","score":56,"risk_level":"high","decision":{"recommendation":"do_not_auto_install","reason":"Audit score: Risky","auto_install_allowed":false,"policy":"block","human_review_required":true},"task_fit":{"score":94,"suited_tasks":["Coding agents workflows","Claude Code teams","builders willing to evaluate younger projects","Inspect source files","Explain architecture","Patch bugs and verify changes","Navigate pages","Click and type safely"],"suited_agents":["HTML","Browser Automation","Codex","Claude Code","Cursor","OpenAgentSkill CLI","Browser agents","CLI"]},"install":{"command":"npx skills add umaar/learn-browser-testing","ready":true,"policy":"block","safety_label":"Avoid automatic install","targets":[{"id":"openagentskill-cli","label":"CLI","kind":"command","value":"npx skills add umaar/learn-browser-testing"},{"id":"codex","label":"Codex","kind":"agent-prompt","value":"Install the \"Learn Browser Testing\" agent skill from https://github.com/umaar/learn-browser-testing. Read its SKILL.md or equivalent instructions first, install only the files needed for this workspace, and summarize any required setup before using it. Skill purpose: Repository for my upcoming course & workshop"},{"id":"claude-code","label":"Claude Code","kind":"agent-prompt","value":"Add \"Learn Browser Testing\" as a Claude Code skill from https://github.com/umaar/learn-browser-testing. Inspect the skill instructions, place the reusable skill files in the appropriate local skills location for this project, and report the activation steps. Skill purpose: Repository for my upcoming course & workshop"},{"id":"cursor","label":"Cursor","kind":"agent-prompt","value":"Turn \"Learn Browser Testing\" from https://github.com/umaar/learn-browser-testing into a reusable Cursor project rule or agent instruction. Preserve the core workflow, adapt paths to this repo, and keep the rule scoped to tasks where it is relevant. Skill purpose: Repository for my upcoming course & workshop"}]},"trust":{"score":65,"label":"Manual review","version":"trust-score-v4","evidence":{"stars":"116 GitHub stars","repoActivity":"116 stars, 8 forks","lastPushed":"6y since push","license":"Unknown","repository":"https://github.com/umaar/learn-browser-testing","install":"npx skills add umaar/learn-browser-testing","installSafety":"standard package or runtime install path","permissionSurface":"filesystem or document access, network or browser access","documentation":"Usable metadata, review docs","agentOutcomes":"No agent outcome data yet"}},"audit":{"score":58,"risk_level":"risky","risk_label":"Risky","warnings":["License is unclear","Repository appears stale","Repository looks stale","Quality score needs review","Stars/forks activity: 116 stars, 8 forks; issue activity unavailable in current metadata","Recent maintenance: 6y since push","License clarity: Unknown"]},"safety_gate":{"score":38,"tier":"blocked","label":"Blocked for auto-install","auto_install_policy":"block","blocked":true,"permission_hints":[{"id":"browser","label":"Browser automation","reason":"Skill may drive a browser or interact with web pages.","severity":"medium"},{"id":"network","label":"Network access","reason":"Skill likely fetches remote pages, APIs, repositories, or external services.","severity":"medium"},{"id":"filesystem","label":"Filesystem access","reason":"Skill may read or write project files, documents, generated artifacts, or local workspace state.","severity":"medium"}],"policy_warnings":["Audit risk risky exceeds max_risk=medium","License is unclear"]},"checks":[{"id":"task_fit","label":"Task fit","status":"pass","score":94,"required_for_auto_install":true,"detail":"Task wording matches this skill metadata.","evidence":["Evaluate Learn Browser Testing before installing it in an AI agent workflow","web-automation","Coding agents workflows; Claude Code teams; builders willing to evaluate younger projects"]},{"id":"install_path","label":"Install path","status":"pass","score":92,"required_for_auto_install":true,"detail":"Install handoff is available.","evidence":["npx skills add umaar/learn-browser-testing"]},{"id":"install_safety","label":"Install command safety","status":"pass","score":92,"required_for_auto_install":true,"detail":"standard package or runtime install path","evidence":["npx skills add umaar/learn-browser-testing"]},{"id":"trust_score","label":"Trust score","status":"warn","score":65,"required_for_auto_install":true,"detail":"Potentially useful, but at least one trust signal needs human inspection.","evidence":["Manual review","116 GitHub stars","Unknown"]},{"id":"audit_score","label":"Audit score","status":"fail","score":58,"required_for_auto_install":true,"detail":"Risky","evidence":["License is unclear"]},{"id":"agent_safety_gate","label":"Agent safety gate","status":"fail","score":38,"required_for_auto_install":true,"detail":"This skill should not be selected by an agent without explicit human security review.","evidence":["Do not auto-install. Inspect the source, dependencies, and permission surface first.","Audit risk exceeds the requested agent policy"]},{"id":"readme_skillmd_completeness","label":"README/SKILL.md completeness","status":"warn","score":74,"required_for_auto_install":false,"detail":"Public metadata needs stronger README/SKILL.md context","evidence":["Usable metadata, review docs"]},{"id":"license_clarity","label":"License clarity","status":"warn","score":42,"required_for_auto_install":true,"detail":"Unknown","evidence":["Unknown"]},{"id":"recent_maintenance","label":"Recent maintenance","status":"fail","score":22,"required_for_auto_install":false,"detail":"6y since push","evidence":["6y since push"]},{"id":"permission_surface","label":"Permission surface","status":"warn","score":72,"required_for_auto_install":true,"detail":"filesystem or document access, network or browser access","evidence":["Browser automation: medium","Network access: medium","Filesystem access: medium"]},{"id":"alternatives","label":"Alternatives available","status":"pass","score":82,"required_for_auto_install":false,"detail":"Alternative skills are available for comparison.","evidence":["crawl4ai","d4vinci-scrapling","scrapy-scrapy","naibowang-easyspider"]}],"blockers":["Audit score: Risky","Agent safety gate: This skill should not be selected by an agent without explicit human security review."],"warnings":["Trust score: Potentially useful, but at least one trust signal needs human inspection.","README/SKILL.md completeness: Public metadata needs stronger README/SKILL.md context","License clarity: Unknown","Permission surface: filesystem or document access, network or browser access","Audit risk risky exceeds max_risk=medium","License is unclear","Repository appears stale","Repository looks stale","Quality score needs review","Stars/forks activity: 116 stars, 8 forks; issue activity unavailable in current metadata","Recent maintenance: 6y since push"],"validation_plan":["Inspect repository, README/SKILL.md, license, and recent commits before production use.","Install in an isolated workspace or sandbox with no production secrets available.","Run the smallest representative task and record files touched, commands run, network access, and outputs.","Compare the selected skill against at least one alternative when the eval status is review or failed.","Promote only after the agent reports a successful verification result and unresolved warnings are accepted."],"do_not_use_when":["teams that require actively maintained dependencies","production agents without a repository review","Repository looks stale","No OpenAgentSkill engagement data yet","Audit risk risky exceeds max_risk=medium","License is unclear","Repository appears stale","Quality score needs review"],"alternatives":[{"slug":"crawl4ai","name":"Crawl4AI","url":"https://www.openagentskill.com/skills/crawl4ai","stars":70774,"install_command":"npx skills add unclecode/crawl4ai","trust_score":93,"audit_score":95},{"slug":"d4vinci-scrapling","name":"Scrapling","url":"https://www.openagentskill.com/skills/d4vinci-scrapling","stars":67816,"install_command":"npx skills add D4Vinci/Scrapling","trust_score":85,"audit_score":90},{"slug":"scrapy-scrapy","name":"Scrapy","url":"https://www.openagentskill.com/skills/scrapy-scrapy","stars":62532,"install_command":"npx skills add scrapy/scrapy","trust_score":92,"audit_score":95},{"slug":"naibowang-easyspider","name":"EasySpider","url":"https://www.openagentskill.com/skills/naibowang-easyspider","stars":44121,"install_command":"npx skills add NaiboWang/EasySpider","trust_score":93,"audit_score":94}],"machine_metadata":{"version":"openagentskill-agent-metadata-v2","skill":{"slug":"umaar-learn-browser-testing","name":"Learn Browser Testing","description":"Repository for my upcoming course & workshop","category":"web-automation","url":"https://www.openagentskill.com/skills/umaar-learn-browser-testing","repository":"https://github.com/umaar/learn-browser-testing","github_repo":"umaar/learn-browser-testing"},"suited_tasks":["Coding agents workflows","Claude Code teams","builders willing to evaluate younger projects","Inspect source files","Explain architecture","Patch bugs and verify changes","Navigate pages","Click and type safely"],"suited_agents":["HTML","Browser Automation","Codex","Claude Code","Cursor","OpenAgentSkill CLI","Browser agents","CLI"],"install":{"command":"npx skills add umaar/learn-browser-testing","ready":true,"targets":[{"id":"openagentskill-cli","label":"CLI","kind":"command","value":"npx skills add umaar/learn-browser-testing"},{"id":"codex","label":"Codex","kind":"agent-prompt","value":"Install the \"Learn Browser Testing\" agent skill from https://github.com/umaar/learn-browser-testing. Read its SKILL.md or equivalent instructions first, install only the files needed for this workspace, and summarize any required setup before using it. Skill purpose: Repository for my upcoming course & workshop"},{"id":"claude-code","label":"Claude Code","kind":"agent-prompt","value":"Add \"Learn Browser Testing\" as a Claude Code skill from https://github.com/umaar/learn-browser-testing. Inspect the skill instructions, place the reusable skill files in the appropriate local skills location for this project, and report the activation steps. Skill purpose: Repository for my upcoming course & workshop"},{"id":"cursor","label":"Cursor","kind":"agent-prompt","value":"Turn \"Learn Browser Testing\" from https://github.com/umaar/learn-browser-testing into a reusable Cursor project rule or agent instruction. Preserve the core workflow, adapt paths to this repo, and keep the rule scoped to tasks where it is relevant. Skill purpose: Repository for my upcoming course & workshop"}],"handoff_url":"https://www.openagentskill.com/api/skills/umaar-learn-browser-testing/install","manifest_url":"https://www.openagentskill.com/api/registry/manifest/umaar-learn-browser-testing"},"trust":{"score":65,"label":"Manual review","version":"trust-score-v4","install_policy":"human_review_before_install","evidence":{"stars":"116 GitHub stars","repoActivity":"116 stars, 8 forks","lastPushed":"6y since push","license":"Unknown","repository":"https://github.com/umaar/learn-browser-testing","install":"npx skills add umaar/learn-browser-testing","installSafety":"standard package or runtime install path","permissionSurface":"filesystem or document access, network or browser access","documentation":"Usable metadata, review docs","agentOutcomes":"No agent outcome data yet"},"outcome_evidence":{"total":0,"successes":0,"failures":0,"not_relevant":0,"success_rate":null,"recent_success_rate":null,"recent_failure_rate":null,"install_attempts":0,"install_success_rate":null,"risk_blocked":0,"setup_required":0,"avg_output_quality":null,"production_outcomes":0,"last_outcome_at":null,"label":"No agent outcome data yet"},"auto_install":{"allowed":false,"sandbox_required":true,"reason":"Human review or sandbox validation is required before automatic installation."},"best_for":["web-automation","browser","automation","browser-automation","end-to-end-testing","puppeteer"],"known_risks":["License is unclear","Repository looks stale","Quality score needs review","Stars/forks activity: 116 stars, 8 forks; issue activity unavailable in current metadata","Recent maintenance: 6y since push","License clarity: Unknown"]},"agent_proven":{"version":"agent-proven-v1","score":0,"tier":"unproven","label":"Needs first agent run","summary":"No agent outcome reports yet. Use Resolve, run one narrow sandbox task, then report the result.","metrics":{"totalOutcomes":0,"successfulOutcomes":0,"failedOutcomes":0,"installAttempts":0,"installSuccessRate":null,"successRate":null,"recentSuccessRate":null,"recentFailureRate":null,"riskBlocked":0,"setupRequired":0,"notRelevant":0,"avgOutputQuality":null,"avgTimeToUsefulMs":null,"productionOutcomes":0,"humanReviewRequired":0,"uniqueAgents":0,"lastOutcomeAt":null},"signals":[],"penalties":["No real agent outcome evidence yet"]},"audit":{"score":58,"risk_level":"risky","risk_label":"Risky","warnings":["License is unclear","Repository appears stale","Repository looks stale","Quality score needs review","Stars/forks activity: 116 stars, 8 forks; issue activity unavailable in current metadata","Recent maintenance: 6y since push","License clarity: Unknown"]},"safety_gate":{"tier":"blocked","label":"Blocked for auto-install","auto_install_policy":"block","auto_install_allowed":false,"human_review_required":true,"blocked":true,"recommended_action":"Do not auto-install. Inspect the source, dependencies, and permission surface first."},"quality":{"score":42,"label":"Needs review"},"supply":{"track":"Coding and developer agents","scenario":"Coding agents","maintenance":"6y since push","risk":"Risky"},"alternative_skills":[{"slug":"crawl4ai","name":"Crawl4AI","url":"https://www.openagentskill.com/skills/crawl4ai","stars":70774,"install_command":"npx skills add unclecode/crawl4ai","trust_score":93,"audit_score":95},{"slug":"d4vinci-scrapling","name":"Scrapling","url":"https://www.openagentskill.com/skills/d4vinci-scrapling","stars":67816,"install_command":"npx skills add D4Vinci/Scrapling","trust_score":85,"audit_score":90},{"slug":"scrapy-scrapy","name":"Scrapy","url":"https://www.openagentskill.com/skills/scrapy-scrapy","stars":62532,"install_command":"npx skills add scrapy/scrapy","trust_score":92,"audit_score":95},{"slug":"naibowang-easyspider","name":"EasySpider","url":"https://www.openagentskill.com/skills/naibowang-easyspider","stars":44121,"install_command":"npx skills add NaiboWang/EasySpider","trust_score":93,"audit_score":94}],"do_not_use_when":["teams that require actively maintained dependencies","production agents without a repository review","Repository looks stale","No OpenAgentSkill engagement data yet","Audit risk risky exceeds max_risk=medium","License is unclear","Repository appears stale","Quality score needs review"],"agent_contract":{"task_input":"Evaluate Learn Browser Testing before installing it in an AI agent workflow","recommended_action":"Do not auto-install. Inspect the source, dependencies, and permission surface first.","install_policy":"block","minimum_review_before_use":["Trust: 65/100 Manual review","Audit: 58/100 Risky","Safety: 38/100 Avoid automatic install","Review repository, license, install command, and permission surface before production use."],"expected_agent_output":{"selected_skill":"umaar-learn-browser-testing (Learn Browser Testing)","install_command":"npx skills add umaar/learn-browser-testing","risk_summary":"Risky; Blocked for auto-install; Review before production","verification_result":"Report the smallest successful task, files touched, warnings, and any missing setup."}},"outcome_feedback":{"endpoint":"https://www.openagentskill.com/api/agent/outcome","method":"POST","requires_resolve_event_id":true,"event_id_source":"Use install_receipt.outcome_feedback.event_id or feedback.event_id returned by /api/agent/resolve for the current task.","expected_outcomes":["success","failed","not_relevant","blocked_by_risk","setup_required"],"payload_template":{"event_id":"<install_receipt.outcome_feedback.event_id or feedback.event_id from /api/agent/resolve>","skill_slug":"umaar-learn-browser-testing","task":"Evaluate Learn Browser Testing before installing it in an AI agent workflow","agent":"codex","outcome":"success","install_used":true,"risk_blocked":false,"setup_required":false,"task_success":true,"output_quality":4,"error_type":null,"human_review_required":false,"workspace":"sandbox","time_to_useful_ms":120000,"notes":"Report the smallest successful task, setup friction, files touched, and risk notes."}},"endpoints":{"web":"https://www.openagentskill.com/skills/umaar-learn-browser-testing","api":"https://www.openagentskill.com/api/agent/skills/umaar-learn-browser-testing","audit":"https://www.openagentskill.com/skills/umaar-learn-browser-testing/audit","eval":"https://www.openagentskill.com/api/agent/evals?slug=umaar-learn-browser-testing&task=Evaluate%20Learn%20Browser%20Testing%20before%20installing%20it%20in%20an%20AI%20agent%20workflow&max_risk=medium","resolve":"https://www.openagentskill.com/api/agent/resolve?task=Evaluate%20Learn%20Browser%20Testing%20before%20installing%20it%20in%20an%20AI%20agent%20workflow&agent=codex&max_risk=medium","receipt":"https://www.openagentskill.com/api/agent/receipt?task=Evaluate%20Learn%20Browser%20Testing%20before%20installing%20it%20in%20an%20AI%20agent%20workflow&agent=codex&max_risk=medium&format=text","install":"https://www.openagentskill.com/api/skills/umaar-learn-browser-testing/install","manifest":"https://www.openagentskill.com/api/registry/manifest/umaar-learn-browser-testing"}},"endpoints":{"web":"https://www.openagentskill.com/skills/umaar-learn-browser-testing","api":"https://www.openagentskill.com/api/agent/skills/umaar-learn-browser-testing","eval":"https://www.openagentskill.com/api/agent/evals?slug=umaar-learn-browser-testing","audit":"https://www.openagentskill.com/skills/umaar-learn-browser-testing/audit","resolve":"https://www.openagentskill.com/api/agent/resolve?task=Evaluate%20Learn%20Browser%20Testing%20before%20installing%20it%20in%20an%20AI%20agent%20workflow&agent=codex&max_risk=medium"}},"meta":{"endpoint":"/api/agent/evals","mode":"skill_eval","purpose":"Pre-install eval contract for a single skill. Agents should read this before installing a reusable skill.","generated_at":"2026-07-03T22:43:42.675Z"}}