{"eval":{"version":"openagentskill-skill-eval-v1","slug":"playwright","name":"Playwright","generated_at":"2026-06-20T17:48:00.332Z","task_input":"Evaluate Playwright before installing it in an AI agent workflow","status":"review","score":88,"risk_level":"medium","decision":{"recommendation":"manual_review","reason":"Review the audit page, then allow agent install in a sandboxed workflow.","auto_install_allowed":false,"policy":"review","human_review_required":true},"task_fit":{"score":84,"suited_tasks":["Browser automation workflows","OpenAI Agents teams","teams that value GitHub adoption signals","Navigate pages","Click and type safely","Check visual and DOM state","Run test suites","Capture failures"],"suited_agents":["Node.js","Python","Codex","Claude Code","Cursor","OpenAgentSkill CLI","OpenAI Agents","Browser agents"]},"install":{"command":"npx skills add microsoft/playwright","ready":true,"policy":"review","safety_label":"Review before install","targets":[{"id":"openagentskill-cli","label":"CLI","kind":"command","value":"npx skills add microsoft/playwright"},{"id":"codex","label":"Codex","kind":"agent-prompt","value":"Install the \"Playwright\" agent skill from https://github.com/microsoft/playwright. Read its SKILL.md or equivalent instructions first, install only the files needed for this workspace, and summarize any required setup before using it. Skill purpose: Reliable browser automation and testing engine for web agent tasks."},{"id":"claude-code","label":"Claude Code","kind":"agent-prompt","value":"Add \"Playwright\" as a Claude Code skill from https://github.com/microsoft/playwright. Inspect the skill instructions, place the reusable skill files in the appropriate local skills location for this project, and report the activation steps. Skill purpose: Reliable browser automation and testing engine for web agent tasks."},{"id":"cursor","label":"Cursor","kind":"agent-prompt","value":"Turn \"Playwright\" from https://github.com/microsoft/playwright into a reusable Cursor project rule or agent instruction. Preserve the core workflow, adapt paths to this repo, and keep the rule scoped to tasks where it is relevant. Skill purpose: Reliable browser automation and testing engine for web agent tasks."}]},"trust":{"score":85,"label":"Strong shortlist","version":"trust-score-v3","evidence":{"stars":"76K GitHub stars","repoActivity":"76K stars, 0 forks","lastPushed":"19d since push","license":"Apache-2.0","repository":"https://github.com/microsoft/playwright","install":"npx skills add microsoft/playwright","installSafety":"standard package or runtime install path","permissionSurface":"network or browser access","documentation":"Thin public metadata"}},"audit":{"score":92,"risk_level":"safe_to_try","risk_label":"Safe to try","warnings":["Documentation summary is thin","README/SKILL.md completeness: Public metadata needs stronger README/SKILL.md context"]},"safety_gate":{"score":76,"tier":"reviewed","label":"Reviewed","auto_install_policy":"review","blocked":false,"permission_hints":[{"id":"browser","label":"Browser automation","reason":"Skill may drive a browser or interact with web pages.","severity":"medium"},{"id":"network","label":"Network access","reason":"Skill likely fetches remote pages, APIs, repositories, or external services.","severity":"medium"}],"policy_warnings":["Documentation summary is thin"]},"checks":[{"id":"task_fit","label":"Task fit","status":"pass","score":84,"required_for_auto_install":true,"detail":"Task wording matches this skill metadata.","evidence":["Evaluate Playwright before installing it in an AI agent workflow","Browser Automation","Browser automation workflows; OpenAI Agents teams; teams that value GitHub adoption signals"]},{"id":"install_path","label":"Install path","status":"pass","score":92,"required_for_auto_install":true,"detail":"Install handoff is available.","evidence":["npx skills add microsoft/playwright"]},{"id":"install_safety","label":"Install command safety","status":"pass","score":92,"required_for_auto_install":true,"detail":"standard package or runtime install path","evidence":["npx skills add microsoft/playwright"]},{"id":"trust_score","label":"Trust score","status":"pass","score":85,"required_for_auto_install":true,"detail":"Good trust signals with a few areas worth checking before rollout.","evidence":["Strong shortlist","76K GitHub stars","Apache-2.0"]},{"id":"audit_score","label":"Audit score","status":"pass","score":92,"required_for_auto_install":true,"detail":"Safe to try","evidence":["Documentation summary is thin"]},{"id":"agent_safety_gate","label":"Agent safety gate","status":"warn","score":76,"required_for_auto_install":true,"detail":"Good audit and safety signals with no high-risk permission hints in public metadata.","evidence":["Review the audit page, then allow agent install in a sandboxed workflow.","Safe-to-try audit"]},{"id":"readme_skillmd_completeness","label":"README/SKILL.md completeness","status":"fail","score":50,"required_for_auto_install":false,"detail":"Public metadata needs stronger README/SKILL.md context","evidence":["Thin public metadata"]},{"id":"license_clarity","label":"License clarity","status":"pass","score":86,"required_for_auto_install":true,"detail":"Apache-2.0","evidence":["Apache-2.0"]},{"id":"recent_maintenance","label":"Recent maintenance","status":"pass","score":100,"required_for_auto_install":false,"detail":"19d since push","evidence":["19d since push"]},{"id":"permission_surface","label":"Permission surface","status":"pass","score":86,"required_for_auto_install":true,"detail":"network or browser access","evidence":["Browser automation: medium","Network access: medium"]},{"id":"alternatives","label":"Alternatives available","status":"info","score":55,"required_for_auto_install":false,"detail":"No close alternatives were found in the current shortlist.","evidence":[]}],"blockers":[],"warnings":["Agent safety gate: Good audit and safety signals with no high-risk permission hints in public metadata.","Documentation summary is thin","README/SKILL.md completeness: Public metadata needs stronger README/SKILL.md context"],"validation_plan":["Inspect repository, README/SKILL.md, license, and recent commits before production use.","Install in an isolated workspace or sandbox with no production secrets available.","Run the smallest representative task and record files touched, commands run, network access, and outputs.","Compare the selected skill against at least one alternative when the eval status is review or failed.","Promote only after the agent reports a successful verification result and unresolved warnings are accepted."],"do_not_use_when":["teams that need a vendor-supported SLA","high-compliance environments without internal security review","No OpenAgentSkill engagement data yet","Documentation summary is thin","README/SKILL.md completeness: Public metadata needs stronger README/SKILL.md context"],"alternatives":[],"machine_metadata":{"version":"openagentskill-agent-metadata-v2","skill":{"slug":"playwright","name":"Playwright","description":"Reliable browser automation and testing engine for web agent tasks.","category":"Browser Automation","url":"https://www.openagentskill.com/skills/playwright","repository":"https://github.com/microsoft/playwright","github_repo":"microsoft/playwright"},"suited_tasks":["Browser automation workflows","OpenAI Agents teams","teams that value GitHub adoption signals","Navigate pages","Click and type safely","Check visual and DOM state","Run test suites","Capture failures"],"suited_agents":["Node.js","Python","Codex","Claude Code","Cursor","OpenAgentSkill CLI","OpenAI Agents","Browser agents"],"install":{"command":"npx skills add microsoft/playwright","ready":true,"targets":[{"id":"openagentskill-cli","label":"CLI","kind":"command","value":"npx skills add microsoft/playwright"},{"id":"codex","label":"Codex","kind":"agent-prompt","value":"Install the \"Playwright\" agent skill from https://github.com/microsoft/playwright. Read its SKILL.md or equivalent instructions first, install only the files needed for this workspace, and summarize any required setup before using it. Skill purpose: Reliable browser automation and testing engine for web agent tasks."},{"id":"claude-code","label":"Claude Code","kind":"agent-prompt","value":"Add \"Playwright\" as a Claude Code skill from https://github.com/microsoft/playwright. Inspect the skill instructions, place the reusable skill files in the appropriate local skills location for this project, and report the activation steps. Skill purpose: Reliable browser automation and testing engine for web agent tasks."},{"id":"cursor","label":"Cursor","kind":"agent-prompt","value":"Turn \"Playwright\" from https://github.com/microsoft/playwright into a reusable Cursor project rule or agent instruction. Preserve the core workflow, adapt paths to this repo, and keep the rule scoped to tasks where it is relevant. Skill purpose: Reliable browser automation and testing engine for web agent tasks."}],"handoff_url":"https://www.openagentskill.com/api/skills/playwright/install","manifest_url":"https://www.openagentskill.com/api/registry/manifest/playwright"},"trust":{"score":85,"label":"Strong shortlist","version":"trust-score-v3","install_policy":"human_review_before_install","evidence":{"stars":"76K GitHub stars","repoActivity":"76K stars, 0 forks","lastPushed":"19d since push","license":"Apache-2.0","repository":"https://github.com/microsoft/playwright","install":"npx skills add microsoft/playwright","installSafety":"standard package or runtime install path","permissionSurface":"network or browser access","documentation":"Thin public metadata"}},"audit":{"score":92,"risk_level":"safe_to_try","risk_label":"Safe to try","warnings":["Documentation summary is thin","README/SKILL.md completeness: Public metadata needs stronger README/SKILL.md context"]},"safety_gate":{"tier":"reviewed","label":"Reviewed","auto_install_policy":"review","auto_install_allowed":false,"human_review_required":true,"blocked":false,"recommended_action":"Review the audit page, then allow agent install in a sandboxed workflow."},"quality":{"score":100,"label":"Excellent"},"supply":{"track":"Coding and developer agents","scenario":"Testing and QA","maintenance":"19d since push","risk":"Safe to try"},"alternative_skills":[],"do_not_use_when":["teams that need a vendor-supported SLA","high-compliance environments without internal security review","No OpenAgentSkill engagement data yet","Documentation summary is thin","README/SKILL.md completeness: Public metadata needs stronger README/SKILL.md context"],"agent_contract":{"task_input":"Evaluate Playwright before installing it in an AI agent workflow","recommended_action":"Review the audit page, then allow agent install in a sandboxed workflow.","install_policy":"review","minimum_review_before_use":["Trust: 85/100 Strong shortlist","Audit: 92/100 Safe to try","Safety: 76/100 Review before install","Review repository, license, install command, and permission surface before production use."],"expected_agent_output":{"selected_skill":"playwright (Playwright)","install_command":"npx skills add microsoft/playwright","risk_summary":"Safe to try; Reviewed; Review before production","verification_result":"Report the smallest successful task, files touched, warnings, and any missing setup."}},"endpoints":{"web":"https://www.openagentskill.com/skills/playwright","api":"https://www.openagentskill.com/api/agent/skills/playwright","audit":"https://www.openagentskill.com/skills/playwright/audit","eval":"https://www.openagentskill.com/api/agent/evals?slug=playwright&task=Evaluate%20Playwright%20before%20installing%20it%20in%20an%20AI%20agent%20workflow&max_risk=medium","resolve":"https://www.openagentskill.com/api/agent/resolve?task=Evaluate%20Playwright%20before%20installing%20it%20in%20an%20AI%20agent%20workflow&agent=codex&max_risk=medium","install":"https://www.openagentskill.com/api/skills/playwright/install","manifest":"https://www.openagentskill.com/api/registry/manifest/playwright"}},"endpoints":{"web":"https://www.openagentskill.com/skills/playwright","api":"https://www.openagentskill.com/api/agent/skills/playwright","eval":"https://www.openagentskill.com/api/agent/evals?slug=playwright","audit":"https://www.openagentskill.com/skills/playwright/audit","resolve":"https://www.openagentskill.com/api/agent/resolve?task=Evaluate%20Playwright%20before%20installing%20it%20in%20an%20AI%20agent%20workflow&agent=codex&max_risk=medium"}},"meta":{"endpoint":"/api/agent/evals","mode":"skill_eval","purpose":"Pre-install eval contract for a single skill. Agents should read this before installing a reusable skill.","generated_at":"2026-06-20T17:48:00.332Z"}}